{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.9992431561435143, "global_step": 573000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 4.9956403003658664e-05, "loss": 6.6229, "step": 500 }, { "epoch": 0.0, "learning_rate": 4.991280600731732e-05, "loss": 5.5184, "step": 1000 }, { "epoch": 0.0, "learning_rate": 4.986920901097598e-05, "loss": 5.1215, "step": 1500 }, { "epoch": 0.0, "learning_rate": 4.982561201463464e-05, "loss": 4.8658, "step": 2000 }, { "epoch": 0.0, "learning_rate": 4.97820150182933e-05, "loss": 4.6479, "step": 2500 }, { "epoch": 0.01, "learning_rate": 4.973841802195196e-05, "loss": 4.5154, "step": 3000 }, { "epoch": 0.01, "learning_rate": 4.969482102561062e-05, "loss": 4.3856, "step": 3500 }, { "epoch": 0.01, "learning_rate": 4.965122402926928e-05, "loss": 4.2794, "step": 4000 }, { "epoch": 0.01, "learning_rate": 4.960762703292794e-05, "loss": 4.1869, "step": 4500 }, { "epoch": 0.01, "learning_rate": 4.95640300365866e-05, "loss": 4.1061, "step": 5000 }, { "epoch": 0.01, "learning_rate": 4.9520433040245264e-05, "loss": 4.0322, "step": 5500 }, { "epoch": 0.01, "learning_rate": 4.9476836043903926e-05, "loss": 3.9469, "step": 6000 }, { "epoch": 0.01, "learning_rate": 4.943323904756258e-05, "loss": 3.8693, "step": 6500 }, { "epoch": 0.01, "learning_rate": 4.938964205122124e-05, "loss": 3.8154, "step": 7000 }, { "epoch": 0.01, "learning_rate": 4.93460450548799e-05, "loss": 3.7452, "step": 7500 }, { "epoch": 0.01, "learning_rate": 4.9302448058538564e-05, "loss": 3.6877, "step": 8000 }, { "epoch": 0.01, "learning_rate": 4.925885106219722e-05, "loss": 3.6377, "step": 8500 }, { "epoch": 0.02, "learning_rate": 4.921525406585588e-05, "loss": 3.5988, "step": 9000 }, { "epoch": 0.02, "learning_rate": 4.917165706951454e-05, "loss": 3.5531, "step": 9500 }, { "epoch": 0.02, "learning_rate": 4.9128060073173196e-05, "loss": 3.5133, "step": 10000 }, { "epoch": 0.02, "learning_rate": 4.908446307683186e-05, "loss": 3.4781, "step": 10500 }, { "epoch": 0.02, "learning_rate": 4.904086608049052e-05, "loss": 3.4556, "step": 11000 }, { "epoch": 0.02, "learning_rate": 4.899726908414918e-05, "loss": 3.4205, "step": 11500 }, { "epoch": 0.02, "learning_rate": 4.895367208780784e-05, "loss": 3.4049, "step": 12000 }, { "epoch": 0.02, "learning_rate": 4.89100750914665e-05, "loss": 3.3677, "step": 12500 }, { "epoch": 0.02, "learning_rate": 4.8866478095125165e-05, "loss": 3.3676, "step": 13000 }, { "epoch": 0.02, "learning_rate": 4.882288109878382e-05, "loss": 3.3316, "step": 13500 }, { "epoch": 0.02, "learning_rate": 4.877928410244248e-05, "loss": 3.3093, "step": 14000 }, { "epoch": 0.03, "learning_rate": 4.873568710610114e-05, "loss": 3.311, "step": 14500 }, { "epoch": 0.03, "learning_rate": 4.8692090109759803e-05, "loss": 3.248, "step": 15000 }, { "epoch": 0.03, "learning_rate": 4.864849311341846e-05, "loss": 3.258, "step": 15500 }, { "epoch": 0.03, "learning_rate": 4.860489611707712e-05, "loss": 3.2311, "step": 16000 }, { "epoch": 0.03, "learning_rate": 4.856129912073578e-05, "loss": 3.2173, "step": 16500 }, { "epoch": 0.03, "learning_rate": 4.8517702124394435e-05, "loss": 3.2002, "step": 17000 }, { "epoch": 0.03, "learning_rate": 4.84741051280531e-05, "loss": 3.1813, "step": 17500 }, { "epoch": 0.03, "learning_rate": 4.843050813171176e-05, "loss": 3.1847, "step": 18000 }, { "epoch": 0.03, "learning_rate": 4.838691113537042e-05, "loss": 3.1575, "step": 18500 }, { "epoch": 0.03, "learning_rate": 4.834331413902908e-05, "loss": 3.1634, "step": 19000 }, { "epoch": 0.03, "learning_rate": 4.829971714268774e-05, "loss": 3.1104, "step": 19500 }, { "epoch": 0.03, "learning_rate": 4.8256120146346404e-05, "loss": 3.1243, "step": 20000 }, { "epoch": 0.04, "learning_rate": 4.8212523150005065e-05, "loss": 3.1088, "step": 20500 }, { "epoch": 0.04, "learning_rate": 4.816892615366372e-05, "loss": 3.1038, "step": 21000 }, { "epoch": 0.04, "learning_rate": 4.812532915732238e-05, "loss": 3.0727, "step": 21500 }, { "epoch": 0.04, "learning_rate": 4.808173216098104e-05, "loss": 3.0702, "step": 22000 }, { "epoch": 0.04, "learning_rate": 4.80381351646397e-05, "loss": 3.0794, "step": 22500 }, { "epoch": 0.04, "learning_rate": 4.799453816829836e-05, "loss": 3.0593, "step": 23000 }, { "epoch": 0.04, "learning_rate": 4.795094117195702e-05, "loss": 3.044, "step": 23500 }, { "epoch": 0.04, "learning_rate": 4.790734417561568e-05, "loss": 3.0237, "step": 24000 }, { "epoch": 0.04, "learning_rate": 4.7863747179274336e-05, "loss": 3.0296, "step": 24500 }, { "epoch": 0.04, "learning_rate": 4.7820150182933e-05, "loss": 3.024, "step": 25000 }, { "epoch": 0.04, "learning_rate": 4.777655318659166e-05, "loss": 3.0292, "step": 25500 }, { "epoch": 0.05, "learning_rate": 4.773295619025031e-05, "loss": 3.006, "step": 26000 }, { "epoch": 0.05, "learning_rate": 4.7689359193908975e-05, "loss": 2.996, "step": 26500 }, { "epoch": 0.05, "learning_rate": 4.7645762197567636e-05, "loss": 2.9869, "step": 27000 }, { "epoch": 0.05, "learning_rate": 4.76021652012263e-05, "loss": 2.9667, "step": 27500 }, { "epoch": 0.05, "learning_rate": 4.755856820488496e-05, "loss": 2.9537, "step": 28000 }, { "epoch": 0.05, "learning_rate": 4.751497120854362e-05, "loss": 2.9679, "step": 28500 }, { "epoch": 0.05, "learning_rate": 4.747137421220228e-05, "loss": 2.9606, "step": 29000 }, { "epoch": 0.05, "learning_rate": 4.7427777215860936e-05, "loss": 2.9225, "step": 29500 }, { "epoch": 0.05, "learning_rate": 4.73841802195196e-05, "loss": 2.9253, "step": 30000 }, { "epoch": 0.05, "learning_rate": 4.734058322317826e-05, "loss": 2.945, "step": 30500 }, { "epoch": 0.05, "learning_rate": 4.729698622683692e-05, "loss": 2.9421, "step": 31000 }, { "epoch": 0.05, "learning_rate": 4.7253389230495575e-05, "loss": 2.9291, "step": 31500 }, { "epoch": 0.06, "learning_rate": 4.7209792234154237e-05, "loss": 2.9093, "step": 32000 }, { "epoch": 0.06, "learning_rate": 4.71661952378129e-05, "loss": 2.914, "step": 32500 }, { "epoch": 0.06, "learning_rate": 4.712259824147156e-05, "loss": 2.9038, "step": 33000 }, { "epoch": 0.06, "learning_rate": 4.7079001245130214e-05, "loss": 2.8911, "step": 33500 }, { "epoch": 0.06, "learning_rate": 4.7035404248788875e-05, "loss": 2.8811, "step": 34000 }, { "epoch": 0.06, "learning_rate": 4.699180725244754e-05, "loss": 2.8962, "step": 34500 }, { "epoch": 0.06, "learning_rate": 4.69482102561062e-05, "loss": 2.8896, "step": 35000 }, { "epoch": 0.06, "learning_rate": 4.690461325976486e-05, "loss": 2.886, "step": 35500 }, { "epoch": 0.06, "learning_rate": 4.686101626342352e-05, "loss": 2.8664, "step": 36000 }, { "epoch": 0.06, "learning_rate": 4.681741926708218e-05, "loss": 2.8638, "step": 36500 }, { "epoch": 0.06, "learning_rate": 4.677382227074084e-05, "loss": 2.8561, "step": 37000 }, { "epoch": 0.07, "learning_rate": 4.67302252743995e-05, "loss": 2.8694, "step": 37500 }, { "epoch": 0.07, "learning_rate": 4.668662827805816e-05, "loss": 2.8585, "step": 38000 }, { "epoch": 0.07, "learning_rate": 4.6643031281716814e-05, "loss": 2.8377, "step": 38500 }, { "epoch": 0.07, "learning_rate": 4.6599434285375476e-05, "loss": 2.8471, "step": 39000 }, { "epoch": 0.07, "learning_rate": 4.655583728903414e-05, "loss": 2.855, "step": 39500 }, { "epoch": 0.07, "learning_rate": 4.65122402926928e-05, "loss": 2.8583, "step": 40000 }, { "epoch": 0.07, "learning_rate": 4.646864329635145e-05, "loss": 2.8162, "step": 40500 }, { "epoch": 0.07, "learning_rate": 4.6425046300010114e-05, "loss": 2.8341, "step": 41000 }, { "epoch": 0.07, "learning_rate": 4.6381449303668776e-05, "loss": 2.8176, "step": 41500 }, { "epoch": 0.07, "learning_rate": 4.633785230732744e-05, "loss": 2.8046, "step": 42000 }, { "epoch": 0.07, "learning_rate": 4.62942553109861e-05, "loss": 2.8167, "step": 42500 }, { "epoch": 0.07, "learning_rate": 4.625065831464476e-05, "loss": 2.7942, "step": 43000 }, { "epoch": 0.08, "learning_rate": 4.620706131830342e-05, "loss": 2.8192, "step": 43500 }, { "epoch": 0.08, "learning_rate": 4.6163464321962076e-05, "loss": 2.8207, "step": 44000 }, { "epoch": 0.08, "learning_rate": 4.611986732562074e-05, "loss": 2.7887, "step": 44500 }, { "epoch": 0.08, "learning_rate": 4.60762703292794e-05, "loss": 2.8046, "step": 45000 }, { "epoch": 0.08, "learning_rate": 4.603267333293806e-05, "loss": 2.7617, "step": 45500 }, { "epoch": 0.08, "learning_rate": 4.5989076336596715e-05, "loss": 2.7807, "step": 46000 }, { "epoch": 0.08, "learning_rate": 4.5945479340255376e-05, "loss": 2.7942, "step": 46500 }, { "epoch": 0.08, "learning_rate": 4.590188234391404e-05, "loss": 2.7787, "step": 47000 }, { "epoch": 0.08, "learning_rate": 4.585828534757269e-05, "loss": 2.7708, "step": 47500 }, { "epoch": 0.08, "learning_rate": 4.5814688351231354e-05, "loss": 2.7828, "step": 48000 }, { "epoch": 0.08, "learning_rate": 4.5771091354890015e-05, "loss": 2.7828, "step": 48500 }, { "epoch": 0.09, "learning_rate": 4.5727494358548676e-05, "loss": 2.7639, "step": 49000 }, { "epoch": 0.09, "learning_rate": 4.568389736220733e-05, "loss": 2.7538, "step": 49500 }, { "epoch": 0.09, "learning_rate": 4.564030036586599e-05, "loss": 2.7618, "step": 50000 }, { "epoch": 0.09, "learning_rate": 4.5596703369524654e-05, "loss": 2.7534, "step": 50500 }, { "epoch": 0.09, "learning_rate": 4.5553106373183315e-05, "loss": 2.759, "step": 51000 }, { "epoch": 0.09, "learning_rate": 4.5509509376841977e-05, "loss": 2.7616, "step": 51500 }, { "epoch": 0.09, "learning_rate": 4.546591238050064e-05, "loss": 2.7393, "step": 52000 }, { "epoch": 0.09, "learning_rate": 4.54223153841593e-05, "loss": 2.7513, "step": 52500 }, { "epoch": 0.09, "learning_rate": 4.5378718387817954e-05, "loss": 2.7386, "step": 53000 }, { "epoch": 0.09, "learning_rate": 4.5335121391476615e-05, "loss": 2.7542, "step": 53500 }, { "epoch": 0.09, "learning_rate": 4.529152439513528e-05, "loss": 2.7503, "step": 54000 }, { "epoch": 0.1, "learning_rate": 4.524792739879393e-05, "loss": 2.7396, "step": 54500 }, { "epoch": 0.1, "learning_rate": 4.520433040245259e-05, "loss": 2.7056, "step": 55000 }, { "epoch": 0.1, "learning_rate": 4.5160733406111254e-05, "loss": 2.7219, "step": 55500 }, { "epoch": 0.1, "learning_rate": 4.5117136409769915e-05, "loss": 2.7176, "step": 56000 }, { "epoch": 0.1, "learning_rate": 4.507353941342857e-05, "loss": 2.7235, "step": 56500 }, { "epoch": 0.1, "learning_rate": 4.502994241708723e-05, "loss": 2.7279, "step": 57000 }, { "epoch": 0.1, "learning_rate": 4.498634542074589e-05, "loss": 2.7177, "step": 57500 }, { "epoch": 0.1, "learning_rate": 4.4942748424404554e-05, "loss": 2.7252, "step": 58000 }, { "epoch": 0.1, "learning_rate": 4.4899151428063216e-05, "loss": 2.7003, "step": 58500 }, { "epoch": 0.1, "learning_rate": 4.485555443172188e-05, "loss": 2.7073, "step": 59000 }, { "epoch": 0.1, "learning_rate": 4.481195743538054e-05, "loss": 2.6908, "step": 59500 }, { "epoch": 0.1, "learning_rate": 4.476836043903919e-05, "loss": 2.7133, "step": 60000 }, { "epoch": 0.11, "learning_rate": 4.4724763442697854e-05, "loss": 2.7251, "step": 60500 }, { "epoch": 0.11, "learning_rate": 4.4681166446356516e-05, "loss": 2.6973, "step": 61000 }, { "epoch": 0.11, "learning_rate": 4.463756945001518e-05, "loss": 2.7148, "step": 61500 }, { "epoch": 0.11, "learning_rate": 4.459397245367383e-05, "loss": 2.6953, "step": 62000 }, { "epoch": 0.11, "learning_rate": 4.455037545733249e-05, "loss": 2.6877, "step": 62500 }, { "epoch": 0.11, "learning_rate": 4.4506778460991155e-05, "loss": 2.7098, "step": 63000 }, { "epoch": 0.11, "learning_rate": 4.446318146464981e-05, "loss": 2.6791, "step": 63500 }, { "epoch": 0.11, "learning_rate": 4.441958446830847e-05, "loss": 2.688, "step": 64000 }, { "epoch": 0.11, "learning_rate": 4.437598747196713e-05, "loss": 2.6947, "step": 64500 }, { "epoch": 0.11, "learning_rate": 4.4332390475625793e-05, "loss": 2.6871, "step": 65000 }, { "epoch": 0.11, "learning_rate": 4.4288793479284455e-05, "loss": 2.6713, "step": 65500 }, { "epoch": 0.12, "learning_rate": 4.4245196482943116e-05, "loss": 2.6781, "step": 66000 }, { "epoch": 0.12, "learning_rate": 4.420159948660178e-05, "loss": 2.6799, "step": 66500 }, { "epoch": 0.12, "learning_rate": 4.415800249026043e-05, "loss": 2.6627, "step": 67000 }, { "epoch": 0.12, "learning_rate": 4.4114405493919094e-05, "loss": 2.6837, "step": 67500 }, { "epoch": 0.12, "learning_rate": 4.4070808497577755e-05, "loss": 2.6745, "step": 68000 }, { "epoch": 0.12, "learning_rate": 4.4027211501236416e-05, "loss": 2.6741, "step": 68500 }, { "epoch": 0.12, "learning_rate": 4.398361450489507e-05, "loss": 2.6666, "step": 69000 }, { "epoch": 0.12, "learning_rate": 4.394001750855373e-05, "loss": 2.6748, "step": 69500 }, { "epoch": 0.12, "learning_rate": 4.3896420512212394e-05, "loss": 2.6532, "step": 70000 }, { "epoch": 0.12, "learning_rate": 4.3852823515871055e-05, "loss": 2.6596, "step": 70500 }, { "epoch": 0.12, "learning_rate": 4.380922651952971e-05, "loss": 2.6524, "step": 71000 }, { "epoch": 0.12, "learning_rate": 4.376562952318837e-05, "loss": 2.64, "step": 71500 }, { "epoch": 0.13, "learning_rate": 4.372203252684703e-05, "loss": 2.6664, "step": 72000 }, { "epoch": 0.13, "learning_rate": 4.367843553050569e-05, "loss": 2.6496, "step": 72500 }, { "epoch": 0.13, "learning_rate": 4.363483853416435e-05, "loss": 2.6401, "step": 73000 }, { "epoch": 0.13, "learning_rate": 4.359124153782301e-05, "loss": 2.6422, "step": 73500 }, { "epoch": 0.13, "learning_rate": 4.354764454148167e-05, "loss": 2.6466, "step": 74000 }, { "epoch": 0.13, "learning_rate": 4.350404754514033e-05, "loss": 2.6331, "step": 74500 }, { "epoch": 0.13, "learning_rate": 4.3460450548798994e-05, "loss": 2.6435, "step": 75000 }, { "epoch": 0.13, "learning_rate": 4.3416853552457656e-05, "loss": 2.6557, "step": 75500 }, { "epoch": 0.13, "learning_rate": 4.337325655611631e-05, "loss": 2.6306, "step": 76000 }, { "epoch": 0.13, "learning_rate": 4.332965955977497e-05, "loss": 2.631, "step": 76500 }, { "epoch": 0.13, "learning_rate": 4.328606256343363e-05, "loss": 2.6575, "step": 77000 }, { "epoch": 0.14, "learning_rate": 4.3242465567092294e-05, "loss": 2.6436, "step": 77500 }, { "epoch": 0.14, "learning_rate": 4.319886857075095e-05, "loss": 2.6248, "step": 78000 }, { "epoch": 0.14, "learning_rate": 4.315527157440961e-05, "loss": 2.6213, "step": 78500 }, { "epoch": 0.14, "learning_rate": 4.311167457806827e-05, "loss": 2.6431, "step": 79000 }, { "epoch": 0.14, "learning_rate": 4.3068077581726926e-05, "loss": 2.6397, "step": 79500 }, { "epoch": 0.14, "learning_rate": 4.302448058538559e-05, "loss": 2.6158, "step": 80000 }, { "epoch": 0.14, "learning_rate": 4.298088358904425e-05, "loss": 2.6327, "step": 80500 }, { "epoch": 0.14, "learning_rate": 4.293728659270291e-05, "loss": 2.6201, "step": 81000 }, { "epoch": 0.14, "learning_rate": 4.289368959636157e-05, "loss": 2.6227, "step": 81500 }, { "epoch": 0.14, "learning_rate": 4.285009260002023e-05, "loss": 2.6222, "step": 82000 }, { "epoch": 0.14, "learning_rate": 4.2806495603678895e-05, "loss": 2.6215, "step": 82500 }, { "epoch": 0.14, "learning_rate": 4.276289860733755e-05, "loss": 2.6115, "step": 83000 }, { "epoch": 0.15, "learning_rate": 4.271930161099621e-05, "loss": 2.6067, "step": 83500 }, { "epoch": 0.15, "learning_rate": 4.267570461465487e-05, "loss": 2.6234, "step": 84000 }, { "epoch": 0.15, "learning_rate": 4.2632107618313533e-05, "loss": 2.6084, "step": 84500 }, { "epoch": 0.15, "learning_rate": 4.258851062197219e-05, "loss": 2.6051, "step": 85000 }, { "epoch": 0.15, "learning_rate": 4.254491362563085e-05, "loss": 2.6035, "step": 85500 }, { "epoch": 0.15, "learning_rate": 4.250131662928951e-05, "loss": 2.6023, "step": 86000 }, { "epoch": 0.15, "learning_rate": 4.245771963294817e-05, "loss": 2.5975, "step": 86500 }, { "epoch": 0.15, "learning_rate": 4.241412263660683e-05, "loss": 2.5987, "step": 87000 }, { "epoch": 0.15, "learning_rate": 4.237052564026549e-05, "loss": 2.5887, "step": 87500 }, { "epoch": 0.15, "learning_rate": 4.232692864392415e-05, "loss": 2.617, "step": 88000 }, { "epoch": 0.15, "learning_rate": 4.228333164758281e-05, "loss": 2.5967, "step": 88500 }, { "epoch": 0.16, "learning_rate": 4.223973465124147e-05, "loss": 2.6002, "step": 89000 }, { "epoch": 0.16, "learning_rate": 4.2196137654900134e-05, "loss": 2.5859, "step": 89500 }, { "epoch": 0.16, "learning_rate": 4.2152540658558795e-05, "loss": 2.605, "step": 90000 }, { "epoch": 0.16, "learning_rate": 4.210894366221745e-05, "loss": 2.5834, "step": 90500 }, { "epoch": 0.16, "learning_rate": 4.206534666587611e-05, "loss": 2.5869, "step": 91000 }, { "epoch": 0.16, "learning_rate": 4.202174966953477e-05, "loss": 2.5856, "step": 91500 }, { "epoch": 0.16, "learning_rate": 4.197815267319343e-05, "loss": 2.5791, "step": 92000 }, { "epoch": 0.16, "learning_rate": 4.193455567685209e-05, "loss": 2.5899, "step": 92500 }, { "epoch": 0.16, "learning_rate": 4.189095868051075e-05, "loss": 2.5982, "step": 93000 }, { "epoch": 0.16, "learning_rate": 4.184736168416941e-05, "loss": 2.5828, "step": 93500 }, { "epoch": 0.16, "learning_rate": 4.1803764687828066e-05, "loss": 2.5874, "step": 94000 }, { "epoch": 0.16, "learning_rate": 4.176016769148673e-05, "loss": 2.5749, "step": 94500 }, { "epoch": 0.17, "learning_rate": 4.171657069514539e-05, "loss": 2.5809, "step": 95000 }, { "epoch": 0.17, "learning_rate": 4.167297369880404e-05, "loss": 2.5824, "step": 95500 }, { "epoch": 0.17, "learning_rate": 4.1629376702462705e-05, "loss": 2.584, "step": 96000 }, { "epoch": 0.17, "learning_rate": 4.1585779706121366e-05, "loss": 2.5837, "step": 96500 }, { "epoch": 0.17, "learning_rate": 4.154218270978003e-05, "loss": 2.5784, "step": 97000 }, { "epoch": 0.17, "learning_rate": 4.149858571343869e-05, "loss": 2.5895, "step": 97500 }, { "epoch": 0.17, "learning_rate": 4.145498871709735e-05, "loss": 2.571, "step": 98000 }, { "epoch": 0.17, "learning_rate": 4.141139172075601e-05, "loss": 2.5712, "step": 98500 }, { "epoch": 0.17, "learning_rate": 4.136779472441467e-05, "loss": 2.5636, "step": 99000 }, { "epoch": 0.17, "learning_rate": 4.132419772807333e-05, "loss": 2.5699, "step": 99500 }, { "epoch": 0.17, "learning_rate": 4.128060073173199e-05, "loss": 2.5768, "step": 100000 }, { "epoch": 0.18, "learning_rate": 4.123700373539065e-05, "loss": 2.5644, "step": 100500 }, { "epoch": 0.18, "learning_rate": 4.1193406739049305e-05, "loss": 2.5699, "step": 101000 }, { "epoch": 0.18, "learning_rate": 4.1149809742707966e-05, "loss": 2.5651, "step": 101500 }, { "epoch": 0.18, "learning_rate": 4.110621274636663e-05, "loss": 2.5625, "step": 102000 }, { "epoch": 0.18, "learning_rate": 4.106261575002529e-05, "loss": 2.5617, "step": 102500 }, { "epoch": 0.18, "learning_rate": 4.1019018753683944e-05, "loss": 2.5593, "step": 103000 }, { "epoch": 0.18, "learning_rate": 4.0975421757342605e-05, "loss": 2.5751, "step": 103500 }, { "epoch": 0.18, "learning_rate": 4.093182476100127e-05, "loss": 2.554, "step": 104000 }, { "epoch": 0.18, "learning_rate": 4.088822776465993e-05, "loss": 2.5473, "step": 104500 }, { "epoch": 0.18, "learning_rate": 4.084463076831859e-05, "loss": 2.5546, "step": 105000 }, { "epoch": 0.18, "learning_rate": 4.080103377197725e-05, "loss": 2.5567, "step": 105500 }, { "epoch": 0.18, "learning_rate": 4.075743677563591e-05, "loss": 2.5422, "step": 106000 }, { "epoch": 0.19, "learning_rate": 4.071383977929457e-05, "loss": 2.5428, "step": 106500 }, { "epoch": 0.19, "learning_rate": 4.067024278295323e-05, "loss": 2.5522, "step": 107000 }, { "epoch": 0.19, "learning_rate": 4.062664578661189e-05, "loss": 2.5447, "step": 107500 }, { "epoch": 0.19, "learning_rate": 4.0583048790270544e-05, "loss": 2.5577, "step": 108000 }, { "epoch": 0.19, "learning_rate": 4.0539451793929206e-05, "loss": 2.5512, "step": 108500 }, { "epoch": 0.19, "learning_rate": 4.049585479758787e-05, "loss": 2.5744, "step": 109000 }, { "epoch": 0.19, "learning_rate": 4.045225780124653e-05, "loss": 2.5468, "step": 109500 }, { "epoch": 0.19, "learning_rate": 4.040866080490518e-05, "loss": 2.5397, "step": 110000 }, { "epoch": 0.19, "learning_rate": 4.0365063808563844e-05, "loss": 2.5598, "step": 110500 }, { "epoch": 0.19, "learning_rate": 4.0321466812222506e-05, "loss": 2.5554, "step": 111000 }, { "epoch": 0.19, "learning_rate": 4.027786981588117e-05, "loss": 2.545, "step": 111500 }, { "epoch": 0.2, "learning_rate": 4.023427281953983e-05, "loss": 2.5403, "step": 112000 }, { "epoch": 0.2, "learning_rate": 4.019067582319849e-05, "loss": 2.5293, "step": 112500 }, { "epoch": 0.2, "learning_rate": 4.014707882685715e-05, "loss": 2.557, "step": 113000 }, { "epoch": 0.2, "learning_rate": 4.0103481830515806e-05, "loss": 2.5597, "step": 113500 }, { "epoch": 0.2, "learning_rate": 4.005988483417447e-05, "loss": 2.5351, "step": 114000 }, { "epoch": 0.2, "learning_rate": 4.001628783783313e-05, "loss": 2.5318, "step": 114500 }, { "epoch": 0.2, "learning_rate": 3.997269084149179e-05, "loss": 2.5601, "step": 115000 }, { "epoch": 0.2, "learning_rate": 3.9929093845150445e-05, "loss": 2.5203, "step": 115500 }, { "epoch": 0.2, "learning_rate": 3.9885496848809106e-05, "loss": 2.5251, "step": 116000 }, { "epoch": 0.2, "learning_rate": 3.984189985246777e-05, "loss": 2.5424, "step": 116500 }, { "epoch": 0.2, "learning_rate": 3.979830285612642e-05, "loss": 2.5324, "step": 117000 }, { "epoch": 0.2, "learning_rate": 3.9754705859785084e-05, "loss": 2.5238, "step": 117500 }, { "epoch": 0.21, "learning_rate": 3.9711108863443745e-05, "loss": 2.5231, "step": 118000 }, { "epoch": 0.21, "learning_rate": 3.9667511867102406e-05, "loss": 2.5361, "step": 118500 }, { "epoch": 0.21, "learning_rate": 3.962391487076106e-05, "loss": 2.5367, "step": 119000 }, { "epoch": 0.21, "learning_rate": 3.958031787441972e-05, "loss": 2.5504, "step": 119500 }, { "epoch": 0.21, "learning_rate": 3.9536720878078384e-05, "loss": 2.5164, "step": 120000 }, { "epoch": 0.21, "learning_rate": 3.9493123881737045e-05, "loss": 2.5362, "step": 120500 }, { "epoch": 0.21, "learning_rate": 3.9449526885395707e-05, "loss": 2.5249, "step": 121000 }, { "epoch": 0.21, "learning_rate": 3.940592988905437e-05, "loss": 2.5258, "step": 121500 }, { "epoch": 0.21, "learning_rate": 3.936233289271303e-05, "loss": 2.5254, "step": 122000 }, { "epoch": 0.21, "learning_rate": 3.9318735896371684e-05, "loss": 2.5352, "step": 122500 }, { "epoch": 0.21, "learning_rate": 3.9275138900030345e-05, "loss": 2.516, "step": 123000 }, { "epoch": 0.22, "learning_rate": 3.923154190368901e-05, "loss": 2.5314, "step": 123500 }, { "epoch": 0.22, "learning_rate": 3.918794490734767e-05, "loss": 2.5212, "step": 124000 }, { "epoch": 0.22, "learning_rate": 3.914434791100632e-05, "loss": 2.5217, "step": 124500 }, { "epoch": 0.22, "learning_rate": 3.9100750914664984e-05, "loss": 2.5368, "step": 125000 }, { "epoch": 0.22, "learning_rate": 3.9057153918323645e-05, "loss": 2.5083, "step": 125500 }, { "epoch": 0.22, "learning_rate": 3.90135569219823e-05, "loss": 2.5115, "step": 126000 }, { "epoch": 0.22, "learning_rate": 3.896995992564096e-05, "loss": 2.5327, "step": 126500 }, { "epoch": 0.22, "learning_rate": 3.892636292929962e-05, "loss": 2.4913, "step": 127000 }, { "epoch": 0.22, "learning_rate": 3.8882765932958284e-05, "loss": 2.4975, "step": 127500 }, { "epoch": 0.22, "learning_rate": 3.8839168936616946e-05, "loss": 2.511, "step": 128000 }, { "epoch": 0.22, "learning_rate": 3.879557194027561e-05, "loss": 2.5149, "step": 128500 }, { "epoch": 0.22, "learning_rate": 3.875197494393427e-05, "loss": 2.502, "step": 129000 }, { "epoch": 0.23, "learning_rate": 3.870837794759292e-05, "loss": 2.4992, "step": 129500 }, { "epoch": 0.23, "learning_rate": 3.8664780951251584e-05, "loss": 2.5071, "step": 130000 }, { "epoch": 0.23, "learning_rate": 3.8621183954910246e-05, "loss": 2.5123, "step": 130500 }, { "epoch": 0.23, "learning_rate": 3.857758695856891e-05, "loss": 2.4968, "step": 131000 }, { "epoch": 0.23, "learning_rate": 3.853398996222756e-05, "loss": 2.5091, "step": 131500 }, { "epoch": 0.23, "learning_rate": 3.849039296588622e-05, "loss": 2.5059, "step": 132000 }, { "epoch": 0.23, "learning_rate": 3.8446795969544885e-05, "loss": 2.501, "step": 132500 }, { "epoch": 0.23, "learning_rate": 3.840319897320354e-05, "loss": 2.5034, "step": 133000 }, { "epoch": 0.23, "learning_rate": 3.83596019768622e-05, "loss": 2.5065, "step": 133500 }, { "epoch": 0.23, "learning_rate": 3.831600498052086e-05, "loss": 2.4937, "step": 134000 }, { "epoch": 0.23, "learning_rate": 3.8272407984179523e-05, "loss": 2.5109, "step": 134500 }, { "epoch": 0.24, "learning_rate": 3.8228810987838185e-05, "loss": 2.4983, "step": 135000 }, { "epoch": 0.24, "learning_rate": 3.8185213991496846e-05, "loss": 2.4944, "step": 135500 }, { "epoch": 0.24, "learning_rate": 3.814161699515551e-05, "loss": 2.4964, "step": 136000 }, { "epoch": 0.24, "learning_rate": 3.809801999881417e-05, "loss": 2.4916, "step": 136500 }, { "epoch": 0.24, "learning_rate": 3.8054423002472824e-05, "loss": 2.5128, "step": 137000 }, { "epoch": 0.24, "learning_rate": 3.8010826006131485e-05, "loss": 2.4886, "step": 137500 }, { "epoch": 0.24, "learning_rate": 3.7967229009790146e-05, "loss": 2.4835, "step": 138000 }, { "epoch": 0.24, "learning_rate": 3.79236320134488e-05, "loss": 2.4954, "step": 138500 }, { "epoch": 0.24, "learning_rate": 3.788003501710746e-05, "loss": 2.4935, "step": 139000 }, { "epoch": 0.24, "learning_rate": 3.7836438020766124e-05, "loss": 2.4825, "step": 139500 }, { "epoch": 0.24, "learning_rate": 3.7792841024424785e-05, "loss": 2.5103, "step": 140000 }, { "epoch": 0.25, "learning_rate": 3.774924402808344e-05, "loss": 2.4995, "step": 140500 }, { "epoch": 0.25, "learning_rate": 3.77056470317421e-05, "loss": 2.4935, "step": 141000 }, { "epoch": 0.25, "learning_rate": 3.766205003540076e-05, "loss": 2.5006, "step": 141500 }, { "epoch": 0.25, "learning_rate": 3.761845303905942e-05, "loss": 2.4913, "step": 142000 }, { "epoch": 0.25, "learning_rate": 3.757485604271808e-05, "loss": 2.4799, "step": 142500 }, { "epoch": 0.25, "learning_rate": 3.753125904637674e-05, "loss": 2.4833, "step": 143000 }, { "epoch": 0.25, "learning_rate": 3.748766205003541e-05, "loss": 2.495, "step": 143500 }, { "epoch": 0.25, "learning_rate": 3.744406505369406e-05, "loss": 2.4815, "step": 144000 }, { "epoch": 0.25, "learning_rate": 3.7400468057352724e-05, "loss": 2.4914, "step": 144500 }, { "epoch": 0.25, "learning_rate": 3.7356871061011385e-05, "loss": 2.4826, "step": 145000 }, { "epoch": 0.25, "learning_rate": 3.731327406467004e-05, "loss": 2.4923, "step": 145500 }, { "epoch": 0.25, "learning_rate": 3.72696770683287e-05, "loss": 2.4838, "step": 146000 }, { "epoch": 0.26, "learning_rate": 3.722608007198736e-05, "loss": 2.4831, "step": 146500 }, { "epoch": 0.26, "learning_rate": 3.7182483075646024e-05, "loss": 2.4867, "step": 147000 }, { "epoch": 0.26, "learning_rate": 3.713888607930468e-05, "loss": 2.4856, "step": 147500 }, { "epoch": 0.26, "learning_rate": 3.709528908296334e-05, "loss": 2.4846, "step": 148000 }, { "epoch": 0.26, "learning_rate": 3.7051692086622e-05, "loss": 2.4948, "step": 148500 }, { "epoch": 0.26, "learning_rate": 3.700809509028066e-05, "loss": 2.4816, "step": 149000 }, { "epoch": 0.26, "learning_rate": 3.696449809393932e-05, "loss": 2.4807, "step": 149500 }, { "epoch": 0.26, "learning_rate": 3.692090109759798e-05, "loss": 2.4847, "step": 150000 }, { "epoch": 0.26, "learning_rate": 3.687730410125664e-05, "loss": 2.4854, "step": 150500 }, { "epoch": 0.26, "learning_rate": 3.68337071049153e-05, "loss": 2.45, "step": 151000 }, { "epoch": 0.26, "learning_rate": 3.679011010857396e-05, "loss": 2.467, "step": 151500 }, { "epoch": 0.27, "learning_rate": 3.6746513112232625e-05, "loss": 2.489, "step": 152000 }, { "epoch": 0.27, "learning_rate": 3.6745641172305795e-05, "loss": 2.4486, "step": 152010 }, { "epoch": 0.27, "learning_rate": 3.6744769232378965e-05, "loss": 2.5418, "step": 152020 }, { "epoch": 0.27, "learning_rate": 3.674389729245214e-05, "loss": 2.487, "step": 152030 }, { "epoch": 0.27, "learning_rate": 3.674302535252531e-05, "loss": 2.5183, "step": 152040 }, { "epoch": 0.27, "learning_rate": 3.674215341259849e-05, "loss": 2.5454, "step": 152050 }, { "epoch": 0.27, "learning_rate": 3.674128147267166e-05, "loss": 2.5318, "step": 152060 }, { "epoch": 0.27, "learning_rate": 3.674040953274484e-05, "loss": 2.6745, "step": 152070 }, { "epoch": 0.27, "learning_rate": 3.673953759281801e-05, "loss": 2.539, "step": 152080 }, { "epoch": 0.27, "learning_rate": 3.673866565289118e-05, "loss": 2.5846, "step": 152090 }, { "epoch": 0.27, "learning_rate": 3.6737793712964356e-05, "loss": 2.4039, "step": 152100 }, { "epoch": 0.27, "learning_rate": 3.6736921773037526e-05, "loss": 2.4249, "step": 152110 }, { "epoch": 0.27, "learning_rate": 3.6736049833110696e-05, "loss": 2.4787, "step": 152120 }, { "epoch": 0.27, "learning_rate": 3.6735177893183873e-05, "loss": 2.5389, "step": 152130 }, { "epoch": 0.27, "learning_rate": 3.673430595325705e-05, "loss": 2.4451, "step": 152140 }, { "epoch": 0.27, "learning_rate": 3.673343401333022e-05, "loss": 2.438, "step": 152150 }, { "epoch": 0.27, "learning_rate": 3.673256207340339e-05, "loss": 2.4797, "step": 152160 }, { "epoch": 0.27, "learning_rate": 3.673169013347656e-05, "loss": 2.531, "step": 152170 }, { "epoch": 0.27, "learning_rate": 3.673081819354974e-05, "loss": 2.4701, "step": 152180 }, { "epoch": 0.27, "learning_rate": 3.672994625362291e-05, "loss": 2.347, "step": 152190 }, { "epoch": 0.27, "learning_rate": 3.6729074313696086e-05, "loss": 2.521, "step": 152200 }, { "epoch": 0.27, "learning_rate": 3.6728202373769264e-05, "loss": 2.4582, "step": 152210 }, { "epoch": 0.27, "learning_rate": 3.6727330433842434e-05, "loss": 2.457, "step": 152220 }, { "epoch": 0.27, "learning_rate": 3.6726458493915604e-05, "loss": 2.4437, "step": 152230 }, { "epoch": 0.27, "learning_rate": 3.6725586553988775e-05, "loss": 2.4435, "step": 152240 }, { "epoch": 0.27, "learning_rate": 3.672471461406195e-05, "loss": 2.5245, "step": 152250 }, { "epoch": 0.27, "learning_rate": 3.672384267413512e-05, "loss": 2.4433, "step": 152260 }, { "epoch": 0.27, "learning_rate": 3.672297073420829e-05, "loss": 2.4936, "step": 152270 }, { "epoch": 0.27, "learning_rate": 3.672209879428147e-05, "loss": 2.3041, "step": 152280 }, { "epoch": 0.27, "learning_rate": 3.672122685435465e-05, "loss": 2.3409, "step": 152290 }, { "epoch": 0.27, "learning_rate": 3.672035491442782e-05, "loss": 2.4557, "step": 152300 }, { "epoch": 0.27, "learning_rate": 3.671948297450099e-05, "loss": 2.4309, "step": 152310 }, { "epoch": 0.27, "learning_rate": 3.6718611034574165e-05, "loss": 2.4952, "step": 152320 }, { "epoch": 0.27, "learning_rate": 3.6717739094647335e-05, "loss": 2.4949, "step": 152330 }, { "epoch": 0.27, "learning_rate": 3.6716867154720506e-05, "loss": 2.4713, "step": 152340 }, { "epoch": 0.27, "learning_rate": 3.671599521479368e-05, "loss": 2.3882, "step": 152350 }, { "epoch": 0.27, "learning_rate": 3.671512327486686e-05, "loss": 2.5458, "step": 152360 }, { "epoch": 0.27, "learning_rate": 3.671425133494003e-05, "loss": 2.5279, "step": 152370 }, { "epoch": 0.27, "learning_rate": 3.67133793950132e-05, "loss": 2.5048, "step": 152380 }, { "epoch": 0.27, "learning_rate": 3.671250745508638e-05, "loss": 2.3942, "step": 152390 }, { "epoch": 0.27, "learning_rate": 3.671163551515955e-05, "loss": 2.5749, "step": 152400 }, { "epoch": 0.27, "learning_rate": 3.671076357523272e-05, "loss": 2.4163, "step": 152410 }, { "epoch": 0.27, "learning_rate": 3.6709891635305896e-05, "loss": 2.5594, "step": 152420 }, { "epoch": 0.27, "learning_rate": 3.670901969537907e-05, "loss": 2.5412, "step": 152430 }, { "epoch": 0.27, "learning_rate": 3.6708147755452243e-05, "loss": 2.4455, "step": 152440 }, { "epoch": 0.27, "learning_rate": 3.6707275815525414e-05, "loss": 2.5134, "step": 152450 }, { "epoch": 0.27, "learning_rate": 3.670640387559859e-05, "loss": 2.4105, "step": 152460 }, { "epoch": 0.27, "learning_rate": 3.670553193567176e-05, "loss": 2.4572, "step": 152470 }, { "epoch": 0.27, "learning_rate": 3.670465999574493e-05, "loss": 2.4765, "step": 152480 }, { "epoch": 0.27, "learning_rate": 3.670378805581811e-05, "loss": 2.5432, "step": 152490 }, { "epoch": 0.27, "learning_rate": 3.6702916115891286e-05, "loss": 2.5638, "step": 152500 }, { "epoch": 0.27, "learning_rate": 3.6702044175964456e-05, "loss": 2.4502, "step": 152510 }, { "epoch": 0.27, "learning_rate": 3.670117223603763e-05, "loss": 2.448, "step": 152520 }, { "epoch": 0.27, "learning_rate": 3.6700300296110804e-05, "loss": 2.4897, "step": 152530 }, { "epoch": 0.27, "learning_rate": 3.6699428356183974e-05, "loss": 2.4653, "step": 152540 }, { "epoch": 0.27, "learning_rate": 3.6698556416257145e-05, "loss": 2.3926, "step": 152550 }, { "epoch": 0.27, "learning_rate": 3.6697684476330315e-05, "loss": 2.3552, "step": 152560 }, { "epoch": 0.27, "learning_rate": 3.66968125364035e-05, "loss": 2.475, "step": 152570 }, { "epoch": 0.27, "learning_rate": 3.669594059647667e-05, "loss": 2.6209, "step": 152580 }, { "epoch": 0.27, "learning_rate": 3.669506865654984e-05, "loss": 2.4461, "step": 152590 }, { "epoch": 0.27, "learning_rate": 3.669419671662302e-05, "loss": 2.4276, "step": 152600 }, { "epoch": 0.27, "learning_rate": 3.669332477669619e-05, "loss": 2.4866, "step": 152610 }, { "epoch": 0.27, "learning_rate": 3.669245283676936e-05, "loss": 2.5518, "step": 152620 }, { "epoch": 0.27, "learning_rate": 3.669158089684253e-05, "loss": 2.4193, "step": 152630 }, { "epoch": 0.27, "learning_rate": 3.6690708956915705e-05, "loss": 2.4557, "step": 152640 }, { "epoch": 0.27, "learning_rate": 3.668983701698888e-05, "loss": 2.5545, "step": 152650 }, { "epoch": 0.27, "learning_rate": 3.668896507706205e-05, "loss": 2.4605, "step": 152660 }, { "epoch": 0.27, "learning_rate": 3.668809313713522e-05, "loss": 2.5508, "step": 152670 }, { "epoch": 0.27, "learning_rate": 3.66872211972084e-05, "loss": 2.3837, "step": 152680 }, { "epoch": 0.27, "learning_rate": 3.668634925728157e-05, "loss": 2.5232, "step": 152690 }, { "epoch": 0.27, "learning_rate": 3.668547731735474e-05, "loss": 2.451, "step": 152700 }, { "epoch": 0.27, "learning_rate": 3.668460537742792e-05, "loss": 2.5399, "step": 152710 }, { "epoch": 0.27, "learning_rate": 3.6683733437501095e-05, "loss": 2.4515, "step": 152720 }, { "epoch": 0.27, "learning_rate": 3.6682861497574266e-05, "loss": 2.523, "step": 152730 }, { "epoch": 0.27, "learning_rate": 3.6681989557647436e-05, "loss": 2.3892, "step": 152740 }, { "epoch": 0.27, "learning_rate": 3.668111761772061e-05, "loss": 2.5305, "step": 152750 }, { "epoch": 0.27, "learning_rate": 3.6680245677793784e-05, "loss": 2.4433, "step": 152760 }, { "epoch": 0.27, "learning_rate": 3.6679373737866954e-05, "loss": 2.2944, "step": 152770 }, { "epoch": 0.27, "learning_rate": 3.667850179794013e-05, "loss": 2.4241, "step": 152780 }, { "epoch": 0.27, "learning_rate": 3.66776298580133e-05, "loss": 2.5217, "step": 152790 }, { "epoch": 0.27, "learning_rate": 3.667675791808648e-05, "loss": 2.4226, "step": 152800 }, { "epoch": 0.27, "learning_rate": 3.667588597815965e-05, "loss": 2.3673, "step": 152810 }, { "epoch": 0.27, "learning_rate": 3.6675014038232826e-05, "loss": 2.446, "step": 152820 }, { "epoch": 0.27, "learning_rate": 3.6674142098306e-05, "loss": 2.5055, "step": 152830 }, { "epoch": 0.27, "learning_rate": 3.667327015837917e-05, "loss": 2.4555, "step": 152840 }, { "epoch": 0.27, "learning_rate": 3.6672398218452344e-05, "loss": 2.3256, "step": 152850 }, { "epoch": 0.27, "learning_rate": 3.6671526278525515e-05, "loss": 2.5913, "step": 152860 }, { "epoch": 0.27, "learning_rate": 3.667065433859869e-05, "loss": 2.5243, "step": 152870 }, { "epoch": 0.27, "learning_rate": 3.666978239867186e-05, "loss": 2.518, "step": 152880 }, { "epoch": 0.27, "learning_rate": 3.666891045874504e-05, "loss": 2.3962, "step": 152890 }, { "epoch": 0.27, "learning_rate": 3.666803851881821e-05, "loss": 2.5183, "step": 152900 }, { "epoch": 0.27, "learning_rate": 3.666716657889138e-05, "loss": 2.4048, "step": 152910 }, { "epoch": 0.27, "learning_rate": 3.666629463896456e-05, "loss": 2.4158, "step": 152920 }, { "epoch": 0.27, "learning_rate": 3.666542269903773e-05, "loss": 2.5343, "step": 152930 }, { "epoch": 0.27, "learning_rate": 3.66645507591109e-05, "loss": 2.5247, "step": 152940 }, { "epoch": 0.27, "learning_rate": 3.6663678819184075e-05, "loss": 2.586, "step": 152950 }, { "epoch": 0.27, "learning_rate": 3.666280687925725e-05, "loss": 2.4529, "step": 152960 }, { "epoch": 0.27, "learning_rate": 3.666193493933042e-05, "loss": 2.4641, "step": 152970 }, { "epoch": 0.27, "learning_rate": 3.666106299940359e-05, "loss": 2.473, "step": 152980 }, { "epoch": 0.27, "learning_rate": 3.666019105947677e-05, "loss": 2.6165, "step": 152990 }, { "epoch": 0.27, "learning_rate": 3.665931911954994e-05, "loss": 2.438, "step": 153000 }, { "epoch": 0.27, "learning_rate": 3.665844717962311e-05, "loss": 2.5722, "step": 153010 }, { "epoch": 0.27, "learning_rate": 3.665757523969629e-05, "loss": 2.3216, "step": 153020 }, { "epoch": 0.27, "learning_rate": 3.6656703299769465e-05, "loss": 2.4708, "step": 153030 }, { "epoch": 0.27, "learning_rate": 3.6655831359842636e-05, "loss": 2.4548, "step": 153040 }, { "epoch": 0.27, "learning_rate": 3.6654959419915806e-05, "loss": 2.553, "step": 153050 }, { "epoch": 0.27, "learning_rate": 3.665408747998898e-05, "loss": 2.3702, "step": 153060 }, { "epoch": 0.27, "learning_rate": 3.6653215540062154e-05, "loss": 2.4696, "step": 153070 }, { "epoch": 0.27, "learning_rate": 3.6652343600135324e-05, "loss": 2.4943, "step": 153080 }, { "epoch": 0.27, "learning_rate": 3.6651471660208494e-05, "loss": 2.4602, "step": 153090 }, { "epoch": 0.27, "learning_rate": 3.665059972028168e-05, "loss": 2.5162, "step": 153100 }, { "epoch": 0.27, "learning_rate": 3.664972778035485e-05, "loss": 2.5272, "step": 153110 }, { "epoch": 0.27, "learning_rate": 3.664885584042802e-05, "loss": 2.5137, "step": 153120 }, { "epoch": 0.27, "learning_rate": 3.664798390050119e-05, "loss": 2.4247, "step": 153130 }, { "epoch": 0.27, "learning_rate": 3.664711196057437e-05, "loss": 2.5762, "step": 153140 }, { "epoch": 0.27, "learning_rate": 3.664624002064754e-05, "loss": 2.3815, "step": 153150 }, { "epoch": 0.27, "learning_rate": 3.664536808072071e-05, "loss": 2.5058, "step": 153160 }, { "epoch": 0.27, "learning_rate": 3.664449614079389e-05, "loss": 2.5451, "step": 153170 }, { "epoch": 0.27, "learning_rate": 3.664362420086706e-05, "loss": 2.4483, "step": 153180 }, { "epoch": 0.27, "learning_rate": 3.664275226094023e-05, "loss": 2.5478, "step": 153190 }, { "epoch": 0.27, "learning_rate": 3.66418803210134e-05, "loss": 2.47, "step": 153200 }, { "epoch": 0.27, "learning_rate": 3.664100838108658e-05, "loss": 2.5263, "step": 153210 }, { "epoch": 0.27, "learning_rate": 3.664013644115975e-05, "loss": 2.4633, "step": 153220 }, { "epoch": 0.27, "learning_rate": 3.663926450123292e-05, "loss": 2.4284, "step": 153230 }, { "epoch": 0.27, "learning_rate": 3.66383925613061e-05, "loss": 2.5113, "step": 153240 }, { "epoch": 0.27, "learning_rate": 3.6637520621379275e-05, "loss": 2.5383, "step": 153250 }, { "epoch": 0.27, "learning_rate": 3.6636648681452445e-05, "loss": 2.5392, "step": 153260 }, { "epoch": 0.27, "learning_rate": 3.6635776741525615e-05, "loss": 2.4705, "step": 153270 }, { "epoch": 0.27, "learning_rate": 3.663490480159879e-05, "loss": 2.4512, "step": 153280 }, { "epoch": 0.27, "learning_rate": 3.663403286167196e-05, "loss": 2.4616, "step": 153290 }, { "epoch": 0.27, "learning_rate": 3.6633160921745133e-05, "loss": 2.586, "step": 153300 }, { "epoch": 0.27, "learning_rate": 3.663228898181831e-05, "loss": 2.5649, "step": 153310 }, { "epoch": 0.27, "learning_rate": 3.663141704189149e-05, "loss": 2.3707, "step": 153320 }, { "epoch": 0.27, "learning_rate": 3.663054510196466e-05, "loss": 2.3424, "step": 153330 }, { "epoch": 0.27, "learning_rate": 3.662967316203783e-05, "loss": 2.4832, "step": 153340 }, { "epoch": 0.27, "learning_rate": 3.6628801222111006e-05, "loss": 2.4943, "step": 153350 }, { "epoch": 0.27, "learning_rate": 3.6627929282184176e-05, "loss": 2.4926, "step": 153360 }, { "epoch": 0.27, "learning_rate": 3.6627057342257346e-05, "loss": 2.4588, "step": 153370 }, { "epoch": 0.27, "learning_rate": 3.6626185402330524e-05, "loss": 2.4157, "step": 153380 }, { "epoch": 0.27, "learning_rate": 3.66253134624037e-05, "loss": 2.3983, "step": 153390 }, { "epoch": 0.27, "learning_rate": 3.662444152247687e-05, "loss": 2.5982, "step": 153400 }, { "epoch": 0.27, "learning_rate": 3.662356958255004e-05, "loss": 2.5575, "step": 153410 }, { "epoch": 0.27, "learning_rate": 3.662269764262322e-05, "loss": 2.5491, "step": 153420 }, { "epoch": 0.27, "learning_rate": 3.662182570269639e-05, "loss": 2.6, "step": 153430 }, { "epoch": 0.27, "learning_rate": 3.662095376276956e-05, "loss": 2.4442, "step": 153440 }, { "epoch": 0.27, "learning_rate": 3.6620081822842737e-05, "loss": 2.4518, "step": 153450 }, { "epoch": 0.27, "learning_rate": 3.661920988291591e-05, "loss": 2.4971, "step": 153460 }, { "epoch": 0.27, "learning_rate": 3.6618337942989084e-05, "loss": 2.5864, "step": 153470 }, { "epoch": 0.27, "learning_rate": 3.6617466003062254e-05, "loss": 2.4505, "step": 153480 }, { "epoch": 0.27, "learning_rate": 3.661659406313543e-05, "loss": 2.4895, "step": 153490 }, { "epoch": 0.27, "learning_rate": 3.66157221232086e-05, "loss": 2.4581, "step": 153500 }, { "epoch": 0.27, "learning_rate": 3.661485018328177e-05, "loss": 2.508, "step": 153510 }, { "epoch": 0.27, "learning_rate": 3.661397824335494e-05, "loss": 2.4373, "step": 153520 }, { "epoch": 0.27, "learning_rate": 3.661310630342812e-05, "loss": 2.4385, "step": 153530 }, { "epoch": 0.27, "learning_rate": 3.66122343635013e-05, "loss": 2.4961, "step": 153540 }, { "epoch": 0.27, "learning_rate": 3.661136242357447e-05, "loss": 2.5488, "step": 153550 }, { "epoch": 0.27, "learning_rate": 3.6610490483647645e-05, "loss": 2.5372, "step": 153560 }, { "epoch": 0.27, "learning_rate": 3.6609618543720815e-05, "loss": 2.435, "step": 153570 }, { "epoch": 0.27, "learning_rate": 3.6608746603793985e-05, "loss": 2.477, "step": 153580 }, { "epoch": 0.27, "learning_rate": 3.6607874663867156e-05, "loss": 2.513, "step": 153590 }, { "epoch": 0.27, "learning_rate": 3.660700272394033e-05, "loss": 2.5042, "step": 153600 }, { "epoch": 0.27, "learning_rate": 3.66061307840135e-05, "loss": 2.3907, "step": 153610 }, { "epoch": 0.27, "learning_rate": 3.660525884408668e-05, "loss": 2.3942, "step": 153620 }, { "epoch": 0.27, "learning_rate": 3.660438690415985e-05, "loss": 2.5732, "step": 153630 }, { "epoch": 0.27, "learning_rate": 3.660351496423303e-05, "loss": 2.4726, "step": 153640 }, { "epoch": 0.27, "learning_rate": 3.66026430243062e-05, "loss": 2.6508, "step": 153650 }, { "epoch": 0.27, "learning_rate": 3.660177108437937e-05, "loss": 2.561, "step": 153660 }, { "epoch": 0.27, "learning_rate": 3.6600899144452546e-05, "loss": 2.4914, "step": 153670 }, { "epoch": 0.27, "learning_rate": 3.6600027204525716e-05, "loss": 2.5237, "step": 153680 }, { "epoch": 0.27, "learning_rate": 3.6599155264598893e-05, "loss": 2.5076, "step": 153690 }, { "epoch": 0.27, "learning_rate": 3.6598283324672064e-05, "loss": 2.5305, "step": 153700 }, { "epoch": 0.27, "learning_rate": 3.659741138474524e-05, "loss": 2.4579, "step": 153710 }, { "epoch": 0.27, "learning_rate": 3.659653944481841e-05, "loss": 2.514, "step": 153720 }, { "epoch": 0.27, "learning_rate": 3.659566750489158e-05, "loss": 2.4739, "step": 153730 }, { "epoch": 0.27, "learning_rate": 3.659479556496476e-05, "loss": 2.4183, "step": 153740 }, { "epoch": 0.27, "learning_rate": 3.659392362503793e-05, "loss": 2.5075, "step": 153750 }, { "epoch": 0.27, "learning_rate": 3.65930516851111e-05, "loss": 2.3852, "step": 153760 }, { "epoch": 0.27, "learning_rate": 3.659217974518428e-05, "loss": 2.4561, "step": 153770 }, { "epoch": 0.27, "learning_rate": 3.6591307805257454e-05, "loss": 2.5005, "step": 153780 }, { "epoch": 0.27, "learning_rate": 3.6590435865330624e-05, "loss": 2.4754, "step": 153790 }, { "epoch": 0.27, "learning_rate": 3.6589563925403795e-05, "loss": 2.4185, "step": 153800 }, { "epoch": 0.27, "learning_rate": 3.658869198547697e-05, "loss": 2.4837, "step": 153810 }, { "epoch": 0.27, "learning_rate": 3.658782004555014e-05, "loss": 2.5526, "step": 153820 }, { "epoch": 0.27, "learning_rate": 3.658694810562331e-05, "loss": 2.3712, "step": 153830 }, { "epoch": 0.27, "learning_rate": 3.658607616569649e-05, "loss": 2.5492, "step": 153840 }, { "epoch": 0.27, "learning_rate": 3.658520422576967e-05, "loss": 2.5242, "step": 153850 }, { "epoch": 0.27, "learning_rate": 3.658433228584284e-05, "loss": 2.3864, "step": 153860 }, { "epoch": 0.27, "learning_rate": 3.658346034591601e-05, "loss": 2.5395, "step": 153870 }, { "epoch": 0.27, "learning_rate": 3.6582588405989185e-05, "loss": 2.444, "step": 153880 }, { "epoch": 0.27, "learning_rate": 3.6581716466062355e-05, "loss": 2.5091, "step": 153890 }, { "epoch": 0.27, "learning_rate": 3.6580844526135526e-05, "loss": 2.356, "step": 153900 }, { "epoch": 0.27, "learning_rate": 3.65799725862087e-05, "loss": 2.5168, "step": 153910 }, { "epoch": 0.27, "learning_rate": 3.657910064628188e-05, "loss": 2.5785, "step": 153920 }, { "epoch": 0.27, "learning_rate": 3.657822870635505e-05, "loss": 2.4682, "step": 153930 }, { "epoch": 0.27, "learning_rate": 3.657735676642822e-05, "loss": 2.4289, "step": 153940 }, { "epoch": 0.27, "learning_rate": 3.65764848265014e-05, "loss": 2.5931, "step": 153950 }, { "epoch": 0.27, "learning_rate": 3.657561288657457e-05, "loss": 2.4355, "step": 153960 }, { "epoch": 0.27, "learning_rate": 3.657474094664774e-05, "loss": 2.4306, "step": 153970 }, { "epoch": 0.27, "learning_rate": 3.657386900672091e-05, "loss": 2.421, "step": 153980 }, { "epoch": 0.27, "learning_rate": 3.657299706679409e-05, "loss": 2.4914, "step": 153990 }, { "epoch": 0.27, "learning_rate": 3.6572125126867263e-05, "loss": 2.4436, "step": 154000 }, { "epoch": 0.27, "learning_rate": 3.6571253186940434e-05, "loss": 2.4277, "step": 154010 }, { "epoch": 0.27, "learning_rate": 3.657038124701361e-05, "loss": 2.5265, "step": 154020 }, { "epoch": 0.27, "learning_rate": 3.656950930708678e-05, "loss": 2.3525, "step": 154030 }, { "epoch": 0.27, "learning_rate": 3.656863736715995e-05, "loss": 2.4789, "step": 154040 }, { "epoch": 0.27, "learning_rate": 3.656776542723312e-05, "loss": 2.4033, "step": 154050 }, { "epoch": 0.27, "learning_rate": 3.6566893487306306e-05, "loss": 2.4459, "step": 154060 }, { "epoch": 0.27, "learning_rate": 3.6566021547379476e-05, "loss": 2.5555, "step": 154070 }, { "epoch": 0.27, "learning_rate": 3.656514960745265e-05, "loss": 2.4849, "step": 154080 }, { "epoch": 0.27, "learning_rate": 3.656427766752582e-05, "loss": 2.5541, "step": 154090 }, { "epoch": 0.27, "learning_rate": 3.6563405727598994e-05, "loss": 2.4857, "step": 154100 }, { "epoch": 0.27, "learning_rate": 3.6562533787672165e-05, "loss": 2.5062, "step": 154110 }, { "epoch": 0.27, "learning_rate": 3.6561661847745335e-05, "loss": 2.5225, "step": 154120 }, { "epoch": 0.27, "learning_rate": 3.656078990781851e-05, "loss": 2.5021, "step": 154130 }, { "epoch": 0.27, "learning_rate": 3.655991796789169e-05, "loss": 2.4613, "step": 154140 }, { "epoch": 0.27, "learning_rate": 3.655904602796486e-05, "loss": 2.4709, "step": 154150 }, { "epoch": 0.27, "learning_rate": 3.655817408803803e-05, "loss": 2.432, "step": 154160 }, { "epoch": 0.27, "learning_rate": 3.655730214811121e-05, "loss": 2.444, "step": 154170 }, { "epoch": 0.27, "learning_rate": 3.655643020818438e-05, "loss": 2.4323, "step": 154180 }, { "epoch": 0.27, "learning_rate": 3.655555826825755e-05, "loss": 2.4727, "step": 154190 }, { "epoch": 0.27, "learning_rate": 3.6554686328330725e-05, "loss": 2.4011, "step": 154200 }, { "epoch": 0.27, "learning_rate": 3.65538143884039e-05, "loss": 2.4264, "step": 154210 }, { "epoch": 0.27, "learning_rate": 3.655294244847707e-05, "loss": 2.5412, "step": 154220 }, { "epoch": 0.27, "learning_rate": 3.655207050855024e-05, "loss": 2.4666, "step": 154230 }, { "epoch": 0.27, "learning_rate": 3.655119856862342e-05, "loss": 2.4731, "step": 154240 }, { "epoch": 0.27, "learning_rate": 3.655032662869659e-05, "loss": 2.3906, "step": 154250 }, { "epoch": 0.27, "learning_rate": 3.654945468876976e-05, "loss": 2.4348, "step": 154260 }, { "epoch": 0.27, "learning_rate": 3.654858274884294e-05, "loss": 2.4669, "step": 154270 }, { "epoch": 0.27, "learning_rate": 3.654771080891611e-05, "loss": 2.4968, "step": 154280 }, { "epoch": 0.27, "learning_rate": 3.6546838868989286e-05, "loss": 2.4301, "step": 154290 }, { "epoch": 0.27, "learning_rate": 3.6545966929062456e-05, "loss": 2.54, "step": 154300 }, { "epoch": 0.27, "learning_rate": 3.654509498913563e-05, "loss": 2.5115, "step": 154310 }, { "epoch": 0.27, "learning_rate": 3.6544223049208804e-05, "loss": 2.4678, "step": 154320 }, { "epoch": 0.27, "learning_rate": 3.6543351109281974e-05, "loss": 2.5372, "step": 154330 }, { "epoch": 0.27, "learning_rate": 3.654247916935515e-05, "loss": 2.422, "step": 154340 }, { "epoch": 0.27, "learning_rate": 3.654160722942832e-05, "loss": 2.4744, "step": 154350 }, { "epoch": 0.27, "learning_rate": 3.65407352895015e-05, "loss": 2.571, "step": 154360 }, { "epoch": 0.27, "learning_rate": 3.653986334957467e-05, "loss": 2.4502, "step": 154370 }, { "epoch": 0.27, "learning_rate": 3.6538991409647846e-05, "loss": 2.4257, "step": 154380 }, { "epoch": 0.27, "learning_rate": 3.653811946972102e-05, "loss": 2.5118, "step": 154390 }, { "epoch": 0.27, "learning_rate": 3.653724752979419e-05, "loss": 2.372, "step": 154400 }, { "epoch": 0.27, "learning_rate": 3.6536375589867364e-05, "loss": 2.4393, "step": 154410 }, { "epoch": 0.27, "learning_rate": 3.6535503649940535e-05, "loss": 2.3996, "step": 154420 }, { "epoch": 0.27, "learning_rate": 3.6534631710013705e-05, "loss": 2.534, "step": 154430 }, { "epoch": 0.27, "learning_rate": 3.653375977008688e-05, "loss": 2.4919, "step": 154440 }, { "epoch": 0.27, "learning_rate": 3.653288783016006e-05, "loss": 2.5061, "step": 154450 }, { "epoch": 0.27, "learning_rate": 3.653201589023323e-05, "loss": 2.3938, "step": 154460 }, { "epoch": 0.27, "learning_rate": 3.65311439503064e-05, "loss": 2.3806, "step": 154470 }, { "epoch": 0.27, "learning_rate": 3.653027201037957e-05, "loss": 2.4858, "step": 154480 }, { "epoch": 0.27, "learning_rate": 3.652940007045275e-05, "loss": 2.3837, "step": 154490 }, { "epoch": 0.27, "learning_rate": 3.652852813052592e-05, "loss": 2.5549, "step": 154500 }, { "epoch": 0.27, "learning_rate": 3.6527656190599095e-05, "loss": 2.5551, "step": 154510 }, { "epoch": 0.27, "learning_rate": 3.652678425067227e-05, "loss": 2.4959, "step": 154520 }, { "epoch": 0.27, "learning_rate": 3.652591231074544e-05, "loss": 2.4661, "step": 154530 }, { "epoch": 0.27, "learning_rate": 3.652504037081861e-05, "loss": 2.4459, "step": 154540 }, { "epoch": 0.27, "learning_rate": 3.6524168430891783e-05, "loss": 2.4684, "step": 154550 }, { "epoch": 0.27, "learning_rate": 3.652329649096496e-05, "loss": 2.5005, "step": 154560 }, { "epoch": 0.27, "learning_rate": 3.652242455103813e-05, "loss": 2.4378, "step": 154570 }, { "epoch": 0.27, "learning_rate": 3.652155261111131e-05, "loss": 2.3806, "step": 154580 }, { "epoch": 0.27, "learning_rate": 3.652068067118448e-05, "loss": 2.4518, "step": 154590 }, { "epoch": 0.27, "learning_rate": 3.6519808731257656e-05, "loss": 2.4433, "step": 154600 }, { "epoch": 0.27, "learning_rate": 3.6518936791330826e-05, "loss": 2.4036, "step": 154610 }, { "epoch": 0.27, "learning_rate": 3.6518064851403996e-05, "loss": 2.4838, "step": 154620 }, { "epoch": 0.27, "learning_rate": 3.6517192911477174e-05, "loss": 2.5261, "step": 154630 }, { "epoch": 0.27, "learning_rate": 3.6516320971550344e-05, "loss": 2.4718, "step": 154640 }, { "epoch": 0.27, "learning_rate": 3.6515449031623514e-05, "loss": 2.4859, "step": 154650 }, { "epoch": 0.27, "learning_rate": 3.651457709169669e-05, "loss": 2.4945, "step": 154660 }, { "epoch": 0.27, "learning_rate": 3.651370515176987e-05, "loss": 2.5331, "step": 154670 }, { "epoch": 0.27, "learning_rate": 3.651283321184304e-05, "loss": 2.552, "step": 154680 }, { "epoch": 0.27, "learning_rate": 3.651196127191621e-05, "loss": 2.4628, "step": 154690 }, { "epoch": 0.27, "learning_rate": 3.651108933198939e-05, "loss": 2.4445, "step": 154700 }, { "epoch": 0.27, "learning_rate": 3.651021739206256e-05, "loss": 2.4283, "step": 154710 }, { "epoch": 0.27, "learning_rate": 3.650934545213573e-05, "loss": 2.4362, "step": 154720 }, { "epoch": 0.27, "learning_rate": 3.6508473512208905e-05, "loss": 2.5159, "step": 154730 }, { "epoch": 0.27, "learning_rate": 3.650760157228208e-05, "loss": 2.4871, "step": 154740 }, { "epoch": 0.27, "learning_rate": 3.650672963235525e-05, "loss": 2.5108, "step": 154750 }, { "epoch": 0.27, "learning_rate": 3.650585769242842e-05, "loss": 2.3753, "step": 154760 }, { "epoch": 0.27, "learning_rate": 3.65049857525016e-05, "loss": 2.4486, "step": 154770 }, { "epoch": 0.27, "learning_rate": 3.650411381257477e-05, "loss": 2.5333, "step": 154780 }, { "epoch": 0.27, "learning_rate": 3.650324187264794e-05, "loss": 2.4196, "step": 154790 }, { "epoch": 0.27, "learning_rate": 3.650236993272112e-05, "loss": 2.4526, "step": 154800 }, { "epoch": 0.27, "learning_rate": 3.6501497992794295e-05, "loss": 2.4811, "step": 154810 }, { "epoch": 0.27, "learning_rate": 3.6500626052867465e-05, "loss": 2.4955, "step": 154820 }, { "epoch": 0.27, "learning_rate": 3.6499754112940635e-05, "loss": 2.3906, "step": 154830 }, { "epoch": 0.27, "learning_rate": 3.649888217301381e-05, "loss": 2.4716, "step": 154840 }, { "epoch": 0.27, "learning_rate": 3.649801023308698e-05, "loss": 2.5367, "step": 154850 }, { "epoch": 0.27, "learning_rate": 3.6497138293160153e-05, "loss": 2.4541, "step": 154860 }, { "epoch": 0.27, "learning_rate": 3.6496266353233324e-05, "loss": 2.448, "step": 154870 }, { "epoch": 0.27, "learning_rate": 3.649539441330651e-05, "loss": 2.3652, "step": 154880 }, { "epoch": 0.27, "learning_rate": 3.649452247337968e-05, "loss": 2.4605, "step": 154890 }, { "epoch": 0.27, "learning_rate": 3.649365053345285e-05, "loss": 2.4749, "step": 154900 }, { "epoch": 0.27, "learning_rate": 3.6492778593526026e-05, "loss": 2.4812, "step": 154910 }, { "epoch": 0.27, "learning_rate": 3.6491906653599196e-05, "loss": 2.5383, "step": 154920 }, { "epoch": 0.27, "learning_rate": 3.6491034713672366e-05, "loss": 2.4793, "step": 154930 }, { "epoch": 0.27, "learning_rate": 3.649016277374554e-05, "loss": 2.4586, "step": 154940 }, { "epoch": 0.27, "learning_rate": 3.6489290833818714e-05, "loss": 2.4967, "step": 154950 }, { "epoch": 0.27, "learning_rate": 3.648841889389189e-05, "loss": 2.5468, "step": 154960 }, { "epoch": 0.27, "learning_rate": 3.648754695396506e-05, "loss": 2.5512, "step": 154970 }, { "epoch": 0.27, "learning_rate": 3.648667501403823e-05, "loss": 2.5069, "step": 154980 }, { "epoch": 0.27, "learning_rate": 3.648580307411141e-05, "loss": 2.4701, "step": 154990 }, { "epoch": 0.27, "learning_rate": 3.648493113418458e-05, "loss": 2.5543, "step": 155000 }, { "epoch": 0.27, "learning_rate": 3.648405919425775e-05, "loss": 2.4378, "step": 155010 }, { "epoch": 0.27, "learning_rate": 3.648318725433093e-05, "loss": 2.4965, "step": 155020 }, { "epoch": 0.27, "learning_rate": 3.6482315314404104e-05, "loss": 2.5626, "step": 155030 }, { "epoch": 0.27, "learning_rate": 3.6481443374477275e-05, "loss": 2.4642, "step": 155040 }, { "epoch": 0.27, "learning_rate": 3.6480571434550445e-05, "loss": 2.4567, "step": 155050 }, { "epoch": 0.27, "learning_rate": 3.647969949462362e-05, "loss": 2.6072, "step": 155060 }, { "epoch": 0.27, "learning_rate": 3.647882755469679e-05, "loss": 2.4729, "step": 155070 }, { "epoch": 0.27, "learning_rate": 3.647795561476996e-05, "loss": 2.4355, "step": 155080 }, { "epoch": 0.27, "learning_rate": 3.647708367484314e-05, "loss": 2.437, "step": 155090 }, { "epoch": 0.27, "learning_rate": 3.647621173491632e-05, "loss": 2.3747, "step": 155100 }, { "epoch": 0.27, "learning_rate": 3.647533979498949e-05, "loss": 2.3842, "step": 155110 }, { "epoch": 0.27, "learning_rate": 3.647446785506266e-05, "loss": 2.4239, "step": 155120 }, { "epoch": 0.27, "learning_rate": 3.6473595915135835e-05, "loss": 2.3532, "step": 155130 }, { "epoch": 0.27, "learning_rate": 3.6472723975209005e-05, "loss": 2.4949, "step": 155140 }, { "epoch": 0.27, "learning_rate": 3.6471852035282176e-05, "loss": 2.4654, "step": 155150 }, { "epoch": 0.27, "learning_rate": 3.647098009535535e-05, "loss": 2.4049, "step": 155160 }, { "epoch": 0.27, "learning_rate": 3.647010815542852e-05, "loss": 2.3882, "step": 155170 }, { "epoch": 0.27, "learning_rate": 3.64692362155017e-05, "loss": 2.514, "step": 155180 }, { "epoch": 0.27, "learning_rate": 3.646836427557487e-05, "loss": 2.4248, "step": 155190 }, { "epoch": 0.27, "learning_rate": 3.646749233564805e-05, "loss": 2.5609, "step": 155200 }, { "epoch": 0.27, "learning_rate": 3.646662039572122e-05, "loss": 2.4598, "step": 155210 }, { "epoch": 0.27, "learning_rate": 3.646574845579439e-05, "loss": 2.4837, "step": 155220 }, { "epoch": 0.27, "learning_rate": 3.6464876515867566e-05, "loss": 2.5123, "step": 155230 }, { "epoch": 0.27, "learning_rate": 3.6464004575940736e-05, "loss": 2.4236, "step": 155240 }, { "epoch": 0.27, "learning_rate": 3.6463132636013914e-05, "loss": 2.4939, "step": 155250 }, { "epoch": 0.27, "learning_rate": 3.6462260696087084e-05, "loss": 2.4721, "step": 155260 }, { "epoch": 0.27, "learning_rate": 3.646138875616026e-05, "loss": 2.5476, "step": 155270 }, { "epoch": 0.27, "learning_rate": 3.646051681623343e-05, "loss": 2.4465, "step": 155280 }, { "epoch": 0.27, "learning_rate": 3.64596448763066e-05, "loss": 2.3279, "step": 155290 }, { "epoch": 0.27, "learning_rate": 3.645877293637978e-05, "loss": 2.3808, "step": 155300 }, { "epoch": 0.27, "learning_rate": 3.645790099645295e-05, "loss": 2.3918, "step": 155310 }, { "epoch": 0.27, "learning_rate": 3.645702905652612e-05, "loss": 2.4104, "step": 155320 }, { "epoch": 0.27, "learning_rate": 3.64561571165993e-05, "loss": 2.5214, "step": 155330 }, { "epoch": 0.27, "learning_rate": 3.6455285176672474e-05, "loss": 2.5854, "step": 155340 }, { "epoch": 0.27, "learning_rate": 3.6454413236745644e-05, "loss": 2.4914, "step": 155350 }, { "epoch": 0.27, "learning_rate": 3.6453541296818815e-05, "loss": 2.3887, "step": 155360 }, { "epoch": 0.27, "learning_rate": 3.645266935689199e-05, "loss": 2.4305, "step": 155370 }, { "epoch": 0.27, "learning_rate": 3.645179741696516e-05, "loss": 2.4562, "step": 155380 }, { "epoch": 0.27, "learning_rate": 3.645092547703833e-05, "loss": 2.3466, "step": 155390 }, { "epoch": 0.27, "learning_rate": 3.645005353711151e-05, "loss": 2.2605, "step": 155400 }, { "epoch": 0.27, "learning_rate": 3.644918159718469e-05, "loss": 2.5322, "step": 155410 }, { "epoch": 0.27, "learning_rate": 3.644830965725786e-05, "loss": 2.4933, "step": 155420 }, { "epoch": 0.27, "learning_rate": 3.644743771733103e-05, "loss": 2.5813, "step": 155430 }, { "epoch": 0.27, "learning_rate": 3.64465657774042e-05, "loss": 2.5314, "step": 155440 }, { "epoch": 0.27, "learning_rate": 3.6445693837477375e-05, "loss": 2.5212, "step": 155450 }, { "epoch": 0.27, "learning_rate": 3.6444821897550546e-05, "loss": 2.4556, "step": 155460 }, { "epoch": 0.27, "learning_rate": 3.6443949957623716e-05, "loss": 2.4274, "step": 155470 }, { "epoch": 0.27, "learning_rate": 3.64430780176969e-05, "loss": 2.4236, "step": 155480 }, { "epoch": 0.27, "learning_rate": 3.644220607777007e-05, "loss": 2.4665, "step": 155490 }, { "epoch": 0.27, "learning_rate": 3.644133413784324e-05, "loss": 2.4957, "step": 155500 }, { "epoch": 0.27, "learning_rate": 3.644046219791641e-05, "loss": 2.5674, "step": 155510 }, { "epoch": 0.27, "learning_rate": 3.643959025798959e-05, "loss": 2.4107, "step": 155520 }, { "epoch": 0.27, "learning_rate": 3.643871831806276e-05, "loss": 2.5169, "step": 155530 }, { "epoch": 0.27, "learning_rate": 3.643784637813593e-05, "loss": 2.552, "step": 155540 }, { "epoch": 0.27, "learning_rate": 3.6436974438209106e-05, "loss": 2.5274, "step": 155550 }, { "epoch": 0.27, "learning_rate": 3.6436102498282283e-05, "loss": 2.3424, "step": 155560 }, { "epoch": 0.27, "learning_rate": 3.6435230558355454e-05, "loss": 2.5219, "step": 155570 }, { "epoch": 0.27, "learning_rate": 3.6434358618428624e-05, "loss": 2.4806, "step": 155580 }, { "epoch": 0.27, "learning_rate": 3.64334866785018e-05, "loss": 2.3758, "step": 155590 }, { "epoch": 0.27, "learning_rate": 3.643261473857497e-05, "loss": 2.4223, "step": 155600 }, { "epoch": 0.27, "learning_rate": 3.643174279864814e-05, "loss": 2.494, "step": 155610 }, { "epoch": 0.27, "learning_rate": 3.643087085872132e-05, "loss": 2.4317, "step": 155620 }, { "epoch": 0.27, "learning_rate": 3.6429998918794496e-05, "loss": 2.4989, "step": 155630 }, { "epoch": 0.27, "learning_rate": 3.642912697886767e-05, "loss": 2.418, "step": 155640 }, { "epoch": 0.27, "learning_rate": 3.642825503894084e-05, "loss": 2.5125, "step": 155650 }, { "epoch": 0.27, "learning_rate": 3.6427383099014014e-05, "loss": 2.4109, "step": 155660 }, { "epoch": 0.27, "learning_rate": 3.6426511159087185e-05, "loss": 2.4724, "step": 155670 }, { "epoch": 0.27, "learning_rate": 3.6425639219160355e-05, "loss": 2.5436, "step": 155680 }, { "epoch": 0.27, "learning_rate": 3.642476727923353e-05, "loss": 2.3952, "step": 155690 }, { "epoch": 0.27, "learning_rate": 3.642389533930671e-05, "loss": 2.5672, "step": 155700 }, { "epoch": 0.27, "learning_rate": 3.642302339937988e-05, "loss": 2.4518, "step": 155710 }, { "epoch": 0.27, "learning_rate": 3.642215145945305e-05, "loss": 2.5465, "step": 155720 }, { "epoch": 0.27, "learning_rate": 3.642127951952623e-05, "loss": 2.501, "step": 155730 }, { "epoch": 0.27, "learning_rate": 3.64204075795994e-05, "loss": 2.5318, "step": 155740 }, { "epoch": 0.27, "learning_rate": 3.641953563967257e-05, "loss": 2.4314, "step": 155750 }, { "epoch": 0.27, "learning_rate": 3.6418663699745745e-05, "loss": 2.5144, "step": 155760 }, { "epoch": 0.27, "learning_rate": 3.641779175981892e-05, "loss": 2.4561, "step": 155770 }, { "epoch": 0.27, "learning_rate": 3.641691981989209e-05, "loss": 2.5109, "step": 155780 }, { "epoch": 0.27, "learning_rate": 3.641604787996526e-05, "loss": 2.4761, "step": 155790 }, { "epoch": 0.27, "learning_rate": 3.641517594003844e-05, "loss": 2.4298, "step": 155800 }, { "epoch": 0.27, "learning_rate": 3.641430400011161e-05, "loss": 2.5636, "step": 155810 }, { "epoch": 0.27, "learning_rate": 3.641343206018478e-05, "loss": 2.4865, "step": 155820 }, { "epoch": 0.27, "learning_rate": 3.641256012025795e-05, "loss": 2.4705, "step": 155830 }, { "epoch": 0.27, "learning_rate": 3.641168818033113e-05, "loss": 2.3615, "step": 155840 }, { "epoch": 0.27, "learning_rate": 3.6410816240404306e-05, "loss": 2.3725, "step": 155850 }, { "epoch": 0.27, "learning_rate": 3.6409944300477476e-05, "loss": 2.662, "step": 155860 }, { "epoch": 0.27, "learning_rate": 3.640907236055065e-05, "loss": 2.3241, "step": 155870 }, { "epoch": 0.27, "learning_rate": 3.6408200420623824e-05, "loss": 2.483, "step": 155880 }, { "epoch": 0.27, "learning_rate": 3.6407328480696994e-05, "loss": 2.4559, "step": 155890 }, { "epoch": 0.27, "learning_rate": 3.6406456540770165e-05, "loss": 2.5119, "step": 155900 }, { "epoch": 0.27, "learning_rate": 3.640558460084334e-05, "loss": 2.4485, "step": 155910 }, { "epoch": 0.27, "learning_rate": 3.640471266091652e-05, "loss": 2.3782, "step": 155920 }, { "epoch": 0.27, "learning_rate": 3.640384072098969e-05, "loss": 2.3632, "step": 155930 }, { "epoch": 0.27, "learning_rate": 3.640296878106286e-05, "loss": 2.4593, "step": 155940 }, { "epoch": 0.27, "learning_rate": 3.640209684113604e-05, "loss": 2.5489, "step": 155950 }, { "epoch": 0.27, "learning_rate": 3.640122490120921e-05, "loss": 2.4247, "step": 155960 }, { "epoch": 0.27, "learning_rate": 3.640035296128238e-05, "loss": 2.4403, "step": 155970 }, { "epoch": 0.27, "learning_rate": 3.6399481021355555e-05, "loss": 2.5107, "step": 155980 }, { "epoch": 0.27, "learning_rate": 3.6398609081428725e-05, "loss": 2.4828, "step": 155990 }, { "epoch": 0.27, "learning_rate": 3.63977371415019e-05, "loss": 2.5713, "step": 156000 }, { "epoch": 0.27, "learning_rate": 3.639686520157507e-05, "loss": 2.4321, "step": 156010 }, { "epoch": 0.27, "learning_rate": 3.639599326164825e-05, "loss": 2.5822, "step": 156020 }, { "epoch": 0.27, "learning_rate": 3.639512132172142e-05, "loss": 2.4153, "step": 156030 }, { "epoch": 0.27, "learning_rate": 3.639424938179459e-05, "loss": 2.3516, "step": 156040 }, { "epoch": 0.27, "learning_rate": 3.639337744186777e-05, "loss": 2.3746, "step": 156050 }, { "epoch": 0.27, "learning_rate": 3.639250550194094e-05, "loss": 2.4728, "step": 156060 }, { "epoch": 0.27, "learning_rate": 3.6391633562014115e-05, "loss": 2.5447, "step": 156070 }, { "epoch": 0.27, "learning_rate": 3.6390761622087286e-05, "loss": 2.4828, "step": 156080 }, { "epoch": 0.27, "learning_rate": 3.638988968216046e-05, "loss": 2.5017, "step": 156090 }, { "epoch": 0.27, "learning_rate": 3.638901774223363e-05, "loss": 2.5204, "step": 156100 }, { "epoch": 0.27, "learning_rate": 3.6388145802306804e-05, "loss": 2.4672, "step": 156110 }, { "epoch": 0.27, "learning_rate": 3.638727386237998e-05, "loss": 2.5459, "step": 156120 }, { "epoch": 0.27, "learning_rate": 3.638640192245315e-05, "loss": 2.4295, "step": 156130 }, { "epoch": 0.27, "learning_rate": 3.638552998252632e-05, "loss": 2.5147, "step": 156140 }, { "epoch": 0.27, "learning_rate": 3.63846580425995e-05, "loss": 2.5548, "step": 156150 }, { "epoch": 0.27, "learning_rate": 3.6383786102672676e-05, "loss": 2.4305, "step": 156160 }, { "epoch": 0.27, "learning_rate": 3.6382914162745846e-05, "loss": 2.4602, "step": 156170 }, { "epoch": 0.27, "learning_rate": 3.6382042222819017e-05, "loss": 2.4771, "step": 156180 }, { "epoch": 0.27, "learning_rate": 3.6381170282892194e-05, "loss": 2.4165, "step": 156190 }, { "epoch": 0.27, "learning_rate": 3.6380298342965364e-05, "loss": 2.5503, "step": 156200 }, { "epoch": 0.27, "learning_rate": 3.6379426403038534e-05, "loss": 2.4572, "step": 156210 }, { "epoch": 0.27, "learning_rate": 3.637855446311171e-05, "loss": 2.4384, "step": 156220 }, { "epoch": 0.27, "learning_rate": 3.637768252318489e-05, "loss": 2.3908, "step": 156230 }, { "epoch": 0.27, "learning_rate": 3.637681058325806e-05, "loss": 2.4969, "step": 156240 }, { "epoch": 0.27, "learning_rate": 3.637593864333123e-05, "loss": 2.367, "step": 156250 }, { "epoch": 0.27, "learning_rate": 3.637506670340441e-05, "loss": 2.5095, "step": 156260 }, { "epoch": 0.27, "learning_rate": 3.637419476347758e-05, "loss": 2.4504, "step": 156270 }, { "epoch": 0.27, "learning_rate": 3.637332282355075e-05, "loss": 2.5414, "step": 156280 }, { "epoch": 0.27, "learning_rate": 3.637245088362392e-05, "loss": 2.4773, "step": 156290 }, { "epoch": 0.27, "learning_rate": 3.63715789436971e-05, "loss": 2.4729, "step": 156300 }, { "epoch": 0.27, "learning_rate": 3.637070700377027e-05, "loss": 2.5452, "step": 156310 }, { "epoch": 0.27, "learning_rate": 3.636983506384344e-05, "loss": 2.4456, "step": 156320 }, { "epoch": 0.27, "learning_rate": 3.636896312391661e-05, "loss": 2.5955, "step": 156330 }, { "epoch": 0.27, "learning_rate": 3.636809118398979e-05, "loss": 2.5142, "step": 156340 }, { "epoch": 0.27, "learning_rate": 3.636721924406296e-05, "loss": 2.5174, "step": 156350 }, { "epoch": 0.27, "learning_rate": 3.636634730413613e-05, "loss": 2.5109, "step": 156360 }, { "epoch": 0.27, "learning_rate": 3.6365475364209315e-05, "loss": 2.3371, "step": 156370 }, { "epoch": 0.27, "learning_rate": 3.6364603424282485e-05, "loss": 2.4786, "step": 156380 }, { "epoch": 0.27, "learning_rate": 3.6363731484355656e-05, "loss": 2.513, "step": 156390 }, { "epoch": 0.27, "learning_rate": 3.6362859544428826e-05, "loss": 2.4422, "step": 156400 }, { "epoch": 0.27, "learning_rate": 3.6361987604502e-05, "loss": 2.525, "step": 156410 }, { "epoch": 0.27, "learning_rate": 3.6361115664575173e-05, "loss": 2.4383, "step": 156420 }, { "epoch": 0.27, "learning_rate": 3.6360243724648344e-05, "loss": 2.4084, "step": 156430 }, { "epoch": 0.27, "learning_rate": 3.635937178472152e-05, "loss": 2.5718, "step": 156440 }, { "epoch": 0.27, "learning_rate": 3.63584998447947e-05, "loss": 2.4003, "step": 156450 }, { "epoch": 0.27, "learning_rate": 3.635762790486787e-05, "loss": 2.6099, "step": 156460 }, { "epoch": 0.27, "learning_rate": 3.635675596494104e-05, "loss": 2.506, "step": 156470 }, { "epoch": 0.27, "learning_rate": 3.6355884025014216e-05, "loss": 2.447, "step": 156480 }, { "epoch": 0.27, "learning_rate": 3.6355012085087386e-05, "loss": 2.4893, "step": 156490 }, { "epoch": 0.27, "learning_rate": 3.635414014516056e-05, "loss": 2.4426, "step": 156500 }, { "epoch": 0.27, "learning_rate": 3.6353268205233734e-05, "loss": 2.4573, "step": 156510 }, { "epoch": 0.27, "learning_rate": 3.635239626530691e-05, "loss": 2.4118, "step": 156520 }, { "epoch": 0.27, "learning_rate": 3.635152432538008e-05, "loss": 2.4635, "step": 156530 }, { "epoch": 0.27, "learning_rate": 3.635065238545325e-05, "loss": 2.3155, "step": 156540 }, { "epoch": 0.27, "learning_rate": 3.634978044552643e-05, "loss": 2.4393, "step": 156550 }, { "epoch": 0.27, "learning_rate": 3.63489085055996e-05, "loss": 2.5061, "step": 156560 }, { "epoch": 0.27, "learning_rate": 3.634803656567277e-05, "loss": 2.494, "step": 156570 }, { "epoch": 0.27, "learning_rate": 3.634716462574595e-05, "loss": 2.3617, "step": 156580 }, { "epoch": 0.27, "learning_rate": 3.6346292685819124e-05, "loss": 2.3667, "step": 156590 }, { "epoch": 0.27, "learning_rate": 3.6345420745892295e-05, "loss": 2.4048, "step": 156600 }, { "epoch": 0.27, "learning_rate": 3.6344548805965465e-05, "loss": 2.477, "step": 156610 }, { "epoch": 0.27, "learning_rate": 3.634367686603864e-05, "loss": 2.5504, "step": 156620 }, { "epoch": 0.27, "learning_rate": 3.634280492611181e-05, "loss": 2.5258, "step": 156630 }, { "epoch": 0.27, "learning_rate": 3.634193298618498e-05, "loss": 2.3471, "step": 156640 }, { "epoch": 0.27, "learning_rate": 3.634106104625816e-05, "loss": 2.4454, "step": 156650 }, { "epoch": 0.27, "learning_rate": 3.634018910633133e-05, "loss": 2.6074, "step": 156660 }, { "epoch": 0.27, "learning_rate": 3.633931716640451e-05, "loss": 2.4111, "step": 156670 }, { "epoch": 0.27, "learning_rate": 3.633844522647768e-05, "loss": 2.5251, "step": 156680 }, { "epoch": 0.27, "learning_rate": 3.6337573286550855e-05, "loss": 2.434, "step": 156690 }, { "epoch": 0.27, "learning_rate": 3.6336701346624025e-05, "loss": 2.5038, "step": 156700 }, { "epoch": 0.27, "learning_rate": 3.6335829406697196e-05, "loss": 2.3842, "step": 156710 }, { "epoch": 0.27, "learning_rate": 3.633495746677037e-05, "loss": 2.536, "step": 156720 }, { "epoch": 0.27, "learning_rate": 3.633408552684354e-05, "loss": 2.6134, "step": 156730 }, { "epoch": 0.27, "learning_rate": 3.633321358691672e-05, "loss": 2.4007, "step": 156740 }, { "epoch": 0.27, "learning_rate": 3.633234164698989e-05, "loss": 2.3886, "step": 156750 }, { "epoch": 0.27, "learning_rate": 3.633146970706307e-05, "loss": 2.3241, "step": 156760 }, { "epoch": 0.27, "learning_rate": 3.633059776713624e-05, "loss": 2.5102, "step": 156770 }, { "epoch": 0.27, "learning_rate": 3.632972582720941e-05, "loss": 2.4743, "step": 156780 }, { "epoch": 0.27, "learning_rate": 3.632885388728258e-05, "loss": 2.482, "step": 156790 }, { "epoch": 0.27, "learning_rate": 3.6327981947355756e-05, "loss": 2.5374, "step": 156800 }, { "epoch": 0.27, "learning_rate": 3.632711000742893e-05, "loss": 2.4418, "step": 156810 }, { "epoch": 0.27, "learning_rate": 3.6326238067502104e-05, "loss": 2.3741, "step": 156820 }, { "epoch": 0.27, "learning_rate": 3.632536612757528e-05, "loss": 2.4014, "step": 156830 }, { "epoch": 0.27, "learning_rate": 3.632449418764845e-05, "loss": 2.5746, "step": 156840 }, { "epoch": 0.27, "learning_rate": 3.632362224772162e-05, "loss": 2.4703, "step": 156850 }, { "epoch": 0.27, "learning_rate": 3.632275030779479e-05, "loss": 2.5042, "step": 156860 }, { "epoch": 0.27, "learning_rate": 3.632187836786797e-05, "loss": 2.5316, "step": 156870 }, { "epoch": 0.27, "learning_rate": 3.632100642794114e-05, "loss": 2.3897, "step": 156880 }, { "epoch": 0.27, "learning_rate": 3.632013448801432e-05, "loss": 2.6795, "step": 156890 }, { "epoch": 0.27, "learning_rate": 3.631926254808749e-05, "loss": 2.4771, "step": 156900 }, { "epoch": 0.27, "learning_rate": 3.6318390608160664e-05, "loss": 2.4428, "step": 156910 }, { "epoch": 0.27, "learning_rate": 3.6317518668233835e-05, "loss": 2.5406, "step": 156920 }, { "epoch": 0.27, "learning_rate": 3.6316646728307005e-05, "loss": 2.5282, "step": 156930 }, { "epoch": 0.27, "learning_rate": 3.631577478838018e-05, "loss": 2.4702, "step": 156940 }, { "epoch": 0.27, "learning_rate": 3.631490284845335e-05, "loss": 2.4686, "step": 156950 }, { "epoch": 0.27, "learning_rate": 3.631403090852653e-05, "loss": 2.3784, "step": 156960 }, { "epoch": 0.27, "learning_rate": 3.63131589685997e-05, "loss": 2.4512, "step": 156970 }, { "epoch": 0.27, "learning_rate": 3.631228702867288e-05, "loss": 2.4713, "step": 156980 }, { "epoch": 0.27, "learning_rate": 3.631141508874605e-05, "loss": 2.4541, "step": 156990 }, { "epoch": 0.27, "learning_rate": 3.631054314881922e-05, "loss": 2.5669, "step": 157000 }, { "epoch": 0.27, "learning_rate": 3.6309671208892395e-05, "loss": 2.5455, "step": 157010 }, { "epoch": 0.27, "learning_rate": 3.6308799268965566e-05, "loss": 2.4095, "step": 157020 }, { "epoch": 0.27, "learning_rate": 3.6307927329038736e-05, "loss": 2.3543, "step": 157030 }, { "epoch": 0.27, "learning_rate": 3.630705538911191e-05, "loss": 2.4215, "step": 157040 }, { "epoch": 0.27, "learning_rate": 3.630618344918509e-05, "loss": 2.383, "step": 157050 }, { "epoch": 0.27, "learning_rate": 3.630531150925826e-05, "loss": 2.5181, "step": 157060 }, { "epoch": 0.27, "learning_rate": 3.630443956933143e-05, "loss": 2.5034, "step": 157070 }, { "epoch": 0.27, "learning_rate": 3.630356762940461e-05, "loss": 2.4443, "step": 157080 }, { "epoch": 0.27, "learning_rate": 3.630269568947778e-05, "loss": 2.4164, "step": 157090 }, { "epoch": 0.27, "learning_rate": 3.630182374955095e-05, "loss": 2.4502, "step": 157100 }, { "epoch": 0.27, "learning_rate": 3.6300951809624126e-05, "loss": 2.4662, "step": 157110 }, { "epoch": 0.27, "learning_rate": 3.6300079869697303e-05, "loss": 2.4841, "step": 157120 }, { "epoch": 0.27, "learning_rate": 3.6299207929770474e-05, "loss": 2.4678, "step": 157130 }, { "epoch": 0.27, "learning_rate": 3.6298335989843644e-05, "loss": 2.4524, "step": 157140 }, { "epoch": 0.27, "learning_rate": 3.629746404991682e-05, "loss": 2.4058, "step": 157150 }, { "epoch": 0.27, "learning_rate": 3.629659210998999e-05, "loss": 2.4994, "step": 157160 }, { "epoch": 0.27, "learning_rate": 3.629572017006316e-05, "loss": 2.5034, "step": 157170 }, { "epoch": 0.27, "learning_rate": 3.629484823013633e-05, "loss": 2.4819, "step": 157180 }, { "epoch": 0.27, "learning_rate": 3.6293976290209516e-05, "loss": 2.5782, "step": 157190 }, { "epoch": 0.27, "learning_rate": 3.629310435028269e-05, "loss": 2.3965, "step": 157200 }, { "epoch": 0.27, "learning_rate": 3.629223241035586e-05, "loss": 2.4526, "step": 157210 }, { "epoch": 0.27, "learning_rate": 3.6291360470429034e-05, "loss": 2.4886, "step": 157220 }, { "epoch": 0.27, "learning_rate": 3.6290488530502205e-05, "loss": 2.5081, "step": 157230 }, { "epoch": 0.27, "learning_rate": 3.6289616590575375e-05, "loss": 2.4405, "step": 157240 }, { "epoch": 0.27, "learning_rate": 3.6288744650648546e-05, "loss": 2.5502, "step": 157250 }, { "epoch": 0.27, "learning_rate": 3.628787271072173e-05, "loss": 2.4542, "step": 157260 }, { "epoch": 0.27, "learning_rate": 3.62870007707949e-05, "loss": 2.3706, "step": 157270 }, { "epoch": 0.27, "learning_rate": 3.628612883086807e-05, "loss": 2.5007, "step": 157280 }, { "epoch": 0.27, "learning_rate": 3.628525689094124e-05, "loss": 2.3579, "step": 157290 }, { "epoch": 0.27, "learning_rate": 3.628438495101442e-05, "loss": 2.3731, "step": 157300 }, { "epoch": 0.27, "learning_rate": 3.628351301108759e-05, "loss": 2.4236, "step": 157310 }, { "epoch": 0.27, "learning_rate": 3.628264107116076e-05, "loss": 2.3747, "step": 157320 }, { "epoch": 0.27, "learning_rate": 3.6281769131233936e-05, "loss": 2.4181, "step": 157330 }, { "epoch": 0.27, "learning_rate": 3.628089719130711e-05, "loss": 2.4565, "step": 157340 }, { "epoch": 0.27, "learning_rate": 3.628002525138028e-05, "loss": 2.4621, "step": 157350 }, { "epoch": 0.27, "learning_rate": 3.6279153311453454e-05, "loss": 2.4596, "step": 157360 }, { "epoch": 0.27, "learning_rate": 3.627828137152663e-05, "loss": 2.4082, "step": 157370 }, { "epoch": 0.27, "learning_rate": 3.62774094315998e-05, "loss": 2.4693, "step": 157380 }, { "epoch": 0.27, "learning_rate": 3.627653749167297e-05, "loss": 2.3981, "step": 157390 }, { "epoch": 0.27, "learning_rate": 3.627566555174615e-05, "loss": 2.5457, "step": 157400 }, { "epoch": 0.27, "learning_rate": 3.6274793611819326e-05, "loss": 2.4339, "step": 157410 }, { "epoch": 0.27, "learning_rate": 3.6273921671892496e-05, "loss": 2.4549, "step": 157420 }, { "epoch": 0.27, "learning_rate": 3.6273049731965667e-05, "loss": 2.4571, "step": 157430 }, { "epoch": 0.27, "learning_rate": 3.6272177792038844e-05, "loss": 2.3742, "step": 157440 }, { "epoch": 0.27, "learning_rate": 3.6271305852112014e-05, "loss": 2.6293, "step": 157450 }, { "epoch": 0.27, "learning_rate": 3.6270433912185185e-05, "loss": 2.4379, "step": 157460 }, { "epoch": 0.27, "learning_rate": 3.626956197225836e-05, "loss": 2.5224, "step": 157470 }, { "epoch": 0.27, "learning_rate": 3.626869003233153e-05, "loss": 2.3801, "step": 157480 }, { "epoch": 0.27, "learning_rate": 3.626781809240471e-05, "loss": 2.388, "step": 157490 }, { "epoch": 0.27, "learning_rate": 3.626694615247788e-05, "loss": 2.5315, "step": 157500 }, { "epoch": 0.27, "learning_rate": 3.626607421255106e-05, "loss": 2.4945, "step": 157510 }, { "epoch": 0.27, "learning_rate": 3.626520227262423e-05, "loss": 2.3014, "step": 157520 }, { "epoch": 0.27, "learning_rate": 3.62643303326974e-05, "loss": 2.431, "step": 157530 }, { "epoch": 0.27, "learning_rate": 3.6263458392770575e-05, "loss": 2.4098, "step": 157540 }, { "epoch": 0.27, "learning_rate": 3.6262586452843745e-05, "loss": 2.4461, "step": 157550 }, { "epoch": 0.27, "learning_rate": 3.626171451291692e-05, "loss": 2.5093, "step": 157560 }, { "epoch": 0.27, "learning_rate": 3.626084257299009e-05, "loss": 2.4942, "step": 157570 }, { "epoch": 0.27, "learning_rate": 3.625997063306327e-05, "loss": 2.4958, "step": 157580 }, { "epoch": 0.27, "learning_rate": 3.625909869313644e-05, "loss": 2.518, "step": 157590 }, { "epoch": 0.27, "learning_rate": 3.625822675320961e-05, "loss": 2.5571, "step": 157600 }, { "epoch": 0.27, "learning_rate": 3.625735481328279e-05, "loss": 2.3392, "step": 157610 }, { "epoch": 0.27, "learning_rate": 3.625648287335596e-05, "loss": 2.4738, "step": 157620 }, { "epoch": 0.27, "learning_rate": 3.6255610933429135e-05, "loss": 2.559, "step": 157630 }, { "epoch": 0.27, "learning_rate": 3.6254738993502306e-05, "loss": 2.4398, "step": 157640 }, { "epoch": 0.27, "learning_rate": 3.625386705357548e-05, "loss": 2.385, "step": 157650 }, { "epoch": 0.27, "learning_rate": 3.625299511364865e-05, "loss": 2.4164, "step": 157660 }, { "epoch": 0.27, "learning_rate": 3.6252123173721824e-05, "loss": 2.5259, "step": 157670 }, { "epoch": 0.27, "learning_rate": 3.6251251233794994e-05, "loss": 2.4383, "step": 157680 }, { "epoch": 0.27, "learning_rate": 3.625037929386817e-05, "loss": 2.5332, "step": 157690 }, { "epoch": 0.28, "learning_rate": 3.624950735394134e-05, "loss": 2.4792, "step": 157700 }, { "epoch": 0.28, "learning_rate": 3.624863541401452e-05, "loss": 2.5096, "step": 157710 }, { "epoch": 0.28, "learning_rate": 3.6247763474087696e-05, "loss": 2.4969, "step": 157720 }, { "epoch": 0.28, "learning_rate": 3.6246891534160866e-05, "loss": 2.3412, "step": 157730 }, { "epoch": 0.28, "learning_rate": 3.6246019594234037e-05, "loss": 2.5155, "step": 157740 }, { "epoch": 0.28, "learning_rate": 3.624514765430721e-05, "loss": 2.3689, "step": 157750 }, { "epoch": 0.28, "learning_rate": 3.6244275714380384e-05, "loss": 2.4016, "step": 157760 }, { "epoch": 0.28, "learning_rate": 3.6243403774453554e-05, "loss": 2.5478, "step": 157770 }, { "epoch": 0.28, "learning_rate": 3.624253183452673e-05, "loss": 2.5229, "step": 157780 }, { "epoch": 0.28, "learning_rate": 3.62416598945999e-05, "loss": 2.5097, "step": 157790 }, { "epoch": 0.28, "learning_rate": 3.624078795467308e-05, "loss": 2.3721, "step": 157800 }, { "epoch": 0.28, "learning_rate": 3.623991601474625e-05, "loss": 2.4563, "step": 157810 }, { "epoch": 0.28, "learning_rate": 3.623904407481942e-05, "loss": 2.4738, "step": 157820 }, { "epoch": 0.28, "learning_rate": 3.62381721348926e-05, "loss": 2.4515, "step": 157830 }, { "epoch": 0.28, "learning_rate": 3.623730019496577e-05, "loss": 2.456, "step": 157840 }, { "epoch": 0.28, "learning_rate": 3.623642825503894e-05, "loss": 2.5649, "step": 157850 }, { "epoch": 0.28, "learning_rate": 3.6235556315112115e-05, "loss": 2.5164, "step": 157860 }, { "epoch": 0.28, "learning_rate": 3.623468437518529e-05, "loss": 2.4528, "step": 157870 }, { "epoch": 0.28, "learning_rate": 3.623381243525846e-05, "loss": 2.4888, "step": 157880 }, { "epoch": 0.28, "learning_rate": 3.623294049533163e-05, "loss": 2.4247, "step": 157890 }, { "epoch": 0.28, "learning_rate": 3.623206855540481e-05, "loss": 2.4001, "step": 157900 }, { "epoch": 0.28, "learning_rate": 3.623119661547798e-05, "loss": 2.5063, "step": 157910 }, { "epoch": 0.28, "learning_rate": 3.623032467555115e-05, "loss": 2.4233, "step": 157920 }, { "epoch": 0.28, "learning_rate": 3.622945273562433e-05, "loss": 2.4055, "step": 157930 }, { "epoch": 0.28, "learning_rate": 3.6228580795697505e-05, "loss": 2.4862, "step": 157940 }, { "epoch": 0.28, "learning_rate": 3.6227708855770676e-05, "loss": 2.4465, "step": 157950 }, { "epoch": 0.28, "learning_rate": 3.6226836915843846e-05, "loss": 2.4754, "step": 157960 }, { "epoch": 0.28, "learning_rate": 3.622596497591702e-05, "loss": 2.4737, "step": 157970 }, { "epoch": 0.28, "learning_rate": 3.6225093035990193e-05, "loss": 2.3204, "step": 157980 }, { "epoch": 0.28, "learning_rate": 3.6224221096063364e-05, "loss": 2.5267, "step": 157990 }, { "epoch": 0.28, "learning_rate": 3.622334915613654e-05, "loss": 2.4259, "step": 158000 }, { "epoch": 0.28, "learning_rate": 3.622247721620972e-05, "loss": 2.3581, "step": 158010 }, { "epoch": 0.28, "learning_rate": 3.622160527628289e-05, "loss": 2.4394, "step": 158020 }, { "epoch": 0.28, "learning_rate": 3.622073333635606e-05, "loss": 2.4651, "step": 158030 }, { "epoch": 0.28, "learning_rate": 3.6219861396429236e-05, "loss": 2.4093, "step": 158040 }, { "epoch": 0.28, "learning_rate": 3.6218989456502406e-05, "loss": 2.3624, "step": 158050 }, { "epoch": 0.28, "learning_rate": 3.621811751657558e-05, "loss": 2.4489, "step": 158060 }, { "epoch": 0.28, "learning_rate": 3.6217245576648754e-05, "loss": 2.464, "step": 158070 }, { "epoch": 0.28, "learning_rate": 3.621637363672193e-05, "loss": 2.6171, "step": 158080 }, { "epoch": 0.28, "learning_rate": 3.62155016967951e-05, "loss": 2.4873, "step": 158090 }, { "epoch": 0.28, "learning_rate": 3.621462975686827e-05, "loss": 2.4508, "step": 158100 }, { "epoch": 0.28, "learning_rate": 3.621375781694145e-05, "loss": 2.5439, "step": 158110 }, { "epoch": 0.28, "learning_rate": 3.621288587701462e-05, "loss": 2.4547, "step": 158120 }, { "epoch": 0.28, "learning_rate": 3.621201393708779e-05, "loss": 2.5828, "step": 158130 }, { "epoch": 0.28, "learning_rate": 3.621114199716096e-05, "loss": 2.5051, "step": 158140 }, { "epoch": 0.28, "learning_rate": 3.621027005723414e-05, "loss": 2.4019, "step": 158150 }, { "epoch": 0.28, "learning_rate": 3.6209398117307315e-05, "loss": 2.4636, "step": 158160 }, { "epoch": 0.28, "learning_rate": 3.6208526177380485e-05, "loss": 2.5634, "step": 158170 }, { "epoch": 0.28, "learning_rate": 3.620765423745366e-05, "loss": 2.4104, "step": 158180 }, { "epoch": 0.28, "learning_rate": 3.620678229752683e-05, "loss": 2.4341, "step": 158190 }, { "epoch": 0.28, "learning_rate": 3.62059103576e-05, "loss": 2.555, "step": 158200 }, { "epoch": 0.28, "learning_rate": 3.620503841767317e-05, "loss": 2.4247, "step": 158210 }, { "epoch": 0.28, "learning_rate": 3.620416647774635e-05, "loss": 2.3986, "step": 158220 }, { "epoch": 0.28, "learning_rate": 3.620329453781953e-05, "loss": 2.3833, "step": 158230 }, { "epoch": 0.28, "learning_rate": 3.62024225978927e-05, "loss": 2.4761, "step": 158240 }, { "epoch": 0.28, "learning_rate": 3.620155065796587e-05, "loss": 2.4916, "step": 158250 }, { "epoch": 0.28, "learning_rate": 3.6200678718039045e-05, "loss": 2.4935, "step": 158260 }, { "epoch": 0.28, "learning_rate": 3.6199806778112216e-05, "loss": 2.4511, "step": 158270 }, { "epoch": 0.28, "learning_rate": 3.6198934838185386e-05, "loss": 2.4797, "step": 158280 }, { "epoch": 0.28, "learning_rate": 3.619806289825856e-05, "loss": 2.4778, "step": 158290 }, { "epoch": 0.28, "learning_rate": 3.619719095833174e-05, "loss": 2.4833, "step": 158300 }, { "epoch": 0.28, "learning_rate": 3.619631901840491e-05, "loss": 2.3816, "step": 158310 }, { "epoch": 0.28, "learning_rate": 3.619544707847808e-05, "loss": 2.4974, "step": 158320 }, { "epoch": 0.28, "learning_rate": 3.619457513855126e-05, "loss": 2.4197, "step": 158330 }, { "epoch": 0.28, "learning_rate": 3.619370319862443e-05, "loss": 2.3479, "step": 158340 }, { "epoch": 0.28, "learning_rate": 3.61928312586976e-05, "loss": 2.4866, "step": 158350 }, { "epoch": 0.28, "learning_rate": 3.6191959318770776e-05, "loss": 2.3751, "step": 158360 }, { "epoch": 0.28, "learning_rate": 3.619108737884395e-05, "loss": 2.5667, "step": 158370 }, { "epoch": 0.28, "learning_rate": 3.6190215438917124e-05, "loss": 2.5504, "step": 158380 }, { "epoch": 0.28, "learning_rate": 3.6189343498990294e-05, "loss": 2.4182, "step": 158390 }, { "epoch": 0.28, "learning_rate": 3.618847155906347e-05, "loss": 2.377, "step": 158400 }, { "epoch": 0.28, "learning_rate": 3.618759961913664e-05, "loss": 2.3578, "step": 158410 }, { "epoch": 0.28, "learning_rate": 3.618672767920981e-05, "loss": 2.572, "step": 158420 }, { "epoch": 0.28, "learning_rate": 3.618585573928299e-05, "loss": 2.3768, "step": 158430 }, { "epoch": 0.28, "learning_rate": 3.618498379935616e-05, "loss": 2.636, "step": 158440 }, { "epoch": 0.28, "learning_rate": 3.618411185942934e-05, "loss": 2.3853, "step": 158450 }, { "epoch": 0.28, "learning_rate": 3.618323991950251e-05, "loss": 2.5109, "step": 158460 }, { "epoch": 0.28, "learning_rate": 3.6182367979575684e-05, "loss": 2.3925, "step": 158470 }, { "epoch": 0.28, "learning_rate": 3.6181496039648855e-05, "loss": 2.5192, "step": 158480 }, { "epoch": 0.28, "learning_rate": 3.6180624099722025e-05, "loss": 2.4908, "step": 158490 }, { "epoch": 0.28, "learning_rate": 3.61797521597952e-05, "loss": 2.5071, "step": 158500 }, { "epoch": 0.28, "learning_rate": 3.617888021986837e-05, "loss": 2.382, "step": 158510 }, { "epoch": 0.28, "learning_rate": 3.617800827994154e-05, "loss": 2.4319, "step": 158520 }, { "epoch": 0.28, "learning_rate": 3.617713634001472e-05, "loss": 2.5312, "step": 158530 }, { "epoch": 0.28, "learning_rate": 3.61762644000879e-05, "loss": 2.3542, "step": 158540 }, { "epoch": 0.28, "learning_rate": 3.617539246016107e-05, "loss": 2.3892, "step": 158550 }, { "epoch": 0.28, "learning_rate": 3.617452052023424e-05, "loss": 2.4892, "step": 158560 }, { "epoch": 0.28, "learning_rate": 3.6173648580307415e-05, "loss": 2.5553, "step": 158570 }, { "epoch": 0.28, "learning_rate": 3.6172776640380586e-05, "loss": 2.5329, "step": 158580 }, { "epoch": 0.28, "learning_rate": 3.6171904700453756e-05, "loss": 2.4897, "step": 158590 }, { "epoch": 0.28, "learning_rate": 3.617103276052693e-05, "loss": 2.4238, "step": 158600 }, { "epoch": 0.28, "learning_rate": 3.617016082060011e-05, "loss": 2.5928, "step": 158610 }, { "epoch": 0.28, "learning_rate": 3.616928888067328e-05, "loss": 2.5827, "step": 158620 }, { "epoch": 0.28, "learning_rate": 3.616841694074645e-05, "loss": 2.4721, "step": 158630 }, { "epoch": 0.28, "learning_rate": 3.616754500081962e-05, "loss": 2.4641, "step": 158640 }, { "epoch": 0.28, "learning_rate": 3.61666730608928e-05, "loss": 2.4211, "step": 158650 }, { "epoch": 0.28, "learning_rate": 3.616580112096597e-05, "loss": 2.506, "step": 158660 }, { "epoch": 0.28, "learning_rate": 3.616492918103914e-05, "loss": 2.3982, "step": 158670 }, { "epoch": 0.28, "learning_rate": 3.6164057241112323e-05, "loss": 2.4974, "step": 158680 }, { "epoch": 0.28, "learning_rate": 3.6163185301185494e-05, "loss": 2.3699, "step": 158690 }, { "epoch": 0.28, "learning_rate": 3.6162313361258664e-05, "loss": 2.4624, "step": 158700 }, { "epoch": 0.28, "learning_rate": 3.6161441421331835e-05, "loss": 2.5034, "step": 158710 }, { "epoch": 0.28, "learning_rate": 3.616056948140501e-05, "loss": 2.3561, "step": 158720 }, { "epoch": 0.28, "learning_rate": 3.615969754147818e-05, "loss": 2.2772, "step": 158730 }, { "epoch": 0.28, "learning_rate": 3.615882560155135e-05, "loss": 2.3848, "step": 158740 }, { "epoch": 0.28, "learning_rate": 3.615795366162453e-05, "loss": 2.4483, "step": 158750 }, { "epoch": 0.28, "learning_rate": 3.615708172169771e-05, "loss": 2.4917, "step": 158760 }, { "epoch": 0.28, "learning_rate": 3.615620978177088e-05, "loss": 2.5059, "step": 158770 }, { "epoch": 0.28, "learning_rate": 3.615533784184405e-05, "loss": 2.4944, "step": 158780 }, { "epoch": 0.28, "learning_rate": 3.6154465901917225e-05, "loss": 2.5317, "step": 158790 }, { "epoch": 0.28, "learning_rate": 3.6153593961990395e-05, "loss": 2.5851, "step": 158800 }, { "epoch": 0.28, "learning_rate": 3.6152722022063566e-05, "loss": 2.4465, "step": 158810 }, { "epoch": 0.28, "learning_rate": 3.615185008213674e-05, "loss": 2.5491, "step": 158820 }, { "epoch": 0.28, "learning_rate": 3.615097814220992e-05, "loss": 2.5602, "step": 158830 }, { "epoch": 0.28, "learning_rate": 3.615010620228309e-05, "loss": 2.4775, "step": 158840 }, { "epoch": 0.28, "learning_rate": 3.614923426235626e-05, "loss": 2.2982, "step": 158850 }, { "epoch": 0.28, "learning_rate": 3.614836232242944e-05, "loss": 2.4727, "step": 158860 }, { "epoch": 0.28, "learning_rate": 3.614749038250261e-05, "loss": 2.4499, "step": 158870 }, { "epoch": 0.28, "learning_rate": 3.614661844257578e-05, "loss": 2.5835, "step": 158880 }, { "epoch": 0.28, "learning_rate": 3.6145746502648956e-05, "loss": 2.4609, "step": 158890 }, { "epoch": 0.28, "learning_rate": 3.614487456272213e-05, "loss": 2.4769, "step": 158900 }, { "epoch": 0.28, "learning_rate": 3.61440026227953e-05, "loss": 2.5274, "step": 158910 }, { "epoch": 0.28, "learning_rate": 3.6143130682868474e-05, "loss": 2.4963, "step": 158920 }, { "epoch": 0.28, "learning_rate": 3.614225874294165e-05, "loss": 2.508, "step": 158930 }, { "epoch": 0.28, "learning_rate": 3.614138680301482e-05, "loss": 2.5174, "step": 158940 }, { "epoch": 0.28, "learning_rate": 3.614051486308799e-05, "loss": 2.4868, "step": 158950 }, { "epoch": 0.28, "learning_rate": 3.613964292316117e-05, "loss": 2.5373, "step": 158960 }, { "epoch": 0.28, "learning_rate": 3.6138770983234346e-05, "loss": 2.479, "step": 158970 }, { "epoch": 0.28, "learning_rate": 3.6137899043307516e-05, "loss": 2.3461, "step": 158980 }, { "epoch": 0.28, "learning_rate": 3.613702710338069e-05, "loss": 2.4132, "step": 158990 }, { "epoch": 0.28, "learning_rate": 3.6136155163453864e-05, "loss": 2.6106, "step": 159000 }, { "epoch": 0.28, "learning_rate": 3.6135283223527034e-05, "loss": 2.4851, "step": 159010 }, { "epoch": 0.28, "learning_rate": 3.6134411283600205e-05, "loss": 2.5289, "step": 159020 }, { "epoch": 0.28, "learning_rate": 3.6133539343673375e-05, "loss": 2.4335, "step": 159030 }, { "epoch": 0.28, "learning_rate": 3.613266740374655e-05, "loss": 2.4513, "step": 159040 }, { "epoch": 0.28, "learning_rate": 3.613179546381973e-05, "loss": 2.4876, "step": 159050 }, { "epoch": 0.28, "learning_rate": 3.61309235238929e-05, "loss": 2.5026, "step": 159060 }, { "epoch": 0.28, "learning_rate": 3.613005158396608e-05, "loss": 2.4494, "step": 159070 }, { "epoch": 0.28, "learning_rate": 3.612917964403925e-05, "loss": 2.4427, "step": 159080 }, { "epoch": 0.28, "learning_rate": 3.612830770411242e-05, "loss": 2.4911, "step": 159090 }, { "epoch": 0.28, "learning_rate": 3.612743576418559e-05, "loss": 2.5413, "step": 159100 }, { "epoch": 0.28, "learning_rate": 3.6126563824258765e-05, "loss": 2.4199, "step": 159110 }, { "epoch": 0.28, "learning_rate": 3.612569188433194e-05, "loss": 2.3814, "step": 159120 }, { "epoch": 0.28, "learning_rate": 3.612481994440511e-05, "loss": 2.4526, "step": 159130 }, { "epoch": 0.28, "learning_rate": 3.612394800447828e-05, "loss": 2.4609, "step": 159140 }, { "epoch": 0.28, "learning_rate": 3.612307606455146e-05, "loss": 2.5237, "step": 159150 }, { "epoch": 0.28, "learning_rate": 3.612220412462463e-05, "loss": 2.4578, "step": 159160 }, { "epoch": 0.28, "learning_rate": 3.61213321846978e-05, "loss": 2.4745, "step": 159170 }, { "epoch": 0.28, "learning_rate": 3.612046024477098e-05, "loss": 2.5355, "step": 159180 }, { "epoch": 0.28, "learning_rate": 3.611958830484415e-05, "loss": 2.5195, "step": 159190 }, { "epoch": 0.28, "learning_rate": 3.6118716364917326e-05, "loss": 2.532, "step": 159200 }, { "epoch": 0.28, "learning_rate": 3.6117844424990496e-05, "loss": 2.517, "step": 159210 }, { "epoch": 0.28, "learning_rate": 3.611697248506367e-05, "loss": 2.4345, "step": 159220 }, { "epoch": 0.28, "learning_rate": 3.6116100545136844e-05, "loss": 2.4636, "step": 159230 }, { "epoch": 0.28, "learning_rate": 3.6115228605210014e-05, "loss": 2.4148, "step": 159240 }, { "epoch": 0.28, "learning_rate": 3.611435666528319e-05, "loss": 2.5263, "step": 159250 }, { "epoch": 0.28, "learning_rate": 3.611348472535636e-05, "loss": 2.5123, "step": 159260 }, { "epoch": 0.28, "learning_rate": 3.611261278542954e-05, "loss": 2.4818, "step": 159270 }, { "epoch": 0.28, "learning_rate": 3.611174084550271e-05, "loss": 2.4063, "step": 159280 }, { "epoch": 0.28, "learning_rate": 3.6110868905575886e-05, "loss": 2.4991, "step": 159290 }, { "epoch": 0.28, "learning_rate": 3.6109996965649057e-05, "loss": 2.4683, "step": 159300 }, { "epoch": 0.28, "learning_rate": 3.610912502572223e-05, "loss": 2.3689, "step": 159310 }, { "epoch": 0.28, "learning_rate": 3.6108253085795404e-05, "loss": 2.4414, "step": 159320 }, { "epoch": 0.28, "learning_rate": 3.6107381145868574e-05, "loss": 2.405, "step": 159330 }, { "epoch": 0.28, "learning_rate": 3.6106509205941745e-05, "loss": 2.5283, "step": 159340 }, { "epoch": 0.28, "learning_rate": 3.610563726601492e-05, "loss": 2.5163, "step": 159350 }, { "epoch": 0.28, "learning_rate": 3.61047653260881e-05, "loss": 2.4752, "step": 159360 }, { "epoch": 0.28, "learning_rate": 3.610389338616127e-05, "loss": 2.5769, "step": 159370 }, { "epoch": 0.28, "learning_rate": 3.610302144623444e-05, "loss": 2.4702, "step": 159380 }, { "epoch": 0.28, "learning_rate": 3.610214950630762e-05, "loss": 2.5041, "step": 159390 }, { "epoch": 0.28, "learning_rate": 3.610127756638079e-05, "loss": 2.4992, "step": 159400 }, { "epoch": 0.28, "learning_rate": 3.610040562645396e-05, "loss": 2.4641, "step": 159410 }, { "epoch": 0.28, "learning_rate": 3.6099533686527135e-05, "loss": 2.4176, "step": 159420 }, { "epoch": 0.28, "learning_rate": 3.609866174660031e-05, "loss": 2.502, "step": 159430 }, { "epoch": 0.28, "learning_rate": 3.609778980667348e-05, "loss": 2.4075, "step": 159440 }, { "epoch": 0.28, "learning_rate": 3.609691786674665e-05, "loss": 2.4912, "step": 159450 }, { "epoch": 0.28, "learning_rate": 3.609604592681983e-05, "loss": 2.5276, "step": 159460 }, { "epoch": 0.28, "learning_rate": 3.6095173986893e-05, "loss": 2.4742, "step": 159470 }, { "epoch": 0.28, "learning_rate": 3.609430204696617e-05, "loss": 2.475, "step": 159480 }, { "epoch": 0.28, "learning_rate": 3.609343010703935e-05, "loss": 2.405, "step": 159490 }, { "epoch": 0.28, "learning_rate": 3.6092558167112525e-05, "loss": 2.4384, "step": 159500 }, { "epoch": 0.28, "learning_rate": 3.6091686227185696e-05, "loss": 2.5349, "step": 159510 }, { "epoch": 0.28, "learning_rate": 3.6090814287258866e-05, "loss": 2.4869, "step": 159520 }, { "epoch": 0.28, "learning_rate": 3.608994234733204e-05, "loss": 2.4231, "step": 159530 }, { "epoch": 0.28, "learning_rate": 3.6089070407405213e-05, "loss": 2.5343, "step": 159540 }, { "epoch": 0.28, "learning_rate": 3.6088198467478384e-05, "loss": 2.4278, "step": 159550 }, { "epoch": 0.28, "learning_rate": 3.6087326527551554e-05, "loss": 2.3507, "step": 159560 }, { "epoch": 0.28, "learning_rate": 3.608645458762474e-05, "loss": 2.3748, "step": 159570 }, { "epoch": 0.28, "learning_rate": 3.608558264769791e-05, "loss": 2.3294, "step": 159580 }, { "epoch": 0.28, "learning_rate": 3.608471070777108e-05, "loss": 2.3537, "step": 159590 }, { "epoch": 0.28, "learning_rate": 3.608383876784425e-05, "loss": 2.4014, "step": 159600 }, { "epoch": 0.28, "learning_rate": 3.6082966827917426e-05, "loss": 2.4964, "step": 159610 }, { "epoch": 0.28, "learning_rate": 3.60820948879906e-05, "loss": 2.5006, "step": 159620 }, { "epoch": 0.28, "learning_rate": 3.608122294806377e-05, "loss": 2.3333, "step": 159630 }, { "epoch": 0.28, "learning_rate": 3.608035100813695e-05, "loss": 2.5203, "step": 159640 }, { "epoch": 0.28, "learning_rate": 3.607947906821012e-05, "loss": 2.4291, "step": 159650 }, { "epoch": 0.28, "learning_rate": 3.607860712828329e-05, "loss": 2.5787, "step": 159660 }, { "epoch": 0.28, "learning_rate": 3.607773518835646e-05, "loss": 2.5119, "step": 159670 }, { "epoch": 0.28, "learning_rate": 3.607686324842964e-05, "loss": 2.382, "step": 159680 }, { "epoch": 0.28, "learning_rate": 3.607599130850281e-05, "loss": 2.5071, "step": 159690 }, { "epoch": 0.28, "learning_rate": 3.607511936857598e-05, "loss": 2.5098, "step": 159700 }, { "epoch": 0.28, "learning_rate": 3.607424742864916e-05, "loss": 2.5453, "step": 159710 }, { "epoch": 0.28, "learning_rate": 3.6073375488722335e-05, "loss": 2.4523, "step": 159720 }, { "epoch": 0.28, "learning_rate": 3.6072503548795505e-05, "loss": 2.3715, "step": 159730 }, { "epoch": 0.28, "learning_rate": 3.6071631608868675e-05, "loss": 2.5125, "step": 159740 }, { "epoch": 0.28, "learning_rate": 3.607075966894185e-05, "loss": 2.4511, "step": 159750 }, { "epoch": 0.28, "learning_rate": 3.606988772901502e-05, "loss": 2.5003, "step": 159760 }, { "epoch": 0.28, "learning_rate": 3.606901578908819e-05, "loss": 2.4033, "step": 159770 }, { "epoch": 0.28, "learning_rate": 3.606814384916137e-05, "loss": 2.3536, "step": 159780 }, { "epoch": 0.28, "learning_rate": 3.606727190923455e-05, "loss": 2.3868, "step": 159790 }, { "epoch": 0.28, "learning_rate": 3.606639996930772e-05, "loss": 2.3987, "step": 159800 }, { "epoch": 0.28, "learning_rate": 3.606552802938089e-05, "loss": 2.5167, "step": 159810 }, { "epoch": 0.28, "learning_rate": 3.6064656089454065e-05, "loss": 2.5118, "step": 159820 }, { "epoch": 0.28, "learning_rate": 3.6063784149527236e-05, "loss": 2.4024, "step": 159830 }, { "epoch": 0.28, "learning_rate": 3.6062912209600406e-05, "loss": 2.4471, "step": 159840 }, { "epoch": 0.28, "learning_rate": 3.6062040269673583e-05, "loss": 2.4761, "step": 159850 }, { "epoch": 0.28, "learning_rate": 3.6061168329746754e-05, "loss": 2.566, "step": 159860 }, { "epoch": 0.28, "learning_rate": 3.606029638981993e-05, "loss": 2.4395, "step": 159870 }, { "epoch": 0.28, "learning_rate": 3.60594244498931e-05, "loss": 2.3773, "step": 159880 }, { "epoch": 0.28, "learning_rate": 3.605855250996628e-05, "loss": 2.5625, "step": 159890 }, { "epoch": 0.28, "learning_rate": 3.605768057003945e-05, "loss": 2.3982, "step": 159900 }, { "epoch": 0.28, "learning_rate": 3.605680863011262e-05, "loss": 2.5109, "step": 159910 }, { "epoch": 0.28, "learning_rate": 3.6055936690185796e-05, "loss": 2.4417, "step": 159920 }, { "epoch": 0.28, "learning_rate": 3.605506475025897e-05, "loss": 2.5569, "step": 159930 }, { "epoch": 0.28, "learning_rate": 3.6054192810332144e-05, "loss": 2.4019, "step": 159940 }, { "epoch": 0.28, "learning_rate": 3.6053320870405314e-05, "loss": 2.3759, "step": 159950 }, { "epoch": 0.28, "learning_rate": 3.605244893047849e-05, "loss": 2.5832, "step": 159960 }, { "epoch": 0.28, "learning_rate": 3.605157699055166e-05, "loss": 2.4822, "step": 159970 }, { "epoch": 0.28, "learning_rate": 3.605070505062483e-05, "loss": 2.5388, "step": 159980 }, { "epoch": 0.28, "learning_rate": 3.6049833110698e-05, "loss": 2.4319, "step": 159990 }, { "epoch": 0.28, "learning_rate": 3.604896117077118e-05, "loss": 2.4019, "step": 160000 }, { "epoch": 0.28, "learning_rate": 3.604808923084435e-05, "loss": 2.4911, "step": 160010 }, { "epoch": 0.28, "learning_rate": 3.604721729091753e-05, "loss": 2.3876, "step": 160020 }, { "epoch": 0.28, "learning_rate": 3.6046345350990704e-05, "loss": 2.6499, "step": 160030 }, { "epoch": 0.28, "learning_rate": 3.6045473411063875e-05, "loss": 2.5657, "step": 160040 }, { "epoch": 0.28, "learning_rate": 3.6044601471137045e-05, "loss": 2.4525, "step": 160050 }, { "epoch": 0.28, "learning_rate": 3.6043729531210216e-05, "loss": 2.527, "step": 160060 }, { "epoch": 0.28, "learning_rate": 3.604285759128339e-05, "loss": 2.5589, "step": 160070 }, { "epoch": 0.28, "learning_rate": 3.604198565135656e-05, "loss": 2.5113, "step": 160080 }, { "epoch": 0.28, "learning_rate": 3.604111371142974e-05, "loss": 2.5132, "step": 160090 }, { "epoch": 0.28, "learning_rate": 3.604024177150291e-05, "loss": 2.4847, "step": 160100 }, { "epoch": 0.28, "learning_rate": 3.603936983157609e-05, "loss": 2.365, "step": 160110 }, { "epoch": 0.28, "learning_rate": 3.603849789164926e-05, "loss": 2.5025, "step": 160120 }, { "epoch": 0.28, "learning_rate": 3.603762595172243e-05, "loss": 2.4683, "step": 160130 }, { "epoch": 0.28, "learning_rate": 3.6036754011795606e-05, "loss": 2.5249, "step": 160140 }, { "epoch": 0.28, "learning_rate": 3.6035882071868776e-05, "loss": 2.4792, "step": 160150 }, { "epoch": 0.28, "learning_rate": 3.603501013194195e-05, "loss": 2.5081, "step": 160160 }, { "epoch": 0.28, "learning_rate": 3.6034138192015124e-05, "loss": 2.3498, "step": 160170 }, { "epoch": 0.28, "learning_rate": 3.60332662520883e-05, "loss": 2.54, "step": 160180 }, { "epoch": 0.28, "learning_rate": 3.603239431216147e-05, "loss": 2.4053, "step": 160190 }, { "epoch": 0.28, "learning_rate": 3.603152237223464e-05, "loss": 2.4748, "step": 160200 }, { "epoch": 0.28, "learning_rate": 3.603065043230782e-05, "loss": 2.475, "step": 160210 }, { "epoch": 0.28, "learning_rate": 3.602977849238099e-05, "loss": 2.5056, "step": 160220 }, { "epoch": 0.28, "learning_rate": 3.602890655245416e-05, "loss": 2.533, "step": 160230 }, { "epoch": 0.28, "learning_rate": 3.602803461252734e-05, "loss": 2.509, "step": 160240 }, { "epoch": 0.28, "learning_rate": 3.6027162672600514e-05, "loss": 2.5158, "step": 160250 }, { "epoch": 0.28, "learning_rate": 3.6026290732673684e-05, "loss": 2.43, "step": 160260 }, { "epoch": 0.28, "learning_rate": 3.6025418792746855e-05, "loss": 2.3634, "step": 160270 }, { "epoch": 0.28, "learning_rate": 3.602454685282003e-05, "loss": 2.4561, "step": 160280 }, { "epoch": 0.28, "learning_rate": 3.60236749128932e-05, "loss": 2.4939, "step": 160290 }, { "epoch": 0.28, "learning_rate": 3.602280297296637e-05, "loss": 2.533, "step": 160300 }, { "epoch": 0.28, "learning_rate": 3.602193103303955e-05, "loss": 2.4733, "step": 160310 }, { "epoch": 0.28, "learning_rate": 3.602105909311273e-05, "loss": 2.5626, "step": 160320 }, { "epoch": 0.28, "learning_rate": 3.60201871531859e-05, "loss": 2.4411, "step": 160330 }, { "epoch": 0.28, "learning_rate": 3.601931521325907e-05, "loss": 2.4735, "step": 160340 }, { "epoch": 0.28, "learning_rate": 3.6018443273332245e-05, "loss": 2.5209, "step": 160350 }, { "epoch": 0.28, "learning_rate": 3.6017571333405415e-05, "loss": 2.3299, "step": 160360 }, { "epoch": 0.28, "learning_rate": 3.6016699393478586e-05, "loss": 2.6316, "step": 160370 }, { "epoch": 0.28, "learning_rate": 3.6015827453551756e-05, "loss": 2.5081, "step": 160380 }, { "epoch": 0.28, "learning_rate": 3.601495551362494e-05, "loss": 2.5134, "step": 160390 }, { "epoch": 0.28, "learning_rate": 3.601408357369811e-05, "loss": 2.39, "step": 160400 }, { "epoch": 0.28, "learning_rate": 3.601321163377128e-05, "loss": 2.4445, "step": 160410 }, { "epoch": 0.28, "learning_rate": 3.601233969384446e-05, "loss": 2.5235, "step": 160420 }, { "epoch": 0.28, "learning_rate": 3.601146775391763e-05, "loss": 2.5852, "step": 160430 }, { "epoch": 0.28, "learning_rate": 3.60105958139908e-05, "loss": 2.3619, "step": 160440 }, { "epoch": 0.28, "learning_rate": 3.600972387406397e-05, "loss": 2.5189, "step": 160450 }, { "epoch": 0.28, "learning_rate": 3.600885193413715e-05, "loss": 2.5251, "step": 160460 }, { "epoch": 0.28, "learning_rate": 3.600797999421032e-05, "loss": 2.5485, "step": 160470 }, { "epoch": 0.28, "learning_rate": 3.6007108054283494e-05, "loss": 2.5654, "step": 160480 }, { "epoch": 0.28, "learning_rate": 3.6006236114356664e-05, "loss": 2.5539, "step": 160490 }, { "epoch": 0.28, "learning_rate": 3.600536417442984e-05, "loss": 2.3799, "step": 160500 }, { "epoch": 0.28, "learning_rate": 3.600449223450301e-05, "loss": 2.4116, "step": 160510 }, { "epoch": 0.28, "learning_rate": 3.600362029457618e-05, "loss": 2.5031, "step": 160520 }, { "epoch": 0.28, "learning_rate": 3.600274835464936e-05, "loss": 2.5526, "step": 160530 }, { "epoch": 0.28, "learning_rate": 3.6001876414722536e-05, "loss": 2.501, "step": 160540 }, { "epoch": 0.28, "learning_rate": 3.600100447479571e-05, "loss": 2.5118, "step": 160550 }, { "epoch": 0.28, "learning_rate": 3.600013253486888e-05, "loss": 2.3993, "step": 160560 }, { "epoch": 0.28, "learning_rate": 3.5999260594942054e-05, "loss": 2.4398, "step": 160570 }, { "epoch": 0.28, "learning_rate": 3.5998388655015225e-05, "loss": 2.475, "step": 160580 }, { "epoch": 0.28, "learning_rate": 3.5997516715088395e-05, "loss": 2.4782, "step": 160590 }, { "epoch": 0.28, "learning_rate": 3.599664477516157e-05, "loss": 2.4373, "step": 160600 }, { "epoch": 0.28, "learning_rate": 3.599577283523475e-05, "loss": 2.4974, "step": 160610 }, { "epoch": 0.28, "learning_rate": 3.599490089530792e-05, "loss": 2.5432, "step": 160620 }, { "epoch": 0.28, "learning_rate": 3.599402895538109e-05, "loss": 2.4291, "step": 160630 }, { "epoch": 0.28, "learning_rate": 3.599315701545427e-05, "loss": 2.5297, "step": 160640 }, { "epoch": 0.28, "learning_rate": 3.599228507552744e-05, "loss": 2.428, "step": 160650 }, { "epoch": 0.28, "learning_rate": 3.599141313560061e-05, "loss": 2.5287, "step": 160660 }, { "epoch": 0.28, "learning_rate": 3.5990541195673785e-05, "loss": 2.489, "step": 160670 }, { "epoch": 0.28, "learning_rate": 3.5989669255746955e-05, "loss": 2.4336, "step": 160680 }, { "epoch": 0.28, "learning_rate": 3.598879731582013e-05, "loss": 2.4365, "step": 160690 }, { "epoch": 0.28, "learning_rate": 3.59879253758933e-05, "loss": 2.523, "step": 160700 }, { "epoch": 0.28, "learning_rate": 3.598705343596648e-05, "loss": 2.4898, "step": 160710 }, { "epoch": 0.28, "learning_rate": 3.598618149603965e-05, "loss": 2.51, "step": 160720 }, { "epoch": 0.28, "learning_rate": 3.598530955611282e-05, "loss": 2.3696, "step": 160730 }, { "epoch": 0.28, "learning_rate": 3.5984437616186e-05, "loss": 2.4365, "step": 160740 }, { "epoch": 0.28, "learning_rate": 3.598356567625917e-05, "loss": 2.5552, "step": 160750 }, { "epoch": 0.28, "learning_rate": 3.5982693736332346e-05, "loss": 2.373, "step": 160760 }, { "epoch": 0.28, "learning_rate": 3.5981821796405516e-05, "loss": 2.5448, "step": 160770 }, { "epoch": 0.28, "learning_rate": 3.598094985647869e-05, "loss": 2.4785, "step": 160780 }, { "epoch": 0.28, "learning_rate": 3.5980077916551864e-05, "loss": 2.4516, "step": 160790 }, { "epoch": 0.28, "learning_rate": 3.5979205976625034e-05, "loss": 2.4978, "step": 160800 }, { "epoch": 0.28, "learning_rate": 3.597833403669821e-05, "loss": 2.42, "step": 160810 }, { "epoch": 0.28, "learning_rate": 3.597746209677138e-05, "loss": 2.4461, "step": 160820 }, { "epoch": 0.28, "learning_rate": 3.597659015684456e-05, "loss": 2.45, "step": 160830 }, { "epoch": 0.28, "learning_rate": 3.597571821691773e-05, "loss": 2.371, "step": 160840 }, { "epoch": 0.28, "learning_rate": 3.5974846276990906e-05, "loss": 2.4641, "step": 160850 }, { "epoch": 0.28, "learning_rate": 3.5973974337064077e-05, "loss": 2.5072, "step": 160860 }, { "epoch": 0.28, "learning_rate": 3.597310239713725e-05, "loss": 2.5882, "step": 160870 }, { "epoch": 0.28, "learning_rate": 3.5972230457210424e-05, "loss": 2.512, "step": 160880 }, { "epoch": 0.28, "learning_rate": 3.5971358517283594e-05, "loss": 2.4811, "step": 160890 }, { "epoch": 0.28, "learning_rate": 3.5970486577356765e-05, "loss": 2.4684, "step": 160900 }, { "epoch": 0.28, "learning_rate": 3.596961463742994e-05, "loss": 2.4771, "step": 160910 }, { "epoch": 0.28, "learning_rate": 3.596874269750312e-05, "loss": 2.528, "step": 160920 }, { "epoch": 0.28, "learning_rate": 3.596787075757629e-05, "loss": 2.4297, "step": 160930 }, { "epoch": 0.28, "learning_rate": 3.596699881764946e-05, "loss": 2.5184, "step": 160940 }, { "epoch": 0.28, "learning_rate": 3.596612687772263e-05, "loss": 2.5246, "step": 160950 }, { "epoch": 0.28, "learning_rate": 3.596525493779581e-05, "loss": 2.3287, "step": 160960 }, { "epoch": 0.28, "learning_rate": 3.596438299786898e-05, "loss": 2.5457, "step": 160970 }, { "epoch": 0.28, "learning_rate": 3.5963511057942155e-05, "loss": 2.4036, "step": 160980 }, { "epoch": 0.28, "learning_rate": 3.596263911801533e-05, "loss": 2.5145, "step": 160990 }, { "epoch": 0.28, "learning_rate": 3.59617671780885e-05, "loss": 2.4885, "step": 161000 }, { "epoch": 0.28, "learning_rate": 3.596089523816167e-05, "loss": 2.6295, "step": 161010 }, { "epoch": 0.28, "learning_rate": 3.596002329823484e-05, "loss": 2.4541, "step": 161020 }, { "epoch": 0.28, "learning_rate": 3.595915135830802e-05, "loss": 2.4291, "step": 161030 }, { "epoch": 0.28, "learning_rate": 3.595827941838119e-05, "loss": 2.5297, "step": 161040 }, { "epoch": 0.28, "learning_rate": 3.595740747845436e-05, "loss": 2.3596, "step": 161050 }, { "epoch": 0.28, "learning_rate": 3.595653553852754e-05, "loss": 2.535, "step": 161060 }, { "epoch": 0.28, "learning_rate": 3.5955663598600716e-05, "loss": 2.4637, "step": 161070 }, { "epoch": 0.28, "learning_rate": 3.5954791658673886e-05, "loss": 2.4817, "step": 161080 }, { "epoch": 0.28, "learning_rate": 3.5953919718747056e-05, "loss": 2.3421, "step": 161090 }, { "epoch": 0.28, "learning_rate": 3.5953047778820233e-05, "loss": 2.4885, "step": 161100 }, { "epoch": 0.28, "learning_rate": 3.5952175838893404e-05, "loss": 2.4621, "step": 161110 }, { "epoch": 0.28, "learning_rate": 3.5951303898966574e-05, "loss": 2.5066, "step": 161120 }, { "epoch": 0.28, "learning_rate": 3.595043195903975e-05, "loss": 2.4639, "step": 161130 }, { "epoch": 0.28, "learning_rate": 3.594956001911293e-05, "loss": 2.3893, "step": 161140 }, { "epoch": 0.28, "learning_rate": 3.59486880791861e-05, "loss": 2.552, "step": 161150 }, { "epoch": 0.28, "learning_rate": 3.594781613925927e-05, "loss": 2.4569, "step": 161160 }, { "epoch": 0.28, "learning_rate": 3.5946944199332446e-05, "loss": 2.5544, "step": 161170 }, { "epoch": 0.28, "learning_rate": 3.594607225940562e-05, "loss": 2.4857, "step": 161180 }, { "epoch": 0.28, "learning_rate": 3.594520031947879e-05, "loss": 2.518, "step": 161190 }, { "epoch": 0.28, "learning_rate": 3.5944328379551964e-05, "loss": 2.5083, "step": 161200 }, { "epoch": 0.28, "learning_rate": 3.594345643962514e-05, "loss": 2.4356, "step": 161210 }, { "epoch": 0.28, "learning_rate": 3.594258449969831e-05, "loss": 2.4845, "step": 161220 }, { "epoch": 0.28, "learning_rate": 3.594171255977148e-05, "loss": 2.4358, "step": 161230 }, { "epoch": 0.28, "learning_rate": 3.594084061984466e-05, "loss": 2.4577, "step": 161240 }, { "epoch": 0.28, "learning_rate": 3.593996867991783e-05, "loss": 2.4873, "step": 161250 }, { "epoch": 0.28, "learning_rate": 3.5939096739991e-05, "loss": 2.5052, "step": 161260 }, { "epoch": 0.28, "learning_rate": 3.593822480006418e-05, "loss": 2.4967, "step": 161270 }, { "epoch": 0.28, "learning_rate": 3.5937352860137355e-05, "loss": 2.4035, "step": 161280 }, { "epoch": 0.28, "learning_rate": 3.5936480920210525e-05, "loss": 2.4148, "step": 161290 }, { "epoch": 0.28, "learning_rate": 3.5935608980283695e-05, "loss": 2.535, "step": 161300 }, { "epoch": 0.28, "learning_rate": 3.593473704035687e-05, "loss": 2.4256, "step": 161310 }, { "epoch": 0.28, "learning_rate": 3.593386510043004e-05, "loss": 2.4302, "step": 161320 }, { "epoch": 0.28, "learning_rate": 3.593299316050321e-05, "loss": 2.5056, "step": 161330 }, { "epoch": 0.28, "learning_rate": 3.5932121220576384e-05, "loss": 2.4575, "step": 161340 }, { "epoch": 0.28, "learning_rate": 3.593124928064957e-05, "loss": 2.3701, "step": 161350 }, { "epoch": 0.28, "learning_rate": 3.593037734072274e-05, "loss": 2.5588, "step": 161360 }, { "epoch": 0.28, "learning_rate": 3.592950540079591e-05, "loss": 2.3768, "step": 161370 }, { "epoch": 0.28, "learning_rate": 3.5928633460869085e-05, "loss": 2.516, "step": 161380 }, { "epoch": 0.28, "learning_rate": 3.5927761520942256e-05, "loss": 2.264, "step": 161390 }, { "epoch": 0.28, "learning_rate": 3.5926889581015426e-05, "loss": 2.5461, "step": 161400 }, { "epoch": 0.28, "learning_rate": 3.59260176410886e-05, "loss": 2.4103, "step": 161410 }, { "epoch": 0.28, "learning_rate": 3.5925145701161774e-05, "loss": 2.525, "step": 161420 }, { "epoch": 0.28, "learning_rate": 3.592427376123495e-05, "loss": 2.4775, "step": 161430 }, { "epoch": 0.28, "learning_rate": 3.592340182130812e-05, "loss": 2.4087, "step": 161440 }, { "epoch": 0.28, "learning_rate": 3.592252988138129e-05, "loss": 2.4634, "step": 161450 }, { "epoch": 0.28, "learning_rate": 3.592165794145447e-05, "loss": 2.5198, "step": 161460 }, { "epoch": 0.28, "learning_rate": 3.592078600152764e-05, "loss": 2.4963, "step": 161470 }, { "epoch": 0.28, "learning_rate": 3.591991406160081e-05, "loss": 2.4908, "step": 161480 }, { "epoch": 0.28, "learning_rate": 3.591904212167399e-05, "loss": 2.4373, "step": 161490 }, { "epoch": 0.28, "learning_rate": 3.5918170181747164e-05, "loss": 2.4841, "step": 161500 }, { "epoch": 0.28, "learning_rate": 3.5917298241820334e-05, "loss": 2.5065, "step": 161510 }, { "epoch": 0.28, "learning_rate": 3.5916426301893505e-05, "loss": 2.4846, "step": 161520 }, { "epoch": 0.28, "learning_rate": 3.591555436196668e-05, "loss": 2.4356, "step": 161530 }, { "epoch": 0.28, "learning_rate": 3.591468242203985e-05, "loss": 2.3448, "step": 161540 }, { "epoch": 0.28, "learning_rate": 3.591381048211302e-05, "loss": 2.4578, "step": 161550 }, { "epoch": 0.28, "learning_rate": 3.59129385421862e-05, "loss": 2.4142, "step": 161560 }, { "epoch": 0.28, "learning_rate": 3.591206660225937e-05, "loss": 2.4362, "step": 161570 }, { "epoch": 0.28, "learning_rate": 3.591119466233255e-05, "loss": 2.4127, "step": 161580 }, { "epoch": 0.28, "learning_rate": 3.591032272240572e-05, "loss": 2.4763, "step": 161590 }, { "epoch": 0.28, "learning_rate": 3.5909450782478895e-05, "loss": 2.4136, "step": 161600 }, { "epoch": 0.28, "learning_rate": 3.5908578842552065e-05, "loss": 2.4938, "step": 161610 }, { "epoch": 0.28, "learning_rate": 3.5907706902625236e-05, "loss": 2.4925, "step": 161620 }, { "epoch": 0.28, "learning_rate": 3.590683496269841e-05, "loss": 2.3786, "step": 161630 }, { "epoch": 0.28, "learning_rate": 3.590596302277158e-05, "loss": 2.4216, "step": 161640 }, { "epoch": 0.28, "learning_rate": 3.590509108284476e-05, "loss": 2.5383, "step": 161650 }, { "epoch": 0.28, "learning_rate": 3.590421914291793e-05, "loss": 2.4748, "step": 161660 }, { "epoch": 0.28, "learning_rate": 3.590334720299111e-05, "loss": 2.475, "step": 161670 }, { "epoch": 0.28, "learning_rate": 3.590247526306428e-05, "loss": 2.4389, "step": 161680 }, { "epoch": 0.28, "learning_rate": 3.590160332313745e-05, "loss": 2.3216, "step": 161690 }, { "epoch": 0.28, "learning_rate": 3.5900731383210626e-05, "loss": 2.4488, "step": 161700 }, { "epoch": 0.28, "learning_rate": 3.5899859443283796e-05, "loss": 2.4684, "step": 161710 }, { "epoch": 0.28, "learning_rate": 3.5898987503356967e-05, "loss": 2.3212, "step": 161720 }, { "epoch": 0.28, "learning_rate": 3.5898115563430144e-05, "loss": 2.3901, "step": 161730 }, { "epoch": 0.28, "learning_rate": 3.589724362350332e-05, "loss": 2.5628, "step": 161740 }, { "epoch": 0.28, "learning_rate": 3.589637168357649e-05, "loss": 2.4605, "step": 161750 }, { "epoch": 0.28, "learning_rate": 3.589549974364966e-05, "loss": 2.5451, "step": 161760 }, { "epoch": 0.28, "learning_rate": 3.589462780372284e-05, "loss": 2.3324, "step": 161770 }, { "epoch": 0.28, "learning_rate": 3.589375586379601e-05, "loss": 2.3672, "step": 161780 }, { "epoch": 0.28, "learning_rate": 3.589288392386918e-05, "loss": 2.4037, "step": 161790 }, { "epoch": 0.28, "learning_rate": 3.589201198394236e-05, "loss": 2.539, "step": 161800 }, { "epoch": 0.28, "learning_rate": 3.5891140044015534e-05, "loss": 2.4081, "step": 161810 }, { "epoch": 0.28, "learning_rate": 3.5890268104088704e-05, "loss": 2.5872, "step": 161820 }, { "epoch": 0.28, "learning_rate": 3.5889396164161875e-05, "loss": 2.5146, "step": 161830 }, { "epoch": 0.28, "learning_rate": 3.5888524224235045e-05, "loss": 2.562, "step": 161840 }, { "epoch": 0.28, "learning_rate": 3.588765228430822e-05, "loss": 2.5189, "step": 161850 }, { "epoch": 0.28, "learning_rate": 3.588678034438139e-05, "loss": 2.3453, "step": 161860 }, { "epoch": 0.28, "learning_rate": 3.588590840445456e-05, "loss": 2.4748, "step": 161870 }, { "epoch": 0.28, "learning_rate": 3.588503646452775e-05, "loss": 2.4053, "step": 161880 }, { "epoch": 0.28, "learning_rate": 3.588416452460092e-05, "loss": 2.4021, "step": 161890 }, { "epoch": 0.28, "learning_rate": 3.588329258467409e-05, "loss": 2.4935, "step": 161900 }, { "epoch": 0.28, "learning_rate": 3.588242064474726e-05, "loss": 2.581, "step": 161910 }, { "epoch": 0.28, "learning_rate": 3.5881548704820435e-05, "loss": 2.4478, "step": 161920 }, { "epoch": 0.28, "learning_rate": 3.5880676764893606e-05, "loss": 2.4383, "step": 161930 }, { "epoch": 0.28, "learning_rate": 3.5879804824966776e-05, "loss": 2.4971, "step": 161940 }, { "epoch": 0.28, "learning_rate": 3.587893288503995e-05, "loss": 2.4982, "step": 161950 }, { "epoch": 0.28, "learning_rate": 3.587806094511313e-05, "loss": 2.4975, "step": 161960 }, { "epoch": 0.28, "learning_rate": 3.58771890051863e-05, "loss": 2.4346, "step": 161970 }, { "epoch": 0.28, "learning_rate": 3.587631706525947e-05, "loss": 2.4912, "step": 161980 }, { "epoch": 0.28, "learning_rate": 3.587544512533265e-05, "loss": 2.373, "step": 161990 }, { "epoch": 0.28, "learning_rate": 3.587457318540582e-05, "loss": 2.5432, "step": 162000 }, { "epoch": 0.28, "learning_rate": 3.587370124547899e-05, "loss": 2.5072, "step": 162010 }, { "epoch": 0.28, "learning_rate": 3.5872829305552166e-05, "loss": 2.4547, "step": 162020 }, { "epoch": 0.28, "learning_rate": 3.587195736562534e-05, "loss": 2.5613, "step": 162030 }, { "epoch": 0.28, "learning_rate": 3.5871085425698514e-05, "loss": 2.4657, "step": 162040 }, { "epoch": 0.28, "learning_rate": 3.5870213485771684e-05, "loss": 2.5226, "step": 162050 }, { "epoch": 0.28, "learning_rate": 3.586934154584486e-05, "loss": 2.4084, "step": 162060 }, { "epoch": 0.28, "learning_rate": 3.586846960591803e-05, "loss": 2.3903, "step": 162070 }, { "epoch": 0.28, "learning_rate": 3.58675976659912e-05, "loss": 2.4147, "step": 162080 }, { "epoch": 0.28, "learning_rate": 3.586672572606438e-05, "loss": 2.5282, "step": 162090 }, { "epoch": 0.28, "learning_rate": 3.5865853786137556e-05, "loss": 2.4644, "step": 162100 }, { "epoch": 0.28, "learning_rate": 3.586498184621073e-05, "loss": 2.4641, "step": 162110 }, { "epoch": 0.28, "learning_rate": 3.58641099062839e-05, "loss": 2.4437, "step": 162120 }, { "epoch": 0.28, "learning_rate": 3.5863237966357074e-05, "loss": 2.3976, "step": 162130 }, { "epoch": 0.28, "learning_rate": 3.5862366026430245e-05, "loss": 2.5111, "step": 162140 }, { "epoch": 0.28, "learning_rate": 3.5861494086503415e-05, "loss": 2.4028, "step": 162150 }, { "epoch": 0.28, "learning_rate": 3.586062214657659e-05, "loss": 2.5139, "step": 162160 }, { "epoch": 0.28, "learning_rate": 3.585975020664977e-05, "loss": 2.5538, "step": 162170 }, { "epoch": 0.28, "learning_rate": 3.585887826672294e-05, "loss": 2.4415, "step": 162180 }, { "epoch": 0.28, "learning_rate": 3.585800632679611e-05, "loss": 2.4173, "step": 162190 }, { "epoch": 0.28, "learning_rate": 3.585713438686929e-05, "loss": 2.4297, "step": 162200 }, { "epoch": 0.28, "learning_rate": 3.585626244694246e-05, "loss": 2.3451, "step": 162210 }, { "epoch": 0.28, "learning_rate": 3.585539050701563e-05, "loss": 2.479, "step": 162220 }, { "epoch": 0.28, "learning_rate": 3.5854518567088805e-05, "loss": 2.4393, "step": 162230 }, { "epoch": 0.28, "learning_rate": 3.5853646627161975e-05, "loss": 2.4763, "step": 162240 }, { "epoch": 0.28, "learning_rate": 3.585277468723515e-05, "loss": 2.5125, "step": 162250 }, { "epoch": 0.28, "learning_rate": 3.585190274730832e-05, "loss": 2.595, "step": 162260 }, { "epoch": 0.28, "learning_rate": 3.58510308073815e-05, "loss": 2.4609, "step": 162270 }, { "epoch": 0.28, "learning_rate": 3.585015886745467e-05, "loss": 2.5116, "step": 162280 }, { "epoch": 0.28, "learning_rate": 3.584928692752784e-05, "loss": 2.4604, "step": 162290 }, { "epoch": 0.28, "learning_rate": 3.584841498760101e-05, "loss": 2.3033, "step": 162300 }, { "epoch": 0.28, "learning_rate": 3.584754304767419e-05, "loss": 2.575, "step": 162310 }, { "epoch": 0.28, "learning_rate": 3.5846671107747366e-05, "loss": 2.5025, "step": 162320 }, { "epoch": 0.28, "learning_rate": 3.5845799167820536e-05, "loss": 2.4327, "step": 162330 }, { "epoch": 0.28, "learning_rate": 3.584492722789371e-05, "loss": 2.5581, "step": 162340 }, { "epoch": 0.28, "learning_rate": 3.5844055287966884e-05, "loss": 2.5169, "step": 162350 }, { "epoch": 0.28, "learning_rate": 3.5843183348040054e-05, "loss": 2.485, "step": 162360 }, { "epoch": 0.28, "learning_rate": 3.5842311408113224e-05, "loss": 2.4712, "step": 162370 }, { "epoch": 0.28, "learning_rate": 3.58414394681864e-05, "loss": 2.4284, "step": 162380 }, { "epoch": 0.28, "learning_rate": 3.584056752825957e-05, "loss": 2.3953, "step": 162390 }, { "epoch": 0.28, "learning_rate": 3.583969558833275e-05, "loss": 2.4782, "step": 162400 }, { "epoch": 0.28, "learning_rate": 3.583882364840592e-05, "loss": 2.4561, "step": 162410 }, { "epoch": 0.28, "learning_rate": 3.5837951708479097e-05, "loss": 2.4739, "step": 162420 }, { "epoch": 0.28, "learning_rate": 3.583707976855227e-05, "loss": 2.4242, "step": 162430 }, { "epoch": 0.28, "learning_rate": 3.583620782862544e-05, "loss": 2.5245, "step": 162440 }, { "epoch": 0.28, "learning_rate": 3.5835335888698614e-05, "loss": 2.5443, "step": 162450 }, { "epoch": 0.28, "learning_rate": 3.5834463948771785e-05, "loss": 2.539, "step": 162460 }, { "epoch": 0.28, "learning_rate": 3.583359200884496e-05, "loss": 2.5217, "step": 162470 }, { "epoch": 0.28, "learning_rate": 3.583272006891813e-05, "loss": 2.3403, "step": 162480 }, { "epoch": 0.28, "learning_rate": 3.583184812899131e-05, "loss": 2.397, "step": 162490 }, { "epoch": 0.28, "learning_rate": 3.583097618906448e-05, "loss": 2.4368, "step": 162500 }, { "epoch": 0.28, "learning_rate": 3.583010424913765e-05, "loss": 2.5124, "step": 162510 }, { "epoch": 0.28, "learning_rate": 3.582923230921083e-05, "loss": 2.4834, "step": 162520 }, { "epoch": 0.28, "learning_rate": 3.5828360369284e-05, "loss": 2.3832, "step": 162530 }, { "epoch": 0.28, "learning_rate": 3.582748842935717e-05, "loss": 2.4137, "step": 162540 }, { "epoch": 0.28, "learning_rate": 3.5826616489430345e-05, "loss": 2.3535, "step": 162550 }, { "epoch": 0.28, "learning_rate": 3.582574454950352e-05, "loss": 2.4871, "step": 162560 }, { "epoch": 0.28, "learning_rate": 3.582487260957669e-05, "loss": 2.4627, "step": 162570 }, { "epoch": 0.28, "learning_rate": 3.582400066964986e-05, "loss": 2.3643, "step": 162580 }, { "epoch": 0.28, "learning_rate": 3.582312872972304e-05, "loss": 2.4921, "step": 162590 }, { "epoch": 0.28, "learning_rate": 3.582225678979621e-05, "loss": 2.4221, "step": 162600 }, { "epoch": 0.28, "learning_rate": 3.582138484986938e-05, "loss": 2.2779, "step": 162610 }, { "epoch": 0.28, "learning_rate": 3.582051290994256e-05, "loss": 2.4719, "step": 162620 }, { "epoch": 0.28, "learning_rate": 3.5819640970015736e-05, "loss": 2.4631, "step": 162630 }, { "epoch": 0.28, "learning_rate": 3.5818769030088906e-05, "loss": 2.5035, "step": 162640 }, { "epoch": 0.28, "learning_rate": 3.5817897090162076e-05, "loss": 2.4025, "step": 162650 }, { "epoch": 0.28, "learning_rate": 3.5817025150235253e-05, "loss": 2.3971, "step": 162660 }, { "epoch": 0.28, "learning_rate": 3.5816153210308424e-05, "loss": 2.4036, "step": 162670 }, { "epoch": 0.28, "learning_rate": 3.5815281270381594e-05, "loss": 2.401, "step": 162680 }, { "epoch": 0.28, "learning_rate": 3.581440933045477e-05, "loss": 2.4388, "step": 162690 }, { "epoch": 0.28, "learning_rate": 3.581353739052795e-05, "loss": 2.4638, "step": 162700 }, { "epoch": 0.28, "learning_rate": 3.581266545060112e-05, "loss": 2.527, "step": 162710 }, { "epoch": 0.28, "learning_rate": 3.581179351067429e-05, "loss": 2.5276, "step": 162720 }, { "epoch": 0.28, "learning_rate": 3.5810921570747466e-05, "loss": 2.5474, "step": 162730 }, { "epoch": 0.28, "learning_rate": 3.581004963082064e-05, "loss": 2.4129, "step": 162740 }, { "epoch": 0.28, "learning_rate": 3.580917769089381e-05, "loss": 2.4962, "step": 162750 }, { "epoch": 0.28, "learning_rate": 3.580830575096698e-05, "loss": 2.4513, "step": 162760 }, { "epoch": 0.28, "learning_rate": 3.580743381104016e-05, "loss": 2.5142, "step": 162770 }, { "epoch": 0.28, "learning_rate": 3.580656187111333e-05, "loss": 2.5034, "step": 162780 }, { "epoch": 0.28, "learning_rate": 3.58056899311865e-05, "loss": 2.5083, "step": 162790 }, { "epoch": 0.28, "learning_rate": 3.580481799125967e-05, "loss": 2.412, "step": 162800 }, { "epoch": 0.28, "learning_rate": 3.580394605133285e-05, "loss": 2.4903, "step": 162810 }, { "epoch": 0.28, "learning_rate": 3.580307411140602e-05, "loss": 2.5649, "step": 162820 }, { "epoch": 0.28, "learning_rate": 3.580220217147919e-05, "loss": 2.4464, "step": 162830 }, { "epoch": 0.28, "learning_rate": 3.5801330231552375e-05, "loss": 2.4823, "step": 162840 }, { "epoch": 0.28, "learning_rate": 3.5800458291625545e-05, "loss": 2.4688, "step": 162850 }, { "epoch": 0.28, "learning_rate": 3.5799586351698715e-05, "loss": 2.3645, "step": 162860 }, { "epoch": 0.28, "learning_rate": 3.5798714411771886e-05, "loss": 2.4538, "step": 162870 }, { "epoch": 0.28, "learning_rate": 3.579784247184506e-05, "loss": 2.4637, "step": 162880 }, { "epoch": 0.28, "learning_rate": 3.579697053191823e-05, "loss": 2.519, "step": 162890 }, { "epoch": 0.28, "learning_rate": 3.5796098591991404e-05, "loss": 2.515, "step": 162900 }, { "epoch": 0.28, "learning_rate": 3.579522665206458e-05, "loss": 2.3999, "step": 162910 }, { "epoch": 0.28, "learning_rate": 3.579435471213776e-05, "loss": 2.5164, "step": 162920 }, { "epoch": 0.28, "learning_rate": 3.579348277221093e-05, "loss": 2.3545, "step": 162930 }, { "epoch": 0.28, "learning_rate": 3.57926108322841e-05, "loss": 2.5532, "step": 162940 }, { "epoch": 0.28, "learning_rate": 3.5791738892357276e-05, "loss": 2.4029, "step": 162950 }, { "epoch": 0.28, "learning_rate": 3.5790866952430446e-05, "loss": 2.4644, "step": 162960 }, { "epoch": 0.28, "learning_rate": 3.578999501250362e-05, "loss": 2.4687, "step": 162970 }, { "epoch": 0.28, "learning_rate": 3.5789123072576794e-05, "loss": 2.5753, "step": 162980 }, { "epoch": 0.28, "learning_rate": 3.578825113264997e-05, "loss": 2.5615, "step": 162990 }, { "epoch": 0.28, "learning_rate": 3.578737919272314e-05, "loss": 2.4235, "step": 163000 }, { "epoch": 0.28, "learning_rate": 3.578650725279631e-05, "loss": 2.3957, "step": 163010 }, { "epoch": 0.28, "learning_rate": 3.578563531286949e-05, "loss": 2.6168, "step": 163020 }, { "epoch": 0.28, "learning_rate": 3.578476337294266e-05, "loss": 2.3729, "step": 163030 }, { "epoch": 0.28, "learning_rate": 3.578389143301583e-05, "loss": 2.6107, "step": 163040 }, { "epoch": 0.28, "learning_rate": 3.578301949308901e-05, "loss": 2.5027, "step": 163050 }, { "epoch": 0.28, "learning_rate": 3.578214755316218e-05, "loss": 2.4279, "step": 163060 }, { "epoch": 0.28, "learning_rate": 3.5781275613235354e-05, "loss": 2.5548, "step": 163070 }, { "epoch": 0.28, "learning_rate": 3.5780403673308525e-05, "loss": 2.3662, "step": 163080 }, { "epoch": 0.28, "learning_rate": 3.57795317333817e-05, "loss": 2.4031, "step": 163090 }, { "epoch": 0.28, "learning_rate": 3.577865979345487e-05, "loss": 2.4124, "step": 163100 }, { "epoch": 0.28, "learning_rate": 3.577778785352804e-05, "loss": 2.4811, "step": 163110 }, { "epoch": 0.28, "learning_rate": 3.577691591360122e-05, "loss": 2.4216, "step": 163120 }, { "epoch": 0.28, "learning_rate": 3.577604397367439e-05, "loss": 2.4655, "step": 163130 }, { "epoch": 0.28, "learning_rate": 3.577517203374757e-05, "loss": 2.4212, "step": 163140 }, { "epoch": 0.28, "learning_rate": 3.577430009382074e-05, "loss": 2.4961, "step": 163150 }, { "epoch": 0.28, "learning_rate": 3.5773428153893915e-05, "loss": 2.5018, "step": 163160 }, { "epoch": 0.28, "learning_rate": 3.5772556213967085e-05, "loss": 2.4043, "step": 163170 }, { "epoch": 0.28, "learning_rate": 3.5771684274040256e-05, "loss": 2.3424, "step": 163180 }, { "epoch": 0.28, "learning_rate": 3.5770812334113426e-05, "loss": 2.4613, "step": 163190 }, { "epoch": 0.28, "learning_rate": 3.57699403941866e-05, "loss": 2.5123, "step": 163200 }, { "epoch": 0.28, "learning_rate": 3.5769068454259774e-05, "loss": 2.5497, "step": 163210 }, { "epoch": 0.28, "learning_rate": 3.576819651433295e-05, "loss": 2.5294, "step": 163220 }, { "epoch": 0.28, "learning_rate": 3.576732457440613e-05, "loss": 2.3783, "step": 163230 }, { "epoch": 0.28, "learning_rate": 3.57664526344793e-05, "loss": 2.4957, "step": 163240 }, { "epoch": 0.28, "learning_rate": 3.576558069455247e-05, "loss": 2.4889, "step": 163250 }, { "epoch": 0.28, "learning_rate": 3.576470875462564e-05, "loss": 2.383, "step": 163260 }, { "epoch": 0.28, "learning_rate": 3.5763836814698816e-05, "loss": 2.3913, "step": 163270 }, { "epoch": 0.28, "learning_rate": 3.5762964874771987e-05, "loss": 2.3977, "step": 163280 }, { "epoch": 0.28, "learning_rate": 3.5762092934845164e-05, "loss": 2.4546, "step": 163290 }, { "epoch": 0.28, "learning_rate": 3.5761220994918334e-05, "loss": 2.5295, "step": 163300 }, { "epoch": 0.28, "learning_rate": 3.576034905499151e-05, "loss": 2.5171, "step": 163310 }, { "epoch": 0.28, "learning_rate": 3.575947711506468e-05, "loss": 2.443, "step": 163320 }, { "epoch": 0.28, "learning_rate": 3.575860517513785e-05, "loss": 2.4957, "step": 163330 }, { "epoch": 0.28, "learning_rate": 3.575773323521103e-05, "loss": 2.3504, "step": 163340 }, { "epoch": 0.28, "learning_rate": 3.57568612952842e-05, "loss": 2.49, "step": 163350 }, { "epoch": 0.28, "learning_rate": 3.575598935535738e-05, "loss": 2.4671, "step": 163360 }, { "epoch": 0.28, "learning_rate": 3.575511741543055e-05, "loss": 2.5163, "step": 163370 }, { "epoch": 0.28, "learning_rate": 3.5754245475503724e-05, "loss": 2.511, "step": 163380 }, { "epoch": 0.28, "learning_rate": 3.5753373535576895e-05, "loss": 2.4355, "step": 163390 }, { "epoch": 0.28, "learning_rate": 3.5752501595650065e-05, "loss": 2.3787, "step": 163400 }, { "epoch": 0.28, "learning_rate": 3.575162965572324e-05, "loss": 2.5262, "step": 163410 }, { "epoch": 0.28, "learning_rate": 3.575075771579641e-05, "loss": 2.4935, "step": 163420 }, { "epoch": 0.29, "learning_rate": 3.574988577586958e-05, "loss": 2.4503, "step": 163430 }, { "epoch": 0.29, "learning_rate": 3.574901383594276e-05, "loss": 2.3568, "step": 163440 }, { "epoch": 0.29, "learning_rate": 3.574814189601594e-05, "loss": 2.4373, "step": 163450 }, { "epoch": 0.29, "learning_rate": 3.574726995608911e-05, "loss": 2.4647, "step": 163460 }, { "epoch": 0.29, "learning_rate": 3.574639801616228e-05, "loss": 2.467, "step": 163470 }, { "epoch": 0.29, "learning_rate": 3.5745526076235455e-05, "loss": 2.4688, "step": 163480 }, { "epoch": 0.29, "learning_rate": 3.5744654136308626e-05, "loss": 2.5826, "step": 163490 }, { "epoch": 0.29, "learning_rate": 3.5743782196381796e-05, "loss": 2.4336, "step": 163500 }, { "epoch": 0.29, "learning_rate": 3.574291025645497e-05, "loss": 2.3839, "step": 163510 }, { "epoch": 0.29, "learning_rate": 3.574203831652815e-05, "loss": 2.4228, "step": 163520 }, { "epoch": 0.29, "learning_rate": 3.574116637660132e-05, "loss": 2.6131, "step": 163530 }, { "epoch": 0.29, "learning_rate": 3.574029443667449e-05, "loss": 2.38, "step": 163540 }, { "epoch": 0.29, "learning_rate": 3.573942249674767e-05, "loss": 2.5222, "step": 163550 }, { "epoch": 0.29, "learning_rate": 3.573855055682084e-05, "loss": 2.3964, "step": 163560 }, { "epoch": 0.29, "learning_rate": 3.573767861689401e-05, "loss": 2.5504, "step": 163570 }, { "epoch": 0.29, "learning_rate": 3.5736806676967186e-05, "loss": 2.3896, "step": 163580 }, { "epoch": 0.29, "learning_rate": 3.573593473704036e-05, "loss": 2.4043, "step": 163590 }, { "epoch": 0.29, "learning_rate": 3.5735062797113534e-05, "loss": 2.3889, "step": 163600 }, { "epoch": 0.29, "learning_rate": 3.5734190857186704e-05, "loss": 2.5412, "step": 163610 }, { "epoch": 0.29, "learning_rate": 3.573331891725988e-05, "loss": 2.484, "step": 163620 }, { "epoch": 0.29, "learning_rate": 3.573244697733305e-05, "loss": 2.5485, "step": 163630 }, { "epoch": 0.29, "learning_rate": 3.573157503740622e-05, "loss": 2.4472, "step": 163640 }, { "epoch": 0.29, "learning_rate": 3.573070309747939e-05, "loss": 2.4013, "step": 163650 }, { "epoch": 0.29, "learning_rate": 3.5729831157552576e-05, "loss": 2.5532, "step": 163660 }, { "epoch": 0.29, "learning_rate": 3.572895921762575e-05, "loss": 2.4734, "step": 163670 }, { "epoch": 0.29, "learning_rate": 3.572808727769892e-05, "loss": 2.381, "step": 163680 }, { "epoch": 0.29, "learning_rate": 3.5727215337772094e-05, "loss": 2.4884, "step": 163690 }, { "epoch": 0.29, "learning_rate": 3.5726343397845265e-05, "loss": 2.4463, "step": 163700 }, { "epoch": 0.29, "learning_rate": 3.5725471457918435e-05, "loss": 2.426, "step": 163710 }, { "epoch": 0.29, "learning_rate": 3.5724599517991605e-05, "loss": 2.4908, "step": 163720 }, { "epoch": 0.29, "learning_rate": 3.572372757806478e-05, "loss": 2.478, "step": 163730 }, { "epoch": 0.29, "learning_rate": 3.572285563813796e-05, "loss": 2.4896, "step": 163740 }, { "epoch": 0.29, "learning_rate": 3.572198369821113e-05, "loss": 2.3766, "step": 163750 }, { "epoch": 0.29, "learning_rate": 3.57211117582843e-05, "loss": 2.487, "step": 163760 }, { "epoch": 0.29, "learning_rate": 3.572023981835748e-05, "loss": 2.4702, "step": 163770 }, { "epoch": 0.29, "learning_rate": 3.571936787843065e-05, "loss": 2.4704, "step": 163780 }, { "epoch": 0.29, "learning_rate": 3.571849593850382e-05, "loss": 2.2693, "step": 163790 }, { "epoch": 0.29, "learning_rate": 3.5717623998576995e-05, "loss": 2.4605, "step": 163800 }, { "epoch": 0.29, "learning_rate": 3.571675205865017e-05, "loss": 2.5936, "step": 163810 }, { "epoch": 0.29, "learning_rate": 3.571588011872334e-05, "loss": 2.3992, "step": 163820 }, { "epoch": 0.29, "learning_rate": 3.5715008178796513e-05, "loss": 2.5256, "step": 163830 }, { "epoch": 0.29, "learning_rate": 3.571413623886969e-05, "loss": 2.4283, "step": 163840 }, { "epoch": 0.29, "learning_rate": 3.571326429894286e-05, "loss": 2.3965, "step": 163850 }, { "epoch": 0.29, "learning_rate": 3.571239235901603e-05, "loss": 2.3946, "step": 163860 }, { "epoch": 0.29, "learning_rate": 3.571152041908921e-05, "loss": 2.4976, "step": 163870 }, { "epoch": 0.29, "learning_rate": 3.5710648479162386e-05, "loss": 2.4436, "step": 163880 }, { "epoch": 0.29, "learning_rate": 3.5709776539235556e-05, "loss": 2.3958, "step": 163890 }, { "epoch": 0.29, "learning_rate": 3.5708904599308726e-05, "loss": 2.3972, "step": 163900 }, { "epoch": 0.29, "learning_rate": 3.5708032659381904e-05, "loss": 2.4612, "step": 163910 }, { "epoch": 0.29, "learning_rate": 3.5707160719455074e-05, "loss": 2.3444, "step": 163920 }, { "epoch": 0.29, "learning_rate": 3.5706288779528244e-05, "loss": 2.4478, "step": 163930 }, { "epoch": 0.29, "learning_rate": 3.570541683960142e-05, "loss": 2.4753, "step": 163940 }, { "epoch": 0.29, "learning_rate": 3.570454489967459e-05, "loss": 2.4726, "step": 163950 }, { "epoch": 0.29, "learning_rate": 3.570367295974777e-05, "loss": 2.3975, "step": 163960 }, { "epoch": 0.29, "learning_rate": 3.570280101982094e-05, "loss": 2.4568, "step": 163970 }, { "epoch": 0.29, "learning_rate": 3.5701929079894117e-05, "loss": 2.4907, "step": 163980 }, { "epoch": 0.29, "learning_rate": 3.570105713996729e-05, "loss": 2.4617, "step": 163990 }, { "epoch": 0.29, "learning_rate": 3.570018520004046e-05, "loss": 2.3885, "step": 164000 }, { "epoch": 0.29, "learning_rate": 3.5699313260113635e-05, "loss": 2.3687, "step": 164010 }, { "epoch": 0.29, "learning_rate": 3.5698441320186805e-05, "loss": 2.3566, "step": 164020 }, { "epoch": 0.29, "learning_rate": 3.569756938025998e-05, "loss": 2.4889, "step": 164030 }, { "epoch": 0.29, "learning_rate": 3.569669744033315e-05, "loss": 2.5355, "step": 164040 }, { "epoch": 0.29, "learning_rate": 3.569582550040633e-05, "loss": 2.4097, "step": 164050 }, { "epoch": 0.29, "learning_rate": 3.56949535604795e-05, "loss": 2.4413, "step": 164060 }, { "epoch": 0.29, "learning_rate": 3.569408162055267e-05, "loss": 2.5077, "step": 164070 }, { "epoch": 0.29, "learning_rate": 3.569320968062585e-05, "loss": 2.5464, "step": 164080 }, { "epoch": 0.29, "learning_rate": 3.569233774069902e-05, "loss": 2.5293, "step": 164090 }, { "epoch": 0.29, "learning_rate": 3.569146580077219e-05, "loss": 2.4624, "step": 164100 }, { "epoch": 0.29, "learning_rate": 3.5690593860845365e-05, "loss": 2.3749, "step": 164110 }, { "epoch": 0.29, "learning_rate": 3.568972192091854e-05, "loss": 2.4282, "step": 164120 }, { "epoch": 0.29, "learning_rate": 3.568884998099171e-05, "loss": 2.4281, "step": 164130 }, { "epoch": 0.29, "learning_rate": 3.568797804106488e-05, "loss": 2.394, "step": 164140 }, { "epoch": 0.29, "learning_rate": 3.5687106101138054e-05, "loss": 2.5526, "step": 164150 }, { "epoch": 0.29, "learning_rate": 3.568623416121123e-05, "loss": 2.4958, "step": 164160 }, { "epoch": 0.29, "learning_rate": 3.56853622212844e-05, "loss": 2.4447, "step": 164170 }, { "epoch": 0.29, "learning_rate": 3.568449028135758e-05, "loss": 2.3417, "step": 164180 }, { "epoch": 0.29, "learning_rate": 3.5683618341430756e-05, "loss": 2.4386, "step": 164190 }, { "epoch": 0.29, "learning_rate": 3.5682746401503926e-05, "loss": 2.5449, "step": 164200 }, { "epoch": 0.29, "learning_rate": 3.5681874461577096e-05, "loss": 2.4397, "step": 164210 }, { "epoch": 0.29, "learning_rate": 3.568100252165027e-05, "loss": 2.4285, "step": 164220 }, { "epoch": 0.29, "learning_rate": 3.5680130581723444e-05, "loss": 2.495, "step": 164230 }, { "epoch": 0.29, "learning_rate": 3.5679258641796614e-05, "loss": 2.424, "step": 164240 }, { "epoch": 0.29, "learning_rate": 3.5678386701869785e-05, "loss": 2.4263, "step": 164250 }, { "epoch": 0.29, "learning_rate": 3.567751476194296e-05, "loss": 2.4559, "step": 164260 }, { "epoch": 0.29, "learning_rate": 3.567664282201614e-05, "loss": 2.4739, "step": 164270 }, { "epoch": 0.29, "learning_rate": 3.567577088208931e-05, "loss": 2.2774, "step": 164280 }, { "epoch": 0.29, "learning_rate": 3.567489894216248e-05, "loss": 2.494, "step": 164290 }, { "epoch": 0.29, "learning_rate": 3.567402700223566e-05, "loss": 2.4299, "step": 164300 }, { "epoch": 0.29, "learning_rate": 3.567315506230883e-05, "loss": 2.3825, "step": 164310 }, { "epoch": 0.29, "learning_rate": 3.5672283122382e-05, "loss": 2.4311, "step": 164320 }, { "epoch": 0.29, "learning_rate": 3.5671411182455175e-05, "loss": 2.4683, "step": 164330 }, { "epoch": 0.29, "learning_rate": 3.567053924252835e-05, "loss": 2.4806, "step": 164340 }, { "epoch": 0.29, "learning_rate": 3.566966730260152e-05, "loss": 2.4548, "step": 164350 }, { "epoch": 0.29, "learning_rate": 3.566879536267469e-05, "loss": 2.544, "step": 164360 }, { "epoch": 0.29, "learning_rate": 3.566792342274787e-05, "loss": 2.3951, "step": 164370 }, { "epoch": 0.29, "learning_rate": 3.566705148282104e-05, "loss": 2.4092, "step": 164380 }, { "epoch": 0.29, "learning_rate": 3.566617954289421e-05, "loss": 2.4913, "step": 164390 }, { "epoch": 0.29, "learning_rate": 3.566530760296739e-05, "loss": 2.2802, "step": 164400 }, { "epoch": 0.29, "learning_rate": 3.5664435663040565e-05, "loss": 2.4012, "step": 164410 }, { "epoch": 0.29, "learning_rate": 3.5663563723113735e-05, "loss": 2.4172, "step": 164420 }, { "epoch": 0.29, "learning_rate": 3.5662691783186906e-05, "loss": 2.4683, "step": 164430 }, { "epoch": 0.29, "learning_rate": 3.566181984326008e-05, "loss": 2.4777, "step": 164440 }, { "epoch": 0.29, "learning_rate": 3.566094790333325e-05, "loss": 2.5168, "step": 164450 }, { "epoch": 0.29, "learning_rate": 3.5660075963406424e-05, "loss": 2.4752, "step": 164460 }, { "epoch": 0.29, "learning_rate": 3.56592040234796e-05, "loss": 2.4125, "step": 164470 }, { "epoch": 0.29, "learning_rate": 3.565833208355278e-05, "loss": 2.4447, "step": 164480 }, { "epoch": 0.29, "learning_rate": 3.565746014362595e-05, "loss": 2.3651, "step": 164490 }, { "epoch": 0.29, "learning_rate": 3.565658820369912e-05, "loss": 2.5025, "step": 164500 }, { "epoch": 0.29, "learning_rate": 3.5655716263772296e-05, "loss": 2.3765, "step": 164510 }, { "epoch": 0.29, "learning_rate": 3.5654844323845466e-05, "loss": 2.3971, "step": 164520 }, { "epoch": 0.29, "learning_rate": 3.565397238391864e-05, "loss": 2.4514, "step": 164530 }, { "epoch": 0.29, "learning_rate": 3.565310044399181e-05, "loss": 2.5132, "step": 164540 }, { "epoch": 0.29, "learning_rate": 3.565222850406499e-05, "loss": 2.4848, "step": 164550 }, { "epoch": 0.29, "learning_rate": 3.565135656413816e-05, "loss": 2.4414, "step": 164560 }, { "epoch": 0.29, "learning_rate": 3.565048462421133e-05, "loss": 2.4461, "step": 164570 }, { "epoch": 0.29, "learning_rate": 3.564961268428451e-05, "loss": 2.4283, "step": 164580 }, { "epoch": 0.29, "learning_rate": 3.564874074435768e-05, "loss": 2.4562, "step": 164590 }, { "epoch": 0.29, "learning_rate": 3.564786880443085e-05, "loss": 2.4519, "step": 164600 }, { "epoch": 0.29, "learning_rate": 3.564699686450402e-05, "loss": 2.393, "step": 164610 }, { "epoch": 0.29, "learning_rate": 3.56461249245772e-05, "loss": 2.4844, "step": 164620 }, { "epoch": 0.29, "learning_rate": 3.5645252984650374e-05, "loss": 2.3434, "step": 164630 }, { "epoch": 0.29, "learning_rate": 3.5644381044723545e-05, "loss": 2.5201, "step": 164640 }, { "epoch": 0.29, "learning_rate": 3.5643509104796715e-05, "loss": 2.4117, "step": 164650 }, { "epoch": 0.29, "learning_rate": 3.564263716486989e-05, "loss": 2.381, "step": 164660 }, { "epoch": 0.29, "learning_rate": 3.564176522494306e-05, "loss": 2.5044, "step": 164670 }, { "epoch": 0.29, "learning_rate": 3.564089328501623e-05, "loss": 2.5189, "step": 164680 }, { "epoch": 0.29, "learning_rate": 3.564002134508941e-05, "loss": 2.3945, "step": 164690 }, { "epoch": 0.29, "learning_rate": 3.563914940516259e-05, "loss": 2.4969, "step": 164700 }, { "epoch": 0.29, "learning_rate": 3.563827746523576e-05, "loss": 2.3678, "step": 164710 }, { "epoch": 0.29, "learning_rate": 3.563740552530893e-05, "loss": 2.4734, "step": 164720 }, { "epoch": 0.29, "learning_rate": 3.5636533585382105e-05, "loss": 2.4138, "step": 164730 }, { "epoch": 0.29, "learning_rate": 3.5635661645455276e-05, "loss": 2.5524, "step": 164740 }, { "epoch": 0.29, "learning_rate": 3.5634789705528446e-05, "loss": 2.4349, "step": 164750 }, { "epoch": 0.29, "learning_rate": 3.563391776560162e-05, "loss": 2.5142, "step": 164760 }, { "epoch": 0.29, "learning_rate": 3.5633045825674794e-05, "loss": 2.5149, "step": 164770 }, { "epoch": 0.29, "learning_rate": 3.563217388574797e-05, "loss": 2.3948, "step": 164780 }, { "epoch": 0.29, "learning_rate": 3.563130194582114e-05, "loss": 2.4952, "step": 164790 }, { "epoch": 0.29, "learning_rate": 3.563043000589432e-05, "loss": 2.3797, "step": 164800 }, { "epoch": 0.29, "learning_rate": 3.562955806596749e-05, "loss": 2.4534, "step": 164810 }, { "epoch": 0.29, "learning_rate": 3.562868612604066e-05, "loss": 2.5144, "step": 164820 }, { "epoch": 0.29, "learning_rate": 3.5627814186113836e-05, "loss": 2.4112, "step": 164830 }, { "epoch": 0.29, "learning_rate": 3.5626942246187007e-05, "loss": 2.4588, "step": 164840 }, { "epoch": 0.29, "learning_rate": 3.5626070306260184e-05, "loss": 2.4273, "step": 164850 }, { "epoch": 0.29, "learning_rate": 3.5625198366333354e-05, "loss": 2.4635, "step": 164860 }, { "epoch": 0.29, "learning_rate": 3.562432642640653e-05, "loss": 2.5639, "step": 164870 }, { "epoch": 0.29, "learning_rate": 3.56234544864797e-05, "loss": 2.4065, "step": 164880 }, { "epoch": 0.29, "learning_rate": 3.562258254655287e-05, "loss": 2.4314, "step": 164890 }, { "epoch": 0.29, "learning_rate": 3.562171060662605e-05, "loss": 2.4086, "step": 164900 }, { "epoch": 0.29, "learning_rate": 3.562083866669922e-05, "loss": 2.4424, "step": 164910 }, { "epoch": 0.29, "learning_rate": 3.561996672677239e-05, "loss": 2.4522, "step": 164920 }, { "epoch": 0.29, "learning_rate": 3.561909478684557e-05, "loss": 2.4733, "step": 164930 }, { "epoch": 0.29, "learning_rate": 3.5618222846918744e-05, "loss": 2.4848, "step": 164940 }, { "epoch": 0.29, "learning_rate": 3.5617350906991915e-05, "loss": 2.5818, "step": 164950 }, { "epoch": 0.29, "learning_rate": 3.5616478967065085e-05, "loss": 2.5364, "step": 164960 }, { "epoch": 0.29, "learning_rate": 3.561560702713826e-05, "loss": 2.4628, "step": 164970 }, { "epoch": 0.29, "learning_rate": 3.561473508721143e-05, "loss": 2.44, "step": 164980 }, { "epoch": 0.29, "learning_rate": 3.56138631472846e-05, "loss": 2.5132, "step": 164990 }, { "epoch": 0.29, "learning_rate": 3.561299120735778e-05, "loss": 2.4146, "step": 165000 }, { "epoch": 0.29, "learning_rate": 3.561211926743096e-05, "loss": 2.5654, "step": 165010 }, { "epoch": 0.29, "learning_rate": 3.561124732750413e-05, "loss": 2.4368, "step": 165020 }, { "epoch": 0.29, "learning_rate": 3.56103753875773e-05, "loss": 2.4794, "step": 165030 }, { "epoch": 0.29, "learning_rate": 3.5609503447650475e-05, "loss": 2.4145, "step": 165040 }, { "epoch": 0.29, "learning_rate": 3.5608631507723646e-05, "loss": 2.4795, "step": 165050 }, { "epoch": 0.29, "learning_rate": 3.5607759567796816e-05, "loss": 2.5096, "step": 165060 }, { "epoch": 0.29, "learning_rate": 3.5606887627869986e-05, "loss": 2.3871, "step": 165070 }, { "epoch": 0.29, "learning_rate": 3.560601568794317e-05, "loss": 2.4988, "step": 165080 }, { "epoch": 0.29, "learning_rate": 3.560514374801634e-05, "loss": 2.4883, "step": 165090 }, { "epoch": 0.29, "learning_rate": 3.560427180808951e-05, "loss": 2.5418, "step": 165100 }, { "epoch": 0.29, "learning_rate": 3.560339986816268e-05, "loss": 2.5093, "step": 165110 }, { "epoch": 0.29, "learning_rate": 3.560252792823586e-05, "loss": 2.5039, "step": 165120 }, { "epoch": 0.29, "learning_rate": 3.560165598830903e-05, "loss": 2.4575, "step": 165130 }, { "epoch": 0.29, "learning_rate": 3.56007840483822e-05, "loss": 2.3921, "step": 165140 }, { "epoch": 0.29, "learning_rate": 3.559991210845538e-05, "loss": 2.5532, "step": 165150 }, { "epoch": 0.29, "learning_rate": 3.5599040168528554e-05, "loss": 2.4609, "step": 165160 }, { "epoch": 0.29, "learning_rate": 3.5598168228601724e-05, "loss": 2.4985, "step": 165170 }, { "epoch": 0.29, "learning_rate": 3.5597296288674894e-05, "loss": 2.4029, "step": 165180 }, { "epoch": 0.29, "learning_rate": 3.559642434874807e-05, "loss": 2.451, "step": 165190 }, { "epoch": 0.29, "learning_rate": 3.559555240882124e-05, "loss": 2.4447, "step": 165200 }, { "epoch": 0.29, "learning_rate": 3.559468046889441e-05, "loss": 2.5557, "step": 165210 }, { "epoch": 0.29, "learning_rate": 3.559380852896759e-05, "loss": 2.4692, "step": 165220 }, { "epoch": 0.29, "learning_rate": 3.559293658904077e-05, "loss": 2.4048, "step": 165230 }, { "epoch": 0.29, "learning_rate": 3.559206464911394e-05, "loss": 2.5142, "step": 165240 }, { "epoch": 0.29, "learning_rate": 3.559119270918711e-05, "loss": 2.4792, "step": 165250 }, { "epoch": 0.29, "learning_rate": 3.5590320769260285e-05, "loss": 2.5196, "step": 165260 }, { "epoch": 0.29, "learning_rate": 3.5589448829333455e-05, "loss": 2.3687, "step": 165270 }, { "epoch": 0.29, "learning_rate": 3.5588576889406625e-05, "loss": 2.4878, "step": 165280 }, { "epoch": 0.29, "learning_rate": 3.55877049494798e-05, "loss": 2.5611, "step": 165290 }, { "epoch": 0.29, "learning_rate": 3.558683300955298e-05, "loss": 2.3713, "step": 165300 }, { "epoch": 0.29, "learning_rate": 3.558596106962615e-05, "loss": 2.4958, "step": 165310 }, { "epoch": 0.29, "learning_rate": 3.558508912969932e-05, "loss": 2.4929, "step": 165320 }, { "epoch": 0.29, "learning_rate": 3.55842171897725e-05, "loss": 2.5568, "step": 165330 }, { "epoch": 0.29, "learning_rate": 3.558334524984567e-05, "loss": 2.5188, "step": 165340 }, { "epoch": 0.29, "learning_rate": 3.558247330991884e-05, "loss": 2.489, "step": 165350 }, { "epoch": 0.29, "learning_rate": 3.5581601369992016e-05, "loss": 2.4606, "step": 165360 }, { "epoch": 0.29, "learning_rate": 3.558072943006519e-05, "loss": 2.5154, "step": 165370 }, { "epoch": 0.29, "learning_rate": 3.557985749013836e-05, "loss": 2.529, "step": 165380 }, { "epoch": 0.29, "learning_rate": 3.5578985550211533e-05, "loss": 2.4099, "step": 165390 }, { "epoch": 0.29, "learning_rate": 3.557811361028471e-05, "loss": 2.3799, "step": 165400 }, { "epoch": 0.29, "learning_rate": 3.557724167035788e-05, "loss": 2.4736, "step": 165410 }, { "epoch": 0.29, "learning_rate": 3.557636973043105e-05, "loss": 2.4705, "step": 165420 }, { "epoch": 0.29, "learning_rate": 3.557549779050423e-05, "loss": 2.4442, "step": 165430 }, { "epoch": 0.29, "learning_rate": 3.55746258505774e-05, "loss": 2.4921, "step": 165440 }, { "epoch": 0.29, "learning_rate": 3.5573753910650576e-05, "loss": 2.4556, "step": 165450 }, { "epoch": 0.29, "learning_rate": 3.5572881970723746e-05, "loss": 2.3888, "step": 165460 }, { "epoch": 0.29, "learning_rate": 3.5572010030796924e-05, "loss": 2.3655, "step": 165470 }, { "epoch": 0.29, "learning_rate": 3.5571138090870094e-05, "loss": 2.5085, "step": 165480 }, { "epoch": 0.29, "learning_rate": 3.5570266150943264e-05, "loss": 2.3582, "step": 165490 }, { "epoch": 0.29, "learning_rate": 3.5569394211016435e-05, "loss": 2.4073, "step": 165500 }, { "epoch": 0.29, "learning_rate": 3.556852227108961e-05, "loss": 2.5286, "step": 165510 }, { "epoch": 0.29, "learning_rate": 3.556765033116279e-05, "loss": 2.464, "step": 165520 }, { "epoch": 0.29, "learning_rate": 3.556677839123596e-05, "loss": 2.4177, "step": 165530 }, { "epoch": 0.29, "learning_rate": 3.5565906451309137e-05, "loss": 2.4397, "step": 165540 }, { "epoch": 0.29, "learning_rate": 3.556503451138231e-05, "loss": 2.4099, "step": 165550 }, { "epoch": 0.29, "learning_rate": 3.556416257145548e-05, "loss": 2.4783, "step": 165560 }, { "epoch": 0.29, "learning_rate": 3.556329063152865e-05, "loss": 2.5651, "step": 165570 }, { "epoch": 0.29, "learning_rate": 3.5562418691601825e-05, "loss": 2.5295, "step": 165580 }, { "epoch": 0.29, "learning_rate": 3.5561546751674995e-05, "loss": 2.474, "step": 165590 }, { "epoch": 0.29, "learning_rate": 3.556067481174817e-05, "loss": 2.4217, "step": 165600 }, { "epoch": 0.29, "learning_rate": 3.555980287182134e-05, "loss": 2.5536, "step": 165610 }, { "epoch": 0.29, "learning_rate": 3.555893093189452e-05, "loss": 2.3338, "step": 165620 }, { "epoch": 0.29, "learning_rate": 3.555805899196769e-05, "loss": 2.476, "step": 165630 }, { "epoch": 0.29, "learning_rate": 3.555718705204086e-05, "loss": 2.4061, "step": 165640 }, { "epoch": 0.29, "learning_rate": 3.555631511211404e-05, "loss": 2.4849, "step": 165650 }, { "epoch": 0.29, "learning_rate": 3.555544317218721e-05, "loss": 2.482, "step": 165660 }, { "epoch": 0.29, "learning_rate": 3.5554571232260385e-05, "loss": 2.5204, "step": 165670 }, { "epoch": 0.29, "learning_rate": 3.5553699292333556e-05, "loss": 2.4538, "step": 165680 }, { "epoch": 0.29, "learning_rate": 3.555282735240673e-05, "loss": 2.3613, "step": 165690 }, { "epoch": 0.29, "learning_rate": 3.55519554124799e-05, "loss": 2.4801, "step": 165700 }, { "epoch": 0.29, "learning_rate": 3.5551083472553074e-05, "loss": 2.4775, "step": 165710 }, { "epoch": 0.29, "learning_rate": 3.555021153262625e-05, "loss": 2.5998, "step": 165720 }, { "epoch": 0.29, "learning_rate": 3.554933959269942e-05, "loss": 2.5338, "step": 165730 }, { "epoch": 0.29, "learning_rate": 3.55484676527726e-05, "loss": 2.3647, "step": 165740 }, { "epoch": 0.29, "learning_rate": 3.554759571284577e-05, "loss": 2.4646, "step": 165750 }, { "epoch": 0.29, "learning_rate": 3.5546723772918946e-05, "loss": 2.5317, "step": 165760 }, { "epoch": 0.29, "learning_rate": 3.5545851832992116e-05, "loss": 2.4301, "step": 165770 }, { "epoch": 0.29, "learning_rate": 3.554497989306529e-05, "loss": 2.3837, "step": 165780 }, { "epoch": 0.29, "learning_rate": 3.5544107953138464e-05, "loss": 2.3855, "step": 165790 }, { "epoch": 0.29, "learning_rate": 3.5543236013211634e-05, "loss": 2.4639, "step": 165800 }, { "epoch": 0.29, "learning_rate": 3.5542364073284805e-05, "loss": 2.3749, "step": 165810 }, { "epoch": 0.29, "learning_rate": 3.554149213335798e-05, "loss": 2.4193, "step": 165820 }, { "epoch": 0.29, "learning_rate": 3.554062019343116e-05, "loss": 2.4932, "step": 165830 }, { "epoch": 0.29, "learning_rate": 3.553974825350433e-05, "loss": 2.5595, "step": 165840 }, { "epoch": 0.29, "learning_rate": 3.55388763135775e-05, "loss": 2.4528, "step": 165850 }, { "epoch": 0.29, "learning_rate": 3.553800437365068e-05, "loss": 2.46, "step": 165860 }, { "epoch": 0.29, "learning_rate": 3.553713243372385e-05, "loss": 2.5175, "step": 165870 }, { "epoch": 0.29, "learning_rate": 3.553626049379702e-05, "loss": 2.5066, "step": 165880 }, { "epoch": 0.29, "learning_rate": 3.5535388553870195e-05, "loss": 2.4617, "step": 165890 }, { "epoch": 0.29, "learning_rate": 3.553451661394337e-05, "loss": 2.4986, "step": 165900 }, { "epoch": 0.29, "learning_rate": 3.553364467401654e-05, "loss": 2.5352, "step": 165910 }, { "epoch": 0.29, "learning_rate": 3.553277273408971e-05, "loss": 2.5039, "step": 165920 }, { "epoch": 0.29, "learning_rate": 3.553190079416289e-05, "loss": 2.4456, "step": 165930 }, { "epoch": 0.29, "learning_rate": 3.553102885423606e-05, "loss": 2.4385, "step": 165940 }, { "epoch": 0.29, "learning_rate": 3.553015691430923e-05, "loss": 2.5003, "step": 165950 }, { "epoch": 0.29, "learning_rate": 3.55292849743824e-05, "loss": 2.4418, "step": 165960 }, { "epoch": 0.29, "learning_rate": 3.5528413034455585e-05, "loss": 2.4694, "step": 165970 }, { "epoch": 0.29, "learning_rate": 3.5527541094528755e-05, "loss": 2.4026, "step": 165980 }, { "epoch": 0.29, "learning_rate": 3.5526669154601926e-05, "loss": 2.4127, "step": 165990 }, { "epoch": 0.29, "learning_rate": 3.5525797214675096e-05, "loss": 2.4963, "step": 166000 }, { "epoch": 0.29, "learning_rate": 3.552492527474827e-05, "loss": 2.4053, "step": 166010 }, { "epoch": 0.29, "learning_rate": 3.5524053334821444e-05, "loss": 2.4972, "step": 166020 }, { "epoch": 0.29, "learning_rate": 3.5523181394894614e-05, "loss": 2.4792, "step": 166030 }, { "epoch": 0.29, "learning_rate": 3.55223094549678e-05, "loss": 2.502, "step": 166040 }, { "epoch": 0.29, "learning_rate": 3.552143751504097e-05, "loss": 2.4581, "step": 166050 }, { "epoch": 0.29, "learning_rate": 3.552056557511414e-05, "loss": 2.4615, "step": 166060 }, { "epoch": 0.29, "learning_rate": 3.551969363518731e-05, "loss": 2.4633, "step": 166070 }, { "epoch": 0.29, "learning_rate": 3.5518821695260486e-05, "loss": 2.528, "step": 166080 }, { "epoch": 0.29, "learning_rate": 3.551794975533366e-05, "loss": 2.4119, "step": 166090 }, { "epoch": 0.29, "learning_rate": 3.551707781540683e-05, "loss": 2.4505, "step": 166100 }, { "epoch": 0.29, "learning_rate": 3.5516205875480004e-05, "loss": 2.3717, "step": 166110 }, { "epoch": 0.29, "learning_rate": 3.551533393555318e-05, "loss": 2.4343, "step": 166120 }, { "epoch": 0.29, "learning_rate": 3.551446199562635e-05, "loss": 2.4637, "step": 166130 }, { "epoch": 0.29, "learning_rate": 3.551359005569952e-05, "loss": 2.5498, "step": 166140 }, { "epoch": 0.29, "learning_rate": 3.55127181157727e-05, "loss": 2.495, "step": 166150 }, { "epoch": 0.29, "learning_rate": 3.551184617584587e-05, "loss": 2.4986, "step": 166160 }, { "epoch": 0.29, "learning_rate": 3.551097423591904e-05, "loss": 2.4281, "step": 166170 }, { "epoch": 0.29, "learning_rate": 3.551010229599222e-05, "loss": 2.4873, "step": 166180 }, { "epoch": 0.29, "learning_rate": 3.5509230356065394e-05, "loss": 2.5315, "step": 166190 }, { "epoch": 0.29, "learning_rate": 3.5508358416138565e-05, "loss": 2.5263, "step": 166200 }, { "epoch": 0.29, "learning_rate": 3.5507486476211735e-05, "loss": 2.5171, "step": 166210 }, { "epoch": 0.29, "learning_rate": 3.550661453628491e-05, "loss": 2.408, "step": 166220 }, { "epoch": 0.29, "learning_rate": 3.550574259635808e-05, "loss": 2.3325, "step": 166230 }, { "epoch": 0.29, "learning_rate": 3.550487065643125e-05, "loss": 2.5064, "step": 166240 }, { "epoch": 0.29, "learning_rate": 3.550399871650443e-05, "loss": 2.531, "step": 166250 }, { "epoch": 0.29, "learning_rate": 3.55031267765776e-05, "loss": 2.4481, "step": 166260 }, { "epoch": 0.29, "learning_rate": 3.550225483665078e-05, "loss": 2.6393, "step": 166270 }, { "epoch": 0.29, "learning_rate": 3.550138289672395e-05, "loss": 2.3866, "step": 166280 }, { "epoch": 0.29, "learning_rate": 3.5500510956797125e-05, "loss": 2.4442, "step": 166290 }, { "epoch": 0.29, "learning_rate": 3.5499639016870296e-05, "loss": 2.3262, "step": 166300 }, { "epoch": 0.29, "learning_rate": 3.5498767076943466e-05, "loss": 2.3473, "step": 166310 }, { "epoch": 0.29, "learning_rate": 3.549789513701664e-05, "loss": 2.4574, "step": 166320 }, { "epoch": 0.29, "learning_rate": 3.5497023197089814e-05, "loss": 2.4369, "step": 166330 }, { "epoch": 0.29, "learning_rate": 3.549615125716299e-05, "loss": 2.4616, "step": 166340 }, { "epoch": 0.29, "learning_rate": 3.549527931723616e-05, "loss": 2.5159, "step": 166350 }, { "epoch": 0.29, "learning_rate": 3.549440737730934e-05, "loss": 2.2647, "step": 166360 }, { "epoch": 0.29, "learning_rate": 3.549353543738251e-05, "loss": 2.5083, "step": 166370 }, { "epoch": 0.29, "learning_rate": 3.549266349745568e-05, "loss": 2.4601, "step": 166380 }, { "epoch": 0.29, "learning_rate": 3.5491791557528856e-05, "loss": 2.4143, "step": 166390 }, { "epoch": 0.29, "learning_rate": 3.5490919617602027e-05, "loss": 2.3872, "step": 166400 }, { "epoch": 0.29, "learning_rate": 3.5490047677675204e-05, "loss": 2.4757, "step": 166410 }, { "epoch": 0.29, "learning_rate": 3.5489175737748374e-05, "loss": 2.426, "step": 166420 }, { "epoch": 0.29, "learning_rate": 3.548830379782155e-05, "loss": 2.4325, "step": 166430 }, { "epoch": 0.29, "learning_rate": 3.548743185789472e-05, "loss": 2.5182, "step": 166440 }, { "epoch": 0.29, "learning_rate": 3.548655991796789e-05, "loss": 2.4776, "step": 166450 }, { "epoch": 0.29, "learning_rate": 3.548568797804106e-05, "loss": 2.4819, "step": 166460 }, { "epoch": 0.29, "learning_rate": 3.548481603811424e-05, "loss": 2.4571, "step": 166470 }, { "epoch": 0.29, "learning_rate": 3.548394409818741e-05, "loss": 2.4906, "step": 166480 }, { "epoch": 0.29, "learning_rate": 3.548307215826059e-05, "loss": 2.3059, "step": 166490 }, { "epoch": 0.29, "learning_rate": 3.5482200218333764e-05, "loss": 2.5139, "step": 166500 }, { "epoch": 0.29, "learning_rate": 3.5481328278406935e-05, "loss": 2.4645, "step": 166510 }, { "epoch": 0.29, "learning_rate": 3.5480456338480105e-05, "loss": 2.4584, "step": 166520 }, { "epoch": 0.29, "learning_rate": 3.5479584398553275e-05, "loss": 2.5249, "step": 166530 }, { "epoch": 0.29, "learning_rate": 3.547871245862645e-05, "loss": 2.3972, "step": 166540 }, { "epoch": 0.29, "learning_rate": 3.547784051869962e-05, "loss": 2.5353, "step": 166550 }, { "epoch": 0.29, "learning_rate": 3.54769685787728e-05, "loss": 2.4966, "step": 166560 }, { "epoch": 0.29, "learning_rate": 3.547609663884597e-05, "loss": 2.5684, "step": 166570 }, { "epoch": 0.29, "learning_rate": 3.547522469891915e-05, "loss": 2.477, "step": 166580 }, { "epoch": 0.29, "learning_rate": 3.547435275899232e-05, "loss": 2.3517, "step": 166590 }, { "epoch": 0.29, "learning_rate": 3.547348081906549e-05, "loss": 2.3799, "step": 166600 }, { "epoch": 0.29, "learning_rate": 3.5472608879138666e-05, "loss": 2.5365, "step": 166610 }, { "epoch": 0.29, "learning_rate": 3.5471736939211836e-05, "loss": 2.448, "step": 166620 }, { "epoch": 0.29, "learning_rate": 3.5470864999285006e-05, "loss": 2.4269, "step": 166630 }, { "epoch": 0.29, "learning_rate": 3.5469993059358184e-05, "loss": 2.5941, "step": 166640 }, { "epoch": 0.29, "learning_rate": 3.546912111943136e-05, "loss": 2.466, "step": 166650 }, { "epoch": 0.29, "learning_rate": 3.546824917950453e-05, "loss": 2.3849, "step": 166660 }, { "epoch": 0.29, "learning_rate": 3.54673772395777e-05, "loss": 2.4722, "step": 166670 }, { "epoch": 0.29, "learning_rate": 3.546650529965088e-05, "loss": 2.534, "step": 166680 }, { "epoch": 0.29, "learning_rate": 3.546563335972405e-05, "loss": 2.551, "step": 166690 }, { "epoch": 0.29, "learning_rate": 3.546476141979722e-05, "loss": 2.3644, "step": 166700 }, { "epoch": 0.29, "learning_rate": 3.5463889479870397e-05, "loss": 2.3399, "step": 166710 }, { "epoch": 0.29, "learning_rate": 3.5463017539943574e-05, "loss": 2.4451, "step": 166720 }, { "epoch": 0.29, "learning_rate": 3.5462145600016744e-05, "loss": 2.4629, "step": 166730 }, { "epoch": 0.29, "learning_rate": 3.5461273660089914e-05, "loss": 2.4476, "step": 166740 }, { "epoch": 0.29, "learning_rate": 3.546040172016309e-05, "loss": 2.3844, "step": 166750 }, { "epoch": 0.29, "learning_rate": 3.545952978023626e-05, "loss": 2.4374, "step": 166760 }, { "epoch": 0.29, "learning_rate": 3.545865784030943e-05, "loss": 2.6131, "step": 166770 }, { "epoch": 0.29, "learning_rate": 3.545778590038261e-05, "loss": 2.4787, "step": 166780 }, { "epoch": 0.29, "learning_rate": 3.545691396045579e-05, "loss": 2.4375, "step": 166790 }, { "epoch": 0.29, "learning_rate": 3.545604202052896e-05, "loss": 2.4365, "step": 166800 }, { "epoch": 0.29, "learning_rate": 3.545517008060213e-05, "loss": 2.5628, "step": 166810 }, { "epoch": 0.29, "learning_rate": 3.5454298140675305e-05, "loss": 2.4755, "step": 166820 }, { "epoch": 0.29, "learning_rate": 3.5453426200748475e-05, "loss": 2.4974, "step": 166830 }, { "epoch": 0.29, "learning_rate": 3.5452554260821645e-05, "loss": 2.5527, "step": 166840 }, { "epoch": 0.29, "learning_rate": 3.5451682320894816e-05, "loss": 2.554, "step": 166850 }, { "epoch": 0.29, "learning_rate": 3.5450810380968e-05, "loss": 2.4496, "step": 166860 }, { "epoch": 0.29, "learning_rate": 3.544993844104117e-05, "loss": 2.4068, "step": 166870 }, { "epoch": 0.29, "learning_rate": 3.544906650111434e-05, "loss": 2.3906, "step": 166880 }, { "epoch": 0.29, "learning_rate": 3.544819456118752e-05, "loss": 2.4405, "step": 166890 }, { "epoch": 0.29, "learning_rate": 3.544732262126069e-05, "loss": 2.4183, "step": 166900 }, { "epoch": 0.29, "learning_rate": 3.544645068133386e-05, "loss": 2.4636, "step": 166910 }, { "epoch": 0.29, "learning_rate": 3.544557874140703e-05, "loss": 2.3897, "step": 166920 }, { "epoch": 0.29, "learning_rate": 3.5444706801480206e-05, "loss": 2.4287, "step": 166930 }, { "epoch": 0.29, "learning_rate": 3.544383486155338e-05, "loss": 2.5287, "step": 166940 }, { "epoch": 0.29, "learning_rate": 3.5442962921626553e-05, "loss": 2.5049, "step": 166950 }, { "epoch": 0.29, "learning_rate": 3.5442090981699724e-05, "loss": 2.4281, "step": 166960 }, { "epoch": 0.29, "learning_rate": 3.54412190417729e-05, "loss": 2.4498, "step": 166970 }, { "epoch": 0.29, "learning_rate": 3.544034710184607e-05, "loss": 2.3228, "step": 166980 }, { "epoch": 0.29, "learning_rate": 3.543947516191924e-05, "loss": 2.4957, "step": 166990 }, { "epoch": 0.29, "learning_rate": 3.543860322199242e-05, "loss": 2.5492, "step": 167000 }, { "epoch": 0.29, "learning_rate": 3.5437731282065596e-05, "loss": 2.5168, "step": 167010 }, { "epoch": 0.29, "learning_rate": 3.5436859342138766e-05, "loss": 2.5529, "step": 167020 }, { "epoch": 0.29, "learning_rate": 3.543598740221194e-05, "loss": 2.4013, "step": 167030 }, { "epoch": 0.29, "learning_rate": 3.5435115462285114e-05, "loss": 2.367, "step": 167040 }, { "epoch": 0.29, "learning_rate": 3.5434243522358284e-05, "loss": 2.5402, "step": 167050 }, { "epoch": 0.29, "learning_rate": 3.5433371582431455e-05, "loss": 2.5249, "step": 167060 }, { "epoch": 0.29, "learning_rate": 3.543249964250463e-05, "loss": 2.3472, "step": 167070 }, { "epoch": 0.29, "learning_rate": 3.543162770257781e-05, "loss": 2.3929, "step": 167080 }, { "epoch": 0.29, "learning_rate": 3.543075576265098e-05, "loss": 2.5685, "step": 167090 }, { "epoch": 0.29, "learning_rate": 3.542988382272415e-05, "loss": 2.3922, "step": 167100 }, { "epoch": 0.29, "learning_rate": 3.542901188279733e-05, "loss": 2.4528, "step": 167110 }, { "epoch": 0.29, "learning_rate": 3.54281399428705e-05, "loss": 2.4981, "step": 167120 }, { "epoch": 0.29, "learning_rate": 3.542726800294367e-05, "loss": 2.4471, "step": 167130 }, { "epoch": 0.29, "learning_rate": 3.5426396063016845e-05, "loss": 2.4437, "step": 167140 }, { "epoch": 0.29, "learning_rate": 3.5425524123090015e-05, "loss": 2.3641, "step": 167150 }, { "epoch": 0.29, "learning_rate": 3.542465218316319e-05, "loss": 2.4525, "step": 167160 }, { "epoch": 0.29, "learning_rate": 3.542378024323636e-05, "loss": 2.3183, "step": 167170 }, { "epoch": 0.29, "learning_rate": 3.542290830330954e-05, "loss": 2.5476, "step": 167180 }, { "epoch": 0.29, "learning_rate": 3.542203636338271e-05, "loss": 2.4978, "step": 167190 }, { "epoch": 0.29, "learning_rate": 3.542116442345588e-05, "loss": 2.5051, "step": 167200 }, { "epoch": 0.29, "learning_rate": 3.542029248352906e-05, "loss": 2.5498, "step": 167210 }, { "epoch": 0.29, "learning_rate": 3.541942054360223e-05, "loss": 2.3269, "step": 167220 }, { "epoch": 0.29, "learning_rate": 3.5418548603675405e-05, "loss": 2.4043, "step": 167230 }, { "epoch": 0.29, "learning_rate": 3.5417676663748576e-05, "loss": 2.4945, "step": 167240 }, { "epoch": 0.29, "learning_rate": 3.541680472382175e-05, "loss": 2.4872, "step": 167250 }, { "epoch": 0.29, "learning_rate": 3.541593278389492e-05, "loss": 2.4399, "step": 167260 }, { "epoch": 0.29, "learning_rate": 3.5415060843968094e-05, "loss": 2.4093, "step": 167270 }, { "epoch": 0.29, "learning_rate": 3.541418890404127e-05, "loss": 2.5422, "step": 167280 }, { "epoch": 0.29, "learning_rate": 3.541331696411444e-05, "loss": 2.4887, "step": 167290 }, { "epoch": 0.29, "learning_rate": 3.541244502418761e-05, "loss": 2.4559, "step": 167300 }, { "epoch": 0.29, "learning_rate": 3.541157308426079e-05, "loss": 2.4926, "step": 167310 }, { "epoch": 0.29, "learning_rate": 3.5410701144333966e-05, "loss": 2.5435, "step": 167320 }, { "epoch": 0.29, "learning_rate": 3.5409829204407136e-05, "loss": 2.5389, "step": 167330 }, { "epoch": 0.29, "learning_rate": 3.540895726448031e-05, "loss": 2.4541, "step": 167340 }, { "epoch": 0.29, "learning_rate": 3.540808532455348e-05, "loss": 2.3828, "step": 167350 }, { "epoch": 0.29, "learning_rate": 3.5407213384626654e-05, "loss": 2.4292, "step": 167360 }, { "epoch": 0.29, "learning_rate": 3.5406341444699825e-05, "loss": 2.4625, "step": 167370 }, { "epoch": 0.29, "learning_rate": 3.5405469504773e-05, "loss": 2.408, "step": 167380 }, { "epoch": 0.29, "learning_rate": 3.540459756484618e-05, "loss": 2.5149, "step": 167390 }, { "epoch": 0.29, "learning_rate": 3.540372562491935e-05, "loss": 2.4246, "step": 167400 }, { "epoch": 0.29, "learning_rate": 3.540285368499252e-05, "loss": 2.513, "step": 167410 }, { "epoch": 0.29, "learning_rate": 3.540198174506569e-05, "loss": 2.4599, "step": 167420 }, { "epoch": 0.29, "learning_rate": 3.540110980513887e-05, "loss": 2.5593, "step": 167430 }, { "epoch": 0.29, "learning_rate": 3.540023786521204e-05, "loss": 2.4391, "step": 167440 }, { "epoch": 0.29, "learning_rate": 3.539936592528521e-05, "loss": 2.3684, "step": 167450 }, { "epoch": 0.29, "learning_rate": 3.5398493985358385e-05, "loss": 2.4891, "step": 167460 }, { "epoch": 0.29, "learning_rate": 3.539762204543156e-05, "loss": 2.3801, "step": 167470 }, { "epoch": 0.29, "learning_rate": 3.539675010550473e-05, "loss": 2.4378, "step": 167480 }, { "epoch": 0.29, "learning_rate": 3.53958781655779e-05, "loss": 2.5027, "step": 167490 }, { "epoch": 0.29, "learning_rate": 3.539500622565108e-05, "loss": 2.5005, "step": 167500 }, { "epoch": 0.29, "learning_rate": 3.539413428572425e-05, "loss": 2.5704, "step": 167510 }, { "epoch": 0.29, "learning_rate": 3.539326234579742e-05, "loss": 2.4681, "step": 167520 }, { "epoch": 0.29, "learning_rate": 3.53923904058706e-05, "loss": 2.4243, "step": 167530 }, { "epoch": 0.29, "learning_rate": 3.5391518465943775e-05, "loss": 2.5039, "step": 167540 }, { "epoch": 0.29, "learning_rate": 3.5390646526016946e-05, "loss": 2.5044, "step": 167550 }, { "epoch": 0.29, "learning_rate": 3.5389774586090116e-05, "loss": 2.3394, "step": 167560 }, { "epoch": 0.29, "learning_rate": 3.538890264616329e-05, "loss": 2.6213, "step": 167570 }, { "epoch": 0.29, "learning_rate": 3.5388030706236464e-05, "loss": 2.3932, "step": 167580 }, { "epoch": 0.29, "learning_rate": 3.5387158766309634e-05, "loss": 2.4945, "step": 167590 }, { "epoch": 0.29, "learning_rate": 3.538628682638281e-05, "loss": 2.3556, "step": 167600 }, { "epoch": 0.29, "learning_rate": 3.538541488645599e-05, "loss": 2.3652, "step": 167610 }, { "epoch": 0.29, "learning_rate": 3.538454294652916e-05, "loss": 2.4347, "step": 167620 }, { "epoch": 0.29, "learning_rate": 3.538367100660233e-05, "loss": 2.5093, "step": 167630 }, { "epoch": 0.29, "learning_rate": 3.5382799066675506e-05, "loss": 2.4627, "step": 167640 }, { "epoch": 0.29, "learning_rate": 3.538192712674868e-05, "loss": 2.4024, "step": 167650 }, { "epoch": 0.29, "learning_rate": 3.538105518682185e-05, "loss": 2.5644, "step": 167660 }, { "epoch": 0.29, "learning_rate": 3.5380183246895024e-05, "loss": 2.3824, "step": 167670 }, { "epoch": 0.29, "learning_rate": 3.53793113069682e-05, "loss": 2.484, "step": 167680 }, { "epoch": 0.29, "learning_rate": 3.537843936704137e-05, "loss": 2.4867, "step": 167690 }, { "epoch": 0.29, "learning_rate": 3.537756742711454e-05, "loss": 2.3815, "step": 167700 }, { "epoch": 0.29, "learning_rate": 3.537669548718772e-05, "loss": 2.4159, "step": 167710 }, { "epoch": 0.29, "learning_rate": 3.537582354726089e-05, "loss": 2.4514, "step": 167720 }, { "epoch": 0.29, "learning_rate": 3.537495160733406e-05, "loss": 2.4168, "step": 167730 }, { "epoch": 0.29, "learning_rate": 3.537407966740724e-05, "loss": 2.516, "step": 167740 }, { "epoch": 0.29, "learning_rate": 3.5373207727480414e-05, "loss": 2.4593, "step": 167750 }, { "epoch": 0.29, "learning_rate": 3.5372335787553585e-05, "loss": 2.4126, "step": 167760 }, { "epoch": 0.29, "learning_rate": 3.5371463847626755e-05, "loss": 2.5254, "step": 167770 }, { "epoch": 0.29, "learning_rate": 3.537059190769993e-05, "loss": 2.4948, "step": 167780 }, { "epoch": 0.29, "learning_rate": 3.53697199677731e-05, "loss": 2.4072, "step": 167790 }, { "epoch": 0.29, "learning_rate": 3.536884802784627e-05, "loss": 2.4212, "step": 167800 }, { "epoch": 0.29, "learning_rate": 3.5367976087919443e-05, "loss": 2.5912, "step": 167810 }, { "epoch": 0.29, "learning_rate": 3.536710414799262e-05, "loss": 2.4645, "step": 167820 }, { "epoch": 0.29, "learning_rate": 3.53662322080658e-05, "loss": 2.4082, "step": 167830 }, { "epoch": 0.29, "learning_rate": 3.536536026813897e-05, "loss": 2.3787, "step": 167840 }, { "epoch": 0.29, "learning_rate": 3.5364488328212145e-05, "loss": 2.5597, "step": 167850 }, { "epoch": 0.29, "learning_rate": 3.5363616388285316e-05, "loss": 2.3858, "step": 167860 }, { "epoch": 0.29, "learning_rate": 3.5362744448358486e-05, "loss": 2.4648, "step": 167870 }, { "epoch": 0.29, "learning_rate": 3.5361872508431656e-05, "loss": 2.3653, "step": 167880 }, { "epoch": 0.29, "learning_rate": 3.5361000568504834e-05, "loss": 2.309, "step": 167890 }, { "epoch": 0.29, "learning_rate": 3.536012862857801e-05, "loss": 2.5142, "step": 167900 }, { "epoch": 0.29, "learning_rate": 3.535925668865118e-05, "loss": 2.5591, "step": 167910 }, { "epoch": 0.29, "learning_rate": 3.535838474872435e-05, "loss": 2.5658, "step": 167920 }, { "epoch": 0.29, "learning_rate": 3.535751280879753e-05, "loss": 2.4736, "step": 167930 }, { "epoch": 0.29, "learning_rate": 3.53566408688707e-05, "loss": 2.4847, "step": 167940 }, { "epoch": 0.29, "learning_rate": 3.535576892894387e-05, "loss": 2.4867, "step": 167950 }, { "epoch": 0.29, "learning_rate": 3.535489698901705e-05, "loss": 2.5061, "step": 167960 }, { "epoch": 0.29, "learning_rate": 3.535402504909022e-05, "loss": 2.4292, "step": 167970 }, { "epoch": 0.29, "learning_rate": 3.5353153109163394e-05, "loss": 2.4158, "step": 167980 }, { "epoch": 0.29, "learning_rate": 3.5352281169236565e-05, "loss": 2.3662, "step": 167990 }, { "epoch": 0.29, "learning_rate": 3.535140922930974e-05, "loss": 2.3809, "step": 168000 }, { "epoch": 0.29, "learning_rate": 3.535053728938291e-05, "loss": 2.4851, "step": 168010 }, { "epoch": 0.29, "learning_rate": 3.534966534945608e-05, "loss": 2.5539, "step": 168020 }, { "epoch": 0.29, "learning_rate": 3.534879340952926e-05, "loss": 2.4808, "step": 168030 }, { "epoch": 0.29, "learning_rate": 3.534792146960243e-05, "loss": 2.4078, "step": 168040 }, { "epoch": 0.29, "learning_rate": 3.534704952967561e-05, "loss": 2.4229, "step": 168050 }, { "epoch": 0.29, "learning_rate": 3.534617758974878e-05, "loss": 2.5643, "step": 168060 }, { "epoch": 0.29, "learning_rate": 3.5345305649821955e-05, "loss": 2.4597, "step": 168070 }, { "epoch": 0.29, "learning_rate": 3.5344433709895125e-05, "loss": 2.4128, "step": 168080 }, { "epoch": 0.29, "learning_rate": 3.5343561769968295e-05, "loss": 2.4249, "step": 168090 }, { "epoch": 0.29, "learning_rate": 3.534268983004147e-05, "loss": 2.4253, "step": 168100 }, { "epoch": 0.29, "learning_rate": 3.534181789011464e-05, "loss": 2.4292, "step": 168110 }, { "epoch": 0.29, "learning_rate": 3.534094595018781e-05, "loss": 2.3837, "step": 168120 }, { "epoch": 0.29, "learning_rate": 3.534007401026099e-05, "loss": 2.4647, "step": 168130 }, { "epoch": 0.29, "learning_rate": 3.533920207033417e-05, "loss": 2.3561, "step": 168140 }, { "epoch": 0.29, "learning_rate": 3.533833013040734e-05, "loss": 2.4867, "step": 168150 }, { "epoch": 0.29, "learning_rate": 3.533745819048051e-05, "loss": 2.4032, "step": 168160 }, { "epoch": 0.29, "learning_rate": 3.5336586250553686e-05, "loss": 2.5519, "step": 168170 }, { "epoch": 0.29, "learning_rate": 3.5335714310626856e-05, "loss": 2.3794, "step": 168180 }, { "epoch": 0.29, "learning_rate": 3.5334842370700026e-05, "loss": 2.3873, "step": 168190 }, { "epoch": 0.29, "learning_rate": 3.5333970430773204e-05, "loss": 2.427, "step": 168200 }, { "epoch": 0.29, "learning_rate": 3.533309849084638e-05, "loss": 2.3977, "step": 168210 }, { "epoch": 0.29, "learning_rate": 3.533222655091955e-05, "loss": 2.4215, "step": 168220 }, { "epoch": 0.29, "learning_rate": 3.533135461099272e-05, "loss": 2.4187, "step": 168230 }, { "epoch": 0.29, "learning_rate": 3.53304826710659e-05, "loss": 2.5239, "step": 168240 }, { "epoch": 0.29, "learning_rate": 3.532961073113907e-05, "loss": 2.4903, "step": 168250 }, { "epoch": 0.29, "learning_rate": 3.532873879121224e-05, "loss": 2.4396, "step": 168260 }, { "epoch": 0.29, "learning_rate": 3.5327866851285417e-05, "loss": 2.4269, "step": 168270 }, { "epoch": 0.29, "learning_rate": 3.5326994911358594e-05, "loss": 2.5431, "step": 168280 }, { "epoch": 0.29, "learning_rate": 3.5326122971431764e-05, "loss": 2.5244, "step": 168290 }, { "epoch": 0.29, "learning_rate": 3.5325251031504934e-05, "loss": 2.531, "step": 168300 }, { "epoch": 0.29, "learning_rate": 3.5324379091578105e-05, "loss": 2.3828, "step": 168310 }, { "epoch": 0.29, "learning_rate": 3.532350715165128e-05, "loss": 2.4002, "step": 168320 }, { "epoch": 0.29, "learning_rate": 3.532263521172445e-05, "loss": 2.4119, "step": 168330 }, { "epoch": 0.29, "learning_rate": 3.532176327179762e-05, "loss": 2.4092, "step": 168340 }, { "epoch": 0.29, "learning_rate": 3.532089133187081e-05, "loss": 2.4178, "step": 168350 }, { "epoch": 0.29, "learning_rate": 3.532001939194398e-05, "loss": 2.385, "step": 168360 }, { "epoch": 0.29, "learning_rate": 3.531914745201715e-05, "loss": 2.3948, "step": 168370 }, { "epoch": 0.29, "learning_rate": 3.531827551209032e-05, "loss": 2.44, "step": 168380 }, { "epoch": 0.29, "learning_rate": 3.5317403572163495e-05, "loss": 2.4606, "step": 168390 }, { "epoch": 0.29, "learning_rate": 3.5316531632236665e-05, "loss": 2.4639, "step": 168400 }, { "epoch": 0.29, "learning_rate": 3.5315659692309836e-05, "loss": 2.5539, "step": 168410 }, { "epoch": 0.29, "learning_rate": 3.531478775238301e-05, "loss": 2.3607, "step": 168420 }, { "epoch": 0.29, "learning_rate": 3.531391581245619e-05, "loss": 2.5212, "step": 168430 }, { "epoch": 0.29, "learning_rate": 3.531304387252936e-05, "loss": 2.504, "step": 168440 }, { "epoch": 0.29, "learning_rate": 3.531217193260253e-05, "loss": 2.3469, "step": 168450 }, { "epoch": 0.29, "learning_rate": 3.531129999267571e-05, "loss": 2.5591, "step": 168460 }, { "epoch": 0.29, "learning_rate": 3.531042805274888e-05, "loss": 2.4587, "step": 168470 }, { "epoch": 0.29, "learning_rate": 3.530955611282205e-05, "loss": 2.598, "step": 168480 }, { "epoch": 0.29, "learning_rate": 3.5308684172895226e-05, "loss": 2.4452, "step": 168490 }, { "epoch": 0.29, "learning_rate": 3.53078122329684e-05, "loss": 2.5471, "step": 168500 }, { "epoch": 0.29, "learning_rate": 3.5306940293041573e-05, "loss": 2.4438, "step": 168510 }, { "epoch": 0.29, "learning_rate": 3.5306068353114744e-05, "loss": 2.5603, "step": 168520 }, { "epoch": 0.29, "learning_rate": 3.530519641318792e-05, "loss": 2.4473, "step": 168530 }, { "epoch": 0.29, "learning_rate": 3.530432447326109e-05, "loss": 2.5166, "step": 168540 }, { "epoch": 0.29, "learning_rate": 3.530345253333426e-05, "loss": 2.3941, "step": 168550 }, { "epoch": 0.29, "learning_rate": 3.530258059340744e-05, "loss": 2.4741, "step": 168560 }, { "epoch": 0.29, "learning_rate": 3.5301708653480616e-05, "loss": 2.535, "step": 168570 }, { "epoch": 0.29, "learning_rate": 3.5300836713553786e-05, "loss": 2.4841, "step": 168580 }, { "epoch": 0.29, "learning_rate": 3.529996477362696e-05, "loss": 2.4588, "step": 168590 }, { "epoch": 0.29, "learning_rate": 3.5299092833700134e-05, "loss": 2.5207, "step": 168600 }, { "epoch": 0.29, "learning_rate": 3.5298220893773304e-05, "loss": 2.4895, "step": 168610 }, { "epoch": 0.29, "learning_rate": 3.5297348953846475e-05, "loss": 2.4612, "step": 168620 }, { "epoch": 0.29, "learning_rate": 3.529647701391965e-05, "loss": 2.4685, "step": 168630 }, { "epoch": 0.29, "learning_rate": 3.529560507399282e-05, "loss": 2.5118, "step": 168640 }, { "epoch": 0.29, "learning_rate": 3.5294733134066e-05, "loss": 2.3397, "step": 168650 }, { "epoch": 0.29, "learning_rate": 3.529386119413917e-05, "loss": 2.3591, "step": 168660 }, { "epoch": 0.29, "learning_rate": 3.529298925421235e-05, "loss": 2.5084, "step": 168670 }, { "epoch": 0.29, "learning_rate": 3.529211731428552e-05, "loss": 2.4749, "step": 168680 }, { "epoch": 0.29, "learning_rate": 3.529124537435869e-05, "loss": 2.5872, "step": 168690 }, { "epoch": 0.29, "learning_rate": 3.529037343443186e-05, "loss": 2.4919, "step": 168700 }, { "epoch": 0.29, "learning_rate": 3.5289501494505035e-05, "loss": 2.3341, "step": 168710 }, { "epoch": 0.29, "learning_rate": 3.528862955457821e-05, "loss": 2.3201, "step": 168720 }, { "epoch": 0.29, "learning_rate": 3.528775761465138e-05, "loss": 2.4643, "step": 168730 }, { "epoch": 0.29, "learning_rate": 3.528688567472456e-05, "loss": 2.4143, "step": 168740 }, { "epoch": 0.29, "learning_rate": 3.528601373479773e-05, "loss": 2.4467, "step": 168750 }, { "epoch": 0.29, "learning_rate": 3.52851417948709e-05, "loss": 2.4602, "step": 168760 }, { "epoch": 0.29, "learning_rate": 3.528426985494407e-05, "loss": 2.438, "step": 168770 }, { "epoch": 0.29, "learning_rate": 3.528339791501725e-05, "loss": 2.4321, "step": 168780 }, { "epoch": 0.29, "learning_rate": 3.528252597509042e-05, "loss": 2.336, "step": 168790 }, { "epoch": 0.29, "learning_rate": 3.5281654035163596e-05, "loss": 2.473, "step": 168800 }, { "epoch": 0.29, "learning_rate": 3.5280782095236766e-05, "loss": 2.5285, "step": 168810 }, { "epoch": 0.29, "learning_rate": 3.5279910155309943e-05, "loss": 2.4396, "step": 168820 }, { "epoch": 0.29, "learning_rate": 3.5279038215383114e-05, "loss": 2.5216, "step": 168830 }, { "epoch": 0.29, "learning_rate": 3.5278166275456284e-05, "loss": 2.4411, "step": 168840 }, { "epoch": 0.29, "learning_rate": 3.527729433552946e-05, "loss": 2.4334, "step": 168850 }, { "epoch": 0.29, "learning_rate": 3.527642239560263e-05, "loss": 2.4952, "step": 168860 }, { "epoch": 0.29, "learning_rate": 3.527555045567581e-05, "loss": 2.4104, "step": 168870 }, { "epoch": 0.29, "learning_rate": 3.527467851574898e-05, "loss": 2.4974, "step": 168880 }, { "epoch": 0.29, "learning_rate": 3.5273806575822156e-05, "loss": 2.5858, "step": 168890 }, { "epoch": 0.29, "learning_rate": 3.527293463589533e-05, "loss": 2.5843, "step": 168900 }, { "epoch": 0.29, "learning_rate": 3.52720626959685e-05, "loss": 2.5252, "step": 168910 }, { "epoch": 0.29, "learning_rate": 3.5271190756041674e-05, "loss": 2.4999, "step": 168920 }, { "epoch": 0.29, "learning_rate": 3.5270318816114845e-05, "loss": 2.5392, "step": 168930 }, { "epoch": 0.29, "learning_rate": 3.526944687618802e-05, "loss": 2.4938, "step": 168940 }, { "epoch": 0.29, "learning_rate": 3.526857493626119e-05, "loss": 2.4556, "step": 168950 }, { "epoch": 0.29, "learning_rate": 3.526770299633437e-05, "loss": 2.481, "step": 168960 }, { "epoch": 0.29, "learning_rate": 3.526683105640754e-05, "loss": 2.4818, "step": 168970 }, { "epoch": 0.29, "learning_rate": 3.526595911648071e-05, "loss": 2.5869, "step": 168980 }, { "epoch": 0.29, "learning_rate": 3.526508717655389e-05, "loss": 2.3808, "step": 168990 }, { "epoch": 0.29, "learning_rate": 3.526421523662706e-05, "loss": 2.3291, "step": 169000 }, { "epoch": 0.29, "learning_rate": 3.526334329670023e-05, "loss": 2.431, "step": 169010 }, { "epoch": 0.29, "learning_rate": 3.5262471356773405e-05, "loss": 2.3751, "step": 169020 }, { "epoch": 0.29, "learning_rate": 3.526159941684658e-05, "loss": 2.4939, "step": 169030 }, { "epoch": 0.29, "learning_rate": 3.526072747691975e-05, "loss": 2.4091, "step": 169040 }, { "epoch": 0.29, "learning_rate": 3.525985553699292e-05, "loss": 2.5762, "step": 169050 }, { "epoch": 0.29, "learning_rate": 3.52589835970661e-05, "loss": 2.4489, "step": 169060 }, { "epoch": 0.29, "learning_rate": 3.525811165713927e-05, "loss": 2.4814, "step": 169070 }, { "epoch": 0.29, "learning_rate": 3.525723971721244e-05, "loss": 2.5183, "step": 169080 }, { "epoch": 0.29, "learning_rate": 3.525636777728562e-05, "loss": 2.5138, "step": 169090 }, { "epoch": 0.29, "learning_rate": 3.5255495837358795e-05, "loss": 2.3706, "step": 169100 }, { "epoch": 0.29, "learning_rate": 3.5254623897431966e-05, "loss": 2.3754, "step": 169110 }, { "epoch": 0.29, "learning_rate": 3.5253751957505136e-05, "loss": 2.4297, "step": 169120 }, { "epoch": 0.29, "learning_rate": 3.525288001757831e-05, "loss": 2.4091, "step": 169130 }, { "epoch": 0.29, "learning_rate": 3.5252008077651484e-05, "loss": 2.5541, "step": 169140 }, { "epoch": 0.29, "learning_rate": 3.5251136137724654e-05, "loss": 2.518, "step": 169150 }, { "epoch": 0.29, "learning_rate": 3.5250264197797824e-05, "loss": 2.4313, "step": 169160 }, { "epoch": 0.3, "learning_rate": 3.524939225787101e-05, "loss": 2.4291, "step": 169170 }, { "epoch": 0.3, "learning_rate": 3.524852031794418e-05, "loss": 2.4187, "step": 169180 }, { "epoch": 0.3, "learning_rate": 3.524764837801735e-05, "loss": 2.3611, "step": 169190 }, { "epoch": 0.3, "learning_rate": 3.5246776438090526e-05, "loss": 2.5302, "step": 169200 }, { "epoch": 0.3, "learning_rate": 3.52459044981637e-05, "loss": 2.6025, "step": 169210 }, { "epoch": 0.3, "learning_rate": 3.524503255823687e-05, "loss": 2.4825, "step": 169220 }, { "epoch": 0.3, "learning_rate": 3.524416061831004e-05, "loss": 2.2108, "step": 169230 }, { "epoch": 0.3, "learning_rate": 3.524328867838322e-05, "loss": 2.4297, "step": 169240 }, { "epoch": 0.3, "learning_rate": 3.524241673845639e-05, "loss": 2.3878, "step": 169250 }, { "epoch": 0.3, "learning_rate": 3.524154479852956e-05, "loss": 2.4975, "step": 169260 }, { "epoch": 0.3, "learning_rate": 3.524067285860273e-05, "loss": 2.4923, "step": 169270 }, { "epoch": 0.3, "learning_rate": 3.523980091867591e-05, "loss": 2.4842, "step": 169280 }, { "epoch": 0.3, "learning_rate": 3.523892897874908e-05, "loss": 2.4116, "step": 169290 }, { "epoch": 0.3, "learning_rate": 3.523805703882225e-05, "loss": 2.4319, "step": 169300 }, { "epoch": 0.3, "learning_rate": 3.523718509889543e-05, "loss": 2.4734, "step": 169310 }, { "epoch": 0.3, "learning_rate": 3.5236313158968605e-05, "loss": 2.4038, "step": 169320 }, { "epoch": 0.3, "learning_rate": 3.5235441219041775e-05, "loss": 2.5087, "step": 169330 }, { "epoch": 0.3, "learning_rate": 3.5234569279114946e-05, "loss": 2.4814, "step": 169340 }, { "epoch": 0.3, "learning_rate": 3.523369733918812e-05, "loss": 2.4497, "step": 169350 }, { "epoch": 0.3, "learning_rate": 3.523282539926129e-05, "loss": 2.411, "step": 169360 }, { "epoch": 0.3, "learning_rate": 3.5231953459334463e-05, "loss": 2.4608, "step": 169370 }, { "epoch": 0.3, "learning_rate": 3.523108151940764e-05, "loss": 2.4122, "step": 169380 }, { "epoch": 0.3, "learning_rate": 3.523020957948082e-05, "loss": 2.5392, "step": 169390 }, { "epoch": 0.3, "learning_rate": 3.522933763955399e-05, "loss": 2.4991, "step": 169400 }, { "epoch": 0.3, "learning_rate": 3.522846569962716e-05, "loss": 2.4316, "step": 169410 }, { "epoch": 0.3, "learning_rate": 3.5227593759700336e-05, "loss": 2.4634, "step": 169420 }, { "epoch": 0.3, "learning_rate": 3.5226721819773506e-05, "loss": 2.3525, "step": 169430 }, { "epoch": 0.3, "learning_rate": 3.5225849879846676e-05, "loss": 2.4535, "step": 169440 }, { "epoch": 0.3, "learning_rate": 3.5224977939919854e-05, "loss": 2.4728, "step": 169450 }, { "epoch": 0.3, "learning_rate": 3.5224105999993024e-05, "loss": 2.4439, "step": 169460 }, { "epoch": 0.3, "learning_rate": 3.52232340600662e-05, "loss": 2.4124, "step": 169470 }, { "epoch": 0.3, "learning_rate": 3.522236212013937e-05, "loss": 2.5247, "step": 169480 }, { "epoch": 0.3, "learning_rate": 3.522149018021255e-05, "loss": 2.4999, "step": 169490 }, { "epoch": 0.3, "learning_rate": 3.522061824028572e-05, "loss": 2.4822, "step": 169500 }, { "epoch": 0.3, "learning_rate": 3.521974630035889e-05, "loss": 2.4564, "step": 169510 }, { "epoch": 0.3, "learning_rate": 3.521887436043207e-05, "loss": 2.548, "step": 169520 }, { "epoch": 0.3, "learning_rate": 3.521800242050524e-05, "loss": 2.4801, "step": 169530 }, { "epoch": 0.3, "learning_rate": 3.5217130480578414e-05, "loss": 2.4971, "step": 169540 }, { "epoch": 0.3, "learning_rate": 3.5216258540651585e-05, "loss": 2.428, "step": 169550 }, { "epoch": 0.3, "learning_rate": 3.521538660072476e-05, "loss": 2.4959, "step": 169560 }, { "epoch": 0.3, "learning_rate": 3.521451466079793e-05, "loss": 2.3543, "step": 169570 }, { "epoch": 0.3, "learning_rate": 3.52136427208711e-05, "loss": 2.4471, "step": 169580 }, { "epoch": 0.3, "learning_rate": 3.521277078094428e-05, "loss": 2.5954, "step": 169590 }, { "epoch": 0.3, "learning_rate": 3.521189884101745e-05, "loss": 2.4725, "step": 169600 }, { "epoch": 0.3, "learning_rate": 3.521102690109063e-05, "loss": 2.6089, "step": 169610 }, { "epoch": 0.3, "learning_rate": 3.52101549611638e-05, "loss": 2.514, "step": 169620 }, { "epoch": 0.3, "learning_rate": 3.5209283021236975e-05, "loss": 2.4704, "step": 169630 }, { "epoch": 0.3, "learning_rate": 3.5208411081310145e-05, "loss": 2.461, "step": 169640 }, { "epoch": 0.3, "learning_rate": 3.5207539141383315e-05, "loss": 2.4368, "step": 169650 }, { "epoch": 0.3, "learning_rate": 3.5206667201456486e-05, "loss": 2.4786, "step": 169660 }, { "epoch": 0.3, "learning_rate": 3.520579526152966e-05, "loss": 2.4035, "step": 169670 }, { "epoch": 0.3, "learning_rate": 3.5204923321602833e-05, "loss": 2.4433, "step": 169680 }, { "epoch": 0.3, "learning_rate": 3.520405138167601e-05, "loss": 2.4052, "step": 169690 }, { "epoch": 0.3, "learning_rate": 3.520317944174919e-05, "loss": 2.4469, "step": 169700 }, { "epoch": 0.3, "learning_rate": 3.520230750182236e-05, "loss": 2.584, "step": 169710 }, { "epoch": 0.3, "learning_rate": 3.520143556189553e-05, "loss": 2.4628, "step": 169720 }, { "epoch": 0.3, "learning_rate": 3.52005636219687e-05, "loss": 2.3857, "step": 169730 }, { "epoch": 0.3, "learning_rate": 3.5199691682041876e-05, "loss": 2.4345, "step": 169740 }, { "epoch": 0.3, "learning_rate": 3.5198819742115046e-05, "loss": 2.4244, "step": 169750 }, { "epoch": 0.3, "learning_rate": 3.5197947802188224e-05, "loss": 2.3823, "step": 169760 }, { "epoch": 0.3, "learning_rate": 3.5197075862261394e-05, "loss": 2.4318, "step": 169770 }, { "epoch": 0.3, "learning_rate": 3.519620392233457e-05, "loss": 2.562, "step": 169780 }, { "epoch": 0.3, "learning_rate": 3.519533198240774e-05, "loss": 2.5123, "step": 169790 }, { "epoch": 0.3, "learning_rate": 3.519446004248091e-05, "loss": 2.3934, "step": 169800 }, { "epoch": 0.3, "learning_rate": 3.519358810255409e-05, "loss": 2.4599, "step": 169810 }, { "epoch": 0.3, "learning_rate": 3.519271616262726e-05, "loss": 2.4926, "step": 169820 }, { "epoch": 0.3, "learning_rate": 3.519184422270043e-05, "loss": 2.4292, "step": 169830 }, { "epoch": 0.3, "learning_rate": 3.519097228277361e-05, "loss": 2.5683, "step": 169840 }, { "epoch": 0.3, "learning_rate": 3.5190100342846784e-05, "loss": 2.4025, "step": 169850 }, { "epoch": 0.3, "learning_rate": 3.5189228402919954e-05, "loss": 2.2624, "step": 169860 }, { "epoch": 0.3, "learning_rate": 3.5188356462993125e-05, "loss": 2.412, "step": 169870 }, { "epoch": 0.3, "learning_rate": 3.51874845230663e-05, "loss": 2.4542, "step": 169880 }, { "epoch": 0.3, "learning_rate": 3.518661258313947e-05, "loss": 2.506, "step": 169890 }, { "epoch": 0.3, "learning_rate": 3.518574064321264e-05, "loss": 2.4993, "step": 169900 }, { "epoch": 0.3, "learning_rate": 3.518486870328582e-05, "loss": 2.5845, "step": 169910 }, { "epoch": 0.3, "learning_rate": 3.5183996763359e-05, "loss": 2.4467, "step": 169920 }, { "epoch": 0.3, "learning_rate": 3.518312482343217e-05, "loss": 2.5103, "step": 169930 }, { "epoch": 0.3, "learning_rate": 3.518225288350534e-05, "loss": 2.4377, "step": 169940 }, { "epoch": 0.3, "learning_rate": 3.5181380943578515e-05, "loss": 2.4834, "step": 169950 }, { "epoch": 0.3, "learning_rate": 3.5180509003651685e-05, "loss": 2.4566, "step": 169960 }, { "epoch": 0.3, "learning_rate": 3.5179637063724856e-05, "loss": 2.5547, "step": 169970 }, { "epoch": 0.3, "learning_rate": 3.517876512379803e-05, "loss": 2.4644, "step": 169980 }, { "epoch": 0.3, "learning_rate": 3.517789318387121e-05, "loss": 2.4691, "step": 169990 }, { "epoch": 0.3, "learning_rate": 3.517702124394438e-05, "loss": 2.509, "step": 170000 }, { "epoch": 0.3, "learning_rate": 3.517614930401755e-05, "loss": 2.4427, "step": 170010 }, { "epoch": 0.3, "learning_rate": 3.517527736409073e-05, "loss": 2.3924, "step": 170020 }, { "epoch": 0.3, "learning_rate": 3.51744054241639e-05, "loss": 2.4402, "step": 170030 }, { "epoch": 0.3, "learning_rate": 3.517353348423707e-05, "loss": 2.2973, "step": 170040 }, { "epoch": 0.3, "learning_rate": 3.517266154431024e-05, "loss": 2.41, "step": 170050 }, { "epoch": 0.3, "learning_rate": 3.517178960438342e-05, "loss": 2.4829, "step": 170060 }, { "epoch": 0.3, "learning_rate": 3.5170917664456593e-05, "loss": 2.5026, "step": 170070 }, { "epoch": 0.3, "learning_rate": 3.5170045724529764e-05, "loss": 2.4643, "step": 170080 }, { "epoch": 0.3, "learning_rate": 3.516917378460294e-05, "loss": 2.4412, "step": 170090 }, { "epoch": 0.3, "learning_rate": 3.516830184467611e-05, "loss": 2.4897, "step": 170100 }, { "epoch": 0.3, "learning_rate": 3.516742990474928e-05, "loss": 2.4402, "step": 170110 }, { "epoch": 0.3, "learning_rate": 3.516655796482245e-05, "loss": 2.5482, "step": 170120 }, { "epoch": 0.3, "learning_rate": 3.5165686024895636e-05, "loss": 2.4534, "step": 170130 }, { "epoch": 0.3, "learning_rate": 3.5164814084968806e-05, "loss": 2.5417, "step": 170140 }, { "epoch": 0.3, "learning_rate": 3.516394214504198e-05, "loss": 2.4766, "step": 170150 }, { "epoch": 0.3, "learning_rate": 3.516307020511515e-05, "loss": 2.3702, "step": 170160 }, { "epoch": 0.3, "learning_rate": 3.5162198265188324e-05, "loss": 2.4652, "step": 170170 }, { "epoch": 0.3, "learning_rate": 3.5161326325261495e-05, "loss": 2.4069, "step": 170180 }, { "epoch": 0.3, "learning_rate": 3.5160454385334665e-05, "loss": 2.4813, "step": 170190 }, { "epoch": 0.3, "learning_rate": 3.515958244540784e-05, "loss": 2.506, "step": 170200 }, { "epoch": 0.3, "learning_rate": 3.515871050548102e-05, "loss": 2.4427, "step": 170210 }, { "epoch": 0.3, "learning_rate": 3.515783856555419e-05, "loss": 2.4545, "step": 170220 }, { "epoch": 0.3, "learning_rate": 3.515696662562736e-05, "loss": 2.4909, "step": 170230 }, { "epoch": 0.3, "learning_rate": 3.515609468570054e-05, "loss": 2.4418, "step": 170240 }, { "epoch": 0.3, "learning_rate": 3.515522274577371e-05, "loss": 2.4183, "step": 170250 }, { "epoch": 0.3, "learning_rate": 3.515435080584688e-05, "loss": 2.5243, "step": 170260 }, { "epoch": 0.3, "learning_rate": 3.5153478865920055e-05, "loss": 2.3377, "step": 170270 }, { "epoch": 0.3, "learning_rate": 3.515260692599323e-05, "loss": 2.4375, "step": 170280 }, { "epoch": 0.3, "learning_rate": 3.51517349860664e-05, "loss": 2.3941, "step": 170290 }, { "epoch": 0.3, "learning_rate": 3.515086304613957e-05, "loss": 2.4843, "step": 170300 }, { "epoch": 0.3, "learning_rate": 3.514999110621275e-05, "loss": 2.4441, "step": 170310 }, { "epoch": 0.3, "learning_rate": 3.514911916628592e-05, "loss": 2.5799, "step": 170320 }, { "epoch": 0.3, "learning_rate": 3.514824722635909e-05, "loss": 2.5459, "step": 170330 }, { "epoch": 0.3, "learning_rate": 3.514737528643227e-05, "loss": 2.5358, "step": 170340 }, { "epoch": 0.3, "learning_rate": 3.514650334650544e-05, "loss": 2.402, "step": 170350 }, { "epoch": 0.3, "learning_rate": 3.5145631406578616e-05, "loss": 2.5565, "step": 170360 }, { "epoch": 0.3, "learning_rate": 3.5144759466651786e-05, "loss": 2.4677, "step": 170370 }, { "epoch": 0.3, "learning_rate": 3.5143887526724963e-05, "loss": 2.3627, "step": 170380 }, { "epoch": 0.3, "learning_rate": 3.5143015586798134e-05, "loss": 2.3271, "step": 170390 }, { "epoch": 0.3, "learning_rate": 3.5142143646871304e-05, "loss": 2.4371, "step": 170400 }, { "epoch": 0.3, "learning_rate": 3.514127170694448e-05, "loss": 2.5496, "step": 170410 }, { "epoch": 0.3, "learning_rate": 3.514039976701765e-05, "loss": 2.4879, "step": 170420 }, { "epoch": 0.3, "learning_rate": 3.513952782709083e-05, "loss": 2.441, "step": 170430 }, { "epoch": 0.3, "learning_rate": 3.5138655887164e-05, "loss": 2.5028, "step": 170440 }, { "epoch": 0.3, "learning_rate": 3.5137783947237176e-05, "loss": 2.4815, "step": 170450 }, { "epoch": 0.3, "learning_rate": 3.513691200731035e-05, "loss": 2.4727, "step": 170460 }, { "epoch": 0.3, "learning_rate": 3.513604006738352e-05, "loss": 2.4404, "step": 170470 }, { "epoch": 0.3, "learning_rate": 3.5135168127456694e-05, "loss": 2.4508, "step": 170480 }, { "epoch": 0.3, "learning_rate": 3.5134296187529865e-05, "loss": 2.3534, "step": 170490 }, { "epoch": 0.3, "learning_rate": 3.5133424247603035e-05, "loss": 2.4178, "step": 170500 }, { "epoch": 0.3, "learning_rate": 3.513255230767621e-05, "loss": 2.3128, "step": 170510 }, { "epoch": 0.3, "learning_rate": 3.513168036774939e-05, "loss": 2.401, "step": 170520 }, { "epoch": 0.3, "learning_rate": 3.513080842782256e-05, "loss": 2.4872, "step": 170530 }, { "epoch": 0.3, "learning_rate": 3.512993648789573e-05, "loss": 2.4247, "step": 170540 }, { "epoch": 0.3, "learning_rate": 3.512906454796891e-05, "loss": 2.4046, "step": 170550 }, { "epoch": 0.3, "learning_rate": 3.512819260804208e-05, "loss": 2.3925, "step": 170560 }, { "epoch": 0.3, "learning_rate": 3.512732066811525e-05, "loss": 2.3637, "step": 170570 }, { "epoch": 0.3, "learning_rate": 3.5126448728188425e-05, "loss": 2.4699, "step": 170580 }, { "epoch": 0.3, "learning_rate": 3.51255767882616e-05, "loss": 2.5448, "step": 170590 }, { "epoch": 0.3, "learning_rate": 3.512470484833477e-05, "loss": 2.4501, "step": 170600 }, { "epoch": 0.3, "learning_rate": 3.512383290840794e-05, "loss": 2.4357, "step": 170610 }, { "epoch": 0.3, "learning_rate": 3.5122960968481114e-05, "loss": 2.4215, "step": 170620 }, { "epoch": 0.3, "learning_rate": 3.512208902855429e-05, "loss": 2.474, "step": 170630 }, { "epoch": 0.3, "learning_rate": 3.512121708862746e-05, "loss": 2.3257, "step": 170640 }, { "epoch": 0.3, "learning_rate": 3.512034514870063e-05, "loss": 2.4396, "step": 170650 }, { "epoch": 0.3, "learning_rate": 3.5119473208773815e-05, "loss": 2.5419, "step": 170660 }, { "epoch": 0.3, "learning_rate": 3.5118601268846986e-05, "loss": 2.4137, "step": 170670 }, { "epoch": 0.3, "learning_rate": 3.5117729328920156e-05, "loss": 2.4571, "step": 170680 }, { "epoch": 0.3, "learning_rate": 3.5116857388993327e-05, "loss": 2.3385, "step": 170690 }, { "epoch": 0.3, "learning_rate": 3.5115985449066504e-05, "loss": 2.5011, "step": 170700 }, { "epoch": 0.3, "learning_rate": 3.5115113509139674e-05, "loss": 2.5838, "step": 170710 }, { "epoch": 0.3, "learning_rate": 3.5114241569212844e-05, "loss": 2.4617, "step": 170720 }, { "epoch": 0.3, "learning_rate": 3.511336962928602e-05, "loss": 2.4591, "step": 170730 }, { "epoch": 0.3, "learning_rate": 3.51124976893592e-05, "loss": 2.4133, "step": 170740 }, { "epoch": 0.3, "learning_rate": 3.511162574943237e-05, "loss": 2.422, "step": 170750 }, { "epoch": 0.3, "learning_rate": 3.511075380950554e-05, "loss": 2.4892, "step": 170760 }, { "epoch": 0.3, "learning_rate": 3.510988186957872e-05, "loss": 2.4556, "step": 170770 }, { "epoch": 0.3, "learning_rate": 3.510900992965189e-05, "loss": 2.4703, "step": 170780 }, { "epoch": 0.3, "learning_rate": 3.510813798972506e-05, "loss": 2.4509, "step": 170790 }, { "epoch": 0.3, "learning_rate": 3.5107266049798235e-05, "loss": 2.4998, "step": 170800 }, { "epoch": 0.3, "learning_rate": 3.510639410987141e-05, "loss": 2.5058, "step": 170810 }, { "epoch": 0.3, "learning_rate": 3.510552216994458e-05, "loss": 2.34, "step": 170820 }, { "epoch": 0.3, "learning_rate": 3.510465023001775e-05, "loss": 2.3594, "step": 170830 }, { "epoch": 0.3, "learning_rate": 3.510377829009093e-05, "loss": 2.4802, "step": 170840 }, { "epoch": 0.3, "learning_rate": 3.51029063501641e-05, "loss": 2.4529, "step": 170850 }, { "epoch": 0.3, "learning_rate": 3.510203441023727e-05, "loss": 2.5129, "step": 170860 }, { "epoch": 0.3, "learning_rate": 3.510116247031045e-05, "loss": 2.4836, "step": 170870 }, { "epoch": 0.3, "learning_rate": 3.5100290530383625e-05, "loss": 2.3228, "step": 170880 }, { "epoch": 0.3, "learning_rate": 3.5099418590456795e-05, "loss": 2.5659, "step": 170890 }, { "epoch": 0.3, "learning_rate": 3.5098546650529966e-05, "loss": 2.3954, "step": 170900 }, { "epoch": 0.3, "learning_rate": 3.509767471060314e-05, "loss": 2.3909, "step": 170910 }, { "epoch": 0.3, "learning_rate": 3.509680277067631e-05, "loss": 2.4788, "step": 170920 }, { "epoch": 0.3, "learning_rate": 3.5095930830749483e-05, "loss": 2.5497, "step": 170930 }, { "epoch": 0.3, "learning_rate": 3.509505889082266e-05, "loss": 2.4048, "step": 170940 }, { "epoch": 0.3, "learning_rate": 3.509418695089584e-05, "loss": 2.4873, "step": 170950 }, { "epoch": 0.3, "learning_rate": 3.509331501096901e-05, "loss": 2.4359, "step": 170960 }, { "epoch": 0.3, "learning_rate": 3.509244307104218e-05, "loss": 2.5613, "step": 170970 }, { "epoch": 0.3, "learning_rate": 3.5091571131115356e-05, "loss": 2.3702, "step": 170980 }, { "epoch": 0.3, "learning_rate": 3.5090699191188526e-05, "loss": 2.5211, "step": 170990 }, { "epoch": 0.3, "learning_rate": 3.5089827251261696e-05, "loss": 2.4112, "step": 171000 }, { "epoch": 0.3, "learning_rate": 3.508895531133487e-05, "loss": 2.5257, "step": 171010 }, { "epoch": 0.3, "learning_rate": 3.5088083371408044e-05, "loss": 2.4561, "step": 171020 }, { "epoch": 0.3, "learning_rate": 3.508721143148122e-05, "loss": 2.5636, "step": 171030 }, { "epoch": 0.3, "learning_rate": 3.508633949155439e-05, "loss": 2.5467, "step": 171040 }, { "epoch": 0.3, "learning_rate": 3.508546755162757e-05, "loss": 2.4854, "step": 171050 }, { "epoch": 0.3, "learning_rate": 3.508459561170074e-05, "loss": 2.4307, "step": 171060 }, { "epoch": 0.3, "learning_rate": 3.508372367177391e-05, "loss": 2.4238, "step": 171070 }, { "epoch": 0.3, "learning_rate": 3.508285173184708e-05, "loss": 2.4302, "step": 171080 }, { "epoch": 0.3, "learning_rate": 3.508197979192026e-05, "loss": 2.4378, "step": 171090 }, { "epoch": 0.3, "learning_rate": 3.5081107851993434e-05, "loss": 2.3462, "step": 171100 }, { "epoch": 0.3, "learning_rate": 3.5080235912066605e-05, "loss": 2.4127, "step": 171110 }, { "epoch": 0.3, "learning_rate": 3.5079363972139775e-05, "loss": 2.3591, "step": 171120 }, { "epoch": 0.3, "learning_rate": 3.507849203221295e-05, "loss": 2.4109, "step": 171130 }, { "epoch": 0.3, "learning_rate": 3.507762009228612e-05, "loss": 2.4182, "step": 171140 }, { "epoch": 0.3, "learning_rate": 3.507674815235929e-05, "loss": 2.4908, "step": 171150 }, { "epoch": 0.3, "learning_rate": 3.507587621243247e-05, "loss": 2.4484, "step": 171160 }, { "epoch": 0.3, "learning_rate": 3.507500427250564e-05, "loss": 2.4686, "step": 171170 }, { "epoch": 0.3, "learning_rate": 3.507413233257882e-05, "loss": 2.3781, "step": 171180 }, { "epoch": 0.3, "learning_rate": 3.507326039265199e-05, "loss": 2.4609, "step": 171190 }, { "epoch": 0.3, "learning_rate": 3.5072388452725165e-05, "loss": 2.4689, "step": 171200 }, { "epoch": 0.3, "learning_rate": 3.5071516512798335e-05, "loss": 2.5941, "step": 171210 }, { "epoch": 0.3, "learning_rate": 3.5070644572871506e-05, "loss": 2.5562, "step": 171220 }, { "epoch": 0.3, "learning_rate": 3.506977263294468e-05, "loss": 2.5365, "step": 171230 }, { "epoch": 0.3, "learning_rate": 3.5068900693017853e-05, "loss": 2.4518, "step": 171240 }, { "epoch": 0.3, "learning_rate": 3.506802875309103e-05, "loss": 2.4065, "step": 171250 }, { "epoch": 0.3, "learning_rate": 3.50671568131642e-05, "loss": 2.4452, "step": 171260 }, { "epoch": 0.3, "learning_rate": 3.506628487323738e-05, "loss": 2.3516, "step": 171270 }, { "epoch": 0.3, "learning_rate": 3.506541293331055e-05, "loss": 2.5136, "step": 171280 }, { "epoch": 0.3, "learning_rate": 3.506454099338372e-05, "loss": 2.4296, "step": 171290 }, { "epoch": 0.3, "learning_rate": 3.5063669053456896e-05, "loss": 2.5232, "step": 171300 }, { "epoch": 0.3, "learning_rate": 3.5062797113530066e-05, "loss": 2.3535, "step": 171310 }, { "epoch": 0.3, "learning_rate": 3.506192517360324e-05, "loss": 2.3023, "step": 171320 }, { "epoch": 0.3, "learning_rate": 3.5061053233676414e-05, "loss": 2.5012, "step": 171330 }, { "epoch": 0.3, "learning_rate": 3.506018129374959e-05, "loss": 2.3717, "step": 171340 }, { "epoch": 0.3, "learning_rate": 3.505930935382276e-05, "loss": 2.3418, "step": 171350 }, { "epoch": 0.3, "learning_rate": 3.505843741389593e-05, "loss": 2.4048, "step": 171360 }, { "epoch": 0.3, "learning_rate": 3.505756547396911e-05, "loss": 2.495, "step": 171370 }, { "epoch": 0.3, "learning_rate": 3.505669353404228e-05, "loss": 2.4059, "step": 171380 }, { "epoch": 0.3, "learning_rate": 3.505582159411545e-05, "loss": 2.4908, "step": 171390 }, { "epoch": 0.3, "learning_rate": 3.505494965418863e-05, "loss": 2.4911, "step": 171400 }, { "epoch": 0.3, "learning_rate": 3.5054077714261804e-05, "loss": 2.4146, "step": 171410 }, { "epoch": 0.3, "learning_rate": 3.5053205774334974e-05, "loss": 2.4893, "step": 171420 }, { "epoch": 0.3, "learning_rate": 3.5052333834408145e-05, "loss": 2.5168, "step": 171430 }, { "epoch": 0.3, "learning_rate": 3.505146189448132e-05, "loss": 2.5788, "step": 171440 }, { "epoch": 0.3, "learning_rate": 3.505058995455449e-05, "loss": 2.4354, "step": 171450 }, { "epoch": 0.3, "learning_rate": 3.504971801462766e-05, "loss": 2.4416, "step": 171460 }, { "epoch": 0.3, "learning_rate": 3.504884607470084e-05, "loss": 2.3826, "step": 171470 }, { "epoch": 0.3, "learning_rate": 3.504797413477402e-05, "loss": 2.4962, "step": 171480 }, { "epoch": 0.3, "learning_rate": 3.504710219484719e-05, "loss": 2.4921, "step": 171490 }, { "epoch": 0.3, "learning_rate": 3.504623025492036e-05, "loss": 2.4196, "step": 171500 }, { "epoch": 0.3, "learning_rate": 3.504535831499353e-05, "loss": 2.4541, "step": 171510 }, { "epoch": 0.3, "learning_rate": 3.5044486375066705e-05, "loss": 2.4221, "step": 171520 }, { "epoch": 0.3, "learning_rate": 3.5043614435139876e-05, "loss": 2.4274, "step": 171530 }, { "epoch": 0.3, "learning_rate": 3.5042742495213046e-05, "loss": 2.4186, "step": 171540 }, { "epoch": 0.3, "learning_rate": 3.504187055528623e-05, "loss": 2.3856, "step": 171550 }, { "epoch": 0.3, "learning_rate": 3.50409986153594e-05, "loss": 2.4765, "step": 171560 }, { "epoch": 0.3, "learning_rate": 3.504012667543257e-05, "loss": 2.5352, "step": 171570 }, { "epoch": 0.3, "learning_rate": 3.503925473550574e-05, "loss": 2.4771, "step": 171580 }, { "epoch": 0.3, "learning_rate": 3.503838279557892e-05, "loss": 2.5548, "step": 171590 }, { "epoch": 0.3, "learning_rate": 3.503751085565209e-05, "loss": 2.3618, "step": 171600 }, { "epoch": 0.3, "learning_rate": 3.503663891572526e-05, "loss": 2.3714, "step": 171610 }, { "epoch": 0.3, "learning_rate": 3.5035766975798436e-05, "loss": 2.4445, "step": 171620 }, { "epoch": 0.3, "learning_rate": 3.5034895035871613e-05, "loss": 2.4638, "step": 171630 }, { "epoch": 0.3, "learning_rate": 3.5034023095944784e-05, "loss": 2.447, "step": 171640 }, { "epoch": 0.3, "learning_rate": 3.5033151156017954e-05, "loss": 2.4627, "step": 171650 }, { "epoch": 0.3, "learning_rate": 3.503227921609113e-05, "loss": 2.3996, "step": 171660 }, { "epoch": 0.3, "learning_rate": 3.50314072761643e-05, "loss": 2.3845, "step": 171670 }, { "epoch": 0.3, "learning_rate": 3.503053533623747e-05, "loss": 2.5237, "step": 171680 }, { "epoch": 0.3, "learning_rate": 3.502966339631065e-05, "loss": 2.441, "step": 171690 }, { "epoch": 0.3, "learning_rate": 3.5028791456383826e-05, "loss": 2.5339, "step": 171700 }, { "epoch": 0.3, "learning_rate": 3.5027919516457e-05, "loss": 2.3801, "step": 171710 }, { "epoch": 0.3, "learning_rate": 3.502704757653017e-05, "loss": 2.4769, "step": 171720 }, { "epoch": 0.3, "learning_rate": 3.5026175636603344e-05, "loss": 2.3532, "step": 171730 }, { "epoch": 0.3, "learning_rate": 3.5025303696676515e-05, "loss": 2.4735, "step": 171740 }, { "epoch": 0.3, "learning_rate": 3.5024431756749685e-05, "loss": 2.5605, "step": 171750 }, { "epoch": 0.3, "learning_rate": 3.502355981682286e-05, "loss": 2.4867, "step": 171760 }, { "epoch": 0.3, "learning_rate": 3.502268787689604e-05, "loss": 2.556, "step": 171770 }, { "epoch": 0.3, "learning_rate": 3.502181593696921e-05, "loss": 2.5071, "step": 171780 }, { "epoch": 0.3, "learning_rate": 3.502094399704238e-05, "loss": 2.4085, "step": 171790 }, { "epoch": 0.3, "learning_rate": 3.502007205711556e-05, "loss": 2.3597, "step": 171800 }, { "epoch": 0.3, "learning_rate": 3.501920011718873e-05, "loss": 2.4776, "step": 171810 }, { "epoch": 0.3, "learning_rate": 3.50183281772619e-05, "loss": 2.4976, "step": 171820 }, { "epoch": 0.3, "learning_rate": 3.5017456237335075e-05, "loss": 2.472, "step": 171830 }, { "epoch": 0.3, "learning_rate": 3.5016584297408246e-05, "loss": 2.5214, "step": 171840 }, { "epoch": 0.3, "learning_rate": 3.501571235748142e-05, "loss": 2.4435, "step": 171850 }, { "epoch": 0.3, "learning_rate": 3.501484041755459e-05, "loss": 2.4794, "step": 171860 }, { "epoch": 0.3, "learning_rate": 3.501396847762777e-05, "loss": 2.2727, "step": 171870 }, { "epoch": 0.3, "learning_rate": 3.501309653770094e-05, "loss": 2.4919, "step": 171880 }, { "epoch": 0.3, "learning_rate": 3.501222459777411e-05, "loss": 2.4122, "step": 171890 }, { "epoch": 0.3, "learning_rate": 3.501135265784729e-05, "loss": 2.4942, "step": 171900 }, { "epoch": 0.3, "learning_rate": 3.501048071792046e-05, "loss": 2.458, "step": 171910 }, { "epoch": 0.3, "learning_rate": 3.5009608777993636e-05, "loss": 2.4895, "step": 171920 }, { "epoch": 0.3, "learning_rate": 3.5008736838066806e-05, "loss": 2.4068, "step": 171930 }, { "epoch": 0.3, "learning_rate": 3.5007864898139983e-05, "loss": 2.4267, "step": 171940 }, { "epoch": 0.3, "learning_rate": 3.5006992958213154e-05, "loss": 2.5237, "step": 171950 }, { "epoch": 0.3, "learning_rate": 3.5006121018286324e-05, "loss": 2.5134, "step": 171960 }, { "epoch": 0.3, "learning_rate": 3.5005249078359495e-05, "loss": 2.6451, "step": 171970 }, { "epoch": 0.3, "learning_rate": 3.500437713843267e-05, "loss": 2.4712, "step": 171980 }, { "epoch": 0.3, "learning_rate": 3.500350519850584e-05, "loss": 2.4843, "step": 171990 }, { "epoch": 0.3, "learning_rate": 3.500263325857902e-05, "loss": 2.4127, "step": 172000 }, { "epoch": 0.3, "learning_rate": 3.5001761318652196e-05, "loss": 2.5146, "step": 172010 }, { "epoch": 0.3, "learning_rate": 3.500088937872537e-05, "loss": 2.3642, "step": 172020 }, { "epoch": 0.3, "learning_rate": 3.500001743879854e-05, "loss": 2.4779, "step": 172030 }, { "epoch": 0.3, "learning_rate": 3.499914549887171e-05, "loss": 2.4252, "step": 172040 }, { "epoch": 0.3, "learning_rate": 3.4998273558944885e-05, "loss": 2.5739, "step": 172050 }, { "epoch": 0.3, "learning_rate": 3.4997401619018055e-05, "loss": 2.4672, "step": 172060 }, { "epoch": 0.3, "learning_rate": 3.499652967909123e-05, "loss": 2.3631, "step": 172070 }, { "epoch": 0.3, "learning_rate": 3.49956577391644e-05, "loss": 2.4231, "step": 172080 }, { "epoch": 0.3, "learning_rate": 3.499478579923758e-05, "loss": 2.3321, "step": 172090 }, { "epoch": 0.3, "learning_rate": 3.499391385931075e-05, "loss": 2.4321, "step": 172100 }, { "epoch": 0.3, "learning_rate": 3.499304191938392e-05, "loss": 2.3201, "step": 172110 }, { "epoch": 0.3, "learning_rate": 3.49921699794571e-05, "loss": 2.4805, "step": 172120 }, { "epoch": 0.3, "learning_rate": 3.499129803953027e-05, "loss": 2.5232, "step": 172130 }, { "epoch": 0.3, "learning_rate": 3.4990426099603445e-05, "loss": 2.5427, "step": 172140 }, { "epoch": 0.3, "learning_rate": 3.4989554159676616e-05, "loss": 2.4634, "step": 172150 }, { "epoch": 0.3, "learning_rate": 3.498868221974979e-05, "loss": 2.4523, "step": 172160 }, { "epoch": 0.3, "learning_rate": 3.498781027982296e-05, "loss": 2.4458, "step": 172170 }, { "epoch": 0.3, "learning_rate": 3.4986938339896134e-05, "loss": 2.2425, "step": 172180 }, { "epoch": 0.3, "learning_rate": 3.498606639996931e-05, "loss": 2.4235, "step": 172190 }, { "epoch": 0.3, "learning_rate": 3.498519446004248e-05, "loss": 2.4964, "step": 172200 }, { "epoch": 0.3, "learning_rate": 3.498432252011565e-05, "loss": 2.4409, "step": 172210 }, { "epoch": 0.3, "learning_rate": 3.498345058018883e-05, "loss": 2.318, "step": 172220 }, { "epoch": 0.3, "learning_rate": 3.4982578640262006e-05, "loss": 2.4677, "step": 172230 }, { "epoch": 0.3, "learning_rate": 3.4981706700335176e-05, "loss": 2.4221, "step": 172240 }, { "epoch": 0.3, "learning_rate": 3.4980834760408347e-05, "loss": 2.484, "step": 172250 }, { "epoch": 0.3, "learning_rate": 3.4979962820481524e-05, "loss": 2.4463, "step": 172260 }, { "epoch": 0.3, "learning_rate": 3.4979090880554694e-05, "loss": 2.3864, "step": 172270 }, { "epoch": 0.3, "learning_rate": 3.4978218940627864e-05, "loss": 2.4007, "step": 172280 }, { "epoch": 0.3, "learning_rate": 3.497734700070104e-05, "loss": 2.5035, "step": 172290 }, { "epoch": 0.3, "learning_rate": 3.497647506077422e-05, "loss": 2.3414, "step": 172300 }, { "epoch": 0.3, "learning_rate": 3.497560312084739e-05, "loss": 2.4183, "step": 172310 }, { "epoch": 0.3, "learning_rate": 3.497473118092056e-05, "loss": 2.4935, "step": 172320 }, { "epoch": 0.3, "learning_rate": 3.497385924099374e-05, "loss": 2.4761, "step": 172330 }, { "epoch": 0.3, "learning_rate": 3.497298730106691e-05, "loss": 2.572, "step": 172340 }, { "epoch": 0.3, "learning_rate": 3.497211536114008e-05, "loss": 2.5572, "step": 172350 }, { "epoch": 0.3, "learning_rate": 3.497124342121325e-05, "loss": 2.4397, "step": 172360 }, { "epoch": 0.3, "learning_rate": 3.497037148128643e-05, "loss": 2.4417, "step": 172370 }, { "epoch": 0.3, "learning_rate": 3.49694995413596e-05, "loss": 2.5231, "step": 172380 }, { "epoch": 0.3, "learning_rate": 3.496862760143277e-05, "loss": 2.4672, "step": 172390 }, { "epoch": 0.3, "learning_rate": 3.496775566150595e-05, "loss": 2.5936, "step": 172400 }, { "epoch": 0.3, "learning_rate": 3.496688372157912e-05, "loss": 2.4218, "step": 172410 }, { "epoch": 0.3, "learning_rate": 3.496601178165229e-05, "loss": 2.4802, "step": 172420 }, { "epoch": 0.3, "learning_rate": 3.496513984172546e-05, "loss": 2.4744, "step": 172430 }, { "epoch": 0.3, "learning_rate": 3.4964267901798645e-05, "loss": 2.3543, "step": 172440 }, { "epoch": 0.3, "learning_rate": 3.4963395961871815e-05, "loss": 2.3905, "step": 172450 }, { "epoch": 0.3, "learning_rate": 3.4962524021944986e-05, "loss": 2.5011, "step": 172460 }, { "epoch": 0.3, "learning_rate": 3.4961652082018156e-05, "loss": 2.4851, "step": 172470 }, { "epoch": 0.3, "learning_rate": 3.496078014209133e-05, "loss": 2.443, "step": 172480 }, { "epoch": 0.3, "learning_rate": 3.4959908202164503e-05, "loss": 2.3522, "step": 172490 }, { "epoch": 0.3, "learning_rate": 3.4959036262237674e-05, "loss": 2.5204, "step": 172500 }, { "epoch": 0.3, "learning_rate": 3.495816432231085e-05, "loss": 2.5476, "step": 172510 }, { "epoch": 0.3, "learning_rate": 3.495729238238403e-05, "loss": 2.6021, "step": 172520 }, { "epoch": 0.3, "learning_rate": 3.49564204424572e-05, "loss": 2.6045, "step": 172530 }, { "epoch": 0.3, "learning_rate": 3.495554850253037e-05, "loss": 2.379, "step": 172540 }, { "epoch": 0.3, "learning_rate": 3.4954676562603546e-05, "loss": 2.4226, "step": 172550 }, { "epoch": 0.3, "learning_rate": 3.4953804622676716e-05, "loss": 2.5259, "step": 172560 }, { "epoch": 0.3, "learning_rate": 3.495293268274989e-05, "loss": 2.4543, "step": 172570 }, { "epoch": 0.3, "learning_rate": 3.4952060742823064e-05, "loss": 2.3957, "step": 172580 }, { "epoch": 0.3, "learning_rate": 3.495118880289624e-05, "loss": 2.4094, "step": 172590 }, { "epoch": 0.3, "learning_rate": 3.495031686296941e-05, "loss": 2.5011, "step": 172600 }, { "epoch": 0.3, "learning_rate": 3.494944492304258e-05, "loss": 2.4671, "step": 172610 }, { "epoch": 0.3, "learning_rate": 3.494857298311576e-05, "loss": 2.5067, "step": 172620 }, { "epoch": 0.3, "learning_rate": 3.494770104318893e-05, "loss": 2.471, "step": 172630 }, { "epoch": 0.3, "learning_rate": 3.49468291032621e-05, "loss": 2.4192, "step": 172640 }, { "epoch": 0.3, "learning_rate": 3.494595716333528e-05, "loss": 2.4633, "step": 172650 }, { "epoch": 0.3, "learning_rate": 3.4945085223408454e-05, "loss": 2.5677, "step": 172660 }, { "epoch": 0.3, "learning_rate": 3.4944213283481625e-05, "loss": 2.3439, "step": 172670 }, { "epoch": 0.3, "learning_rate": 3.4943341343554795e-05, "loss": 2.4964, "step": 172680 }, { "epoch": 0.3, "learning_rate": 3.494246940362797e-05, "loss": 2.515, "step": 172690 }, { "epoch": 0.3, "learning_rate": 3.494159746370114e-05, "loss": 2.5015, "step": 172700 }, { "epoch": 0.3, "learning_rate": 3.494072552377431e-05, "loss": 2.5017, "step": 172710 }, { "epoch": 0.3, "learning_rate": 3.493985358384749e-05, "loss": 2.512, "step": 172720 }, { "epoch": 0.3, "learning_rate": 3.493898164392066e-05, "loss": 2.3934, "step": 172730 }, { "epoch": 0.3, "learning_rate": 3.493810970399384e-05, "loss": 2.4473, "step": 172740 }, { "epoch": 0.3, "learning_rate": 3.493723776406701e-05, "loss": 2.4241, "step": 172750 }, { "epoch": 0.3, "learning_rate": 3.4936365824140185e-05, "loss": 2.4689, "step": 172760 }, { "epoch": 0.3, "learning_rate": 3.4935493884213356e-05, "loss": 2.411, "step": 172770 }, { "epoch": 0.3, "learning_rate": 3.4934621944286526e-05, "loss": 2.4489, "step": 172780 }, { "epoch": 0.3, "learning_rate": 3.49337500043597e-05, "loss": 2.4208, "step": 172790 }, { "epoch": 0.3, "learning_rate": 3.4932878064432873e-05, "loss": 2.4827, "step": 172800 }, { "epoch": 0.3, "learning_rate": 3.493200612450605e-05, "loss": 2.3382, "step": 172810 }, { "epoch": 0.3, "learning_rate": 3.493113418457922e-05, "loss": 2.4919, "step": 172820 }, { "epoch": 0.3, "learning_rate": 3.49302622446524e-05, "loss": 2.3415, "step": 172830 }, { "epoch": 0.3, "learning_rate": 3.492939030472557e-05, "loss": 2.3312, "step": 172840 }, { "epoch": 0.3, "learning_rate": 3.492851836479874e-05, "loss": 2.4628, "step": 172850 }, { "epoch": 0.3, "learning_rate": 3.492764642487191e-05, "loss": 2.3773, "step": 172860 }, { "epoch": 0.3, "learning_rate": 3.4926774484945086e-05, "loss": 2.4302, "step": 172870 }, { "epoch": 0.3, "learning_rate": 3.492590254501826e-05, "loss": 2.4348, "step": 172880 }, { "epoch": 0.3, "learning_rate": 3.4925030605091434e-05, "loss": 2.504, "step": 172890 }, { "epoch": 0.3, "learning_rate": 3.492415866516461e-05, "loss": 2.4739, "step": 172900 }, { "epoch": 0.3, "learning_rate": 3.492328672523778e-05, "loss": 2.4738, "step": 172910 }, { "epoch": 0.3, "learning_rate": 3.492241478531095e-05, "loss": 2.4861, "step": 172920 }, { "epoch": 0.3, "learning_rate": 3.492154284538412e-05, "loss": 2.465, "step": 172930 }, { "epoch": 0.3, "learning_rate": 3.49206709054573e-05, "loss": 2.5145, "step": 172940 }, { "epoch": 0.3, "learning_rate": 3.491979896553047e-05, "loss": 2.4295, "step": 172950 }, { "epoch": 0.3, "learning_rate": 3.491892702560365e-05, "loss": 2.4914, "step": 172960 }, { "epoch": 0.3, "learning_rate": 3.491805508567682e-05, "loss": 2.444, "step": 172970 }, { "epoch": 0.3, "learning_rate": 3.4917183145749995e-05, "loss": 2.5587, "step": 172980 }, { "epoch": 0.3, "learning_rate": 3.4916311205823165e-05, "loss": 2.5549, "step": 172990 }, { "epoch": 0.3, "learning_rate": 3.4915439265896335e-05, "loss": 2.4583, "step": 173000 }, { "epoch": 0.3, "learning_rate": 3.491456732596951e-05, "loss": 2.3826, "step": 173010 }, { "epoch": 0.3, "learning_rate": 3.491369538604268e-05, "loss": 2.4852, "step": 173020 }, { "epoch": 0.3, "learning_rate": 3.491282344611585e-05, "loss": 2.4781, "step": 173030 }, { "epoch": 0.3, "learning_rate": 3.491195150618903e-05, "loss": 2.472, "step": 173040 }, { "epoch": 0.3, "learning_rate": 3.491107956626221e-05, "loss": 2.484, "step": 173050 }, { "epoch": 0.3, "learning_rate": 3.491020762633538e-05, "loss": 2.2318, "step": 173060 }, { "epoch": 0.3, "learning_rate": 3.490933568640855e-05, "loss": 2.4088, "step": 173070 }, { "epoch": 0.3, "learning_rate": 3.4908463746481725e-05, "loss": 2.5226, "step": 173080 }, { "epoch": 0.3, "learning_rate": 3.4907591806554896e-05, "loss": 2.3705, "step": 173090 }, { "epoch": 0.3, "learning_rate": 3.4906719866628066e-05, "loss": 2.5224, "step": 173100 }, { "epoch": 0.3, "learning_rate": 3.490584792670124e-05, "loss": 2.392, "step": 173110 }, { "epoch": 0.3, "learning_rate": 3.490497598677442e-05, "loss": 2.3669, "step": 173120 }, { "epoch": 0.3, "learning_rate": 3.490410404684759e-05, "loss": 2.4271, "step": 173130 }, { "epoch": 0.3, "learning_rate": 3.490323210692076e-05, "loss": 2.5656, "step": 173140 }, { "epoch": 0.3, "learning_rate": 3.490236016699394e-05, "loss": 2.3506, "step": 173150 }, { "epoch": 0.3, "learning_rate": 3.490148822706711e-05, "loss": 2.5092, "step": 173160 }, { "epoch": 0.3, "learning_rate": 3.490061628714028e-05, "loss": 2.4334, "step": 173170 }, { "epoch": 0.3, "learning_rate": 3.4899744347213456e-05, "loss": 2.5404, "step": 173180 }, { "epoch": 0.3, "learning_rate": 3.4898872407286634e-05, "loss": 2.4191, "step": 173190 }, { "epoch": 0.3, "learning_rate": 3.4898000467359804e-05, "loss": 2.417, "step": 173200 }, { "epoch": 0.3, "learning_rate": 3.4897128527432974e-05, "loss": 2.4899, "step": 173210 }, { "epoch": 0.3, "learning_rate": 3.489625658750615e-05, "loss": 2.4811, "step": 173220 }, { "epoch": 0.3, "learning_rate": 3.489538464757932e-05, "loss": 2.3615, "step": 173230 }, { "epoch": 0.3, "learning_rate": 3.489451270765249e-05, "loss": 2.5496, "step": 173240 }, { "epoch": 0.3, "learning_rate": 3.489364076772567e-05, "loss": 2.4099, "step": 173250 }, { "epoch": 0.3, "learning_rate": 3.4892768827798847e-05, "loss": 2.5481, "step": 173260 }, { "epoch": 0.3, "learning_rate": 3.489189688787202e-05, "loss": 2.4822, "step": 173270 }, { "epoch": 0.3, "learning_rate": 3.489102494794519e-05, "loss": 2.4966, "step": 173280 }, { "epoch": 0.3, "learning_rate": 3.4890153008018364e-05, "loss": 2.5644, "step": 173290 }, { "epoch": 0.3, "learning_rate": 3.4889281068091535e-05, "loss": 2.4028, "step": 173300 }, { "epoch": 0.3, "learning_rate": 3.4888409128164705e-05, "loss": 2.4477, "step": 173310 }, { "epoch": 0.3, "learning_rate": 3.4887537188237876e-05, "loss": 2.5061, "step": 173320 }, { "epoch": 0.3, "learning_rate": 3.488666524831106e-05, "loss": 2.3554, "step": 173330 }, { "epoch": 0.3, "learning_rate": 3.488579330838423e-05, "loss": 2.5149, "step": 173340 }, { "epoch": 0.3, "learning_rate": 3.48849213684574e-05, "loss": 2.4374, "step": 173350 }, { "epoch": 0.3, "learning_rate": 3.488404942853058e-05, "loss": 2.2803, "step": 173360 }, { "epoch": 0.3, "learning_rate": 3.488317748860375e-05, "loss": 2.4691, "step": 173370 }, { "epoch": 0.3, "learning_rate": 3.488230554867692e-05, "loss": 2.2296, "step": 173380 }, { "epoch": 0.3, "learning_rate": 3.488143360875009e-05, "loss": 2.4108, "step": 173390 }, { "epoch": 0.3, "learning_rate": 3.4880561668823266e-05, "loss": 2.4885, "step": 173400 }, { "epoch": 0.3, "learning_rate": 3.487968972889644e-05, "loss": 2.5633, "step": 173410 }, { "epoch": 0.3, "learning_rate": 3.487881778896961e-05, "loss": 2.5516, "step": 173420 }, { "epoch": 0.3, "learning_rate": 3.4877945849042784e-05, "loss": 2.4711, "step": 173430 }, { "epoch": 0.3, "learning_rate": 3.487707390911596e-05, "loss": 2.4092, "step": 173440 }, { "epoch": 0.3, "learning_rate": 3.487620196918913e-05, "loss": 2.5631, "step": 173450 }, { "epoch": 0.3, "learning_rate": 3.48753300292623e-05, "loss": 2.4351, "step": 173460 }, { "epoch": 0.3, "learning_rate": 3.487445808933548e-05, "loss": 2.355, "step": 173470 }, { "epoch": 0.3, "learning_rate": 3.4873586149408656e-05, "loss": 2.5041, "step": 173480 }, { "epoch": 0.3, "learning_rate": 3.4872714209481826e-05, "loss": 2.4566, "step": 173490 }, { "epoch": 0.3, "learning_rate": 3.4871842269555e-05, "loss": 2.4446, "step": 173500 }, { "epoch": 0.3, "learning_rate": 3.4870970329628174e-05, "loss": 2.3408, "step": 173510 }, { "epoch": 0.3, "learning_rate": 3.4870098389701344e-05, "loss": 2.4805, "step": 173520 }, { "epoch": 0.3, "learning_rate": 3.4869226449774515e-05, "loss": 2.4147, "step": 173530 }, { "epoch": 0.3, "learning_rate": 3.486835450984769e-05, "loss": 2.4256, "step": 173540 }, { "epoch": 0.3, "learning_rate": 3.486748256992086e-05, "loss": 2.5505, "step": 173550 }, { "epoch": 0.3, "learning_rate": 3.486661062999404e-05, "loss": 2.3998, "step": 173560 }, { "epoch": 0.3, "learning_rate": 3.486573869006721e-05, "loss": 2.3542, "step": 173570 }, { "epoch": 0.3, "learning_rate": 3.486486675014039e-05, "loss": 2.4336, "step": 173580 }, { "epoch": 0.3, "learning_rate": 3.486399481021356e-05, "loss": 2.5114, "step": 173590 }, { "epoch": 0.3, "learning_rate": 3.486312287028673e-05, "loss": 2.3971, "step": 173600 }, { "epoch": 0.3, "learning_rate": 3.4862250930359905e-05, "loss": 2.4421, "step": 173610 }, { "epoch": 0.3, "learning_rate": 3.4861378990433075e-05, "loss": 2.4251, "step": 173620 }, { "epoch": 0.3, "learning_rate": 3.486050705050625e-05, "loss": 2.3288, "step": 173630 }, { "epoch": 0.3, "learning_rate": 3.485963511057942e-05, "loss": 2.3257, "step": 173640 }, { "epoch": 0.3, "learning_rate": 3.48587631706526e-05, "loss": 2.613, "step": 173650 }, { "epoch": 0.3, "learning_rate": 3.485789123072577e-05, "loss": 2.586, "step": 173660 }, { "epoch": 0.3, "learning_rate": 3.485701929079894e-05, "loss": 2.4779, "step": 173670 }, { "epoch": 0.3, "learning_rate": 3.485614735087212e-05, "loss": 2.4202, "step": 173680 }, { "epoch": 0.3, "learning_rate": 3.485527541094529e-05, "loss": 2.4837, "step": 173690 }, { "epoch": 0.3, "learning_rate": 3.485440347101846e-05, "loss": 2.3195, "step": 173700 }, { "epoch": 0.3, "learning_rate": 3.4853531531091636e-05, "loss": 2.4638, "step": 173710 }, { "epoch": 0.3, "learning_rate": 3.485265959116481e-05, "loss": 2.4716, "step": 173720 }, { "epoch": 0.3, "learning_rate": 3.485178765123798e-05, "loss": 2.3992, "step": 173730 }, { "epoch": 0.3, "learning_rate": 3.4850915711311154e-05, "loss": 2.5135, "step": 173740 }, { "epoch": 0.3, "learning_rate": 3.485004377138433e-05, "loss": 2.4338, "step": 173750 }, { "epoch": 0.3, "learning_rate": 3.48491718314575e-05, "loss": 2.3258, "step": 173760 }, { "epoch": 0.3, "learning_rate": 3.484829989153067e-05, "loss": 2.3267, "step": 173770 }, { "epoch": 0.3, "learning_rate": 3.484742795160385e-05, "loss": 2.569, "step": 173780 }, { "epoch": 0.3, "learning_rate": 3.4846556011677026e-05, "loss": 2.4554, "step": 173790 }, { "epoch": 0.3, "learning_rate": 3.4845684071750196e-05, "loss": 2.5476, "step": 173800 }, { "epoch": 0.3, "learning_rate": 3.4844812131823367e-05, "loss": 2.5154, "step": 173810 }, { "epoch": 0.3, "learning_rate": 3.484394019189654e-05, "loss": 2.353, "step": 173820 }, { "epoch": 0.3, "learning_rate": 3.4843068251969714e-05, "loss": 2.4405, "step": 173830 }, { "epoch": 0.3, "learning_rate": 3.4842196312042885e-05, "loss": 2.405, "step": 173840 }, { "epoch": 0.3, "learning_rate": 3.4841324372116055e-05, "loss": 2.4776, "step": 173850 }, { "epoch": 0.3, "learning_rate": 3.484045243218924e-05, "loss": 2.3168, "step": 173860 }, { "epoch": 0.3, "learning_rate": 3.483958049226241e-05, "loss": 2.4475, "step": 173870 }, { "epoch": 0.3, "learning_rate": 3.483870855233558e-05, "loss": 2.4341, "step": 173880 }, { "epoch": 0.3, "learning_rate": 3.483783661240875e-05, "loss": 2.4252, "step": 173890 }, { "epoch": 0.3, "learning_rate": 3.483696467248193e-05, "loss": 2.4537, "step": 173900 }, { "epoch": 0.3, "learning_rate": 3.48360927325551e-05, "loss": 2.4927, "step": 173910 }, { "epoch": 0.3, "learning_rate": 3.483522079262827e-05, "loss": 2.5147, "step": 173920 }, { "epoch": 0.3, "learning_rate": 3.4834348852701445e-05, "loss": 2.4302, "step": 173930 }, { "epoch": 0.3, "learning_rate": 3.483347691277462e-05, "loss": 2.4615, "step": 173940 }, { "epoch": 0.3, "learning_rate": 3.483260497284779e-05, "loss": 2.5192, "step": 173950 }, { "epoch": 0.3, "learning_rate": 3.483173303292096e-05, "loss": 2.4314, "step": 173960 }, { "epoch": 0.3, "learning_rate": 3.483086109299414e-05, "loss": 2.4989, "step": 173970 }, { "epoch": 0.3, "learning_rate": 3.482998915306731e-05, "loss": 2.5497, "step": 173980 }, { "epoch": 0.3, "learning_rate": 3.482911721314048e-05, "loss": 2.5144, "step": 173990 }, { "epoch": 0.3, "learning_rate": 3.482824527321366e-05, "loss": 2.4828, "step": 174000 }, { "epoch": 0.3, "learning_rate": 3.4827373333286835e-05, "loss": 2.5554, "step": 174010 }, { "epoch": 0.3, "learning_rate": 3.4826501393360006e-05, "loss": 2.374, "step": 174020 }, { "epoch": 0.3, "learning_rate": 3.4825629453433176e-05, "loss": 2.4285, "step": 174030 }, { "epoch": 0.3, "learning_rate": 3.482475751350635e-05, "loss": 2.363, "step": 174040 }, { "epoch": 0.3, "learning_rate": 3.4823885573579524e-05, "loss": 2.5932, "step": 174050 }, { "epoch": 0.3, "learning_rate": 3.4823013633652694e-05, "loss": 2.4809, "step": 174060 }, { "epoch": 0.3, "learning_rate": 3.482214169372587e-05, "loss": 2.4399, "step": 174070 }, { "epoch": 0.3, "learning_rate": 3.482126975379905e-05, "loss": 2.4875, "step": 174080 }, { "epoch": 0.3, "learning_rate": 3.482039781387222e-05, "loss": 2.4083, "step": 174090 }, { "epoch": 0.3, "learning_rate": 3.481952587394539e-05, "loss": 2.4835, "step": 174100 }, { "epoch": 0.3, "learning_rate": 3.4818653934018566e-05, "loss": 2.4701, "step": 174110 }, { "epoch": 0.3, "learning_rate": 3.4817781994091737e-05, "loss": 2.4823, "step": 174120 }, { "epoch": 0.3, "learning_rate": 3.481691005416491e-05, "loss": 2.479, "step": 174130 }, { "epoch": 0.3, "learning_rate": 3.4816038114238084e-05, "loss": 2.3501, "step": 174140 }, { "epoch": 0.3, "learning_rate": 3.481516617431126e-05, "loss": 2.4484, "step": 174150 }, { "epoch": 0.3, "learning_rate": 3.481429423438443e-05, "loss": 2.4404, "step": 174160 }, { "epoch": 0.3, "learning_rate": 3.48134222944576e-05, "loss": 2.4419, "step": 174170 }, { "epoch": 0.3, "learning_rate": 3.481255035453078e-05, "loss": 2.5225, "step": 174180 }, { "epoch": 0.3, "learning_rate": 3.481167841460395e-05, "loss": 2.3593, "step": 174190 }, { "epoch": 0.3, "learning_rate": 3.481080647467712e-05, "loss": 2.4979, "step": 174200 }, { "epoch": 0.3, "learning_rate": 3.480993453475029e-05, "loss": 2.4331, "step": 174210 }, { "epoch": 0.3, "learning_rate": 3.480906259482347e-05, "loss": 2.5201, "step": 174220 }, { "epoch": 0.3, "learning_rate": 3.4808190654896645e-05, "loss": 2.3525, "step": 174230 }, { "epoch": 0.3, "learning_rate": 3.4807318714969815e-05, "loss": 2.3253, "step": 174240 }, { "epoch": 0.3, "learning_rate": 3.480644677504299e-05, "loss": 2.4275, "step": 174250 }, { "epoch": 0.3, "learning_rate": 3.480557483511616e-05, "loss": 2.4007, "step": 174260 }, { "epoch": 0.3, "learning_rate": 3.480470289518933e-05, "loss": 2.3693, "step": 174270 }, { "epoch": 0.3, "learning_rate": 3.48038309552625e-05, "loss": 2.524, "step": 174280 }, { "epoch": 0.3, "learning_rate": 3.480295901533568e-05, "loss": 2.5016, "step": 174290 }, { "epoch": 0.3, "learning_rate": 3.480208707540886e-05, "loss": 2.5021, "step": 174300 }, { "epoch": 0.3, "learning_rate": 3.480121513548203e-05, "loss": 2.4369, "step": 174310 }, { "epoch": 0.3, "learning_rate": 3.48003431955552e-05, "loss": 2.525, "step": 174320 }, { "epoch": 0.3, "learning_rate": 3.4799471255628376e-05, "loss": 2.3806, "step": 174330 }, { "epoch": 0.3, "learning_rate": 3.4798599315701546e-05, "loss": 2.5232, "step": 174340 }, { "epoch": 0.3, "learning_rate": 3.4797727375774716e-05, "loss": 2.4216, "step": 174350 }, { "epoch": 0.3, "learning_rate": 3.4796855435847893e-05, "loss": 2.5351, "step": 174360 }, { "epoch": 0.3, "learning_rate": 3.4795983495921064e-05, "loss": 2.4246, "step": 174370 }, { "epoch": 0.3, "learning_rate": 3.479511155599424e-05, "loss": 2.4667, "step": 174380 }, { "epoch": 0.3, "learning_rate": 3.479423961606741e-05, "loss": 2.4235, "step": 174390 }, { "epoch": 0.3, "learning_rate": 3.479336767614059e-05, "loss": 2.4986, "step": 174400 }, { "epoch": 0.3, "learning_rate": 3.479249573621376e-05, "loss": 2.5107, "step": 174410 }, { "epoch": 0.3, "learning_rate": 3.479162379628693e-05, "loss": 2.5386, "step": 174420 }, { "epoch": 0.3, "learning_rate": 3.4790751856360106e-05, "loss": 2.5733, "step": 174430 }, { "epoch": 0.3, "learning_rate": 3.478987991643328e-05, "loss": 2.4199, "step": 174440 }, { "epoch": 0.3, "learning_rate": 3.4789007976506454e-05, "loss": 2.3961, "step": 174450 }, { "epoch": 0.3, "learning_rate": 3.4788136036579624e-05, "loss": 2.4946, "step": 174460 }, { "epoch": 0.3, "learning_rate": 3.47872640966528e-05, "loss": 2.4838, "step": 174470 }, { "epoch": 0.3, "learning_rate": 3.478639215672597e-05, "loss": 2.4738, "step": 174480 }, { "epoch": 0.3, "learning_rate": 3.478552021679914e-05, "loss": 2.4961, "step": 174490 }, { "epoch": 0.3, "learning_rate": 3.478464827687232e-05, "loss": 2.469, "step": 174500 }, { "epoch": 0.3, "learning_rate": 3.478377633694549e-05, "loss": 2.4876, "step": 174510 }, { "epoch": 0.3, "learning_rate": 3.478290439701867e-05, "loss": 2.5279, "step": 174520 }, { "epoch": 0.3, "learning_rate": 3.478203245709184e-05, "loss": 2.4916, "step": 174530 }, { "epoch": 0.3, "learning_rate": 3.4781160517165015e-05, "loss": 2.4571, "step": 174540 }, { "epoch": 0.3, "learning_rate": 3.4780288577238185e-05, "loss": 2.4274, "step": 174550 }, { "epoch": 0.3, "learning_rate": 3.4779416637311355e-05, "loss": 2.4681, "step": 174560 }, { "epoch": 0.3, "learning_rate": 3.477854469738453e-05, "loss": 2.4727, "step": 174570 }, { "epoch": 0.3, "learning_rate": 3.47776727574577e-05, "loss": 2.3817, "step": 174580 }, { "epoch": 0.3, "learning_rate": 3.477680081753087e-05, "loss": 2.5025, "step": 174590 }, { "epoch": 0.3, "learning_rate": 3.477592887760405e-05, "loss": 2.4287, "step": 174600 }, { "epoch": 0.3, "learning_rate": 3.477505693767723e-05, "loss": 2.4456, "step": 174610 }, { "epoch": 0.3, "learning_rate": 3.47741849977504e-05, "loss": 2.5446, "step": 174620 }, { "epoch": 0.3, "learning_rate": 3.477331305782357e-05, "loss": 2.5698, "step": 174630 }, { "epoch": 0.3, "learning_rate": 3.4772441117896745e-05, "loss": 2.5314, "step": 174640 }, { "epoch": 0.3, "learning_rate": 3.4771569177969916e-05, "loss": 2.4314, "step": 174650 }, { "epoch": 0.3, "learning_rate": 3.4770697238043086e-05, "loss": 2.5183, "step": 174660 }, { "epoch": 0.3, "learning_rate": 3.476982529811626e-05, "loss": 2.5006, "step": 174670 }, { "epoch": 0.3, "learning_rate": 3.476895335818944e-05, "loss": 2.3844, "step": 174680 }, { "epoch": 0.3, "learning_rate": 3.476808141826261e-05, "loss": 2.5086, "step": 174690 }, { "epoch": 0.3, "learning_rate": 3.476720947833578e-05, "loss": 2.4865, "step": 174700 }, { "epoch": 0.3, "learning_rate": 3.476633753840896e-05, "loss": 2.3941, "step": 174710 }, { "epoch": 0.3, "learning_rate": 3.476546559848213e-05, "loss": 2.4696, "step": 174720 }, { "epoch": 0.3, "learning_rate": 3.47645936585553e-05, "loss": 2.4036, "step": 174730 }, { "epoch": 0.3, "learning_rate": 3.476372171862847e-05, "loss": 2.3725, "step": 174740 }, { "epoch": 0.3, "learning_rate": 3.4762849778701654e-05, "loss": 2.4611, "step": 174750 }, { "epoch": 0.3, "learning_rate": 3.4761977838774824e-05, "loss": 2.3847, "step": 174760 }, { "epoch": 0.3, "learning_rate": 3.4761105898847994e-05, "loss": 2.559, "step": 174770 }, { "epoch": 0.3, "learning_rate": 3.4760233958921165e-05, "loss": 2.4422, "step": 174780 }, { "epoch": 0.3, "learning_rate": 3.475936201899434e-05, "loss": 2.5638, "step": 174790 }, { "epoch": 0.3, "learning_rate": 3.475849007906751e-05, "loss": 2.5028, "step": 174800 }, { "epoch": 0.3, "learning_rate": 3.475761813914068e-05, "loss": 2.532, "step": 174810 }, { "epoch": 0.3, "learning_rate": 3.4756746199213867e-05, "loss": 2.2778, "step": 174820 }, { "epoch": 0.3, "learning_rate": 3.475587425928704e-05, "loss": 2.4432, "step": 174830 }, { "epoch": 0.3, "learning_rate": 3.475500231936021e-05, "loss": 2.5242, "step": 174840 }, { "epoch": 0.3, "learning_rate": 3.475413037943338e-05, "loss": 2.3776, "step": 174850 }, { "epoch": 0.3, "learning_rate": 3.4753258439506555e-05, "loss": 2.5092, "step": 174860 }, { "epoch": 0.3, "learning_rate": 3.4752386499579725e-05, "loss": 2.3722, "step": 174870 }, { "epoch": 0.3, "learning_rate": 3.4751514559652896e-05, "loss": 2.491, "step": 174880 }, { "epoch": 0.3, "learning_rate": 3.475064261972607e-05, "loss": 2.5153, "step": 174890 }, { "epoch": 0.31, "learning_rate": 3.474977067979925e-05, "loss": 2.5439, "step": 174900 }, { "epoch": 0.31, "learning_rate": 3.474889873987242e-05, "loss": 2.4165, "step": 174910 }, { "epoch": 0.31, "learning_rate": 3.474802679994559e-05, "loss": 2.4636, "step": 174920 }, { "epoch": 0.31, "learning_rate": 3.474715486001877e-05, "loss": 2.4366, "step": 174930 }, { "epoch": 0.31, "learning_rate": 3.474628292009194e-05, "loss": 2.3586, "step": 174940 }, { "epoch": 0.31, "learning_rate": 3.474541098016511e-05, "loss": 2.4234, "step": 174950 }, { "epoch": 0.31, "learning_rate": 3.4744539040238286e-05, "loss": 2.4701, "step": 174960 }, { "epoch": 0.31, "learning_rate": 3.474366710031146e-05, "loss": 2.458, "step": 174970 }, { "epoch": 0.31, "learning_rate": 3.474279516038463e-05, "loss": 2.4575, "step": 174980 }, { "epoch": 0.31, "learning_rate": 3.4741923220457804e-05, "loss": 2.4922, "step": 174990 }, { "epoch": 0.31, "learning_rate": 3.474105128053098e-05, "loss": 2.5298, "step": 175000 }, { "epoch": 0.31, "learning_rate": 3.474017934060415e-05, "loss": 2.4862, "step": 175010 }, { "epoch": 0.31, "learning_rate": 3.473930740067732e-05, "loss": 2.3974, "step": 175020 }, { "epoch": 0.31, "learning_rate": 3.47384354607505e-05, "loss": 2.5298, "step": 175030 }, { "epoch": 0.31, "learning_rate": 3.473756352082367e-05, "loss": 2.507, "step": 175040 }, { "epoch": 0.31, "learning_rate": 3.4736691580896846e-05, "loss": 2.4723, "step": 175050 }, { "epoch": 0.31, "learning_rate": 3.473581964097002e-05, "loss": 2.3929, "step": 175060 }, { "epoch": 0.31, "learning_rate": 3.4734947701043194e-05, "loss": 2.4837, "step": 175070 }, { "epoch": 0.31, "learning_rate": 3.4734075761116364e-05, "loss": 2.4299, "step": 175080 }, { "epoch": 0.31, "learning_rate": 3.4733203821189535e-05, "loss": 2.3951, "step": 175090 }, { "epoch": 0.31, "learning_rate": 3.473233188126271e-05, "loss": 2.4494, "step": 175100 }, { "epoch": 0.31, "learning_rate": 3.473145994133588e-05, "loss": 2.4101, "step": 175110 }, { "epoch": 0.31, "learning_rate": 3.473058800140906e-05, "loss": 2.3644, "step": 175120 }, { "epoch": 0.31, "learning_rate": 3.472971606148223e-05, "loss": 2.3514, "step": 175130 }, { "epoch": 0.31, "learning_rate": 3.472884412155541e-05, "loss": 2.4023, "step": 175140 }, { "epoch": 0.31, "learning_rate": 3.472797218162858e-05, "loss": 2.4909, "step": 175150 }, { "epoch": 0.31, "learning_rate": 3.472710024170175e-05, "loss": 2.3896, "step": 175160 }, { "epoch": 0.31, "learning_rate": 3.472622830177492e-05, "loss": 2.3426, "step": 175170 }, { "epoch": 0.31, "learning_rate": 3.4725356361848095e-05, "loss": 2.4574, "step": 175180 }, { "epoch": 0.31, "learning_rate": 3.472448442192127e-05, "loss": 2.3787, "step": 175190 }, { "epoch": 0.31, "learning_rate": 3.472361248199444e-05, "loss": 2.5224, "step": 175200 }, { "epoch": 0.31, "learning_rate": 3.472274054206762e-05, "loss": 2.3911, "step": 175210 }, { "epoch": 0.31, "learning_rate": 3.472186860214079e-05, "loss": 2.4904, "step": 175220 }, { "epoch": 0.31, "learning_rate": 3.472099666221396e-05, "loss": 2.391, "step": 175230 }, { "epoch": 0.31, "learning_rate": 3.472012472228713e-05, "loss": 2.4988, "step": 175240 }, { "epoch": 0.31, "learning_rate": 3.471925278236031e-05, "loss": 2.3873, "step": 175250 }, { "epoch": 0.31, "learning_rate": 3.471838084243348e-05, "loss": 2.4731, "step": 175260 }, { "epoch": 0.31, "learning_rate": 3.4717508902506656e-05, "loss": 2.4042, "step": 175270 }, { "epoch": 0.31, "learning_rate": 3.4716636962579826e-05, "loss": 2.4563, "step": 175280 }, { "epoch": 0.31, "learning_rate": 3.4715765022653e-05, "loss": 2.384, "step": 175290 }, { "epoch": 0.31, "learning_rate": 3.4714893082726174e-05, "loss": 2.3981, "step": 175300 }, { "epoch": 0.31, "learning_rate": 3.4714021142799344e-05, "loss": 2.5356, "step": 175310 }, { "epoch": 0.31, "learning_rate": 3.471314920287252e-05, "loss": 2.4311, "step": 175320 }, { "epoch": 0.31, "learning_rate": 3.471227726294569e-05, "loss": 2.515, "step": 175330 }, { "epoch": 0.31, "learning_rate": 3.471140532301887e-05, "loss": 2.5068, "step": 175340 }, { "epoch": 0.31, "learning_rate": 3.471053338309204e-05, "loss": 2.4462, "step": 175350 }, { "epoch": 0.31, "learning_rate": 3.4709661443165216e-05, "loss": 2.5589, "step": 175360 }, { "epoch": 0.31, "learning_rate": 3.4708789503238387e-05, "loss": 2.4457, "step": 175370 }, { "epoch": 0.31, "learning_rate": 3.470791756331156e-05, "loss": 2.4681, "step": 175380 }, { "epoch": 0.31, "learning_rate": 3.4707045623384734e-05, "loss": 2.4073, "step": 175390 }, { "epoch": 0.31, "learning_rate": 3.4706173683457905e-05, "loss": 2.3495, "step": 175400 }, { "epoch": 0.31, "learning_rate": 3.4705301743531075e-05, "loss": 2.296, "step": 175410 }, { "epoch": 0.31, "learning_rate": 3.470442980360425e-05, "loss": 2.4465, "step": 175420 }, { "epoch": 0.31, "learning_rate": 3.470355786367743e-05, "loss": 2.429, "step": 175430 }, { "epoch": 0.31, "learning_rate": 3.47026859237506e-05, "loss": 2.439, "step": 175440 }, { "epoch": 0.31, "learning_rate": 3.470181398382377e-05, "loss": 2.4023, "step": 175450 }, { "epoch": 0.31, "learning_rate": 3.470094204389695e-05, "loss": 2.4124, "step": 175460 }, { "epoch": 0.31, "learning_rate": 3.470007010397012e-05, "loss": 2.4838, "step": 175470 }, { "epoch": 0.31, "learning_rate": 3.469919816404329e-05, "loss": 2.4952, "step": 175480 }, { "epoch": 0.31, "learning_rate": 3.4698326224116465e-05, "loss": 2.4994, "step": 175490 }, { "epoch": 0.31, "learning_rate": 3.469745428418964e-05, "loss": 2.463, "step": 175500 }, { "epoch": 0.31, "learning_rate": 3.469658234426281e-05, "loss": 2.4003, "step": 175510 }, { "epoch": 0.31, "learning_rate": 3.469571040433598e-05, "loss": 2.4021, "step": 175520 }, { "epoch": 0.31, "learning_rate": 3.469483846440916e-05, "loss": 2.479, "step": 175530 }, { "epoch": 0.31, "learning_rate": 3.469396652448233e-05, "loss": 2.4018, "step": 175540 }, { "epoch": 0.31, "learning_rate": 3.46930945845555e-05, "loss": 2.4388, "step": 175550 }, { "epoch": 0.31, "learning_rate": 3.469222264462867e-05, "loss": 2.4173, "step": 175560 }, { "epoch": 0.31, "learning_rate": 3.4691350704701855e-05, "loss": 2.5095, "step": 175570 }, { "epoch": 0.31, "learning_rate": 3.4690478764775026e-05, "loss": 2.4909, "step": 175580 }, { "epoch": 0.31, "learning_rate": 3.4689606824848196e-05, "loss": 2.5051, "step": 175590 }, { "epoch": 0.31, "learning_rate": 3.468873488492137e-05, "loss": 2.4509, "step": 175600 }, { "epoch": 0.31, "learning_rate": 3.4687862944994544e-05, "loss": 2.4873, "step": 175610 }, { "epoch": 0.31, "learning_rate": 3.4686991005067714e-05, "loss": 2.2958, "step": 175620 }, { "epoch": 0.31, "learning_rate": 3.4686119065140884e-05, "loss": 2.3316, "step": 175630 }, { "epoch": 0.31, "learning_rate": 3.468524712521407e-05, "loss": 2.5188, "step": 175640 }, { "epoch": 0.31, "learning_rate": 3.468437518528724e-05, "loss": 2.4654, "step": 175650 }, { "epoch": 0.31, "learning_rate": 3.468350324536041e-05, "loss": 2.4817, "step": 175660 }, { "epoch": 0.31, "learning_rate": 3.468263130543358e-05, "loss": 2.3804, "step": 175670 }, { "epoch": 0.31, "learning_rate": 3.4681759365506757e-05, "loss": 2.4678, "step": 175680 }, { "epoch": 0.31, "learning_rate": 3.468088742557993e-05, "loss": 2.3927, "step": 175690 }, { "epoch": 0.31, "learning_rate": 3.46800154856531e-05, "loss": 2.4953, "step": 175700 }, { "epoch": 0.31, "learning_rate": 3.4679143545726274e-05, "loss": 2.4123, "step": 175710 }, { "epoch": 0.31, "learning_rate": 3.467827160579945e-05, "loss": 2.4909, "step": 175720 }, { "epoch": 0.31, "learning_rate": 3.467739966587262e-05, "loss": 2.3377, "step": 175730 }, { "epoch": 0.31, "learning_rate": 3.467652772594579e-05, "loss": 2.4691, "step": 175740 }, { "epoch": 0.31, "learning_rate": 3.467565578601897e-05, "loss": 2.4052, "step": 175750 }, { "epoch": 0.31, "learning_rate": 3.467478384609214e-05, "loss": 2.4771, "step": 175760 }, { "epoch": 0.31, "learning_rate": 3.467391190616531e-05, "loss": 2.5331, "step": 175770 }, { "epoch": 0.31, "learning_rate": 3.467303996623849e-05, "loss": 2.5493, "step": 175780 }, { "epoch": 0.31, "learning_rate": 3.4672168026311665e-05, "loss": 2.5149, "step": 175790 }, { "epoch": 0.31, "learning_rate": 3.4671296086384835e-05, "loss": 2.416, "step": 175800 }, { "epoch": 0.31, "learning_rate": 3.4670424146458005e-05, "loss": 2.3879, "step": 175810 }, { "epoch": 0.31, "learning_rate": 3.466955220653118e-05, "loss": 2.4943, "step": 175820 }, { "epoch": 0.31, "learning_rate": 3.466868026660435e-05, "loss": 2.5891, "step": 175830 }, { "epoch": 0.31, "learning_rate": 3.466780832667752e-05, "loss": 2.3969, "step": 175840 }, { "epoch": 0.31, "learning_rate": 3.46669363867507e-05, "loss": 2.4807, "step": 175850 }, { "epoch": 0.31, "learning_rate": 3.466606444682388e-05, "loss": 2.3174, "step": 175860 }, { "epoch": 0.31, "learning_rate": 3.466519250689705e-05, "loss": 2.3968, "step": 175870 }, { "epoch": 0.31, "learning_rate": 3.466432056697022e-05, "loss": 2.4663, "step": 175880 }, { "epoch": 0.31, "learning_rate": 3.4663448627043396e-05, "loss": 2.4311, "step": 175890 }, { "epoch": 0.31, "learning_rate": 3.4662576687116566e-05, "loss": 2.5489, "step": 175900 }, { "epoch": 0.31, "learning_rate": 3.4661704747189736e-05, "loss": 2.3934, "step": 175910 }, { "epoch": 0.31, "learning_rate": 3.4660832807262913e-05, "loss": 2.3865, "step": 175920 }, { "epoch": 0.31, "learning_rate": 3.4659960867336084e-05, "loss": 2.2773, "step": 175930 }, { "epoch": 0.31, "learning_rate": 3.465908892740926e-05, "loss": 2.501, "step": 175940 }, { "epoch": 0.31, "learning_rate": 3.465821698748243e-05, "loss": 2.4966, "step": 175950 }, { "epoch": 0.31, "learning_rate": 3.465734504755561e-05, "loss": 2.4709, "step": 175960 }, { "epoch": 0.31, "learning_rate": 3.465647310762878e-05, "loss": 2.4808, "step": 175970 }, { "epoch": 0.31, "learning_rate": 3.465560116770195e-05, "loss": 2.3991, "step": 175980 }, { "epoch": 0.31, "learning_rate": 3.4654729227775126e-05, "loss": 2.3801, "step": 175990 }, { "epoch": 0.31, "learning_rate": 3.46538572878483e-05, "loss": 2.4486, "step": 176000 }, { "epoch": 0.31, "learning_rate": 3.4652985347921474e-05, "loss": 2.5249, "step": 176010 }, { "epoch": 0.31, "learning_rate": 3.4652113407994644e-05, "loss": 2.4286, "step": 176020 }, { "epoch": 0.31, "learning_rate": 3.465124146806782e-05, "loss": 2.4907, "step": 176030 }, { "epoch": 0.31, "learning_rate": 3.465036952814099e-05, "loss": 2.4314, "step": 176040 }, { "epoch": 0.31, "learning_rate": 3.464949758821416e-05, "loss": 2.3974, "step": 176050 }, { "epoch": 0.31, "learning_rate": 3.464862564828734e-05, "loss": 2.4264, "step": 176060 }, { "epoch": 0.31, "learning_rate": 3.464775370836051e-05, "loss": 2.4542, "step": 176070 }, { "epoch": 0.31, "learning_rate": 3.464688176843368e-05, "loss": 2.2812, "step": 176080 }, { "epoch": 0.31, "learning_rate": 3.464600982850686e-05, "loss": 2.5055, "step": 176090 }, { "epoch": 0.31, "learning_rate": 3.4645137888580035e-05, "loss": 2.5393, "step": 176100 }, { "epoch": 0.31, "learning_rate": 3.4644265948653205e-05, "loss": 2.4789, "step": 176110 }, { "epoch": 0.31, "learning_rate": 3.4643394008726375e-05, "loss": 2.4033, "step": 176120 }, { "epoch": 0.31, "learning_rate": 3.4642522068799546e-05, "loss": 2.504, "step": 176130 }, { "epoch": 0.31, "learning_rate": 3.464165012887272e-05, "loss": 2.4328, "step": 176140 }, { "epoch": 0.31, "learning_rate": 3.464077818894589e-05, "loss": 2.4493, "step": 176150 }, { "epoch": 0.31, "learning_rate": 3.463990624901907e-05, "loss": 2.5134, "step": 176160 }, { "epoch": 0.31, "learning_rate": 3.463903430909225e-05, "loss": 2.4889, "step": 176170 }, { "epoch": 0.31, "learning_rate": 3.463816236916542e-05, "loss": 2.4257, "step": 176180 }, { "epoch": 0.31, "learning_rate": 3.463729042923859e-05, "loss": 2.3495, "step": 176190 }, { "epoch": 0.31, "learning_rate": 3.463641848931176e-05, "loss": 2.4787, "step": 176200 }, { "epoch": 0.31, "learning_rate": 3.4635546549384936e-05, "loss": 2.3976, "step": 176210 }, { "epoch": 0.31, "learning_rate": 3.4634674609458106e-05, "loss": 2.3269, "step": 176220 }, { "epoch": 0.31, "learning_rate": 3.4633802669531277e-05, "loss": 2.4284, "step": 176230 }, { "epoch": 0.31, "learning_rate": 3.4632930729604454e-05, "loss": 2.4397, "step": 176240 }, { "epoch": 0.31, "learning_rate": 3.463205878967763e-05, "loss": 2.4515, "step": 176250 }, { "epoch": 0.31, "learning_rate": 3.46311868497508e-05, "loss": 2.3573, "step": 176260 }, { "epoch": 0.31, "learning_rate": 3.463031490982397e-05, "loss": 2.2911, "step": 176270 }, { "epoch": 0.31, "learning_rate": 3.462944296989715e-05, "loss": 2.6332, "step": 176280 }, { "epoch": 0.31, "learning_rate": 3.462857102997032e-05, "loss": 2.3279, "step": 176290 }, { "epoch": 0.31, "learning_rate": 3.462769909004349e-05, "loss": 2.4828, "step": 176300 }, { "epoch": 0.31, "learning_rate": 3.462682715011667e-05, "loss": 2.3914, "step": 176310 }, { "epoch": 0.31, "learning_rate": 3.4625955210189844e-05, "loss": 2.4212, "step": 176320 }, { "epoch": 0.31, "learning_rate": 3.4625083270263014e-05, "loss": 2.3999, "step": 176330 }, { "epoch": 0.31, "learning_rate": 3.4624211330336185e-05, "loss": 2.4394, "step": 176340 }, { "epoch": 0.31, "learning_rate": 3.462333939040936e-05, "loss": 2.4594, "step": 176350 }, { "epoch": 0.31, "learning_rate": 3.462246745048253e-05, "loss": 2.4719, "step": 176360 }, { "epoch": 0.31, "learning_rate": 3.46215955105557e-05, "loss": 2.462, "step": 176370 }, { "epoch": 0.31, "learning_rate": 3.462072357062888e-05, "loss": 2.5107, "step": 176380 }, { "epoch": 0.31, "learning_rate": 3.461985163070206e-05, "loss": 2.3965, "step": 176390 }, { "epoch": 0.31, "learning_rate": 3.461897969077523e-05, "loss": 2.4677, "step": 176400 }, { "epoch": 0.31, "learning_rate": 3.46181077508484e-05, "loss": 2.3647, "step": 176410 }, { "epoch": 0.31, "learning_rate": 3.4617235810921575e-05, "loss": 2.421, "step": 176420 }, { "epoch": 0.31, "learning_rate": 3.4616363870994745e-05, "loss": 2.2811, "step": 176430 }, { "epoch": 0.31, "learning_rate": 3.4615491931067916e-05, "loss": 2.336, "step": 176440 }, { "epoch": 0.31, "learning_rate": 3.461461999114109e-05, "loss": 2.48, "step": 176450 }, { "epoch": 0.31, "learning_rate": 3.461374805121427e-05, "loss": 2.4977, "step": 176460 }, { "epoch": 0.31, "learning_rate": 3.461287611128744e-05, "loss": 2.4027, "step": 176470 }, { "epoch": 0.31, "learning_rate": 3.461200417136061e-05, "loss": 2.3477, "step": 176480 }, { "epoch": 0.31, "learning_rate": 3.461113223143379e-05, "loss": 2.5662, "step": 176490 }, { "epoch": 0.31, "learning_rate": 3.461026029150696e-05, "loss": 2.505, "step": 176500 }, { "epoch": 0.31, "learning_rate": 3.460938835158013e-05, "loss": 2.399, "step": 176510 }, { "epoch": 0.31, "learning_rate": 3.46085164116533e-05, "loss": 2.4818, "step": 176520 }, { "epoch": 0.31, "learning_rate": 3.460764447172648e-05, "loss": 2.386, "step": 176530 }, { "epoch": 0.31, "learning_rate": 3.460677253179965e-05, "loss": 2.4832, "step": 176540 }, { "epoch": 0.31, "learning_rate": 3.4605900591872824e-05, "loss": 2.3386, "step": 176550 }, { "epoch": 0.31, "learning_rate": 3.4605028651946e-05, "loss": 2.5109, "step": 176560 }, { "epoch": 0.31, "learning_rate": 3.460415671201917e-05, "loss": 2.4837, "step": 176570 }, { "epoch": 0.31, "learning_rate": 3.460328477209234e-05, "loss": 2.4303, "step": 176580 }, { "epoch": 0.31, "learning_rate": 3.460241283216551e-05, "loss": 2.4654, "step": 176590 }, { "epoch": 0.31, "learning_rate": 3.460154089223869e-05, "loss": 2.3725, "step": 176600 }, { "epoch": 0.31, "learning_rate": 3.4600668952311866e-05, "loss": 2.4561, "step": 176610 }, { "epoch": 0.31, "learning_rate": 3.459979701238504e-05, "loss": 2.593, "step": 176620 }, { "epoch": 0.31, "learning_rate": 3.459892507245821e-05, "loss": 2.448, "step": 176630 }, { "epoch": 0.31, "learning_rate": 3.4598053132531384e-05, "loss": 2.4317, "step": 176640 }, { "epoch": 0.31, "learning_rate": 3.4597181192604555e-05, "loss": 2.4625, "step": 176650 }, { "epoch": 0.31, "learning_rate": 3.4596309252677725e-05, "loss": 2.5161, "step": 176660 }, { "epoch": 0.31, "learning_rate": 3.45954373127509e-05, "loss": 2.4167, "step": 176670 }, { "epoch": 0.31, "learning_rate": 3.459456537282408e-05, "loss": 2.4126, "step": 176680 }, { "epoch": 0.31, "learning_rate": 3.459369343289725e-05, "loss": 2.4601, "step": 176690 }, { "epoch": 0.31, "learning_rate": 3.459282149297042e-05, "loss": 2.5293, "step": 176700 }, { "epoch": 0.31, "learning_rate": 3.45919495530436e-05, "loss": 2.3067, "step": 176710 }, { "epoch": 0.31, "learning_rate": 3.459107761311677e-05, "loss": 2.5347, "step": 176720 }, { "epoch": 0.31, "learning_rate": 3.459020567318994e-05, "loss": 2.4159, "step": 176730 }, { "epoch": 0.31, "learning_rate": 3.4589333733263115e-05, "loss": 2.3181, "step": 176740 }, { "epoch": 0.31, "learning_rate": 3.4588461793336286e-05, "loss": 2.443, "step": 176750 }, { "epoch": 0.31, "learning_rate": 3.458758985340946e-05, "loss": 2.3403, "step": 176760 }, { "epoch": 0.31, "learning_rate": 3.458671791348263e-05, "loss": 2.4158, "step": 176770 }, { "epoch": 0.31, "learning_rate": 3.458584597355581e-05, "loss": 2.4101, "step": 176780 }, { "epoch": 0.31, "learning_rate": 3.458497403362898e-05, "loss": 2.5524, "step": 176790 }, { "epoch": 0.31, "learning_rate": 3.458410209370215e-05, "loss": 2.4513, "step": 176800 }, { "epoch": 0.31, "learning_rate": 3.458323015377533e-05, "loss": 2.4213, "step": 176810 }, { "epoch": 0.31, "learning_rate": 3.45823582138485e-05, "loss": 2.3921, "step": 176820 }, { "epoch": 0.31, "learning_rate": 3.4581486273921676e-05, "loss": 2.5129, "step": 176830 }, { "epoch": 0.31, "learning_rate": 3.4580614333994846e-05, "loss": 2.3777, "step": 176840 }, { "epoch": 0.31, "learning_rate": 3.457974239406802e-05, "loss": 2.5096, "step": 176850 }, { "epoch": 0.31, "learning_rate": 3.4578870454141194e-05, "loss": 2.4708, "step": 176860 }, { "epoch": 0.31, "learning_rate": 3.4577998514214364e-05, "loss": 2.331, "step": 176870 }, { "epoch": 0.31, "learning_rate": 3.457712657428754e-05, "loss": 2.4943, "step": 176880 }, { "epoch": 0.31, "learning_rate": 3.457625463436071e-05, "loss": 2.4888, "step": 176890 }, { "epoch": 0.31, "learning_rate": 3.457538269443388e-05, "loss": 2.4724, "step": 176900 }, { "epoch": 0.31, "learning_rate": 3.457451075450706e-05, "loss": 2.3371, "step": 176910 }, { "epoch": 0.31, "learning_rate": 3.4573638814580236e-05, "loss": 2.5098, "step": 176920 }, { "epoch": 0.31, "learning_rate": 3.457276687465341e-05, "loss": 2.4303, "step": 176930 }, { "epoch": 0.31, "learning_rate": 3.457189493472658e-05, "loss": 2.5357, "step": 176940 }, { "epoch": 0.31, "learning_rate": 3.4571022994799754e-05, "loss": 2.4667, "step": 176950 }, { "epoch": 0.31, "learning_rate": 3.4570151054872925e-05, "loss": 2.3857, "step": 176960 }, { "epoch": 0.31, "learning_rate": 3.4569279114946095e-05, "loss": 2.5795, "step": 176970 }, { "epoch": 0.31, "learning_rate": 3.456840717501927e-05, "loss": 2.4464, "step": 176980 }, { "epoch": 0.31, "learning_rate": 3.456753523509245e-05, "loss": 2.5866, "step": 176990 }, { "epoch": 0.31, "learning_rate": 3.456666329516562e-05, "loss": 2.4656, "step": 177000 }, { "epoch": 0.31, "learning_rate": 3.456579135523879e-05, "loss": 2.5063, "step": 177010 }, { "epoch": 0.31, "learning_rate": 3.456491941531196e-05, "loss": 2.3609, "step": 177020 }, { "epoch": 0.31, "learning_rate": 3.456404747538514e-05, "loss": 2.4255, "step": 177030 }, { "epoch": 0.31, "learning_rate": 3.456317553545831e-05, "loss": 2.4608, "step": 177040 }, { "epoch": 0.31, "learning_rate": 3.4562303595531485e-05, "loss": 2.2851, "step": 177050 }, { "epoch": 0.31, "learning_rate": 3.456143165560466e-05, "loss": 2.4759, "step": 177060 }, { "epoch": 0.31, "learning_rate": 3.456055971567783e-05, "loss": 2.4174, "step": 177070 }, { "epoch": 0.31, "learning_rate": 3.4559687775751e-05, "loss": 2.5096, "step": 177080 }, { "epoch": 0.31, "learning_rate": 3.455881583582417e-05, "loss": 2.4195, "step": 177090 }, { "epoch": 0.31, "learning_rate": 3.455794389589735e-05, "loss": 2.5528, "step": 177100 }, { "epoch": 0.31, "learning_rate": 3.455707195597052e-05, "loss": 2.4368, "step": 177110 }, { "epoch": 0.31, "learning_rate": 3.455620001604369e-05, "loss": 2.4419, "step": 177120 }, { "epoch": 0.31, "learning_rate": 3.455532807611687e-05, "loss": 2.483, "step": 177130 }, { "epoch": 0.31, "learning_rate": 3.4554456136190046e-05, "loss": 2.5722, "step": 177140 }, { "epoch": 0.31, "learning_rate": 3.4553584196263216e-05, "loss": 2.5083, "step": 177150 }, { "epoch": 0.31, "learning_rate": 3.4552712256336386e-05, "loss": 2.5109, "step": 177160 }, { "epoch": 0.31, "learning_rate": 3.4551840316409564e-05, "loss": 2.4664, "step": 177170 }, { "epoch": 0.31, "learning_rate": 3.4550968376482734e-05, "loss": 2.4735, "step": 177180 }, { "epoch": 0.31, "learning_rate": 3.4550096436555904e-05, "loss": 2.5632, "step": 177190 }, { "epoch": 0.31, "learning_rate": 3.454922449662908e-05, "loss": 2.436, "step": 177200 }, { "epoch": 0.31, "learning_rate": 3.454835255670226e-05, "loss": 2.4984, "step": 177210 }, { "epoch": 0.31, "learning_rate": 3.454748061677543e-05, "loss": 2.4736, "step": 177220 }, { "epoch": 0.31, "learning_rate": 3.45466086768486e-05, "loss": 2.4547, "step": 177230 }, { "epoch": 0.31, "learning_rate": 3.4545736736921777e-05, "loss": 2.4207, "step": 177240 }, { "epoch": 0.31, "learning_rate": 3.454486479699495e-05, "loss": 2.2302, "step": 177250 }, { "epoch": 0.31, "learning_rate": 3.454399285706812e-05, "loss": 2.4443, "step": 177260 }, { "epoch": 0.31, "learning_rate": 3.4543120917141294e-05, "loss": 2.3802, "step": 177270 }, { "epoch": 0.31, "learning_rate": 3.454224897721447e-05, "loss": 2.4855, "step": 177280 }, { "epoch": 0.31, "learning_rate": 3.454137703728764e-05, "loss": 2.4569, "step": 177290 }, { "epoch": 0.31, "learning_rate": 3.454050509736081e-05, "loss": 2.5284, "step": 177300 }, { "epoch": 0.31, "learning_rate": 3.453963315743399e-05, "loss": 2.3929, "step": 177310 }, { "epoch": 0.31, "learning_rate": 3.453876121750716e-05, "loss": 2.5053, "step": 177320 }, { "epoch": 0.31, "learning_rate": 3.453788927758033e-05, "loss": 2.4229, "step": 177330 }, { "epoch": 0.31, "learning_rate": 3.453701733765351e-05, "loss": 2.5473, "step": 177340 }, { "epoch": 0.31, "learning_rate": 3.4536145397726685e-05, "loss": 2.4733, "step": 177350 }, { "epoch": 0.31, "learning_rate": 3.4535273457799855e-05, "loss": 2.379, "step": 177360 }, { "epoch": 0.31, "learning_rate": 3.4534401517873025e-05, "loss": 2.5046, "step": 177370 }, { "epoch": 0.31, "learning_rate": 3.45335295779462e-05, "loss": 2.2803, "step": 177380 }, { "epoch": 0.31, "learning_rate": 3.453265763801937e-05, "loss": 2.5086, "step": 177390 }, { "epoch": 0.31, "learning_rate": 3.453178569809254e-05, "loss": 2.4484, "step": 177400 }, { "epoch": 0.31, "learning_rate": 3.453091375816572e-05, "loss": 2.5267, "step": 177410 }, { "epoch": 0.31, "learning_rate": 3.453004181823889e-05, "loss": 2.4489, "step": 177420 }, { "epoch": 0.31, "learning_rate": 3.452916987831207e-05, "loss": 2.5536, "step": 177430 }, { "epoch": 0.31, "learning_rate": 3.452829793838524e-05, "loss": 2.4722, "step": 177440 }, { "epoch": 0.31, "learning_rate": 3.4527425998458416e-05, "loss": 2.3636, "step": 177450 }, { "epoch": 0.31, "learning_rate": 3.4526554058531586e-05, "loss": 2.4939, "step": 177460 }, { "epoch": 0.31, "learning_rate": 3.4525682118604756e-05, "loss": 2.4014, "step": 177470 }, { "epoch": 0.31, "learning_rate": 3.452481017867793e-05, "loss": 2.4997, "step": 177480 }, { "epoch": 0.31, "learning_rate": 3.4523938238751104e-05, "loss": 2.502, "step": 177490 }, { "epoch": 0.31, "learning_rate": 3.452306629882428e-05, "loss": 2.2767, "step": 177500 }, { "epoch": 0.31, "learning_rate": 3.452219435889745e-05, "loss": 2.3046, "step": 177510 }, { "epoch": 0.31, "learning_rate": 3.452132241897063e-05, "loss": 2.4831, "step": 177520 }, { "epoch": 0.31, "learning_rate": 3.45204504790438e-05, "loss": 2.4384, "step": 177530 }, { "epoch": 0.31, "learning_rate": 3.451957853911697e-05, "loss": 2.348, "step": 177540 }, { "epoch": 0.31, "learning_rate": 3.451870659919014e-05, "loss": 2.4649, "step": 177550 }, { "epoch": 0.31, "learning_rate": 3.451783465926332e-05, "loss": 2.3746, "step": 177560 }, { "epoch": 0.31, "learning_rate": 3.451696271933649e-05, "loss": 2.5051, "step": 177570 }, { "epoch": 0.31, "learning_rate": 3.4516090779409664e-05, "loss": 2.4917, "step": 177580 }, { "epoch": 0.31, "learning_rate": 3.4515218839482835e-05, "loss": 2.4552, "step": 177590 }, { "epoch": 0.31, "learning_rate": 3.451434689955601e-05, "loss": 2.4258, "step": 177600 }, { "epoch": 0.31, "learning_rate": 3.451347495962918e-05, "loss": 2.4257, "step": 177610 }, { "epoch": 0.31, "learning_rate": 3.451260301970235e-05, "loss": 2.3749, "step": 177620 }, { "epoch": 0.31, "learning_rate": 3.451173107977553e-05, "loss": 2.5044, "step": 177630 }, { "epoch": 0.31, "learning_rate": 3.45108591398487e-05, "loss": 2.4904, "step": 177640 }, { "epoch": 0.31, "learning_rate": 3.450998719992188e-05, "loss": 2.3916, "step": 177650 }, { "epoch": 0.31, "learning_rate": 3.450911525999505e-05, "loss": 2.5031, "step": 177660 }, { "epoch": 0.31, "learning_rate": 3.4508243320068225e-05, "loss": 2.3587, "step": 177670 }, { "epoch": 0.31, "learning_rate": 3.4507371380141395e-05, "loss": 2.3501, "step": 177680 }, { "epoch": 0.31, "learning_rate": 3.4506499440214566e-05, "loss": 2.4078, "step": 177690 }, { "epoch": 0.31, "learning_rate": 3.450562750028774e-05, "loss": 2.5198, "step": 177700 }, { "epoch": 0.31, "learning_rate": 3.450475556036091e-05, "loss": 2.4924, "step": 177710 }, { "epoch": 0.31, "learning_rate": 3.450388362043409e-05, "loss": 2.443, "step": 177720 }, { "epoch": 0.31, "learning_rate": 3.450301168050726e-05, "loss": 2.4946, "step": 177730 }, { "epoch": 0.31, "learning_rate": 3.450213974058044e-05, "loss": 2.5387, "step": 177740 }, { "epoch": 0.31, "learning_rate": 3.450126780065361e-05, "loss": 2.422, "step": 177750 }, { "epoch": 0.31, "learning_rate": 3.450039586072678e-05, "loss": 2.552, "step": 177760 }, { "epoch": 0.31, "learning_rate": 3.4499523920799956e-05, "loss": 2.5253, "step": 177770 }, { "epoch": 0.31, "learning_rate": 3.4498651980873126e-05, "loss": 2.4517, "step": 177780 }, { "epoch": 0.31, "learning_rate": 3.44977800409463e-05, "loss": 2.4195, "step": 177790 }, { "epoch": 0.31, "learning_rate": 3.4496908101019474e-05, "loss": 2.4582, "step": 177800 }, { "epoch": 0.31, "learning_rate": 3.449603616109265e-05, "loss": 2.5251, "step": 177810 }, { "epoch": 0.31, "learning_rate": 3.449516422116582e-05, "loss": 2.495, "step": 177820 }, { "epoch": 0.31, "learning_rate": 3.449429228123899e-05, "loss": 2.4383, "step": 177830 }, { "epoch": 0.31, "learning_rate": 3.449342034131217e-05, "loss": 2.4725, "step": 177840 }, { "epoch": 0.31, "learning_rate": 3.449254840138534e-05, "loss": 2.3961, "step": 177850 }, { "epoch": 0.31, "learning_rate": 3.449167646145851e-05, "loss": 2.5526, "step": 177860 }, { "epoch": 0.31, "learning_rate": 3.449080452153169e-05, "loss": 2.482, "step": 177870 }, { "epoch": 0.31, "learning_rate": 3.4489932581604864e-05, "loss": 2.3158, "step": 177880 }, { "epoch": 0.31, "learning_rate": 3.4489060641678034e-05, "loss": 2.4396, "step": 177890 }, { "epoch": 0.31, "learning_rate": 3.4488188701751205e-05, "loss": 2.4649, "step": 177900 }, { "epoch": 0.31, "learning_rate": 3.448731676182438e-05, "loss": 2.5164, "step": 177910 }, { "epoch": 0.31, "learning_rate": 3.448644482189755e-05, "loss": 2.4655, "step": 177920 }, { "epoch": 0.31, "learning_rate": 3.448557288197072e-05, "loss": 2.4916, "step": 177930 }, { "epoch": 0.31, "learning_rate": 3.448470094204389e-05, "loss": 2.3897, "step": 177940 }, { "epoch": 0.31, "learning_rate": 3.448382900211708e-05, "loss": 2.4846, "step": 177950 }, { "epoch": 0.31, "learning_rate": 3.448295706219025e-05, "loss": 2.5546, "step": 177960 }, { "epoch": 0.31, "learning_rate": 3.448208512226342e-05, "loss": 2.427, "step": 177970 }, { "epoch": 0.31, "learning_rate": 3.448121318233659e-05, "loss": 2.4372, "step": 177980 }, { "epoch": 0.31, "learning_rate": 3.4480341242409765e-05, "loss": 2.6407, "step": 177990 }, { "epoch": 0.31, "learning_rate": 3.4479469302482936e-05, "loss": 2.4726, "step": 178000 }, { "epoch": 0.31, "learning_rate": 3.4478597362556106e-05, "loss": 2.5005, "step": 178010 }, { "epoch": 0.31, "learning_rate": 3.447772542262929e-05, "loss": 2.5465, "step": 178020 }, { "epoch": 0.31, "learning_rate": 3.447685348270246e-05, "loss": 2.4928, "step": 178030 }, { "epoch": 0.31, "learning_rate": 3.447598154277563e-05, "loss": 2.4959, "step": 178040 }, { "epoch": 0.31, "learning_rate": 3.44751096028488e-05, "loss": 2.3871, "step": 178050 }, { "epoch": 0.31, "learning_rate": 3.447423766292198e-05, "loss": 2.4779, "step": 178060 }, { "epoch": 0.31, "learning_rate": 3.447336572299515e-05, "loss": 2.5135, "step": 178070 }, { "epoch": 0.31, "learning_rate": 3.447249378306832e-05, "loss": 2.5244, "step": 178080 }, { "epoch": 0.31, "learning_rate": 3.4471621843141496e-05, "loss": 2.512, "step": 178090 }, { "epoch": 0.31, "learning_rate": 3.447074990321467e-05, "loss": 2.4825, "step": 178100 }, { "epoch": 0.31, "learning_rate": 3.4469877963287844e-05, "loss": 2.441, "step": 178110 }, { "epoch": 0.31, "learning_rate": 3.4469006023361014e-05, "loss": 2.3713, "step": 178120 }, { "epoch": 0.31, "learning_rate": 3.446813408343419e-05, "loss": 2.3909, "step": 178130 }, { "epoch": 0.31, "learning_rate": 3.446726214350736e-05, "loss": 2.4093, "step": 178140 }, { "epoch": 0.31, "learning_rate": 3.446639020358053e-05, "loss": 2.5052, "step": 178150 }, { "epoch": 0.31, "learning_rate": 3.446551826365371e-05, "loss": 2.3169, "step": 178160 }, { "epoch": 0.31, "learning_rate": 3.4464646323726886e-05, "loss": 2.463, "step": 178170 }, { "epoch": 0.31, "learning_rate": 3.446377438380006e-05, "loss": 2.5167, "step": 178180 }, { "epoch": 0.31, "learning_rate": 3.446290244387323e-05, "loss": 2.3485, "step": 178190 }, { "epoch": 0.31, "learning_rate": 3.4462030503946404e-05, "loss": 2.3939, "step": 178200 }, { "epoch": 0.31, "learning_rate": 3.4461158564019575e-05, "loss": 2.2944, "step": 178210 }, { "epoch": 0.31, "learning_rate": 3.4460286624092745e-05, "loss": 2.4506, "step": 178220 }, { "epoch": 0.31, "learning_rate": 3.445941468416592e-05, "loss": 2.424, "step": 178230 }, { "epoch": 0.31, "learning_rate": 3.445854274423909e-05, "loss": 2.4659, "step": 178240 }, { "epoch": 0.31, "learning_rate": 3.445767080431227e-05, "loss": 2.4847, "step": 178250 }, { "epoch": 0.31, "learning_rate": 3.445679886438544e-05, "loss": 2.4413, "step": 178260 }, { "epoch": 0.31, "learning_rate": 3.445592692445862e-05, "loss": 2.4261, "step": 178270 }, { "epoch": 0.31, "learning_rate": 3.445505498453179e-05, "loss": 2.4658, "step": 178280 }, { "epoch": 0.31, "learning_rate": 3.445418304460496e-05, "loss": 2.4115, "step": 178290 }, { "epoch": 0.31, "learning_rate": 3.4453311104678135e-05, "loss": 2.3159, "step": 178300 }, { "epoch": 0.31, "learning_rate": 3.4452439164751306e-05, "loss": 2.453, "step": 178310 }, { "epoch": 0.31, "learning_rate": 3.445156722482448e-05, "loss": 2.4535, "step": 178320 }, { "epoch": 0.31, "learning_rate": 3.445069528489765e-05, "loss": 2.4171, "step": 178330 }, { "epoch": 0.31, "learning_rate": 3.444982334497083e-05, "loss": 2.4288, "step": 178340 }, { "epoch": 0.31, "learning_rate": 3.4448951405044e-05, "loss": 2.241, "step": 178350 }, { "epoch": 0.31, "learning_rate": 3.444807946511717e-05, "loss": 2.4042, "step": 178360 }, { "epoch": 0.31, "learning_rate": 3.444720752519034e-05, "loss": 2.5267, "step": 178370 }, { "epoch": 0.31, "learning_rate": 3.444633558526352e-05, "loss": 2.3826, "step": 178380 }, { "epoch": 0.31, "learning_rate": 3.4445463645336696e-05, "loss": 2.4298, "step": 178390 }, { "epoch": 0.31, "learning_rate": 3.4444591705409866e-05, "loss": 2.4341, "step": 178400 }, { "epoch": 0.31, "learning_rate": 3.444371976548304e-05, "loss": 2.4896, "step": 178410 }, { "epoch": 0.31, "learning_rate": 3.4442847825556214e-05, "loss": 2.4538, "step": 178420 }, { "epoch": 0.31, "learning_rate": 3.4441975885629384e-05, "loss": 2.4394, "step": 178430 }, { "epoch": 0.31, "learning_rate": 3.4441103945702554e-05, "loss": 2.4293, "step": 178440 }, { "epoch": 0.31, "learning_rate": 3.444023200577573e-05, "loss": 2.3673, "step": 178450 }, { "epoch": 0.31, "learning_rate": 3.44393600658489e-05, "loss": 2.4195, "step": 178460 }, { "epoch": 0.31, "learning_rate": 3.443848812592208e-05, "loss": 2.3694, "step": 178470 }, { "epoch": 0.31, "learning_rate": 3.443761618599525e-05, "loss": 2.3659, "step": 178480 }, { "epoch": 0.31, "learning_rate": 3.443674424606843e-05, "loss": 2.3667, "step": 178490 }, { "epoch": 0.31, "learning_rate": 3.44358723061416e-05, "loss": 2.2577, "step": 178500 }, { "epoch": 0.31, "learning_rate": 3.443500036621477e-05, "loss": 2.4335, "step": 178510 }, { "epoch": 0.31, "learning_rate": 3.4434128426287945e-05, "loss": 2.4022, "step": 178520 }, { "epoch": 0.31, "learning_rate": 3.4433256486361115e-05, "loss": 2.4139, "step": 178530 }, { "epoch": 0.31, "learning_rate": 3.443238454643429e-05, "loss": 2.4278, "step": 178540 }, { "epoch": 0.31, "learning_rate": 3.443151260650746e-05, "loss": 2.3724, "step": 178550 }, { "epoch": 0.31, "learning_rate": 3.443064066658064e-05, "loss": 2.2945, "step": 178560 }, { "epoch": 0.31, "learning_rate": 3.442976872665381e-05, "loss": 2.454, "step": 178570 }, { "epoch": 0.31, "learning_rate": 3.442889678672698e-05, "loss": 2.5059, "step": 178580 }, { "epoch": 0.31, "learning_rate": 3.442802484680016e-05, "loss": 2.3414, "step": 178590 }, { "epoch": 0.31, "learning_rate": 3.442715290687333e-05, "loss": 2.3703, "step": 178600 }, { "epoch": 0.31, "learning_rate": 3.44262809669465e-05, "loss": 2.4825, "step": 178610 }, { "epoch": 0.31, "learning_rate": 3.4425409027019675e-05, "loss": 2.3662, "step": 178620 }, { "epoch": 0.31, "learning_rate": 3.442453708709285e-05, "loss": 2.4738, "step": 178630 }, { "epoch": 0.31, "learning_rate": 3.442366514716602e-05, "loss": 2.5802, "step": 178640 }, { "epoch": 0.31, "learning_rate": 3.4422793207239193e-05, "loss": 2.4503, "step": 178650 }, { "epoch": 0.31, "learning_rate": 3.442192126731237e-05, "loss": 2.456, "step": 178660 }, { "epoch": 0.31, "learning_rate": 3.442104932738554e-05, "loss": 2.4155, "step": 178670 }, { "epoch": 0.31, "learning_rate": 3.442017738745871e-05, "loss": 2.2935, "step": 178680 }, { "epoch": 0.31, "learning_rate": 3.441930544753189e-05, "loss": 2.6265, "step": 178690 }, { "epoch": 0.31, "learning_rate": 3.4418433507605066e-05, "loss": 2.4024, "step": 178700 }, { "epoch": 0.31, "learning_rate": 3.4417561567678236e-05, "loss": 2.5004, "step": 178710 }, { "epoch": 0.31, "learning_rate": 3.4416689627751406e-05, "loss": 2.4706, "step": 178720 }, { "epoch": 0.31, "learning_rate": 3.4415817687824584e-05, "loss": 2.3923, "step": 178730 }, { "epoch": 0.31, "learning_rate": 3.4414945747897754e-05, "loss": 2.3466, "step": 178740 }, { "epoch": 0.31, "learning_rate": 3.4414073807970924e-05, "loss": 2.4881, "step": 178750 }, { "epoch": 0.31, "learning_rate": 3.44132018680441e-05, "loss": 2.4288, "step": 178760 }, { "epoch": 0.31, "learning_rate": 3.441232992811728e-05, "loss": 2.3944, "step": 178770 }, { "epoch": 0.31, "learning_rate": 3.441145798819045e-05, "loss": 2.4008, "step": 178780 }, { "epoch": 0.31, "learning_rate": 3.441058604826362e-05, "loss": 2.4794, "step": 178790 }, { "epoch": 0.31, "learning_rate": 3.4409714108336797e-05, "loss": 2.4088, "step": 178800 }, { "epoch": 0.31, "learning_rate": 3.440884216840997e-05, "loss": 2.4659, "step": 178810 }, { "epoch": 0.31, "learning_rate": 3.440797022848314e-05, "loss": 2.5015, "step": 178820 }, { "epoch": 0.31, "learning_rate": 3.440709828855631e-05, "loss": 2.5493, "step": 178830 }, { "epoch": 0.31, "learning_rate": 3.440622634862949e-05, "loss": 2.4204, "step": 178840 }, { "epoch": 0.31, "learning_rate": 3.440535440870266e-05, "loss": 2.4063, "step": 178850 }, { "epoch": 0.31, "learning_rate": 3.440448246877583e-05, "loss": 2.4502, "step": 178860 }, { "epoch": 0.31, "learning_rate": 3.440361052884901e-05, "loss": 2.3614, "step": 178870 }, { "epoch": 0.31, "learning_rate": 3.440273858892218e-05, "loss": 2.4522, "step": 178880 }, { "epoch": 0.31, "learning_rate": 3.440186664899535e-05, "loss": 2.3663, "step": 178890 }, { "epoch": 0.31, "learning_rate": 3.440099470906852e-05, "loss": 2.4305, "step": 178900 }, { "epoch": 0.31, "learning_rate": 3.4400122769141705e-05, "loss": 2.4586, "step": 178910 }, { "epoch": 0.31, "learning_rate": 3.4399250829214875e-05, "loss": 2.3135, "step": 178920 }, { "epoch": 0.31, "learning_rate": 3.4398378889288045e-05, "loss": 2.3065, "step": 178930 }, { "epoch": 0.31, "learning_rate": 3.4397506949361216e-05, "loss": 2.4024, "step": 178940 }, { "epoch": 0.31, "learning_rate": 3.439663500943439e-05, "loss": 2.4086, "step": 178950 }, { "epoch": 0.31, "learning_rate": 3.439576306950756e-05, "loss": 2.3734, "step": 178960 }, { "epoch": 0.31, "learning_rate": 3.4394891129580734e-05, "loss": 2.4569, "step": 178970 }, { "epoch": 0.31, "learning_rate": 3.439401918965391e-05, "loss": 2.3995, "step": 178980 }, { "epoch": 0.31, "learning_rate": 3.439314724972709e-05, "loss": 2.4935, "step": 178990 }, { "epoch": 0.31, "learning_rate": 3.439227530980026e-05, "loss": 2.4557, "step": 179000 }, { "epoch": 0.31, "learning_rate": 3.439140336987343e-05, "loss": 2.5347, "step": 179010 }, { "epoch": 0.31, "learning_rate": 3.4390531429946606e-05, "loss": 2.4366, "step": 179020 }, { "epoch": 0.31, "learning_rate": 3.4389659490019776e-05, "loss": 2.4941, "step": 179030 }, { "epoch": 0.31, "learning_rate": 3.438878755009295e-05, "loss": 2.4503, "step": 179040 }, { "epoch": 0.31, "learning_rate": 3.4387915610166124e-05, "loss": 2.4028, "step": 179050 }, { "epoch": 0.31, "learning_rate": 3.43870436702393e-05, "loss": 2.2831, "step": 179060 }, { "epoch": 0.31, "learning_rate": 3.438617173031247e-05, "loss": 2.4475, "step": 179070 }, { "epoch": 0.31, "learning_rate": 3.438529979038564e-05, "loss": 2.5232, "step": 179080 }, { "epoch": 0.31, "learning_rate": 3.438442785045882e-05, "loss": 2.3864, "step": 179090 }, { "epoch": 0.31, "learning_rate": 3.438355591053199e-05, "loss": 2.434, "step": 179100 }, { "epoch": 0.31, "learning_rate": 3.438268397060516e-05, "loss": 2.4928, "step": 179110 }, { "epoch": 0.31, "learning_rate": 3.438181203067834e-05, "loss": 2.3524, "step": 179120 }, { "epoch": 0.31, "learning_rate": 3.438094009075151e-05, "loss": 2.487, "step": 179130 }, { "epoch": 0.31, "learning_rate": 3.4380068150824684e-05, "loss": 2.5601, "step": 179140 }, { "epoch": 0.31, "learning_rate": 3.4379196210897855e-05, "loss": 2.3997, "step": 179150 }, { "epoch": 0.31, "learning_rate": 3.437832427097103e-05, "loss": 2.5378, "step": 179160 }, { "epoch": 0.31, "learning_rate": 3.43774523310442e-05, "loss": 2.4441, "step": 179170 }, { "epoch": 0.31, "learning_rate": 3.437658039111737e-05, "loss": 2.4585, "step": 179180 }, { "epoch": 0.31, "learning_rate": 3.437570845119055e-05, "loss": 2.5612, "step": 179190 }, { "epoch": 0.31, "learning_rate": 3.437483651126372e-05, "loss": 2.299, "step": 179200 }, { "epoch": 0.31, "learning_rate": 3.43739645713369e-05, "loss": 2.5094, "step": 179210 }, { "epoch": 0.31, "learning_rate": 3.437309263141007e-05, "loss": 2.4593, "step": 179220 }, { "epoch": 0.31, "learning_rate": 3.4372220691483245e-05, "loss": 2.4299, "step": 179230 }, { "epoch": 0.31, "learning_rate": 3.4371348751556415e-05, "loss": 2.4129, "step": 179240 }, { "epoch": 0.31, "learning_rate": 3.4370476811629586e-05, "loss": 2.4272, "step": 179250 }, { "epoch": 0.31, "learning_rate": 3.436960487170276e-05, "loss": 2.4304, "step": 179260 }, { "epoch": 0.31, "learning_rate": 3.436873293177593e-05, "loss": 2.2521, "step": 179270 }, { "epoch": 0.31, "learning_rate": 3.4367860991849104e-05, "loss": 2.3523, "step": 179280 }, { "epoch": 0.31, "learning_rate": 3.436698905192228e-05, "loss": 2.4252, "step": 179290 }, { "epoch": 0.31, "learning_rate": 3.436611711199546e-05, "loss": 2.3935, "step": 179300 }, { "epoch": 0.31, "learning_rate": 3.436524517206863e-05, "loss": 2.4435, "step": 179310 }, { "epoch": 0.31, "learning_rate": 3.43643732321418e-05, "loss": 2.4973, "step": 179320 }, { "epoch": 0.31, "learning_rate": 3.436350129221497e-05, "loss": 2.4781, "step": 179330 }, { "epoch": 0.31, "learning_rate": 3.4362629352288146e-05, "loss": 2.4721, "step": 179340 }, { "epoch": 0.31, "learning_rate": 3.436175741236132e-05, "loss": 2.4268, "step": 179350 }, { "epoch": 0.31, "learning_rate": 3.4360885472434494e-05, "loss": 2.4326, "step": 179360 }, { "epoch": 0.31, "learning_rate": 3.436001353250767e-05, "loss": 2.2353, "step": 179370 }, { "epoch": 0.31, "learning_rate": 3.435914159258084e-05, "loss": 2.4181, "step": 179380 }, { "epoch": 0.31, "learning_rate": 3.435826965265401e-05, "loss": 2.5071, "step": 179390 }, { "epoch": 0.31, "learning_rate": 3.435739771272718e-05, "loss": 2.3592, "step": 179400 }, { "epoch": 0.31, "learning_rate": 3.435652577280036e-05, "loss": 2.3133, "step": 179410 }, { "epoch": 0.31, "learning_rate": 3.435565383287353e-05, "loss": 2.4075, "step": 179420 }, { "epoch": 0.31, "learning_rate": 3.43547818929467e-05, "loss": 2.4953, "step": 179430 }, { "epoch": 0.31, "learning_rate": 3.435390995301988e-05, "loss": 2.5216, "step": 179440 }, { "epoch": 0.31, "learning_rate": 3.4353038013093054e-05, "loss": 2.4226, "step": 179450 }, { "epoch": 0.31, "learning_rate": 3.4352166073166225e-05, "loss": 2.2645, "step": 179460 }, { "epoch": 0.31, "learning_rate": 3.4351294133239395e-05, "loss": 2.4233, "step": 179470 }, { "epoch": 0.31, "learning_rate": 3.435042219331257e-05, "loss": 2.4423, "step": 179480 }, { "epoch": 0.31, "learning_rate": 3.434955025338574e-05, "loss": 2.3901, "step": 179490 }, { "epoch": 0.31, "learning_rate": 3.434867831345891e-05, "loss": 2.5459, "step": 179500 }, { "epoch": 0.31, "learning_rate": 3.434780637353209e-05, "loss": 2.3465, "step": 179510 }, { "epoch": 0.31, "learning_rate": 3.434693443360527e-05, "loss": 2.3793, "step": 179520 }, { "epoch": 0.31, "learning_rate": 3.434606249367844e-05, "loss": 2.4672, "step": 179530 }, { "epoch": 0.31, "learning_rate": 3.434519055375161e-05, "loss": 2.3712, "step": 179540 }, { "epoch": 0.31, "learning_rate": 3.4344318613824785e-05, "loss": 2.5043, "step": 179550 }, { "epoch": 0.31, "learning_rate": 3.4343446673897956e-05, "loss": 2.4581, "step": 179560 }, { "epoch": 0.31, "learning_rate": 3.4342574733971126e-05, "loss": 2.5077, "step": 179570 }, { "epoch": 0.31, "learning_rate": 3.43417027940443e-05, "loss": 2.4286, "step": 179580 }, { "epoch": 0.31, "learning_rate": 3.434083085411748e-05, "loss": 2.4663, "step": 179590 }, { "epoch": 0.31, "learning_rate": 3.433995891419065e-05, "loss": 2.4009, "step": 179600 }, { "epoch": 0.31, "learning_rate": 3.433908697426382e-05, "loss": 2.4186, "step": 179610 }, { "epoch": 0.31, "learning_rate": 3.4338215034337e-05, "loss": 2.4538, "step": 179620 }, { "epoch": 0.31, "learning_rate": 3.433734309441017e-05, "loss": 2.4226, "step": 179630 }, { "epoch": 0.31, "learning_rate": 3.433647115448334e-05, "loss": 2.3881, "step": 179640 }, { "epoch": 0.31, "learning_rate": 3.4335599214556516e-05, "loss": 2.4386, "step": 179650 }, { "epoch": 0.31, "learning_rate": 3.433472727462969e-05, "loss": 2.3684, "step": 179660 }, { "epoch": 0.31, "learning_rate": 3.4333855334702864e-05, "loss": 2.4503, "step": 179670 }, { "epoch": 0.31, "learning_rate": 3.4332983394776034e-05, "loss": 2.4649, "step": 179680 }, { "epoch": 0.31, "learning_rate": 3.433211145484921e-05, "loss": 2.2999, "step": 179690 }, { "epoch": 0.31, "learning_rate": 3.433123951492238e-05, "loss": 2.3706, "step": 179700 }, { "epoch": 0.31, "learning_rate": 3.433036757499555e-05, "loss": 2.4586, "step": 179710 }, { "epoch": 0.31, "learning_rate": 3.432949563506873e-05, "loss": 2.4798, "step": 179720 }, { "epoch": 0.31, "learning_rate": 3.4328623695141906e-05, "loss": 2.449, "step": 179730 }, { "epoch": 0.31, "learning_rate": 3.432775175521508e-05, "loss": 2.4438, "step": 179740 }, { "epoch": 0.31, "learning_rate": 3.432687981528825e-05, "loss": 2.4743, "step": 179750 }, { "epoch": 0.31, "learning_rate": 3.4326007875361424e-05, "loss": 2.5212, "step": 179760 }, { "epoch": 0.31, "learning_rate": 3.4325135935434595e-05, "loss": 2.3916, "step": 179770 }, { "epoch": 0.31, "learning_rate": 3.4324263995507765e-05, "loss": 2.4617, "step": 179780 }, { "epoch": 0.31, "learning_rate": 3.4323392055580935e-05, "loss": 2.4928, "step": 179790 }, { "epoch": 0.31, "learning_rate": 3.432252011565411e-05, "loss": 2.4724, "step": 179800 }, { "epoch": 0.31, "learning_rate": 3.432164817572729e-05, "loss": 2.5039, "step": 179810 }, { "epoch": 0.31, "learning_rate": 3.432077623580046e-05, "loss": 2.4206, "step": 179820 }, { "epoch": 0.31, "learning_rate": 3.431990429587364e-05, "loss": 2.4838, "step": 179830 }, { "epoch": 0.31, "learning_rate": 3.431903235594681e-05, "loss": 2.4254, "step": 179840 }, { "epoch": 0.31, "learning_rate": 3.431816041601998e-05, "loss": 2.519, "step": 179850 }, { "epoch": 0.31, "learning_rate": 3.431728847609315e-05, "loss": 2.427, "step": 179860 }, { "epoch": 0.31, "learning_rate": 3.4316416536166326e-05, "loss": 2.5143, "step": 179870 }, { "epoch": 0.31, "learning_rate": 3.43155445962395e-05, "loss": 2.5267, "step": 179880 }, { "epoch": 0.31, "learning_rate": 3.431467265631267e-05, "loss": 2.4347, "step": 179890 }, { "epoch": 0.31, "learning_rate": 3.4313800716385843e-05, "loss": 2.4461, "step": 179900 }, { "epoch": 0.31, "learning_rate": 3.431292877645902e-05, "loss": 2.3454, "step": 179910 }, { "epoch": 0.31, "learning_rate": 3.431205683653219e-05, "loss": 2.4606, "step": 179920 }, { "epoch": 0.31, "learning_rate": 3.431118489660536e-05, "loss": 2.4903, "step": 179930 }, { "epoch": 0.31, "learning_rate": 3.431031295667854e-05, "loss": 2.4503, "step": 179940 }, { "epoch": 0.31, "learning_rate": 3.430944101675171e-05, "loss": 2.4668, "step": 179950 }, { "epoch": 0.31, "learning_rate": 3.4308569076824886e-05, "loss": 2.4788, "step": 179960 }, { "epoch": 0.31, "learning_rate": 3.4307697136898056e-05, "loss": 2.4052, "step": 179970 }, { "epoch": 0.31, "learning_rate": 3.4306825196971234e-05, "loss": 2.356, "step": 179980 }, { "epoch": 0.31, "learning_rate": 3.4305953257044404e-05, "loss": 2.3503, "step": 179990 }, { "epoch": 0.31, "learning_rate": 3.4305081317117574e-05, "loss": 2.4196, "step": 180000 }, { "epoch": 0.31, "learning_rate": 3.430420937719075e-05, "loss": 2.3143, "step": 180010 }, { "epoch": 0.31, "learning_rate": 3.430333743726392e-05, "loss": 2.353, "step": 180020 }, { "epoch": 0.31, "learning_rate": 3.43024654973371e-05, "loss": 2.4456, "step": 180030 }, { "epoch": 0.31, "learning_rate": 3.430159355741027e-05, "loss": 2.4303, "step": 180040 }, { "epoch": 0.31, "learning_rate": 3.430072161748345e-05, "loss": 2.3267, "step": 180050 }, { "epoch": 0.31, "learning_rate": 3.429984967755662e-05, "loss": 2.3519, "step": 180060 }, { "epoch": 0.31, "learning_rate": 3.429897773762979e-05, "loss": 2.4951, "step": 180070 }, { "epoch": 0.31, "learning_rate": 3.4298105797702965e-05, "loss": 2.5871, "step": 180080 }, { "epoch": 0.31, "learning_rate": 3.4297233857776135e-05, "loss": 2.4403, "step": 180090 }, { "epoch": 0.31, "learning_rate": 3.4296361917849305e-05, "loss": 2.4444, "step": 180100 }, { "epoch": 0.31, "learning_rate": 3.429548997792248e-05, "loss": 2.4355, "step": 180110 }, { "epoch": 0.31, "learning_rate": 3.429461803799566e-05, "loss": 2.4301, "step": 180120 }, { "epoch": 0.31, "learning_rate": 3.429374609806883e-05, "loss": 2.4532, "step": 180130 }, { "epoch": 0.31, "learning_rate": 3.4292874158142e-05, "loss": 2.3771, "step": 180140 }, { "epoch": 0.31, "learning_rate": 3.429200221821518e-05, "loss": 2.45, "step": 180150 }, { "epoch": 0.31, "learning_rate": 3.429113027828835e-05, "loss": 2.3684, "step": 180160 }, { "epoch": 0.31, "learning_rate": 3.429025833836152e-05, "loss": 2.4955, "step": 180170 }, { "epoch": 0.31, "learning_rate": 3.4289386398434695e-05, "loss": 2.5002, "step": 180180 }, { "epoch": 0.31, "learning_rate": 3.428851445850787e-05, "loss": 2.4987, "step": 180190 }, { "epoch": 0.31, "learning_rate": 3.428764251858104e-05, "loss": 2.4202, "step": 180200 }, { "epoch": 0.31, "learning_rate": 3.4286770578654213e-05, "loss": 2.3966, "step": 180210 }, { "epoch": 0.31, "learning_rate": 3.428589863872739e-05, "loss": 2.4858, "step": 180220 }, { "epoch": 0.31, "learning_rate": 3.428502669880056e-05, "loss": 2.398, "step": 180230 }, { "epoch": 0.31, "learning_rate": 3.428415475887373e-05, "loss": 2.3928, "step": 180240 }, { "epoch": 0.31, "learning_rate": 3.428328281894691e-05, "loss": 2.3756, "step": 180250 }, { "epoch": 0.31, "learning_rate": 3.4282410879020086e-05, "loss": 2.3851, "step": 180260 }, { "epoch": 0.31, "learning_rate": 3.4281538939093256e-05, "loss": 2.369, "step": 180270 }, { "epoch": 0.31, "learning_rate": 3.4280666999166426e-05, "loss": 2.4055, "step": 180280 }, { "epoch": 0.31, "learning_rate": 3.42797950592396e-05, "loss": 2.4631, "step": 180290 }, { "epoch": 0.31, "learning_rate": 3.4278923119312774e-05, "loss": 2.4653, "step": 180300 }, { "epoch": 0.31, "learning_rate": 3.4278051179385944e-05, "loss": 2.5684, "step": 180310 }, { "epoch": 0.31, "learning_rate": 3.4277179239459115e-05, "loss": 2.3773, "step": 180320 }, { "epoch": 0.31, "learning_rate": 3.42763072995323e-05, "loss": 2.5222, "step": 180330 }, { "epoch": 0.31, "learning_rate": 3.427543535960547e-05, "loss": 2.4235, "step": 180340 }, { "epoch": 0.31, "learning_rate": 3.427456341967864e-05, "loss": 2.4613, "step": 180350 }, { "epoch": 0.31, "learning_rate": 3.427369147975181e-05, "loss": 2.4426, "step": 180360 }, { "epoch": 0.31, "learning_rate": 3.427281953982499e-05, "loss": 2.4763, "step": 180370 }, { "epoch": 0.31, "learning_rate": 3.427194759989816e-05, "loss": 2.3751, "step": 180380 }, { "epoch": 0.31, "learning_rate": 3.427107565997133e-05, "loss": 2.465, "step": 180390 }, { "epoch": 0.31, "learning_rate": 3.4270203720044505e-05, "loss": 2.4713, "step": 180400 }, { "epoch": 0.31, "learning_rate": 3.426933178011768e-05, "loss": 2.4146, "step": 180410 }, { "epoch": 0.31, "learning_rate": 3.426845984019085e-05, "loss": 2.4029, "step": 180420 }, { "epoch": 0.31, "learning_rate": 3.426758790026402e-05, "loss": 2.4912, "step": 180430 }, { "epoch": 0.31, "learning_rate": 3.42667159603372e-05, "loss": 2.4811, "step": 180440 }, { "epoch": 0.31, "learning_rate": 3.426584402041037e-05, "loss": 2.4035, "step": 180450 }, { "epoch": 0.31, "learning_rate": 3.426497208048354e-05, "loss": 2.5189, "step": 180460 }, { "epoch": 0.31, "learning_rate": 3.426410014055672e-05, "loss": 2.4069, "step": 180470 }, { "epoch": 0.31, "learning_rate": 3.4263228200629895e-05, "loss": 2.3242, "step": 180480 }, { "epoch": 0.31, "learning_rate": 3.4262356260703065e-05, "loss": 2.4078, "step": 180490 }, { "epoch": 0.31, "learning_rate": 3.4261484320776236e-05, "loss": 2.3777, "step": 180500 }, { "epoch": 0.31, "learning_rate": 3.426061238084941e-05, "loss": 2.3783, "step": 180510 }, { "epoch": 0.31, "learning_rate": 3.425974044092258e-05, "loss": 2.4492, "step": 180520 }, { "epoch": 0.31, "learning_rate": 3.4258868500995754e-05, "loss": 2.451, "step": 180530 }, { "epoch": 0.31, "learning_rate": 3.425799656106893e-05, "loss": 2.4429, "step": 180540 }, { "epoch": 0.31, "learning_rate": 3.425712462114211e-05, "loss": 2.4083, "step": 180550 }, { "epoch": 0.31, "learning_rate": 3.425625268121528e-05, "loss": 2.501, "step": 180560 }, { "epoch": 0.31, "learning_rate": 3.425538074128845e-05, "loss": 2.4761, "step": 180570 }, { "epoch": 0.31, "learning_rate": 3.4254508801361626e-05, "loss": 2.4314, "step": 180580 }, { "epoch": 0.31, "learning_rate": 3.4253636861434796e-05, "loss": 2.4772, "step": 180590 }, { "epoch": 0.31, "learning_rate": 3.425276492150797e-05, "loss": 2.4462, "step": 180600 }, { "epoch": 0.31, "learning_rate": 3.4251892981581144e-05, "loss": 2.4165, "step": 180610 }, { "epoch": 0.31, "learning_rate": 3.4251021041654314e-05, "loss": 2.4258, "step": 180620 }, { "epoch": 0.31, "learning_rate": 3.425014910172749e-05, "loss": 2.5166, "step": 180630 }, { "epoch": 0.32, "learning_rate": 3.424927716180066e-05, "loss": 2.4217, "step": 180640 }, { "epoch": 0.32, "learning_rate": 3.424840522187384e-05, "loss": 2.4961, "step": 180650 }, { "epoch": 0.32, "learning_rate": 3.424753328194701e-05, "loss": 2.4082, "step": 180660 }, { "epoch": 0.32, "learning_rate": 3.424666134202018e-05, "loss": 2.4226, "step": 180670 }, { "epoch": 0.32, "learning_rate": 3.424578940209335e-05, "loss": 2.4301, "step": 180680 }, { "epoch": 0.32, "learning_rate": 3.424491746216653e-05, "loss": 2.2655, "step": 180690 }, { "epoch": 0.32, "learning_rate": 3.4244045522239704e-05, "loss": 2.4105, "step": 180700 }, { "epoch": 0.32, "learning_rate": 3.4243173582312875e-05, "loss": 2.4332, "step": 180710 }, { "epoch": 0.32, "learning_rate": 3.424230164238605e-05, "loss": 2.3709, "step": 180720 }, { "epoch": 0.32, "learning_rate": 3.424142970245922e-05, "loss": 2.3866, "step": 180730 }, { "epoch": 0.32, "learning_rate": 3.424055776253239e-05, "loss": 2.3909, "step": 180740 }, { "epoch": 0.32, "learning_rate": 3.423968582260556e-05, "loss": 2.4965, "step": 180750 }, { "epoch": 0.32, "learning_rate": 3.423881388267874e-05, "loss": 2.4613, "step": 180760 }, { "epoch": 0.32, "learning_rate": 3.423794194275192e-05, "loss": 2.4647, "step": 180770 }, { "epoch": 0.32, "learning_rate": 3.423707000282509e-05, "loss": 2.3249, "step": 180780 }, { "epoch": 0.32, "learning_rate": 3.423619806289826e-05, "loss": 2.4496, "step": 180790 }, { "epoch": 0.32, "learning_rate": 3.4235326122971435e-05, "loss": 2.372, "step": 180800 }, { "epoch": 0.32, "learning_rate": 3.4234454183044606e-05, "loss": 2.4142, "step": 180810 }, { "epoch": 0.32, "learning_rate": 3.4233582243117776e-05, "loss": 2.39, "step": 180820 }, { "epoch": 0.32, "learning_rate": 3.423271030319095e-05, "loss": 2.4712, "step": 180830 }, { "epoch": 0.32, "learning_rate": 3.4231838363264124e-05, "loss": 2.5297, "step": 180840 }, { "epoch": 0.32, "learning_rate": 3.42309664233373e-05, "loss": 2.4817, "step": 180850 }, { "epoch": 0.32, "learning_rate": 3.423009448341047e-05, "loss": 2.4643, "step": 180860 }, { "epoch": 0.32, "learning_rate": 3.422922254348365e-05, "loss": 2.431, "step": 180870 }, { "epoch": 0.32, "learning_rate": 3.422835060355682e-05, "loss": 2.4053, "step": 180880 }, { "epoch": 0.32, "learning_rate": 3.422747866362999e-05, "loss": 2.3776, "step": 180890 }, { "epoch": 0.32, "learning_rate": 3.4226606723703166e-05, "loss": 2.3682, "step": 180900 }, { "epoch": 0.32, "learning_rate": 3.422573478377634e-05, "loss": 2.4754, "step": 180910 }, { "epoch": 0.32, "learning_rate": 3.4224862843849514e-05, "loss": 2.4852, "step": 180920 }, { "epoch": 0.32, "learning_rate": 3.4223990903922684e-05, "loss": 2.5134, "step": 180930 }, { "epoch": 0.32, "learning_rate": 3.422311896399586e-05, "loss": 2.4635, "step": 180940 }, { "epoch": 0.32, "learning_rate": 3.422224702406903e-05, "loss": 2.4091, "step": 180950 }, { "epoch": 0.32, "learning_rate": 3.42213750841422e-05, "loss": 2.4948, "step": 180960 }, { "epoch": 0.32, "learning_rate": 3.422050314421538e-05, "loss": 2.3231, "step": 180970 }, { "epoch": 0.32, "learning_rate": 3.421963120428855e-05, "loss": 2.3084, "step": 180980 }, { "epoch": 0.32, "learning_rate": 3.421875926436172e-05, "loss": 2.4786, "step": 180990 }, { "epoch": 0.32, "learning_rate": 3.42178873244349e-05, "loss": 2.4062, "step": 181000 }, { "epoch": 0.32, "learning_rate": 3.4217015384508074e-05, "loss": 2.4519, "step": 181010 }, { "epoch": 0.32, "learning_rate": 3.4216143444581245e-05, "loss": 2.5184, "step": 181020 }, { "epoch": 0.32, "learning_rate": 3.4215271504654415e-05, "loss": 2.4035, "step": 181030 }, { "epoch": 0.32, "learning_rate": 3.421439956472759e-05, "loss": 2.4537, "step": 181040 }, { "epoch": 0.32, "learning_rate": 3.421352762480076e-05, "loss": 2.2689, "step": 181050 }, { "epoch": 0.32, "learning_rate": 3.421265568487393e-05, "loss": 2.4714, "step": 181060 }, { "epoch": 0.32, "learning_rate": 3.421178374494711e-05, "loss": 2.3761, "step": 181070 }, { "epoch": 0.32, "learning_rate": 3.421091180502029e-05, "loss": 2.3689, "step": 181080 }, { "epoch": 0.32, "learning_rate": 3.421003986509346e-05, "loss": 2.3878, "step": 181090 }, { "epoch": 0.32, "learning_rate": 3.420916792516663e-05, "loss": 2.4994, "step": 181100 }, { "epoch": 0.32, "learning_rate": 3.4208295985239805e-05, "loss": 2.5007, "step": 181110 }, { "epoch": 0.32, "learning_rate": 3.4207424045312976e-05, "loss": 2.5461, "step": 181120 }, { "epoch": 0.32, "learning_rate": 3.4206552105386146e-05, "loss": 2.3568, "step": 181130 }, { "epoch": 0.32, "learning_rate": 3.4205680165459316e-05, "loss": 2.3864, "step": 181140 }, { "epoch": 0.32, "learning_rate": 3.42048082255325e-05, "loss": 2.4071, "step": 181150 }, { "epoch": 0.32, "learning_rate": 3.420393628560567e-05, "loss": 2.4504, "step": 181160 }, { "epoch": 0.32, "learning_rate": 3.420306434567884e-05, "loss": 2.5011, "step": 181170 }, { "epoch": 0.32, "learning_rate": 3.420219240575202e-05, "loss": 2.4765, "step": 181180 }, { "epoch": 0.32, "learning_rate": 3.420132046582519e-05, "loss": 2.4942, "step": 181190 }, { "epoch": 0.32, "learning_rate": 3.420044852589836e-05, "loss": 2.4376, "step": 181200 }, { "epoch": 0.32, "learning_rate": 3.419957658597153e-05, "loss": 2.5374, "step": 181210 }, { "epoch": 0.32, "learning_rate": 3.419870464604471e-05, "loss": 2.4343, "step": 181220 }, { "epoch": 0.32, "learning_rate": 3.4197832706117884e-05, "loss": 2.4572, "step": 181230 }, { "epoch": 0.32, "learning_rate": 3.4196960766191054e-05, "loss": 2.4438, "step": 181240 }, { "epoch": 0.32, "learning_rate": 3.4196088826264224e-05, "loss": 2.4942, "step": 181250 }, { "epoch": 0.32, "learning_rate": 3.41952168863374e-05, "loss": 2.447, "step": 181260 }, { "epoch": 0.32, "learning_rate": 3.419434494641057e-05, "loss": 2.5612, "step": 181270 }, { "epoch": 0.32, "learning_rate": 3.419347300648374e-05, "loss": 2.3861, "step": 181280 }, { "epoch": 0.32, "learning_rate": 3.419260106655692e-05, "loss": 2.3341, "step": 181290 }, { "epoch": 0.32, "learning_rate": 3.41917291266301e-05, "loss": 2.4521, "step": 181300 }, { "epoch": 0.32, "learning_rate": 3.419085718670327e-05, "loss": 2.4088, "step": 181310 }, { "epoch": 0.32, "learning_rate": 3.418998524677644e-05, "loss": 2.4004, "step": 181320 }, { "epoch": 0.32, "learning_rate": 3.4189113306849615e-05, "loss": 2.542, "step": 181330 }, { "epoch": 0.32, "learning_rate": 3.4188241366922785e-05, "loss": 2.412, "step": 181340 }, { "epoch": 0.32, "learning_rate": 3.4187369426995955e-05, "loss": 2.468, "step": 181350 }, { "epoch": 0.32, "learning_rate": 3.418649748706913e-05, "loss": 2.3443, "step": 181360 }, { "epoch": 0.32, "learning_rate": 3.418562554714231e-05, "loss": 2.4158, "step": 181370 }, { "epoch": 0.32, "learning_rate": 3.418475360721548e-05, "loss": 2.4017, "step": 181380 }, { "epoch": 0.32, "learning_rate": 3.418388166728865e-05, "loss": 2.3, "step": 181390 }, { "epoch": 0.32, "learning_rate": 3.418300972736183e-05, "loss": 2.5037, "step": 181400 }, { "epoch": 0.32, "learning_rate": 3.4182137787435e-05, "loss": 2.5087, "step": 181410 }, { "epoch": 0.32, "learning_rate": 3.418126584750817e-05, "loss": 2.3, "step": 181420 }, { "epoch": 0.32, "learning_rate": 3.4180393907581346e-05, "loss": 2.3831, "step": 181430 }, { "epoch": 0.32, "learning_rate": 3.417952196765452e-05, "loss": 2.3476, "step": 181440 }, { "epoch": 0.32, "learning_rate": 3.417865002772769e-05, "loss": 2.3569, "step": 181450 }, { "epoch": 0.32, "learning_rate": 3.4177778087800863e-05, "loss": 2.452, "step": 181460 }, { "epoch": 0.32, "learning_rate": 3.417690614787404e-05, "loss": 2.4119, "step": 181470 }, { "epoch": 0.32, "learning_rate": 3.417603420794721e-05, "loss": 2.5435, "step": 181480 }, { "epoch": 0.32, "learning_rate": 3.417516226802038e-05, "loss": 2.3641, "step": 181490 }, { "epoch": 0.32, "learning_rate": 3.417429032809356e-05, "loss": 2.4316, "step": 181500 }, { "epoch": 0.32, "learning_rate": 3.417341838816673e-05, "loss": 2.5153, "step": 181510 }, { "epoch": 0.32, "learning_rate": 3.4172546448239906e-05, "loss": 2.4728, "step": 181520 }, { "epoch": 0.32, "learning_rate": 3.4171674508313076e-05, "loss": 2.5123, "step": 181530 }, { "epoch": 0.32, "learning_rate": 3.4170802568386254e-05, "loss": 2.3965, "step": 181540 }, { "epoch": 0.32, "learning_rate": 3.4169930628459424e-05, "loss": 2.4831, "step": 181550 }, { "epoch": 0.32, "learning_rate": 3.4169058688532594e-05, "loss": 2.359, "step": 181560 }, { "epoch": 0.32, "learning_rate": 3.416818674860577e-05, "loss": 2.3825, "step": 181570 }, { "epoch": 0.32, "learning_rate": 3.416731480867894e-05, "loss": 2.4399, "step": 181580 }, { "epoch": 0.32, "learning_rate": 3.416644286875212e-05, "loss": 2.4042, "step": 181590 }, { "epoch": 0.32, "learning_rate": 3.416557092882529e-05, "loss": 2.3958, "step": 181600 }, { "epoch": 0.32, "learning_rate": 3.416469898889847e-05, "loss": 2.4216, "step": 181610 }, { "epoch": 0.32, "learning_rate": 3.416382704897164e-05, "loss": 2.4657, "step": 181620 }, { "epoch": 0.32, "learning_rate": 3.416295510904481e-05, "loss": 2.3353, "step": 181630 }, { "epoch": 0.32, "learning_rate": 3.416208316911798e-05, "loss": 2.4629, "step": 181640 }, { "epoch": 0.32, "learning_rate": 3.4161211229191155e-05, "loss": 2.3279, "step": 181650 }, { "epoch": 0.32, "learning_rate": 3.4160339289264325e-05, "loss": 2.4812, "step": 181660 }, { "epoch": 0.32, "learning_rate": 3.41594673493375e-05, "loss": 2.4956, "step": 181670 }, { "epoch": 0.32, "learning_rate": 3.415859540941068e-05, "loss": 2.4382, "step": 181680 }, { "epoch": 0.32, "learning_rate": 3.415772346948385e-05, "loss": 2.298, "step": 181690 }, { "epoch": 0.32, "learning_rate": 3.415685152955702e-05, "loss": 2.5166, "step": 181700 }, { "epoch": 0.32, "learning_rate": 3.415597958963019e-05, "loss": 2.5194, "step": 181710 }, { "epoch": 0.32, "learning_rate": 3.415510764970337e-05, "loss": 2.581, "step": 181720 }, { "epoch": 0.32, "learning_rate": 3.415423570977654e-05, "loss": 2.3805, "step": 181730 }, { "epoch": 0.32, "learning_rate": 3.4153363769849716e-05, "loss": 2.4392, "step": 181740 }, { "epoch": 0.32, "learning_rate": 3.4152491829922886e-05, "loss": 2.3789, "step": 181750 }, { "epoch": 0.32, "learning_rate": 3.415161988999606e-05, "loss": 2.482, "step": 181760 }, { "epoch": 0.32, "learning_rate": 3.4150747950069233e-05, "loss": 2.4247, "step": 181770 }, { "epoch": 0.32, "learning_rate": 3.4149876010142404e-05, "loss": 2.3953, "step": 181780 }, { "epoch": 0.32, "learning_rate": 3.414900407021558e-05, "loss": 2.4089, "step": 181790 }, { "epoch": 0.32, "learning_rate": 3.414813213028875e-05, "loss": 2.4754, "step": 181800 }, { "epoch": 0.32, "learning_rate": 3.414726019036192e-05, "loss": 2.4614, "step": 181810 }, { "epoch": 0.32, "learning_rate": 3.41463882504351e-05, "loss": 2.459, "step": 181820 }, { "epoch": 0.32, "learning_rate": 3.4145516310508276e-05, "loss": 2.4191, "step": 181830 }, { "epoch": 0.32, "learning_rate": 3.4144644370581446e-05, "loss": 2.4465, "step": 181840 }, { "epoch": 0.32, "learning_rate": 3.414377243065462e-05, "loss": 2.4783, "step": 181850 }, { "epoch": 0.32, "learning_rate": 3.4142900490727794e-05, "loss": 2.486, "step": 181860 }, { "epoch": 0.32, "learning_rate": 3.4142028550800964e-05, "loss": 2.4283, "step": 181870 }, { "epoch": 0.32, "learning_rate": 3.4141156610874135e-05, "loss": 2.4732, "step": 181880 }, { "epoch": 0.32, "learning_rate": 3.414028467094731e-05, "loss": 2.4253, "step": 181890 }, { "epoch": 0.32, "learning_rate": 3.413941273102049e-05, "loss": 2.399, "step": 181900 }, { "epoch": 0.32, "learning_rate": 3.413854079109366e-05, "loss": 2.451, "step": 181910 }, { "epoch": 0.32, "learning_rate": 3.413766885116683e-05, "loss": 2.4329, "step": 181920 }, { "epoch": 0.32, "learning_rate": 3.413679691124001e-05, "loss": 2.4963, "step": 181930 }, { "epoch": 0.32, "learning_rate": 3.413592497131318e-05, "loss": 2.4945, "step": 181940 }, { "epoch": 0.32, "learning_rate": 3.413505303138635e-05, "loss": 2.519, "step": 181950 }, { "epoch": 0.32, "learning_rate": 3.4134181091459525e-05, "loss": 2.4347, "step": 181960 }, { "epoch": 0.32, "learning_rate": 3.41333091515327e-05, "loss": 2.3356, "step": 181970 }, { "epoch": 0.32, "learning_rate": 3.413243721160587e-05, "loss": 2.4907, "step": 181980 }, { "epoch": 0.32, "learning_rate": 3.413156527167904e-05, "loss": 2.4549, "step": 181990 }, { "epoch": 0.32, "learning_rate": 3.413069333175222e-05, "loss": 2.4624, "step": 182000 }, { "epoch": 0.32, "learning_rate": 3.412982139182539e-05, "loss": 2.4196, "step": 182010 }, { "epoch": 0.32, "learning_rate": 3.412894945189856e-05, "loss": 2.4266, "step": 182020 }, { "epoch": 0.32, "learning_rate": 3.412807751197173e-05, "loss": 2.4986, "step": 182030 }, { "epoch": 0.32, "learning_rate": 3.4127205572044915e-05, "loss": 2.3633, "step": 182040 }, { "epoch": 0.32, "learning_rate": 3.4126333632118085e-05, "loss": 2.4452, "step": 182050 }, { "epoch": 0.32, "learning_rate": 3.4125461692191256e-05, "loss": 2.4495, "step": 182060 }, { "epoch": 0.32, "learning_rate": 3.412458975226443e-05, "loss": 2.4336, "step": 182070 }, { "epoch": 0.32, "learning_rate": 3.41237178123376e-05, "loss": 2.4442, "step": 182080 }, { "epoch": 0.32, "learning_rate": 3.4122845872410774e-05, "loss": 2.4023, "step": 182090 }, { "epoch": 0.32, "learning_rate": 3.4121973932483944e-05, "loss": 2.4229, "step": 182100 }, { "epoch": 0.32, "learning_rate": 3.412110199255713e-05, "loss": 2.4753, "step": 182110 }, { "epoch": 0.32, "learning_rate": 3.41202300526303e-05, "loss": 2.4098, "step": 182120 }, { "epoch": 0.32, "learning_rate": 3.411935811270347e-05, "loss": 2.49, "step": 182130 }, { "epoch": 0.32, "learning_rate": 3.411848617277664e-05, "loss": 2.434, "step": 182140 }, { "epoch": 0.32, "learning_rate": 3.4117614232849816e-05, "loss": 2.4354, "step": 182150 }, { "epoch": 0.32, "learning_rate": 3.411674229292299e-05, "loss": 2.4192, "step": 182160 }, { "epoch": 0.32, "learning_rate": 3.411587035299616e-05, "loss": 2.4653, "step": 182170 }, { "epoch": 0.32, "learning_rate": 3.4114998413069334e-05, "loss": 2.3946, "step": 182180 }, { "epoch": 0.32, "learning_rate": 3.411412647314251e-05, "loss": 2.3488, "step": 182190 }, { "epoch": 0.32, "learning_rate": 3.411325453321568e-05, "loss": 2.4951, "step": 182200 }, { "epoch": 0.32, "learning_rate": 3.411238259328885e-05, "loss": 2.4846, "step": 182210 }, { "epoch": 0.32, "learning_rate": 3.411151065336203e-05, "loss": 2.5127, "step": 182220 }, { "epoch": 0.32, "learning_rate": 3.41106387134352e-05, "loss": 2.3252, "step": 182230 }, { "epoch": 0.32, "learning_rate": 3.410976677350837e-05, "loss": 2.49, "step": 182240 }, { "epoch": 0.32, "learning_rate": 3.410889483358155e-05, "loss": 2.5279, "step": 182250 }, { "epoch": 0.32, "learning_rate": 3.4108022893654724e-05, "loss": 2.4182, "step": 182260 }, { "epoch": 0.32, "learning_rate": 3.4107150953727895e-05, "loss": 2.4989, "step": 182270 }, { "epoch": 0.32, "learning_rate": 3.4106279013801065e-05, "loss": 2.416, "step": 182280 }, { "epoch": 0.32, "learning_rate": 3.410540707387424e-05, "loss": 2.4919, "step": 182290 }, { "epoch": 0.32, "learning_rate": 3.410453513394741e-05, "loss": 2.5124, "step": 182300 }, { "epoch": 0.32, "learning_rate": 3.410366319402058e-05, "loss": 2.555, "step": 182310 }, { "epoch": 0.32, "learning_rate": 3.410279125409376e-05, "loss": 2.4974, "step": 182320 }, { "epoch": 0.32, "learning_rate": 3.410191931416693e-05, "loss": 2.3959, "step": 182330 }, { "epoch": 0.32, "learning_rate": 3.410104737424011e-05, "loss": 2.5149, "step": 182340 }, { "epoch": 0.32, "learning_rate": 3.410017543431328e-05, "loss": 2.4596, "step": 182350 }, { "epoch": 0.32, "learning_rate": 3.4099303494386455e-05, "loss": 2.5419, "step": 182360 }, { "epoch": 0.32, "learning_rate": 3.4098431554459626e-05, "loss": 2.4918, "step": 182370 }, { "epoch": 0.32, "learning_rate": 3.4097559614532796e-05, "loss": 2.3558, "step": 182380 }, { "epoch": 0.32, "learning_rate": 3.409668767460597e-05, "loss": 2.5143, "step": 182390 }, { "epoch": 0.32, "learning_rate": 3.4095815734679144e-05, "loss": 2.4736, "step": 182400 }, { "epoch": 0.32, "learning_rate": 3.409494379475232e-05, "loss": 2.3672, "step": 182410 }, { "epoch": 0.32, "learning_rate": 3.409407185482549e-05, "loss": 2.5061, "step": 182420 }, { "epoch": 0.32, "learning_rate": 3.409319991489867e-05, "loss": 2.6046, "step": 182430 }, { "epoch": 0.32, "learning_rate": 3.409232797497184e-05, "loss": 2.4739, "step": 182440 }, { "epoch": 0.32, "learning_rate": 3.409145603504501e-05, "loss": 2.529, "step": 182450 }, { "epoch": 0.32, "learning_rate": 3.4090584095118186e-05, "loss": 2.5273, "step": 182460 }, { "epoch": 0.32, "learning_rate": 3.408971215519136e-05, "loss": 2.4741, "step": 182470 }, { "epoch": 0.32, "learning_rate": 3.408884021526453e-05, "loss": 2.484, "step": 182480 }, { "epoch": 0.32, "learning_rate": 3.4087968275337704e-05, "loss": 2.3741, "step": 182490 }, { "epoch": 0.32, "learning_rate": 3.408709633541088e-05, "loss": 2.3735, "step": 182500 }, { "epoch": 0.32, "learning_rate": 3.408622439548405e-05, "loss": 2.4127, "step": 182510 }, { "epoch": 0.32, "learning_rate": 3.408535245555722e-05, "loss": 2.4996, "step": 182520 }, { "epoch": 0.32, "learning_rate": 3.40844805156304e-05, "loss": 2.4271, "step": 182530 }, { "epoch": 0.32, "learning_rate": 3.408360857570357e-05, "loss": 2.4688, "step": 182540 }, { "epoch": 0.32, "learning_rate": 3.408273663577674e-05, "loss": 2.401, "step": 182550 }, { "epoch": 0.32, "learning_rate": 3.408186469584992e-05, "loss": 2.4069, "step": 182560 }, { "epoch": 0.32, "learning_rate": 3.4080992755923094e-05, "loss": 2.3595, "step": 182570 }, { "epoch": 0.32, "learning_rate": 3.4080120815996265e-05, "loss": 2.4614, "step": 182580 }, { "epoch": 0.32, "learning_rate": 3.4079248876069435e-05, "loss": 2.3549, "step": 182590 }, { "epoch": 0.32, "learning_rate": 3.4078376936142606e-05, "loss": 2.4085, "step": 182600 }, { "epoch": 0.32, "learning_rate": 3.407750499621578e-05, "loss": 2.4808, "step": 182610 }, { "epoch": 0.32, "learning_rate": 3.407663305628895e-05, "loss": 2.507, "step": 182620 }, { "epoch": 0.32, "learning_rate": 3.4075761116362123e-05, "loss": 2.4004, "step": 182630 }, { "epoch": 0.32, "learning_rate": 3.407488917643531e-05, "loss": 2.4158, "step": 182640 }, { "epoch": 0.32, "learning_rate": 3.407401723650848e-05, "loss": 2.4993, "step": 182650 }, { "epoch": 0.32, "learning_rate": 3.407314529658165e-05, "loss": 2.4191, "step": 182660 }, { "epoch": 0.32, "learning_rate": 3.407227335665482e-05, "loss": 2.322, "step": 182670 }, { "epoch": 0.32, "learning_rate": 3.4071401416727996e-05, "loss": 2.399, "step": 182680 }, { "epoch": 0.32, "learning_rate": 3.4070529476801166e-05, "loss": 2.4415, "step": 182690 }, { "epoch": 0.32, "learning_rate": 3.4069657536874336e-05, "loss": 2.2884, "step": 182700 }, { "epoch": 0.32, "learning_rate": 3.4068785596947514e-05, "loss": 2.519, "step": 182710 }, { "epoch": 0.32, "learning_rate": 3.406791365702069e-05, "loss": 2.4375, "step": 182720 }, { "epoch": 0.32, "learning_rate": 3.406704171709386e-05, "loss": 2.5529, "step": 182730 }, { "epoch": 0.32, "learning_rate": 3.406616977716703e-05, "loss": 2.3951, "step": 182740 }, { "epoch": 0.32, "learning_rate": 3.406529783724021e-05, "loss": 2.3971, "step": 182750 }, { "epoch": 0.32, "learning_rate": 3.406442589731338e-05, "loss": 2.389, "step": 182760 }, { "epoch": 0.32, "learning_rate": 3.406355395738655e-05, "loss": 2.4827, "step": 182770 }, { "epoch": 0.32, "learning_rate": 3.4062682017459727e-05, "loss": 2.4722, "step": 182780 }, { "epoch": 0.32, "learning_rate": 3.4061810077532904e-05, "loss": 2.3975, "step": 182790 }, { "epoch": 0.32, "learning_rate": 3.4060938137606074e-05, "loss": 2.4654, "step": 182800 }, { "epoch": 0.32, "learning_rate": 3.4060066197679245e-05, "loss": 2.3762, "step": 182810 }, { "epoch": 0.32, "learning_rate": 3.405919425775242e-05, "loss": 2.3382, "step": 182820 }, { "epoch": 0.32, "learning_rate": 3.405832231782559e-05, "loss": 2.3225, "step": 182830 }, { "epoch": 0.32, "learning_rate": 3.405745037789876e-05, "loss": 2.5992, "step": 182840 }, { "epoch": 0.32, "learning_rate": 3.405657843797194e-05, "loss": 2.3843, "step": 182850 }, { "epoch": 0.32, "learning_rate": 3.405570649804512e-05, "loss": 2.42, "step": 182860 }, { "epoch": 0.32, "learning_rate": 3.405483455811829e-05, "loss": 2.4415, "step": 182870 }, { "epoch": 0.32, "learning_rate": 3.405396261819146e-05, "loss": 2.4178, "step": 182880 }, { "epoch": 0.32, "learning_rate": 3.4053090678264635e-05, "loss": 2.508, "step": 182890 }, { "epoch": 0.32, "learning_rate": 3.4052218738337805e-05, "loss": 2.4363, "step": 182900 }, { "epoch": 0.32, "learning_rate": 3.4051346798410975e-05, "loss": 2.3682, "step": 182910 }, { "epoch": 0.32, "learning_rate": 3.405047485848415e-05, "loss": 2.4251, "step": 182920 }, { "epoch": 0.32, "learning_rate": 3.404960291855733e-05, "loss": 2.5009, "step": 182930 }, { "epoch": 0.32, "learning_rate": 3.40487309786305e-05, "loss": 2.3652, "step": 182940 }, { "epoch": 0.32, "learning_rate": 3.404785903870367e-05, "loss": 2.4005, "step": 182950 }, { "epoch": 0.32, "learning_rate": 3.404698709877685e-05, "loss": 2.4745, "step": 182960 }, { "epoch": 0.32, "learning_rate": 3.404611515885002e-05, "loss": 2.3535, "step": 182970 }, { "epoch": 0.32, "learning_rate": 3.404524321892319e-05, "loss": 2.4048, "step": 182980 }, { "epoch": 0.32, "learning_rate": 3.404437127899636e-05, "loss": 2.5371, "step": 182990 }, { "epoch": 0.32, "learning_rate": 3.4043499339069536e-05, "loss": 2.4242, "step": 183000 }, { "epoch": 0.32, "learning_rate": 3.404262739914271e-05, "loss": 2.3661, "step": 183010 }, { "epoch": 0.32, "learning_rate": 3.4041755459215884e-05, "loss": 2.3614, "step": 183020 }, { "epoch": 0.32, "learning_rate": 3.404088351928906e-05, "loss": 2.3447, "step": 183030 }, { "epoch": 0.32, "learning_rate": 3.404001157936223e-05, "loss": 2.3867, "step": 183040 }, { "epoch": 0.32, "learning_rate": 3.40391396394354e-05, "loss": 2.3345, "step": 183050 }, { "epoch": 0.32, "learning_rate": 3.403826769950857e-05, "loss": 2.4934, "step": 183060 }, { "epoch": 0.32, "learning_rate": 3.403739575958175e-05, "loss": 2.526, "step": 183070 }, { "epoch": 0.32, "learning_rate": 3.4036523819654926e-05, "loss": 2.4967, "step": 183080 }, { "epoch": 0.32, "learning_rate": 3.4035651879728097e-05, "loss": 2.5146, "step": 183090 }, { "epoch": 0.32, "learning_rate": 3.403477993980127e-05, "loss": 2.3262, "step": 183100 }, { "epoch": 0.32, "learning_rate": 3.4033907999874444e-05, "loss": 2.348, "step": 183110 }, { "epoch": 0.32, "learning_rate": 3.4033036059947614e-05, "loss": 2.3284, "step": 183120 }, { "epoch": 0.32, "learning_rate": 3.4032164120020785e-05, "loss": 2.5334, "step": 183130 }, { "epoch": 0.32, "learning_rate": 3.403129218009396e-05, "loss": 2.4353, "step": 183140 }, { "epoch": 0.32, "learning_rate": 3.403042024016713e-05, "loss": 2.3758, "step": 183150 }, { "epoch": 0.32, "learning_rate": 3.402954830024031e-05, "loss": 2.4222, "step": 183160 }, { "epoch": 0.32, "learning_rate": 3.402867636031348e-05, "loss": 2.4197, "step": 183170 }, { "epoch": 0.32, "learning_rate": 3.402780442038666e-05, "loss": 2.3955, "step": 183180 }, { "epoch": 0.32, "learning_rate": 3.402693248045983e-05, "loss": 2.4446, "step": 183190 }, { "epoch": 0.32, "learning_rate": 3.4026060540533e-05, "loss": 2.4697, "step": 183200 }, { "epoch": 0.32, "learning_rate": 3.4025188600606175e-05, "loss": 2.4134, "step": 183210 }, { "epoch": 0.32, "learning_rate": 3.4024316660679345e-05, "loss": 2.4341, "step": 183220 }, { "epoch": 0.32, "learning_rate": 3.402344472075252e-05, "loss": 2.3573, "step": 183230 }, { "epoch": 0.32, "learning_rate": 3.402257278082569e-05, "loss": 2.4588, "step": 183240 }, { "epoch": 0.32, "learning_rate": 3.402170084089887e-05, "loss": 2.5339, "step": 183250 }, { "epoch": 0.32, "learning_rate": 3.402082890097204e-05, "loss": 2.4213, "step": 183260 }, { "epoch": 0.32, "learning_rate": 3.401995696104521e-05, "loss": 2.5089, "step": 183270 }, { "epoch": 0.32, "learning_rate": 3.401908502111839e-05, "loss": 2.3452, "step": 183280 }, { "epoch": 0.32, "learning_rate": 3.401821308119156e-05, "loss": 2.465, "step": 183290 }, { "epoch": 0.32, "learning_rate": 3.4017341141264736e-05, "loss": 2.4622, "step": 183300 }, { "epoch": 0.32, "learning_rate": 3.4016469201337906e-05, "loss": 2.4518, "step": 183310 }, { "epoch": 0.32, "learning_rate": 3.401559726141108e-05, "loss": 2.3686, "step": 183320 }, { "epoch": 0.32, "learning_rate": 3.4014725321484253e-05, "loss": 2.4838, "step": 183330 }, { "epoch": 0.32, "learning_rate": 3.4013853381557424e-05, "loss": 2.2734, "step": 183340 }, { "epoch": 0.32, "learning_rate": 3.40129814416306e-05, "loss": 2.405, "step": 183350 }, { "epoch": 0.32, "learning_rate": 3.401210950170377e-05, "loss": 2.4095, "step": 183360 }, { "epoch": 0.32, "learning_rate": 3.401123756177694e-05, "loss": 2.4979, "step": 183370 }, { "epoch": 0.32, "learning_rate": 3.401036562185012e-05, "loss": 2.525, "step": 183380 }, { "epoch": 0.32, "learning_rate": 3.4009493681923296e-05, "loss": 2.3983, "step": 183390 }, { "epoch": 0.32, "learning_rate": 3.4008621741996466e-05, "loss": 2.3764, "step": 183400 }, { "epoch": 0.32, "learning_rate": 3.400774980206964e-05, "loss": 2.4705, "step": 183410 }, { "epoch": 0.32, "learning_rate": 3.4006877862142814e-05, "loss": 2.4844, "step": 183420 }, { "epoch": 0.32, "learning_rate": 3.4006005922215984e-05, "loss": 2.4824, "step": 183430 }, { "epoch": 0.32, "learning_rate": 3.4005133982289155e-05, "loss": 2.3806, "step": 183440 }, { "epoch": 0.32, "learning_rate": 3.400426204236233e-05, "loss": 2.485, "step": 183450 }, { "epoch": 0.32, "learning_rate": 3.400339010243551e-05, "loss": 2.4623, "step": 183460 }, { "epoch": 0.32, "learning_rate": 3.400251816250868e-05, "loss": 2.4229, "step": 183470 }, { "epoch": 0.32, "learning_rate": 3.400164622258185e-05, "loss": 2.5375, "step": 183480 }, { "epoch": 0.32, "learning_rate": 3.400077428265502e-05, "loss": 2.2974, "step": 183490 }, { "epoch": 0.32, "learning_rate": 3.39999023427282e-05, "loss": 2.5437, "step": 183500 }, { "epoch": 0.32, "learning_rate": 3.399903040280137e-05, "loss": 2.3359, "step": 183510 }, { "epoch": 0.32, "learning_rate": 3.399815846287454e-05, "loss": 2.489, "step": 183520 }, { "epoch": 0.32, "learning_rate": 3.399728652294772e-05, "loss": 2.285, "step": 183530 }, { "epoch": 0.32, "learning_rate": 3.399641458302089e-05, "loss": 2.4511, "step": 183540 }, { "epoch": 0.32, "learning_rate": 3.399554264309406e-05, "loss": 2.4074, "step": 183550 }, { "epoch": 0.32, "learning_rate": 3.399467070316723e-05, "loss": 2.3316, "step": 183560 }, { "epoch": 0.32, "learning_rate": 3.399379876324041e-05, "loss": 2.4362, "step": 183570 }, { "epoch": 0.32, "learning_rate": 3.399292682331358e-05, "loss": 2.4166, "step": 183580 }, { "epoch": 0.32, "learning_rate": 3.399205488338675e-05, "loss": 2.5126, "step": 183590 }, { "epoch": 0.32, "learning_rate": 3.399118294345993e-05, "loss": 2.5088, "step": 183600 }, { "epoch": 0.32, "learning_rate": 3.3990311003533105e-05, "loss": 2.4248, "step": 183610 }, { "epoch": 0.32, "learning_rate": 3.3989439063606276e-05, "loss": 2.3561, "step": 183620 }, { "epoch": 0.32, "learning_rate": 3.3988567123679446e-05, "loss": 2.475, "step": 183630 }, { "epoch": 0.32, "learning_rate": 3.398769518375262e-05, "loss": 2.494, "step": 183640 }, { "epoch": 0.32, "learning_rate": 3.3986823243825794e-05, "loss": 2.46, "step": 183650 }, { "epoch": 0.32, "learning_rate": 3.3985951303898964e-05, "loss": 2.4539, "step": 183660 }, { "epoch": 0.32, "learning_rate": 3.398507936397214e-05, "loss": 2.4798, "step": 183670 }, { "epoch": 0.32, "learning_rate": 3.398420742404532e-05, "loss": 2.368, "step": 183680 }, { "epoch": 0.32, "learning_rate": 3.398333548411849e-05, "loss": 2.291, "step": 183690 }, { "epoch": 0.32, "learning_rate": 3.398246354419166e-05, "loss": 2.5213, "step": 183700 }, { "epoch": 0.32, "learning_rate": 3.3981591604264836e-05, "loss": 2.4236, "step": 183710 }, { "epoch": 0.32, "learning_rate": 3.398071966433801e-05, "loss": 2.488, "step": 183720 }, { "epoch": 0.32, "learning_rate": 3.397984772441118e-05, "loss": 2.4463, "step": 183730 }, { "epoch": 0.32, "learning_rate": 3.3978975784484354e-05, "loss": 2.4366, "step": 183740 }, { "epoch": 0.32, "learning_rate": 3.397810384455753e-05, "loss": 2.3856, "step": 183750 }, { "epoch": 0.32, "learning_rate": 3.39772319046307e-05, "loss": 2.5343, "step": 183760 }, { "epoch": 0.32, "learning_rate": 3.397635996470387e-05, "loss": 2.4048, "step": 183770 }, { "epoch": 0.32, "learning_rate": 3.397548802477705e-05, "loss": 2.5708, "step": 183780 }, { "epoch": 0.32, "learning_rate": 3.397461608485022e-05, "loss": 2.5129, "step": 183790 }, { "epoch": 0.32, "learning_rate": 3.397374414492339e-05, "loss": 2.4056, "step": 183800 }, { "epoch": 0.32, "learning_rate": 3.397287220499657e-05, "loss": 2.4454, "step": 183810 }, { "epoch": 0.32, "learning_rate": 3.397200026506974e-05, "loss": 2.4262, "step": 183820 }, { "epoch": 0.32, "learning_rate": 3.3971128325142915e-05, "loss": 2.4484, "step": 183830 }, { "epoch": 0.32, "learning_rate": 3.3970256385216085e-05, "loss": 2.5566, "step": 183840 }, { "epoch": 0.32, "learning_rate": 3.396938444528926e-05, "loss": 2.4267, "step": 183850 }, { "epoch": 0.32, "learning_rate": 3.396851250536243e-05, "loss": 2.3885, "step": 183860 }, { "epoch": 0.32, "learning_rate": 3.39676405654356e-05, "loss": 2.4194, "step": 183870 }, { "epoch": 0.32, "learning_rate": 3.396676862550878e-05, "loss": 2.3334, "step": 183880 }, { "epoch": 0.32, "learning_rate": 3.396589668558195e-05, "loss": 2.3684, "step": 183890 }, { "epoch": 0.32, "learning_rate": 3.396502474565513e-05, "loss": 2.4161, "step": 183900 }, { "epoch": 0.32, "learning_rate": 3.39641528057283e-05, "loss": 2.4981, "step": 183910 }, { "epoch": 0.32, "learning_rate": 3.3963280865801475e-05, "loss": 2.5065, "step": 183920 }, { "epoch": 0.32, "learning_rate": 3.3962408925874646e-05, "loss": 2.4388, "step": 183930 }, { "epoch": 0.32, "learning_rate": 3.3961536985947816e-05, "loss": 2.4363, "step": 183940 }, { "epoch": 0.32, "learning_rate": 3.3960665046020987e-05, "loss": 2.3862, "step": 183950 }, { "epoch": 0.32, "learning_rate": 3.3959793106094164e-05, "loss": 2.3493, "step": 183960 }, { "epoch": 0.32, "learning_rate": 3.395892116616734e-05, "loss": 2.4066, "step": 183970 }, { "epoch": 0.32, "learning_rate": 3.395804922624051e-05, "loss": 2.4777, "step": 183980 }, { "epoch": 0.32, "learning_rate": 3.395717728631369e-05, "loss": 2.503, "step": 183990 }, { "epoch": 0.32, "learning_rate": 3.395630534638686e-05, "loss": 2.2871, "step": 184000 }, { "epoch": 0.32, "learning_rate": 3.395543340646003e-05, "loss": 2.4798, "step": 184010 }, { "epoch": 0.32, "learning_rate": 3.39545614665332e-05, "loss": 2.4758, "step": 184020 }, { "epoch": 0.32, "learning_rate": 3.395368952660638e-05, "loss": 2.3666, "step": 184030 }, { "epoch": 0.32, "learning_rate": 3.395281758667955e-05, "loss": 2.4513, "step": 184040 }, { "epoch": 0.32, "learning_rate": 3.3951945646752724e-05, "loss": 2.3143, "step": 184050 }, { "epoch": 0.32, "learning_rate": 3.3951073706825895e-05, "loss": 2.4392, "step": 184060 }, { "epoch": 0.32, "learning_rate": 3.395020176689907e-05, "loss": 2.4229, "step": 184070 }, { "epoch": 0.32, "learning_rate": 3.394932982697224e-05, "loss": 2.4357, "step": 184080 }, { "epoch": 0.32, "learning_rate": 3.394845788704541e-05, "loss": 2.4561, "step": 184090 }, { "epoch": 0.32, "learning_rate": 3.394758594711859e-05, "loss": 2.4301, "step": 184100 }, { "epoch": 0.32, "learning_rate": 3.394671400719176e-05, "loss": 2.5076, "step": 184110 }, { "epoch": 0.32, "learning_rate": 3.394584206726494e-05, "loss": 2.4351, "step": 184120 }, { "epoch": 0.32, "learning_rate": 3.394497012733811e-05, "loss": 2.4456, "step": 184130 }, { "epoch": 0.32, "learning_rate": 3.3944098187411285e-05, "loss": 2.5202, "step": 184140 }, { "epoch": 0.32, "learning_rate": 3.3943226247484455e-05, "loss": 2.5656, "step": 184150 }, { "epoch": 0.32, "learning_rate": 3.3942354307557626e-05, "loss": 2.4449, "step": 184160 }, { "epoch": 0.32, "learning_rate": 3.39414823676308e-05, "loss": 2.4795, "step": 184170 }, { "epoch": 0.32, "learning_rate": 3.394061042770397e-05, "loss": 2.4575, "step": 184180 }, { "epoch": 0.32, "learning_rate": 3.3939738487777143e-05, "loss": 2.5442, "step": 184190 }, { "epoch": 0.32, "learning_rate": 3.393886654785032e-05, "loss": 2.3655, "step": 184200 }, { "epoch": 0.32, "learning_rate": 3.39379946079235e-05, "loss": 2.4254, "step": 184210 }, { "epoch": 0.32, "learning_rate": 3.393712266799667e-05, "loss": 2.4849, "step": 184220 }, { "epoch": 0.32, "learning_rate": 3.393625072806984e-05, "loss": 2.4098, "step": 184230 }, { "epoch": 0.32, "learning_rate": 3.3935378788143016e-05, "loss": 2.353, "step": 184240 }, { "epoch": 0.32, "learning_rate": 3.3934506848216186e-05, "loss": 2.3732, "step": 184250 }, { "epoch": 0.32, "learning_rate": 3.3933634908289356e-05, "loss": 2.4198, "step": 184260 }, { "epoch": 0.32, "learning_rate": 3.3932762968362534e-05, "loss": 2.3151, "step": 184270 }, { "epoch": 0.32, "learning_rate": 3.393189102843571e-05, "loss": 2.405, "step": 184280 }, { "epoch": 0.32, "learning_rate": 3.393101908850888e-05, "loss": 2.4132, "step": 184290 }, { "epoch": 0.32, "learning_rate": 3.393014714858205e-05, "loss": 2.3474, "step": 184300 }, { "epoch": 0.32, "learning_rate": 3.392927520865523e-05, "loss": 2.5441, "step": 184310 }, { "epoch": 0.32, "learning_rate": 3.39284032687284e-05, "loss": 2.3145, "step": 184320 }, { "epoch": 0.32, "learning_rate": 3.392753132880157e-05, "loss": 2.4745, "step": 184330 }, { "epoch": 0.32, "learning_rate": 3.392665938887474e-05, "loss": 2.3436, "step": 184340 }, { "epoch": 0.32, "learning_rate": 3.3925787448947924e-05, "loss": 2.4452, "step": 184350 }, { "epoch": 0.32, "learning_rate": 3.3924915509021094e-05, "loss": 2.6217, "step": 184360 }, { "epoch": 0.32, "learning_rate": 3.3924043569094265e-05, "loss": 2.3715, "step": 184370 }, { "epoch": 0.32, "learning_rate": 3.392317162916744e-05, "loss": 2.4146, "step": 184380 }, { "epoch": 0.32, "learning_rate": 3.392229968924061e-05, "loss": 2.3575, "step": 184390 }, { "epoch": 0.32, "learning_rate": 3.392142774931378e-05, "loss": 2.4469, "step": 184400 }, { "epoch": 0.32, "learning_rate": 3.392055580938695e-05, "loss": 2.4877, "step": 184410 }, { "epoch": 0.32, "learning_rate": 3.391968386946014e-05, "loss": 2.3601, "step": 184420 }, { "epoch": 0.32, "learning_rate": 3.391881192953331e-05, "loss": 2.3658, "step": 184430 }, { "epoch": 0.32, "learning_rate": 3.391793998960648e-05, "loss": 2.4057, "step": 184440 }, { "epoch": 0.32, "learning_rate": 3.391706804967965e-05, "loss": 2.3706, "step": 184450 }, { "epoch": 0.32, "learning_rate": 3.3916196109752825e-05, "loss": 2.4588, "step": 184460 }, { "epoch": 0.32, "learning_rate": 3.3915324169825995e-05, "loss": 2.5113, "step": 184470 }, { "epoch": 0.32, "learning_rate": 3.3914452229899166e-05, "loss": 2.5097, "step": 184480 }, { "epoch": 0.32, "learning_rate": 3.391358028997234e-05, "loss": 2.458, "step": 184490 }, { "epoch": 0.32, "learning_rate": 3.391270835004552e-05, "loss": 2.4859, "step": 184500 }, { "epoch": 0.32, "learning_rate": 3.391183641011869e-05, "loss": 2.4128, "step": 184510 }, { "epoch": 0.32, "learning_rate": 3.391096447019186e-05, "loss": 2.5628, "step": 184520 }, { "epoch": 0.32, "learning_rate": 3.391009253026504e-05, "loss": 2.4401, "step": 184530 }, { "epoch": 0.32, "learning_rate": 3.390922059033821e-05, "loss": 2.435, "step": 184540 }, { "epoch": 0.32, "learning_rate": 3.390834865041138e-05, "loss": 2.4897, "step": 184550 }, { "epoch": 0.32, "learning_rate": 3.3907476710484556e-05, "loss": 2.388, "step": 184560 }, { "epoch": 0.32, "learning_rate": 3.390660477055773e-05, "loss": 2.4067, "step": 184570 }, { "epoch": 0.32, "learning_rate": 3.3905732830630904e-05, "loss": 2.4715, "step": 184580 }, { "epoch": 0.32, "learning_rate": 3.3904860890704074e-05, "loss": 2.3972, "step": 184590 }, { "epoch": 0.32, "learning_rate": 3.390398895077725e-05, "loss": 2.4441, "step": 184600 }, { "epoch": 0.32, "learning_rate": 3.390311701085042e-05, "loss": 2.425, "step": 184610 }, { "epoch": 0.32, "learning_rate": 3.390224507092359e-05, "loss": 2.5168, "step": 184620 }, { "epoch": 0.32, "learning_rate": 3.390137313099677e-05, "loss": 2.4173, "step": 184630 }, { "epoch": 0.32, "learning_rate": 3.3900501191069946e-05, "loss": 2.6083, "step": 184640 }, { "epoch": 0.32, "learning_rate": 3.3899629251143117e-05, "loss": 2.5281, "step": 184650 }, { "epoch": 0.32, "learning_rate": 3.389875731121629e-05, "loss": 2.3556, "step": 184660 }, { "epoch": 0.32, "learning_rate": 3.3897885371289464e-05, "loss": 2.5294, "step": 184670 }, { "epoch": 0.32, "learning_rate": 3.3897013431362634e-05, "loss": 2.3611, "step": 184680 }, { "epoch": 0.32, "learning_rate": 3.3896141491435805e-05, "loss": 2.469, "step": 184690 }, { "epoch": 0.32, "learning_rate": 3.389526955150898e-05, "loss": 2.3267, "step": 184700 }, { "epoch": 0.32, "learning_rate": 3.389439761158215e-05, "loss": 2.4025, "step": 184710 }, { "epoch": 0.32, "learning_rate": 3.389352567165533e-05, "loss": 2.3811, "step": 184720 }, { "epoch": 0.32, "learning_rate": 3.38926537317285e-05, "loss": 2.4953, "step": 184730 }, { "epoch": 0.32, "learning_rate": 3.389178179180168e-05, "loss": 2.3731, "step": 184740 }, { "epoch": 0.32, "learning_rate": 3.389090985187485e-05, "loss": 2.3287, "step": 184750 }, { "epoch": 0.32, "learning_rate": 3.389003791194802e-05, "loss": 2.4795, "step": 184760 }, { "epoch": 0.32, "learning_rate": 3.3889165972021195e-05, "loss": 2.4997, "step": 184770 }, { "epoch": 0.32, "learning_rate": 3.3888294032094365e-05, "loss": 2.4453, "step": 184780 }, { "epoch": 0.32, "learning_rate": 3.388742209216754e-05, "loss": 2.4558, "step": 184790 }, { "epoch": 0.32, "learning_rate": 3.388655015224071e-05, "loss": 2.4239, "step": 184800 }, { "epoch": 0.32, "learning_rate": 3.388567821231389e-05, "loss": 2.3631, "step": 184810 }, { "epoch": 0.32, "learning_rate": 3.388480627238706e-05, "loss": 2.4131, "step": 184820 }, { "epoch": 0.32, "learning_rate": 3.388393433246023e-05, "loss": 2.3918, "step": 184830 }, { "epoch": 0.32, "learning_rate": 3.38830623925334e-05, "loss": 2.427, "step": 184840 }, { "epoch": 0.32, "learning_rate": 3.388219045260658e-05, "loss": 2.4944, "step": 184850 }, { "epoch": 0.32, "learning_rate": 3.388131851267975e-05, "loss": 2.4298, "step": 184860 }, { "epoch": 0.32, "learning_rate": 3.3880446572752926e-05, "loss": 2.4965, "step": 184870 }, { "epoch": 0.32, "learning_rate": 3.38795746328261e-05, "loss": 2.4051, "step": 184880 }, { "epoch": 0.32, "learning_rate": 3.3878702692899273e-05, "loss": 2.3611, "step": 184890 }, { "epoch": 0.32, "learning_rate": 3.3877830752972444e-05, "loss": 2.4047, "step": 184900 }, { "epoch": 0.32, "learning_rate": 3.3876958813045614e-05, "loss": 2.3576, "step": 184910 }, { "epoch": 0.32, "learning_rate": 3.387608687311879e-05, "loss": 2.3989, "step": 184920 }, { "epoch": 0.32, "learning_rate": 3.387521493319196e-05, "loss": 2.309, "step": 184930 }, { "epoch": 0.32, "learning_rate": 3.387434299326514e-05, "loss": 2.343, "step": 184940 }, { "epoch": 0.32, "learning_rate": 3.387347105333831e-05, "loss": 2.387, "step": 184950 }, { "epoch": 0.32, "learning_rate": 3.3872599113411486e-05, "loss": 2.4012, "step": 184960 }, { "epoch": 0.32, "learning_rate": 3.387172717348466e-05, "loss": 2.467, "step": 184970 }, { "epoch": 0.32, "learning_rate": 3.387085523355783e-05, "loss": 2.4205, "step": 184980 }, { "epoch": 0.32, "learning_rate": 3.3869983293631004e-05, "loss": 2.4574, "step": 184990 }, { "epoch": 0.32, "learning_rate": 3.3869111353704175e-05, "loss": 2.4167, "step": 185000 }, { "epoch": 0.32, "learning_rate": 3.3868239413777345e-05, "loss": 2.4929, "step": 185010 }, { "epoch": 0.32, "learning_rate": 3.386736747385052e-05, "loss": 2.4262, "step": 185020 }, { "epoch": 0.32, "learning_rate": 3.38664955339237e-05, "loss": 2.3831, "step": 185030 }, { "epoch": 0.32, "learning_rate": 3.386562359399687e-05, "loss": 2.3498, "step": 185040 }, { "epoch": 0.32, "learning_rate": 3.386475165407004e-05, "loss": 2.3643, "step": 185050 }, { "epoch": 0.32, "learning_rate": 3.386387971414322e-05, "loss": 2.2579, "step": 185060 }, { "epoch": 0.32, "learning_rate": 3.386300777421639e-05, "loss": 2.4827, "step": 185070 }, { "epoch": 0.32, "learning_rate": 3.386213583428956e-05, "loss": 2.4079, "step": 185080 }, { "epoch": 0.32, "learning_rate": 3.3861263894362735e-05, "loss": 2.4876, "step": 185090 }, { "epoch": 0.32, "learning_rate": 3.386039195443591e-05, "loss": 2.5349, "step": 185100 }, { "epoch": 0.32, "learning_rate": 3.385952001450908e-05, "loss": 2.4277, "step": 185110 }, { "epoch": 0.32, "learning_rate": 3.385864807458225e-05, "loss": 2.433, "step": 185120 }, { "epoch": 0.32, "learning_rate": 3.385777613465543e-05, "loss": 2.5276, "step": 185130 }, { "epoch": 0.32, "learning_rate": 3.38569041947286e-05, "loss": 2.5316, "step": 185140 }, { "epoch": 0.32, "learning_rate": 3.385603225480177e-05, "loss": 2.522, "step": 185150 }, { "epoch": 0.32, "learning_rate": 3.385516031487495e-05, "loss": 2.5053, "step": 185160 }, { "epoch": 0.32, "learning_rate": 3.3854288374948125e-05, "loss": 2.2844, "step": 185170 }, { "epoch": 0.32, "learning_rate": 3.3853416435021296e-05, "loss": 2.4017, "step": 185180 }, { "epoch": 0.32, "learning_rate": 3.3852544495094466e-05, "loss": 2.4466, "step": 185190 }, { "epoch": 0.32, "learning_rate": 3.385167255516764e-05, "loss": 2.433, "step": 185200 }, { "epoch": 0.32, "learning_rate": 3.3850800615240814e-05, "loss": 2.5239, "step": 185210 }, { "epoch": 0.32, "learning_rate": 3.3849928675313984e-05, "loss": 2.4652, "step": 185220 }, { "epoch": 0.32, "learning_rate": 3.384905673538716e-05, "loss": 2.4177, "step": 185230 }, { "epoch": 0.32, "learning_rate": 3.384818479546034e-05, "loss": 2.4688, "step": 185240 }, { "epoch": 0.32, "learning_rate": 3.384731285553351e-05, "loss": 2.3758, "step": 185250 }, { "epoch": 0.32, "learning_rate": 3.384644091560668e-05, "loss": 2.4823, "step": 185260 }, { "epoch": 0.32, "learning_rate": 3.3845568975679856e-05, "loss": 2.5183, "step": 185270 }, { "epoch": 0.32, "learning_rate": 3.384469703575303e-05, "loss": 2.4251, "step": 185280 }, { "epoch": 0.32, "learning_rate": 3.38438250958262e-05, "loss": 2.4279, "step": 185290 }, { "epoch": 0.32, "learning_rate": 3.384295315589937e-05, "loss": 2.4908, "step": 185300 }, { "epoch": 0.32, "learning_rate": 3.384208121597255e-05, "loss": 2.3444, "step": 185310 }, { "epoch": 0.32, "learning_rate": 3.384120927604572e-05, "loss": 2.3846, "step": 185320 }, { "epoch": 0.32, "learning_rate": 3.384033733611889e-05, "loss": 2.4735, "step": 185330 }, { "epoch": 0.32, "learning_rate": 3.383946539619207e-05, "loss": 2.4167, "step": 185340 }, { "epoch": 0.32, "learning_rate": 3.383859345626524e-05, "loss": 2.5344, "step": 185350 }, { "epoch": 0.32, "learning_rate": 3.383772151633841e-05, "loss": 2.3708, "step": 185360 }, { "epoch": 0.32, "learning_rate": 3.383684957641158e-05, "loss": 2.4144, "step": 185370 }, { "epoch": 0.32, "learning_rate": 3.383597763648476e-05, "loss": 2.3832, "step": 185380 }, { "epoch": 0.32, "learning_rate": 3.3835105696557935e-05, "loss": 2.4784, "step": 185390 }, { "epoch": 0.32, "learning_rate": 3.3834233756631105e-05, "loss": 2.2918, "step": 185400 }, { "epoch": 0.32, "learning_rate": 3.3833361816704276e-05, "loss": 2.5397, "step": 185410 }, { "epoch": 0.32, "learning_rate": 3.383248987677745e-05, "loss": 2.3688, "step": 185420 }, { "epoch": 0.32, "learning_rate": 3.383161793685062e-05, "loss": 2.3587, "step": 185430 }, { "epoch": 0.32, "learning_rate": 3.3830745996923794e-05, "loss": 2.4156, "step": 185440 }, { "epoch": 0.32, "learning_rate": 3.382987405699697e-05, "loss": 2.4676, "step": 185450 }, { "epoch": 0.32, "learning_rate": 3.382900211707015e-05, "loss": 2.4115, "step": 185460 }, { "epoch": 0.32, "learning_rate": 3.382813017714332e-05, "loss": 2.4778, "step": 185470 }, { "epoch": 0.32, "learning_rate": 3.382725823721649e-05, "loss": 2.3937, "step": 185480 }, { "epoch": 0.32, "learning_rate": 3.3826386297289666e-05, "loss": 2.6008, "step": 185490 }, { "epoch": 0.32, "learning_rate": 3.3825514357362836e-05, "loss": 2.3789, "step": 185500 }, { "epoch": 0.32, "learning_rate": 3.3824642417436007e-05, "loss": 2.5184, "step": 185510 }, { "epoch": 0.32, "learning_rate": 3.3823770477509184e-05, "loss": 2.4604, "step": 185520 }, { "epoch": 0.32, "learning_rate": 3.3822898537582354e-05, "loss": 2.4658, "step": 185530 }, { "epoch": 0.32, "learning_rate": 3.382202659765553e-05, "loss": 2.3234, "step": 185540 }, { "epoch": 0.32, "learning_rate": 3.38211546577287e-05, "loss": 2.4373, "step": 185550 }, { "epoch": 0.32, "learning_rate": 3.382028271780188e-05, "loss": 2.4099, "step": 185560 }, { "epoch": 0.32, "learning_rate": 3.381941077787505e-05, "loss": 2.4382, "step": 185570 }, { "epoch": 0.32, "learning_rate": 3.381853883794822e-05, "loss": 2.5034, "step": 185580 }, { "epoch": 0.32, "learning_rate": 3.38176668980214e-05, "loss": 2.3126, "step": 185590 }, { "epoch": 0.32, "learning_rate": 3.381679495809457e-05, "loss": 2.5828, "step": 185600 }, { "epoch": 0.32, "learning_rate": 3.3815923018167744e-05, "loss": 2.3845, "step": 185610 }, { "epoch": 0.32, "learning_rate": 3.3815051078240915e-05, "loss": 2.335, "step": 185620 }, { "epoch": 0.32, "learning_rate": 3.381417913831409e-05, "loss": 2.4537, "step": 185630 }, { "epoch": 0.32, "learning_rate": 3.381330719838726e-05, "loss": 2.4975, "step": 185640 }, { "epoch": 0.32, "learning_rate": 3.381243525846043e-05, "loss": 2.4886, "step": 185650 }, { "epoch": 0.32, "learning_rate": 3.381156331853361e-05, "loss": 2.4998, "step": 185660 }, { "epoch": 0.32, "learning_rate": 3.381069137860678e-05, "loss": 2.4556, "step": 185670 }, { "epoch": 0.32, "learning_rate": 3.380981943867995e-05, "loss": 2.4317, "step": 185680 }, { "epoch": 0.32, "learning_rate": 3.380894749875313e-05, "loss": 2.4039, "step": 185690 }, { "epoch": 0.32, "learning_rate": 3.3808075558826305e-05, "loss": 2.3627, "step": 185700 }, { "epoch": 0.32, "learning_rate": 3.3807203618899475e-05, "loss": 2.5082, "step": 185710 }, { "epoch": 0.32, "learning_rate": 3.3806331678972646e-05, "loss": 2.4431, "step": 185720 }, { "epoch": 0.32, "learning_rate": 3.380545973904582e-05, "loss": 2.3924, "step": 185730 }, { "epoch": 0.32, "learning_rate": 3.380458779911899e-05, "loss": 2.4992, "step": 185740 }, { "epoch": 0.32, "learning_rate": 3.3803715859192163e-05, "loss": 2.3573, "step": 185750 }, { "epoch": 0.32, "learning_rate": 3.380284391926534e-05, "loss": 2.3494, "step": 185760 }, { "epoch": 0.32, "learning_rate": 3.380197197933852e-05, "loss": 2.4166, "step": 185770 }, { "epoch": 0.32, "learning_rate": 3.380110003941169e-05, "loss": 2.395, "step": 185780 }, { "epoch": 0.32, "learning_rate": 3.380022809948486e-05, "loss": 2.4249, "step": 185790 }, { "epoch": 0.32, "learning_rate": 3.379935615955803e-05, "loss": 2.4474, "step": 185800 }, { "epoch": 0.32, "learning_rate": 3.3798484219631206e-05, "loss": 2.3559, "step": 185810 }, { "epoch": 0.32, "learning_rate": 3.3797612279704376e-05, "loss": 2.6205, "step": 185820 }, { "epoch": 0.32, "learning_rate": 3.3796740339777554e-05, "loss": 2.4012, "step": 185830 }, { "epoch": 0.32, "learning_rate": 3.379586839985073e-05, "loss": 2.364, "step": 185840 }, { "epoch": 0.32, "learning_rate": 3.37949964599239e-05, "loss": 2.2339, "step": 185850 }, { "epoch": 0.32, "learning_rate": 3.379412451999707e-05, "loss": 2.5014, "step": 185860 }, { "epoch": 0.32, "learning_rate": 3.379325258007024e-05, "loss": 2.5375, "step": 185870 }, { "epoch": 0.32, "learning_rate": 3.379238064014342e-05, "loss": 2.4665, "step": 185880 }, { "epoch": 0.32, "learning_rate": 3.379150870021659e-05, "loss": 2.3536, "step": 185890 }, { "epoch": 0.32, "learning_rate": 3.379063676028976e-05, "loss": 2.4277, "step": 185900 }, { "epoch": 0.32, "learning_rate": 3.378976482036294e-05, "loss": 2.4033, "step": 185910 }, { "epoch": 0.32, "learning_rate": 3.3788892880436114e-05, "loss": 2.4116, "step": 185920 }, { "epoch": 0.32, "learning_rate": 3.3788020940509285e-05, "loss": 2.4886, "step": 185930 }, { "epoch": 0.32, "learning_rate": 3.3787149000582455e-05, "loss": 2.4315, "step": 185940 }, { "epoch": 0.32, "learning_rate": 3.378627706065563e-05, "loss": 2.3811, "step": 185950 }, { "epoch": 0.32, "learning_rate": 3.37854051207288e-05, "loss": 2.4186, "step": 185960 }, { "epoch": 0.32, "learning_rate": 3.378453318080197e-05, "loss": 2.3642, "step": 185970 }, { "epoch": 0.32, "learning_rate": 3.378366124087515e-05, "loss": 2.4252, "step": 185980 }, { "epoch": 0.32, "learning_rate": 3.378278930094833e-05, "loss": 2.4103, "step": 185990 }, { "epoch": 0.32, "learning_rate": 3.37819173610215e-05, "loss": 2.4297, "step": 186000 }, { "epoch": 0.32, "learning_rate": 3.378104542109467e-05, "loss": 2.3413, "step": 186010 }, { "epoch": 0.32, "learning_rate": 3.3780173481167845e-05, "loss": 2.3871, "step": 186020 }, { "epoch": 0.32, "learning_rate": 3.3779301541241015e-05, "loss": 2.4028, "step": 186030 }, { "epoch": 0.32, "learning_rate": 3.3778429601314186e-05, "loss": 2.4323, "step": 186040 }, { "epoch": 0.32, "learning_rate": 3.377755766138736e-05, "loss": 2.421, "step": 186050 }, { "epoch": 0.32, "learning_rate": 3.377668572146054e-05, "loss": 2.4696, "step": 186060 }, { "epoch": 0.32, "learning_rate": 3.377581378153371e-05, "loss": 2.3663, "step": 186070 }, { "epoch": 0.32, "learning_rate": 3.377494184160688e-05, "loss": 2.3972, "step": 186080 }, { "epoch": 0.32, "learning_rate": 3.377406990168006e-05, "loss": 2.4624, "step": 186090 }, { "epoch": 0.32, "learning_rate": 3.377319796175323e-05, "loss": 2.3885, "step": 186100 }, { "epoch": 0.32, "learning_rate": 3.37723260218264e-05, "loss": 2.4572, "step": 186110 }, { "epoch": 0.32, "learning_rate": 3.3771454081899576e-05, "loss": 2.4589, "step": 186120 }, { "epoch": 0.32, "learning_rate": 3.377058214197275e-05, "loss": 2.6446, "step": 186130 }, { "epoch": 0.32, "learning_rate": 3.3769710202045924e-05, "loss": 2.2499, "step": 186140 }, { "epoch": 0.32, "learning_rate": 3.3768838262119094e-05, "loss": 2.4642, "step": 186150 }, { "epoch": 0.32, "learning_rate": 3.376796632219227e-05, "loss": 2.4271, "step": 186160 }, { "epoch": 0.32, "learning_rate": 3.376709438226544e-05, "loss": 2.3983, "step": 186170 }, { "epoch": 0.32, "learning_rate": 3.376622244233861e-05, "loss": 2.4427, "step": 186180 }, { "epoch": 0.32, "learning_rate": 3.376535050241178e-05, "loss": 2.4767, "step": 186190 }, { "epoch": 0.32, "learning_rate": 3.376447856248496e-05, "loss": 2.4248, "step": 186200 }, { "epoch": 0.32, "learning_rate": 3.3763606622558137e-05, "loss": 2.3521, "step": 186210 }, { "epoch": 0.32, "learning_rate": 3.376273468263131e-05, "loss": 2.3493, "step": 186220 }, { "epoch": 0.32, "learning_rate": 3.3761862742704484e-05, "loss": 2.375, "step": 186230 }, { "epoch": 0.32, "learning_rate": 3.3760990802777654e-05, "loss": 2.4347, "step": 186240 }, { "epoch": 0.32, "learning_rate": 3.3760118862850825e-05, "loss": 2.4967, "step": 186250 }, { "epoch": 0.32, "learning_rate": 3.3759246922923995e-05, "loss": 2.5443, "step": 186260 }, { "epoch": 0.32, "learning_rate": 3.375837498299717e-05, "loss": 2.3057, "step": 186270 }, { "epoch": 0.32, "learning_rate": 3.375750304307035e-05, "loss": 2.5084, "step": 186280 }, { "epoch": 0.32, "learning_rate": 3.375663110314352e-05, "loss": 2.5466, "step": 186290 }, { "epoch": 0.32, "learning_rate": 3.375575916321669e-05, "loss": 2.4103, "step": 186300 }, { "epoch": 0.32, "learning_rate": 3.375488722328987e-05, "loss": 2.3543, "step": 186310 }, { "epoch": 0.32, "learning_rate": 3.375401528336304e-05, "loss": 2.4083, "step": 186320 }, { "epoch": 0.32, "learning_rate": 3.375314334343621e-05, "loss": 2.427, "step": 186330 }, { "epoch": 0.32, "learning_rate": 3.3752271403509385e-05, "loss": 2.4894, "step": 186340 }, { "epoch": 0.32, "learning_rate": 3.3751399463582556e-05, "loss": 2.5105, "step": 186350 }, { "epoch": 0.32, "learning_rate": 3.375052752365573e-05, "loss": 2.4023, "step": 186360 }, { "epoch": 0.33, "learning_rate": 3.37496555837289e-05, "loss": 2.3667, "step": 186370 }, { "epoch": 0.33, "learning_rate": 3.374878364380208e-05, "loss": 2.4208, "step": 186380 }, { "epoch": 0.33, "learning_rate": 3.374791170387525e-05, "loss": 2.5263, "step": 186390 }, { "epoch": 0.33, "learning_rate": 3.374703976394842e-05, "loss": 2.4588, "step": 186400 }, { "epoch": 0.33, "learning_rate": 3.37461678240216e-05, "loss": 2.4637, "step": 186410 }, { "epoch": 0.33, "learning_rate": 3.374529588409477e-05, "loss": 2.3748, "step": 186420 }, { "epoch": 0.33, "learning_rate": 3.3744423944167946e-05, "loss": 2.435, "step": 186430 }, { "epoch": 0.33, "learning_rate": 3.3743552004241116e-05, "loss": 2.4452, "step": 186440 }, { "epoch": 0.33, "learning_rate": 3.3742680064314293e-05, "loss": 2.409, "step": 186450 }, { "epoch": 0.33, "learning_rate": 3.3741808124387464e-05, "loss": 2.3132, "step": 186460 }, { "epoch": 0.33, "learning_rate": 3.3740936184460634e-05, "loss": 2.4378, "step": 186470 }, { "epoch": 0.33, "learning_rate": 3.374006424453381e-05, "loss": 2.367, "step": 186480 }, { "epoch": 0.33, "learning_rate": 3.373919230460698e-05, "loss": 2.4874, "step": 186490 }, { "epoch": 0.33, "learning_rate": 3.373832036468016e-05, "loss": 2.575, "step": 186500 }, { "epoch": 0.33, "learning_rate": 3.373744842475333e-05, "loss": 2.5241, "step": 186510 }, { "epoch": 0.33, "learning_rate": 3.3736576484826506e-05, "loss": 2.3321, "step": 186520 }, { "epoch": 0.33, "learning_rate": 3.373570454489968e-05, "loss": 2.4275, "step": 186530 }, { "epoch": 0.33, "learning_rate": 3.373483260497285e-05, "loss": 2.461, "step": 186540 }, { "epoch": 0.33, "learning_rate": 3.3733960665046024e-05, "loss": 2.4467, "step": 186550 }, { "epoch": 0.33, "learning_rate": 3.3733088725119195e-05, "loss": 2.4204, "step": 186560 }, { "epoch": 0.33, "learning_rate": 3.3732216785192365e-05, "loss": 2.4826, "step": 186570 }, { "epoch": 0.33, "learning_rate": 3.373134484526554e-05, "loss": 2.42, "step": 186580 }, { "epoch": 0.33, "learning_rate": 3.373047290533872e-05, "loss": 2.4091, "step": 186590 }, { "epoch": 0.33, "learning_rate": 3.372960096541189e-05, "loss": 2.5413, "step": 186600 }, { "epoch": 0.33, "learning_rate": 3.372872902548506e-05, "loss": 2.4294, "step": 186610 }, { "epoch": 0.33, "learning_rate": 3.372785708555824e-05, "loss": 2.5432, "step": 186620 }, { "epoch": 0.33, "learning_rate": 3.372698514563141e-05, "loss": 2.4697, "step": 186630 }, { "epoch": 0.33, "learning_rate": 3.372611320570458e-05, "loss": 2.5437, "step": 186640 }, { "epoch": 0.33, "learning_rate": 3.3725241265777755e-05, "loss": 2.4964, "step": 186650 }, { "epoch": 0.33, "learning_rate": 3.372436932585093e-05, "loss": 2.4463, "step": 186660 }, { "epoch": 0.33, "learning_rate": 3.37234973859241e-05, "loss": 2.5834, "step": 186670 }, { "epoch": 0.33, "learning_rate": 3.372262544599727e-05, "loss": 2.4709, "step": 186680 }, { "epoch": 0.33, "learning_rate": 3.372175350607045e-05, "loss": 2.4337, "step": 186690 }, { "epoch": 0.33, "learning_rate": 3.372088156614362e-05, "loss": 2.4135, "step": 186700 }, { "epoch": 0.33, "learning_rate": 3.372000962621679e-05, "loss": 2.3792, "step": 186710 }, { "epoch": 0.33, "learning_rate": 3.371913768628996e-05, "loss": 2.4102, "step": 186720 }, { "epoch": 0.33, "learning_rate": 3.3718265746363145e-05, "loss": 2.3583, "step": 186730 }, { "epoch": 0.33, "learning_rate": 3.3717393806436316e-05, "loss": 2.2898, "step": 186740 }, { "epoch": 0.33, "learning_rate": 3.3716521866509486e-05, "loss": 2.386, "step": 186750 }, { "epoch": 0.33, "learning_rate": 3.371564992658266e-05, "loss": 2.3832, "step": 186760 }, { "epoch": 0.33, "learning_rate": 3.3714777986655834e-05, "loss": 2.4145, "step": 186770 }, { "epoch": 0.33, "learning_rate": 3.3713906046729004e-05, "loss": 2.3867, "step": 186780 }, { "epoch": 0.33, "learning_rate": 3.3713034106802175e-05, "loss": 2.391, "step": 186790 }, { "epoch": 0.33, "learning_rate": 3.371216216687536e-05, "loss": 2.3987, "step": 186800 }, { "epoch": 0.33, "learning_rate": 3.371129022694853e-05, "loss": 2.3901, "step": 186810 }, { "epoch": 0.33, "learning_rate": 3.37104182870217e-05, "loss": 2.3973, "step": 186820 }, { "epoch": 0.33, "learning_rate": 3.370954634709487e-05, "loss": 2.3991, "step": 186830 }, { "epoch": 0.33, "learning_rate": 3.370867440716805e-05, "loss": 2.4347, "step": 186840 }, { "epoch": 0.33, "learning_rate": 3.370780246724122e-05, "loss": 2.3038, "step": 186850 }, { "epoch": 0.33, "learning_rate": 3.370693052731439e-05, "loss": 2.4704, "step": 186860 }, { "epoch": 0.33, "learning_rate": 3.3706058587387565e-05, "loss": 2.4831, "step": 186870 }, { "epoch": 0.33, "learning_rate": 3.370518664746074e-05, "loss": 2.4123, "step": 186880 }, { "epoch": 0.33, "learning_rate": 3.370431470753391e-05, "loss": 2.5022, "step": 186890 }, { "epoch": 0.33, "learning_rate": 3.370344276760708e-05, "loss": 2.438, "step": 186900 }, { "epoch": 0.33, "learning_rate": 3.370257082768026e-05, "loss": 2.3635, "step": 186910 }, { "epoch": 0.33, "learning_rate": 3.370169888775343e-05, "loss": 2.3533, "step": 186920 }, { "epoch": 0.33, "learning_rate": 3.37008269478266e-05, "loss": 2.4397, "step": 186930 }, { "epoch": 0.33, "learning_rate": 3.369995500789978e-05, "loss": 2.3947, "step": 186940 }, { "epoch": 0.33, "learning_rate": 3.3699083067972955e-05, "loss": 2.4716, "step": 186950 }, { "epoch": 0.33, "learning_rate": 3.3698211128046125e-05, "loss": 2.3458, "step": 186960 }, { "epoch": 0.33, "learning_rate": 3.3697339188119296e-05, "loss": 2.4197, "step": 186970 }, { "epoch": 0.33, "learning_rate": 3.369646724819247e-05, "loss": 2.4035, "step": 186980 }, { "epoch": 0.33, "learning_rate": 3.369559530826564e-05, "loss": 2.4253, "step": 186990 }, { "epoch": 0.33, "learning_rate": 3.3694723368338814e-05, "loss": 2.4414, "step": 187000 }, { "epoch": 0.33, "learning_rate": 3.369385142841199e-05, "loss": 2.3991, "step": 187010 }, { "epoch": 0.33, "learning_rate": 3.369297948848516e-05, "loss": 2.5385, "step": 187020 }, { "epoch": 0.33, "learning_rate": 3.369210754855834e-05, "loss": 2.4992, "step": 187030 }, { "epoch": 0.33, "learning_rate": 3.369123560863151e-05, "loss": 2.4274, "step": 187040 }, { "epoch": 0.33, "learning_rate": 3.3690363668704686e-05, "loss": 2.3283, "step": 187050 }, { "epoch": 0.33, "learning_rate": 3.3689491728777856e-05, "loss": 2.4782, "step": 187060 }, { "epoch": 0.33, "learning_rate": 3.3688619788851027e-05, "loss": 2.5264, "step": 187070 }, { "epoch": 0.33, "learning_rate": 3.3687747848924204e-05, "loss": 2.3358, "step": 187080 }, { "epoch": 0.33, "learning_rate": 3.3686875908997374e-05, "loss": 2.4943, "step": 187090 }, { "epoch": 0.33, "learning_rate": 3.368600396907055e-05, "loss": 2.468, "step": 187100 }, { "epoch": 0.33, "learning_rate": 3.368513202914372e-05, "loss": 2.4046, "step": 187110 }, { "epoch": 0.33, "learning_rate": 3.36842600892169e-05, "loss": 2.4882, "step": 187120 }, { "epoch": 0.33, "learning_rate": 3.368338814929007e-05, "loss": 2.3885, "step": 187130 }, { "epoch": 0.33, "learning_rate": 3.368251620936324e-05, "loss": 2.2899, "step": 187140 }, { "epoch": 0.33, "learning_rate": 3.368164426943641e-05, "loss": 2.3922, "step": 187150 }, { "epoch": 0.33, "learning_rate": 3.368077232950959e-05, "loss": 2.4451, "step": 187160 }, { "epoch": 0.33, "learning_rate": 3.3679900389582764e-05, "loss": 2.4985, "step": 187170 }, { "epoch": 0.33, "learning_rate": 3.3679028449655935e-05, "loss": 2.4307, "step": 187180 }, { "epoch": 0.33, "learning_rate": 3.367815650972911e-05, "loss": 2.3884, "step": 187190 }, { "epoch": 0.33, "learning_rate": 3.367728456980228e-05, "loss": 2.4542, "step": 187200 }, { "epoch": 0.33, "learning_rate": 3.367641262987545e-05, "loss": 2.3913, "step": 187210 }, { "epoch": 0.33, "learning_rate": 3.367554068994862e-05, "loss": 2.5733, "step": 187220 }, { "epoch": 0.33, "learning_rate": 3.36746687500218e-05, "loss": 2.4684, "step": 187230 }, { "epoch": 0.33, "learning_rate": 3.367379681009497e-05, "loss": 2.3966, "step": 187240 }, { "epoch": 0.33, "learning_rate": 3.367292487016815e-05, "loss": 2.4411, "step": 187250 }, { "epoch": 0.33, "learning_rate": 3.367205293024132e-05, "loss": 2.4423, "step": 187260 }, { "epoch": 0.33, "learning_rate": 3.3671180990314495e-05, "loss": 2.3319, "step": 187270 }, { "epoch": 0.33, "learning_rate": 3.3670309050387666e-05, "loss": 2.5238, "step": 187280 }, { "epoch": 0.33, "learning_rate": 3.3669437110460836e-05, "loss": 2.3715, "step": 187290 }, { "epoch": 0.33, "learning_rate": 3.366856517053401e-05, "loss": 2.3798, "step": 187300 }, { "epoch": 0.33, "learning_rate": 3.3667693230607183e-05, "loss": 2.422, "step": 187310 }, { "epoch": 0.33, "learning_rate": 3.366682129068036e-05, "loss": 2.4433, "step": 187320 }, { "epoch": 0.33, "learning_rate": 3.366594935075353e-05, "loss": 2.4842, "step": 187330 }, { "epoch": 0.33, "learning_rate": 3.366507741082671e-05, "loss": 2.4917, "step": 187340 }, { "epoch": 0.33, "learning_rate": 3.366420547089988e-05, "loss": 2.4431, "step": 187350 }, { "epoch": 0.33, "learning_rate": 3.366333353097305e-05, "loss": 2.321, "step": 187360 }, { "epoch": 0.33, "learning_rate": 3.3662461591046226e-05, "loss": 2.4105, "step": 187370 }, { "epoch": 0.33, "learning_rate": 3.3661589651119396e-05, "loss": 2.3863, "step": 187380 }, { "epoch": 0.33, "learning_rate": 3.366071771119257e-05, "loss": 2.5224, "step": 187390 }, { "epoch": 0.33, "learning_rate": 3.3659845771265744e-05, "loss": 2.3934, "step": 187400 }, { "epoch": 0.33, "learning_rate": 3.365897383133892e-05, "loss": 2.3863, "step": 187410 }, { "epoch": 0.33, "learning_rate": 3.365810189141209e-05, "loss": 2.4614, "step": 187420 }, { "epoch": 0.33, "learning_rate": 3.365722995148526e-05, "loss": 2.4524, "step": 187430 }, { "epoch": 0.33, "learning_rate": 3.365635801155844e-05, "loss": 2.3551, "step": 187440 }, { "epoch": 0.33, "learning_rate": 3.365548607163161e-05, "loss": 2.4502, "step": 187450 }, { "epoch": 0.33, "learning_rate": 3.365461413170478e-05, "loss": 2.464, "step": 187460 }, { "epoch": 0.33, "learning_rate": 3.365374219177796e-05, "loss": 2.4404, "step": 187470 }, { "epoch": 0.33, "learning_rate": 3.3652870251851134e-05, "loss": 2.5784, "step": 187480 }, { "epoch": 0.33, "learning_rate": 3.3651998311924305e-05, "loss": 2.2893, "step": 187490 }, { "epoch": 0.33, "learning_rate": 3.3651126371997475e-05, "loss": 2.3041, "step": 187500 }, { "epoch": 0.33, "learning_rate": 3.365025443207065e-05, "loss": 2.4584, "step": 187510 }, { "epoch": 0.33, "learning_rate": 3.364938249214382e-05, "loss": 2.4467, "step": 187520 }, { "epoch": 0.33, "learning_rate": 3.364851055221699e-05, "loss": 2.4889, "step": 187530 }, { "epoch": 0.33, "learning_rate": 3.364763861229016e-05, "loss": 2.3827, "step": 187540 }, { "epoch": 0.33, "learning_rate": 3.364676667236335e-05, "loss": 2.3975, "step": 187550 }, { "epoch": 0.33, "learning_rate": 3.364589473243652e-05, "loss": 2.4316, "step": 187560 }, { "epoch": 0.33, "learning_rate": 3.364502279250969e-05, "loss": 2.4471, "step": 187570 }, { "epoch": 0.33, "learning_rate": 3.3644150852582865e-05, "loss": 2.4387, "step": 187580 }, { "epoch": 0.33, "learning_rate": 3.3643278912656035e-05, "loss": 2.4339, "step": 187590 }, { "epoch": 0.33, "learning_rate": 3.3642406972729206e-05, "loss": 2.479, "step": 187600 }, { "epoch": 0.33, "learning_rate": 3.3641535032802376e-05, "loss": 2.5941, "step": 187610 }, { "epoch": 0.33, "learning_rate": 3.364066309287556e-05, "loss": 2.5235, "step": 187620 }, { "epoch": 0.33, "learning_rate": 3.363979115294873e-05, "loss": 2.3967, "step": 187630 }, { "epoch": 0.33, "learning_rate": 3.36389192130219e-05, "loss": 2.4778, "step": 187640 }, { "epoch": 0.33, "learning_rate": 3.363804727309507e-05, "loss": 2.4797, "step": 187650 }, { "epoch": 0.33, "learning_rate": 3.363717533316825e-05, "loss": 2.2695, "step": 187660 }, { "epoch": 0.33, "learning_rate": 3.363630339324142e-05, "loss": 2.3642, "step": 187670 }, { "epoch": 0.33, "learning_rate": 3.363543145331459e-05, "loss": 2.4431, "step": 187680 }, { "epoch": 0.33, "learning_rate": 3.363455951338777e-05, "loss": 2.4717, "step": 187690 }, { "epoch": 0.33, "learning_rate": 3.3633687573460944e-05, "loss": 2.54, "step": 187700 }, { "epoch": 0.33, "learning_rate": 3.3632815633534114e-05, "loss": 2.3796, "step": 187710 }, { "epoch": 0.33, "learning_rate": 3.3631943693607284e-05, "loss": 2.5043, "step": 187720 }, { "epoch": 0.33, "learning_rate": 3.363107175368046e-05, "loss": 2.4027, "step": 187730 }, { "epoch": 0.33, "learning_rate": 3.363019981375363e-05, "loss": 2.4352, "step": 187740 }, { "epoch": 0.33, "learning_rate": 3.36293278738268e-05, "loss": 2.3622, "step": 187750 }, { "epoch": 0.33, "learning_rate": 3.362845593389998e-05, "loss": 2.4902, "step": 187760 }, { "epoch": 0.33, "learning_rate": 3.3627583993973157e-05, "loss": 2.5447, "step": 187770 }, { "epoch": 0.33, "learning_rate": 3.362671205404633e-05, "loss": 2.4536, "step": 187780 }, { "epoch": 0.33, "learning_rate": 3.36258401141195e-05, "loss": 2.4395, "step": 187790 }, { "epoch": 0.33, "learning_rate": 3.3624968174192674e-05, "loss": 2.3794, "step": 187800 }, { "epoch": 0.33, "learning_rate": 3.3624096234265845e-05, "loss": 2.426, "step": 187810 }, { "epoch": 0.33, "learning_rate": 3.3623224294339015e-05, "loss": 2.4444, "step": 187820 }, { "epoch": 0.33, "learning_rate": 3.362235235441219e-05, "loss": 2.4609, "step": 187830 }, { "epoch": 0.33, "learning_rate": 3.362148041448537e-05, "loss": 2.5456, "step": 187840 }, { "epoch": 0.33, "learning_rate": 3.362060847455854e-05, "loss": 2.4735, "step": 187850 }, { "epoch": 0.33, "learning_rate": 3.361973653463171e-05, "loss": 2.4007, "step": 187860 }, { "epoch": 0.33, "learning_rate": 3.361886459470489e-05, "loss": 2.4055, "step": 187870 }, { "epoch": 0.33, "learning_rate": 3.361799265477806e-05, "loss": 2.4245, "step": 187880 }, { "epoch": 0.33, "learning_rate": 3.361712071485123e-05, "loss": 2.4822, "step": 187890 }, { "epoch": 0.33, "learning_rate": 3.3616248774924405e-05, "loss": 2.5009, "step": 187900 }, { "epoch": 0.33, "learning_rate": 3.3615376834997576e-05, "loss": 2.3937, "step": 187910 }, { "epoch": 0.33, "learning_rate": 3.361450489507075e-05, "loss": 2.3937, "step": 187920 }, { "epoch": 0.33, "learning_rate": 3.361363295514392e-05, "loss": 2.3209, "step": 187930 }, { "epoch": 0.33, "learning_rate": 3.36127610152171e-05, "loss": 2.4492, "step": 187940 }, { "epoch": 0.33, "learning_rate": 3.361188907529027e-05, "loss": 2.4285, "step": 187950 }, { "epoch": 0.33, "learning_rate": 3.361101713536344e-05, "loss": 2.4578, "step": 187960 }, { "epoch": 0.33, "learning_rate": 3.361014519543662e-05, "loss": 2.4346, "step": 187970 }, { "epoch": 0.33, "learning_rate": 3.360927325550979e-05, "loss": 2.3956, "step": 187980 }, { "epoch": 0.33, "learning_rate": 3.3608401315582966e-05, "loss": 2.5002, "step": 187990 }, { "epoch": 0.33, "learning_rate": 3.3607529375656136e-05, "loss": 2.3356, "step": 188000 }, { "epoch": 0.33, "learning_rate": 3.3606657435729313e-05, "loss": 2.4225, "step": 188010 }, { "epoch": 0.33, "learning_rate": 3.3605785495802484e-05, "loss": 2.4621, "step": 188020 }, { "epoch": 0.33, "learning_rate": 3.3604913555875654e-05, "loss": 2.3798, "step": 188030 }, { "epoch": 0.33, "learning_rate": 3.360404161594883e-05, "loss": 2.3195, "step": 188040 }, { "epoch": 0.33, "learning_rate": 3.3603169676022e-05, "loss": 2.4567, "step": 188050 }, { "epoch": 0.33, "learning_rate": 3.360229773609517e-05, "loss": 2.5278, "step": 188060 }, { "epoch": 0.33, "learning_rate": 3.360142579616835e-05, "loss": 2.4522, "step": 188070 }, { "epoch": 0.33, "learning_rate": 3.3600553856241526e-05, "loss": 2.361, "step": 188080 }, { "epoch": 0.33, "learning_rate": 3.35996819163147e-05, "loss": 2.4513, "step": 188090 }, { "epoch": 0.33, "learning_rate": 3.359880997638787e-05, "loss": 2.5194, "step": 188100 }, { "epoch": 0.33, "learning_rate": 3.359793803646104e-05, "loss": 2.4706, "step": 188110 }, { "epoch": 0.33, "learning_rate": 3.3597066096534215e-05, "loss": 2.2757, "step": 188120 }, { "epoch": 0.33, "learning_rate": 3.3596194156607385e-05, "loss": 2.4817, "step": 188130 }, { "epoch": 0.33, "learning_rate": 3.359532221668056e-05, "loss": 2.4637, "step": 188140 }, { "epoch": 0.33, "learning_rate": 3.359445027675374e-05, "loss": 2.5056, "step": 188150 }, { "epoch": 0.33, "learning_rate": 3.359357833682691e-05, "loss": 2.4133, "step": 188160 }, { "epoch": 0.33, "learning_rate": 3.359270639690008e-05, "loss": 2.4447, "step": 188170 }, { "epoch": 0.33, "learning_rate": 3.359183445697325e-05, "loss": 2.4338, "step": 188180 }, { "epoch": 0.33, "learning_rate": 3.359096251704643e-05, "loss": 2.3172, "step": 188190 }, { "epoch": 0.33, "learning_rate": 3.35900905771196e-05, "loss": 2.3234, "step": 188200 }, { "epoch": 0.33, "learning_rate": 3.358921863719277e-05, "loss": 2.3524, "step": 188210 }, { "epoch": 0.33, "learning_rate": 3.3588346697265946e-05, "loss": 2.4676, "step": 188220 }, { "epoch": 0.33, "learning_rate": 3.358747475733912e-05, "loss": 2.4722, "step": 188230 }, { "epoch": 0.33, "learning_rate": 3.358660281741229e-05, "loss": 2.422, "step": 188240 }, { "epoch": 0.33, "learning_rate": 3.3585730877485464e-05, "loss": 2.5847, "step": 188250 }, { "epoch": 0.33, "learning_rate": 3.358485893755864e-05, "loss": 2.4144, "step": 188260 }, { "epoch": 0.33, "learning_rate": 3.358398699763181e-05, "loss": 2.428, "step": 188270 }, { "epoch": 0.33, "learning_rate": 3.358311505770498e-05, "loss": 2.4266, "step": 188280 }, { "epoch": 0.33, "learning_rate": 3.358224311777816e-05, "loss": 2.4684, "step": 188290 }, { "epoch": 0.33, "learning_rate": 3.3581371177851336e-05, "loss": 2.3116, "step": 188300 }, { "epoch": 0.33, "learning_rate": 3.3580499237924506e-05, "loss": 2.4097, "step": 188310 }, { "epoch": 0.33, "learning_rate": 3.357962729799768e-05, "loss": 2.435, "step": 188320 }, { "epoch": 0.33, "learning_rate": 3.3578755358070854e-05, "loss": 2.3724, "step": 188330 }, { "epoch": 0.33, "learning_rate": 3.3577883418144024e-05, "loss": 2.3298, "step": 188340 }, { "epoch": 0.33, "learning_rate": 3.3577011478217195e-05, "loss": 2.4695, "step": 188350 }, { "epoch": 0.33, "learning_rate": 3.357613953829037e-05, "loss": 2.5158, "step": 188360 }, { "epoch": 0.33, "learning_rate": 3.357526759836355e-05, "loss": 2.4352, "step": 188370 }, { "epoch": 0.33, "learning_rate": 3.357439565843672e-05, "loss": 2.4552, "step": 188380 }, { "epoch": 0.33, "learning_rate": 3.357352371850989e-05, "loss": 2.4107, "step": 188390 }, { "epoch": 0.33, "learning_rate": 3.357265177858307e-05, "loss": 2.498, "step": 188400 }, { "epoch": 0.33, "learning_rate": 3.357177983865624e-05, "loss": 2.459, "step": 188410 }, { "epoch": 0.33, "learning_rate": 3.357090789872941e-05, "loss": 2.37, "step": 188420 }, { "epoch": 0.33, "learning_rate": 3.3570035958802585e-05, "loss": 2.4365, "step": 188430 }, { "epoch": 0.33, "learning_rate": 3.356916401887576e-05, "loss": 2.631, "step": 188440 }, { "epoch": 0.33, "learning_rate": 3.356829207894893e-05, "loss": 2.5303, "step": 188450 }, { "epoch": 0.33, "learning_rate": 3.35674201390221e-05, "loss": 2.4006, "step": 188460 }, { "epoch": 0.33, "learning_rate": 3.356654819909528e-05, "loss": 2.4611, "step": 188470 }, { "epoch": 0.33, "learning_rate": 3.356567625916845e-05, "loss": 2.4934, "step": 188480 }, { "epoch": 0.33, "learning_rate": 3.356480431924162e-05, "loss": 2.465, "step": 188490 }, { "epoch": 0.33, "learning_rate": 3.356393237931479e-05, "loss": 2.4593, "step": 188500 }, { "epoch": 0.33, "learning_rate": 3.3563060439387975e-05, "loss": 2.4563, "step": 188510 }, { "epoch": 0.33, "learning_rate": 3.3562188499461145e-05, "loss": 2.3968, "step": 188520 }, { "epoch": 0.33, "learning_rate": 3.3561316559534316e-05, "loss": 2.5582, "step": 188530 }, { "epoch": 0.33, "learning_rate": 3.356044461960749e-05, "loss": 2.4697, "step": 188540 }, { "epoch": 0.33, "learning_rate": 3.355957267968066e-05, "loss": 2.3266, "step": 188550 }, { "epoch": 0.33, "learning_rate": 3.3558700739753834e-05, "loss": 2.5055, "step": 188560 }, { "epoch": 0.33, "learning_rate": 3.3557828799827004e-05, "loss": 2.5233, "step": 188570 }, { "epoch": 0.33, "learning_rate": 3.355695685990018e-05, "loss": 2.5394, "step": 188580 }, { "epoch": 0.33, "learning_rate": 3.355608491997336e-05, "loss": 2.4772, "step": 188590 }, { "epoch": 0.33, "learning_rate": 3.355521298004653e-05, "loss": 2.5527, "step": 188600 }, { "epoch": 0.33, "learning_rate": 3.35543410401197e-05, "loss": 2.4514, "step": 188610 }, { "epoch": 0.33, "learning_rate": 3.3553469100192876e-05, "loss": 2.3815, "step": 188620 }, { "epoch": 0.33, "learning_rate": 3.3552597160266047e-05, "loss": 2.4575, "step": 188630 }, { "epoch": 0.33, "learning_rate": 3.355172522033922e-05, "loss": 2.4541, "step": 188640 }, { "epoch": 0.33, "learning_rate": 3.3550853280412394e-05, "loss": 2.4547, "step": 188650 }, { "epoch": 0.33, "learning_rate": 3.354998134048557e-05, "loss": 2.5815, "step": 188660 }, { "epoch": 0.33, "learning_rate": 3.354910940055874e-05, "loss": 2.4729, "step": 188670 }, { "epoch": 0.33, "learning_rate": 3.354823746063191e-05, "loss": 2.4883, "step": 188680 }, { "epoch": 0.33, "learning_rate": 3.354736552070509e-05, "loss": 2.4641, "step": 188690 }, { "epoch": 0.33, "learning_rate": 3.354649358077826e-05, "loss": 2.4387, "step": 188700 }, { "epoch": 0.33, "learning_rate": 3.354562164085143e-05, "loss": 2.4269, "step": 188710 }, { "epoch": 0.33, "learning_rate": 3.354474970092461e-05, "loss": 2.3209, "step": 188720 }, { "epoch": 0.33, "learning_rate": 3.354387776099778e-05, "loss": 2.5372, "step": 188730 }, { "epoch": 0.33, "learning_rate": 3.3543005821070955e-05, "loss": 2.4825, "step": 188740 }, { "epoch": 0.33, "learning_rate": 3.3542133881144125e-05, "loss": 2.4641, "step": 188750 }, { "epoch": 0.33, "learning_rate": 3.35412619412173e-05, "loss": 2.4351, "step": 188760 }, { "epoch": 0.33, "learning_rate": 3.354039000129047e-05, "loss": 2.4893, "step": 188770 }, { "epoch": 0.33, "learning_rate": 3.353951806136364e-05, "loss": 2.456, "step": 188780 }, { "epoch": 0.33, "learning_rate": 3.353864612143682e-05, "loss": 2.4659, "step": 188790 }, { "epoch": 0.33, "learning_rate": 3.353777418150999e-05, "loss": 2.4726, "step": 188800 }, { "epoch": 0.33, "learning_rate": 3.353690224158317e-05, "loss": 2.3798, "step": 188810 }, { "epoch": 0.33, "learning_rate": 3.353603030165634e-05, "loss": 2.4226, "step": 188820 }, { "epoch": 0.33, "learning_rate": 3.3535158361729515e-05, "loss": 2.3944, "step": 188830 }, { "epoch": 0.33, "learning_rate": 3.3534286421802686e-05, "loss": 2.4519, "step": 188840 }, { "epoch": 0.33, "learning_rate": 3.3533414481875856e-05, "loss": 2.5094, "step": 188850 }, { "epoch": 0.33, "learning_rate": 3.353254254194903e-05, "loss": 2.4752, "step": 188860 }, { "epoch": 0.33, "learning_rate": 3.3531670602022203e-05, "loss": 2.4526, "step": 188870 }, { "epoch": 0.33, "learning_rate": 3.3530798662095374e-05, "loss": 2.3856, "step": 188880 }, { "epoch": 0.33, "learning_rate": 3.352992672216855e-05, "loss": 2.5045, "step": 188890 }, { "epoch": 0.33, "learning_rate": 3.352905478224173e-05, "loss": 2.5707, "step": 188900 }, { "epoch": 0.33, "learning_rate": 3.35281828423149e-05, "loss": 2.4387, "step": 188910 }, { "epoch": 0.33, "learning_rate": 3.352731090238807e-05, "loss": 2.3362, "step": 188920 }, { "epoch": 0.33, "learning_rate": 3.3526438962461246e-05, "loss": 2.3654, "step": 188930 }, { "epoch": 0.33, "learning_rate": 3.3525567022534416e-05, "loss": 2.4981, "step": 188940 }, { "epoch": 0.33, "learning_rate": 3.352469508260759e-05, "loss": 2.395, "step": 188950 }, { "epoch": 0.33, "learning_rate": 3.3523823142680764e-05, "loss": 2.4528, "step": 188960 }, { "epoch": 0.33, "learning_rate": 3.352295120275394e-05, "loss": 2.4737, "step": 188970 }, { "epoch": 0.33, "learning_rate": 3.352207926282711e-05, "loss": 2.3364, "step": 188980 }, { "epoch": 0.33, "learning_rate": 3.352120732290028e-05, "loss": 2.5527, "step": 188990 }, { "epoch": 0.33, "learning_rate": 3.352033538297345e-05, "loss": 2.3962, "step": 189000 }, { "epoch": 0.33, "learning_rate": 3.351946344304663e-05, "loss": 2.4004, "step": 189010 }, { "epoch": 0.33, "learning_rate": 3.35185915031198e-05, "loss": 2.4486, "step": 189020 }, { "epoch": 0.33, "learning_rate": 3.351771956319298e-05, "loss": 2.4786, "step": 189030 }, { "epoch": 0.33, "learning_rate": 3.3516847623266154e-05, "loss": 2.5427, "step": 189040 }, { "epoch": 0.33, "learning_rate": 3.3515975683339325e-05, "loss": 2.4162, "step": 189050 }, { "epoch": 0.33, "learning_rate": 3.3515103743412495e-05, "loss": 2.3391, "step": 189060 }, { "epoch": 0.33, "learning_rate": 3.3514231803485665e-05, "loss": 2.4635, "step": 189070 }, { "epoch": 0.33, "learning_rate": 3.351335986355884e-05, "loss": 2.417, "step": 189080 }, { "epoch": 0.33, "learning_rate": 3.351248792363201e-05, "loss": 2.3962, "step": 189090 }, { "epoch": 0.33, "learning_rate": 3.351161598370518e-05, "loss": 2.6302, "step": 189100 }, { "epoch": 0.33, "learning_rate": 3.351074404377836e-05, "loss": 2.4463, "step": 189110 }, { "epoch": 0.33, "learning_rate": 3.350987210385154e-05, "loss": 2.4588, "step": 189120 }, { "epoch": 0.33, "learning_rate": 3.350900016392471e-05, "loss": 2.3591, "step": 189130 }, { "epoch": 0.33, "learning_rate": 3.350812822399788e-05, "loss": 2.4357, "step": 189140 }, { "epoch": 0.33, "learning_rate": 3.3507256284071055e-05, "loss": 2.4485, "step": 189150 }, { "epoch": 0.33, "learning_rate": 3.3506384344144226e-05, "loss": 2.4804, "step": 189160 }, { "epoch": 0.33, "learning_rate": 3.3505512404217396e-05, "loss": 2.4532, "step": 189170 }, { "epoch": 0.33, "learning_rate": 3.3504640464290573e-05, "loss": 2.3312, "step": 189180 }, { "epoch": 0.33, "learning_rate": 3.350376852436375e-05, "loss": 2.4259, "step": 189190 }, { "epoch": 0.33, "learning_rate": 3.350289658443692e-05, "loss": 2.4539, "step": 189200 }, { "epoch": 0.33, "learning_rate": 3.350202464451009e-05, "loss": 2.545, "step": 189210 }, { "epoch": 0.33, "learning_rate": 3.350115270458327e-05, "loss": 2.4594, "step": 189220 }, { "epoch": 0.33, "learning_rate": 3.350028076465644e-05, "loss": 2.3898, "step": 189230 }, { "epoch": 0.33, "learning_rate": 3.349940882472961e-05, "loss": 2.5334, "step": 189240 }, { "epoch": 0.33, "learning_rate": 3.3498536884802786e-05, "loss": 2.3728, "step": 189250 }, { "epoch": 0.33, "learning_rate": 3.3497664944875964e-05, "loss": 2.3776, "step": 189260 }, { "epoch": 0.33, "learning_rate": 3.3496793004949134e-05, "loss": 2.4419, "step": 189270 }, { "epoch": 0.33, "learning_rate": 3.3495921065022304e-05, "loss": 2.4705, "step": 189280 }, { "epoch": 0.33, "learning_rate": 3.349504912509548e-05, "loss": 2.4252, "step": 189290 }, { "epoch": 0.33, "learning_rate": 3.349417718516865e-05, "loss": 2.415, "step": 189300 }, { "epoch": 0.33, "learning_rate": 3.349330524524182e-05, "loss": 2.3208, "step": 189310 }, { "epoch": 0.33, "learning_rate": 3.3492433305315e-05, "loss": 2.5459, "step": 189320 }, { "epoch": 0.33, "learning_rate": 3.3491561365388177e-05, "loss": 2.4719, "step": 189330 }, { "epoch": 0.33, "learning_rate": 3.349068942546135e-05, "loss": 2.3204, "step": 189340 }, { "epoch": 0.33, "learning_rate": 3.348981748553452e-05, "loss": 2.4498, "step": 189350 }, { "epoch": 0.33, "learning_rate": 3.3488945545607694e-05, "loss": 2.4479, "step": 189360 }, { "epoch": 0.33, "learning_rate": 3.3488073605680865e-05, "loss": 2.5143, "step": 189370 }, { "epoch": 0.33, "learning_rate": 3.3487201665754035e-05, "loss": 2.3713, "step": 189380 }, { "epoch": 0.33, "learning_rate": 3.348632972582721e-05, "loss": 2.3719, "step": 189390 }, { "epoch": 0.33, "learning_rate": 3.348545778590038e-05, "loss": 2.4116, "step": 189400 }, { "epoch": 0.33, "learning_rate": 3.348458584597356e-05, "loss": 2.4287, "step": 189410 }, { "epoch": 0.33, "learning_rate": 3.348371390604673e-05, "loss": 2.4713, "step": 189420 }, { "epoch": 0.33, "learning_rate": 3.348284196611991e-05, "loss": 2.4337, "step": 189430 }, { "epoch": 0.33, "learning_rate": 3.348197002619308e-05, "loss": 2.4378, "step": 189440 }, { "epoch": 0.33, "learning_rate": 3.348109808626625e-05, "loss": 2.375, "step": 189450 }, { "epoch": 0.33, "learning_rate": 3.348022614633942e-05, "loss": 2.4759, "step": 189460 }, { "epoch": 0.33, "learning_rate": 3.3479354206412596e-05, "loss": 2.5032, "step": 189470 }, { "epoch": 0.33, "learning_rate": 3.347848226648577e-05, "loss": 2.377, "step": 189480 }, { "epoch": 0.33, "learning_rate": 3.347761032655894e-05, "loss": 2.3652, "step": 189490 }, { "epoch": 0.33, "learning_rate": 3.347673838663212e-05, "loss": 2.517, "step": 189500 }, { "epoch": 0.33, "learning_rate": 3.347586644670529e-05, "loss": 2.5485, "step": 189510 }, { "epoch": 0.33, "learning_rate": 3.347499450677846e-05, "loss": 2.5048, "step": 189520 }, { "epoch": 0.33, "learning_rate": 3.347412256685163e-05, "loss": 2.5847, "step": 189530 }, { "epoch": 0.33, "learning_rate": 3.347325062692481e-05, "loss": 2.4297, "step": 189540 }, { "epoch": 0.33, "learning_rate": 3.3472378686997986e-05, "loss": 2.4619, "step": 189550 }, { "epoch": 0.33, "learning_rate": 3.3471506747071156e-05, "loss": 2.4174, "step": 189560 }, { "epoch": 0.33, "learning_rate": 3.347063480714433e-05, "loss": 2.5105, "step": 189570 }, { "epoch": 0.33, "learning_rate": 3.3469762867217504e-05, "loss": 2.4842, "step": 189580 }, { "epoch": 0.33, "learning_rate": 3.3468890927290674e-05, "loss": 2.4943, "step": 189590 }, { "epoch": 0.33, "learning_rate": 3.3468018987363845e-05, "loss": 2.3686, "step": 189600 }, { "epoch": 0.33, "learning_rate": 3.346714704743702e-05, "loss": 2.4572, "step": 189610 }, { "epoch": 0.33, "learning_rate": 3.346627510751019e-05, "loss": 2.3874, "step": 189620 }, { "epoch": 0.33, "learning_rate": 3.346540316758337e-05, "loss": 2.4242, "step": 189630 }, { "epoch": 0.33, "learning_rate": 3.346453122765654e-05, "loss": 2.2941, "step": 189640 }, { "epoch": 0.33, "learning_rate": 3.346365928772972e-05, "loss": 2.4447, "step": 189650 }, { "epoch": 0.33, "learning_rate": 3.346278734780289e-05, "loss": 2.4004, "step": 189660 }, { "epoch": 0.33, "learning_rate": 3.346191540787606e-05, "loss": 2.3907, "step": 189670 }, { "epoch": 0.33, "learning_rate": 3.3461043467949235e-05, "loss": 2.4707, "step": 189680 }, { "epoch": 0.33, "learning_rate": 3.3460171528022405e-05, "loss": 2.4773, "step": 189690 }, { "epoch": 0.33, "learning_rate": 3.345929958809558e-05, "loss": 2.4986, "step": 189700 }, { "epoch": 0.33, "learning_rate": 3.345842764816875e-05, "loss": 2.4874, "step": 189710 }, { "epoch": 0.33, "learning_rate": 3.345755570824193e-05, "loss": 2.5817, "step": 189720 }, { "epoch": 0.33, "learning_rate": 3.34566837683151e-05, "loss": 2.3001, "step": 189730 }, { "epoch": 0.33, "learning_rate": 3.345581182838827e-05, "loss": 2.5117, "step": 189740 }, { "epoch": 0.33, "learning_rate": 3.345493988846145e-05, "loss": 2.4254, "step": 189750 }, { "epoch": 0.33, "learning_rate": 3.345406794853462e-05, "loss": 2.4289, "step": 189760 }, { "epoch": 0.33, "learning_rate": 3.345319600860779e-05, "loss": 2.4878, "step": 189770 }, { "epoch": 0.33, "learning_rate": 3.3452324068680966e-05, "loss": 2.4707, "step": 189780 }, { "epoch": 0.33, "learning_rate": 3.345145212875414e-05, "loss": 2.4896, "step": 189790 }, { "epoch": 0.33, "learning_rate": 3.345058018882731e-05, "loss": 2.4485, "step": 189800 }, { "epoch": 0.33, "learning_rate": 3.3449708248900484e-05, "loss": 2.405, "step": 189810 }, { "epoch": 0.33, "learning_rate": 3.344883630897366e-05, "loss": 2.3866, "step": 189820 }, { "epoch": 0.33, "learning_rate": 3.344796436904683e-05, "loss": 2.4105, "step": 189830 }, { "epoch": 0.33, "learning_rate": 3.344709242912e-05, "loss": 2.4214, "step": 189840 }, { "epoch": 0.33, "learning_rate": 3.344622048919318e-05, "loss": 2.4637, "step": 189850 }, { "epoch": 0.33, "learning_rate": 3.3445348549266356e-05, "loss": 2.3966, "step": 189860 }, { "epoch": 0.33, "learning_rate": 3.3444476609339526e-05, "loss": 2.3942, "step": 189870 }, { "epoch": 0.33, "learning_rate": 3.34436046694127e-05, "loss": 2.3534, "step": 189880 }, { "epoch": 0.33, "learning_rate": 3.3442732729485874e-05, "loss": 2.4966, "step": 189890 }, { "epoch": 0.33, "learning_rate": 3.3441860789559044e-05, "loss": 2.4865, "step": 189900 }, { "epoch": 0.33, "learning_rate": 3.3440988849632215e-05, "loss": 2.5208, "step": 189910 }, { "epoch": 0.33, "learning_rate": 3.3440116909705385e-05, "loss": 2.5085, "step": 189920 }, { "epoch": 0.33, "learning_rate": 3.343924496977857e-05, "loss": 2.4809, "step": 189930 }, { "epoch": 0.33, "learning_rate": 3.343837302985174e-05, "loss": 2.4838, "step": 189940 }, { "epoch": 0.33, "learning_rate": 3.343750108992491e-05, "loss": 2.5057, "step": 189950 }, { "epoch": 0.33, "learning_rate": 3.343662914999808e-05, "loss": 2.4082, "step": 189960 }, { "epoch": 0.33, "learning_rate": 3.343575721007126e-05, "loss": 2.5087, "step": 189970 }, { "epoch": 0.33, "learning_rate": 3.343488527014443e-05, "loss": 2.3558, "step": 189980 }, { "epoch": 0.33, "learning_rate": 3.34340133302176e-05, "loss": 2.4274, "step": 189990 }, { "epoch": 0.33, "learning_rate": 3.343314139029078e-05, "loss": 2.3603, "step": 190000 }, { "epoch": 0.33, "learning_rate": 3.343226945036395e-05, "loss": 2.3927, "step": 190010 }, { "epoch": 0.33, "learning_rate": 3.343139751043712e-05, "loss": 2.4216, "step": 190020 }, { "epoch": 0.33, "learning_rate": 3.343052557051029e-05, "loss": 2.492, "step": 190030 }, { "epoch": 0.33, "learning_rate": 3.342965363058347e-05, "loss": 2.4217, "step": 190040 }, { "epoch": 0.33, "learning_rate": 3.342878169065664e-05, "loss": 2.4628, "step": 190050 }, { "epoch": 0.33, "learning_rate": 3.342790975072981e-05, "loss": 2.5597, "step": 190060 }, { "epoch": 0.33, "learning_rate": 3.342703781080299e-05, "loss": 2.4214, "step": 190070 }, { "epoch": 0.33, "learning_rate": 3.3426165870876165e-05, "loss": 2.4455, "step": 190080 }, { "epoch": 0.33, "learning_rate": 3.3425293930949336e-05, "loss": 2.3705, "step": 190090 }, { "epoch": 0.33, "learning_rate": 3.3424421991022506e-05, "loss": 2.4675, "step": 190100 }, { "epoch": 0.33, "learning_rate": 3.342355005109568e-05, "loss": 2.3701, "step": 190110 }, { "epoch": 0.33, "learning_rate": 3.3422678111168854e-05, "loss": 2.3746, "step": 190120 }, { "epoch": 0.33, "learning_rate": 3.3421806171242024e-05, "loss": 2.3206, "step": 190130 }, { "epoch": 0.33, "learning_rate": 3.34209342313152e-05, "loss": 2.4819, "step": 190140 }, { "epoch": 0.33, "learning_rate": 3.342006229138838e-05, "loss": 2.3426, "step": 190150 }, { "epoch": 0.33, "learning_rate": 3.341919035146155e-05, "loss": 2.2801, "step": 190160 }, { "epoch": 0.33, "learning_rate": 3.341831841153472e-05, "loss": 2.4322, "step": 190170 }, { "epoch": 0.33, "learning_rate": 3.3417446471607896e-05, "loss": 2.5053, "step": 190180 }, { "epoch": 0.33, "learning_rate": 3.3416574531681067e-05, "loss": 2.4894, "step": 190190 }, { "epoch": 0.33, "learning_rate": 3.341570259175424e-05, "loss": 2.2786, "step": 190200 }, { "epoch": 0.33, "learning_rate": 3.3414830651827414e-05, "loss": 2.4732, "step": 190210 }, { "epoch": 0.33, "learning_rate": 3.341395871190059e-05, "loss": 2.5745, "step": 190220 }, { "epoch": 0.33, "learning_rate": 3.341308677197376e-05, "loss": 2.4764, "step": 190230 }, { "epoch": 0.33, "learning_rate": 3.341221483204693e-05, "loss": 2.426, "step": 190240 }, { "epoch": 0.33, "learning_rate": 3.341134289212011e-05, "loss": 2.299, "step": 190250 }, { "epoch": 0.33, "learning_rate": 3.341047095219328e-05, "loss": 2.4376, "step": 190260 }, { "epoch": 0.33, "learning_rate": 3.340959901226645e-05, "loss": 2.357, "step": 190270 }, { "epoch": 0.33, "learning_rate": 3.340872707233963e-05, "loss": 2.3893, "step": 190280 }, { "epoch": 0.33, "learning_rate": 3.34078551324128e-05, "loss": 2.4699, "step": 190290 }, { "epoch": 0.33, "learning_rate": 3.3406983192485975e-05, "loss": 2.4328, "step": 190300 }, { "epoch": 0.33, "learning_rate": 3.3406111252559145e-05, "loss": 2.3998, "step": 190310 }, { "epoch": 0.33, "learning_rate": 3.340523931263232e-05, "loss": 2.4372, "step": 190320 }, { "epoch": 0.33, "learning_rate": 3.340436737270549e-05, "loss": 2.4449, "step": 190330 }, { "epoch": 0.33, "learning_rate": 3.340349543277866e-05, "loss": 2.4499, "step": 190340 }, { "epoch": 0.33, "learning_rate": 3.340262349285183e-05, "loss": 2.3565, "step": 190350 }, { "epoch": 0.33, "learning_rate": 3.340175155292501e-05, "loss": 2.4982, "step": 190360 }, { "epoch": 0.33, "learning_rate": 3.340087961299819e-05, "loss": 2.5079, "step": 190370 }, { "epoch": 0.33, "learning_rate": 3.340000767307136e-05, "loss": 2.5706, "step": 190380 }, { "epoch": 0.33, "learning_rate": 3.3399135733144535e-05, "loss": 2.2872, "step": 190390 }, { "epoch": 0.33, "learning_rate": 3.3398263793217706e-05, "loss": 2.3859, "step": 190400 }, { "epoch": 0.33, "learning_rate": 3.3397391853290876e-05, "loss": 2.3716, "step": 190410 }, { "epoch": 0.33, "learning_rate": 3.3396519913364046e-05, "loss": 2.2884, "step": 190420 }, { "epoch": 0.33, "learning_rate": 3.3395647973437223e-05, "loss": 2.5887, "step": 190430 }, { "epoch": 0.33, "learning_rate": 3.3394776033510394e-05, "loss": 2.4318, "step": 190440 }, { "epoch": 0.33, "learning_rate": 3.339390409358357e-05, "loss": 2.448, "step": 190450 }, { "epoch": 0.33, "learning_rate": 3.339303215365674e-05, "loss": 2.459, "step": 190460 }, { "epoch": 0.33, "learning_rate": 3.339216021372992e-05, "loss": 2.4976, "step": 190470 }, { "epoch": 0.33, "learning_rate": 3.339128827380309e-05, "loss": 2.3874, "step": 190480 }, { "epoch": 0.33, "learning_rate": 3.339041633387626e-05, "loss": 2.3926, "step": 190490 }, { "epoch": 0.33, "learning_rate": 3.3389544393949436e-05, "loss": 2.3924, "step": 190500 }, { "epoch": 0.33, "learning_rate": 3.338867245402261e-05, "loss": 2.5253, "step": 190510 }, { "epoch": 0.33, "learning_rate": 3.3387800514095784e-05, "loss": 2.4164, "step": 190520 }, { "epoch": 0.33, "learning_rate": 3.3386928574168954e-05, "loss": 2.409, "step": 190530 }, { "epoch": 0.33, "learning_rate": 3.338605663424213e-05, "loss": 2.4724, "step": 190540 }, { "epoch": 0.33, "learning_rate": 3.33851846943153e-05, "loss": 2.4732, "step": 190550 }, { "epoch": 0.33, "learning_rate": 3.338431275438847e-05, "loss": 2.5336, "step": 190560 }, { "epoch": 0.33, "learning_rate": 3.338344081446165e-05, "loss": 2.4003, "step": 190570 }, { "epoch": 0.33, "learning_rate": 3.338256887453482e-05, "loss": 2.4209, "step": 190580 }, { "epoch": 0.33, "learning_rate": 3.338169693460799e-05, "loss": 2.4703, "step": 190590 }, { "epoch": 0.33, "learning_rate": 3.338082499468117e-05, "loss": 2.3704, "step": 190600 }, { "epoch": 0.33, "learning_rate": 3.3379953054754345e-05, "loss": 2.2732, "step": 190610 }, { "epoch": 0.33, "learning_rate": 3.3379081114827515e-05, "loss": 2.3875, "step": 190620 }, { "epoch": 0.33, "learning_rate": 3.3378209174900685e-05, "loss": 2.3805, "step": 190630 }, { "epoch": 0.33, "learning_rate": 3.337733723497386e-05, "loss": 2.4338, "step": 190640 }, { "epoch": 0.33, "learning_rate": 3.337646529504703e-05, "loss": 2.4178, "step": 190650 }, { "epoch": 0.33, "learning_rate": 3.33755933551202e-05, "loss": 2.5433, "step": 190660 }, { "epoch": 0.33, "learning_rate": 3.337472141519338e-05, "loss": 2.404, "step": 190670 }, { "epoch": 0.33, "learning_rate": 3.337384947526656e-05, "loss": 2.4139, "step": 190680 }, { "epoch": 0.33, "learning_rate": 3.337297753533973e-05, "loss": 2.3875, "step": 190690 }, { "epoch": 0.33, "learning_rate": 3.33721055954129e-05, "loss": 2.4912, "step": 190700 }, { "epoch": 0.33, "learning_rate": 3.3371233655486076e-05, "loss": 2.434, "step": 190710 }, { "epoch": 0.33, "learning_rate": 3.3370361715559246e-05, "loss": 2.4334, "step": 190720 }, { "epoch": 0.33, "learning_rate": 3.3369489775632416e-05, "loss": 2.54, "step": 190730 }, { "epoch": 0.33, "learning_rate": 3.3368617835705593e-05, "loss": 2.4742, "step": 190740 }, { "epoch": 0.33, "learning_rate": 3.336774589577877e-05, "loss": 2.478, "step": 190750 }, { "epoch": 0.33, "learning_rate": 3.336687395585194e-05, "loss": 2.4799, "step": 190760 }, { "epoch": 0.33, "learning_rate": 3.336600201592511e-05, "loss": 2.3174, "step": 190770 }, { "epoch": 0.33, "learning_rate": 3.336513007599829e-05, "loss": 2.5017, "step": 190780 }, { "epoch": 0.33, "learning_rate": 3.336425813607146e-05, "loss": 2.3806, "step": 190790 }, { "epoch": 0.33, "learning_rate": 3.336338619614463e-05, "loss": 2.4903, "step": 190800 }, { "epoch": 0.33, "learning_rate": 3.33625142562178e-05, "loss": 2.4707, "step": 190810 }, { "epoch": 0.33, "learning_rate": 3.3361642316290984e-05, "loss": 2.4336, "step": 190820 }, { "epoch": 0.33, "learning_rate": 3.3360770376364154e-05, "loss": 2.4717, "step": 190830 }, { "epoch": 0.33, "learning_rate": 3.3359898436437324e-05, "loss": 2.4101, "step": 190840 }, { "epoch": 0.33, "learning_rate": 3.33590264965105e-05, "loss": 2.4818, "step": 190850 }, { "epoch": 0.33, "learning_rate": 3.335815455658367e-05, "loss": 2.4568, "step": 190860 }, { "epoch": 0.33, "learning_rate": 3.335728261665684e-05, "loss": 2.5177, "step": 190870 }, { "epoch": 0.33, "learning_rate": 3.335641067673001e-05, "loss": 2.3422, "step": 190880 }, { "epoch": 0.33, "learning_rate": 3.3355538736803197e-05, "loss": 2.4604, "step": 190890 }, { "epoch": 0.33, "learning_rate": 3.335466679687637e-05, "loss": 2.4187, "step": 190900 }, { "epoch": 0.33, "learning_rate": 3.335379485694954e-05, "loss": 2.4026, "step": 190910 }, { "epoch": 0.33, "learning_rate": 3.335292291702271e-05, "loss": 2.3168, "step": 190920 }, { "epoch": 0.33, "learning_rate": 3.3352050977095885e-05, "loss": 2.5947, "step": 190930 }, { "epoch": 0.33, "learning_rate": 3.3351179037169055e-05, "loss": 2.4356, "step": 190940 }, { "epoch": 0.33, "learning_rate": 3.3350307097242226e-05, "loss": 2.4428, "step": 190950 }, { "epoch": 0.33, "learning_rate": 3.33494351573154e-05, "loss": 2.3631, "step": 190960 }, { "epoch": 0.33, "learning_rate": 3.334856321738858e-05, "loss": 2.6188, "step": 190970 }, { "epoch": 0.33, "learning_rate": 3.334769127746175e-05, "loss": 2.4927, "step": 190980 }, { "epoch": 0.33, "learning_rate": 3.334681933753492e-05, "loss": 2.5502, "step": 190990 }, { "epoch": 0.33, "learning_rate": 3.33459473976081e-05, "loss": 2.5034, "step": 191000 }, { "epoch": 0.33, "learning_rate": 3.334507545768127e-05, "loss": 2.4449, "step": 191010 }, { "epoch": 0.33, "learning_rate": 3.334420351775444e-05, "loss": 2.4811, "step": 191020 }, { "epoch": 0.33, "learning_rate": 3.3343331577827616e-05, "loss": 2.5197, "step": 191030 }, { "epoch": 0.33, "learning_rate": 3.334245963790079e-05, "loss": 2.5593, "step": 191040 }, { "epoch": 0.33, "learning_rate": 3.334158769797396e-05, "loss": 2.424, "step": 191050 }, { "epoch": 0.33, "learning_rate": 3.3340715758047134e-05, "loss": 2.3978, "step": 191060 }, { "epoch": 0.33, "learning_rate": 3.333984381812031e-05, "loss": 2.4826, "step": 191070 }, { "epoch": 0.33, "learning_rate": 3.333897187819348e-05, "loss": 2.541, "step": 191080 }, { "epoch": 0.33, "learning_rate": 3.333809993826665e-05, "loss": 2.3744, "step": 191090 }, { "epoch": 0.33, "learning_rate": 3.333722799833983e-05, "loss": 2.4154, "step": 191100 }, { "epoch": 0.33, "learning_rate": 3.3336356058413e-05, "loss": 2.2399, "step": 191110 }, { "epoch": 0.33, "learning_rate": 3.3335484118486176e-05, "loss": 2.4484, "step": 191120 }, { "epoch": 0.33, "learning_rate": 3.333461217855935e-05, "loss": 2.2706, "step": 191130 }, { "epoch": 0.33, "learning_rate": 3.3333740238632524e-05, "loss": 2.4782, "step": 191140 }, { "epoch": 0.33, "learning_rate": 3.3332868298705694e-05, "loss": 2.4446, "step": 191150 }, { "epoch": 0.33, "learning_rate": 3.3331996358778865e-05, "loss": 2.5012, "step": 191160 }, { "epoch": 0.33, "learning_rate": 3.333112441885204e-05, "loss": 2.4386, "step": 191170 }, { "epoch": 0.33, "learning_rate": 3.333025247892521e-05, "loss": 2.3215, "step": 191180 }, { "epoch": 0.33, "learning_rate": 3.332938053899839e-05, "loss": 2.519, "step": 191190 }, { "epoch": 0.33, "learning_rate": 3.332850859907156e-05, "loss": 2.5019, "step": 191200 }, { "epoch": 0.33, "learning_rate": 3.332763665914474e-05, "loss": 2.4418, "step": 191210 }, { "epoch": 0.33, "learning_rate": 3.332676471921791e-05, "loss": 2.3303, "step": 191220 }, { "epoch": 0.33, "learning_rate": 3.332589277929108e-05, "loss": 2.472, "step": 191230 }, { "epoch": 0.33, "learning_rate": 3.3325020839364255e-05, "loss": 2.4854, "step": 191240 }, { "epoch": 0.33, "learning_rate": 3.3324148899437425e-05, "loss": 2.3412, "step": 191250 }, { "epoch": 0.33, "learning_rate": 3.3323276959510596e-05, "loss": 2.4379, "step": 191260 }, { "epoch": 0.33, "learning_rate": 3.332240501958377e-05, "loss": 2.372, "step": 191270 }, { "epoch": 0.33, "learning_rate": 3.332153307965695e-05, "loss": 2.5306, "step": 191280 }, { "epoch": 0.33, "learning_rate": 3.332066113973012e-05, "loss": 2.5011, "step": 191290 }, { "epoch": 0.33, "learning_rate": 3.331978919980329e-05, "loss": 2.4494, "step": 191300 }, { "epoch": 0.33, "learning_rate": 3.331891725987646e-05, "loss": 2.2895, "step": 191310 }, { "epoch": 0.33, "learning_rate": 3.331804531994964e-05, "loss": 2.3783, "step": 191320 }, { "epoch": 0.33, "learning_rate": 3.331717338002281e-05, "loss": 2.4078, "step": 191330 }, { "epoch": 0.33, "learning_rate": 3.3316301440095986e-05, "loss": 2.4505, "step": 191340 }, { "epoch": 0.33, "learning_rate": 3.331542950016916e-05, "loss": 2.4461, "step": 191350 }, { "epoch": 0.33, "learning_rate": 3.331455756024233e-05, "loss": 2.4529, "step": 191360 }, { "epoch": 0.33, "learning_rate": 3.3313685620315504e-05, "loss": 2.4609, "step": 191370 }, { "epoch": 0.33, "learning_rate": 3.3312813680388674e-05, "loss": 2.5884, "step": 191380 }, { "epoch": 0.33, "learning_rate": 3.331194174046185e-05, "loss": 2.3083, "step": 191390 }, { "epoch": 0.33, "learning_rate": 3.331106980053502e-05, "loss": 2.3947, "step": 191400 }, { "epoch": 0.33, "learning_rate": 3.331019786060819e-05, "loss": 2.5387, "step": 191410 }, { "epoch": 0.33, "learning_rate": 3.330932592068137e-05, "loss": 2.3948, "step": 191420 }, { "epoch": 0.33, "learning_rate": 3.3308453980754546e-05, "loss": 2.4072, "step": 191430 }, { "epoch": 0.33, "learning_rate": 3.330758204082772e-05, "loss": 2.3705, "step": 191440 }, { "epoch": 0.33, "learning_rate": 3.330671010090089e-05, "loss": 2.4317, "step": 191450 }, { "epoch": 0.33, "learning_rate": 3.3305838160974064e-05, "loss": 2.3718, "step": 191460 }, { "epoch": 0.33, "learning_rate": 3.3304966221047235e-05, "loss": 2.3715, "step": 191470 }, { "epoch": 0.33, "learning_rate": 3.3304094281120405e-05, "loss": 2.409, "step": 191480 }, { "epoch": 0.33, "learning_rate": 3.330322234119358e-05, "loss": 2.4777, "step": 191490 }, { "epoch": 0.33, "learning_rate": 3.330235040126676e-05, "loss": 2.4054, "step": 191500 }, { "epoch": 0.33, "learning_rate": 3.330147846133993e-05, "loss": 2.4156, "step": 191510 }, { "epoch": 0.33, "learning_rate": 3.33006065214131e-05, "loss": 2.39, "step": 191520 }, { "epoch": 0.33, "learning_rate": 3.329973458148628e-05, "loss": 2.4797, "step": 191530 }, { "epoch": 0.33, "learning_rate": 3.329886264155945e-05, "loss": 2.4143, "step": 191540 }, { "epoch": 0.33, "learning_rate": 3.329799070163262e-05, "loss": 2.2633, "step": 191550 }, { "epoch": 0.33, "learning_rate": 3.3297118761705795e-05, "loss": 2.3777, "step": 191560 }, { "epoch": 0.33, "learning_rate": 3.329624682177897e-05, "loss": 2.445, "step": 191570 }, { "epoch": 0.33, "learning_rate": 3.329537488185214e-05, "loss": 2.4504, "step": 191580 }, { "epoch": 0.33, "learning_rate": 3.329450294192531e-05, "loss": 2.47, "step": 191590 }, { "epoch": 0.33, "learning_rate": 3.329363100199849e-05, "loss": 2.294, "step": 191600 }, { "epoch": 0.33, "learning_rate": 3.329275906207166e-05, "loss": 2.39, "step": 191610 }, { "epoch": 0.33, "learning_rate": 3.329188712214483e-05, "loss": 2.5158, "step": 191620 }, { "epoch": 0.33, "learning_rate": 3.329101518221801e-05, "loss": 2.4104, "step": 191630 }, { "epoch": 0.33, "learning_rate": 3.3290143242291185e-05, "loss": 2.4792, "step": 191640 }, { "epoch": 0.33, "learning_rate": 3.3289271302364356e-05, "loss": 2.4448, "step": 191650 }, { "epoch": 0.33, "learning_rate": 3.3288399362437526e-05, "loss": 2.3836, "step": 191660 }, { "epoch": 0.33, "learning_rate": 3.32875274225107e-05, "loss": 2.6129, "step": 191670 }, { "epoch": 0.33, "learning_rate": 3.3286655482583874e-05, "loss": 2.3731, "step": 191680 }, { "epoch": 0.33, "learning_rate": 3.3285783542657044e-05, "loss": 2.3332, "step": 191690 }, { "epoch": 0.33, "learning_rate": 3.3284911602730214e-05, "loss": 2.5014, "step": 191700 }, { "epoch": 0.33, "learning_rate": 3.32840396628034e-05, "loss": 2.4134, "step": 191710 }, { "epoch": 0.33, "learning_rate": 3.328316772287657e-05, "loss": 2.4786, "step": 191720 }, { "epoch": 0.33, "learning_rate": 3.328229578294974e-05, "loss": 2.469, "step": 191730 }, { "epoch": 0.33, "learning_rate": 3.3281423843022916e-05, "loss": 2.4182, "step": 191740 }, { "epoch": 0.33, "learning_rate": 3.3280551903096087e-05, "loss": 2.4667, "step": 191750 }, { "epoch": 0.33, "learning_rate": 3.327967996316926e-05, "loss": 2.3379, "step": 191760 }, { "epoch": 0.33, "learning_rate": 3.327880802324243e-05, "loss": 2.291, "step": 191770 }, { "epoch": 0.33, "learning_rate": 3.3277936083315605e-05, "loss": 2.4346, "step": 191780 }, { "epoch": 0.33, "learning_rate": 3.327706414338878e-05, "loss": 2.3154, "step": 191790 }, { "epoch": 0.33, "learning_rate": 3.327619220346195e-05, "loss": 2.3453, "step": 191800 }, { "epoch": 0.33, "learning_rate": 3.327532026353512e-05, "loss": 2.4225, "step": 191810 }, { "epoch": 0.33, "learning_rate": 3.32744483236083e-05, "loss": 2.4165, "step": 191820 }, { "epoch": 0.33, "learning_rate": 3.327357638368147e-05, "loss": 2.2875, "step": 191830 }, { "epoch": 0.33, "learning_rate": 3.327270444375464e-05, "loss": 2.4933, "step": 191840 }, { "epoch": 0.33, "learning_rate": 3.327183250382782e-05, "loss": 2.3382, "step": 191850 }, { "epoch": 0.33, "learning_rate": 3.3270960563900995e-05, "loss": 2.5299, "step": 191860 }, { "epoch": 0.33, "learning_rate": 3.3270088623974165e-05, "loss": 2.4061, "step": 191870 }, { "epoch": 0.33, "learning_rate": 3.3269216684047335e-05, "loss": 2.3445, "step": 191880 }, { "epoch": 0.33, "learning_rate": 3.326834474412051e-05, "loss": 2.3511, "step": 191890 }, { "epoch": 0.33, "learning_rate": 3.326747280419368e-05, "loss": 2.5167, "step": 191900 }, { "epoch": 0.33, "learning_rate": 3.326660086426685e-05, "loss": 2.4076, "step": 191910 }, { "epoch": 0.33, "learning_rate": 3.326572892434003e-05, "loss": 2.4197, "step": 191920 }, { "epoch": 0.33, "learning_rate": 3.32648569844132e-05, "loss": 2.3165, "step": 191930 }, { "epoch": 0.33, "learning_rate": 3.326398504448638e-05, "loss": 2.5103, "step": 191940 }, { "epoch": 0.33, "learning_rate": 3.326311310455955e-05, "loss": 2.3432, "step": 191950 }, { "epoch": 0.33, "learning_rate": 3.3262241164632726e-05, "loss": 2.3434, "step": 191960 }, { "epoch": 0.33, "learning_rate": 3.3261369224705896e-05, "loss": 2.2802, "step": 191970 }, { "epoch": 0.33, "learning_rate": 3.3260497284779066e-05, "loss": 2.4481, "step": 191980 }, { "epoch": 0.33, "learning_rate": 3.3259625344852244e-05, "loss": 2.4515, "step": 191990 }, { "epoch": 0.33, "learning_rate": 3.3258753404925414e-05, "loss": 2.3934, "step": 192000 }, { "epoch": 0.33, "learning_rate": 3.325788146499859e-05, "loss": 2.4725, "step": 192010 }, { "epoch": 0.33, "learning_rate": 3.325700952507176e-05, "loss": 2.4504, "step": 192020 }, { "epoch": 0.33, "learning_rate": 3.325613758514494e-05, "loss": 2.4248, "step": 192030 }, { "epoch": 0.33, "learning_rate": 3.325526564521811e-05, "loss": 2.4741, "step": 192040 }, { "epoch": 0.33, "learning_rate": 3.325439370529128e-05, "loss": 2.3226, "step": 192050 }, { "epoch": 0.33, "learning_rate": 3.3253521765364457e-05, "loss": 2.538, "step": 192060 }, { "epoch": 0.33, "learning_rate": 3.325264982543763e-05, "loss": 2.3361, "step": 192070 }, { "epoch": 0.33, "learning_rate": 3.3251777885510804e-05, "loss": 2.454, "step": 192080 }, { "epoch": 0.33, "learning_rate": 3.3250905945583974e-05, "loss": 2.5529, "step": 192090 }, { "epoch": 0.33, "learning_rate": 3.325003400565715e-05, "loss": 2.5235, "step": 192100 }, { "epoch": 0.34, "learning_rate": 3.324916206573032e-05, "loss": 2.4516, "step": 192110 }, { "epoch": 0.34, "learning_rate": 3.324829012580349e-05, "loss": 2.4504, "step": 192120 }, { "epoch": 0.34, "learning_rate": 3.324741818587667e-05, "loss": 2.4027, "step": 192130 }, { "epoch": 0.34, "learning_rate": 3.324654624594984e-05, "loss": 2.3929, "step": 192140 }, { "epoch": 0.34, "learning_rate": 3.324567430602301e-05, "loss": 2.3891, "step": 192150 }, { "epoch": 0.34, "learning_rate": 3.324480236609619e-05, "loss": 2.4718, "step": 192160 }, { "epoch": 0.34, "learning_rate": 3.3243930426169365e-05, "loss": 2.4602, "step": 192170 }, { "epoch": 0.34, "learning_rate": 3.3243058486242535e-05, "loss": 2.4821, "step": 192180 }, { "epoch": 0.34, "learning_rate": 3.3242186546315705e-05, "loss": 2.4666, "step": 192190 }, { "epoch": 0.34, "learning_rate": 3.324131460638888e-05, "loss": 2.4397, "step": 192200 }, { "epoch": 0.34, "learning_rate": 3.324044266646205e-05, "loss": 2.3757, "step": 192210 }, { "epoch": 0.34, "learning_rate": 3.323957072653522e-05, "loss": 2.6443, "step": 192220 }, { "epoch": 0.34, "learning_rate": 3.32386987866084e-05, "loss": 2.377, "step": 192230 }, { "epoch": 0.34, "learning_rate": 3.323782684668158e-05, "loss": 2.4891, "step": 192240 }, { "epoch": 0.34, "learning_rate": 3.323695490675475e-05, "loss": 2.4077, "step": 192250 }, { "epoch": 0.34, "learning_rate": 3.323608296682792e-05, "loss": 2.3957, "step": 192260 }, { "epoch": 0.34, "learning_rate": 3.323521102690109e-05, "loss": 2.4682, "step": 192270 }, { "epoch": 0.34, "learning_rate": 3.3234339086974266e-05, "loss": 2.3475, "step": 192280 }, { "epoch": 0.34, "learning_rate": 3.3233467147047436e-05, "loss": 2.4577, "step": 192290 }, { "epoch": 0.34, "learning_rate": 3.323259520712061e-05, "loss": 2.4962, "step": 192300 }, { "epoch": 0.34, "learning_rate": 3.323172326719379e-05, "loss": 2.4228, "step": 192310 }, { "epoch": 0.34, "learning_rate": 3.323085132726696e-05, "loss": 2.4265, "step": 192320 }, { "epoch": 0.34, "learning_rate": 3.322997938734013e-05, "loss": 2.3484, "step": 192330 }, { "epoch": 0.34, "learning_rate": 3.32291074474133e-05, "loss": 2.4704, "step": 192340 }, { "epoch": 0.34, "learning_rate": 3.322823550748648e-05, "loss": 2.5081, "step": 192350 }, { "epoch": 0.34, "learning_rate": 3.322736356755965e-05, "loss": 2.3777, "step": 192360 }, { "epoch": 0.34, "learning_rate": 3.322649162763282e-05, "loss": 2.5145, "step": 192370 }, { "epoch": 0.34, "learning_rate": 3.3225619687706e-05, "loss": 2.3224, "step": 192380 }, { "epoch": 0.34, "learning_rate": 3.3224747747779174e-05, "loss": 2.5004, "step": 192390 }, { "epoch": 0.34, "learning_rate": 3.3223875807852344e-05, "loss": 2.4774, "step": 192400 }, { "epoch": 0.34, "learning_rate": 3.3223003867925515e-05, "loss": 2.5468, "step": 192410 }, { "epoch": 0.34, "learning_rate": 3.322213192799869e-05, "loss": 2.3892, "step": 192420 }, { "epoch": 0.34, "learning_rate": 3.322125998807186e-05, "loss": 2.3257, "step": 192430 }, { "epoch": 0.34, "learning_rate": 3.322038804814503e-05, "loss": 2.3381, "step": 192440 }, { "epoch": 0.34, "learning_rate": 3.321951610821821e-05, "loss": 2.42, "step": 192450 }, { "epoch": 0.34, "learning_rate": 3.321864416829139e-05, "loss": 2.322, "step": 192460 }, { "epoch": 0.34, "learning_rate": 3.321777222836456e-05, "loss": 2.3762, "step": 192470 }, { "epoch": 0.34, "learning_rate": 3.321690028843773e-05, "loss": 2.4978, "step": 192480 }, { "epoch": 0.34, "learning_rate": 3.3216028348510905e-05, "loss": 2.5228, "step": 192490 }, { "epoch": 0.34, "learning_rate": 3.3215156408584075e-05, "loss": 2.3638, "step": 192500 }, { "epoch": 0.34, "learning_rate": 3.3214284468657246e-05, "loss": 2.2971, "step": 192510 }, { "epoch": 0.34, "learning_rate": 3.321341252873042e-05, "loss": 2.4831, "step": 192520 }, { "epoch": 0.34, "learning_rate": 3.32125405888036e-05, "loss": 2.3396, "step": 192530 }, { "epoch": 0.34, "learning_rate": 3.321166864887677e-05, "loss": 2.3068, "step": 192540 }, { "epoch": 0.34, "learning_rate": 3.321079670894994e-05, "loss": 2.5457, "step": 192550 }, { "epoch": 0.34, "learning_rate": 3.320992476902312e-05, "loss": 2.411, "step": 192560 }, { "epoch": 0.34, "learning_rate": 3.320905282909629e-05, "loss": 2.486, "step": 192570 }, { "epoch": 0.34, "learning_rate": 3.320818088916946e-05, "loss": 2.4924, "step": 192580 }, { "epoch": 0.34, "learning_rate": 3.3207308949242636e-05, "loss": 2.4024, "step": 192590 }, { "epoch": 0.34, "learning_rate": 3.3206437009315806e-05, "loss": 2.5566, "step": 192600 }, { "epoch": 0.34, "learning_rate": 3.320556506938898e-05, "loss": 2.5425, "step": 192610 }, { "epoch": 0.34, "learning_rate": 3.3204693129462154e-05, "loss": 2.3568, "step": 192620 }, { "epoch": 0.34, "learning_rate": 3.320382118953533e-05, "loss": 2.4847, "step": 192630 }, { "epoch": 0.34, "learning_rate": 3.32029492496085e-05, "loss": 2.3947, "step": 192640 }, { "epoch": 0.34, "learning_rate": 3.320207730968167e-05, "loss": 2.3653, "step": 192650 }, { "epoch": 0.34, "learning_rate": 3.320120536975484e-05, "loss": 2.4084, "step": 192660 }, { "epoch": 0.34, "learning_rate": 3.320033342982802e-05, "loss": 2.2821, "step": 192670 }, { "epoch": 0.34, "learning_rate": 3.3199461489901196e-05, "loss": 2.394, "step": 192680 }, { "epoch": 0.34, "learning_rate": 3.319858954997437e-05, "loss": 2.3042, "step": 192690 }, { "epoch": 0.34, "learning_rate": 3.3197717610047544e-05, "loss": 2.3762, "step": 192700 }, { "epoch": 0.34, "learning_rate": 3.3196845670120714e-05, "loss": 2.5112, "step": 192710 }, { "epoch": 0.34, "learning_rate": 3.3195973730193885e-05, "loss": 2.4113, "step": 192720 }, { "epoch": 0.34, "learning_rate": 3.3195101790267055e-05, "loss": 2.4546, "step": 192730 }, { "epoch": 0.34, "learning_rate": 3.319422985034023e-05, "loss": 2.3143, "step": 192740 }, { "epoch": 0.34, "learning_rate": 3.319335791041341e-05, "loss": 2.5473, "step": 192750 }, { "epoch": 0.34, "learning_rate": 3.319248597048658e-05, "loss": 2.3107, "step": 192760 }, { "epoch": 0.34, "learning_rate": 3.319161403055975e-05, "loss": 2.3703, "step": 192770 }, { "epoch": 0.34, "learning_rate": 3.319074209063293e-05, "loss": 2.5208, "step": 192780 }, { "epoch": 0.34, "learning_rate": 3.31898701507061e-05, "loss": 2.4401, "step": 192790 }, { "epoch": 0.34, "learning_rate": 3.318899821077927e-05, "loss": 2.3506, "step": 192800 }, { "epoch": 0.34, "learning_rate": 3.3188126270852445e-05, "loss": 2.3429, "step": 192810 }, { "epoch": 0.34, "learning_rate": 3.3187254330925616e-05, "loss": 2.455, "step": 192820 }, { "epoch": 0.34, "learning_rate": 3.318638239099879e-05, "loss": 2.3035, "step": 192830 }, { "epoch": 0.34, "learning_rate": 3.318551045107196e-05, "loss": 2.4524, "step": 192840 }, { "epoch": 0.34, "learning_rate": 3.318463851114514e-05, "loss": 2.4177, "step": 192850 }, { "epoch": 0.34, "learning_rate": 3.318376657121831e-05, "loss": 2.4365, "step": 192860 }, { "epoch": 0.34, "learning_rate": 3.318289463129148e-05, "loss": 2.3642, "step": 192870 }, { "epoch": 0.34, "learning_rate": 3.318202269136466e-05, "loss": 2.5531, "step": 192880 }, { "epoch": 0.34, "learning_rate": 3.318115075143783e-05, "loss": 2.5109, "step": 192890 }, { "epoch": 0.34, "learning_rate": 3.3180278811511006e-05, "loss": 2.4013, "step": 192900 }, { "epoch": 0.34, "learning_rate": 3.3179406871584176e-05, "loss": 2.3285, "step": 192910 }, { "epoch": 0.34, "learning_rate": 3.317853493165735e-05, "loss": 2.3825, "step": 192920 }, { "epoch": 0.34, "learning_rate": 3.3177662991730524e-05, "loss": 2.3802, "step": 192930 }, { "epoch": 0.34, "learning_rate": 3.3176791051803694e-05, "loss": 2.4713, "step": 192940 }, { "epoch": 0.34, "learning_rate": 3.317591911187687e-05, "loss": 2.4325, "step": 192950 }, { "epoch": 0.34, "learning_rate": 3.317504717195004e-05, "loss": 2.4037, "step": 192960 }, { "epoch": 0.34, "learning_rate": 3.317417523202321e-05, "loss": 2.4993, "step": 192970 }, { "epoch": 0.34, "learning_rate": 3.317330329209639e-05, "loss": 2.3834, "step": 192980 }, { "epoch": 0.34, "learning_rate": 3.3172431352169566e-05, "loss": 2.5672, "step": 192990 }, { "epoch": 0.34, "learning_rate": 3.317155941224274e-05, "loss": 2.4699, "step": 193000 }, { "epoch": 0.34, "learning_rate": 3.317068747231591e-05, "loss": 2.4578, "step": 193010 }, { "epoch": 0.34, "learning_rate": 3.3169815532389084e-05, "loss": 2.4521, "step": 193020 }, { "epoch": 0.34, "learning_rate": 3.3168943592462255e-05, "loss": 2.4899, "step": 193030 }, { "epoch": 0.34, "learning_rate": 3.3168071652535425e-05, "loss": 2.393, "step": 193040 }, { "epoch": 0.34, "learning_rate": 3.31671997126086e-05, "loss": 2.4331, "step": 193050 }, { "epoch": 0.34, "learning_rate": 3.316632777268178e-05, "loss": 2.4286, "step": 193060 }, { "epoch": 0.34, "learning_rate": 3.316545583275495e-05, "loss": 2.4385, "step": 193070 }, { "epoch": 0.34, "learning_rate": 3.316458389282812e-05, "loss": 2.4328, "step": 193080 }, { "epoch": 0.34, "learning_rate": 3.31637119529013e-05, "loss": 2.5086, "step": 193090 }, { "epoch": 0.34, "learning_rate": 3.316284001297447e-05, "loss": 2.4362, "step": 193100 }, { "epoch": 0.34, "learning_rate": 3.316196807304764e-05, "loss": 2.4469, "step": 193110 }, { "epoch": 0.34, "learning_rate": 3.316109613312081e-05, "loss": 2.4381, "step": 193120 }, { "epoch": 0.34, "learning_rate": 3.316022419319399e-05, "loss": 2.3801, "step": 193130 }, { "epoch": 0.34, "learning_rate": 3.315935225326716e-05, "loss": 2.4589, "step": 193140 }, { "epoch": 0.34, "learning_rate": 3.315848031334033e-05, "loss": 2.4109, "step": 193150 }, { "epoch": 0.34, "learning_rate": 3.3157608373413503e-05, "loss": 2.325, "step": 193160 }, { "epoch": 0.34, "learning_rate": 3.315673643348668e-05, "loss": 2.3225, "step": 193170 }, { "epoch": 0.34, "learning_rate": 3.315586449355985e-05, "loss": 2.4517, "step": 193180 }, { "epoch": 0.34, "learning_rate": 3.315499255363302e-05, "loss": 2.51, "step": 193190 }, { "epoch": 0.34, "learning_rate": 3.3154120613706205e-05, "loss": 2.457, "step": 193200 }, { "epoch": 0.34, "learning_rate": 3.3153248673779376e-05, "loss": 2.3673, "step": 193210 }, { "epoch": 0.34, "learning_rate": 3.3152376733852546e-05, "loss": 2.4826, "step": 193220 }, { "epoch": 0.34, "learning_rate": 3.3151504793925716e-05, "loss": 2.4564, "step": 193230 }, { "epoch": 0.34, "learning_rate": 3.3150632853998894e-05, "loss": 2.4204, "step": 193240 }, { "epoch": 0.34, "learning_rate": 3.3149760914072064e-05, "loss": 2.3578, "step": 193250 }, { "epoch": 0.34, "learning_rate": 3.3148888974145234e-05, "loss": 2.4918, "step": 193260 }, { "epoch": 0.34, "learning_rate": 3.314801703421841e-05, "loss": 2.4652, "step": 193270 }, { "epoch": 0.34, "learning_rate": 3.314714509429159e-05, "loss": 2.446, "step": 193280 }, { "epoch": 0.34, "learning_rate": 3.314627315436476e-05, "loss": 2.4129, "step": 193290 }, { "epoch": 0.34, "learning_rate": 3.314540121443793e-05, "loss": 2.2954, "step": 193300 }, { "epoch": 0.34, "learning_rate": 3.3144529274511107e-05, "loss": 2.4354, "step": 193310 }, { "epoch": 0.34, "learning_rate": 3.314365733458428e-05, "loss": 2.3995, "step": 193320 }, { "epoch": 0.34, "learning_rate": 3.314278539465745e-05, "loss": 2.5063, "step": 193330 }, { "epoch": 0.34, "learning_rate": 3.3141913454730625e-05, "loss": 2.4427, "step": 193340 }, { "epoch": 0.34, "learning_rate": 3.31410415148038e-05, "loss": 2.4377, "step": 193350 }, { "epoch": 0.34, "learning_rate": 3.314016957487697e-05, "loss": 2.4731, "step": 193360 }, { "epoch": 0.34, "learning_rate": 3.313929763495014e-05, "loss": 2.4404, "step": 193370 }, { "epoch": 0.34, "learning_rate": 3.313842569502332e-05, "loss": 2.4158, "step": 193380 }, { "epoch": 0.34, "learning_rate": 3.313755375509649e-05, "loss": 2.3362, "step": 193390 }, { "epoch": 0.34, "learning_rate": 3.313668181516966e-05, "loss": 2.4743, "step": 193400 }, { "epoch": 0.34, "learning_rate": 3.313580987524284e-05, "loss": 2.4323, "step": 193410 }, { "epoch": 0.34, "learning_rate": 3.3134937935316015e-05, "loss": 2.2747, "step": 193420 }, { "epoch": 0.34, "learning_rate": 3.3134065995389185e-05, "loss": 2.4482, "step": 193430 }, { "epoch": 0.34, "learning_rate": 3.3133194055462355e-05, "loss": 2.4293, "step": 193440 }, { "epoch": 0.34, "learning_rate": 3.313232211553553e-05, "loss": 2.3803, "step": 193450 }, { "epoch": 0.34, "learning_rate": 3.31314501756087e-05, "loss": 2.4494, "step": 193460 }, { "epoch": 0.34, "learning_rate": 3.313057823568187e-05, "loss": 2.4583, "step": 193470 }, { "epoch": 0.34, "learning_rate": 3.312970629575505e-05, "loss": 2.5495, "step": 193480 }, { "epoch": 0.34, "learning_rate": 3.312883435582822e-05, "loss": 2.4301, "step": 193490 }, { "epoch": 0.34, "learning_rate": 3.31279624159014e-05, "loss": 2.3632, "step": 193500 }, { "epoch": 0.34, "learning_rate": 3.312709047597457e-05, "loss": 2.455, "step": 193510 }, { "epoch": 0.34, "learning_rate": 3.3126218536047746e-05, "loss": 2.4514, "step": 193520 }, { "epoch": 0.34, "learning_rate": 3.3125346596120916e-05, "loss": 2.3447, "step": 193530 }, { "epoch": 0.34, "learning_rate": 3.3124474656194086e-05, "loss": 2.4309, "step": 193540 }, { "epoch": 0.34, "learning_rate": 3.3123602716267264e-05, "loss": 2.5727, "step": 193550 }, { "epoch": 0.34, "learning_rate": 3.3122730776340434e-05, "loss": 2.3626, "step": 193560 }, { "epoch": 0.34, "learning_rate": 3.312185883641361e-05, "loss": 2.3082, "step": 193570 }, { "epoch": 0.34, "learning_rate": 3.312098689648678e-05, "loss": 2.4508, "step": 193580 }, { "epoch": 0.34, "learning_rate": 3.312011495655996e-05, "loss": 2.45, "step": 193590 }, { "epoch": 0.34, "learning_rate": 3.311924301663313e-05, "loss": 2.4831, "step": 193600 }, { "epoch": 0.34, "learning_rate": 3.31183710767063e-05, "loss": 2.4057, "step": 193610 }, { "epoch": 0.34, "learning_rate": 3.311749913677947e-05, "loss": 2.4203, "step": 193620 }, { "epoch": 0.34, "learning_rate": 3.311662719685265e-05, "loss": 2.4026, "step": 193630 }, { "epoch": 0.34, "learning_rate": 3.311575525692582e-05, "loss": 2.4461, "step": 193640 }, { "epoch": 0.34, "learning_rate": 3.3114883316998994e-05, "loss": 2.5093, "step": 193650 }, { "epoch": 0.34, "learning_rate": 3.311401137707217e-05, "loss": 2.4198, "step": 193660 }, { "epoch": 0.34, "learning_rate": 3.311313943714534e-05, "loss": 2.4377, "step": 193670 }, { "epoch": 0.34, "learning_rate": 3.311226749721851e-05, "loss": 2.3823, "step": 193680 }, { "epoch": 0.34, "learning_rate": 3.311139555729168e-05, "loss": 2.4657, "step": 193690 }, { "epoch": 0.34, "learning_rate": 3.311052361736486e-05, "loss": 2.4662, "step": 193700 }, { "epoch": 0.34, "learning_rate": 3.310965167743803e-05, "loss": 2.4642, "step": 193710 }, { "epoch": 0.34, "learning_rate": 3.310877973751121e-05, "loss": 2.4697, "step": 193720 }, { "epoch": 0.34, "learning_rate": 3.310790779758438e-05, "loss": 2.3557, "step": 193730 }, { "epoch": 0.34, "learning_rate": 3.3107035857657555e-05, "loss": 2.4406, "step": 193740 }, { "epoch": 0.34, "learning_rate": 3.3106163917730725e-05, "loss": 2.4376, "step": 193750 }, { "epoch": 0.34, "learning_rate": 3.3105291977803896e-05, "loss": 2.328, "step": 193760 }, { "epoch": 0.34, "learning_rate": 3.310442003787707e-05, "loss": 2.4054, "step": 193770 }, { "epoch": 0.34, "learning_rate": 3.310354809795024e-05, "loss": 2.2929, "step": 193780 }, { "epoch": 0.34, "learning_rate": 3.3102676158023414e-05, "loss": 2.5431, "step": 193790 }, { "epoch": 0.34, "learning_rate": 3.310180421809659e-05, "loss": 2.3436, "step": 193800 }, { "epoch": 0.34, "learning_rate": 3.310093227816977e-05, "loss": 2.4661, "step": 193810 }, { "epoch": 0.34, "learning_rate": 3.310006033824294e-05, "loss": 2.4452, "step": 193820 }, { "epoch": 0.34, "learning_rate": 3.309918839831611e-05, "loss": 2.4171, "step": 193830 }, { "epoch": 0.34, "learning_rate": 3.3098316458389286e-05, "loss": 2.4338, "step": 193840 }, { "epoch": 0.34, "learning_rate": 3.3097444518462456e-05, "loss": 2.3268, "step": 193850 }, { "epoch": 0.34, "learning_rate": 3.309657257853563e-05, "loss": 2.4305, "step": 193860 }, { "epoch": 0.34, "learning_rate": 3.3095700638608804e-05, "loss": 2.3772, "step": 193870 }, { "epoch": 0.34, "learning_rate": 3.309482869868198e-05, "loss": 2.4303, "step": 193880 }, { "epoch": 0.34, "learning_rate": 3.309395675875515e-05, "loss": 2.3843, "step": 193890 }, { "epoch": 0.34, "learning_rate": 3.309308481882832e-05, "loss": 2.3819, "step": 193900 }, { "epoch": 0.34, "learning_rate": 3.30922128789015e-05, "loss": 2.4441, "step": 193910 }, { "epoch": 0.34, "learning_rate": 3.309134093897467e-05, "loss": 2.4818, "step": 193920 }, { "epoch": 0.34, "learning_rate": 3.309046899904784e-05, "loss": 2.4069, "step": 193930 }, { "epoch": 0.34, "learning_rate": 3.308959705912102e-05, "loss": 2.4206, "step": 193940 }, { "epoch": 0.34, "learning_rate": 3.3088725119194194e-05, "loss": 2.3917, "step": 193950 }, { "epoch": 0.34, "learning_rate": 3.3087853179267364e-05, "loss": 2.4352, "step": 193960 }, { "epoch": 0.34, "learning_rate": 3.3086981239340535e-05, "loss": 2.3454, "step": 193970 }, { "epoch": 0.34, "learning_rate": 3.308610929941371e-05, "loss": 2.5658, "step": 193980 }, { "epoch": 0.34, "learning_rate": 3.308523735948688e-05, "loss": 2.4465, "step": 193990 }, { "epoch": 0.34, "learning_rate": 3.308436541956005e-05, "loss": 2.3165, "step": 194000 }, { "epoch": 0.34, "learning_rate": 3.308349347963322e-05, "loss": 2.3528, "step": 194010 }, { "epoch": 0.34, "learning_rate": 3.308262153970641e-05, "loss": 2.3399, "step": 194020 }, { "epoch": 0.34, "learning_rate": 3.308174959977958e-05, "loss": 2.5062, "step": 194030 }, { "epoch": 0.34, "learning_rate": 3.308087765985275e-05, "loss": 2.4537, "step": 194040 }, { "epoch": 0.34, "learning_rate": 3.3080005719925925e-05, "loss": 2.4072, "step": 194050 }, { "epoch": 0.34, "learning_rate": 3.3079133779999095e-05, "loss": 2.4253, "step": 194060 }, { "epoch": 0.34, "learning_rate": 3.3078261840072266e-05, "loss": 2.3759, "step": 194070 }, { "epoch": 0.34, "learning_rate": 3.3077389900145436e-05, "loss": 2.3782, "step": 194080 }, { "epoch": 0.34, "learning_rate": 3.307651796021862e-05, "loss": 2.3931, "step": 194090 }, { "epoch": 0.34, "learning_rate": 3.307564602029179e-05, "loss": 2.3278, "step": 194100 }, { "epoch": 0.34, "learning_rate": 3.307477408036496e-05, "loss": 2.3083, "step": 194110 }, { "epoch": 0.34, "learning_rate": 3.307390214043813e-05, "loss": 2.4369, "step": 194120 }, { "epoch": 0.34, "learning_rate": 3.307303020051131e-05, "loss": 2.4228, "step": 194130 }, { "epoch": 0.34, "learning_rate": 3.307215826058448e-05, "loss": 2.353, "step": 194140 }, { "epoch": 0.34, "learning_rate": 3.307128632065765e-05, "loss": 2.3752, "step": 194150 }, { "epoch": 0.34, "learning_rate": 3.3070414380730826e-05, "loss": 2.4835, "step": 194160 }, { "epoch": 0.34, "learning_rate": 3.3069542440804e-05, "loss": 2.3901, "step": 194170 }, { "epoch": 0.34, "learning_rate": 3.3068670500877174e-05, "loss": 2.3488, "step": 194180 }, { "epoch": 0.34, "learning_rate": 3.3067798560950344e-05, "loss": 2.3111, "step": 194190 }, { "epoch": 0.34, "learning_rate": 3.306692662102352e-05, "loss": 2.4337, "step": 194200 }, { "epoch": 0.34, "learning_rate": 3.306605468109669e-05, "loss": 2.4515, "step": 194210 }, { "epoch": 0.34, "learning_rate": 3.306518274116986e-05, "loss": 2.4374, "step": 194220 }, { "epoch": 0.34, "learning_rate": 3.306431080124304e-05, "loss": 2.5623, "step": 194230 }, { "epoch": 0.34, "learning_rate": 3.3063438861316216e-05, "loss": 2.4458, "step": 194240 }, { "epoch": 0.34, "learning_rate": 3.306256692138939e-05, "loss": 2.4435, "step": 194250 }, { "epoch": 0.34, "learning_rate": 3.306169498146256e-05, "loss": 2.5066, "step": 194260 }, { "epoch": 0.34, "learning_rate": 3.3060823041535734e-05, "loss": 2.4488, "step": 194270 }, { "epoch": 0.34, "learning_rate": 3.3059951101608905e-05, "loss": 2.4348, "step": 194280 }, { "epoch": 0.34, "learning_rate": 3.3059079161682075e-05, "loss": 2.374, "step": 194290 }, { "epoch": 0.34, "learning_rate": 3.305820722175525e-05, "loss": 2.341, "step": 194300 }, { "epoch": 0.34, "learning_rate": 3.305733528182842e-05, "loss": 2.4225, "step": 194310 }, { "epoch": 0.34, "learning_rate": 3.30564633419016e-05, "loss": 2.4747, "step": 194320 }, { "epoch": 0.34, "learning_rate": 3.305559140197477e-05, "loss": 2.4524, "step": 194330 }, { "epoch": 0.34, "learning_rate": 3.305471946204795e-05, "loss": 2.4515, "step": 194340 }, { "epoch": 0.34, "learning_rate": 3.305384752212112e-05, "loss": 2.4063, "step": 194350 }, { "epoch": 0.34, "learning_rate": 3.305297558219429e-05, "loss": 2.5356, "step": 194360 }, { "epoch": 0.34, "learning_rate": 3.3052103642267465e-05, "loss": 2.4062, "step": 194370 }, { "epoch": 0.34, "learning_rate": 3.3051231702340636e-05, "loss": 2.4851, "step": 194380 }, { "epoch": 0.34, "learning_rate": 3.305035976241381e-05, "loss": 2.4727, "step": 194390 }, { "epoch": 0.34, "learning_rate": 3.304948782248698e-05, "loss": 2.4758, "step": 194400 }, { "epoch": 0.34, "learning_rate": 3.304861588256016e-05, "loss": 2.4609, "step": 194410 }, { "epoch": 0.34, "learning_rate": 3.304774394263333e-05, "loss": 2.4537, "step": 194420 }, { "epoch": 0.34, "learning_rate": 3.30468720027065e-05, "loss": 2.4332, "step": 194430 }, { "epoch": 0.34, "learning_rate": 3.304600006277968e-05, "loss": 2.3538, "step": 194440 }, { "epoch": 0.34, "learning_rate": 3.304512812285285e-05, "loss": 2.4692, "step": 194450 }, { "epoch": 0.34, "learning_rate": 3.304425618292602e-05, "loss": 2.4031, "step": 194460 }, { "epoch": 0.34, "learning_rate": 3.3043384242999196e-05, "loss": 2.433, "step": 194470 }, { "epoch": 0.34, "learning_rate": 3.304251230307237e-05, "loss": 2.419, "step": 194480 }, { "epoch": 0.34, "learning_rate": 3.3041640363145544e-05, "loss": 2.4645, "step": 194490 }, { "epoch": 0.34, "learning_rate": 3.3040768423218714e-05, "loss": 2.4822, "step": 194500 }, { "epoch": 0.34, "learning_rate": 3.3039896483291884e-05, "loss": 2.4139, "step": 194510 }, { "epoch": 0.34, "learning_rate": 3.303902454336506e-05, "loss": 2.3682, "step": 194520 }, { "epoch": 0.34, "learning_rate": 3.303815260343823e-05, "loss": 2.3006, "step": 194530 }, { "epoch": 0.34, "learning_rate": 3.303728066351141e-05, "loss": 2.3557, "step": 194540 }, { "epoch": 0.34, "learning_rate": 3.3036408723584586e-05, "loss": 2.437, "step": 194550 }, { "epoch": 0.34, "learning_rate": 3.303553678365776e-05, "loss": 2.3903, "step": 194560 }, { "epoch": 0.34, "learning_rate": 3.303466484373093e-05, "loss": 2.5014, "step": 194570 }, { "epoch": 0.34, "learning_rate": 3.30337929038041e-05, "loss": 2.5314, "step": 194580 }, { "epoch": 0.34, "learning_rate": 3.3032920963877275e-05, "loss": 2.3841, "step": 194590 }, { "epoch": 0.34, "learning_rate": 3.3032049023950445e-05, "loss": 2.3789, "step": 194600 }, { "epoch": 0.34, "learning_rate": 3.303117708402362e-05, "loss": 2.3565, "step": 194610 }, { "epoch": 0.34, "learning_rate": 3.303030514409679e-05, "loss": 2.4982, "step": 194620 }, { "epoch": 0.34, "learning_rate": 3.302943320416997e-05, "loss": 2.199, "step": 194630 }, { "epoch": 0.34, "learning_rate": 3.302856126424314e-05, "loss": 2.4505, "step": 194640 }, { "epoch": 0.34, "learning_rate": 3.302768932431631e-05, "loss": 2.4036, "step": 194650 }, { "epoch": 0.34, "learning_rate": 3.302681738438949e-05, "loss": 2.3676, "step": 194660 }, { "epoch": 0.34, "learning_rate": 3.302594544446266e-05, "loss": 2.5948, "step": 194670 }, { "epoch": 0.34, "learning_rate": 3.302507350453583e-05, "loss": 2.404, "step": 194680 }, { "epoch": 0.34, "learning_rate": 3.3024201564609006e-05, "loss": 2.4483, "step": 194690 }, { "epoch": 0.34, "learning_rate": 3.302332962468218e-05, "loss": 2.3434, "step": 194700 }, { "epoch": 0.34, "learning_rate": 3.302245768475535e-05, "loss": 2.577, "step": 194710 }, { "epoch": 0.34, "learning_rate": 3.3021585744828523e-05, "loss": 2.5122, "step": 194720 }, { "epoch": 0.34, "learning_rate": 3.30207138049017e-05, "loss": 2.3342, "step": 194730 }, { "epoch": 0.34, "learning_rate": 3.301984186497487e-05, "loss": 2.4233, "step": 194740 }, { "epoch": 0.34, "learning_rate": 3.301896992504804e-05, "loss": 2.4828, "step": 194750 }, { "epoch": 0.34, "learning_rate": 3.301809798512122e-05, "loss": 2.4428, "step": 194760 }, { "epoch": 0.34, "learning_rate": 3.3017226045194396e-05, "loss": 2.518, "step": 194770 }, { "epoch": 0.34, "learning_rate": 3.3016354105267566e-05, "loss": 2.4626, "step": 194780 }, { "epoch": 0.34, "learning_rate": 3.3015482165340736e-05, "loss": 2.3645, "step": 194790 }, { "epoch": 0.34, "learning_rate": 3.3014610225413914e-05, "loss": 2.4595, "step": 194800 }, { "epoch": 0.34, "learning_rate": 3.3013738285487084e-05, "loss": 2.5236, "step": 194810 }, { "epoch": 0.34, "learning_rate": 3.3012866345560254e-05, "loss": 2.5007, "step": 194820 }, { "epoch": 0.34, "learning_rate": 3.301199440563343e-05, "loss": 2.2951, "step": 194830 }, { "epoch": 0.34, "learning_rate": 3.301112246570661e-05, "loss": 2.4262, "step": 194840 }, { "epoch": 0.34, "learning_rate": 3.301025052577978e-05, "loss": 2.4841, "step": 194850 }, { "epoch": 0.34, "learning_rate": 3.300937858585295e-05, "loss": 2.421, "step": 194860 }, { "epoch": 0.34, "learning_rate": 3.300850664592613e-05, "loss": 2.4949, "step": 194870 }, { "epoch": 0.34, "learning_rate": 3.30076347059993e-05, "loss": 2.4524, "step": 194880 }, { "epoch": 0.34, "learning_rate": 3.300676276607247e-05, "loss": 2.3849, "step": 194890 }, { "epoch": 0.34, "learning_rate": 3.3005890826145645e-05, "loss": 2.2879, "step": 194900 }, { "epoch": 0.34, "learning_rate": 3.300501888621882e-05, "loss": 2.4527, "step": 194910 }, { "epoch": 0.34, "learning_rate": 3.300414694629199e-05, "loss": 2.3848, "step": 194920 }, { "epoch": 0.34, "learning_rate": 3.300327500636516e-05, "loss": 2.4362, "step": 194930 }, { "epoch": 0.34, "learning_rate": 3.300240306643834e-05, "loss": 2.4454, "step": 194940 }, { "epoch": 0.34, "learning_rate": 3.300153112651151e-05, "loss": 2.4034, "step": 194950 }, { "epoch": 0.34, "learning_rate": 3.300065918658468e-05, "loss": 2.5513, "step": 194960 }, { "epoch": 0.34, "learning_rate": 3.299978724665785e-05, "loss": 2.4858, "step": 194970 }, { "epoch": 0.34, "learning_rate": 3.299891530673103e-05, "loss": 2.452, "step": 194980 }, { "epoch": 0.34, "learning_rate": 3.2998043366804205e-05, "loss": 2.5097, "step": 194990 }, { "epoch": 0.34, "learning_rate": 3.2997171426877375e-05, "loss": 2.3902, "step": 195000 }, { "epoch": 0.34, "learning_rate": 3.299629948695055e-05, "loss": 2.4648, "step": 195010 }, { "epoch": 0.34, "learning_rate": 3.299542754702372e-05, "loss": 2.365, "step": 195020 }, { "epoch": 0.34, "learning_rate": 3.299455560709689e-05, "loss": 2.4414, "step": 195030 }, { "epoch": 0.34, "learning_rate": 3.2993683667170064e-05, "loss": 2.4892, "step": 195040 }, { "epoch": 0.34, "learning_rate": 3.299281172724324e-05, "loss": 2.4146, "step": 195050 }, { "epoch": 0.34, "learning_rate": 3.299193978731642e-05, "loss": 2.4699, "step": 195060 }, { "epoch": 0.34, "learning_rate": 3.299106784738959e-05, "loss": 2.4364, "step": 195070 }, { "epoch": 0.34, "learning_rate": 3.299019590746276e-05, "loss": 2.4444, "step": 195080 }, { "epoch": 0.34, "learning_rate": 3.2989323967535936e-05, "loss": 2.3237, "step": 195090 }, { "epoch": 0.34, "learning_rate": 3.2988452027609106e-05, "loss": 2.4424, "step": 195100 }, { "epoch": 0.34, "learning_rate": 3.298758008768228e-05, "loss": 2.3058, "step": 195110 }, { "epoch": 0.34, "learning_rate": 3.2986708147755454e-05, "loss": 2.3586, "step": 195120 }, { "epoch": 0.34, "learning_rate": 3.2985836207828624e-05, "loss": 2.3803, "step": 195130 }, { "epoch": 0.34, "learning_rate": 3.29849642679018e-05, "loss": 2.5268, "step": 195140 }, { "epoch": 0.34, "learning_rate": 3.298409232797497e-05, "loss": 2.4222, "step": 195150 }, { "epoch": 0.34, "learning_rate": 3.298322038804815e-05, "loss": 2.4853, "step": 195160 }, { "epoch": 0.34, "learning_rate": 3.298234844812132e-05, "loss": 2.5044, "step": 195170 }, { "epoch": 0.34, "learning_rate": 3.298147650819449e-05, "loss": 2.551, "step": 195180 }, { "epoch": 0.34, "learning_rate": 3.298060456826767e-05, "loss": 2.4921, "step": 195190 }, { "epoch": 0.34, "learning_rate": 3.297973262834084e-05, "loss": 2.5335, "step": 195200 }, { "epoch": 0.34, "learning_rate": 3.2978860688414014e-05, "loss": 2.3852, "step": 195210 }, { "epoch": 0.34, "learning_rate": 3.2977988748487185e-05, "loss": 2.5035, "step": 195220 }, { "epoch": 0.34, "learning_rate": 3.297711680856036e-05, "loss": 2.5327, "step": 195230 }, { "epoch": 0.34, "learning_rate": 3.297624486863353e-05, "loss": 2.5531, "step": 195240 }, { "epoch": 0.34, "learning_rate": 3.29753729287067e-05, "loss": 2.5099, "step": 195250 }, { "epoch": 0.34, "learning_rate": 3.297450098877988e-05, "loss": 2.3819, "step": 195260 }, { "epoch": 0.34, "learning_rate": 3.297362904885305e-05, "loss": 2.431, "step": 195270 }, { "epoch": 0.34, "learning_rate": 3.297275710892623e-05, "loss": 2.3013, "step": 195280 }, { "epoch": 0.34, "learning_rate": 3.29718851689994e-05, "loss": 2.4968, "step": 195290 }, { "epoch": 0.34, "learning_rate": 3.2971013229072575e-05, "loss": 2.4667, "step": 195300 }, { "epoch": 0.34, "learning_rate": 3.2970141289145745e-05, "loss": 2.3711, "step": 195310 }, { "epoch": 0.34, "learning_rate": 3.2969269349218916e-05, "loss": 2.431, "step": 195320 }, { "epoch": 0.34, "learning_rate": 3.296839740929209e-05, "loss": 2.3606, "step": 195330 }, { "epoch": 0.34, "learning_rate": 3.296752546936526e-05, "loss": 2.336, "step": 195340 }, { "epoch": 0.34, "learning_rate": 3.2966653529438434e-05, "loss": 2.4474, "step": 195350 }, { "epoch": 0.34, "learning_rate": 3.296578158951161e-05, "loss": 2.4252, "step": 195360 }, { "epoch": 0.34, "learning_rate": 3.296490964958479e-05, "loss": 2.5484, "step": 195370 }, { "epoch": 0.34, "learning_rate": 3.296403770965796e-05, "loss": 2.3289, "step": 195380 }, { "epoch": 0.34, "learning_rate": 3.296316576973113e-05, "loss": 2.392, "step": 195390 }, { "epoch": 0.34, "learning_rate": 3.2962293829804306e-05, "loss": 2.5111, "step": 195400 }, { "epoch": 0.34, "learning_rate": 3.2961421889877476e-05, "loss": 2.3768, "step": 195410 }, { "epoch": 0.34, "learning_rate": 3.296054994995065e-05, "loss": 2.4207, "step": 195420 }, { "epoch": 0.34, "learning_rate": 3.2959678010023824e-05, "loss": 2.4897, "step": 195430 }, { "epoch": 0.34, "learning_rate": 3.2958806070097e-05, "loss": 2.2932, "step": 195440 }, { "epoch": 0.34, "learning_rate": 3.295793413017017e-05, "loss": 2.4267, "step": 195450 }, { "epoch": 0.34, "learning_rate": 3.295706219024334e-05, "loss": 2.3956, "step": 195460 }, { "epoch": 0.34, "learning_rate": 3.295619025031651e-05, "loss": 2.4517, "step": 195470 }, { "epoch": 0.34, "learning_rate": 3.295531831038969e-05, "loss": 2.3154, "step": 195480 }, { "epoch": 0.34, "learning_rate": 3.295444637046286e-05, "loss": 2.4418, "step": 195490 }, { "epoch": 0.34, "learning_rate": 3.295357443053603e-05, "loss": 2.3954, "step": 195500 }, { "epoch": 0.34, "learning_rate": 3.2952702490609214e-05, "loss": 2.383, "step": 195510 }, { "epoch": 0.34, "learning_rate": 3.2951830550682384e-05, "loss": 2.3856, "step": 195520 }, { "epoch": 0.34, "learning_rate": 3.2950958610755555e-05, "loss": 2.4079, "step": 195530 }, { "epoch": 0.34, "learning_rate": 3.2950086670828725e-05, "loss": 2.3877, "step": 195540 }, { "epoch": 0.34, "learning_rate": 3.29492147309019e-05, "loss": 2.3346, "step": 195550 }, { "epoch": 0.34, "learning_rate": 3.294834279097507e-05, "loss": 2.3229, "step": 195560 }, { "epoch": 0.34, "learning_rate": 3.294747085104824e-05, "loss": 2.4965, "step": 195570 }, { "epoch": 0.34, "learning_rate": 3.294659891112142e-05, "loss": 2.3875, "step": 195580 }, { "epoch": 0.34, "learning_rate": 3.29457269711946e-05, "loss": 2.5118, "step": 195590 }, { "epoch": 0.34, "learning_rate": 3.294485503126777e-05, "loss": 2.4796, "step": 195600 }, { "epoch": 0.34, "learning_rate": 3.294398309134094e-05, "loss": 2.3503, "step": 195610 }, { "epoch": 0.34, "learning_rate": 3.2943111151414115e-05, "loss": 2.4926, "step": 195620 }, { "epoch": 0.34, "learning_rate": 3.2942239211487286e-05, "loss": 2.4564, "step": 195630 }, { "epoch": 0.34, "learning_rate": 3.2941367271560456e-05, "loss": 2.3809, "step": 195640 }, { "epoch": 0.34, "learning_rate": 3.294049533163363e-05, "loss": 2.3878, "step": 195650 }, { "epoch": 0.34, "learning_rate": 3.293962339170681e-05, "loss": 2.3591, "step": 195660 }, { "epoch": 0.34, "learning_rate": 3.293875145177998e-05, "loss": 2.5826, "step": 195670 }, { "epoch": 0.34, "learning_rate": 3.293787951185315e-05, "loss": 2.4256, "step": 195680 }, { "epoch": 0.34, "learning_rate": 3.293700757192633e-05, "loss": 2.4177, "step": 195690 }, { "epoch": 0.34, "learning_rate": 3.29361356319995e-05, "loss": 2.2731, "step": 195700 }, { "epoch": 0.34, "learning_rate": 3.293526369207267e-05, "loss": 2.4207, "step": 195710 }, { "epoch": 0.34, "learning_rate": 3.2934391752145846e-05, "loss": 2.479, "step": 195720 }, { "epoch": 0.34, "learning_rate": 3.2933519812219023e-05, "loss": 2.3537, "step": 195730 }, { "epoch": 0.34, "learning_rate": 3.2932647872292194e-05, "loss": 2.433, "step": 195740 }, { "epoch": 0.34, "learning_rate": 3.2931775932365364e-05, "loss": 2.4844, "step": 195750 }, { "epoch": 0.34, "learning_rate": 3.293090399243854e-05, "loss": 2.4362, "step": 195760 }, { "epoch": 0.34, "learning_rate": 3.293003205251171e-05, "loss": 2.5045, "step": 195770 }, { "epoch": 0.34, "learning_rate": 3.292916011258488e-05, "loss": 2.5006, "step": 195780 }, { "epoch": 0.34, "learning_rate": 3.292828817265806e-05, "loss": 2.3688, "step": 195790 }, { "epoch": 0.34, "learning_rate": 3.292741623273123e-05, "loss": 2.3847, "step": 195800 }, { "epoch": 0.34, "learning_rate": 3.292654429280441e-05, "loss": 2.349, "step": 195810 }, { "epoch": 0.34, "learning_rate": 3.292567235287758e-05, "loss": 2.4771, "step": 195820 }, { "epoch": 0.34, "learning_rate": 3.2924800412950754e-05, "loss": 2.395, "step": 195830 }, { "epoch": 0.34, "learning_rate": 3.2923928473023925e-05, "loss": 2.4429, "step": 195840 }, { "epoch": 0.34, "learning_rate": 3.2923056533097095e-05, "loss": 2.3885, "step": 195850 }, { "epoch": 0.34, "learning_rate": 3.2922184593170265e-05, "loss": 2.3345, "step": 195860 }, { "epoch": 0.34, "learning_rate": 3.292131265324344e-05, "loss": 2.4395, "step": 195870 }, { "epoch": 0.34, "learning_rate": 3.292044071331662e-05, "loss": 2.4213, "step": 195880 }, { "epoch": 0.34, "learning_rate": 3.291956877338979e-05, "loss": 2.4485, "step": 195890 }, { "epoch": 0.34, "learning_rate": 3.291869683346297e-05, "loss": 2.5571, "step": 195900 }, { "epoch": 0.34, "learning_rate": 3.291782489353614e-05, "loss": 2.4477, "step": 195910 }, { "epoch": 0.34, "learning_rate": 3.291695295360931e-05, "loss": 2.4242, "step": 195920 }, { "epoch": 0.34, "learning_rate": 3.291608101368248e-05, "loss": 2.4496, "step": 195930 }, { "epoch": 0.34, "learning_rate": 3.2915209073755656e-05, "loss": 2.4595, "step": 195940 }, { "epoch": 0.34, "learning_rate": 3.291433713382883e-05, "loss": 2.4314, "step": 195950 }, { "epoch": 0.34, "learning_rate": 3.2913465193902e-05, "loss": 2.4445, "step": 195960 }, { "epoch": 0.34, "learning_rate": 3.2912593253975174e-05, "loss": 2.5034, "step": 195970 }, { "epoch": 0.34, "learning_rate": 3.291172131404835e-05, "loss": 2.4866, "step": 195980 }, { "epoch": 0.34, "learning_rate": 3.291084937412152e-05, "loss": 2.3646, "step": 195990 }, { "epoch": 0.34, "learning_rate": 3.290997743419469e-05, "loss": 2.3915, "step": 196000 }, { "epoch": 0.34, "learning_rate": 3.290910549426787e-05, "loss": 2.4029, "step": 196010 }, { "epoch": 0.34, "learning_rate": 3.290823355434104e-05, "loss": 2.3731, "step": 196020 }, { "epoch": 0.34, "learning_rate": 3.2907361614414216e-05, "loss": 2.2222, "step": 196030 }, { "epoch": 0.34, "learning_rate": 3.2906489674487387e-05, "loss": 2.3923, "step": 196040 }, { "epoch": 0.34, "learning_rate": 3.2905617734560564e-05, "loss": 2.336, "step": 196050 }, { "epoch": 0.34, "learning_rate": 3.2904745794633734e-05, "loss": 2.3057, "step": 196060 }, { "epoch": 0.34, "learning_rate": 3.2903873854706904e-05, "loss": 2.525, "step": 196070 }, { "epoch": 0.34, "learning_rate": 3.290300191478008e-05, "loss": 2.4401, "step": 196080 }, { "epoch": 0.34, "learning_rate": 3.290212997485325e-05, "loss": 2.4996, "step": 196090 }, { "epoch": 0.34, "learning_rate": 3.290125803492643e-05, "loss": 2.4439, "step": 196100 }, { "epoch": 0.34, "learning_rate": 3.29003860949996e-05, "loss": 2.4193, "step": 196110 }, { "epoch": 0.34, "learning_rate": 3.289951415507278e-05, "loss": 2.3983, "step": 196120 }, { "epoch": 0.34, "learning_rate": 3.289864221514595e-05, "loss": 2.4759, "step": 196130 }, { "epoch": 0.34, "learning_rate": 3.289777027521912e-05, "loss": 2.5924, "step": 196140 }, { "epoch": 0.34, "learning_rate": 3.2896898335292295e-05, "loss": 2.419, "step": 196150 }, { "epoch": 0.34, "learning_rate": 3.2896026395365465e-05, "loss": 2.4186, "step": 196160 }, { "epoch": 0.34, "learning_rate": 3.2895154455438635e-05, "loss": 2.3971, "step": 196170 }, { "epoch": 0.34, "learning_rate": 3.289428251551181e-05, "loss": 2.5124, "step": 196180 }, { "epoch": 0.34, "learning_rate": 3.289341057558499e-05, "loss": 2.4813, "step": 196190 }, { "epoch": 0.34, "learning_rate": 3.289253863565816e-05, "loss": 2.3771, "step": 196200 }, { "epoch": 0.34, "learning_rate": 3.289166669573133e-05, "loss": 2.4428, "step": 196210 }, { "epoch": 0.34, "learning_rate": 3.289079475580451e-05, "loss": 2.5916, "step": 196220 }, { "epoch": 0.34, "learning_rate": 3.288992281587768e-05, "loss": 2.4995, "step": 196230 }, { "epoch": 0.34, "learning_rate": 3.288905087595085e-05, "loss": 2.4555, "step": 196240 }, { "epoch": 0.34, "learning_rate": 3.2888178936024026e-05, "loss": 2.4908, "step": 196250 }, { "epoch": 0.34, "learning_rate": 3.28873069960972e-05, "loss": 2.4987, "step": 196260 }, { "epoch": 0.34, "learning_rate": 3.288643505617037e-05, "loss": 2.3531, "step": 196270 }, { "epoch": 0.34, "learning_rate": 3.2885563116243543e-05, "loss": 2.4454, "step": 196280 }, { "epoch": 0.34, "learning_rate": 3.288469117631672e-05, "loss": 2.5531, "step": 196290 }, { "epoch": 0.34, "learning_rate": 3.288381923638989e-05, "loss": 2.4689, "step": 196300 }, { "epoch": 0.34, "learning_rate": 3.288294729646306e-05, "loss": 2.5183, "step": 196310 }, { "epoch": 0.34, "learning_rate": 3.288207535653623e-05, "loss": 2.3593, "step": 196320 }, { "epoch": 0.34, "learning_rate": 3.2881203416609416e-05, "loss": 2.4692, "step": 196330 }, { "epoch": 0.34, "learning_rate": 3.2880331476682586e-05, "loss": 2.4414, "step": 196340 }, { "epoch": 0.34, "learning_rate": 3.2879459536755756e-05, "loss": 2.4312, "step": 196350 }, { "epoch": 0.34, "learning_rate": 3.2878587596828934e-05, "loss": 2.3258, "step": 196360 }, { "epoch": 0.34, "learning_rate": 3.2877715656902104e-05, "loss": 2.547, "step": 196370 }, { "epoch": 0.34, "learning_rate": 3.2876843716975274e-05, "loss": 2.463, "step": 196380 }, { "epoch": 0.34, "learning_rate": 3.2875971777048445e-05, "loss": 2.3565, "step": 196390 }, { "epoch": 0.34, "learning_rate": 3.287509983712163e-05, "loss": 2.3105, "step": 196400 }, { "epoch": 0.34, "learning_rate": 3.28742278971948e-05, "loss": 2.4097, "step": 196410 }, { "epoch": 0.34, "learning_rate": 3.287335595726797e-05, "loss": 2.4992, "step": 196420 }, { "epoch": 0.34, "learning_rate": 3.287248401734114e-05, "loss": 2.4154, "step": 196430 }, { "epoch": 0.34, "learning_rate": 3.287161207741432e-05, "loss": 2.4619, "step": 196440 }, { "epoch": 0.34, "learning_rate": 3.287074013748749e-05, "loss": 2.4778, "step": 196450 }, { "epoch": 0.34, "learning_rate": 3.286986819756066e-05, "loss": 2.4179, "step": 196460 }, { "epoch": 0.34, "learning_rate": 3.286899625763384e-05, "loss": 2.4269, "step": 196470 }, { "epoch": 0.34, "learning_rate": 3.286812431770701e-05, "loss": 2.5742, "step": 196480 }, { "epoch": 0.34, "learning_rate": 3.286725237778018e-05, "loss": 2.3355, "step": 196490 }, { "epoch": 0.34, "learning_rate": 3.286638043785335e-05, "loss": 2.5561, "step": 196500 }, { "epoch": 0.34, "learning_rate": 3.286550849792653e-05, "loss": 2.4422, "step": 196510 }, { "epoch": 0.34, "learning_rate": 3.28646365579997e-05, "loss": 2.3579, "step": 196520 }, { "epoch": 0.34, "learning_rate": 3.286376461807287e-05, "loss": 2.3806, "step": 196530 }, { "epoch": 0.34, "learning_rate": 3.286289267814605e-05, "loss": 2.4357, "step": 196540 }, { "epoch": 0.34, "learning_rate": 3.2862020738219225e-05, "loss": 2.4337, "step": 196550 }, { "epoch": 0.34, "learning_rate": 3.2861148798292395e-05, "loss": 2.5019, "step": 196560 }, { "epoch": 0.34, "learning_rate": 3.2860276858365566e-05, "loss": 2.3138, "step": 196570 }, { "epoch": 0.34, "learning_rate": 3.285940491843874e-05, "loss": 2.4566, "step": 196580 }, { "epoch": 0.34, "learning_rate": 3.2858532978511913e-05, "loss": 2.4665, "step": 196590 }, { "epoch": 0.34, "learning_rate": 3.2857661038585084e-05, "loss": 2.3649, "step": 196600 }, { "epoch": 0.34, "learning_rate": 3.285678909865826e-05, "loss": 2.3847, "step": 196610 }, { "epoch": 0.34, "learning_rate": 3.285591715873144e-05, "loss": 2.4399, "step": 196620 }, { "epoch": 0.34, "learning_rate": 3.285504521880461e-05, "loss": 2.3267, "step": 196630 }, { "epoch": 0.34, "learning_rate": 3.285417327887778e-05, "loss": 2.414, "step": 196640 }, { "epoch": 0.34, "learning_rate": 3.2853301338950956e-05, "loss": 2.4315, "step": 196650 }, { "epoch": 0.34, "learning_rate": 3.2852429399024126e-05, "loss": 2.3586, "step": 196660 }, { "epoch": 0.34, "learning_rate": 3.28515574590973e-05, "loss": 2.4564, "step": 196670 }, { "epoch": 0.34, "learning_rate": 3.2850685519170474e-05, "loss": 2.4476, "step": 196680 }, { "epoch": 0.34, "learning_rate": 3.2849813579243644e-05, "loss": 2.3552, "step": 196690 }, { "epoch": 0.34, "learning_rate": 3.284894163931682e-05, "loss": 2.4156, "step": 196700 }, { "epoch": 0.34, "learning_rate": 3.284806969938999e-05, "loss": 2.398, "step": 196710 }, { "epoch": 0.34, "learning_rate": 3.284719775946317e-05, "loss": 2.365, "step": 196720 }, { "epoch": 0.34, "learning_rate": 3.284632581953634e-05, "loss": 2.4704, "step": 196730 }, { "epoch": 0.34, "learning_rate": 3.284545387960951e-05, "loss": 2.5401, "step": 196740 }, { "epoch": 0.34, "learning_rate": 3.284458193968269e-05, "loss": 2.3435, "step": 196750 }, { "epoch": 0.34, "learning_rate": 3.284370999975586e-05, "loss": 2.4099, "step": 196760 }, { "epoch": 0.34, "learning_rate": 3.2842838059829034e-05, "loss": 2.3921, "step": 196770 }, { "epoch": 0.34, "learning_rate": 3.2841966119902205e-05, "loss": 2.385, "step": 196780 }, { "epoch": 0.34, "learning_rate": 3.284109417997538e-05, "loss": 2.5766, "step": 196790 }, { "epoch": 0.34, "learning_rate": 3.284022224004855e-05, "loss": 2.3179, "step": 196800 }, { "epoch": 0.34, "learning_rate": 3.283935030012172e-05, "loss": 2.501, "step": 196810 }, { "epoch": 0.34, "learning_rate": 3.283847836019489e-05, "loss": 2.434, "step": 196820 }, { "epoch": 0.34, "learning_rate": 3.283760642026807e-05, "loss": 2.3942, "step": 196830 }, { "epoch": 0.34, "learning_rate": 3.283673448034124e-05, "loss": 2.4678, "step": 196840 }, { "epoch": 0.34, "learning_rate": 3.283586254041442e-05, "loss": 2.3404, "step": 196850 }, { "epoch": 0.34, "learning_rate": 3.2834990600487595e-05, "loss": 2.4059, "step": 196860 }, { "epoch": 0.34, "learning_rate": 3.2834118660560765e-05, "loss": 2.3999, "step": 196870 }, { "epoch": 0.34, "learning_rate": 3.2833246720633936e-05, "loss": 2.4223, "step": 196880 }, { "epoch": 0.34, "learning_rate": 3.2832374780707106e-05, "loss": 2.4292, "step": 196890 }, { "epoch": 0.34, "learning_rate": 3.283150284078028e-05, "loss": 2.5726, "step": 196900 }, { "epoch": 0.34, "learning_rate": 3.2830630900853454e-05, "loss": 2.4264, "step": 196910 }, { "epoch": 0.34, "learning_rate": 3.282975896092663e-05, "loss": 2.5193, "step": 196920 }, { "epoch": 0.34, "learning_rate": 3.28288870209998e-05, "loss": 2.4353, "step": 196930 }, { "epoch": 0.34, "learning_rate": 3.282801508107298e-05, "loss": 2.329, "step": 196940 }, { "epoch": 0.34, "learning_rate": 3.282714314114615e-05, "loss": 2.3524, "step": 196950 }, { "epoch": 0.34, "learning_rate": 3.282627120121932e-05, "loss": 2.3616, "step": 196960 }, { "epoch": 0.34, "learning_rate": 3.2825399261292496e-05, "loss": 2.4817, "step": 196970 }, { "epoch": 0.34, "learning_rate": 3.282452732136567e-05, "loss": 2.4201, "step": 196980 }, { "epoch": 0.34, "learning_rate": 3.282365538143884e-05, "loss": 2.4115, "step": 196990 }, { "epoch": 0.34, "learning_rate": 3.2822783441512014e-05, "loss": 2.4124, "step": 197000 }, { "epoch": 0.34, "learning_rate": 3.282191150158519e-05, "loss": 2.3631, "step": 197010 }, { "epoch": 0.34, "learning_rate": 3.282103956165836e-05, "loss": 2.414, "step": 197020 }, { "epoch": 0.34, "learning_rate": 3.282016762173153e-05, "loss": 2.4704, "step": 197030 }, { "epoch": 0.34, "learning_rate": 3.281929568180471e-05, "loss": 2.5027, "step": 197040 }, { "epoch": 0.34, "learning_rate": 3.281842374187788e-05, "loss": 2.3949, "step": 197050 }, { "epoch": 0.34, "learning_rate": 3.281755180195105e-05, "loss": 2.3845, "step": 197060 }, { "epoch": 0.34, "learning_rate": 3.281667986202423e-05, "loss": 2.3689, "step": 197070 }, { "epoch": 0.34, "learning_rate": 3.2815807922097404e-05, "loss": 2.3801, "step": 197080 }, { "epoch": 0.34, "learning_rate": 3.2814935982170575e-05, "loss": 2.4366, "step": 197090 }, { "epoch": 0.34, "learning_rate": 3.2814064042243745e-05, "loss": 2.2625, "step": 197100 }, { "epoch": 0.34, "learning_rate": 3.281319210231692e-05, "loss": 2.4049, "step": 197110 }, { "epoch": 0.34, "learning_rate": 3.281232016239009e-05, "loss": 2.4485, "step": 197120 }, { "epoch": 0.34, "learning_rate": 3.281144822246326e-05, "loss": 2.455, "step": 197130 }, { "epoch": 0.34, "learning_rate": 3.281057628253644e-05, "loss": 2.3916, "step": 197140 }, { "epoch": 0.34, "learning_rate": 3.280970434260962e-05, "loss": 2.4447, "step": 197150 }, { "epoch": 0.34, "learning_rate": 3.280883240268279e-05, "loss": 2.3374, "step": 197160 }, { "epoch": 0.34, "learning_rate": 3.280796046275596e-05, "loss": 2.4143, "step": 197170 }, { "epoch": 0.34, "learning_rate": 3.2807088522829135e-05, "loss": 2.3823, "step": 197180 }, { "epoch": 0.34, "learning_rate": 3.2806216582902306e-05, "loss": 2.5207, "step": 197190 }, { "epoch": 0.34, "learning_rate": 3.2805344642975476e-05, "loss": 2.3257, "step": 197200 }, { "epoch": 0.34, "learning_rate": 3.2804472703048646e-05, "loss": 2.4762, "step": 197210 }, { "epoch": 0.34, "learning_rate": 3.280360076312183e-05, "loss": 2.3175, "step": 197220 }, { "epoch": 0.34, "learning_rate": 3.2802728823195e-05, "loss": 2.3376, "step": 197230 }, { "epoch": 0.34, "learning_rate": 3.280185688326817e-05, "loss": 2.5033, "step": 197240 }, { "epoch": 0.34, "learning_rate": 3.280098494334135e-05, "loss": 2.3689, "step": 197250 }, { "epoch": 0.34, "learning_rate": 3.280011300341452e-05, "loss": 2.3967, "step": 197260 }, { "epoch": 0.34, "learning_rate": 3.279924106348769e-05, "loss": 2.4953, "step": 197270 }, { "epoch": 0.34, "learning_rate": 3.279836912356086e-05, "loss": 2.478, "step": 197280 }, { "epoch": 0.34, "learning_rate": 3.2797497183634043e-05, "loss": 2.3888, "step": 197290 }, { "epoch": 0.34, "learning_rate": 3.2796625243707214e-05, "loss": 2.4684, "step": 197300 }, { "epoch": 0.34, "learning_rate": 3.2795753303780384e-05, "loss": 2.2935, "step": 197310 }, { "epoch": 0.34, "learning_rate": 3.2794881363853555e-05, "loss": 2.43, "step": 197320 }, { "epoch": 0.34, "learning_rate": 3.279400942392673e-05, "loss": 2.3893, "step": 197330 }, { "epoch": 0.34, "learning_rate": 3.27931374839999e-05, "loss": 2.3266, "step": 197340 }, { "epoch": 0.34, "learning_rate": 3.279226554407307e-05, "loss": 2.287, "step": 197350 }, { "epoch": 0.34, "learning_rate": 3.279139360414625e-05, "loss": 2.4158, "step": 197360 }, { "epoch": 0.34, "learning_rate": 3.279052166421943e-05, "loss": 2.4059, "step": 197370 }, { "epoch": 0.34, "learning_rate": 3.27896497242926e-05, "loss": 2.3842, "step": 197380 }, { "epoch": 0.34, "learning_rate": 3.278877778436577e-05, "loss": 2.3955, "step": 197390 }, { "epoch": 0.34, "learning_rate": 3.2787905844438945e-05, "loss": 2.3588, "step": 197400 }, { "epoch": 0.34, "learning_rate": 3.2787033904512115e-05, "loss": 2.2616, "step": 197410 }, { "epoch": 0.34, "learning_rate": 3.2786161964585285e-05, "loss": 2.4946, "step": 197420 }, { "epoch": 0.34, "learning_rate": 3.278529002465846e-05, "loss": 2.3678, "step": 197430 }, { "epoch": 0.34, "learning_rate": 3.278441808473164e-05, "loss": 2.4445, "step": 197440 }, { "epoch": 0.34, "learning_rate": 3.278354614480481e-05, "loss": 2.4463, "step": 197450 }, { "epoch": 0.34, "learning_rate": 3.278267420487798e-05, "loss": 2.5301, "step": 197460 }, { "epoch": 0.34, "learning_rate": 3.278180226495116e-05, "loss": 2.42, "step": 197470 }, { "epoch": 0.34, "learning_rate": 3.278093032502433e-05, "loss": 2.4671, "step": 197480 }, { "epoch": 0.34, "learning_rate": 3.27800583850975e-05, "loss": 2.4242, "step": 197490 }, { "epoch": 0.34, "learning_rate": 3.2779186445170676e-05, "loss": 2.338, "step": 197500 }, { "epoch": 0.34, "learning_rate": 3.2778314505243846e-05, "loss": 2.3659, "step": 197510 }, { "epoch": 0.34, "learning_rate": 3.277744256531702e-05, "loss": 2.4196, "step": 197520 }, { "epoch": 0.34, "learning_rate": 3.2776570625390194e-05, "loss": 2.5184, "step": 197530 }, { "epoch": 0.34, "learning_rate": 3.277569868546337e-05, "loss": 2.3613, "step": 197540 }, { "epoch": 0.34, "learning_rate": 3.277482674553654e-05, "loss": 2.4309, "step": 197550 }, { "epoch": 0.34, "learning_rate": 3.277395480560971e-05, "loss": 2.4146, "step": 197560 }, { "epoch": 0.34, "learning_rate": 3.277308286568289e-05, "loss": 2.4372, "step": 197570 }, { "epoch": 0.34, "learning_rate": 3.277221092575606e-05, "loss": 2.2628, "step": 197580 }, { "epoch": 0.34, "learning_rate": 3.2771338985829236e-05, "loss": 2.5031, "step": 197590 }, { "epoch": 0.34, "learning_rate": 3.2770467045902407e-05, "loss": 2.3892, "step": 197600 }, { "epoch": 0.34, "learning_rate": 3.2769595105975584e-05, "loss": 2.4125, "step": 197610 }, { "epoch": 0.34, "learning_rate": 3.2768723166048754e-05, "loss": 2.4465, "step": 197620 }, { "epoch": 0.34, "learning_rate": 3.2767851226121924e-05, "loss": 2.4173, "step": 197630 }, { "epoch": 0.34, "learning_rate": 3.27669792861951e-05, "loss": 2.5536, "step": 197640 }, { "epoch": 0.34, "learning_rate": 3.276610734626827e-05, "loss": 2.3995, "step": 197650 }, { "epoch": 0.34, "learning_rate": 3.276523540634144e-05, "loss": 2.3616, "step": 197660 }, { "epoch": 0.34, "learning_rate": 3.276436346641462e-05, "loss": 2.3817, "step": 197670 }, { "epoch": 0.34, "learning_rate": 3.27634915264878e-05, "loss": 2.3813, "step": 197680 }, { "epoch": 0.34, "learning_rate": 3.276261958656097e-05, "loss": 2.4029, "step": 197690 }, { "epoch": 0.34, "learning_rate": 3.276174764663414e-05, "loss": 2.3832, "step": 197700 }, { "epoch": 0.34, "learning_rate": 3.2760875706707315e-05, "loss": 2.4866, "step": 197710 }, { "epoch": 0.34, "learning_rate": 3.2760003766780485e-05, "loss": 2.3855, "step": 197720 }, { "epoch": 0.34, "learning_rate": 3.2759131826853655e-05, "loss": 2.5165, "step": 197730 }, { "epoch": 0.34, "learning_rate": 3.275825988692683e-05, "loss": 2.489, "step": 197740 }, { "epoch": 0.34, "learning_rate": 3.275738794700001e-05, "loss": 2.4633, "step": 197750 }, { "epoch": 0.34, "learning_rate": 3.275651600707318e-05, "loss": 2.4175, "step": 197760 }, { "epoch": 0.34, "learning_rate": 3.275564406714635e-05, "loss": 2.3845, "step": 197770 }, { "epoch": 0.34, "learning_rate": 3.275477212721952e-05, "loss": 2.4227, "step": 197780 }, { "epoch": 0.34, "learning_rate": 3.27539001872927e-05, "loss": 2.3905, "step": 197790 }, { "epoch": 0.34, "learning_rate": 3.275302824736587e-05, "loss": 2.3225, "step": 197800 }, { "epoch": 0.34, "learning_rate": 3.2752156307439046e-05, "loss": 2.4173, "step": 197810 }, { "epoch": 0.34, "learning_rate": 3.275128436751222e-05, "loss": 2.3955, "step": 197820 }, { "epoch": 0.34, "learning_rate": 3.275041242758539e-05, "loss": 2.3891, "step": 197830 }, { "epoch": 0.35, "learning_rate": 3.2749540487658563e-05, "loss": 2.3459, "step": 197840 }, { "epoch": 0.35, "learning_rate": 3.2748668547731734e-05, "loss": 2.3574, "step": 197850 }, { "epoch": 0.35, "learning_rate": 3.274779660780491e-05, "loss": 2.3638, "step": 197860 }, { "epoch": 0.35, "learning_rate": 3.274692466787808e-05, "loss": 2.4282, "step": 197870 }, { "epoch": 0.35, "learning_rate": 3.274605272795125e-05, "loss": 2.4323, "step": 197880 }, { "epoch": 0.35, "learning_rate": 3.274518078802443e-05, "loss": 2.3476, "step": 197890 }, { "epoch": 0.35, "learning_rate": 3.2744308848097606e-05, "loss": 2.4799, "step": 197900 }, { "epoch": 0.35, "learning_rate": 3.2743436908170776e-05, "loss": 2.4199, "step": 197910 }, { "epoch": 0.35, "learning_rate": 3.274256496824395e-05, "loss": 2.4037, "step": 197920 }, { "epoch": 0.35, "learning_rate": 3.2741693028317124e-05, "loss": 2.4509, "step": 197930 }, { "epoch": 0.35, "learning_rate": 3.2740821088390294e-05, "loss": 2.448, "step": 197940 }, { "epoch": 0.35, "learning_rate": 3.2739949148463465e-05, "loss": 2.4416, "step": 197950 }, { "epoch": 0.35, "learning_rate": 3.273907720853664e-05, "loss": 2.4769, "step": 197960 }, { "epoch": 0.35, "learning_rate": 3.273820526860982e-05, "loss": 2.4829, "step": 197970 }, { "epoch": 0.35, "learning_rate": 3.273733332868299e-05, "loss": 2.4326, "step": 197980 }, { "epoch": 0.35, "learning_rate": 3.273646138875616e-05, "loss": 2.4176, "step": 197990 }, { "epoch": 0.35, "learning_rate": 3.273558944882934e-05, "loss": 2.5475, "step": 198000 }, { "epoch": 0.35, "learning_rate": 3.273471750890251e-05, "loss": 2.312, "step": 198010 }, { "epoch": 0.35, "learning_rate": 3.273384556897568e-05, "loss": 2.4056, "step": 198020 }, { "epoch": 0.35, "learning_rate": 3.2732973629048855e-05, "loss": 2.3903, "step": 198030 }, { "epoch": 0.35, "learning_rate": 3.273210168912203e-05, "loss": 2.4798, "step": 198040 }, { "epoch": 0.35, "learning_rate": 3.27312297491952e-05, "loss": 2.3929, "step": 198050 }, { "epoch": 0.35, "learning_rate": 3.273035780926837e-05, "loss": 2.4085, "step": 198060 }, { "epoch": 0.35, "learning_rate": 3.272948586934155e-05, "loss": 2.4689, "step": 198070 }, { "epoch": 0.35, "learning_rate": 3.272861392941472e-05, "loss": 2.5175, "step": 198080 }, { "epoch": 0.35, "learning_rate": 3.272774198948789e-05, "loss": 2.3855, "step": 198090 }, { "epoch": 0.35, "learning_rate": 3.272687004956107e-05, "loss": 2.2596, "step": 198100 }, { "epoch": 0.35, "learning_rate": 3.2725998109634245e-05, "loss": 2.3381, "step": 198110 }, { "epoch": 0.35, "learning_rate": 3.2725126169707415e-05, "loss": 2.5421, "step": 198120 }, { "epoch": 0.35, "learning_rate": 3.2724254229780586e-05, "loss": 2.4908, "step": 198130 }, { "epoch": 0.35, "learning_rate": 3.272338228985376e-05, "loss": 2.3996, "step": 198140 }, { "epoch": 0.35, "learning_rate": 3.2722510349926933e-05, "loss": 2.4501, "step": 198150 }, { "epoch": 0.35, "learning_rate": 3.2721638410000104e-05, "loss": 2.4486, "step": 198160 }, { "epoch": 0.35, "learning_rate": 3.2720766470073274e-05, "loss": 2.3831, "step": 198170 }, { "epoch": 0.35, "learning_rate": 3.271989453014645e-05, "loss": 2.4209, "step": 198180 }, { "epoch": 0.35, "learning_rate": 3.271902259021963e-05, "loss": 2.3984, "step": 198190 }, { "epoch": 0.35, "learning_rate": 3.27181506502928e-05, "loss": 2.4279, "step": 198200 }, { "epoch": 0.35, "learning_rate": 3.2717278710365976e-05, "loss": 2.524, "step": 198210 }, { "epoch": 0.35, "learning_rate": 3.2716406770439146e-05, "loss": 2.5045, "step": 198220 }, { "epoch": 0.35, "learning_rate": 3.271553483051232e-05, "loss": 2.5091, "step": 198230 }, { "epoch": 0.35, "learning_rate": 3.271466289058549e-05, "loss": 2.4571, "step": 198240 }, { "epoch": 0.35, "learning_rate": 3.2713790950658664e-05, "loss": 2.3588, "step": 198250 }, { "epoch": 0.35, "learning_rate": 3.271291901073184e-05, "loss": 2.4771, "step": 198260 }, { "epoch": 0.35, "learning_rate": 3.271204707080501e-05, "loss": 2.4653, "step": 198270 }, { "epoch": 0.35, "learning_rate": 3.271117513087818e-05, "loss": 2.369, "step": 198280 }, { "epoch": 0.35, "learning_rate": 3.271030319095136e-05, "loss": 2.3752, "step": 198290 }, { "epoch": 0.35, "learning_rate": 3.270943125102453e-05, "loss": 2.3578, "step": 198300 }, { "epoch": 0.35, "learning_rate": 3.27085593110977e-05, "loss": 2.3974, "step": 198310 }, { "epoch": 0.35, "learning_rate": 3.270768737117088e-05, "loss": 2.487, "step": 198320 }, { "epoch": 0.35, "learning_rate": 3.2706815431244054e-05, "loss": 2.5572, "step": 198330 }, { "epoch": 0.35, "learning_rate": 3.2705943491317225e-05, "loss": 2.3625, "step": 198340 }, { "epoch": 0.35, "learning_rate": 3.2705071551390395e-05, "loss": 2.4762, "step": 198350 }, { "epoch": 0.35, "learning_rate": 3.270419961146357e-05, "loss": 2.4687, "step": 198360 }, { "epoch": 0.35, "learning_rate": 3.270332767153674e-05, "loss": 2.5188, "step": 198370 }, { "epoch": 0.35, "learning_rate": 3.270245573160991e-05, "loss": 2.3417, "step": 198380 }, { "epoch": 0.35, "learning_rate": 3.270158379168309e-05, "loss": 2.3281, "step": 198390 }, { "epoch": 0.35, "learning_rate": 3.270071185175626e-05, "loss": 2.4652, "step": 198400 }, { "epoch": 0.35, "learning_rate": 3.269983991182944e-05, "loss": 2.5224, "step": 198410 }, { "epoch": 0.35, "learning_rate": 3.269896797190261e-05, "loss": 2.4124, "step": 198420 }, { "epoch": 0.35, "learning_rate": 3.2698096031975785e-05, "loss": 2.4789, "step": 198430 }, { "epoch": 0.35, "learning_rate": 3.2697224092048956e-05, "loss": 2.4617, "step": 198440 }, { "epoch": 0.35, "learning_rate": 3.2696352152122126e-05, "loss": 2.4195, "step": 198450 }, { "epoch": 0.35, "learning_rate": 3.26954802121953e-05, "loss": 2.4181, "step": 198460 }, { "epoch": 0.35, "learning_rate": 3.2694608272268474e-05, "loss": 2.3752, "step": 198470 }, { "epoch": 0.35, "learning_rate": 3.269373633234165e-05, "loss": 2.4485, "step": 198480 }, { "epoch": 0.35, "learning_rate": 3.269286439241482e-05, "loss": 2.5333, "step": 198490 }, { "epoch": 0.35, "learning_rate": 3.2691992452488e-05, "loss": 2.5055, "step": 198500 }, { "epoch": 0.35, "learning_rate": 3.269112051256117e-05, "loss": 2.4167, "step": 198510 }, { "epoch": 0.35, "learning_rate": 3.269024857263434e-05, "loss": 2.325, "step": 198520 }, { "epoch": 0.35, "learning_rate": 3.2689376632707516e-05, "loss": 2.4221, "step": 198530 }, { "epoch": 0.35, "learning_rate": 3.268850469278069e-05, "loss": 2.3227, "step": 198540 }, { "epoch": 0.35, "learning_rate": 3.268763275285386e-05, "loss": 2.4009, "step": 198550 }, { "epoch": 0.35, "learning_rate": 3.2686760812927034e-05, "loss": 2.4924, "step": 198560 }, { "epoch": 0.35, "learning_rate": 3.268588887300021e-05, "loss": 2.4998, "step": 198570 }, { "epoch": 0.35, "learning_rate": 3.268501693307338e-05, "loss": 2.5625, "step": 198580 }, { "epoch": 0.35, "learning_rate": 3.268414499314655e-05, "loss": 2.5713, "step": 198590 }, { "epoch": 0.35, "learning_rate": 3.268327305321973e-05, "loss": 2.3628, "step": 198600 }, { "epoch": 0.35, "learning_rate": 3.26824011132929e-05, "loss": 2.5879, "step": 198610 }, { "epoch": 0.35, "learning_rate": 3.268152917336607e-05, "loss": 2.3452, "step": 198620 }, { "epoch": 0.35, "learning_rate": 3.268065723343925e-05, "loss": 2.4237, "step": 198630 }, { "epoch": 0.35, "learning_rate": 3.2679785293512424e-05, "loss": 2.4769, "step": 198640 }, { "epoch": 0.35, "learning_rate": 3.2678913353585595e-05, "loss": 2.462, "step": 198650 }, { "epoch": 0.35, "learning_rate": 3.2678041413658765e-05, "loss": 2.4017, "step": 198660 }, { "epoch": 0.35, "learning_rate": 3.2677169473731936e-05, "loss": 2.3617, "step": 198670 }, { "epoch": 0.35, "learning_rate": 3.267629753380511e-05, "loss": 2.5034, "step": 198680 }, { "epoch": 0.35, "learning_rate": 3.267542559387828e-05, "loss": 2.5002, "step": 198690 }, { "epoch": 0.35, "learning_rate": 3.2674553653951453e-05, "loss": 2.4398, "step": 198700 }, { "epoch": 0.35, "learning_rate": 3.267368171402464e-05, "loss": 2.5269, "step": 198710 }, { "epoch": 0.35, "learning_rate": 3.267280977409781e-05, "loss": 2.4625, "step": 198720 }, { "epoch": 0.35, "learning_rate": 3.267193783417098e-05, "loss": 2.4227, "step": 198730 }, { "epoch": 0.35, "learning_rate": 3.267106589424415e-05, "loss": 2.4081, "step": 198740 }, { "epoch": 0.35, "learning_rate": 3.2670193954317326e-05, "loss": 2.4563, "step": 198750 }, { "epoch": 0.35, "learning_rate": 3.2669322014390496e-05, "loss": 2.3753, "step": 198760 }, { "epoch": 0.35, "learning_rate": 3.2668450074463666e-05, "loss": 2.4041, "step": 198770 }, { "epoch": 0.35, "learning_rate": 3.2667578134536844e-05, "loss": 2.5012, "step": 198780 }, { "epoch": 0.35, "learning_rate": 3.266670619461002e-05, "loss": 2.4334, "step": 198790 }, { "epoch": 0.35, "learning_rate": 3.266583425468319e-05, "loss": 2.3591, "step": 198800 }, { "epoch": 0.35, "learning_rate": 3.266496231475636e-05, "loss": 2.4966, "step": 198810 }, { "epoch": 0.35, "learning_rate": 3.266409037482954e-05, "loss": 2.374, "step": 198820 }, { "epoch": 0.35, "learning_rate": 3.266321843490271e-05, "loss": 2.5311, "step": 198830 }, { "epoch": 0.35, "learning_rate": 3.266234649497588e-05, "loss": 2.4285, "step": 198840 }, { "epoch": 0.35, "learning_rate": 3.266147455504906e-05, "loss": 2.4086, "step": 198850 }, { "epoch": 0.35, "learning_rate": 3.2660602615122234e-05, "loss": 2.4313, "step": 198860 }, { "epoch": 0.35, "learning_rate": 3.2659730675195404e-05, "loss": 2.5595, "step": 198870 }, { "epoch": 0.35, "learning_rate": 3.2658858735268575e-05, "loss": 2.4121, "step": 198880 }, { "epoch": 0.35, "learning_rate": 3.265798679534175e-05, "loss": 2.4785, "step": 198890 }, { "epoch": 0.35, "learning_rate": 3.265711485541492e-05, "loss": 2.4694, "step": 198900 }, { "epoch": 0.35, "learning_rate": 3.265624291548809e-05, "loss": 2.5109, "step": 198910 }, { "epoch": 0.35, "learning_rate": 3.265537097556127e-05, "loss": 2.3871, "step": 198920 }, { "epoch": 0.35, "learning_rate": 3.265449903563445e-05, "loss": 2.4365, "step": 198930 }, { "epoch": 0.35, "learning_rate": 3.265362709570762e-05, "loss": 2.3069, "step": 198940 }, { "epoch": 0.35, "learning_rate": 3.265275515578079e-05, "loss": 2.4487, "step": 198950 }, { "epoch": 0.35, "learning_rate": 3.2651883215853965e-05, "loss": 2.4408, "step": 198960 }, { "epoch": 0.35, "learning_rate": 3.2651011275927135e-05, "loss": 2.4553, "step": 198970 }, { "epoch": 0.35, "learning_rate": 3.2650139336000305e-05, "loss": 2.4517, "step": 198980 }, { "epoch": 0.35, "learning_rate": 3.264926739607348e-05, "loss": 2.4025, "step": 198990 }, { "epoch": 0.35, "learning_rate": 3.264839545614666e-05, "loss": 2.5362, "step": 199000 }, { "epoch": 0.35, "learning_rate": 3.264752351621983e-05, "loss": 2.3784, "step": 199010 }, { "epoch": 0.35, "learning_rate": 3.2646651576293e-05, "loss": 2.4592, "step": 199020 }, { "epoch": 0.35, "learning_rate": 3.264577963636618e-05, "loss": 2.3538, "step": 199030 }, { "epoch": 0.35, "learning_rate": 3.264490769643935e-05, "loss": 2.3656, "step": 199040 }, { "epoch": 0.35, "learning_rate": 3.264403575651252e-05, "loss": 2.3562, "step": 199050 }, { "epoch": 0.35, "learning_rate": 3.2643163816585696e-05, "loss": 2.4429, "step": 199060 }, { "epoch": 0.35, "learning_rate": 3.2642291876658866e-05, "loss": 2.4409, "step": 199070 }, { "epoch": 0.35, "learning_rate": 3.264141993673204e-05, "loss": 2.3889, "step": 199080 }, { "epoch": 0.35, "learning_rate": 3.2640547996805214e-05, "loss": 2.4449, "step": 199090 }, { "epoch": 0.35, "learning_rate": 3.263967605687839e-05, "loss": 2.3462, "step": 199100 }, { "epoch": 0.35, "learning_rate": 3.263880411695156e-05, "loss": 2.3999, "step": 199110 }, { "epoch": 0.35, "learning_rate": 3.263793217702473e-05, "loss": 2.4371, "step": 199120 }, { "epoch": 0.35, "learning_rate": 3.26370602370979e-05, "loss": 2.3326, "step": 199130 }, { "epoch": 0.35, "learning_rate": 3.263618829717108e-05, "loss": 2.299, "step": 199140 }, { "epoch": 0.35, "learning_rate": 3.2635316357244256e-05, "loss": 2.2778, "step": 199150 }, { "epoch": 0.35, "learning_rate": 3.2634444417317427e-05, "loss": 2.4341, "step": 199160 }, { "epoch": 0.35, "learning_rate": 3.2633572477390604e-05, "loss": 2.3902, "step": 199170 }, { "epoch": 0.35, "learning_rate": 3.2632700537463774e-05, "loss": 2.4315, "step": 199180 }, { "epoch": 0.35, "learning_rate": 3.2631828597536944e-05, "loss": 2.5137, "step": 199190 }, { "epoch": 0.35, "learning_rate": 3.2630956657610115e-05, "loss": 2.4676, "step": 199200 }, { "epoch": 0.35, "learning_rate": 3.263008471768329e-05, "loss": 2.4558, "step": 199210 }, { "epoch": 0.35, "learning_rate": 3.262921277775646e-05, "loss": 2.5041, "step": 199220 }, { "epoch": 0.35, "learning_rate": 3.262834083782964e-05, "loss": 2.5027, "step": 199230 }, { "epoch": 0.35, "learning_rate": 3.262746889790281e-05, "loss": 2.4124, "step": 199240 }, { "epoch": 0.35, "learning_rate": 3.262659695797599e-05, "loss": 2.37, "step": 199250 }, { "epoch": 0.35, "learning_rate": 3.262572501804916e-05, "loss": 2.3537, "step": 199260 }, { "epoch": 0.35, "learning_rate": 3.262485307812233e-05, "loss": 2.2568, "step": 199270 }, { "epoch": 0.35, "learning_rate": 3.2623981138195505e-05, "loss": 2.4383, "step": 199280 }, { "epoch": 0.35, "learning_rate": 3.2623109198268675e-05, "loss": 2.416, "step": 199290 }, { "epoch": 0.35, "learning_rate": 3.262223725834185e-05, "loss": 2.4458, "step": 199300 }, { "epoch": 0.35, "learning_rate": 3.262136531841502e-05, "loss": 2.4909, "step": 199310 }, { "epoch": 0.35, "learning_rate": 3.26204933784882e-05, "loss": 2.3691, "step": 199320 }, { "epoch": 0.35, "learning_rate": 3.261962143856137e-05, "loss": 2.4178, "step": 199330 }, { "epoch": 0.35, "learning_rate": 3.261874949863454e-05, "loss": 2.4862, "step": 199340 }, { "epoch": 0.35, "learning_rate": 3.261787755870772e-05, "loss": 2.3762, "step": 199350 }, { "epoch": 0.35, "learning_rate": 3.261700561878089e-05, "loss": 2.4365, "step": 199360 }, { "epoch": 0.35, "learning_rate": 3.261613367885406e-05, "loss": 2.4009, "step": 199370 }, { "epoch": 0.35, "learning_rate": 3.2615261738927236e-05, "loss": 2.4796, "step": 199380 }, { "epoch": 0.35, "learning_rate": 3.261438979900041e-05, "loss": 2.3846, "step": 199390 }, { "epoch": 0.35, "learning_rate": 3.2613517859073584e-05, "loss": 2.3258, "step": 199400 }, { "epoch": 0.35, "learning_rate": 3.2612645919146754e-05, "loss": 2.376, "step": 199410 }, { "epoch": 0.35, "learning_rate": 3.261177397921993e-05, "loss": 2.4126, "step": 199420 }, { "epoch": 0.35, "learning_rate": 3.26109020392931e-05, "loss": 2.4482, "step": 199430 }, { "epoch": 0.35, "learning_rate": 3.261003009936627e-05, "loss": 2.3738, "step": 199440 }, { "epoch": 0.35, "learning_rate": 3.260915815943945e-05, "loss": 2.443, "step": 199450 }, { "epoch": 0.35, "learning_rate": 3.2608286219512626e-05, "loss": 2.402, "step": 199460 }, { "epoch": 0.35, "learning_rate": 3.2607414279585797e-05, "loss": 2.3742, "step": 199470 }, { "epoch": 0.35, "learning_rate": 3.260654233965897e-05, "loss": 2.4329, "step": 199480 }, { "epoch": 0.35, "learning_rate": 3.2605670399732144e-05, "loss": 2.3985, "step": 199490 }, { "epoch": 0.35, "learning_rate": 3.2604798459805314e-05, "loss": 2.4421, "step": 199500 }, { "epoch": 0.35, "learning_rate": 3.2603926519878485e-05, "loss": 2.5025, "step": 199510 }, { "epoch": 0.35, "learning_rate": 3.2603054579951655e-05, "loss": 2.2736, "step": 199520 }, { "epoch": 0.35, "learning_rate": 3.260218264002484e-05, "loss": 2.408, "step": 199530 }, { "epoch": 0.35, "learning_rate": 3.260131070009801e-05, "loss": 2.4409, "step": 199540 }, { "epoch": 0.35, "learning_rate": 3.260043876017118e-05, "loss": 2.3861, "step": 199550 }, { "epoch": 0.35, "learning_rate": 3.259956682024436e-05, "loss": 2.2761, "step": 199560 }, { "epoch": 0.35, "learning_rate": 3.259869488031753e-05, "loss": 2.3794, "step": 199570 }, { "epoch": 0.35, "learning_rate": 3.25978229403907e-05, "loss": 2.4682, "step": 199580 }, { "epoch": 0.35, "learning_rate": 3.259695100046387e-05, "loss": 2.4653, "step": 199590 }, { "epoch": 0.35, "learning_rate": 3.259607906053705e-05, "loss": 2.3939, "step": 199600 }, { "epoch": 0.35, "learning_rate": 3.259520712061022e-05, "loss": 2.4258, "step": 199610 }, { "epoch": 0.35, "learning_rate": 3.259433518068339e-05, "loss": 2.4438, "step": 199620 }, { "epoch": 0.35, "learning_rate": 3.259346324075656e-05, "loss": 2.3699, "step": 199630 }, { "epoch": 0.35, "learning_rate": 3.259259130082974e-05, "loss": 2.5553, "step": 199640 }, { "epoch": 0.35, "learning_rate": 3.259171936090291e-05, "loss": 2.4395, "step": 199650 }, { "epoch": 0.35, "learning_rate": 3.259084742097608e-05, "loss": 2.413, "step": 199660 }, { "epoch": 0.35, "learning_rate": 3.2589975481049265e-05, "loss": 2.3086, "step": 199670 }, { "epoch": 0.35, "learning_rate": 3.2589103541122436e-05, "loss": 2.4864, "step": 199680 }, { "epoch": 0.35, "learning_rate": 3.2588231601195606e-05, "loss": 2.4191, "step": 199690 }, { "epoch": 0.35, "learning_rate": 3.2587359661268776e-05, "loss": 2.3275, "step": 199700 }, { "epoch": 0.35, "learning_rate": 3.2586487721341953e-05, "loss": 2.4964, "step": 199710 }, { "epoch": 0.35, "learning_rate": 3.2585615781415124e-05, "loss": 2.4897, "step": 199720 }, { "epoch": 0.35, "learning_rate": 3.2584743841488294e-05, "loss": 2.4301, "step": 199730 }, { "epoch": 0.35, "learning_rate": 3.258387190156147e-05, "loss": 2.4251, "step": 199740 }, { "epoch": 0.35, "learning_rate": 3.258299996163465e-05, "loss": 2.3386, "step": 199750 }, { "epoch": 0.35, "learning_rate": 3.258212802170782e-05, "loss": 2.471, "step": 199760 }, { "epoch": 0.35, "learning_rate": 3.258125608178099e-05, "loss": 2.2313, "step": 199770 }, { "epoch": 0.35, "learning_rate": 3.2580384141854166e-05, "loss": 2.3081, "step": 199780 }, { "epoch": 0.35, "learning_rate": 3.257951220192734e-05, "loss": 2.4874, "step": 199790 }, { "epoch": 0.35, "learning_rate": 3.257864026200051e-05, "loss": 2.3451, "step": 199800 }, { "epoch": 0.35, "learning_rate": 3.2577768322073684e-05, "loss": 2.4659, "step": 199810 }, { "epoch": 0.35, "learning_rate": 3.257689638214686e-05, "loss": 2.3594, "step": 199820 }, { "epoch": 0.35, "learning_rate": 3.257602444222003e-05, "loss": 2.3494, "step": 199830 }, { "epoch": 0.35, "learning_rate": 3.25751525022932e-05, "loss": 2.2746, "step": 199840 }, { "epoch": 0.35, "learning_rate": 3.257428056236638e-05, "loss": 2.4961, "step": 199850 }, { "epoch": 0.35, "learning_rate": 3.257340862243955e-05, "loss": 2.3841, "step": 199860 }, { "epoch": 0.35, "learning_rate": 3.257253668251272e-05, "loss": 2.4391, "step": 199870 }, { "epoch": 0.35, "learning_rate": 3.25716647425859e-05, "loss": 2.3875, "step": 199880 }, { "epoch": 0.35, "learning_rate": 3.257079280265907e-05, "loss": 2.5286, "step": 199890 }, { "epoch": 0.35, "learning_rate": 3.2569920862732245e-05, "loss": 2.294, "step": 199900 }, { "epoch": 0.35, "learning_rate": 3.2569048922805415e-05, "loss": 2.4811, "step": 199910 }, { "epoch": 0.35, "learning_rate": 3.256817698287859e-05, "loss": 2.5192, "step": 199920 }, { "epoch": 0.35, "learning_rate": 3.256730504295176e-05, "loss": 2.353, "step": 199930 }, { "epoch": 0.35, "learning_rate": 3.256643310302493e-05, "loss": 2.3902, "step": 199940 }, { "epoch": 0.35, "learning_rate": 3.256556116309811e-05, "loss": 2.4699, "step": 199950 }, { "epoch": 0.35, "learning_rate": 3.256468922317128e-05, "loss": 2.4408, "step": 199960 }, { "epoch": 0.35, "learning_rate": 3.256381728324446e-05, "loss": 2.4956, "step": 199970 }, { "epoch": 0.35, "learning_rate": 3.256294534331763e-05, "loss": 2.4474, "step": 199980 }, { "epoch": 0.35, "learning_rate": 3.2562073403390805e-05, "loss": 2.4985, "step": 199990 }, { "epoch": 0.35, "learning_rate": 3.2561201463463976e-05, "loss": 2.3258, "step": 200000 }, { "epoch": 0.35, "learning_rate": 3.2560329523537146e-05, "loss": 2.375, "step": 200010 }, { "epoch": 0.35, "learning_rate": 3.2559457583610317e-05, "loss": 2.4304, "step": 200020 }, { "epoch": 0.35, "learning_rate": 3.2558585643683494e-05, "loss": 2.5263, "step": 200030 }, { "epoch": 0.35, "learning_rate": 3.2557713703756664e-05, "loss": 2.4025, "step": 200040 }, { "epoch": 0.35, "learning_rate": 3.255684176382984e-05, "loss": 2.4592, "step": 200050 }, { "epoch": 0.35, "learning_rate": 3.255596982390302e-05, "loss": 2.4198, "step": 200060 }, { "epoch": 0.35, "learning_rate": 3.255509788397619e-05, "loss": 2.4058, "step": 200070 }, { "epoch": 0.35, "learning_rate": 3.255422594404936e-05, "loss": 2.3121, "step": 200080 }, { "epoch": 0.35, "learning_rate": 3.255335400412253e-05, "loss": 2.4499, "step": 200090 }, { "epoch": 0.35, "learning_rate": 3.255248206419571e-05, "loss": 2.3441, "step": 200100 }, { "epoch": 0.35, "learning_rate": 3.255161012426888e-05, "loss": 2.3203, "step": 200110 }, { "epoch": 0.35, "learning_rate": 3.2550738184342054e-05, "loss": 2.3759, "step": 200120 }, { "epoch": 0.35, "learning_rate": 3.2549866244415225e-05, "loss": 2.3744, "step": 200130 }, { "epoch": 0.35, "learning_rate": 3.25489943044884e-05, "loss": 2.3382, "step": 200140 }, { "epoch": 0.35, "learning_rate": 3.254812236456157e-05, "loss": 2.4322, "step": 200150 }, { "epoch": 0.35, "learning_rate": 3.254725042463474e-05, "loss": 2.4109, "step": 200160 }, { "epoch": 0.35, "learning_rate": 3.254637848470792e-05, "loss": 2.3789, "step": 200170 }, { "epoch": 0.35, "learning_rate": 3.254550654478109e-05, "loss": 2.424, "step": 200180 }, { "epoch": 0.35, "learning_rate": 3.254463460485427e-05, "loss": 2.3609, "step": 200190 }, { "epoch": 0.35, "learning_rate": 3.254376266492744e-05, "loss": 2.4249, "step": 200200 }, { "epoch": 0.35, "learning_rate": 3.2542890725000615e-05, "loss": 2.3976, "step": 200210 }, { "epoch": 0.35, "learning_rate": 3.2542018785073785e-05, "loss": 2.4664, "step": 200220 }, { "epoch": 0.35, "learning_rate": 3.2541146845146956e-05, "loss": 2.5167, "step": 200230 }, { "epoch": 0.35, "learning_rate": 3.254027490522013e-05, "loss": 2.4559, "step": 200240 }, { "epoch": 0.35, "learning_rate": 3.25394029652933e-05, "loss": 2.4562, "step": 200250 }, { "epoch": 0.35, "learning_rate": 3.2538531025366474e-05, "loss": 2.4423, "step": 200260 }, { "epoch": 0.35, "learning_rate": 3.253765908543965e-05, "loss": 2.3411, "step": 200270 }, { "epoch": 0.35, "learning_rate": 3.253678714551283e-05, "loss": 2.4759, "step": 200280 }, { "epoch": 0.35, "learning_rate": 3.2535915205586e-05, "loss": 2.4588, "step": 200290 }, { "epoch": 0.35, "learning_rate": 3.253504326565917e-05, "loss": 2.4729, "step": 200300 }, { "epoch": 0.35, "learning_rate": 3.2534171325732346e-05, "loss": 2.5079, "step": 200310 }, { "epoch": 0.35, "learning_rate": 3.2533299385805516e-05, "loss": 2.3768, "step": 200320 }, { "epoch": 0.35, "learning_rate": 3.2532427445878687e-05, "loss": 2.4536, "step": 200330 }, { "epoch": 0.35, "learning_rate": 3.2531555505951864e-05, "loss": 2.4222, "step": 200340 }, { "epoch": 0.35, "learning_rate": 3.253068356602504e-05, "loss": 2.4645, "step": 200350 }, { "epoch": 0.35, "learning_rate": 3.252981162609821e-05, "loss": 2.4242, "step": 200360 }, { "epoch": 0.35, "learning_rate": 3.252893968617138e-05, "loss": 2.3308, "step": 200370 }, { "epoch": 0.35, "learning_rate": 3.252806774624456e-05, "loss": 2.5865, "step": 200380 }, { "epoch": 0.35, "learning_rate": 3.252719580631773e-05, "loss": 2.4242, "step": 200390 }, { "epoch": 0.35, "learning_rate": 3.25263238663909e-05, "loss": 2.4043, "step": 200400 }, { "epoch": 0.35, "learning_rate": 3.252545192646408e-05, "loss": 2.3827, "step": 200410 }, { "epoch": 0.35, "learning_rate": 3.2524579986537254e-05, "loss": 2.492, "step": 200420 }, { "epoch": 0.35, "learning_rate": 3.2523708046610424e-05, "loss": 2.4153, "step": 200430 }, { "epoch": 0.35, "learning_rate": 3.2522836106683595e-05, "loss": 2.4152, "step": 200440 }, { "epoch": 0.35, "learning_rate": 3.252196416675677e-05, "loss": 2.4897, "step": 200450 }, { "epoch": 0.35, "learning_rate": 3.252109222682994e-05, "loss": 2.4158, "step": 200460 }, { "epoch": 0.35, "learning_rate": 3.252022028690311e-05, "loss": 2.3367, "step": 200470 }, { "epoch": 0.35, "learning_rate": 3.251934834697628e-05, "loss": 2.4927, "step": 200480 }, { "epoch": 0.35, "learning_rate": 3.251847640704947e-05, "loss": 2.3526, "step": 200490 }, { "epoch": 0.35, "learning_rate": 3.251760446712264e-05, "loss": 2.4911, "step": 200500 }, { "epoch": 0.35, "learning_rate": 3.251673252719581e-05, "loss": 2.387, "step": 200510 }, { "epoch": 0.35, "learning_rate": 3.2515860587268985e-05, "loss": 2.579, "step": 200520 }, { "epoch": 0.35, "learning_rate": 3.2514988647342155e-05, "loss": 2.3701, "step": 200530 }, { "epoch": 0.35, "learning_rate": 3.2514116707415326e-05, "loss": 2.4414, "step": 200540 }, { "epoch": 0.35, "learning_rate": 3.2513244767488496e-05, "loss": 2.4518, "step": 200550 }, { "epoch": 0.35, "learning_rate": 3.251237282756167e-05, "loss": 2.3626, "step": 200560 }, { "epoch": 0.35, "learning_rate": 3.251150088763485e-05, "loss": 2.4489, "step": 200570 }, { "epoch": 0.35, "learning_rate": 3.251062894770802e-05, "loss": 2.4973, "step": 200580 }, { "epoch": 0.35, "learning_rate": 3.250975700778119e-05, "loss": 2.3838, "step": 200590 }, { "epoch": 0.35, "learning_rate": 3.250888506785437e-05, "loss": 2.4427, "step": 200600 }, { "epoch": 0.35, "learning_rate": 3.250801312792754e-05, "loss": 2.5204, "step": 200610 }, { "epoch": 0.35, "learning_rate": 3.250714118800071e-05, "loss": 2.3146, "step": 200620 }, { "epoch": 0.35, "learning_rate": 3.2506269248073886e-05, "loss": 2.4796, "step": 200630 }, { "epoch": 0.35, "learning_rate": 3.250539730814706e-05, "loss": 2.4298, "step": 200640 }, { "epoch": 0.35, "learning_rate": 3.2504525368220234e-05, "loss": 2.3469, "step": 200650 }, { "epoch": 0.35, "learning_rate": 3.2503653428293404e-05, "loss": 2.4688, "step": 200660 }, { "epoch": 0.35, "learning_rate": 3.250278148836658e-05, "loss": 2.4075, "step": 200670 }, { "epoch": 0.35, "learning_rate": 3.250190954843975e-05, "loss": 2.4646, "step": 200680 }, { "epoch": 0.35, "learning_rate": 3.250103760851292e-05, "loss": 2.4594, "step": 200690 }, { "epoch": 0.35, "learning_rate": 3.25001656685861e-05, "loss": 2.4527, "step": 200700 }, { "epoch": 0.35, "learning_rate": 3.249929372865927e-05, "loss": 2.3821, "step": 200710 }, { "epoch": 0.35, "learning_rate": 3.2498421788732447e-05, "loss": 2.4244, "step": 200720 }, { "epoch": 0.35, "learning_rate": 3.249754984880562e-05, "loss": 2.4261, "step": 200730 }, { "epoch": 0.35, "learning_rate": 3.2496677908878794e-05, "loss": 2.3534, "step": 200740 }, { "epoch": 0.35, "learning_rate": 3.2495805968951965e-05, "loss": 2.5238, "step": 200750 }, { "epoch": 0.35, "learning_rate": 3.2494934029025135e-05, "loss": 2.4096, "step": 200760 }, { "epoch": 0.35, "learning_rate": 3.249406208909831e-05, "loss": 2.4505, "step": 200770 }, { "epoch": 0.35, "learning_rate": 3.249319014917148e-05, "loss": 2.5289, "step": 200780 }, { "epoch": 0.35, "learning_rate": 3.249231820924466e-05, "loss": 2.3185, "step": 200790 }, { "epoch": 0.35, "learning_rate": 3.249144626931783e-05, "loss": 2.4866, "step": 200800 }, { "epoch": 0.35, "learning_rate": 3.249057432939101e-05, "loss": 2.483, "step": 200810 }, { "epoch": 0.35, "learning_rate": 3.248970238946418e-05, "loss": 2.4259, "step": 200820 }, { "epoch": 0.35, "learning_rate": 3.248883044953735e-05, "loss": 2.5148, "step": 200830 }, { "epoch": 0.35, "learning_rate": 3.2487958509610525e-05, "loss": 2.4259, "step": 200840 }, { "epoch": 0.35, "learning_rate": 3.2487086569683695e-05, "loss": 2.3345, "step": 200850 }, { "epoch": 0.35, "learning_rate": 3.248621462975687e-05, "loss": 2.3989, "step": 200860 }, { "epoch": 0.35, "learning_rate": 3.248534268983004e-05, "loss": 2.4234, "step": 200870 }, { "epoch": 0.35, "learning_rate": 3.248447074990322e-05, "loss": 2.3935, "step": 200880 }, { "epoch": 0.35, "learning_rate": 3.248359880997639e-05, "loss": 2.3581, "step": 200890 }, { "epoch": 0.35, "learning_rate": 3.248272687004956e-05, "loss": 2.3465, "step": 200900 }, { "epoch": 0.35, "learning_rate": 3.248185493012274e-05, "loss": 2.4603, "step": 200910 }, { "epoch": 0.35, "learning_rate": 3.248098299019591e-05, "loss": 2.3332, "step": 200920 }, { "epoch": 0.35, "learning_rate": 3.248011105026908e-05, "loss": 2.3961, "step": 200930 }, { "epoch": 0.35, "learning_rate": 3.2479239110342256e-05, "loss": 2.3703, "step": 200940 }, { "epoch": 0.35, "learning_rate": 3.247836717041543e-05, "loss": 2.4118, "step": 200950 }, { "epoch": 0.35, "learning_rate": 3.2477495230488604e-05, "loss": 2.49, "step": 200960 }, { "epoch": 0.35, "learning_rate": 3.2476623290561774e-05, "loss": 2.4424, "step": 200970 }, { "epoch": 0.35, "learning_rate": 3.2475751350634944e-05, "loss": 2.3982, "step": 200980 }, { "epoch": 0.35, "learning_rate": 3.247487941070812e-05, "loss": 2.3806, "step": 200990 }, { "epoch": 0.35, "learning_rate": 3.247400747078129e-05, "loss": 2.3538, "step": 201000 }, { "epoch": 0.35, "learning_rate": 3.247313553085447e-05, "loss": 2.4384, "step": 201010 }, { "epoch": 0.35, "learning_rate": 3.2472263590927646e-05, "loss": 2.4275, "step": 201020 }, { "epoch": 0.35, "learning_rate": 3.2471391651000817e-05, "loss": 2.4233, "step": 201030 }, { "epoch": 0.35, "learning_rate": 3.247051971107399e-05, "loss": 2.4223, "step": 201040 }, { "epoch": 0.35, "learning_rate": 3.246964777114716e-05, "loss": 2.3752, "step": 201050 }, { "epoch": 0.35, "learning_rate": 3.2468775831220334e-05, "loss": 2.3823, "step": 201060 }, { "epoch": 0.35, "learning_rate": 3.2467903891293505e-05, "loss": 2.4281, "step": 201070 }, { "epoch": 0.35, "learning_rate": 3.2467031951366675e-05, "loss": 2.4507, "step": 201080 }, { "epoch": 0.35, "learning_rate": 3.246616001143985e-05, "loss": 2.4033, "step": 201090 }, { "epoch": 0.35, "learning_rate": 3.246528807151303e-05, "loss": 2.4424, "step": 201100 }, { "epoch": 0.35, "learning_rate": 3.24644161315862e-05, "loss": 2.4155, "step": 201110 }, { "epoch": 0.35, "learning_rate": 3.246354419165937e-05, "loss": 2.4169, "step": 201120 }, { "epoch": 0.35, "learning_rate": 3.246267225173255e-05, "loss": 2.3678, "step": 201130 }, { "epoch": 0.35, "learning_rate": 3.246180031180572e-05, "loss": 2.3108, "step": 201140 }, { "epoch": 0.35, "learning_rate": 3.246092837187889e-05, "loss": 2.5288, "step": 201150 }, { "epoch": 0.35, "learning_rate": 3.2460056431952065e-05, "loss": 2.3546, "step": 201160 }, { "epoch": 0.35, "learning_rate": 3.245918449202524e-05, "loss": 2.3813, "step": 201170 }, { "epoch": 0.35, "learning_rate": 3.245831255209841e-05, "loss": 2.3928, "step": 201180 }, { "epoch": 0.35, "learning_rate": 3.245744061217158e-05, "loss": 2.3716, "step": 201190 }, { "epoch": 0.35, "learning_rate": 3.245656867224476e-05, "loss": 2.4358, "step": 201200 }, { "epoch": 0.35, "learning_rate": 3.245569673231793e-05, "loss": 2.3645, "step": 201210 }, { "epoch": 0.35, "learning_rate": 3.24548247923911e-05, "loss": 2.4729, "step": 201220 }, { "epoch": 0.35, "learning_rate": 3.245395285246428e-05, "loss": 2.3615, "step": 201230 }, { "epoch": 0.35, "learning_rate": 3.2453080912537456e-05, "loss": 2.4312, "step": 201240 }, { "epoch": 0.35, "learning_rate": 3.2452208972610626e-05, "loss": 2.3032, "step": 201250 }, { "epoch": 0.35, "learning_rate": 3.2451337032683796e-05, "loss": 2.4882, "step": 201260 }, { "epoch": 0.35, "learning_rate": 3.2450465092756973e-05, "loss": 2.513, "step": 201270 }, { "epoch": 0.35, "learning_rate": 3.2449593152830144e-05, "loss": 2.4526, "step": 201280 }, { "epoch": 0.35, "learning_rate": 3.2448721212903314e-05, "loss": 2.4917, "step": 201290 }, { "epoch": 0.35, "learning_rate": 3.244784927297649e-05, "loss": 2.3853, "step": 201300 }, { "epoch": 0.35, "learning_rate": 3.244697733304967e-05, "loss": 2.3954, "step": 201310 }, { "epoch": 0.35, "learning_rate": 3.244610539312284e-05, "loss": 2.4784, "step": 201320 }, { "epoch": 0.35, "learning_rate": 3.244523345319601e-05, "loss": 2.4022, "step": 201330 }, { "epoch": 0.35, "learning_rate": 3.2444361513269186e-05, "loss": 2.3918, "step": 201340 }, { "epoch": 0.35, "learning_rate": 3.244348957334236e-05, "loss": 2.4944, "step": 201350 }, { "epoch": 0.35, "learning_rate": 3.244261763341553e-05, "loss": 2.6049, "step": 201360 }, { "epoch": 0.35, "learning_rate": 3.24417456934887e-05, "loss": 2.5186, "step": 201370 }, { "epoch": 0.35, "learning_rate": 3.2440873753561875e-05, "loss": 2.4607, "step": 201380 }, { "epoch": 0.35, "learning_rate": 3.244000181363505e-05, "loss": 2.3236, "step": 201390 }, { "epoch": 0.35, "learning_rate": 3.243912987370822e-05, "loss": 2.3682, "step": 201400 }, { "epoch": 0.35, "learning_rate": 3.24382579337814e-05, "loss": 2.5258, "step": 201410 }, { "epoch": 0.35, "learning_rate": 3.243738599385457e-05, "loss": 2.3778, "step": 201420 }, { "epoch": 0.35, "learning_rate": 3.243651405392774e-05, "loss": 2.3834, "step": 201430 }, { "epoch": 0.35, "learning_rate": 3.243564211400091e-05, "loss": 2.4949, "step": 201440 }, { "epoch": 0.35, "learning_rate": 3.243477017407409e-05, "loss": 2.4027, "step": 201450 }, { "epoch": 0.35, "learning_rate": 3.2433898234147265e-05, "loss": 2.4303, "step": 201460 }, { "epoch": 0.35, "learning_rate": 3.2433026294220435e-05, "loss": 2.4754, "step": 201470 }, { "epoch": 0.35, "learning_rate": 3.2432154354293606e-05, "loss": 2.281, "step": 201480 }, { "epoch": 0.35, "learning_rate": 3.243128241436678e-05, "loss": 2.4382, "step": 201490 }, { "epoch": 0.35, "learning_rate": 3.243041047443995e-05, "loss": 2.2203, "step": 201500 }, { "epoch": 0.35, "learning_rate": 3.2429538534513124e-05, "loss": 2.4512, "step": 201510 }, { "epoch": 0.35, "learning_rate": 3.24286665945863e-05, "loss": 2.3811, "step": 201520 }, { "epoch": 0.35, "learning_rate": 3.242779465465948e-05, "loss": 2.3694, "step": 201530 }, { "epoch": 0.35, "learning_rate": 3.242692271473265e-05, "loss": 2.5255, "step": 201540 }, { "epoch": 0.35, "learning_rate": 3.242605077480582e-05, "loss": 2.4703, "step": 201550 }, { "epoch": 0.35, "learning_rate": 3.2425178834878996e-05, "loss": 2.5133, "step": 201560 }, { "epoch": 0.35, "learning_rate": 3.2424306894952166e-05, "loss": 2.3681, "step": 201570 }, { "epoch": 0.35, "learning_rate": 3.2423434955025337e-05, "loss": 2.3794, "step": 201580 }, { "epoch": 0.35, "learning_rate": 3.2422563015098514e-05, "loss": 2.4627, "step": 201590 }, { "epoch": 0.35, "learning_rate": 3.2421691075171684e-05, "loss": 2.4418, "step": 201600 }, { "epoch": 0.35, "learning_rate": 3.242081913524486e-05, "loss": 2.38, "step": 201610 }, { "epoch": 0.35, "learning_rate": 3.241994719531803e-05, "loss": 2.3085, "step": 201620 }, { "epoch": 0.35, "learning_rate": 3.241907525539121e-05, "loss": 2.4332, "step": 201630 }, { "epoch": 0.35, "learning_rate": 3.241820331546438e-05, "loss": 2.489, "step": 201640 }, { "epoch": 0.35, "learning_rate": 3.241733137553755e-05, "loss": 2.4621, "step": 201650 }, { "epoch": 0.35, "learning_rate": 3.241645943561073e-05, "loss": 2.3413, "step": 201660 }, { "epoch": 0.35, "learning_rate": 3.24155874956839e-05, "loss": 2.2316, "step": 201670 }, { "epoch": 0.35, "learning_rate": 3.2414715555757074e-05, "loss": 2.3554, "step": 201680 }, { "epoch": 0.35, "learning_rate": 3.2413843615830245e-05, "loss": 2.5251, "step": 201690 }, { "epoch": 0.35, "learning_rate": 3.241297167590342e-05, "loss": 2.3847, "step": 201700 }, { "epoch": 0.35, "learning_rate": 3.241209973597659e-05, "loss": 2.4042, "step": 201710 }, { "epoch": 0.35, "learning_rate": 3.241122779604976e-05, "loss": 2.3598, "step": 201720 }, { "epoch": 0.35, "learning_rate": 3.241035585612294e-05, "loss": 2.4446, "step": 201730 }, { "epoch": 0.35, "learning_rate": 3.240948391619611e-05, "loss": 2.3335, "step": 201740 }, { "epoch": 0.35, "learning_rate": 3.240861197626928e-05, "loss": 2.4473, "step": 201750 }, { "epoch": 0.35, "learning_rate": 3.240774003634246e-05, "loss": 2.3514, "step": 201760 }, { "epoch": 0.35, "learning_rate": 3.2406868096415635e-05, "loss": 2.4963, "step": 201770 }, { "epoch": 0.35, "learning_rate": 3.2405996156488805e-05, "loss": 2.4546, "step": 201780 }, { "epoch": 0.35, "learning_rate": 3.2405124216561976e-05, "loss": 2.4747, "step": 201790 }, { "epoch": 0.35, "learning_rate": 3.240425227663515e-05, "loss": 2.4181, "step": 201800 }, { "epoch": 0.35, "learning_rate": 3.240338033670832e-05, "loss": 2.4214, "step": 201810 }, { "epoch": 0.35, "learning_rate": 3.2402508396781494e-05, "loss": 2.4848, "step": 201820 }, { "epoch": 0.35, "learning_rate": 3.240163645685467e-05, "loss": 2.4386, "step": 201830 }, { "epoch": 0.35, "learning_rate": 3.240076451692785e-05, "loss": 2.3804, "step": 201840 }, { "epoch": 0.35, "learning_rate": 3.239989257700102e-05, "loss": 2.3736, "step": 201850 }, { "epoch": 0.35, "learning_rate": 3.239902063707419e-05, "loss": 2.4183, "step": 201860 }, { "epoch": 0.35, "learning_rate": 3.2398148697147366e-05, "loss": 2.4921, "step": 201870 }, { "epoch": 0.35, "learning_rate": 3.2397276757220536e-05, "loss": 2.4321, "step": 201880 }, { "epoch": 0.35, "learning_rate": 3.2396404817293707e-05, "loss": 2.4125, "step": 201890 }, { "epoch": 0.35, "learning_rate": 3.239553287736688e-05, "loss": 2.386, "step": 201900 }, { "epoch": 0.35, "learning_rate": 3.239466093744006e-05, "loss": 2.3718, "step": 201910 }, { "epoch": 0.35, "learning_rate": 3.239378899751323e-05, "loss": 2.4983, "step": 201920 }, { "epoch": 0.35, "learning_rate": 3.23929170575864e-05, "loss": 2.4627, "step": 201930 }, { "epoch": 0.35, "learning_rate": 3.239204511765957e-05, "loss": 2.4486, "step": 201940 }, { "epoch": 0.35, "learning_rate": 3.239117317773275e-05, "loss": 2.34, "step": 201950 }, { "epoch": 0.35, "learning_rate": 3.239030123780592e-05, "loss": 2.4307, "step": 201960 }, { "epoch": 0.35, "learning_rate": 3.238942929787909e-05, "loss": 2.3929, "step": 201970 }, { "epoch": 0.35, "learning_rate": 3.2388557357952274e-05, "loss": 2.4342, "step": 201980 }, { "epoch": 0.35, "learning_rate": 3.2387685418025444e-05, "loss": 2.2701, "step": 201990 }, { "epoch": 0.35, "learning_rate": 3.2386813478098615e-05, "loss": 2.3773, "step": 202000 }, { "epoch": 0.35, "learning_rate": 3.2385941538171785e-05, "loss": 2.2789, "step": 202010 }, { "epoch": 0.35, "learning_rate": 3.238506959824496e-05, "loss": 2.338, "step": 202020 }, { "epoch": 0.35, "learning_rate": 3.238419765831813e-05, "loss": 2.4533, "step": 202030 }, { "epoch": 0.35, "learning_rate": 3.23833257183913e-05, "loss": 2.4273, "step": 202040 }, { "epoch": 0.35, "learning_rate": 3.238245377846448e-05, "loss": 2.3155, "step": 202050 }, { "epoch": 0.35, "learning_rate": 3.238158183853766e-05, "loss": 2.3899, "step": 202060 }, { "epoch": 0.35, "learning_rate": 3.238070989861083e-05, "loss": 2.4386, "step": 202070 }, { "epoch": 0.35, "learning_rate": 3.2379837958684e-05, "loss": 2.4283, "step": 202080 }, { "epoch": 0.35, "learning_rate": 3.2378966018757175e-05, "loss": 2.4419, "step": 202090 }, { "epoch": 0.35, "learning_rate": 3.2378094078830346e-05, "loss": 2.4818, "step": 202100 }, { "epoch": 0.35, "learning_rate": 3.2377222138903516e-05, "loss": 2.418, "step": 202110 }, { "epoch": 0.35, "learning_rate": 3.237635019897669e-05, "loss": 2.4851, "step": 202120 }, { "epoch": 0.35, "learning_rate": 3.237547825904987e-05, "loss": 2.4878, "step": 202130 }, { "epoch": 0.35, "learning_rate": 3.237460631912304e-05, "loss": 2.3674, "step": 202140 }, { "epoch": 0.35, "learning_rate": 3.237373437919621e-05, "loss": 2.314, "step": 202150 }, { "epoch": 0.35, "learning_rate": 3.237286243926939e-05, "loss": 2.4007, "step": 202160 }, { "epoch": 0.35, "learning_rate": 3.237199049934256e-05, "loss": 2.4175, "step": 202170 }, { "epoch": 0.35, "learning_rate": 3.237111855941573e-05, "loss": 2.4046, "step": 202180 }, { "epoch": 0.35, "learning_rate": 3.2370246619488906e-05, "loss": 2.3138, "step": 202190 }, { "epoch": 0.35, "learning_rate": 3.236937467956208e-05, "loss": 2.4456, "step": 202200 }, { "epoch": 0.35, "learning_rate": 3.2368502739635254e-05, "loss": 2.4531, "step": 202210 }, { "epoch": 0.35, "learning_rate": 3.2367630799708424e-05, "loss": 2.4124, "step": 202220 }, { "epoch": 0.35, "learning_rate": 3.23667588597816e-05, "loss": 2.3967, "step": 202230 }, { "epoch": 0.35, "learning_rate": 3.236588691985477e-05, "loss": 2.4926, "step": 202240 }, { "epoch": 0.35, "learning_rate": 3.236501497992794e-05, "loss": 2.3153, "step": 202250 }, { "epoch": 0.35, "learning_rate": 3.236414304000112e-05, "loss": 2.4156, "step": 202260 }, { "epoch": 0.35, "learning_rate": 3.236327110007429e-05, "loss": 2.4385, "step": 202270 }, { "epoch": 0.35, "learning_rate": 3.2362399160147467e-05, "loss": 2.3051, "step": 202280 }, { "epoch": 0.35, "learning_rate": 3.236152722022064e-05, "loss": 2.4096, "step": 202290 }, { "epoch": 0.35, "learning_rate": 3.2360655280293814e-05, "loss": 2.3712, "step": 202300 }, { "epoch": 0.35, "learning_rate": 3.2359783340366985e-05, "loss": 2.5039, "step": 202310 }, { "epoch": 0.35, "learning_rate": 3.2358911400440155e-05, "loss": 2.3538, "step": 202320 }, { "epoch": 0.35, "learning_rate": 3.2358039460513325e-05, "loss": 2.3654, "step": 202330 }, { "epoch": 0.35, "learning_rate": 3.23571675205865e-05, "loss": 2.4158, "step": 202340 }, { "epoch": 0.35, "learning_rate": 3.235629558065968e-05, "loss": 2.295, "step": 202350 }, { "epoch": 0.35, "learning_rate": 3.235542364073285e-05, "loss": 2.37, "step": 202360 }, { "epoch": 0.35, "learning_rate": 3.235455170080603e-05, "loss": 2.4822, "step": 202370 }, { "epoch": 0.35, "learning_rate": 3.23536797608792e-05, "loss": 2.366, "step": 202380 }, { "epoch": 0.35, "learning_rate": 3.235280782095237e-05, "loss": 2.359, "step": 202390 }, { "epoch": 0.35, "learning_rate": 3.235193588102554e-05, "loss": 2.4812, "step": 202400 }, { "epoch": 0.35, "learning_rate": 3.2351063941098715e-05, "loss": 2.4373, "step": 202410 }, { "epoch": 0.35, "learning_rate": 3.2350192001171886e-05, "loss": 2.3575, "step": 202420 }, { "epoch": 0.35, "learning_rate": 3.234932006124506e-05, "loss": 2.3987, "step": 202430 }, { "epoch": 0.35, "learning_rate": 3.234844812131823e-05, "loss": 2.553, "step": 202440 }, { "epoch": 0.35, "learning_rate": 3.234757618139141e-05, "loss": 2.3915, "step": 202450 }, { "epoch": 0.35, "learning_rate": 3.234670424146458e-05, "loss": 2.4228, "step": 202460 }, { "epoch": 0.35, "learning_rate": 3.234583230153775e-05, "loss": 2.4015, "step": 202470 }, { "epoch": 0.35, "learning_rate": 3.234496036161093e-05, "loss": 2.4981, "step": 202480 }, { "epoch": 0.35, "learning_rate": 3.23440884216841e-05, "loss": 2.3373, "step": 202490 }, { "epoch": 0.35, "learning_rate": 3.2343216481757276e-05, "loss": 2.3354, "step": 202500 }, { "epoch": 0.35, "learning_rate": 3.2342344541830446e-05, "loss": 2.4393, "step": 202510 }, { "epoch": 0.35, "learning_rate": 3.2341472601903624e-05, "loss": 2.4996, "step": 202520 }, { "epoch": 0.35, "learning_rate": 3.2340600661976794e-05, "loss": 2.3782, "step": 202530 }, { "epoch": 0.35, "learning_rate": 3.2339728722049964e-05, "loss": 2.4083, "step": 202540 }, { "epoch": 0.35, "learning_rate": 3.233885678212314e-05, "loss": 2.459, "step": 202550 }, { "epoch": 0.35, "learning_rate": 3.233798484219631e-05, "loss": 2.4184, "step": 202560 }, { "epoch": 0.35, "learning_rate": 3.233711290226948e-05, "loss": 2.3561, "step": 202570 }, { "epoch": 0.35, "learning_rate": 3.233624096234266e-05, "loss": 2.4403, "step": 202580 }, { "epoch": 0.35, "learning_rate": 3.2335369022415837e-05, "loss": 2.4345, "step": 202590 }, { "epoch": 0.35, "learning_rate": 3.233449708248901e-05, "loss": 2.3534, "step": 202600 }, { "epoch": 0.35, "learning_rate": 3.233362514256218e-05, "loss": 2.3854, "step": 202610 }, { "epoch": 0.35, "learning_rate": 3.2332753202635354e-05, "loss": 2.4893, "step": 202620 }, { "epoch": 0.35, "learning_rate": 3.2331881262708525e-05, "loss": 2.5185, "step": 202630 }, { "epoch": 0.35, "learning_rate": 3.2331009322781695e-05, "loss": 2.554, "step": 202640 }, { "epoch": 0.35, "learning_rate": 3.233013738285487e-05, "loss": 2.3962, "step": 202650 }, { "epoch": 0.35, "learning_rate": 3.232926544292805e-05, "loss": 2.4047, "step": 202660 }, { "epoch": 0.35, "learning_rate": 3.232839350300122e-05, "loss": 2.4358, "step": 202670 }, { "epoch": 0.35, "learning_rate": 3.232752156307439e-05, "loss": 2.4621, "step": 202680 }, { "epoch": 0.35, "learning_rate": 3.232664962314757e-05, "loss": 2.4004, "step": 202690 }, { "epoch": 0.35, "learning_rate": 3.232577768322074e-05, "loss": 2.3807, "step": 202700 }, { "epoch": 0.35, "learning_rate": 3.232490574329391e-05, "loss": 2.4454, "step": 202710 }, { "epoch": 0.35, "learning_rate": 3.2324033803367085e-05, "loss": 2.3777, "step": 202720 }, { "epoch": 0.35, "learning_rate": 3.232316186344026e-05, "loss": 2.4031, "step": 202730 }, { "epoch": 0.35, "learning_rate": 3.232228992351343e-05, "loss": 2.4452, "step": 202740 }, { "epoch": 0.35, "learning_rate": 3.23214179835866e-05, "loss": 2.4067, "step": 202750 }, { "epoch": 0.35, "learning_rate": 3.232054604365978e-05, "loss": 2.3668, "step": 202760 }, { "epoch": 0.35, "learning_rate": 3.231967410373295e-05, "loss": 2.4116, "step": 202770 }, { "epoch": 0.35, "learning_rate": 3.231880216380612e-05, "loss": 2.3657, "step": 202780 }, { "epoch": 0.35, "learning_rate": 3.231793022387929e-05, "loss": 2.3823, "step": 202790 }, { "epoch": 0.35, "learning_rate": 3.2317058283952476e-05, "loss": 2.5166, "step": 202800 }, { "epoch": 0.35, "learning_rate": 3.2316186344025646e-05, "loss": 2.4353, "step": 202810 }, { "epoch": 0.35, "learning_rate": 3.2315314404098816e-05, "loss": 2.4749, "step": 202820 }, { "epoch": 0.35, "learning_rate": 3.231444246417199e-05, "loss": 2.4003, "step": 202830 }, { "epoch": 0.35, "learning_rate": 3.2313570524245164e-05, "loss": 2.3324, "step": 202840 }, { "epoch": 0.35, "learning_rate": 3.2312698584318334e-05, "loss": 2.448, "step": 202850 }, { "epoch": 0.35, "learning_rate": 3.2311826644391505e-05, "loss": 2.3531, "step": 202860 }, { "epoch": 0.35, "learning_rate": 3.231095470446469e-05, "loss": 2.3562, "step": 202870 }, { "epoch": 0.35, "learning_rate": 3.231008276453786e-05, "loss": 2.429, "step": 202880 }, { "epoch": 0.35, "learning_rate": 3.230921082461103e-05, "loss": 2.4637, "step": 202890 }, { "epoch": 0.35, "learning_rate": 3.23083388846842e-05, "loss": 2.4482, "step": 202900 }, { "epoch": 0.35, "learning_rate": 3.230746694475738e-05, "loss": 2.2619, "step": 202910 }, { "epoch": 0.35, "learning_rate": 3.230659500483055e-05, "loss": 2.3817, "step": 202920 }, { "epoch": 0.35, "learning_rate": 3.230572306490372e-05, "loss": 2.4484, "step": 202930 }, { "epoch": 0.35, "learning_rate": 3.2304851124976895e-05, "loss": 2.4728, "step": 202940 }, { "epoch": 0.35, "learning_rate": 3.230397918505007e-05, "loss": 2.3688, "step": 202950 }, { "epoch": 0.35, "learning_rate": 3.230310724512324e-05, "loss": 2.2871, "step": 202960 }, { "epoch": 0.35, "learning_rate": 3.230223530519641e-05, "loss": 2.4209, "step": 202970 }, { "epoch": 0.35, "learning_rate": 3.230136336526959e-05, "loss": 2.3582, "step": 202980 }, { "epoch": 0.35, "learning_rate": 3.230049142534276e-05, "loss": 2.4804, "step": 202990 }, { "epoch": 0.35, "learning_rate": 3.229961948541593e-05, "loss": 2.4255, "step": 203000 }, { "epoch": 0.35, "learning_rate": 3.229874754548911e-05, "loss": 2.3366, "step": 203010 }, { "epoch": 0.35, "learning_rate": 3.2297875605562285e-05, "loss": 2.3974, "step": 203020 }, { "epoch": 0.35, "learning_rate": 3.2297003665635455e-05, "loss": 2.3461, "step": 203030 }, { "epoch": 0.35, "learning_rate": 3.2296131725708626e-05, "loss": 2.4049, "step": 203040 }, { "epoch": 0.35, "learning_rate": 3.22952597857818e-05, "loss": 2.4426, "step": 203050 }, { "epoch": 0.35, "learning_rate": 3.229438784585497e-05, "loss": 2.6098, "step": 203060 }, { "epoch": 0.35, "learning_rate": 3.2293515905928144e-05, "loss": 2.3895, "step": 203070 }, { "epoch": 0.35, "learning_rate": 3.229264396600132e-05, "loss": 2.4299, "step": 203080 }, { "epoch": 0.35, "learning_rate": 3.229177202607449e-05, "loss": 2.5059, "step": 203090 }, { "epoch": 0.35, "learning_rate": 3.229090008614767e-05, "loss": 2.4061, "step": 203100 }, { "epoch": 0.35, "learning_rate": 3.229002814622084e-05, "loss": 2.4935, "step": 203110 }, { "epoch": 0.35, "learning_rate": 3.2289156206294016e-05, "loss": 2.2173, "step": 203120 }, { "epoch": 0.35, "learning_rate": 3.2288284266367186e-05, "loss": 2.3327, "step": 203130 }, { "epoch": 0.35, "learning_rate": 3.2287412326440357e-05, "loss": 2.4351, "step": 203140 }, { "epoch": 0.35, "learning_rate": 3.2286540386513534e-05, "loss": 2.4924, "step": 203150 }, { "epoch": 0.35, "learning_rate": 3.2285668446586704e-05, "loss": 2.3331, "step": 203160 }, { "epoch": 0.35, "learning_rate": 3.228479650665988e-05, "loss": 2.4122, "step": 203170 }, { "epoch": 0.35, "learning_rate": 3.228392456673305e-05, "loss": 2.423, "step": 203180 }, { "epoch": 0.35, "learning_rate": 3.228305262680623e-05, "loss": 2.5257, "step": 203190 }, { "epoch": 0.35, "learning_rate": 3.22821806868794e-05, "loss": 2.4978, "step": 203200 }, { "epoch": 0.35, "learning_rate": 3.228130874695257e-05, "loss": 2.4109, "step": 203210 }, { "epoch": 0.35, "learning_rate": 3.228043680702575e-05, "loss": 2.3598, "step": 203220 }, { "epoch": 0.35, "learning_rate": 3.227956486709892e-05, "loss": 2.5092, "step": 203230 }, { "epoch": 0.35, "learning_rate": 3.227869292717209e-05, "loss": 2.3613, "step": 203240 }, { "epoch": 0.35, "learning_rate": 3.2277820987245265e-05, "loss": 2.3746, "step": 203250 }, { "epoch": 0.35, "learning_rate": 3.227694904731844e-05, "loss": 2.3131, "step": 203260 }, { "epoch": 0.35, "learning_rate": 3.227607710739161e-05, "loss": 2.5153, "step": 203270 }, { "epoch": 0.35, "learning_rate": 3.227520516746478e-05, "loss": 2.4182, "step": 203280 }, { "epoch": 0.35, "learning_rate": 3.227433322753795e-05, "loss": 2.4106, "step": 203290 }, { "epoch": 0.35, "learning_rate": 3.227346128761113e-05, "loss": 2.3502, "step": 203300 }, { "epoch": 0.35, "learning_rate": 3.22725893476843e-05, "loss": 2.401, "step": 203310 }, { "epoch": 0.35, "learning_rate": 3.227171740775748e-05, "loss": 2.418, "step": 203320 }, { "epoch": 0.35, "learning_rate": 3.2270845467830655e-05, "loss": 2.2494, "step": 203330 }, { "epoch": 0.35, "learning_rate": 3.2269973527903825e-05, "loss": 2.3566, "step": 203340 }, { "epoch": 0.35, "learning_rate": 3.2269101587976996e-05, "loss": 2.4247, "step": 203350 }, { "epoch": 0.35, "learning_rate": 3.2268229648050166e-05, "loss": 2.4335, "step": 203360 }, { "epoch": 0.35, "learning_rate": 3.226735770812334e-05, "loss": 2.3699, "step": 203370 }, { "epoch": 0.35, "learning_rate": 3.2266485768196514e-05, "loss": 2.4133, "step": 203380 }, { "epoch": 0.35, "learning_rate": 3.226561382826969e-05, "loss": 2.4559, "step": 203390 }, { "epoch": 0.35, "learning_rate": 3.226474188834286e-05, "loss": 2.3513, "step": 203400 }, { "epoch": 0.35, "learning_rate": 3.226386994841604e-05, "loss": 2.4937, "step": 203410 }, { "epoch": 0.35, "learning_rate": 3.226299800848921e-05, "loss": 2.4737, "step": 203420 }, { "epoch": 0.35, "learning_rate": 3.226212606856238e-05, "loss": 2.4162, "step": 203430 }, { "epoch": 0.35, "learning_rate": 3.2261254128635556e-05, "loss": 2.3584, "step": 203440 }, { "epoch": 0.35, "learning_rate": 3.2260382188708727e-05, "loss": 2.339, "step": 203450 }, { "epoch": 0.35, "learning_rate": 3.22595102487819e-05, "loss": 2.351, "step": 203460 }, { "epoch": 0.35, "learning_rate": 3.2258638308855074e-05, "loss": 2.372, "step": 203470 }, { "epoch": 0.35, "learning_rate": 3.225776636892825e-05, "loss": 2.3025, "step": 203480 }, { "epoch": 0.35, "learning_rate": 3.225689442900142e-05, "loss": 2.3287, "step": 203490 }, { "epoch": 0.35, "learning_rate": 3.225602248907459e-05, "loss": 2.42, "step": 203500 }, { "epoch": 0.35, "learning_rate": 3.225515054914777e-05, "loss": 2.4611, "step": 203510 }, { "epoch": 0.35, "learning_rate": 3.225427860922094e-05, "loss": 2.4427, "step": 203520 }, { "epoch": 0.35, "learning_rate": 3.225340666929411e-05, "loss": 2.3682, "step": 203530 }, { "epoch": 0.35, "learning_rate": 3.225253472936729e-05, "loss": 2.3323, "step": 203540 }, { "epoch": 0.35, "learning_rate": 3.2251662789440464e-05, "loss": 2.3887, "step": 203550 }, { "epoch": 0.35, "learning_rate": 3.2250790849513635e-05, "loss": 2.5595, "step": 203560 }, { "epoch": 0.36, "learning_rate": 3.2249918909586805e-05, "loss": 2.4039, "step": 203570 }, { "epoch": 0.36, "learning_rate": 3.224904696965998e-05, "loss": 2.4151, "step": 203580 }, { "epoch": 0.36, "learning_rate": 3.224817502973315e-05, "loss": 2.3732, "step": 203590 }, { "epoch": 0.36, "learning_rate": 3.224730308980632e-05, "loss": 2.3595, "step": 203600 }, { "epoch": 0.36, "learning_rate": 3.22464311498795e-05, "loss": 2.5053, "step": 203610 }, { "epoch": 0.36, "learning_rate": 3.224555920995268e-05, "loss": 2.434, "step": 203620 }, { "epoch": 0.36, "learning_rate": 3.224468727002585e-05, "loss": 2.3947, "step": 203630 }, { "epoch": 0.36, "learning_rate": 3.224381533009902e-05, "loss": 2.466, "step": 203640 }, { "epoch": 0.36, "learning_rate": 3.2242943390172195e-05, "loss": 2.2854, "step": 203650 }, { "epoch": 0.36, "learning_rate": 3.2242071450245366e-05, "loss": 2.4452, "step": 203660 }, { "epoch": 0.36, "learning_rate": 3.2241199510318536e-05, "loss": 2.4592, "step": 203670 }, { "epoch": 0.36, "learning_rate": 3.2240327570391706e-05, "loss": 2.388, "step": 203680 }, { "epoch": 0.36, "learning_rate": 3.223945563046489e-05, "loss": 2.3522, "step": 203690 }, { "epoch": 0.36, "learning_rate": 3.223858369053806e-05, "loss": 2.4029, "step": 203700 }, { "epoch": 0.36, "learning_rate": 3.223771175061123e-05, "loss": 2.4648, "step": 203710 }, { "epoch": 0.36, "learning_rate": 3.223683981068441e-05, "loss": 2.52, "step": 203720 }, { "epoch": 0.36, "learning_rate": 3.223596787075758e-05, "loss": 2.2897, "step": 203730 }, { "epoch": 0.36, "learning_rate": 3.223509593083075e-05, "loss": 2.4578, "step": 203740 }, { "epoch": 0.36, "learning_rate": 3.223422399090392e-05, "loss": 2.4215, "step": 203750 }, { "epoch": 0.36, "learning_rate": 3.2233352050977096e-05, "loss": 2.3833, "step": 203760 }, { "epoch": 0.36, "learning_rate": 3.2232480111050274e-05, "loss": 2.4098, "step": 203770 }, { "epoch": 0.36, "learning_rate": 3.2231608171123444e-05, "loss": 2.3018, "step": 203780 }, { "epoch": 0.36, "learning_rate": 3.2230736231196614e-05, "loss": 2.3939, "step": 203790 }, { "epoch": 0.36, "learning_rate": 3.222986429126979e-05, "loss": 2.3346, "step": 203800 }, { "epoch": 0.36, "learning_rate": 3.222899235134296e-05, "loss": 2.4914, "step": 203810 }, { "epoch": 0.36, "learning_rate": 3.222812041141613e-05, "loss": 2.4602, "step": 203820 }, { "epoch": 0.36, "learning_rate": 3.222724847148931e-05, "loss": 2.4321, "step": 203830 }, { "epoch": 0.36, "learning_rate": 3.222637653156249e-05, "loss": 2.4817, "step": 203840 }, { "epoch": 0.36, "learning_rate": 3.222550459163566e-05, "loss": 2.374, "step": 203850 }, { "epoch": 0.36, "learning_rate": 3.222463265170883e-05, "loss": 2.3671, "step": 203860 }, { "epoch": 0.36, "learning_rate": 3.2223760711782005e-05, "loss": 2.3589, "step": 203870 }, { "epoch": 0.36, "learning_rate": 3.2222888771855175e-05, "loss": 2.426, "step": 203880 }, { "epoch": 0.36, "learning_rate": 3.2222016831928345e-05, "loss": 2.4198, "step": 203890 }, { "epoch": 0.36, "learning_rate": 3.222114489200152e-05, "loss": 2.4484, "step": 203900 }, { "epoch": 0.36, "learning_rate": 3.222027295207469e-05, "loss": 2.4851, "step": 203910 }, { "epoch": 0.36, "learning_rate": 3.221940101214787e-05, "loss": 2.3949, "step": 203920 }, { "epoch": 0.36, "learning_rate": 3.221852907222104e-05, "loss": 2.5058, "step": 203930 }, { "epoch": 0.36, "learning_rate": 3.221765713229422e-05, "loss": 2.3946, "step": 203940 }, { "epoch": 0.36, "learning_rate": 3.221678519236739e-05, "loss": 2.3741, "step": 203950 }, { "epoch": 0.36, "learning_rate": 3.221591325244056e-05, "loss": 2.4569, "step": 203960 }, { "epoch": 0.36, "learning_rate": 3.2215041312513735e-05, "loss": 2.3288, "step": 203970 }, { "epoch": 0.36, "learning_rate": 3.2214169372586906e-05, "loss": 2.4244, "step": 203980 }, { "epoch": 0.36, "learning_rate": 3.221329743266008e-05, "loss": 2.4652, "step": 203990 }, { "epoch": 0.36, "learning_rate": 3.221242549273325e-05, "loss": 2.4508, "step": 204000 }, { "epoch": 0.36, "learning_rate": 3.221155355280643e-05, "loss": 2.3453, "step": 204010 }, { "epoch": 0.36, "learning_rate": 3.22106816128796e-05, "loss": 2.3967, "step": 204020 }, { "epoch": 0.36, "learning_rate": 3.220980967295277e-05, "loss": 2.4297, "step": 204030 }, { "epoch": 0.36, "learning_rate": 3.220893773302595e-05, "loss": 2.3522, "step": 204040 }, { "epoch": 0.36, "learning_rate": 3.220806579309912e-05, "loss": 2.3487, "step": 204050 }, { "epoch": 0.36, "learning_rate": 3.2207193853172296e-05, "loss": 2.3988, "step": 204060 }, { "epoch": 0.36, "learning_rate": 3.2206321913245466e-05, "loss": 2.22, "step": 204070 }, { "epoch": 0.36, "learning_rate": 3.2205449973318644e-05, "loss": 2.3798, "step": 204080 }, { "epoch": 0.36, "learning_rate": 3.2204578033391814e-05, "loss": 2.3909, "step": 204090 }, { "epoch": 0.36, "learning_rate": 3.2203706093464984e-05, "loss": 2.4061, "step": 204100 }, { "epoch": 0.36, "learning_rate": 3.220283415353816e-05, "loss": 2.3703, "step": 204110 }, { "epoch": 0.36, "learning_rate": 3.220196221361133e-05, "loss": 2.4229, "step": 204120 }, { "epoch": 0.36, "learning_rate": 3.22010902736845e-05, "loss": 2.4107, "step": 204130 }, { "epoch": 0.36, "learning_rate": 3.220021833375768e-05, "loss": 2.2285, "step": 204140 }, { "epoch": 0.36, "learning_rate": 3.2199346393830857e-05, "loss": 2.4774, "step": 204150 }, { "epoch": 0.36, "learning_rate": 3.219847445390403e-05, "loss": 2.5074, "step": 204160 }, { "epoch": 0.36, "learning_rate": 3.21976025139772e-05, "loss": 2.4143, "step": 204170 }, { "epoch": 0.36, "learning_rate": 3.219673057405037e-05, "loss": 2.4419, "step": 204180 }, { "epoch": 0.36, "learning_rate": 3.2195858634123545e-05, "loss": 2.4282, "step": 204190 }, { "epoch": 0.36, "learning_rate": 3.2194986694196715e-05, "loss": 2.512, "step": 204200 }, { "epoch": 0.36, "learning_rate": 3.219411475426989e-05, "loss": 2.3237, "step": 204210 }, { "epoch": 0.36, "learning_rate": 3.219324281434307e-05, "loss": 2.4317, "step": 204220 }, { "epoch": 0.36, "learning_rate": 3.219237087441624e-05, "loss": 2.4371, "step": 204230 }, { "epoch": 0.36, "learning_rate": 3.219149893448941e-05, "loss": 2.3861, "step": 204240 }, { "epoch": 0.36, "learning_rate": 3.219062699456258e-05, "loss": 2.4251, "step": 204250 }, { "epoch": 0.36, "learning_rate": 3.218975505463576e-05, "loss": 2.3981, "step": 204260 }, { "epoch": 0.36, "learning_rate": 3.218888311470893e-05, "loss": 2.3849, "step": 204270 }, { "epoch": 0.36, "learning_rate": 3.21880111747821e-05, "loss": 2.4491, "step": 204280 }, { "epoch": 0.36, "learning_rate": 3.2187139234855276e-05, "loss": 2.4571, "step": 204290 }, { "epoch": 0.36, "learning_rate": 3.218626729492845e-05, "loss": 2.4905, "step": 204300 }, { "epoch": 0.36, "learning_rate": 3.218539535500162e-05, "loss": 2.4894, "step": 204310 }, { "epoch": 0.36, "learning_rate": 3.2184523415074794e-05, "loss": 2.4818, "step": 204320 }, { "epoch": 0.36, "learning_rate": 3.218365147514797e-05, "loss": 2.4772, "step": 204330 }, { "epoch": 0.36, "learning_rate": 3.218277953522114e-05, "loss": 2.504, "step": 204340 }, { "epoch": 0.36, "learning_rate": 3.218190759529431e-05, "loss": 2.4284, "step": 204350 }, { "epoch": 0.36, "learning_rate": 3.218103565536749e-05, "loss": 2.4503, "step": 204360 }, { "epoch": 0.36, "learning_rate": 3.2180163715440666e-05, "loss": 2.3631, "step": 204370 }, { "epoch": 0.36, "learning_rate": 3.2179291775513836e-05, "loss": 2.3825, "step": 204380 }, { "epoch": 0.36, "learning_rate": 3.217841983558701e-05, "loss": 2.4239, "step": 204390 }, { "epoch": 0.36, "learning_rate": 3.2177547895660184e-05, "loss": 2.3963, "step": 204400 }, { "epoch": 0.36, "learning_rate": 3.2176675955733354e-05, "loss": 2.425, "step": 204410 }, { "epoch": 0.36, "learning_rate": 3.2175804015806525e-05, "loss": 2.3052, "step": 204420 }, { "epoch": 0.36, "learning_rate": 3.21749320758797e-05, "loss": 2.4638, "step": 204430 }, { "epoch": 0.36, "learning_rate": 3.217406013595288e-05, "loss": 2.4068, "step": 204440 }, { "epoch": 0.36, "learning_rate": 3.217318819602605e-05, "loss": 2.5206, "step": 204450 }, { "epoch": 0.36, "learning_rate": 3.217231625609922e-05, "loss": 2.4477, "step": 204460 }, { "epoch": 0.36, "learning_rate": 3.21714443161724e-05, "loss": 2.4418, "step": 204470 }, { "epoch": 0.36, "learning_rate": 3.217057237624557e-05, "loss": 2.6085, "step": 204480 }, { "epoch": 0.36, "learning_rate": 3.216970043631874e-05, "loss": 2.4092, "step": 204490 }, { "epoch": 0.36, "learning_rate": 3.2168828496391915e-05, "loss": 2.3916, "step": 204500 }, { "epoch": 0.36, "learning_rate": 3.216795655646509e-05, "loss": 2.4623, "step": 204510 }, { "epoch": 0.36, "learning_rate": 3.216708461653826e-05, "loss": 2.5044, "step": 204520 }, { "epoch": 0.36, "learning_rate": 3.216621267661143e-05, "loss": 2.3471, "step": 204530 }, { "epoch": 0.36, "learning_rate": 3.216534073668461e-05, "loss": 2.3176, "step": 204540 }, { "epoch": 0.36, "learning_rate": 3.216446879675778e-05, "loss": 2.4662, "step": 204550 }, { "epoch": 0.36, "learning_rate": 3.216359685683095e-05, "loss": 2.4473, "step": 204560 }, { "epoch": 0.36, "learning_rate": 3.216272491690413e-05, "loss": 2.4612, "step": 204570 }, { "epoch": 0.36, "learning_rate": 3.2161852976977305e-05, "loss": 2.4454, "step": 204580 }, { "epoch": 0.36, "learning_rate": 3.2160981037050475e-05, "loss": 2.5055, "step": 204590 }, { "epoch": 0.36, "learning_rate": 3.2160109097123646e-05, "loss": 2.6031, "step": 204600 }, { "epoch": 0.36, "learning_rate": 3.215923715719682e-05, "loss": 2.4223, "step": 204610 }, { "epoch": 0.36, "learning_rate": 3.215836521726999e-05, "loss": 2.5363, "step": 204620 }, { "epoch": 0.36, "learning_rate": 3.2157493277343164e-05, "loss": 2.3929, "step": 204630 }, { "epoch": 0.36, "learning_rate": 3.2156621337416334e-05, "loss": 2.4773, "step": 204640 }, { "epoch": 0.36, "learning_rate": 3.215574939748951e-05, "loss": 2.5391, "step": 204650 }, { "epoch": 0.36, "learning_rate": 3.215487745756269e-05, "loss": 2.4727, "step": 204660 }, { "epoch": 0.36, "learning_rate": 3.215400551763586e-05, "loss": 2.3687, "step": 204670 }, { "epoch": 0.36, "learning_rate": 3.2153133577709036e-05, "loss": 2.2996, "step": 204680 }, { "epoch": 0.36, "learning_rate": 3.2152261637782206e-05, "loss": 2.3644, "step": 204690 }, { "epoch": 0.36, "learning_rate": 3.215138969785538e-05, "loss": 2.34, "step": 204700 }, { "epoch": 0.36, "learning_rate": 3.215051775792855e-05, "loss": 2.2241, "step": 204710 }, { "epoch": 0.36, "learning_rate": 3.2149645818001724e-05, "loss": 2.4408, "step": 204720 }, { "epoch": 0.36, "learning_rate": 3.21487738780749e-05, "loss": 2.4375, "step": 204730 }, { "epoch": 0.36, "learning_rate": 3.214790193814807e-05, "loss": 2.4367, "step": 204740 }, { "epoch": 0.36, "learning_rate": 3.214702999822124e-05, "loss": 2.3915, "step": 204750 }, { "epoch": 0.36, "learning_rate": 3.214615805829442e-05, "loss": 2.4747, "step": 204760 }, { "epoch": 0.36, "learning_rate": 3.214528611836759e-05, "loss": 2.4452, "step": 204770 }, { "epoch": 0.36, "learning_rate": 3.214441417844076e-05, "loss": 2.5077, "step": 204780 }, { "epoch": 0.36, "learning_rate": 3.214354223851394e-05, "loss": 2.3176, "step": 204790 }, { "epoch": 0.36, "learning_rate": 3.214267029858711e-05, "loss": 2.3676, "step": 204800 }, { "epoch": 0.36, "learning_rate": 3.2141798358660285e-05, "loss": 2.3398, "step": 204810 }, { "epoch": 0.36, "learning_rate": 3.2140926418733455e-05, "loss": 2.3739, "step": 204820 }, { "epoch": 0.36, "learning_rate": 3.214005447880663e-05, "loss": 2.4678, "step": 204830 }, { "epoch": 0.36, "learning_rate": 3.21391825388798e-05, "loss": 2.4204, "step": 204840 }, { "epoch": 0.36, "learning_rate": 3.213831059895297e-05, "loss": 2.3983, "step": 204850 }, { "epoch": 0.36, "learning_rate": 3.213743865902615e-05, "loss": 2.4578, "step": 204860 }, { "epoch": 0.36, "learning_rate": 3.213656671909932e-05, "loss": 2.4549, "step": 204870 }, { "epoch": 0.36, "learning_rate": 3.21356947791725e-05, "loss": 2.308, "step": 204880 }, { "epoch": 0.36, "learning_rate": 3.213482283924567e-05, "loss": 2.4147, "step": 204890 }, { "epoch": 0.36, "learning_rate": 3.2133950899318845e-05, "loss": 2.3012, "step": 204900 }, { "epoch": 0.36, "learning_rate": 3.2133078959392016e-05, "loss": 2.4941, "step": 204910 }, { "epoch": 0.36, "learning_rate": 3.2132207019465186e-05, "loss": 2.464, "step": 204920 }, { "epoch": 0.36, "learning_rate": 3.213133507953836e-05, "loss": 2.4847, "step": 204930 }, { "epoch": 0.36, "learning_rate": 3.2130463139611534e-05, "loss": 2.356, "step": 204940 }, { "epoch": 0.36, "learning_rate": 3.2129591199684704e-05, "loss": 2.4926, "step": 204950 }, { "epoch": 0.36, "learning_rate": 3.212871925975788e-05, "loss": 2.416, "step": 204960 }, { "epoch": 0.36, "learning_rate": 3.212784731983106e-05, "loss": 2.4901, "step": 204970 }, { "epoch": 0.36, "learning_rate": 3.212697537990423e-05, "loss": 2.386, "step": 204980 }, { "epoch": 0.36, "learning_rate": 3.21261034399774e-05, "loss": 2.411, "step": 204990 }, { "epoch": 0.36, "learning_rate": 3.2125231500050576e-05, "loss": 2.4975, "step": 205000 }, { "epoch": 0.36, "learning_rate": 3.2124359560123747e-05, "loss": 2.4597, "step": 205010 }, { "epoch": 0.36, "learning_rate": 3.212348762019692e-05, "loss": 2.3781, "step": 205020 }, { "epoch": 0.36, "learning_rate": 3.2122615680270094e-05, "loss": 2.344, "step": 205030 }, { "epoch": 0.36, "learning_rate": 3.212174374034327e-05, "loss": 2.4791, "step": 205040 }, { "epoch": 0.36, "learning_rate": 3.212087180041644e-05, "loss": 2.4369, "step": 205050 }, { "epoch": 0.36, "learning_rate": 3.211999986048961e-05, "loss": 2.4544, "step": 205060 }, { "epoch": 0.36, "learning_rate": 3.211912792056279e-05, "loss": 2.4523, "step": 205070 }, { "epoch": 0.36, "learning_rate": 3.211825598063596e-05, "loss": 2.3102, "step": 205080 }, { "epoch": 0.36, "learning_rate": 3.211738404070913e-05, "loss": 2.3949, "step": 205090 }, { "epoch": 0.36, "learning_rate": 3.21165121007823e-05, "loss": 2.3915, "step": 205100 }, { "epoch": 0.36, "learning_rate": 3.2115640160855484e-05, "loss": 2.4835, "step": 205110 }, { "epoch": 0.36, "learning_rate": 3.2114768220928655e-05, "loss": 2.4571, "step": 205120 }, { "epoch": 0.36, "learning_rate": 3.2113896281001825e-05, "loss": 2.4145, "step": 205130 }, { "epoch": 0.36, "learning_rate": 3.2113024341074995e-05, "loss": 2.4523, "step": 205140 }, { "epoch": 0.36, "learning_rate": 3.211215240114817e-05, "loss": 2.4613, "step": 205150 }, { "epoch": 0.36, "learning_rate": 3.211128046122134e-05, "loss": 2.4811, "step": 205160 }, { "epoch": 0.36, "learning_rate": 3.211040852129451e-05, "loss": 2.5162, "step": 205170 }, { "epoch": 0.36, "learning_rate": 3.21095365813677e-05, "loss": 2.3821, "step": 205180 }, { "epoch": 0.36, "learning_rate": 3.210866464144087e-05, "loss": 2.4468, "step": 205190 }, { "epoch": 0.36, "learning_rate": 3.210779270151404e-05, "loss": 2.3566, "step": 205200 }, { "epoch": 0.36, "learning_rate": 3.210692076158721e-05, "loss": 2.4032, "step": 205210 }, { "epoch": 0.36, "learning_rate": 3.2106048821660386e-05, "loss": 2.436, "step": 205220 }, { "epoch": 0.36, "learning_rate": 3.2105176881733556e-05, "loss": 2.4623, "step": 205230 }, { "epoch": 0.36, "learning_rate": 3.2104304941806726e-05, "loss": 2.5085, "step": 205240 }, { "epoch": 0.36, "learning_rate": 3.2103433001879903e-05, "loss": 2.5545, "step": 205250 }, { "epoch": 0.36, "learning_rate": 3.210256106195308e-05, "loss": 2.5158, "step": 205260 }, { "epoch": 0.36, "learning_rate": 3.210168912202625e-05, "loss": 2.3772, "step": 205270 }, { "epoch": 0.36, "learning_rate": 3.210081718209942e-05, "loss": 2.3742, "step": 205280 }, { "epoch": 0.36, "learning_rate": 3.20999452421726e-05, "loss": 2.3735, "step": 205290 }, { "epoch": 0.36, "learning_rate": 3.209907330224577e-05, "loss": 2.4435, "step": 205300 }, { "epoch": 0.36, "learning_rate": 3.209820136231894e-05, "loss": 2.5038, "step": 205310 }, { "epoch": 0.36, "learning_rate": 3.2097329422392116e-05, "loss": 2.4329, "step": 205320 }, { "epoch": 0.36, "learning_rate": 3.2096457482465294e-05, "loss": 2.3991, "step": 205330 }, { "epoch": 0.36, "learning_rate": 3.2095585542538464e-05, "loss": 2.4746, "step": 205340 }, { "epoch": 0.36, "learning_rate": 3.2094713602611634e-05, "loss": 2.4944, "step": 205350 }, { "epoch": 0.36, "learning_rate": 3.209384166268481e-05, "loss": 2.5041, "step": 205360 }, { "epoch": 0.36, "learning_rate": 3.209296972275798e-05, "loss": 2.4942, "step": 205370 }, { "epoch": 0.36, "learning_rate": 3.209209778283115e-05, "loss": 2.3403, "step": 205380 }, { "epoch": 0.36, "learning_rate": 3.209122584290433e-05, "loss": 2.3407, "step": 205390 }, { "epoch": 0.36, "learning_rate": 3.209035390297751e-05, "loss": 2.4883, "step": 205400 }, { "epoch": 0.36, "learning_rate": 3.208948196305068e-05, "loss": 2.363, "step": 205410 }, { "epoch": 0.36, "learning_rate": 3.208861002312385e-05, "loss": 2.4351, "step": 205420 }, { "epoch": 0.36, "learning_rate": 3.2087738083197025e-05, "loss": 2.344, "step": 205430 }, { "epoch": 0.36, "learning_rate": 3.2086866143270195e-05, "loss": 2.3733, "step": 205440 }, { "epoch": 0.36, "learning_rate": 3.2085994203343365e-05, "loss": 2.4213, "step": 205450 }, { "epoch": 0.36, "learning_rate": 3.208512226341654e-05, "loss": 2.3833, "step": 205460 }, { "epoch": 0.36, "learning_rate": 3.208425032348971e-05, "loss": 2.4326, "step": 205470 }, { "epoch": 0.36, "learning_rate": 3.208337838356289e-05, "loss": 2.4012, "step": 205480 }, { "epoch": 0.36, "learning_rate": 3.208250644363606e-05, "loss": 2.332, "step": 205490 }, { "epoch": 0.36, "learning_rate": 3.208163450370924e-05, "loss": 2.3448, "step": 205500 }, { "epoch": 0.36, "learning_rate": 3.208076256378241e-05, "loss": 2.553, "step": 205510 }, { "epoch": 0.36, "learning_rate": 3.207989062385558e-05, "loss": 2.3735, "step": 205520 }, { "epoch": 0.36, "learning_rate": 3.2079018683928755e-05, "loss": 2.4431, "step": 205530 }, { "epoch": 0.36, "learning_rate": 3.2078146744001926e-05, "loss": 2.3169, "step": 205540 }, { "epoch": 0.36, "learning_rate": 3.20772748040751e-05, "loss": 2.4381, "step": 205550 }, { "epoch": 0.36, "learning_rate": 3.2076402864148273e-05, "loss": 2.396, "step": 205560 }, { "epoch": 0.36, "learning_rate": 3.207553092422145e-05, "loss": 2.3588, "step": 205570 }, { "epoch": 0.36, "learning_rate": 3.207465898429462e-05, "loss": 2.4418, "step": 205580 }, { "epoch": 0.36, "learning_rate": 3.207378704436779e-05, "loss": 2.3774, "step": 205590 }, { "epoch": 0.36, "learning_rate": 3.207291510444096e-05, "loss": 2.4011, "step": 205600 }, { "epoch": 0.36, "learning_rate": 3.207204316451414e-05, "loss": 2.3516, "step": 205610 }, { "epoch": 0.36, "learning_rate": 3.207117122458731e-05, "loss": 2.5026, "step": 205620 }, { "epoch": 0.36, "learning_rate": 3.2070299284660486e-05, "loss": 2.3792, "step": 205630 }, { "epoch": 0.36, "learning_rate": 3.2069427344733664e-05, "loss": 2.4209, "step": 205640 }, { "epoch": 0.36, "learning_rate": 3.2068555404806834e-05, "loss": 2.4254, "step": 205650 }, { "epoch": 0.36, "learning_rate": 3.2067683464880004e-05, "loss": 2.4302, "step": 205660 }, { "epoch": 0.36, "learning_rate": 3.2066811524953175e-05, "loss": 2.3218, "step": 205670 }, { "epoch": 0.36, "learning_rate": 3.206593958502635e-05, "loss": 2.4864, "step": 205680 }, { "epoch": 0.36, "learning_rate": 3.206506764509952e-05, "loss": 2.478, "step": 205690 }, { "epoch": 0.36, "learning_rate": 3.20641957051727e-05, "loss": 2.2895, "step": 205700 }, { "epoch": 0.36, "learning_rate": 3.206332376524587e-05, "loss": 2.5352, "step": 205710 }, { "epoch": 0.36, "learning_rate": 3.206245182531905e-05, "loss": 2.3424, "step": 205720 }, { "epoch": 0.36, "learning_rate": 3.206157988539222e-05, "loss": 2.3866, "step": 205730 }, { "epoch": 0.36, "learning_rate": 3.206070794546539e-05, "loss": 2.3592, "step": 205740 }, { "epoch": 0.36, "learning_rate": 3.2059836005538565e-05, "loss": 2.5298, "step": 205750 }, { "epoch": 0.36, "learning_rate": 3.2058964065611735e-05, "loss": 2.4929, "step": 205760 }, { "epoch": 0.36, "learning_rate": 3.2058092125684906e-05, "loss": 2.4346, "step": 205770 }, { "epoch": 0.36, "learning_rate": 3.205722018575808e-05, "loss": 2.3927, "step": 205780 }, { "epoch": 0.36, "learning_rate": 3.205634824583126e-05, "loss": 2.4053, "step": 205790 }, { "epoch": 0.36, "learning_rate": 3.205547630590443e-05, "loss": 2.3, "step": 205800 }, { "epoch": 0.36, "learning_rate": 3.20546043659776e-05, "loss": 2.4661, "step": 205810 }, { "epoch": 0.36, "learning_rate": 3.205373242605078e-05, "loss": 2.4696, "step": 205820 }, { "epoch": 0.36, "learning_rate": 3.205286048612395e-05, "loss": 2.4056, "step": 205830 }, { "epoch": 0.36, "learning_rate": 3.205198854619712e-05, "loss": 2.4186, "step": 205840 }, { "epoch": 0.36, "learning_rate": 3.2051116606270296e-05, "loss": 2.4548, "step": 205850 }, { "epoch": 0.36, "learning_rate": 3.205024466634347e-05, "loss": 2.4633, "step": 205860 }, { "epoch": 0.36, "learning_rate": 3.204937272641664e-05, "loss": 2.5082, "step": 205870 }, { "epoch": 0.36, "learning_rate": 3.2048500786489814e-05, "loss": 2.4491, "step": 205880 }, { "epoch": 0.36, "learning_rate": 3.204762884656299e-05, "loss": 2.4017, "step": 205890 }, { "epoch": 0.36, "learning_rate": 3.204675690663616e-05, "loss": 2.2991, "step": 205900 }, { "epoch": 0.36, "learning_rate": 3.204588496670933e-05, "loss": 2.2784, "step": 205910 }, { "epoch": 0.36, "learning_rate": 3.204501302678251e-05, "loss": 2.4183, "step": 205920 }, { "epoch": 0.36, "learning_rate": 3.2044141086855686e-05, "loss": 2.3781, "step": 205930 }, { "epoch": 0.36, "learning_rate": 3.2043269146928856e-05, "loss": 2.3872, "step": 205940 }, { "epoch": 0.36, "learning_rate": 3.204239720700203e-05, "loss": 2.483, "step": 205950 }, { "epoch": 0.36, "learning_rate": 3.2041525267075204e-05, "loss": 2.4383, "step": 205960 }, { "epoch": 0.36, "learning_rate": 3.2040653327148374e-05, "loss": 2.3506, "step": 205970 }, { "epoch": 0.36, "learning_rate": 3.2039781387221545e-05, "loss": 2.4038, "step": 205980 }, { "epoch": 0.36, "learning_rate": 3.2038909447294715e-05, "loss": 2.3971, "step": 205990 }, { "epoch": 0.36, "learning_rate": 3.20380375073679e-05, "loss": 2.3146, "step": 206000 }, { "epoch": 0.36, "learning_rate": 3.203716556744107e-05, "loss": 2.4633, "step": 206010 }, { "epoch": 0.36, "learning_rate": 3.203629362751424e-05, "loss": 2.3234, "step": 206020 }, { "epoch": 0.36, "learning_rate": 3.203542168758742e-05, "loss": 2.3612, "step": 206030 }, { "epoch": 0.36, "learning_rate": 3.203454974766059e-05, "loss": 2.4307, "step": 206040 }, { "epoch": 0.36, "learning_rate": 3.203367780773376e-05, "loss": 2.4082, "step": 206050 }, { "epoch": 0.36, "learning_rate": 3.203280586780693e-05, "loss": 2.4394, "step": 206060 }, { "epoch": 0.36, "learning_rate": 3.203193392788011e-05, "loss": 2.3177, "step": 206070 }, { "epoch": 0.36, "learning_rate": 3.203106198795328e-05, "loss": 2.5199, "step": 206080 }, { "epoch": 0.36, "learning_rate": 3.203019004802645e-05, "loss": 2.2875, "step": 206090 }, { "epoch": 0.36, "learning_rate": 3.202931810809962e-05, "loss": 2.4504, "step": 206100 }, { "epoch": 0.36, "learning_rate": 3.20284461681728e-05, "loss": 2.4676, "step": 206110 }, { "epoch": 0.36, "learning_rate": 3.202757422824597e-05, "loss": 2.5626, "step": 206120 }, { "epoch": 0.36, "learning_rate": 3.202670228831914e-05, "loss": 2.3572, "step": 206130 }, { "epoch": 0.36, "learning_rate": 3.202583034839232e-05, "loss": 2.3653, "step": 206140 }, { "epoch": 0.36, "learning_rate": 3.2024958408465495e-05, "loss": 2.5401, "step": 206150 }, { "epoch": 0.36, "learning_rate": 3.2024086468538666e-05, "loss": 2.4316, "step": 206160 }, { "epoch": 0.36, "learning_rate": 3.2023214528611836e-05, "loss": 2.4854, "step": 206170 }, { "epoch": 0.36, "learning_rate": 3.202234258868501e-05, "loss": 2.572, "step": 206180 }, { "epoch": 0.36, "learning_rate": 3.2021470648758184e-05, "loss": 2.5298, "step": 206190 }, { "epoch": 0.36, "learning_rate": 3.2020598708831354e-05, "loss": 2.4161, "step": 206200 }, { "epoch": 0.36, "learning_rate": 3.201972676890453e-05, "loss": 2.4386, "step": 206210 }, { "epoch": 0.36, "learning_rate": 3.201885482897771e-05, "loss": 2.5539, "step": 206220 }, { "epoch": 0.36, "learning_rate": 3.201798288905088e-05, "loss": 2.4, "step": 206230 }, { "epoch": 0.36, "learning_rate": 3.201711094912405e-05, "loss": 2.2398, "step": 206240 }, { "epoch": 0.36, "learning_rate": 3.2016239009197226e-05, "loss": 2.3641, "step": 206250 }, { "epoch": 0.36, "learning_rate": 3.20153670692704e-05, "loss": 2.5389, "step": 206260 }, { "epoch": 0.36, "learning_rate": 3.201449512934357e-05, "loss": 2.3465, "step": 206270 }, { "epoch": 0.36, "learning_rate": 3.2013623189416744e-05, "loss": 2.4226, "step": 206280 }, { "epoch": 0.36, "learning_rate": 3.2012751249489915e-05, "loss": 2.3347, "step": 206290 }, { "epoch": 0.36, "learning_rate": 3.201187930956309e-05, "loss": 2.4195, "step": 206300 }, { "epoch": 0.36, "learning_rate": 3.201100736963626e-05, "loss": 2.4098, "step": 206310 }, { "epoch": 0.36, "learning_rate": 3.201013542970944e-05, "loss": 2.3531, "step": 206320 }, { "epoch": 0.36, "learning_rate": 3.200926348978261e-05, "loss": 2.3788, "step": 206330 }, { "epoch": 0.36, "learning_rate": 3.200839154985578e-05, "loss": 2.465, "step": 206340 }, { "epoch": 0.36, "learning_rate": 3.200751960992896e-05, "loss": 2.3533, "step": 206350 }, { "epoch": 0.36, "learning_rate": 3.200664767000213e-05, "loss": 2.2632, "step": 206360 }, { "epoch": 0.36, "learning_rate": 3.2005775730075305e-05, "loss": 2.447, "step": 206370 }, { "epoch": 0.36, "learning_rate": 3.2004903790148475e-05, "loss": 2.399, "step": 206380 }, { "epoch": 0.36, "learning_rate": 3.200403185022165e-05, "loss": 2.5187, "step": 206390 }, { "epoch": 0.36, "learning_rate": 3.200315991029482e-05, "loss": 2.4086, "step": 206400 }, { "epoch": 0.36, "learning_rate": 3.200228797036799e-05, "loss": 2.5178, "step": 206410 }, { "epoch": 0.36, "learning_rate": 3.200141603044117e-05, "loss": 2.4429, "step": 206420 }, { "epoch": 0.36, "learning_rate": 3.200054409051434e-05, "loss": 2.4299, "step": 206430 }, { "epoch": 0.36, "learning_rate": 3.199967215058751e-05, "loss": 2.4583, "step": 206440 }, { "epoch": 0.36, "learning_rate": 3.199880021066069e-05, "loss": 2.4348, "step": 206450 }, { "epoch": 0.36, "learning_rate": 3.1997928270733865e-05, "loss": 2.3486, "step": 206460 }, { "epoch": 0.36, "learning_rate": 3.1997056330807036e-05, "loss": 2.3471, "step": 206470 }, { "epoch": 0.36, "learning_rate": 3.1996184390880206e-05, "loss": 2.3922, "step": 206480 }, { "epoch": 0.36, "learning_rate": 3.1995312450953376e-05, "loss": 2.3836, "step": 206490 }, { "epoch": 0.36, "learning_rate": 3.1994440511026554e-05, "loss": 2.4037, "step": 206500 }, { "epoch": 0.36, "learning_rate": 3.1993568571099724e-05, "loss": 2.4566, "step": 206510 }, { "epoch": 0.36, "learning_rate": 3.19926966311729e-05, "loss": 2.4493, "step": 206520 }, { "epoch": 0.36, "learning_rate": 3.199182469124608e-05, "loss": 2.4554, "step": 206530 }, { "epoch": 0.36, "learning_rate": 3.199095275131925e-05, "loss": 2.3917, "step": 206540 }, { "epoch": 0.36, "learning_rate": 3.199008081139242e-05, "loss": 2.4728, "step": 206550 }, { "epoch": 0.36, "learning_rate": 3.198920887146559e-05, "loss": 2.4733, "step": 206560 }, { "epoch": 0.36, "learning_rate": 3.1988336931538767e-05, "loss": 2.3515, "step": 206570 }, { "epoch": 0.36, "learning_rate": 3.198746499161194e-05, "loss": 2.424, "step": 206580 }, { "epoch": 0.36, "learning_rate": 3.1986593051685114e-05, "loss": 2.3485, "step": 206590 }, { "epoch": 0.36, "learning_rate": 3.1985721111758284e-05, "loss": 2.4471, "step": 206600 }, { "epoch": 0.36, "learning_rate": 3.198484917183146e-05, "loss": 2.3241, "step": 206610 }, { "epoch": 0.36, "learning_rate": 3.198397723190463e-05, "loss": 2.447, "step": 206620 }, { "epoch": 0.36, "learning_rate": 3.19831052919778e-05, "loss": 2.3131, "step": 206630 }, { "epoch": 0.36, "learning_rate": 3.198223335205098e-05, "loss": 2.2678, "step": 206640 }, { "epoch": 0.36, "learning_rate": 3.198136141212415e-05, "loss": 2.467, "step": 206650 }, { "epoch": 0.36, "learning_rate": 3.198048947219732e-05, "loss": 2.4695, "step": 206660 }, { "epoch": 0.36, "learning_rate": 3.19796175322705e-05, "loss": 2.3462, "step": 206670 }, { "epoch": 0.36, "learning_rate": 3.1978745592343675e-05, "loss": 2.4485, "step": 206680 }, { "epoch": 0.36, "learning_rate": 3.1977873652416845e-05, "loss": 2.5422, "step": 206690 }, { "epoch": 0.36, "learning_rate": 3.1977001712490015e-05, "loss": 2.3385, "step": 206700 }, { "epoch": 0.36, "learning_rate": 3.197612977256319e-05, "loss": 2.3732, "step": 206710 }, { "epoch": 0.36, "learning_rate": 3.197525783263636e-05, "loss": 2.431, "step": 206720 }, { "epoch": 0.36, "learning_rate": 3.197438589270953e-05, "loss": 2.4376, "step": 206730 }, { "epoch": 0.36, "learning_rate": 3.197351395278271e-05, "loss": 2.3579, "step": 206740 }, { "epoch": 0.36, "learning_rate": 3.197264201285589e-05, "loss": 2.4233, "step": 206750 }, { "epoch": 0.36, "learning_rate": 3.197177007292906e-05, "loss": 2.4765, "step": 206760 }, { "epoch": 0.36, "learning_rate": 3.197089813300223e-05, "loss": 2.2997, "step": 206770 }, { "epoch": 0.36, "learning_rate": 3.1970026193075406e-05, "loss": 2.4318, "step": 206780 }, { "epoch": 0.36, "learning_rate": 3.1969154253148576e-05, "loss": 2.3837, "step": 206790 }, { "epoch": 0.36, "learning_rate": 3.1968282313221746e-05, "loss": 2.4966, "step": 206800 }, { "epoch": 0.36, "learning_rate": 3.1967410373294923e-05, "loss": 2.3675, "step": 206810 }, { "epoch": 0.36, "learning_rate": 3.19665384333681e-05, "loss": 2.2523, "step": 206820 }, { "epoch": 0.36, "learning_rate": 3.196566649344127e-05, "loss": 2.5456, "step": 206830 }, { "epoch": 0.36, "learning_rate": 3.196479455351444e-05, "loss": 2.2706, "step": 206840 }, { "epoch": 0.36, "learning_rate": 3.196392261358762e-05, "loss": 2.2939, "step": 206850 }, { "epoch": 0.36, "learning_rate": 3.196305067366079e-05, "loss": 2.5291, "step": 206860 }, { "epoch": 0.36, "learning_rate": 3.196217873373396e-05, "loss": 2.3676, "step": 206870 }, { "epoch": 0.36, "learning_rate": 3.1961306793807136e-05, "loss": 2.4266, "step": 206880 }, { "epoch": 0.36, "learning_rate": 3.1960434853880314e-05, "loss": 2.5004, "step": 206890 }, { "epoch": 0.36, "learning_rate": 3.1959562913953484e-05, "loss": 2.3749, "step": 206900 }, { "epoch": 0.36, "learning_rate": 3.1958690974026654e-05, "loss": 2.3072, "step": 206910 }, { "epoch": 0.36, "learning_rate": 3.195781903409983e-05, "loss": 2.4957, "step": 206920 }, { "epoch": 0.36, "learning_rate": 3.1956947094173e-05, "loss": 2.547, "step": 206930 }, { "epoch": 0.36, "learning_rate": 3.195607515424617e-05, "loss": 2.4674, "step": 206940 }, { "epoch": 0.36, "learning_rate": 3.195520321431934e-05, "loss": 2.453, "step": 206950 }, { "epoch": 0.36, "learning_rate": 3.195433127439252e-05, "loss": 2.3531, "step": 206960 }, { "epoch": 0.36, "learning_rate": 3.19534593344657e-05, "loss": 2.4749, "step": 206970 }, { "epoch": 0.36, "learning_rate": 3.195258739453887e-05, "loss": 2.5248, "step": 206980 }, { "epoch": 0.36, "learning_rate": 3.1951715454612045e-05, "loss": 2.3522, "step": 206990 }, { "epoch": 0.36, "learning_rate": 3.1950843514685215e-05, "loss": 2.4521, "step": 207000 }, { "epoch": 0.36, "learning_rate": 3.1949971574758385e-05, "loss": 2.3771, "step": 207010 }, { "epoch": 0.36, "learning_rate": 3.1949099634831556e-05, "loss": 2.3731, "step": 207020 }, { "epoch": 0.36, "learning_rate": 3.194822769490473e-05, "loss": 2.4715, "step": 207030 }, { "epoch": 0.36, "learning_rate": 3.194735575497791e-05, "loss": 2.4104, "step": 207040 }, { "epoch": 0.36, "learning_rate": 3.194648381505108e-05, "loss": 2.4022, "step": 207050 }, { "epoch": 0.36, "learning_rate": 3.194561187512425e-05, "loss": 2.3295, "step": 207060 }, { "epoch": 0.36, "learning_rate": 3.194473993519743e-05, "loss": 2.2718, "step": 207070 }, { "epoch": 0.36, "learning_rate": 3.19438679952706e-05, "loss": 2.4076, "step": 207080 }, { "epoch": 0.36, "learning_rate": 3.194299605534377e-05, "loss": 2.526, "step": 207090 }, { "epoch": 0.36, "learning_rate": 3.1942124115416946e-05, "loss": 2.4078, "step": 207100 }, { "epoch": 0.36, "learning_rate": 3.194125217549012e-05, "loss": 2.2204, "step": 207110 }, { "epoch": 0.36, "learning_rate": 3.1940380235563293e-05, "loss": 2.5293, "step": 207120 }, { "epoch": 0.36, "learning_rate": 3.1939508295636464e-05, "loss": 2.5344, "step": 207130 }, { "epoch": 0.36, "learning_rate": 3.193863635570964e-05, "loss": 2.429, "step": 207140 }, { "epoch": 0.36, "learning_rate": 3.193776441578281e-05, "loss": 2.4581, "step": 207150 }, { "epoch": 0.36, "learning_rate": 3.193689247585598e-05, "loss": 2.4176, "step": 207160 }, { "epoch": 0.36, "learning_rate": 3.193602053592916e-05, "loss": 2.4113, "step": 207170 }, { "epoch": 0.36, "learning_rate": 3.193514859600233e-05, "loss": 2.4627, "step": 207180 }, { "epoch": 0.36, "learning_rate": 3.1934276656075506e-05, "loss": 2.3895, "step": 207190 }, { "epoch": 0.36, "learning_rate": 3.193340471614868e-05, "loss": 2.3824, "step": 207200 }, { "epoch": 0.36, "learning_rate": 3.1932532776221854e-05, "loss": 2.4154, "step": 207210 }, { "epoch": 0.36, "learning_rate": 3.1931660836295024e-05, "loss": 2.3355, "step": 207220 }, { "epoch": 0.36, "learning_rate": 3.1930788896368195e-05, "loss": 2.4038, "step": 207230 }, { "epoch": 0.36, "learning_rate": 3.192991695644137e-05, "loss": 2.4415, "step": 207240 }, { "epoch": 0.36, "learning_rate": 3.192904501651454e-05, "loss": 2.4575, "step": 207250 }, { "epoch": 0.36, "learning_rate": 3.192817307658772e-05, "loss": 2.4085, "step": 207260 }, { "epoch": 0.36, "learning_rate": 3.192730113666089e-05, "loss": 2.4097, "step": 207270 }, { "epoch": 0.36, "learning_rate": 3.192642919673407e-05, "loss": 2.4289, "step": 207280 }, { "epoch": 0.36, "learning_rate": 3.192555725680724e-05, "loss": 2.3699, "step": 207290 }, { "epoch": 0.36, "learning_rate": 3.192468531688041e-05, "loss": 2.4076, "step": 207300 }, { "epoch": 0.36, "learning_rate": 3.1923813376953585e-05, "loss": 2.4169, "step": 207310 }, { "epoch": 0.36, "learning_rate": 3.1922941437026755e-05, "loss": 2.4195, "step": 207320 }, { "epoch": 0.36, "learning_rate": 3.1922069497099926e-05, "loss": 2.4144, "step": 207330 }, { "epoch": 0.36, "learning_rate": 3.19211975571731e-05, "loss": 2.3487, "step": 207340 }, { "epoch": 0.36, "learning_rate": 3.192032561724628e-05, "loss": 2.3558, "step": 207350 }, { "epoch": 0.36, "learning_rate": 3.191945367731945e-05, "loss": 2.4179, "step": 207360 }, { "epoch": 0.36, "learning_rate": 3.191858173739262e-05, "loss": 2.3572, "step": 207370 }, { "epoch": 0.36, "learning_rate": 3.19177097974658e-05, "loss": 2.3826, "step": 207380 }, { "epoch": 0.36, "learning_rate": 3.191683785753897e-05, "loss": 2.5028, "step": 207390 }, { "epoch": 0.36, "learning_rate": 3.191596591761214e-05, "loss": 2.4195, "step": 207400 }, { "epoch": 0.36, "learning_rate": 3.1915093977685316e-05, "loss": 2.4371, "step": 207410 }, { "epoch": 0.36, "learning_rate": 3.191422203775849e-05, "loss": 2.4014, "step": 207420 }, { "epoch": 0.36, "learning_rate": 3.191335009783166e-05, "loss": 2.4286, "step": 207430 }, { "epoch": 0.36, "learning_rate": 3.1912478157904834e-05, "loss": 2.3791, "step": 207440 }, { "epoch": 0.36, "learning_rate": 3.1911606217978004e-05, "loss": 2.2904, "step": 207450 }, { "epoch": 0.36, "learning_rate": 3.191073427805118e-05, "loss": 2.4537, "step": 207460 }, { "epoch": 0.36, "learning_rate": 3.190986233812435e-05, "loss": 2.3853, "step": 207470 }, { "epoch": 0.36, "learning_rate": 3.190899039819752e-05, "loss": 2.4731, "step": 207480 }, { "epoch": 0.36, "learning_rate": 3.1908118458270706e-05, "loss": 2.4904, "step": 207490 }, { "epoch": 0.36, "learning_rate": 3.1907246518343876e-05, "loss": 2.3755, "step": 207500 }, { "epoch": 0.36, "learning_rate": 3.190637457841705e-05, "loss": 2.3009, "step": 207510 }, { "epoch": 0.36, "learning_rate": 3.190550263849022e-05, "loss": 2.3059, "step": 207520 }, { "epoch": 0.36, "learning_rate": 3.1904630698563394e-05, "loss": 2.3447, "step": 207530 }, { "epoch": 0.36, "learning_rate": 3.1903758758636565e-05, "loss": 2.3895, "step": 207540 }, { "epoch": 0.36, "learning_rate": 3.1902886818709735e-05, "loss": 2.43, "step": 207550 }, { "epoch": 0.36, "learning_rate": 3.190201487878291e-05, "loss": 2.426, "step": 207560 }, { "epoch": 0.36, "learning_rate": 3.190114293885609e-05, "loss": 2.4636, "step": 207570 }, { "epoch": 0.36, "learning_rate": 3.190027099892926e-05, "loss": 2.4327, "step": 207580 }, { "epoch": 0.36, "learning_rate": 3.189939905900243e-05, "loss": 2.4612, "step": 207590 }, { "epoch": 0.36, "learning_rate": 3.189852711907561e-05, "loss": 2.3482, "step": 207600 }, { "epoch": 0.36, "learning_rate": 3.189765517914878e-05, "loss": 2.4998, "step": 207610 }, { "epoch": 0.36, "learning_rate": 3.189678323922195e-05, "loss": 2.3713, "step": 207620 }, { "epoch": 0.36, "learning_rate": 3.1895911299295125e-05, "loss": 2.4666, "step": 207630 }, { "epoch": 0.36, "learning_rate": 3.18950393593683e-05, "loss": 2.3717, "step": 207640 }, { "epoch": 0.36, "learning_rate": 3.189416741944147e-05, "loss": 2.3665, "step": 207650 }, { "epoch": 0.36, "learning_rate": 3.189329547951464e-05, "loss": 2.4269, "step": 207660 }, { "epoch": 0.36, "learning_rate": 3.189242353958782e-05, "loss": 2.3747, "step": 207670 }, { "epoch": 0.36, "learning_rate": 3.189155159966099e-05, "loss": 2.4152, "step": 207680 }, { "epoch": 0.36, "learning_rate": 3.189067965973416e-05, "loss": 2.4594, "step": 207690 }, { "epoch": 0.36, "learning_rate": 3.188980771980734e-05, "loss": 2.4218, "step": 207700 }, { "epoch": 0.36, "learning_rate": 3.1888935779880515e-05, "loss": 2.5022, "step": 207710 }, { "epoch": 0.36, "learning_rate": 3.1888063839953686e-05, "loss": 2.417, "step": 207720 }, { "epoch": 0.36, "learning_rate": 3.1887191900026856e-05, "loss": 2.3903, "step": 207730 }, { "epoch": 0.36, "learning_rate": 3.188631996010003e-05, "loss": 2.3784, "step": 207740 }, { "epoch": 0.36, "learning_rate": 3.1885448020173204e-05, "loss": 2.3511, "step": 207750 }, { "epoch": 0.36, "learning_rate": 3.1884576080246374e-05, "loss": 2.4279, "step": 207760 }, { "epoch": 0.36, "learning_rate": 3.188370414031955e-05, "loss": 2.4383, "step": 207770 }, { "epoch": 0.36, "learning_rate": 3.188283220039273e-05, "loss": 2.3437, "step": 207780 }, { "epoch": 0.36, "learning_rate": 3.18819602604659e-05, "loss": 2.3554, "step": 207790 }, { "epoch": 0.36, "learning_rate": 3.188108832053907e-05, "loss": 2.3576, "step": 207800 }, { "epoch": 0.36, "learning_rate": 3.1880216380612246e-05, "loss": 2.3858, "step": 207810 }, { "epoch": 0.36, "learning_rate": 3.187934444068542e-05, "loss": 2.4186, "step": 207820 }, { "epoch": 0.36, "learning_rate": 3.187847250075859e-05, "loss": 2.3685, "step": 207830 }, { "epoch": 0.36, "learning_rate": 3.187760056083176e-05, "loss": 2.324, "step": 207840 }, { "epoch": 0.36, "learning_rate": 3.1876728620904935e-05, "loss": 2.4002, "step": 207850 }, { "epoch": 0.36, "learning_rate": 3.187585668097811e-05, "loss": 2.3171, "step": 207860 }, { "epoch": 0.36, "learning_rate": 3.187498474105128e-05, "loss": 2.4421, "step": 207870 }, { "epoch": 0.36, "learning_rate": 3.187411280112446e-05, "loss": 2.3965, "step": 207880 }, { "epoch": 0.36, "learning_rate": 3.187324086119763e-05, "loss": 2.4362, "step": 207890 }, { "epoch": 0.36, "learning_rate": 3.18723689212708e-05, "loss": 2.4392, "step": 207900 }, { "epoch": 0.36, "learning_rate": 3.187149698134397e-05, "loss": 2.4564, "step": 207910 }, { "epoch": 0.36, "learning_rate": 3.187062504141715e-05, "loss": 2.4082, "step": 207920 }, { "epoch": 0.36, "learning_rate": 3.1869753101490325e-05, "loss": 2.2948, "step": 207930 }, { "epoch": 0.36, "learning_rate": 3.1868881161563495e-05, "loss": 2.349, "step": 207940 }, { "epoch": 0.36, "learning_rate": 3.1868009221636665e-05, "loss": 2.4873, "step": 207950 }, { "epoch": 0.36, "learning_rate": 3.186713728170984e-05, "loss": 2.4297, "step": 207960 }, { "epoch": 0.36, "learning_rate": 3.186626534178301e-05, "loss": 2.4357, "step": 207970 }, { "epoch": 0.36, "learning_rate": 3.1865393401856183e-05, "loss": 2.3501, "step": 207980 }, { "epoch": 0.36, "learning_rate": 3.186452146192936e-05, "loss": 2.4188, "step": 207990 }, { "epoch": 0.36, "learning_rate": 3.186364952200253e-05, "loss": 2.4635, "step": 208000 }, { "epoch": 0.36, "learning_rate": 3.186277758207571e-05, "loss": 2.3461, "step": 208010 }, { "epoch": 0.36, "learning_rate": 3.186190564214888e-05, "loss": 2.3222, "step": 208020 }, { "epoch": 0.36, "learning_rate": 3.1861033702222056e-05, "loss": 2.4247, "step": 208030 }, { "epoch": 0.36, "learning_rate": 3.1860161762295226e-05, "loss": 2.4515, "step": 208040 }, { "epoch": 0.36, "learning_rate": 3.1859289822368396e-05, "loss": 2.4169, "step": 208050 }, { "epoch": 0.36, "learning_rate": 3.1858417882441574e-05, "loss": 2.4565, "step": 208060 }, { "epoch": 0.36, "learning_rate": 3.1857545942514744e-05, "loss": 2.352, "step": 208070 }, { "epoch": 0.36, "learning_rate": 3.185667400258792e-05, "loss": 2.2751, "step": 208080 }, { "epoch": 0.36, "learning_rate": 3.185580206266109e-05, "loss": 2.4217, "step": 208090 }, { "epoch": 0.36, "learning_rate": 3.185493012273427e-05, "loss": 2.2913, "step": 208100 }, { "epoch": 0.36, "learning_rate": 3.185405818280744e-05, "loss": 2.4145, "step": 208110 }, { "epoch": 0.36, "learning_rate": 3.185318624288061e-05, "loss": 2.5038, "step": 208120 }, { "epoch": 0.36, "learning_rate": 3.1852314302953787e-05, "loss": 2.4875, "step": 208130 }, { "epoch": 0.36, "learning_rate": 3.185144236302696e-05, "loss": 2.3713, "step": 208140 }, { "epoch": 0.36, "learning_rate": 3.185057042310013e-05, "loss": 2.3854, "step": 208150 }, { "epoch": 0.36, "learning_rate": 3.1849698483173304e-05, "loss": 2.4602, "step": 208160 }, { "epoch": 0.36, "learning_rate": 3.184882654324648e-05, "loss": 2.3618, "step": 208170 }, { "epoch": 0.36, "learning_rate": 3.184795460331965e-05, "loss": 2.4308, "step": 208180 }, { "epoch": 0.36, "learning_rate": 3.184708266339282e-05, "loss": 2.4332, "step": 208190 }, { "epoch": 0.36, "learning_rate": 3.1846210723466e-05, "loss": 2.3763, "step": 208200 }, { "epoch": 0.36, "learning_rate": 3.184533878353917e-05, "loss": 2.4227, "step": 208210 }, { "epoch": 0.36, "learning_rate": 3.184446684361234e-05, "loss": 2.4029, "step": 208220 }, { "epoch": 0.36, "learning_rate": 3.184359490368552e-05, "loss": 2.4692, "step": 208230 }, { "epoch": 0.36, "learning_rate": 3.1842722963758695e-05, "loss": 2.4417, "step": 208240 }, { "epoch": 0.36, "learning_rate": 3.1841851023831865e-05, "loss": 2.5285, "step": 208250 }, { "epoch": 0.36, "learning_rate": 3.1840979083905035e-05, "loss": 2.4722, "step": 208260 }, { "epoch": 0.36, "learning_rate": 3.184010714397821e-05, "loss": 2.4754, "step": 208270 }, { "epoch": 0.36, "learning_rate": 3.183923520405138e-05, "loss": 2.2927, "step": 208280 }, { "epoch": 0.36, "learning_rate": 3.183836326412455e-05, "loss": 2.3897, "step": 208290 }, { "epoch": 0.36, "learning_rate": 3.1837491324197724e-05, "loss": 2.356, "step": 208300 }, { "epoch": 0.36, "learning_rate": 3.183661938427091e-05, "loss": 2.5083, "step": 208310 }, { "epoch": 0.36, "learning_rate": 3.183574744434408e-05, "loss": 2.4535, "step": 208320 }, { "epoch": 0.36, "learning_rate": 3.183487550441725e-05, "loss": 2.4361, "step": 208330 }, { "epoch": 0.36, "learning_rate": 3.1834003564490426e-05, "loss": 2.3735, "step": 208340 }, { "epoch": 0.36, "learning_rate": 3.1833131624563596e-05, "loss": 2.3053, "step": 208350 }, { "epoch": 0.36, "learning_rate": 3.1832259684636766e-05, "loss": 2.456, "step": 208360 }, { "epoch": 0.36, "learning_rate": 3.183138774470994e-05, "loss": 2.3746, "step": 208370 }, { "epoch": 0.36, "learning_rate": 3.183051580478312e-05, "loss": 2.5363, "step": 208380 }, { "epoch": 0.36, "learning_rate": 3.182964386485629e-05, "loss": 2.3822, "step": 208390 }, { "epoch": 0.36, "learning_rate": 3.182877192492946e-05, "loss": 2.3467, "step": 208400 }, { "epoch": 0.36, "learning_rate": 3.182789998500263e-05, "loss": 2.3276, "step": 208410 }, { "epoch": 0.36, "learning_rate": 3.182702804507581e-05, "loss": 2.3952, "step": 208420 }, { "epoch": 0.36, "learning_rate": 3.182615610514898e-05, "loss": 2.6023, "step": 208430 }, { "epoch": 0.36, "learning_rate": 3.182528416522215e-05, "loss": 2.4998, "step": 208440 }, { "epoch": 0.36, "learning_rate": 3.1824412225295334e-05, "loss": 2.3387, "step": 208450 }, { "epoch": 0.36, "learning_rate": 3.1823540285368504e-05, "loss": 2.4572, "step": 208460 }, { "epoch": 0.36, "learning_rate": 3.1822668345441674e-05, "loss": 2.5158, "step": 208470 }, { "epoch": 0.36, "learning_rate": 3.1821796405514845e-05, "loss": 2.5044, "step": 208480 }, { "epoch": 0.36, "learning_rate": 3.182092446558802e-05, "loss": 2.369, "step": 208490 }, { "epoch": 0.36, "learning_rate": 3.182005252566119e-05, "loss": 2.3162, "step": 208500 }, { "epoch": 0.36, "learning_rate": 3.181918058573436e-05, "loss": 2.4519, "step": 208510 }, { "epoch": 0.36, "learning_rate": 3.181830864580754e-05, "loss": 2.3627, "step": 208520 }, { "epoch": 0.36, "learning_rate": 3.181743670588072e-05, "loss": 2.4583, "step": 208530 }, { "epoch": 0.36, "learning_rate": 3.181656476595389e-05, "loss": 2.4502, "step": 208540 }, { "epoch": 0.36, "learning_rate": 3.181569282602706e-05, "loss": 2.3167, "step": 208550 }, { "epoch": 0.36, "learning_rate": 3.1814820886100235e-05, "loss": 2.3756, "step": 208560 }, { "epoch": 0.36, "learning_rate": 3.1813948946173405e-05, "loss": 2.3252, "step": 208570 }, { "epoch": 0.36, "learning_rate": 3.1813077006246576e-05, "loss": 2.3703, "step": 208580 }, { "epoch": 0.36, "learning_rate": 3.181220506631975e-05, "loss": 2.405, "step": 208590 }, { "epoch": 0.36, "learning_rate": 3.181133312639293e-05, "loss": 2.4488, "step": 208600 }, { "epoch": 0.36, "learning_rate": 3.18104611864661e-05, "loss": 2.4048, "step": 208610 }, { "epoch": 0.36, "learning_rate": 3.180958924653927e-05, "loss": 2.4943, "step": 208620 }, { "epoch": 0.36, "learning_rate": 3.180871730661245e-05, "loss": 2.3906, "step": 208630 }, { "epoch": 0.36, "learning_rate": 3.180784536668562e-05, "loss": 2.5032, "step": 208640 }, { "epoch": 0.36, "learning_rate": 3.180697342675879e-05, "loss": 2.4431, "step": 208650 }, { "epoch": 0.36, "learning_rate": 3.1806101486831966e-05, "loss": 2.4193, "step": 208660 }, { "epoch": 0.36, "learning_rate": 3.1805229546905136e-05, "loss": 2.3768, "step": 208670 }, { "epoch": 0.36, "learning_rate": 3.1804357606978313e-05, "loss": 2.4155, "step": 208680 }, { "epoch": 0.36, "learning_rate": 3.1803485667051484e-05, "loss": 2.4219, "step": 208690 }, { "epoch": 0.36, "learning_rate": 3.180261372712466e-05, "loss": 2.36, "step": 208700 }, { "epoch": 0.36, "learning_rate": 3.180174178719783e-05, "loss": 2.5088, "step": 208710 }, { "epoch": 0.36, "learning_rate": 3.1800869847271e-05, "loss": 2.3339, "step": 208720 }, { "epoch": 0.36, "learning_rate": 3.179999790734418e-05, "loss": 2.4089, "step": 208730 }, { "epoch": 0.36, "learning_rate": 3.179912596741735e-05, "loss": 2.3727, "step": 208740 }, { "epoch": 0.36, "learning_rate": 3.1798254027490526e-05, "loss": 2.3506, "step": 208750 }, { "epoch": 0.36, "learning_rate": 3.17973820875637e-05, "loss": 2.5363, "step": 208760 }, { "epoch": 0.36, "learning_rate": 3.1796510147636874e-05, "loss": 2.493, "step": 208770 }, { "epoch": 0.36, "learning_rate": 3.1795638207710044e-05, "loss": 2.3839, "step": 208780 }, { "epoch": 0.36, "learning_rate": 3.1794766267783215e-05, "loss": 2.435, "step": 208790 }, { "epoch": 0.36, "learning_rate": 3.1793894327856385e-05, "loss": 2.5456, "step": 208800 }, { "epoch": 0.36, "learning_rate": 3.179302238792956e-05, "loss": 2.4977, "step": 208810 }, { "epoch": 0.36, "learning_rate": 3.179215044800273e-05, "loss": 2.3438, "step": 208820 }, { "epoch": 0.36, "learning_rate": 3.179127850807591e-05, "loss": 2.4502, "step": 208830 }, { "epoch": 0.36, "learning_rate": 3.179040656814909e-05, "loss": 2.4388, "step": 208840 }, { "epoch": 0.36, "learning_rate": 3.178953462822226e-05, "loss": 2.4067, "step": 208850 }, { "epoch": 0.36, "learning_rate": 3.178866268829543e-05, "loss": 2.4531, "step": 208860 }, { "epoch": 0.36, "learning_rate": 3.17877907483686e-05, "loss": 2.4063, "step": 208870 }, { "epoch": 0.36, "learning_rate": 3.1786918808441775e-05, "loss": 2.5662, "step": 208880 }, { "epoch": 0.36, "learning_rate": 3.1786046868514946e-05, "loss": 2.4172, "step": 208890 }, { "epoch": 0.36, "learning_rate": 3.178517492858812e-05, "loss": 2.5452, "step": 208900 }, { "epoch": 0.36, "learning_rate": 3.178430298866129e-05, "loss": 2.4926, "step": 208910 }, { "epoch": 0.36, "learning_rate": 3.178343104873447e-05, "loss": 2.359, "step": 208920 }, { "epoch": 0.36, "learning_rate": 3.178255910880764e-05, "loss": 2.4385, "step": 208930 }, { "epoch": 0.36, "learning_rate": 3.178168716888081e-05, "loss": 2.4903, "step": 208940 }, { "epoch": 0.36, "learning_rate": 3.178081522895399e-05, "loss": 2.4118, "step": 208950 }, { "epoch": 0.36, "learning_rate": 3.177994328902716e-05, "loss": 2.3087, "step": 208960 }, { "epoch": 0.36, "learning_rate": 3.1779071349100336e-05, "loss": 2.4239, "step": 208970 }, { "epoch": 0.36, "learning_rate": 3.1778199409173506e-05, "loss": 2.4106, "step": 208980 }, { "epoch": 0.36, "learning_rate": 3.177732746924668e-05, "loss": 2.3433, "step": 208990 }, { "epoch": 0.36, "learning_rate": 3.1776455529319854e-05, "loss": 2.4176, "step": 209000 }, { "epoch": 0.36, "learning_rate": 3.1775583589393024e-05, "loss": 2.3983, "step": 209010 }, { "epoch": 0.36, "learning_rate": 3.17747116494662e-05, "loss": 2.3356, "step": 209020 }, { "epoch": 0.36, "learning_rate": 3.177383970953937e-05, "loss": 2.3982, "step": 209030 }, { "epoch": 0.36, "learning_rate": 3.177296776961254e-05, "loss": 2.4517, "step": 209040 }, { "epoch": 0.36, "learning_rate": 3.177209582968572e-05, "loss": 2.3662, "step": 209050 }, { "epoch": 0.36, "learning_rate": 3.1771223889758896e-05, "loss": 2.4179, "step": 209060 }, { "epoch": 0.36, "learning_rate": 3.177035194983207e-05, "loss": 2.479, "step": 209070 }, { "epoch": 0.36, "learning_rate": 3.176948000990524e-05, "loss": 2.4826, "step": 209080 }, { "epoch": 0.36, "learning_rate": 3.1768608069978414e-05, "loss": 2.4218, "step": 209090 }, { "epoch": 0.36, "learning_rate": 3.1767736130051585e-05, "loss": 2.3221, "step": 209100 }, { "epoch": 0.36, "learning_rate": 3.1766864190124755e-05, "loss": 2.4119, "step": 209110 }, { "epoch": 0.36, "learning_rate": 3.176599225019793e-05, "loss": 2.3331, "step": 209120 }, { "epoch": 0.36, "learning_rate": 3.176512031027111e-05, "loss": 2.3336, "step": 209130 }, { "epoch": 0.36, "learning_rate": 3.176424837034428e-05, "loss": 2.3611, "step": 209140 }, { "epoch": 0.36, "learning_rate": 3.176337643041745e-05, "loss": 2.4464, "step": 209150 }, { "epoch": 0.36, "learning_rate": 3.176250449049063e-05, "loss": 2.4598, "step": 209160 }, { "epoch": 0.36, "learning_rate": 3.17616325505638e-05, "loss": 2.3108, "step": 209170 }, { "epoch": 0.36, "learning_rate": 3.176076061063697e-05, "loss": 2.3687, "step": 209180 }, { "epoch": 0.36, "learning_rate": 3.175988867071014e-05, "loss": 2.356, "step": 209190 }, { "epoch": 0.36, "learning_rate": 3.175901673078332e-05, "loss": 2.4639, "step": 209200 }, { "epoch": 0.36, "learning_rate": 3.175814479085649e-05, "loss": 2.4506, "step": 209210 }, { "epoch": 0.36, "learning_rate": 3.175727285092966e-05, "loss": 2.4858, "step": 209220 }, { "epoch": 0.36, "learning_rate": 3.175640091100284e-05, "loss": 2.4125, "step": 209230 }, { "epoch": 0.36, "learning_rate": 3.175552897107601e-05, "loss": 2.2683, "step": 209240 }, { "epoch": 0.36, "learning_rate": 3.175465703114918e-05, "loss": 2.2369, "step": 209250 }, { "epoch": 0.36, "learning_rate": 3.175378509122235e-05, "loss": 2.3279, "step": 209260 }, { "epoch": 0.36, "learning_rate": 3.1752913151295535e-05, "loss": 2.3288, "step": 209270 }, { "epoch": 0.36, "learning_rate": 3.1752041211368706e-05, "loss": 2.4517, "step": 209280 }, { "epoch": 0.36, "learning_rate": 3.1751169271441876e-05, "loss": 2.3714, "step": 209290 }, { "epoch": 0.36, "learning_rate": 3.1750297331515047e-05, "loss": 2.5762, "step": 209300 }, { "epoch": 0.37, "learning_rate": 3.1749425391588224e-05, "loss": 2.4919, "step": 209310 }, { "epoch": 0.37, "learning_rate": 3.1748553451661394e-05, "loss": 2.4199, "step": 209320 }, { "epoch": 0.37, "learning_rate": 3.1747681511734564e-05, "loss": 2.4534, "step": 209330 }, { "epoch": 0.37, "learning_rate": 3.174680957180774e-05, "loss": 2.4759, "step": 209340 }, { "epoch": 0.37, "learning_rate": 3.174593763188092e-05, "loss": 2.3253, "step": 209350 }, { "epoch": 0.37, "learning_rate": 3.174506569195409e-05, "loss": 2.4087, "step": 209360 }, { "epoch": 0.37, "learning_rate": 3.174419375202726e-05, "loss": 2.3769, "step": 209370 }, { "epoch": 0.37, "learning_rate": 3.174332181210044e-05, "loss": 2.3713, "step": 209380 }, { "epoch": 0.37, "learning_rate": 3.174244987217361e-05, "loss": 2.3829, "step": 209390 }, { "epoch": 0.37, "learning_rate": 3.174157793224678e-05, "loss": 2.4045, "step": 209400 }, { "epoch": 0.37, "learning_rate": 3.1740705992319955e-05, "loss": 2.3756, "step": 209410 }, { "epoch": 0.37, "learning_rate": 3.173983405239313e-05, "loss": 2.3966, "step": 209420 }, { "epoch": 0.37, "learning_rate": 3.17389621124663e-05, "loss": 2.3064, "step": 209430 }, { "epoch": 0.37, "learning_rate": 3.173809017253947e-05, "loss": 2.4577, "step": 209440 }, { "epoch": 0.37, "learning_rate": 3.173721823261265e-05, "loss": 2.4971, "step": 209450 }, { "epoch": 0.37, "learning_rate": 3.173634629268582e-05, "loss": 2.5004, "step": 209460 }, { "epoch": 0.37, "learning_rate": 3.173547435275899e-05, "loss": 2.4046, "step": 209470 }, { "epoch": 0.37, "learning_rate": 3.173460241283217e-05, "loss": 2.4611, "step": 209480 }, { "epoch": 0.37, "learning_rate": 3.173373047290534e-05, "loss": 2.4755, "step": 209490 }, { "epoch": 0.37, "learning_rate": 3.1732858532978515e-05, "loss": 2.3244, "step": 209500 }, { "epoch": 0.37, "learning_rate": 3.1731986593051686e-05, "loss": 2.5185, "step": 209510 }, { "epoch": 0.37, "learning_rate": 3.173111465312486e-05, "loss": 2.3749, "step": 209520 }, { "epoch": 0.37, "learning_rate": 3.173024271319803e-05, "loss": 2.5028, "step": 209530 }, { "epoch": 0.37, "learning_rate": 3.1729370773271203e-05, "loss": 2.4214, "step": 209540 }, { "epoch": 0.37, "learning_rate": 3.172849883334438e-05, "loss": 2.4758, "step": 209550 }, { "epoch": 0.37, "learning_rate": 3.172762689341755e-05, "loss": 2.3752, "step": 209560 }, { "epoch": 0.37, "learning_rate": 3.172675495349073e-05, "loss": 2.5271, "step": 209570 }, { "epoch": 0.37, "learning_rate": 3.17258830135639e-05, "loss": 2.3663, "step": 209580 }, { "epoch": 0.37, "learning_rate": 3.1725011073637076e-05, "loss": 2.3205, "step": 209590 }, { "epoch": 0.37, "learning_rate": 3.1724139133710246e-05, "loss": 2.3869, "step": 209600 }, { "epoch": 0.37, "learning_rate": 3.1723267193783416e-05, "loss": 2.4078, "step": 209610 }, { "epoch": 0.37, "learning_rate": 3.1722395253856594e-05, "loss": 2.4796, "step": 209620 }, { "epoch": 0.37, "learning_rate": 3.1721523313929764e-05, "loss": 2.412, "step": 209630 }, { "epoch": 0.37, "learning_rate": 3.172065137400294e-05, "loss": 2.331, "step": 209640 }, { "epoch": 0.37, "learning_rate": 3.171977943407611e-05, "loss": 2.492, "step": 209650 }, { "epoch": 0.37, "learning_rate": 3.171890749414929e-05, "loss": 2.3668, "step": 209660 }, { "epoch": 0.37, "learning_rate": 3.171803555422246e-05, "loss": 2.4698, "step": 209670 }, { "epoch": 0.37, "learning_rate": 3.171716361429563e-05, "loss": 2.4714, "step": 209680 }, { "epoch": 0.37, "learning_rate": 3.1716291674368807e-05, "loss": 2.2913, "step": 209690 }, { "epoch": 0.37, "learning_rate": 3.171541973444198e-05, "loss": 2.381, "step": 209700 }, { "epoch": 0.37, "learning_rate": 3.171454779451515e-05, "loss": 2.3433, "step": 209710 }, { "epoch": 0.37, "learning_rate": 3.1713675854588325e-05, "loss": 2.4431, "step": 209720 }, { "epoch": 0.37, "learning_rate": 3.17128039146615e-05, "loss": 2.3564, "step": 209730 }, { "epoch": 0.37, "learning_rate": 3.171193197473467e-05, "loss": 2.4877, "step": 209740 }, { "epoch": 0.37, "learning_rate": 3.171106003480784e-05, "loss": 2.5378, "step": 209750 }, { "epoch": 0.37, "learning_rate": 3.171018809488101e-05, "loss": 2.4146, "step": 209760 }, { "epoch": 0.37, "learning_rate": 3.170931615495419e-05, "loss": 2.4483, "step": 209770 }, { "epoch": 0.37, "learning_rate": 3.170844421502736e-05, "loss": 2.331, "step": 209780 }, { "epoch": 0.37, "learning_rate": 3.170757227510054e-05, "loss": 2.3795, "step": 209790 }, { "epoch": 0.37, "learning_rate": 3.1706700335173715e-05, "loss": 2.4093, "step": 209800 }, { "epoch": 0.37, "learning_rate": 3.1705828395246885e-05, "loss": 2.331, "step": 209810 }, { "epoch": 0.37, "learning_rate": 3.1704956455320055e-05, "loss": 2.3769, "step": 209820 }, { "epoch": 0.37, "learning_rate": 3.1704084515393226e-05, "loss": 2.4692, "step": 209830 }, { "epoch": 0.37, "learning_rate": 3.17032125754664e-05, "loss": 2.4154, "step": 209840 }, { "epoch": 0.37, "learning_rate": 3.170234063553957e-05, "loss": 2.4244, "step": 209850 }, { "epoch": 0.37, "learning_rate": 3.1701468695612744e-05, "loss": 2.431, "step": 209860 }, { "epoch": 0.37, "learning_rate": 3.170059675568592e-05, "loss": 2.5301, "step": 209870 }, { "epoch": 0.37, "learning_rate": 3.16997248157591e-05, "loss": 2.5213, "step": 209880 }, { "epoch": 0.37, "learning_rate": 3.169885287583227e-05, "loss": 2.3757, "step": 209890 }, { "epoch": 0.37, "learning_rate": 3.169798093590544e-05, "loss": 2.2731, "step": 209900 }, { "epoch": 0.37, "learning_rate": 3.1697108995978616e-05, "loss": 2.3664, "step": 209910 }, { "epoch": 0.37, "learning_rate": 3.1696237056051786e-05, "loss": 2.4555, "step": 209920 }, { "epoch": 0.37, "learning_rate": 3.169536511612496e-05, "loss": 2.3027, "step": 209930 }, { "epoch": 0.37, "learning_rate": 3.1694493176198134e-05, "loss": 2.3742, "step": 209940 }, { "epoch": 0.37, "learning_rate": 3.169362123627131e-05, "loss": 2.377, "step": 209950 }, { "epoch": 0.37, "learning_rate": 3.169274929634448e-05, "loss": 2.3923, "step": 209960 }, { "epoch": 0.37, "learning_rate": 3.169187735641765e-05, "loss": 2.3354, "step": 209970 }, { "epoch": 0.37, "learning_rate": 3.169100541649083e-05, "loss": 2.391, "step": 209980 }, { "epoch": 0.37, "learning_rate": 3.1690133476564e-05, "loss": 2.5144, "step": 209990 }, { "epoch": 0.37, "learning_rate": 3.168926153663717e-05, "loss": 2.3314, "step": 210000 }, { "epoch": 0.37, "learning_rate": 3.168838959671035e-05, "loss": 2.4694, "step": 210010 }, { "epoch": 0.37, "learning_rate": 3.1687517656783524e-05, "loss": 2.423, "step": 210020 }, { "epoch": 0.37, "learning_rate": 3.1686645716856694e-05, "loss": 2.5076, "step": 210030 }, { "epoch": 0.37, "learning_rate": 3.1685773776929865e-05, "loss": 2.4191, "step": 210040 }, { "epoch": 0.37, "learning_rate": 3.168490183700304e-05, "loss": 2.3309, "step": 210050 }, { "epoch": 0.37, "learning_rate": 3.168402989707621e-05, "loss": 2.5923, "step": 210060 }, { "epoch": 0.37, "learning_rate": 3.168315795714938e-05, "loss": 2.3605, "step": 210070 }, { "epoch": 0.37, "learning_rate": 3.168228601722256e-05, "loss": 2.3292, "step": 210080 }, { "epoch": 0.37, "learning_rate": 3.168141407729574e-05, "loss": 2.4949, "step": 210090 }, { "epoch": 0.37, "learning_rate": 3.168054213736891e-05, "loss": 2.4377, "step": 210100 }, { "epoch": 0.37, "learning_rate": 3.167967019744208e-05, "loss": 2.4585, "step": 210110 }, { "epoch": 0.37, "learning_rate": 3.1678798257515255e-05, "loss": 2.3974, "step": 210120 }, { "epoch": 0.37, "learning_rate": 3.1677926317588425e-05, "loss": 2.4007, "step": 210130 }, { "epoch": 0.37, "learning_rate": 3.1677054377661596e-05, "loss": 2.3877, "step": 210140 }, { "epoch": 0.37, "learning_rate": 3.1676182437734766e-05, "loss": 2.4468, "step": 210150 }, { "epoch": 0.37, "learning_rate": 3.167531049780794e-05, "loss": 2.4419, "step": 210160 }, { "epoch": 0.37, "learning_rate": 3.167443855788112e-05, "loss": 2.5096, "step": 210170 }, { "epoch": 0.37, "learning_rate": 3.167356661795429e-05, "loss": 2.4113, "step": 210180 }, { "epoch": 0.37, "learning_rate": 3.167269467802747e-05, "loss": 2.3679, "step": 210190 }, { "epoch": 0.37, "learning_rate": 3.167182273810064e-05, "loss": 2.2662, "step": 210200 }, { "epoch": 0.37, "learning_rate": 3.167095079817381e-05, "loss": 2.3866, "step": 210210 }, { "epoch": 0.37, "learning_rate": 3.167007885824698e-05, "loss": 2.415, "step": 210220 }, { "epoch": 0.37, "learning_rate": 3.1669206918320156e-05, "loss": 2.522, "step": 210230 }, { "epoch": 0.37, "learning_rate": 3.1668334978393333e-05, "loss": 2.4889, "step": 210240 }, { "epoch": 0.37, "learning_rate": 3.1667463038466504e-05, "loss": 2.4518, "step": 210250 }, { "epoch": 0.37, "learning_rate": 3.1666591098539674e-05, "loss": 2.5101, "step": 210260 }, { "epoch": 0.37, "learning_rate": 3.166571915861285e-05, "loss": 2.3304, "step": 210270 }, { "epoch": 0.37, "learning_rate": 3.166484721868602e-05, "loss": 2.4084, "step": 210280 }, { "epoch": 0.37, "learning_rate": 3.166397527875919e-05, "loss": 2.4133, "step": 210290 }, { "epoch": 0.37, "learning_rate": 3.166310333883237e-05, "loss": 2.3198, "step": 210300 }, { "epoch": 0.37, "learning_rate": 3.1662231398905546e-05, "loss": 2.3881, "step": 210310 }, { "epoch": 0.37, "learning_rate": 3.166135945897872e-05, "loss": 2.4682, "step": 210320 }, { "epoch": 0.37, "learning_rate": 3.166048751905189e-05, "loss": 2.3575, "step": 210330 }, { "epoch": 0.37, "learning_rate": 3.1659615579125064e-05, "loss": 2.2665, "step": 210340 }, { "epoch": 0.37, "learning_rate": 3.1658743639198235e-05, "loss": 2.3873, "step": 210350 }, { "epoch": 0.37, "learning_rate": 3.1657871699271405e-05, "loss": 2.3866, "step": 210360 }, { "epoch": 0.37, "learning_rate": 3.165699975934458e-05, "loss": 2.49, "step": 210370 }, { "epoch": 0.37, "learning_rate": 3.165612781941775e-05, "loss": 2.389, "step": 210380 }, { "epoch": 0.37, "learning_rate": 3.165525587949093e-05, "loss": 2.5185, "step": 210390 }, { "epoch": 0.37, "learning_rate": 3.16543839395641e-05, "loss": 2.4239, "step": 210400 }, { "epoch": 0.37, "learning_rate": 3.165351199963728e-05, "loss": 2.3982, "step": 210410 }, { "epoch": 0.37, "learning_rate": 3.165264005971045e-05, "loss": 2.4586, "step": 210420 }, { "epoch": 0.37, "learning_rate": 3.165176811978362e-05, "loss": 2.5157, "step": 210430 }, { "epoch": 0.37, "learning_rate": 3.1650896179856795e-05, "loss": 2.4134, "step": 210440 }, { "epoch": 0.37, "learning_rate": 3.1650024239929966e-05, "loss": 2.475, "step": 210450 }, { "epoch": 0.37, "learning_rate": 3.164915230000314e-05, "loss": 2.4684, "step": 210460 }, { "epoch": 0.37, "learning_rate": 3.164828036007631e-05, "loss": 2.5609, "step": 210470 }, { "epoch": 0.37, "learning_rate": 3.164740842014949e-05, "loss": 2.3646, "step": 210480 }, { "epoch": 0.37, "learning_rate": 3.164653648022266e-05, "loss": 2.513, "step": 210490 }, { "epoch": 0.37, "learning_rate": 3.164566454029583e-05, "loss": 2.4102, "step": 210500 }, { "epoch": 0.37, "learning_rate": 3.164479260036901e-05, "loss": 2.4664, "step": 210510 }, { "epoch": 0.37, "learning_rate": 3.164392066044218e-05, "loss": 2.4097, "step": 210520 }, { "epoch": 0.37, "learning_rate": 3.164304872051535e-05, "loss": 2.3823, "step": 210530 }, { "epoch": 0.37, "learning_rate": 3.1642176780588526e-05, "loss": 2.3175, "step": 210540 }, { "epoch": 0.37, "learning_rate": 3.16413048406617e-05, "loss": 2.4211, "step": 210550 }, { "epoch": 0.37, "learning_rate": 3.1640432900734874e-05, "loss": 2.3822, "step": 210560 }, { "epoch": 0.37, "learning_rate": 3.1639560960808044e-05, "loss": 2.3114, "step": 210570 }, { "epoch": 0.37, "learning_rate": 3.163868902088122e-05, "loss": 2.4123, "step": 210580 }, { "epoch": 0.37, "learning_rate": 3.163781708095439e-05, "loss": 2.4888, "step": 210590 }, { "epoch": 0.37, "learning_rate": 3.163694514102756e-05, "loss": 2.4468, "step": 210600 }, { "epoch": 0.37, "learning_rate": 3.163607320110074e-05, "loss": 2.42, "step": 210610 }, { "epoch": 0.37, "learning_rate": 3.1635201261173916e-05, "loss": 2.4802, "step": 210620 }, { "epoch": 0.37, "learning_rate": 3.163432932124709e-05, "loss": 2.4069, "step": 210630 }, { "epoch": 0.37, "learning_rate": 3.163345738132026e-05, "loss": 2.4512, "step": 210640 }, { "epoch": 0.37, "learning_rate": 3.163258544139343e-05, "loss": 2.4557, "step": 210650 }, { "epoch": 0.37, "learning_rate": 3.1631713501466605e-05, "loss": 2.248, "step": 210660 }, { "epoch": 0.37, "learning_rate": 3.1630841561539775e-05, "loss": 2.4948, "step": 210670 }, { "epoch": 0.37, "learning_rate": 3.1629969621612945e-05, "loss": 2.283, "step": 210680 }, { "epoch": 0.37, "learning_rate": 3.162909768168613e-05, "loss": 2.4146, "step": 210690 }, { "epoch": 0.37, "learning_rate": 3.16282257417593e-05, "loss": 2.5003, "step": 210700 }, { "epoch": 0.37, "learning_rate": 3.162735380183247e-05, "loss": 2.3931, "step": 210710 }, { "epoch": 0.37, "learning_rate": 3.162648186190564e-05, "loss": 2.352, "step": 210720 }, { "epoch": 0.37, "learning_rate": 3.162560992197882e-05, "loss": 2.3794, "step": 210730 }, { "epoch": 0.37, "learning_rate": 3.162473798205199e-05, "loss": 2.3687, "step": 210740 }, { "epoch": 0.37, "learning_rate": 3.162386604212516e-05, "loss": 2.4427, "step": 210750 }, { "epoch": 0.37, "learning_rate": 3.1622994102198336e-05, "loss": 2.4689, "step": 210760 }, { "epoch": 0.37, "learning_rate": 3.162212216227151e-05, "loss": 2.3997, "step": 210770 }, { "epoch": 0.37, "learning_rate": 3.162125022234468e-05, "loss": 2.408, "step": 210780 }, { "epoch": 0.37, "learning_rate": 3.1620378282417854e-05, "loss": 2.4727, "step": 210790 }, { "epoch": 0.37, "learning_rate": 3.161950634249103e-05, "loss": 2.3476, "step": 210800 }, { "epoch": 0.37, "learning_rate": 3.16186344025642e-05, "loss": 2.5546, "step": 210810 }, { "epoch": 0.37, "learning_rate": 3.161776246263737e-05, "loss": 2.4558, "step": 210820 }, { "epoch": 0.37, "learning_rate": 3.161689052271055e-05, "loss": 2.2174, "step": 210830 }, { "epoch": 0.37, "learning_rate": 3.1616018582783726e-05, "loss": 2.4562, "step": 210840 }, { "epoch": 0.37, "learning_rate": 3.1615146642856896e-05, "loss": 2.3438, "step": 210850 }, { "epoch": 0.37, "learning_rate": 3.1614274702930067e-05, "loss": 2.4528, "step": 210860 }, { "epoch": 0.37, "learning_rate": 3.1613402763003244e-05, "loss": 2.3562, "step": 210870 }, { "epoch": 0.37, "learning_rate": 3.1612530823076414e-05, "loss": 2.3051, "step": 210880 }, { "epoch": 0.37, "learning_rate": 3.1611658883149584e-05, "loss": 2.3295, "step": 210890 }, { "epoch": 0.37, "learning_rate": 3.161078694322276e-05, "loss": 2.4211, "step": 210900 }, { "epoch": 0.37, "learning_rate": 3.160991500329594e-05, "loss": 2.4998, "step": 210910 }, { "epoch": 0.37, "learning_rate": 3.160904306336911e-05, "loss": 2.3776, "step": 210920 }, { "epoch": 0.37, "learning_rate": 3.160817112344228e-05, "loss": 2.3729, "step": 210930 }, { "epoch": 0.37, "learning_rate": 3.160729918351546e-05, "loss": 2.3473, "step": 210940 }, { "epoch": 0.37, "learning_rate": 3.160642724358863e-05, "loss": 2.4563, "step": 210950 }, { "epoch": 0.37, "learning_rate": 3.16055553036618e-05, "loss": 2.4091, "step": 210960 }, { "epoch": 0.37, "learning_rate": 3.1604683363734975e-05, "loss": 2.4401, "step": 210970 }, { "epoch": 0.37, "learning_rate": 3.160381142380815e-05, "loss": 2.3963, "step": 210980 }, { "epoch": 0.37, "learning_rate": 3.160293948388132e-05, "loss": 2.4289, "step": 210990 }, { "epoch": 0.37, "learning_rate": 3.160206754395449e-05, "loss": 2.4774, "step": 211000 }, { "epoch": 0.37, "learning_rate": 3.160119560402767e-05, "loss": 2.3187, "step": 211010 }, { "epoch": 0.37, "learning_rate": 3.160032366410084e-05, "loss": 2.453, "step": 211020 }, { "epoch": 0.37, "learning_rate": 3.159945172417401e-05, "loss": 2.3286, "step": 211030 }, { "epoch": 0.37, "learning_rate": 3.159857978424719e-05, "loss": 2.4094, "step": 211040 }, { "epoch": 0.37, "learning_rate": 3.159770784432036e-05, "loss": 2.3485, "step": 211050 }, { "epoch": 0.37, "learning_rate": 3.1596835904393535e-05, "loss": 2.3804, "step": 211060 }, { "epoch": 0.37, "learning_rate": 3.1595963964466706e-05, "loss": 2.5039, "step": 211070 }, { "epoch": 0.37, "learning_rate": 3.159509202453988e-05, "loss": 2.4522, "step": 211080 }, { "epoch": 0.37, "learning_rate": 3.159422008461305e-05, "loss": 2.4529, "step": 211090 }, { "epoch": 0.37, "learning_rate": 3.1593348144686223e-05, "loss": 2.5001, "step": 211100 }, { "epoch": 0.37, "learning_rate": 3.1592476204759394e-05, "loss": 2.3556, "step": 211110 }, { "epoch": 0.37, "learning_rate": 3.159160426483257e-05, "loss": 2.4933, "step": 211120 }, { "epoch": 0.37, "learning_rate": 3.159073232490575e-05, "loss": 2.3778, "step": 211130 }, { "epoch": 0.37, "learning_rate": 3.158986038497892e-05, "loss": 2.5327, "step": 211140 }, { "epoch": 0.37, "learning_rate": 3.1588988445052096e-05, "loss": 2.3995, "step": 211150 }, { "epoch": 0.37, "learning_rate": 3.1588116505125266e-05, "loss": 2.4711, "step": 211160 }, { "epoch": 0.37, "learning_rate": 3.1587244565198436e-05, "loss": 2.4397, "step": 211170 }, { "epoch": 0.37, "learning_rate": 3.158637262527161e-05, "loss": 2.4429, "step": 211180 }, { "epoch": 0.37, "learning_rate": 3.1585500685344784e-05, "loss": 2.3577, "step": 211190 }, { "epoch": 0.37, "learning_rate": 3.1584628745417954e-05, "loss": 2.4634, "step": 211200 }, { "epoch": 0.37, "learning_rate": 3.158375680549113e-05, "loss": 2.4046, "step": 211210 }, { "epoch": 0.37, "learning_rate": 3.15828848655643e-05, "loss": 2.3966, "step": 211220 }, { "epoch": 0.37, "learning_rate": 3.158201292563748e-05, "loss": 2.4445, "step": 211230 }, { "epoch": 0.37, "learning_rate": 3.158114098571065e-05, "loss": 2.3401, "step": 211240 }, { "epoch": 0.37, "learning_rate": 3.158026904578382e-05, "loss": 2.4866, "step": 211250 }, { "epoch": 0.37, "learning_rate": 3.1579397105857e-05, "loss": 2.415, "step": 211260 }, { "epoch": 0.37, "learning_rate": 3.157852516593017e-05, "loss": 2.2678, "step": 211270 }, { "epoch": 0.37, "learning_rate": 3.1577653226003345e-05, "loss": 2.4289, "step": 211280 }, { "epoch": 0.37, "learning_rate": 3.1576781286076515e-05, "loss": 2.3775, "step": 211290 }, { "epoch": 0.37, "learning_rate": 3.157590934614969e-05, "loss": 2.3748, "step": 211300 }, { "epoch": 0.37, "learning_rate": 3.157503740622286e-05, "loss": 2.3847, "step": 211310 }, { "epoch": 0.37, "learning_rate": 3.157416546629603e-05, "loss": 2.3587, "step": 211320 }, { "epoch": 0.37, "learning_rate": 3.157329352636921e-05, "loss": 2.4281, "step": 211330 }, { "epoch": 0.37, "learning_rate": 3.157242158644238e-05, "loss": 2.4313, "step": 211340 }, { "epoch": 0.37, "learning_rate": 3.157154964651555e-05, "loss": 2.4482, "step": 211350 }, { "epoch": 0.37, "learning_rate": 3.157067770658873e-05, "loss": 2.2841, "step": 211360 }, { "epoch": 0.37, "learning_rate": 3.1569805766661905e-05, "loss": 2.578, "step": 211370 }, { "epoch": 0.37, "learning_rate": 3.1568933826735075e-05, "loss": 2.3901, "step": 211380 }, { "epoch": 0.37, "learning_rate": 3.1568061886808246e-05, "loss": 2.4288, "step": 211390 }, { "epoch": 0.37, "learning_rate": 3.156718994688142e-05, "loss": 2.2802, "step": 211400 }, { "epoch": 0.37, "learning_rate": 3.156631800695459e-05, "loss": 2.4544, "step": 211410 }, { "epoch": 0.37, "learning_rate": 3.1565446067027764e-05, "loss": 2.312, "step": 211420 }, { "epoch": 0.37, "learning_rate": 3.156457412710094e-05, "loss": 2.395, "step": 211430 }, { "epoch": 0.37, "learning_rate": 3.156370218717412e-05, "loss": 2.479, "step": 211440 }, { "epoch": 0.37, "learning_rate": 3.156283024724729e-05, "loss": 2.5405, "step": 211450 }, { "epoch": 0.37, "learning_rate": 3.156195830732046e-05, "loss": 2.3803, "step": 211460 }, { "epoch": 0.37, "learning_rate": 3.1561086367393636e-05, "loss": 2.4159, "step": 211470 }, { "epoch": 0.37, "learning_rate": 3.1560214427466806e-05, "loss": 2.4502, "step": 211480 }, { "epoch": 0.37, "learning_rate": 3.155934248753998e-05, "loss": 2.4452, "step": 211490 }, { "epoch": 0.37, "learning_rate": 3.1558470547613154e-05, "loss": 2.349, "step": 211500 }, { "epoch": 0.37, "learning_rate": 3.155759860768633e-05, "loss": 2.4145, "step": 211510 }, { "epoch": 0.37, "learning_rate": 3.15567266677595e-05, "loss": 2.2856, "step": 211520 }, { "epoch": 0.37, "learning_rate": 3.155585472783267e-05, "loss": 2.3872, "step": 211530 }, { "epoch": 0.37, "learning_rate": 3.155498278790585e-05, "loss": 2.409, "step": 211540 }, { "epoch": 0.37, "learning_rate": 3.155411084797902e-05, "loss": 2.4892, "step": 211550 }, { "epoch": 0.37, "learning_rate": 3.155323890805219e-05, "loss": 2.3375, "step": 211560 }, { "epoch": 0.37, "learning_rate": 3.155236696812536e-05, "loss": 2.3064, "step": 211570 }, { "epoch": 0.37, "learning_rate": 3.1551495028198544e-05, "loss": 2.3752, "step": 211580 }, { "epoch": 0.37, "learning_rate": 3.1550623088271714e-05, "loss": 2.444, "step": 211590 }, { "epoch": 0.37, "learning_rate": 3.1549751148344885e-05, "loss": 2.3603, "step": 211600 }, { "epoch": 0.37, "learning_rate": 3.1548879208418055e-05, "loss": 2.368, "step": 211610 }, { "epoch": 0.37, "learning_rate": 3.154800726849123e-05, "loss": 2.4911, "step": 211620 }, { "epoch": 0.37, "learning_rate": 3.15471353285644e-05, "loss": 2.4093, "step": 211630 }, { "epoch": 0.37, "learning_rate": 3.154626338863757e-05, "loss": 2.4095, "step": 211640 }, { "epoch": 0.37, "learning_rate": 3.154539144871076e-05, "loss": 2.2348, "step": 211650 }, { "epoch": 0.37, "learning_rate": 3.154451950878393e-05, "loss": 2.422, "step": 211660 }, { "epoch": 0.37, "learning_rate": 3.15436475688571e-05, "loss": 2.4846, "step": 211670 }, { "epoch": 0.37, "learning_rate": 3.154277562893027e-05, "loss": 2.4548, "step": 211680 }, { "epoch": 0.37, "learning_rate": 3.1541903689003445e-05, "loss": 2.4273, "step": 211690 }, { "epoch": 0.37, "learning_rate": 3.1541031749076616e-05, "loss": 2.5392, "step": 211700 }, { "epoch": 0.37, "learning_rate": 3.1540159809149786e-05, "loss": 2.3986, "step": 211710 }, { "epoch": 0.37, "learning_rate": 3.153928786922296e-05, "loss": 2.5153, "step": 211720 }, { "epoch": 0.37, "learning_rate": 3.153841592929614e-05, "loss": 2.3819, "step": 211730 }, { "epoch": 0.37, "learning_rate": 3.153754398936931e-05, "loss": 2.4925, "step": 211740 }, { "epoch": 0.37, "learning_rate": 3.153667204944248e-05, "loss": 2.5186, "step": 211750 }, { "epoch": 0.37, "learning_rate": 3.153580010951566e-05, "loss": 2.3608, "step": 211760 }, { "epoch": 0.37, "learning_rate": 3.153492816958883e-05, "loss": 2.3266, "step": 211770 }, { "epoch": 0.37, "learning_rate": 3.1534056229662e-05, "loss": 2.3794, "step": 211780 }, { "epoch": 0.37, "learning_rate": 3.1533184289735176e-05, "loss": 2.4694, "step": 211790 }, { "epoch": 0.37, "learning_rate": 3.1532312349808353e-05, "loss": 2.3865, "step": 211800 }, { "epoch": 0.37, "learning_rate": 3.1531440409881524e-05, "loss": 2.349, "step": 211810 }, { "epoch": 0.37, "learning_rate": 3.1530568469954694e-05, "loss": 2.4814, "step": 211820 }, { "epoch": 0.37, "learning_rate": 3.152969653002787e-05, "loss": 2.3826, "step": 211830 }, { "epoch": 0.37, "learning_rate": 3.152882459010104e-05, "loss": 2.3809, "step": 211840 }, { "epoch": 0.37, "learning_rate": 3.152795265017421e-05, "loss": 2.3144, "step": 211850 }, { "epoch": 0.37, "learning_rate": 3.152708071024739e-05, "loss": 2.3981, "step": 211860 }, { "epoch": 0.37, "learning_rate": 3.152620877032056e-05, "loss": 2.4496, "step": 211870 }, { "epoch": 0.37, "learning_rate": 3.152533683039374e-05, "loss": 2.4168, "step": 211880 }, { "epoch": 0.37, "learning_rate": 3.152446489046691e-05, "loss": 2.3311, "step": 211890 }, { "epoch": 0.37, "learning_rate": 3.1523592950540084e-05, "loss": 2.302, "step": 211900 }, { "epoch": 0.37, "learning_rate": 3.1522721010613255e-05, "loss": 2.3416, "step": 211910 }, { "epoch": 0.37, "learning_rate": 3.1521849070686425e-05, "loss": 2.3936, "step": 211920 }, { "epoch": 0.37, "learning_rate": 3.15209771307596e-05, "loss": 2.4449, "step": 211930 }, { "epoch": 0.37, "learning_rate": 3.152010519083277e-05, "loss": 2.4575, "step": 211940 }, { "epoch": 0.37, "learning_rate": 3.151923325090595e-05, "loss": 2.3706, "step": 211950 }, { "epoch": 0.37, "learning_rate": 3.151836131097912e-05, "loss": 2.4281, "step": 211960 }, { "epoch": 0.37, "learning_rate": 3.15174893710523e-05, "loss": 2.3249, "step": 211970 }, { "epoch": 0.37, "learning_rate": 3.151661743112547e-05, "loss": 2.2819, "step": 211980 }, { "epoch": 0.37, "learning_rate": 3.151574549119864e-05, "loss": 2.5215, "step": 211990 }, { "epoch": 0.37, "learning_rate": 3.151487355127181e-05, "loss": 2.4359, "step": 212000 }, { "epoch": 0.37, "learning_rate": 3.1514001611344986e-05, "loss": 2.527, "step": 212010 }, { "epoch": 0.37, "learning_rate": 3.1513129671418156e-05, "loss": 2.3518, "step": 212020 }, { "epoch": 0.37, "learning_rate": 3.151225773149133e-05, "loss": 2.321, "step": 212030 }, { "epoch": 0.37, "learning_rate": 3.151138579156451e-05, "loss": 2.3774, "step": 212040 }, { "epoch": 0.37, "learning_rate": 3.151051385163768e-05, "loss": 2.5002, "step": 212050 }, { "epoch": 0.37, "learning_rate": 3.150964191171085e-05, "loss": 2.2998, "step": 212060 }, { "epoch": 0.37, "learning_rate": 3.150876997178402e-05, "loss": 2.3234, "step": 212070 }, { "epoch": 0.37, "learning_rate": 3.15078980318572e-05, "loss": 2.4301, "step": 212080 }, { "epoch": 0.37, "learning_rate": 3.150702609193037e-05, "loss": 2.3836, "step": 212090 }, { "epoch": 0.37, "learning_rate": 3.1506154152003546e-05, "loss": 2.2711, "step": 212100 }, { "epoch": 0.37, "learning_rate": 3.1505282212076717e-05, "loss": 2.3964, "step": 212110 }, { "epoch": 0.37, "learning_rate": 3.1504410272149894e-05, "loss": 2.5385, "step": 212120 }, { "epoch": 0.37, "learning_rate": 3.1503538332223064e-05, "loss": 2.4481, "step": 212130 }, { "epoch": 0.37, "learning_rate": 3.1502666392296235e-05, "loss": 2.4381, "step": 212140 }, { "epoch": 0.37, "learning_rate": 3.150179445236941e-05, "loss": 2.3555, "step": 212150 }, { "epoch": 0.37, "learning_rate": 3.150092251244258e-05, "loss": 2.4613, "step": 212160 }, { "epoch": 0.37, "learning_rate": 3.150005057251576e-05, "loss": 2.3274, "step": 212170 }, { "epoch": 0.37, "learning_rate": 3.149917863258893e-05, "loss": 2.5112, "step": 212180 }, { "epoch": 0.37, "learning_rate": 3.149830669266211e-05, "loss": 2.4744, "step": 212190 }, { "epoch": 0.37, "learning_rate": 3.149743475273528e-05, "loss": 2.4683, "step": 212200 }, { "epoch": 0.37, "learning_rate": 3.149656281280845e-05, "loss": 2.3427, "step": 212210 }, { "epoch": 0.37, "learning_rate": 3.1495690872881625e-05, "loss": 2.2921, "step": 212220 }, { "epoch": 0.37, "learning_rate": 3.1494818932954795e-05, "loss": 2.3814, "step": 212230 }, { "epoch": 0.37, "learning_rate": 3.1493946993027965e-05, "loss": 2.3593, "step": 212240 }, { "epoch": 0.37, "learning_rate": 3.149307505310114e-05, "loss": 2.3163, "step": 212250 }, { "epoch": 0.37, "learning_rate": 3.149220311317432e-05, "loss": 2.4756, "step": 212260 }, { "epoch": 0.37, "learning_rate": 3.149133117324749e-05, "loss": 2.4133, "step": 212270 }, { "epoch": 0.37, "learning_rate": 3.149045923332066e-05, "loss": 2.4069, "step": 212280 }, { "epoch": 0.37, "learning_rate": 3.148958729339384e-05, "loss": 2.4374, "step": 212290 }, { "epoch": 0.37, "learning_rate": 3.148871535346701e-05, "loss": 2.4058, "step": 212300 }, { "epoch": 0.37, "learning_rate": 3.148784341354018e-05, "loss": 2.4451, "step": 212310 }, { "epoch": 0.37, "learning_rate": 3.1486971473613356e-05, "loss": 2.4724, "step": 212320 }, { "epoch": 0.37, "learning_rate": 3.148609953368653e-05, "loss": 2.4148, "step": 212330 }, { "epoch": 0.37, "learning_rate": 3.14852275937597e-05, "loss": 2.3622, "step": 212340 }, { "epoch": 0.37, "learning_rate": 3.1484355653832874e-05, "loss": 2.2931, "step": 212350 }, { "epoch": 0.37, "learning_rate": 3.148348371390605e-05, "loss": 2.505, "step": 212360 }, { "epoch": 0.37, "learning_rate": 3.148261177397922e-05, "loss": 2.4683, "step": 212370 }, { "epoch": 0.37, "learning_rate": 3.148173983405239e-05, "loss": 2.3398, "step": 212380 }, { "epoch": 0.37, "learning_rate": 3.148086789412557e-05, "loss": 2.4735, "step": 212390 }, { "epoch": 0.37, "learning_rate": 3.1479995954198746e-05, "loss": 2.4378, "step": 212400 }, { "epoch": 0.37, "learning_rate": 3.1479124014271916e-05, "loss": 2.402, "step": 212410 }, { "epoch": 0.37, "learning_rate": 3.1478252074345087e-05, "loss": 2.4017, "step": 212420 }, { "epoch": 0.37, "learning_rate": 3.1477380134418264e-05, "loss": 2.4058, "step": 212430 }, { "epoch": 0.37, "learning_rate": 3.1476508194491434e-05, "loss": 2.3798, "step": 212440 }, { "epoch": 0.37, "learning_rate": 3.1475636254564604e-05, "loss": 2.4111, "step": 212450 }, { "epoch": 0.37, "learning_rate": 3.1474764314637775e-05, "loss": 2.2709, "step": 212460 }, { "epoch": 0.37, "learning_rate": 3.147389237471096e-05, "loss": 2.3721, "step": 212470 }, { "epoch": 0.37, "learning_rate": 3.147302043478413e-05, "loss": 2.3424, "step": 212480 }, { "epoch": 0.37, "learning_rate": 3.14721484948573e-05, "loss": 2.4382, "step": 212490 }, { "epoch": 0.37, "learning_rate": 3.147127655493048e-05, "loss": 2.3654, "step": 212500 }, { "epoch": 0.37, "learning_rate": 3.147040461500365e-05, "loss": 2.3275, "step": 212510 }, { "epoch": 0.37, "learning_rate": 3.146953267507682e-05, "loss": 2.3819, "step": 212520 }, { "epoch": 0.37, "learning_rate": 3.146866073514999e-05, "loss": 2.2925, "step": 212530 }, { "epoch": 0.37, "learning_rate": 3.1467788795223165e-05, "loss": 2.4558, "step": 212540 }, { "epoch": 0.37, "learning_rate": 3.146691685529634e-05, "loss": 2.4475, "step": 212550 }, { "epoch": 0.37, "learning_rate": 3.146604491536951e-05, "loss": 2.4064, "step": 212560 }, { "epoch": 0.37, "learning_rate": 3.146517297544268e-05, "loss": 2.4832, "step": 212570 }, { "epoch": 0.37, "learning_rate": 3.146430103551586e-05, "loss": 2.443, "step": 212580 }, { "epoch": 0.37, "learning_rate": 3.146342909558903e-05, "loss": 2.3341, "step": 212590 }, { "epoch": 0.37, "learning_rate": 3.14625571556622e-05, "loss": 2.4504, "step": 212600 }, { "epoch": 0.37, "learning_rate": 3.146168521573538e-05, "loss": 2.4142, "step": 212610 }, { "epoch": 0.37, "learning_rate": 3.1460813275808555e-05, "loss": 2.27, "step": 212620 }, { "epoch": 0.37, "learning_rate": 3.1459941335881726e-05, "loss": 2.3274, "step": 212630 }, { "epoch": 0.37, "learning_rate": 3.1459069395954896e-05, "loss": 2.4544, "step": 212640 }, { "epoch": 0.37, "learning_rate": 3.145819745602807e-05, "loss": 2.4255, "step": 212650 }, { "epoch": 0.37, "learning_rate": 3.1457325516101243e-05, "loss": 2.5695, "step": 212660 }, { "epoch": 0.37, "learning_rate": 3.1456453576174414e-05, "loss": 2.4812, "step": 212670 }, { "epoch": 0.37, "learning_rate": 3.145558163624759e-05, "loss": 2.3774, "step": 212680 }, { "epoch": 0.37, "learning_rate": 3.145470969632076e-05, "loss": 2.3345, "step": 212690 }, { "epoch": 0.37, "learning_rate": 3.145383775639394e-05, "loss": 2.4578, "step": 212700 }, { "epoch": 0.37, "learning_rate": 3.145296581646711e-05, "loss": 2.3458, "step": 212710 }, { "epoch": 0.37, "learning_rate": 3.1452093876540286e-05, "loss": 2.3343, "step": 212720 }, { "epoch": 0.37, "learning_rate": 3.1451221936613456e-05, "loss": 2.4175, "step": 212730 }, { "epoch": 0.37, "learning_rate": 3.145034999668663e-05, "loss": 2.3696, "step": 212740 }, { "epoch": 0.37, "learning_rate": 3.1449478056759804e-05, "loss": 2.3931, "step": 212750 }, { "epoch": 0.37, "learning_rate": 3.1448606116832974e-05, "loss": 2.4196, "step": 212760 }, { "epoch": 0.37, "learning_rate": 3.144773417690615e-05, "loss": 2.4131, "step": 212770 }, { "epoch": 0.37, "learning_rate": 3.144686223697932e-05, "loss": 2.4026, "step": 212780 }, { "epoch": 0.37, "learning_rate": 3.14459902970525e-05, "loss": 2.4308, "step": 212790 }, { "epoch": 0.37, "learning_rate": 3.144511835712567e-05, "loss": 2.302, "step": 212800 }, { "epoch": 0.37, "learning_rate": 3.144424641719884e-05, "loss": 2.4553, "step": 212810 }, { "epoch": 0.37, "learning_rate": 3.144337447727202e-05, "loss": 2.3261, "step": 212820 }, { "epoch": 0.37, "learning_rate": 3.144250253734519e-05, "loss": 2.33, "step": 212830 }, { "epoch": 0.37, "learning_rate": 3.1441630597418365e-05, "loss": 2.5527, "step": 212840 }, { "epoch": 0.37, "learning_rate": 3.1440758657491535e-05, "loss": 2.4329, "step": 212850 }, { "epoch": 0.37, "learning_rate": 3.143988671756471e-05, "loss": 2.3848, "step": 212860 }, { "epoch": 0.37, "learning_rate": 3.143901477763788e-05, "loss": 2.4381, "step": 212870 }, { "epoch": 0.37, "learning_rate": 3.143814283771105e-05, "loss": 2.3694, "step": 212880 }, { "epoch": 0.37, "learning_rate": 3.143727089778423e-05, "loss": 2.4212, "step": 212890 }, { "epoch": 0.37, "learning_rate": 3.14363989578574e-05, "loss": 2.3569, "step": 212900 }, { "epoch": 0.37, "learning_rate": 3.143552701793057e-05, "loss": 2.4401, "step": 212910 }, { "epoch": 0.37, "learning_rate": 3.143465507800375e-05, "loss": 2.3959, "step": 212920 }, { "epoch": 0.37, "learning_rate": 3.1433783138076925e-05, "loss": 2.4186, "step": 212930 }, { "epoch": 0.37, "learning_rate": 3.1432911198150095e-05, "loss": 2.3407, "step": 212940 }, { "epoch": 0.37, "learning_rate": 3.1432039258223266e-05, "loss": 2.3765, "step": 212950 }, { "epoch": 0.37, "learning_rate": 3.1431167318296436e-05, "loss": 2.3623, "step": 212960 }, { "epoch": 0.37, "learning_rate": 3.143029537836961e-05, "loss": 2.4542, "step": 212970 }, { "epoch": 0.37, "learning_rate": 3.1429423438442784e-05, "loss": 2.3206, "step": 212980 }, { "epoch": 0.37, "learning_rate": 3.142855149851596e-05, "loss": 2.3542, "step": 212990 }, { "epoch": 0.37, "learning_rate": 3.142767955858914e-05, "loss": 2.3635, "step": 213000 }, { "epoch": 0.37, "learning_rate": 3.142680761866231e-05, "loss": 2.3971, "step": 213010 }, { "epoch": 0.37, "learning_rate": 3.142593567873548e-05, "loss": 2.3809, "step": 213020 }, { "epoch": 0.37, "learning_rate": 3.142506373880865e-05, "loss": 2.4077, "step": 213030 }, { "epoch": 0.37, "learning_rate": 3.1424191798881826e-05, "loss": 2.5393, "step": 213040 }, { "epoch": 0.37, "learning_rate": 3.1423319858955e-05, "loss": 2.4087, "step": 213050 }, { "epoch": 0.37, "learning_rate": 3.142244791902817e-05, "loss": 2.3138, "step": 213060 }, { "epoch": 0.37, "learning_rate": 3.1421575979101344e-05, "loss": 2.4273, "step": 213070 }, { "epoch": 0.37, "learning_rate": 3.142070403917452e-05, "loss": 2.4709, "step": 213080 }, { "epoch": 0.37, "learning_rate": 3.141983209924769e-05, "loss": 2.4504, "step": 213090 }, { "epoch": 0.37, "learning_rate": 3.141896015932086e-05, "loss": 2.3567, "step": 213100 }, { "epoch": 0.37, "learning_rate": 3.141808821939404e-05, "loss": 2.4647, "step": 213110 }, { "epoch": 0.37, "learning_rate": 3.141721627946721e-05, "loss": 2.3743, "step": 213120 }, { "epoch": 0.37, "learning_rate": 3.141634433954038e-05, "loss": 2.2484, "step": 213130 }, { "epoch": 0.37, "learning_rate": 3.141547239961356e-05, "loss": 2.3748, "step": 213140 }, { "epoch": 0.37, "learning_rate": 3.1414600459686734e-05, "loss": 2.3609, "step": 213150 }, { "epoch": 0.37, "learning_rate": 3.1413728519759905e-05, "loss": 2.427, "step": 213160 }, { "epoch": 0.37, "learning_rate": 3.1412856579833075e-05, "loss": 2.392, "step": 213170 }, { "epoch": 0.37, "learning_rate": 3.141198463990625e-05, "loss": 2.4125, "step": 213180 }, { "epoch": 0.37, "learning_rate": 3.141111269997942e-05, "loss": 2.3819, "step": 213190 }, { "epoch": 0.37, "learning_rate": 3.141024076005259e-05, "loss": 2.3893, "step": 213200 }, { "epoch": 0.37, "learning_rate": 3.140936882012577e-05, "loss": 2.3597, "step": 213210 }, { "epoch": 0.37, "learning_rate": 3.140849688019895e-05, "loss": 2.4757, "step": 213220 }, { "epoch": 0.37, "learning_rate": 3.140762494027212e-05, "loss": 2.4017, "step": 213230 }, { "epoch": 0.37, "learning_rate": 3.140675300034529e-05, "loss": 2.28, "step": 213240 }, { "epoch": 0.37, "learning_rate": 3.1405881060418465e-05, "loss": 2.3962, "step": 213250 }, { "epoch": 0.37, "learning_rate": 3.1405009120491636e-05, "loss": 2.4795, "step": 213260 }, { "epoch": 0.37, "learning_rate": 3.1404137180564806e-05, "loss": 2.2566, "step": 213270 }, { "epoch": 0.37, "learning_rate": 3.140326524063798e-05, "loss": 2.4645, "step": 213280 }, { "epoch": 0.37, "learning_rate": 3.140239330071116e-05, "loss": 2.3896, "step": 213290 }, { "epoch": 0.37, "learning_rate": 3.140152136078433e-05, "loss": 2.4572, "step": 213300 }, { "epoch": 0.37, "learning_rate": 3.14006494208575e-05, "loss": 2.4409, "step": 213310 }, { "epoch": 0.37, "learning_rate": 3.139977748093068e-05, "loss": 2.4071, "step": 213320 }, { "epoch": 0.37, "learning_rate": 3.139890554100385e-05, "loss": 2.4938, "step": 213330 }, { "epoch": 0.37, "learning_rate": 3.139803360107702e-05, "loss": 2.4387, "step": 213340 }, { "epoch": 0.37, "learning_rate": 3.139716166115019e-05, "loss": 2.3161, "step": 213350 }, { "epoch": 0.37, "learning_rate": 3.1396289721223373e-05, "loss": 2.4333, "step": 213360 }, { "epoch": 0.37, "learning_rate": 3.1395417781296544e-05, "loss": 2.4882, "step": 213370 }, { "epoch": 0.37, "learning_rate": 3.1394545841369714e-05, "loss": 2.4633, "step": 213380 }, { "epoch": 0.37, "learning_rate": 3.139367390144289e-05, "loss": 2.3256, "step": 213390 }, { "epoch": 0.37, "learning_rate": 3.139280196151606e-05, "loss": 2.446, "step": 213400 }, { "epoch": 0.37, "learning_rate": 3.139193002158923e-05, "loss": 2.3834, "step": 213410 }, { "epoch": 0.37, "learning_rate": 3.13910580816624e-05, "loss": 2.3445, "step": 213420 }, { "epoch": 0.37, "learning_rate": 3.139018614173558e-05, "loss": 2.4379, "step": 213430 }, { "epoch": 0.37, "learning_rate": 3.138931420180876e-05, "loss": 2.4476, "step": 213440 }, { "epoch": 0.37, "learning_rate": 3.138844226188193e-05, "loss": 2.4777, "step": 213450 }, { "epoch": 0.37, "learning_rate": 3.13875703219551e-05, "loss": 2.44, "step": 213460 }, { "epoch": 0.37, "learning_rate": 3.1386698382028275e-05, "loss": 2.3754, "step": 213470 }, { "epoch": 0.37, "learning_rate": 3.1385826442101445e-05, "loss": 2.3381, "step": 213480 }, { "epoch": 0.37, "learning_rate": 3.1384954502174616e-05, "loss": 2.4609, "step": 213490 }, { "epoch": 0.37, "learning_rate": 3.138408256224779e-05, "loss": 2.4353, "step": 213500 }, { "epoch": 0.37, "learning_rate": 3.138321062232097e-05, "loss": 2.5419, "step": 213510 }, { "epoch": 0.37, "learning_rate": 3.138233868239414e-05, "loss": 2.3311, "step": 213520 }, { "epoch": 0.37, "learning_rate": 3.138146674246731e-05, "loss": 2.3732, "step": 213530 }, { "epoch": 0.37, "learning_rate": 3.138059480254049e-05, "loss": 2.5169, "step": 213540 }, { "epoch": 0.37, "learning_rate": 3.137972286261366e-05, "loss": 2.437, "step": 213550 }, { "epoch": 0.37, "learning_rate": 3.137885092268683e-05, "loss": 2.5028, "step": 213560 }, { "epoch": 0.37, "learning_rate": 3.1377978982760006e-05, "loss": 2.327, "step": 213570 }, { "epoch": 0.37, "learning_rate": 3.1377107042833176e-05, "loss": 2.3398, "step": 213580 }, { "epoch": 0.37, "learning_rate": 3.137623510290635e-05, "loss": 2.3347, "step": 213590 }, { "epoch": 0.37, "learning_rate": 3.1375363162979524e-05, "loss": 2.3499, "step": 213600 }, { "epoch": 0.37, "learning_rate": 3.13744912230527e-05, "loss": 2.5159, "step": 213610 }, { "epoch": 0.37, "learning_rate": 3.137361928312587e-05, "loss": 2.4316, "step": 213620 }, { "epoch": 0.37, "learning_rate": 3.137274734319904e-05, "loss": 2.4361, "step": 213630 }, { "epoch": 0.37, "learning_rate": 3.137187540327222e-05, "loss": 2.4269, "step": 213640 }, { "epoch": 0.37, "learning_rate": 3.137100346334539e-05, "loss": 2.4281, "step": 213650 }, { "epoch": 0.37, "learning_rate": 3.1370131523418566e-05, "loss": 2.3702, "step": 213660 }, { "epoch": 0.37, "learning_rate": 3.136925958349174e-05, "loss": 2.4515, "step": 213670 }, { "epoch": 0.37, "learning_rate": 3.1368387643564914e-05, "loss": 2.4485, "step": 213680 }, { "epoch": 0.37, "learning_rate": 3.1367515703638084e-05, "loss": 2.5595, "step": 213690 }, { "epoch": 0.37, "learning_rate": 3.1366643763711255e-05, "loss": 2.3175, "step": 213700 }, { "epoch": 0.37, "learning_rate": 3.136577182378443e-05, "loss": 2.3911, "step": 213710 }, { "epoch": 0.37, "learning_rate": 3.13648998838576e-05, "loss": 2.3999, "step": 213720 }, { "epoch": 0.37, "learning_rate": 3.136402794393077e-05, "loss": 2.5085, "step": 213730 }, { "epoch": 0.37, "learning_rate": 3.136315600400395e-05, "loss": 2.3191, "step": 213740 }, { "epoch": 0.37, "learning_rate": 3.136228406407713e-05, "loss": 2.3294, "step": 213750 }, { "epoch": 0.37, "learning_rate": 3.13614121241503e-05, "loss": 2.5127, "step": 213760 }, { "epoch": 0.37, "learning_rate": 3.136054018422347e-05, "loss": 2.5273, "step": 213770 }, { "epoch": 0.37, "learning_rate": 3.1359668244296645e-05, "loss": 2.5399, "step": 213780 }, { "epoch": 0.37, "learning_rate": 3.1358796304369815e-05, "loss": 2.4126, "step": 213790 }, { "epoch": 0.37, "learning_rate": 3.1357924364442985e-05, "loss": 2.3255, "step": 213800 }, { "epoch": 0.37, "learning_rate": 3.135705242451616e-05, "loss": 2.5157, "step": 213810 }, { "epoch": 0.37, "learning_rate": 3.135618048458934e-05, "loss": 2.3808, "step": 213820 }, { "epoch": 0.37, "learning_rate": 3.135530854466251e-05, "loss": 2.4184, "step": 213830 }, { "epoch": 0.37, "learning_rate": 3.135443660473568e-05, "loss": 2.403, "step": 213840 }, { "epoch": 0.37, "learning_rate": 3.135356466480886e-05, "loss": 2.4243, "step": 213850 }, { "epoch": 0.37, "learning_rate": 3.135269272488203e-05, "loss": 2.3642, "step": 213860 }, { "epoch": 0.37, "learning_rate": 3.13518207849552e-05, "loss": 2.2911, "step": 213870 }, { "epoch": 0.37, "learning_rate": 3.135094884502837e-05, "loss": 2.333, "step": 213880 }, { "epoch": 0.37, "learning_rate": 3.135007690510155e-05, "loss": 2.502, "step": 213890 }, { "epoch": 0.37, "learning_rate": 3.134920496517472e-05, "loss": 2.5684, "step": 213900 }, { "epoch": 0.37, "learning_rate": 3.1348333025247894e-05, "loss": 2.5132, "step": 213910 }, { "epoch": 0.37, "learning_rate": 3.1347461085321064e-05, "loss": 2.4373, "step": 213920 }, { "epoch": 0.37, "learning_rate": 3.134658914539424e-05, "loss": 2.4267, "step": 213930 }, { "epoch": 0.37, "learning_rate": 3.134571720546741e-05, "loss": 2.3269, "step": 213940 }, { "epoch": 0.37, "learning_rate": 3.134484526554058e-05, "loss": 2.3149, "step": 213950 }, { "epoch": 0.37, "learning_rate": 3.1343973325613766e-05, "loss": 2.3856, "step": 213960 }, { "epoch": 0.37, "learning_rate": 3.1343101385686936e-05, "loss": 2.3729, "step": 213970 }, { "epoch": 0.37, "learning_rate": 3.1342229445760107e-05, "loss": 2.4083, "step": 213980 }, { "epoch": 0.37, "learning_rate": 3.134135750583328e-05, "loss": 2.3155, "step": 213990 }, { "epoch": 0.37, "learning_rate": 3.1340485565906454e-05, "loss": 2.3079, "step": 214000 }, { "epoch": 0.37, "learning_rate": 3.1339613625979624e-05, "loss": 2.4054, "step": 214010 }, { "epoch": 0.37, "learning_rate": 3.1338741686052795e-05, "loss": 2.493, "step": 214020 }, { "epoch": 0.37, "learning_rate": 3.133786974612597e-05, "loss": 2.5583, "step": 214030 }, { "epoch": 0.37, "learning_rate": 3.133699780619915e-05, "loss": 2.4178, "step": 214040 }, { "epoch": 0.37, "learning_rate": 3.133612586627232e-05, "loss": 2.3391, "step": 214050 }, { "epoch": 0.37, "learning_rate": 3.133525392634549e-05, "loss": 2.3832, "step": 214060 }, { "epoch": 0.37, "learning_rate": 3.133438198641867e-05, "loss": 2.53, "step": 214070 }, { "epoch": 0.37, "learning_rate": 3.133351004649184e-05, "loss": 2.413, "step": 214080 }, { "epoch": 0.37, "learning_rate": 3.133263810656501e-05, "loss": 2.3981, "step": 214090 }, { "epoch": 0.37, "learning_rate": 3.1331766166638185e-05, "loss": 2.3788, "step": 214100 }, { "epoch": 0.37, "learning_rate": 3.133089422671136e-05, "loss": 2.332, "step": 214110 }, { "epoch": 0.37, "learning_rate": 3.133002228678453e-05, "loss": 2.3837, "step": 214120 }, { "epoch": 0.37, "learning_rate": 3.13291503468577e-05, "loss": 2.4725, "step": 214130 }, { "epoch": 0.37, "learning_rate": 3.132827840693088e-05, "loss": 2.431, "step": 214140 }, { "epoch": 0.37, "learning_rate": 3.132740646700405e-05, "loss": 2.4872, "step": 214150 }, { "epoch": 0.37, "learning_rate": 3.132653452707722e-05, "loss": 2.4132, "step": 214160 }, { "epoch": 0.37, "learning_rate": 3.13256625871504e-05, "loss": 2.2885, "step": 214170 }, { "epoch": 0.37, "learning_rate": 3.1324790647223575e-05, "loss": 2.4386, "step": 214180 }, { "epoch": 0.37, "learning_rate": 3.1323918707296746e-05, "loss": 2.4563, "step": 214190 }, { "epoch": 0.37, "learning_rate": 3.1323046767369916e-05, "loss": 2.4155, "step": 214200 }, { "epoch": 0.37, "learning_rate": 3.132217482744309e-05, "loss": 2.3435, "step": 214210 }, { "epoch": 0.37, "learning_rate": 3.1321302887516263e-05, "loss": 2.4012, "step": 214220 }, { "epoch": 0.37, "learning_rate": 3.1320430947589434e-05, "loss": 2.5851, "step": 214230 }, { "epoch": 0.37, "learning_rate": 3.131955900766261e-05, "loss": 2.4625, "step": 214240 }, { "epoch": 0.37, "learning_rate": 3.131868706773578e-05, "loss": 2.4214, "step": 214250 }, { "epoch": 0.37, "learning_rate": 3.131781512780896e-05, "loss": 2.407, "step": 214260 }, { "epoch": 0.37, "learning_rate": 3.131694318788213e-05, "loss": 2.3884, "step": 214270 }, { "epoch": 0.37, "learning_rate": 3.1316071247955306e-05, "loss": 2.3834, "step": 214280 }, { "epoch": 0.37, "learning_rate": 3.1315199308028476e-05, "loss": 2.4081, "step": 214290 }, { "epoch": 0.37, "learning_rate": 3.131432736810165e-05, "loss": 2.4592, "step": 214300 }, { "epoch": 0.37, "learning_rate": 3.131345542817482e-05, "loss": 2.3026, "step": 214310 }, { "epoch": 0.37, "learning_rate": 3.1312583488247994e-05, "loss": 2.4638, "step": 214320 }, { "epoch": 0.37, "learning_rate": 3.131171154832117e-05, "loss": 2.3872, "step": 214330 }, { "epoch": 0.37, "learning_rate": 3.131083960839434e-05, "loss": 2.3322, "step": 214340 }, { "epoch": 0.37, "learning_rate": 3.130996766846752e-05, "loss": 2.2955, "step": 214350 }, { "epoch": 0.37, "learning_rate": 3.130909572854069e-05, "loss": 2.3531, "step": 214360 }, { "epoch": 0.37, "learning_rate": 3.130822378861386e-05, "loss": 2.3942, "step": 214370 }, { "epoch": 0.37, "learning_rate": 3.130735184868703e-05, "loss": 2.4654, "step": 214380 }, { "epoch": 0.37, "learning_rate": 3.130647990876021e-05, "loss": 2.276, "step": 214390 }, { "epoch": 0.37, "learning_rate": 3.130560796883338e-05, "loss": 2.3064, "step": 214400 }, { "epoch": 0.37, "learning_rate": 3.1304736028906555e-05, "loss": 2.4528, "step": 214410 }, { "epoch": 0.37, "learning_rate": 3.1303864088979725e-05, "loss": 2.4159, "step": 214420 }, { "epoch": 0.37, "learning_rate": 3.13029921490529e-05, "loss": 2.4886, "step": 214430 }, { "epoch": 0.37, "learning_rate": 3.130212020912607e-05, "loss": 2.4027, "step": 214440 }, { "epoch": 0.37, "learning_rate": 3.130124826919924e-05, "loss": 2.429, "step": 214450 }, { "epoch": 0.37, "learning_rate": 3.130037632927242e-05, "loss": 2.4051, "step": 214460 }, { "epoch": 0.37, "learning_rate": 3.129950438934559e-05, "loss": 2.2903, "step": 214470 }, { "epoch": 0.37, "learning_rate": 3.129863244941877e-05, "loss": 2.4429, "step": 214480 }, { "epoch": 0.37, "learning_rate": 3.129776050949194e-05, "loss": 2.5451, "step": 214490 }, { "epoch": 0.37, "learning_rate": 3.1296888569565115e-05, "loss": 2.4018, "step": 214500 }, { "epoch": 0.37, "learning_rate": 3.1296016629638286e-05, "loss": 2.3892, "step": 214510 }, { "epoch": 0.37, "learning_rate": 3.1295144689711456e-05, "loss": 2.45, "step": 214520 }, { "epoch": 0.37, "learning_rate": 3.1294272749784633e-05, "loss": 2.3945, "step": 214530 }, { "epoch": 0.37, "learning_rate": 3.1293400809857804e-05, "loss": 2.3462, "step": 214540 }, { "epoch": 0.37, "learning_rate": 3.1292528869930974e-05, "loss": 2.483, "step": 214550 }, { "epoch": 0.37, "learning_rate": 3.129165693000415e-05, "loss": 2.291, "step": 214560 }, { "epoch": 0.37, "learning_rate": 3.129078499007733e-05, "loss": 2.3414, "step": 214570 }, { "epoch": 0.37, "learning_rate": 3.12899130501505e-05, "loss": 2.313, "step": 214580 }, { "epoch": 0.37, "learning_rate": 3.128904111022367e-05, "loss": 2.3287, "step": 214590 }, { "epoch": 0.37, "learning_rate": 3.1288169170296846e-05, "loss": 2.518, "step": 214600 }, { "epoch": 0.37, "learning_rate": 3.128729723037002e-05, "loss": 2.5323, "step": 214610 }, { "epoch": 0.37, "learning_rate": 3.128642529044319e-05, "loss": 2.3581, "step": 214620 }, { "epoch": 0.37, "learning_rate": 3.1285553350516364e-05, "loss": 2.3179, "step": 214630 }, { "epoch": 0.37, "learning_rate": 3.128468141058954e-05, "loss": 2.4189, "step": 214640 }, { "epoch": 0.37, "learning_rate": 3.128380947066271e-05, "loss": 2.3542, "step": 214650 }, { "epoch": 0.37, "learning_rate": 3.128293753073588e-05, "loss": 2.5305, "step": 214660 }, { "epoch": 0.37, "learning_rate": 3.128206559080906e-05, "loss": 2.4392, "step": 214670 }, { "epoch": 0.37, "learning_rate": 3.128119365088223e-05, "loss": 2.3743, "step": 214680 }, { "epoch": 0.37, "learning_rate": 3.12803217109554e-05, "loss": 2.4344, "step": 214690 }, { "epoch": 0.37, "learning_rate": 3.127944977102858e-05, "loss": 2.4871, "step": 214700 }, { "epoch": 0.37, "learning_rate": 3.1278577831101754e-05, "loss": 2.4962, "step": 214710 }, { "epoch": 0.37, "learning_rate": 3.1277705891174925e-05, "loss": 2.354, "step": 214720 }, { "epoch": 0.37, "learning_rate": 3.1276833951248095e-05, "loss": 2.3799, "step": 214730 }, { "epoch": 0.37, "learning_rate": 3.127596201132127e-05, "loss": 2.4295, "step": 214740 }, { "epoch": 0.37, "learning_rate": 3.127509007139444e-05, "loss": 2.343, "step": 214750 }, { "epoch": 0.37, "learning_rate": 3.127421813146761e-05, "loss": 2.4167, "step": 214760 }, { "epoch": 0.37, "learning_rate": 3.1273346191540784e-05, "loss": 2.4698, "step": 214770 }, { "epoch": 0.37, "learning_rate": 3.127247425161397e-05, "loss": 2.3635, "step": 214780 }, { "epoch": 0.37, "learning_rate": 3.127160231168714e-05, "loss": 2.3302, "step": 214790 }, { "epoch": 0.37, "learning_rate": 3.127073037176031e-05, "loss": 2.5925, "step": 214800 }, { "epoch": 0.37, "learning_rate": 3.126985843183348e-05, "loss": 2.4329, "step": 214810 }, { "epoch": 0.37, "learning_rate": 3.1268986491906656e-05, "loss": 2.4233, "step": 214820 }, { "epoch": 0.37, "learning_rate": 3.1268114551979826e-05, "loss": 2.4971, "step": 214830 }, { "epoch": 0.37, "learning_rate": 3.1267242612052997e-05, "loss": 2.5679, "step": 214840 }, { "epoch": 0.37, "learning_rate": 3.126637067212618e-05, "loss": 2.3375, "step": 214850 }, { "epoch": 0.37, "learning_rate": 3.126549873219935e-05, "loss": 2.4669, "step": 214860 }, { "epoch": 0.37, "learning_rate": 3.126462679227252e-05, "loss": 2.3784, "step": 214870 }, { "epoch": 0.37, "learning_rate": 3.126375485234569e-05, "loss": 2.358, "step": 214880 }, { "epoch": 0.37, "learning_rate": 3.126288291241887e-05, "loss": 2.4008, "step": 214890 }, { "epoch": 0.37, "learning_rate": 3.126201097249204e-05, "loss": 2.3271, "step": 214900 }, { "epoch": 0.37, "learning_rate": 3.126113903256521e-05, "loss": 2.4632, "step": 214910 }, { "epoch": 0.37, "learning_rate": 3.126026709263839e-05, "loss": 2.3424, "step": 214920 }, { "epoch": 0.37, "learning_rate": 3.1259395152711564e-05, "loss": 2.3587, "step": 214930 }, { "epoch": 0.37, "learning_rate": 3.1258523212784734e-05, "loss": 2.4364, "step": 214940 }, { "epoch": 0.37, "learning_rate": 3.1257651272857905e-05, "loss": 2.5711, "step": 214950 }, { "epoch": 0.37, "learning_rate": 3.125677933293108e-05, "loss": 2.3449, "step": 214960 }, { "epoch": 0.37, "learning_rate": 3.125590739300425e-05, "loss": 2.3755, "step": 214970 }, { "epoch": 0.37, "learning_rate": 3.125503545307742e-05, "loss": 2.3156, "step": 214980 }, { "epoch": 0.37, "learning_rate": 3.12541635131506e-05, "loss": 2.3618, "step": 214990 }, { "epoch": 0.37, "learning_rate": 3.125329157322378e-05, "loss": 2.4386, "step": 215000 }, { "epoch": 0.37, "learning_rate": 3.125241963329695e-05, "loss": 2.4719, "step": 215010 }, { "epoch": 0.37, "learning_rate": 3.125154769337012e-05, "loss": 2.3835, "step": 215020 }, { "epoch": 0.37, "learning_rate": 3.1250675753443295e-05, "loss": 2.3427, "step": 215030 }, { "epoch": 0.38, "learning_rate": 3.1249803813516465e-05, "loss": 2.3775, "step": 215040 }, { "epoch": 0.38, "learning_rate": 3.1248931873589636e-05, "loss": 2.316, "step": 215050 }, { "epoch": 0.38, "learning_rate": 3.124805993366281e-05, "loss": 2.4302, "step": 215060 }, { "epoch": 0.38, "learning_rate": 3.124718799373598e-05, "loss": 2.4244, "step": 215070 }, { "epoch": 0.38, "learning_rate": 3.124631605380916e-05, "loss": 2.4498, "step": 215080 }, { "epoch": 0.38, "learning_rate": 3.124544411388233e-05, "loss": 2.4043, "step": 215090 }, { "epoch": 0.38, "learning_rate": 3.124457217395551e-05, "loss": 2.4023, "step": 215100 }, { "epoch": 0.38, "learning_rate": 3.124370023402868e-05, "loss": 2.3627, "step": 215110 }, { "epoch": 0.38, "learning_rate": 3.124282829410185e-05, "loss": 2.4099, "step": 215120 }, { "epoch": 0.38, "learning_rate": 3.1241956354175026e-05, "loss": 2.5333, "step": 215130 }, { "epoch": 0.38, "learning_rate": 3.1241084414248196e-05, "loss": 2.4619, "step": 215140 }, { "epoch": 0.38, "learning_rate": 3.124021247432137e-05, "loss": 2.3779, "step": 215150 }, { "epoch": 0.38, "learning_rate": 3.1239340534394544e-05, "loss": 2.3594, "step": 215160 }, { "epoch": 0.38, "learning_rate": 3.123846859446772e-05, "loss": 2.374, "step": 215170 }, { "epoch": 0.38, "learning_rate": 3.123759665454089e-05, "loss": 2.4544, "step": 215180 }, { "epoch": 0.38, "learning_rate": 3.123672471461406e-05, "loss": 2.4983, "step": 215190 }, { "epoch": 0.38, "learning_rate": 3.123585277468724e-05, "loss": 2.4042, "step": 215200 }, { "epoch": 0.38, "learning_rate": 3.123498083476041e-05, "loss": 2.4611, "step": 215210 }, { "epoch": 0.38, "learning_rate": 3.123410889483358e-05, "loss": 2.3174, "step": 215220 }, { "epoch": 0.38, "learning_rate": 3.123323695490676e-05, "loss": 2.424, "step": 215230 }, { "epoch": 0.38, "learning_rate": 3.1232365014979934e-05, "loss": 2.3757, "step": 215240 }, { "epoch": 0.38, "learning_rate": 3.1231493075053104e-05, "loss": 2.4944, "step": 215250 }, { "epoch": 0.38, "learning_rate": 3.1230621135126275e-05, "loss": 2.3329, "step": 215260 }, { "epoch": 0.38, "learning_rate": 3.1229749195199445e-05, "loss": 2.3904, "step": 215270 }, { "epoch": 0.38, "learning_rate": 3.122887725527262e-05, "loss": 2.4236, "step": 215280 }, { "epoch": 0.38, "learning_rate": 3.122800531534579e-05, "loss": 2.4042, "step": 215290 }, { "epoch": 0.38, "learning_rate": 3.122713337541897e-05, "loss": 2.4433, "step": 215300 }, { "epoch": 0.38, "learning_rate": 3.122626143549215e-05, "loss": 2.4457, "step": 215310 }, { "epoch": 0.38, "learning_rate": 3.122538949556532e-05, "loss": 2.4846, "step": 215320 }, { "epoch": 0.38, "learning_rate": 3.122451755563849e-05, "loss": 2.3441, "step": 215330 }, { "epoch": 0.38, "learning_rate": 3.122364561571166e-05, "loss": 2.35, "step": 215340 }, { "epoch": 0.38, "learning_rate": 3.1222773675784835e-05, "loss": 2.4669, "step": 215350 }, { "epoch": 0.38, "learning_rate": 3.1221901735858005e-05, "loss": 2.3679, "step": 215360 }, { "epoch": 0.38, "learning_rate": 3.122102979593118e-05, "loss": 2.4731, "step": 215370 }, { "epoch": 0.38, "learning_rate": 3.122015785600435e-05, "loss": 2.4014, "step": 215380 }, { "epoch": 0.38, "learning_rate": 3.121928591607753e-05, "loss": 2.2666, "step": 215390 }, { "epoch": 0.38, "learning_rate": 3.12184139761507e-05, "loss": 2.4621, "step": 215400 }, { "epoch": 0.38, "learning_rate": 3.121754203622387e-05, "loss": 2.4507, "step": 215410 }, { "epoch": 0.38, "learning_rate": 3.121667009629705e-05, "loss": 2.3302, "step": 215420 }, { "epoch": 0.38, "learning_rate": 3.121579815637022e-05, "loss": 2.439, "step": 215430 }, { "epoch": 0.38, "learning_rate": 3.121492621644339e-05, "loss": 2.4014, "step": 215440 }, { "epoch": 0.38, "learning_rate": 3.1214054276516566e-05, "loss": 2.5048, "step": 215450 }, { "epoch": 0.38, "learning_rate": 3.121318233658974e-05, "loss": 2.4362, "step": 215460 }, { "epoch": 0.38, "learning_rate": 3.1212310396662914e-05, "loss": 2.3518, "step": 215470 }, { "epoch": 0.38, "learning_rate": 3.1211438456736084e-05, "loss": 2.3881, "step": 215480 }, { "epoch": 0.38, "learning_rate": 3.121056651680926e-05, "loss": 2.4311, "step": 215490 }, { "epoch": 0.38, "learning_rate": 3.120969457688243e-05, "loss": 2.291, "step": 215500 }, { "epoch": 0.38, "learning_rate": 3.12088226369556e-05, "loss": 2.4807, "step": 215510 }, { "epoch": 0.38, "learning_rate": 3.120795069702878e-05, "loss": 2.4961, "step": 215520 }, { "epoch": 0.38, "learning_rate": 3.1207078757101956e-05, "loss": 2.4082, "step": 215530 }, { "epoch": 0.38, "learning_rate": 3.1206206817175127e-05, "loss": 2.4398, "step": 215540 }, { "epoch": 0.38, "learning_rate": 3.12053348772483e-05, "loss": 2.47, "step": 215550 }, { "epoch": 0.38, "learning_rate": 3.1204462937321474e-05, "loss": 2.4343, "step": 215560 }, { "epoch": 0.38, "learning_rate": 3.1203590997394644e-05, "loss": 2.349, "step": 215570 }, { "epoch": 0.38, "learning_rate": 3.1202719057467815e-05, "loss": 2.4006, "step": 215580 }, { "epoch": 0.38, "learning_rate": 3.120184711754099e-05, "loss": 2.4976, "step": 215590 }, { "epoch": 0.38, "learning_rate": 3.120097517761417e-05, "loss": 2.4, "step": 215600 }, { "epoch": 0.38, "learning_rate": 3.120010323768734e-05, "loss": 2.4108, "step": 215610 }, { "epoch": 0.38, "learning_rate": 3.119923129776051e-05, "loss": 2.4274, "step": 215620 }, { "epoch": 0.38, "learning_rate": 3.119835935783369e-05, "loss": 2.3461, "step": 215630 }, { "epoch": 0.38, "learning_rate": 3.119748741790686e-05, "loss": 2.3509, "step": 215640 }, { "epoch": 0.38, "learning_rate": 3.119661547798003e-05, "loss": 2.4348, "step": 215650 }, { "epoch": 0.38, "learning_rate": 3.11957435380532e-05, "loss": 2.4481, "step": 215660 }, { "epoch": 0.38, "learning_rate": 3.119487159812638e-05, "loss": 2.3454, "step": 215670 }, { "epoch": 0.38, "learning_rate": 3.119399965819955e-05, "loss": 2.3864, "step": 215680 }, { "epoch": 0.38, "learning_rate": 3.119312771827272e-05, "loss": 2.4999, "step": 215690 }, { "epoch": 0.38, "learning_rate": 3.11922557783459e-05, "loss": 2.3677, "step": 215700 }, { "epoch": 0.38, "learning_rate": 3.119138383841907e-05, "loss": 2.3196, "step": 215710 }, { "epoch": 0.38, "learning_rate": 3.119051189849224e-05, "loss": 2.4891, "step": 215720 }, { "epoch": 0.38, "learning_rate": 3.118963995856541e-05, "loss": 2.3378, "step": 215730 }, { "epoch": 0.38, "learning_rate": 3.118876801863859e-05, "loss": 2.5048, "step": 215740 }, { "epoch": 0.38, "learning_rate": 3.1187896078711766e-05, "loss": 2.4292, "step": 215750 }, { "epoch": 0.38, "learning_rate": 3.1187024138784936e-05, "loss": 2.5197, "step": 215760 }, { "epoch": 0.38, "learning_rate": 3.1186152198858106e-05, "loss": 2.4289, "step": 215770 }, { "epoch": 0.38, "learning_rate": 3.1185280258931283e-05, "loss": 2.5006, "step": 215780 }, { "epoch": 0.38, "learning_rate": 3.1184408319004454e-05, "loss": 2.4706, "step": 215790 }, { "epoch": 0.38, "learning_rate": 3.1183536379077624e-05, "loss": 2.5069, "step": 215800 }, { "epoch": 0.38, "learning_rate": 3.11826644391508e-05, "loss": 2.5063, "step": 215810 }, { "epoch": 0.38, "learning_rate": 3.118179249922398e-05, "loss": 2.3477, "step": 215820 }, { "epoch": 0.38, "learning_rate": 3.118092055929715e-05, "loss": 2.3363, "step": 215830 }, { "epoch": 0.38, "learning_rate": 3.118004861937032e-05, "loss": 2.3411, "step": 215840 }, { "epoch": 0.38, "learning_rate": 3.1179176679443496e-05, "loss": 2.3353, "step": 215850 }, { "epoch": 0.38, "learning_rate": 3.117830473951667e-05, "loss": 2.3617, "step": 215860 }, { "epoch": 0.38, "learning_rate": 3.117743279958984e-05, "loss": 2.4911, "step": 215870 }, { "epoch": 0.38, "learning_rate": 3.1176560859663014e-05, "loss": 2.3644, "step": 215880 }, { "epoch": 0.38, "learning_rate": 3.117568891973619e-05, "loss": 2.3499, "step": 215890 }, { "epoch": 0.38, "learning_rate": 3.117481697980936e-05, "loss": 2.5339, "step": 215900 }, { "epoch": 0.38, "learning_rate": 3.117394503988253e-05, "loss": 2.4872, "step": 215910 }, { "epoch": 0.38, "learning_rate": 3.117307309995571e-05, "loss": 2.4229, "step": 215920 }, { "epoch": 0.38, "learning_rate": 3.117220116002888e-05, "loss": 2.4732, "step": 215930 }, { "epoch": 0.38, "learning_rate": 3.117132922010205e-05, "loss": 2.4304, "step": 215940 }, { "epoch": 0.38, "learning_rate": 3.117045728017523e-05, "loss": 2.4873, "step": 215950 }, { "epoch": 0.38, "learning_rate": 3.11695853402484e-05, "loss": 2.4018, "step": 215960 }, { "epoch": 0.38, "learning_rate": 3.1168713400321575e-05, "loss": 2.3694, "step": 215970 }, { "epoch": 0.38, "learning_rate": 3.1167841460394745e-05, "loss": 2.5476, "step": 215980 }, { "epoch": 0.38, "learning_rate": 3.116696952046792e-05, "loss": 2.3618, "step": 215990 }, { "epoch": 0.38, "learning_rate": 3.116609758054109e-05, "loss": 2.2318, "step": 216000 }, { "epoch": 0.38, "learning_rate": 3.116522564061426e-05, "loss": 2.3668, "step": 216010 }, { "epoch": 0.38, "learning_rate": 3.116435370068744e-05, "loss": 2.388, "step": 216020 }, { "epoch": 0.38, "learning_rate": 3.116348176076061e-05, "loss": 2.4514, "step": 216030 }, { "epoch": 0.38, "learning_rate": 3.116260982083379e-05, "loss": 2.4116, "step": 216040 }, { "epoch": 0.38, "learning_rate": 3.116173788090696e-05, "loss": 2.4661, "step": 216050 }, { "epoch": 0.38, "learning_rate": 3.1160865940980135e-05, "loss": 2.5069, "step": 216060 }, { "epoch": 0.38, "learning_rate": 3.1159994001053306e-05, "loss": 2.4099, "step": 216070 }, { "epoch": 0.38, "learning_rate": 3.1159122061126476e-05, "loss": 2.4728, "step": 216080 }, { "epoch": 0.38, "learning_rate": 3.1158250121199653e-05, "loss": 2.3536, "step": 216090 }, { "epoch": 0.38, "learning_rate": 3.1157378181272824e-05, "loss": 2.3889, "step": 216100 }, { "epoch": 0.38, "learning_rate": 3.1156506241345994e-05, "loss": 2.4425, "step": 216110 }, { "epoch": 0.38, "learning_rate": 3.115563430141917e-05, "loss": 2.4376, "step": 216120 }, { "epoch": 0.38, "learning_rate": 3.115476236149235e-05, "loss": 2.4018, "step": 216130 }, { "epoch": 0.38, "learning_rate": 3.115389042156552e-05, "loss": 2.4918, "step": 216140 }, { "epoch": 0.38, "learning_rate": 3.115301848163869e-05, "loss": 2.394, "step": 216150 }, { "epoch": 0.38, "learning_rate": 3.115214654171186e-05, "loss": 2.3295, "step": 216160 }, { "epoch": 0.38, "learning_rate": 3.115127460178504e-05, "loss": 2.3768, "step": 216170 }, { "epoch": 0.38, "learning_rate": 3.115040266185821e-05, "loss": 2.3463, "step": 216180 }, { "epoch": 0.38, "learning_rate": 3.1149530721931384e-05, "loss": 2.3317, "step": 216190 }, { "epoch": 0.38, "learning_rate": 3.114865878200456e-05, "loss": 2.434, "step": 216200 }, { "epoch": 0.38, "learning_rate": 3.114778684207773e-05, "loss": 2.3071, "step": 216210 }, { "epoch": 0.38, "learning_rate": 3.11469149021509e-05, "loss": 2.4335, "step": 216220 }, { "epoch": 0.38, "learning_rate": 3.114604296222407e-05, "loss": 2.3321, "step": 216230 }, { "epoch": 0.38, "learning_rate": 3.114517102229725e-05, "loss": 2.5368, "step": 216240 }, { "epoch": 0.38, "learning_rate": 3.114429908237042e-05, "loss": 2.4526, "step": 216250 }, { "epoch": 0.38, "learning_rate": 3.114342714244359e-05, "loss": 2.3993, "step": 216260 }, { "epoch": 0.38, "learning_rate": 3.114255520251677e-05, "loss": 2.3927, "step": 216270 }, { "epoch": 0.38, "learning_rate": 3.1141683262589945e-05, "loss": 2.384, "step": 216280 }, { "epoch": 0.38, "learning_rate": 3.1140811322663115e-05, "loss": 2.4451, "step": 216290 }, { "epoch": 0.38, "learning_rate": 3.1139939382736286e-05, "loss": 2.4862, "step": 216300 }, { "epoch": 0.38, "learning_rate": 3.113906744280946e-05, "loss": 2.4058, "step": 216310 }, { "epoch": 0.38, "learning_rate": 3.113819550288263e-05, "loss": 2.3641, "step": 216320 }, { "epoch": 0.38, "learning_rate": 3.1137323562955804e-05, "loss": 2.3651, "step": 216330 }, { "epoch": 0.38, "learning_rate": 3.113645162302898e-05, "loss": 2.4574, "step": 216340 }, { "epoch": 0.38, "learning_rate": 3.113557968310216e-05, "loss": 2.395, "step": 216350 }, { "epoch": 0.38, "learning_rate": 3.113470774317533e-05, "loss": 2.3537, "step": 216360 }, { "epoch": 0.38, "learning_rate": 3.11338358032485e-05, "loss": 2.3351, "step": 216370 }, { "epoch": 0.38, "learning_rate": 3.1132963863321676e-05, "loss": 2.3451, "step": 216380 }, { "epoch": 0.38, "learning_rate": 3.1132091923394846e-05, "loss": 2.3632, "step": 216390 }, { "epoch": 0.38, "learning_rate": 3.1131219983468017e-05, "loss": 2.1991, "step": 216400 }, { "epoch": 0.38, "learning_rate": 3.1130348043541194e-05, "loss": 2.4533, "step": 216410 }, { "epoch": 0.38, "learning_rate": 3.112947610361437e-05, "loss": 2.4754, "step": 216420 }, { "epoch": 0.38, "learning_rate": 3.112860416368754e-05, "loss": 2.4361, "step": 216430 }, { "epoch": 0.38, "learning_rate": 3.112773222376071e-05, "loss": 2.38, "step": 216440 }, { "epoch": 0.38, "learning_rate": 3.112686028383389e-05, "loss": 2.3772, "step": 216450 }, { "epoch": 0.38, "learning_rate": 3.112598834390706e-05, "loss": 2.4133, "step": 216460 }, { "epoch": 0.38, "learning_rate": 3.112511640398023e-05, "loss": 2.3722, "step": 216470 }, { "epoch": 0.38, "learning_rate": 3.112424446405341e-05, "loss": 2.3517, "step": 216480 }, { "epoch": 0.38, "learning_rate": 3.1123372524126584e-05, "loss": 2.5136, "step": 216490 }, { "epoch": 0.38, "learning_rate": 3.1122500584199754e-05, "loss": 2.3758, "step": 216500 }, { "epoch": 0.38, "learning_rate": 3.1121628644272925e-05, "loss": 2.4138, "step": 216510 }, { "epoch": 0.38, "learning_rate": 3.11207567043461e-05, "loss": 2.4294, "step": 216520 }, { "epoch": 0.38, "learning_rate": 3.111988476441927e-05, "loss": 2.3976, "step": 216530 }, { "epoch": 0.38, "learning_rate": 3.111901282449244e-05, "loss": 2.4371, "step": 216540 }, { "epoch": 0.38, "learning_rate": 3.111814088456562e-05, "loss": 2.3392, "step": 216550 }, { "epoch": 0.38, "learning_rate": 3.11172689446388e-05, "loss": 2.4953, "step": 216560 }, { "epoch": 0.38, "learning_rate": 3.111639700471197e-05, "loss": 2.4379, "step": 216570 }, { "epoch": 0.38, "learning_rate": 3.111552506478514e-05, "loss": 2.4635, "step": 216580 }, { "epoch": 0.38, "learning_rate": 3.1114653124858315e-05, "loss": 2.4241, "step": 216590 }, { "epoch": 0.38, "learning_rate": 3.1113781184931485e-05, "loss": 2.492, "step": 216600 }, { "epoch": 0.38, "learning_rate": 3.1112909245004656e-05, "loss": 2.5106, "step": 216610 }, { "epoch": 0.38, "learning_rate": 3.1112037305077826e-05, "loss": 2.3478, "step": 216620 }, { "epoch": 0.38, "learning_rate": 3.1111165365151e-05, "loss": 2.4034, "step": 216630 }, { "epoch": 0.38, "learning_rate": 3.111029342522418e-05, "loss": 2.5187, "step": 216640 }, { "epoch": 0.38, "learning_rate": 3.110942148529735e-05, "loss": 2.412, "step": 216650 }, { "epoch": 0.38, "learning_rate": 3.110854954537053e-05, "loss": 2.4121, "step": 216660 }, { "epoch": 0.38, "learning_rate": 3.11076776054437e-05, "loss": 2.4467, "step": 216670 }, { "epoch": 0.38, "learning_rate": 3.110680566551687e-05, "loss": 2.3941, "step": 216680 }, { "epoch": 0.38, "learning_rate": 3.110593372559004e-05, "loss": 2.331, "step": 216690 }, { "epoch": 0.38, "learning_rate": 3.1105061785663216e-05, "loss": 2.3921, "step": 216700 }, { "epoch": 0.38, "learning_rate": 3.110418984573639e-05, "loss": 2.3964, "step": 216710 }, { "epoch": 0.38, "learning_rate": 3.1103317905809564e-05, "loss": 2.4358, "step": 216720 }, { "epoch": 0.38, "learning_rate": 3.1102445965882734e-05, "loss": 2.4416, "step": 216730 }, { "epoch": 0.38, "learning_rate": 3.110157402595591e-05, "loss": 2.5258, "step": 216740 }, { "epoch": 0.38, "learning_rate": 3.110070208602908e-05, "loss": 2.428, "step": 216750 }, { "epoch": 0.38, "learning_rate": 3.109983014610225e-05, "loss": 2.3372, "step": 216760 }, { "epoch": 0.38, "learning_rate": 3.109895820617543e-05, "loss": 2.4613, "step": 216770 }, { "epoch": 0.38, "learning_rate": 3.10980862662486e-05, "loss": 2.2863, "step": 216780 }, { "epoch": 0.38, "learning_rate": 3.109721432632178e-05, "loss": 2.3782, "step": 216790 }, { "epoch": 0.38, "learning_rate": 3.109634238639495e-05, "loss": 2.4668, "step": 216800 }, { "epoch": 0.38, "learning_rate": 3.1095470446468124e-05, "loss": 2.3855, "step": 216810 }, { "epoch": 0.38, "learning_rate": 3.1094598506541295e-05, "loss": 2.3144, "step": 216820 }, { "epoch": 0.38, "learning_rate": 3.1093726566614465e-05, "loss": 2.3664, "step": 216830 }, { "epoch": 0.38, "learning_rate": 3.109285462668764e-05, "loss": 2.4716, "step": 216840 }, { "epoch": 0.38, "learning_rate": 3.109198268676081e-05, "loss": 2.3957, "step": 216850 }, { "epoch": 0.38, "learning_rate": 3.109111074683399e-05, "loss": 2.4055, "step": 216860 }, { "epoch": 0.38, "learning_rate": 3.109023880690716e-05, "loss": 2.3497, "step": 216870 }, { "epoch": 0.38, "learning_rate": 3.108936686698034e-05, "loss": 2.4047, "step": 216880 }, { "epoch": 0.38, "learning_rate": 3.108849492705351e-05, "loss": 2.3191, "step": 216890 }, { "epoch": 0.38, "learning_rate": 3.108762298712668e-05, "loss": 2.4543, "step": 216900 }, { "epoch": 0.38, "learning_rate": 3.1086751047199855e-05, "loss": 2.3936, "step": 216910 }, { "epoch": 0.38, "learning_rate": 3.1085879107273025e-05, "loss": 2.4307, "step": 216920 }, { "epoch": 0.38, "learning_rate": 3.1085007167346196e-05, "loss": 2.4574, "step": 216930 }, { "epoch": 0.38, "learning_rate": 3.108413522741937e-05, "loss": 2.4951, "step": 216940 }, { "epoch": 0.38, "learning_rate": 3.108326328749255e-05, "loss": 2.2821, "step": 216950 }, { "epoch": 0.38, "learning_rate": 3.108239134756572e-05, "loss": 2.3458, "step": 216960 }, { "epoch": 0.38, "learning_rate": 3.108151940763889e-05, "loss": 2.3554, "step": 216970 }, { "epoch": 0.38, "learning_rate": 3.108064746771207e-05, "loss": 2.4126, "step": 216980 }, { "epoch": 0.38, "learning_rate": 3.107977552778524e-05, "loss": 2.3972, "step": 216990 }, { "epoch": 0.38, "learning_rate": 3.107890358785841e-05, "loss": 2.2766, "step": 217000 }, { "epoch": 0.38, "learning_rate": 3.1078031647931586e-05, "loss": 2.3331, "step": 217010 }, { "epoch": 0.38, "learning_rate": 3.107715970800476e-05, "loss": 2.2942, "step": 217020 }, { "epoch": 0.38, "learning_rate": 3.1076287768077934e-05, "loss": 2.4591, "step": 217030 }, { "epoch": 0.38, "learning_rate": 3.1075415828151104e-05, "loss": 2.499, "step": 217040 }, { "epoch": 0.38, "learning_rate": 3.107454388822428e-05, "loss": 2.4917, "step": 217050 }, { "epoch": 0.38, "learning_rate": 3.107367194829745e-05, "loss": 2.5051, "step": 217060 }, { "epoch": 0.38, "learning_rate": 3.107280000837062e-05, "loss": 2.4013, "step": 217070 }, { "epoch": 0.38, "learning_rate": 3.107192806844379e-05, "loss": 2.3216, "step": 217080 }, { "epoch": 0.38, "learning_rate": 3.1071056128516976e-05, "loss": 2.4064, "step": 217090 }, { "epoch": 0.38, "learning_rate": 3.1070184188590147e-05, "loss": 2.3283, "step": 217100 }, { "epoch": 0.38, "learning_rate": 3.106931224866332e-05, "loss": 2.4629, "step": 217110 }, { "epoch": 0.38, "learning_rate": 3.106844030873649e-05, "loss": 2.4501, "step": 217120 }, { "epoch": 0.38, "learning_rate": 3.1067568368809664e-05, "loss": 2.4642, "step": 217130 }, { "epoch": 0.38, "learning_rate": 3.1066696428882835e-05, "loss": 2.4116, "step": 217140 }, { "epoch": 0.38, "learning_rate": 3.1065824488956005e-05, "loss": 2.4402, "step": 217150 }, { "epoch": 0.38, "learning_rate": 3.106495254902919e-05, "loss": 2.3406, "step": 217160 }, { "epoch": 0.38, "learning_rate": 3.106408060910236e-05, "loss": 2.3767, "step": 217170 }, { "epoch": 0.38, "learning_rate": 3.106320866917553e-05, "loss": 2.4677, "step": 217180 }, { "epoch": 0.38, "learning_rate": 3.10623367292487e-05, "loss": 2.3082, "step": 217190 }, { "epoch": 0.38, "learning_rate": 3.106146478932188e-05, "loss": 2.3765, "step": 217200 }, { "epoch": 0.38, "learning_rate": 3.106059284939505e-05, "loss": 2.4774, "step": 217210 }, { "epoch": 0.38, "learning_rate": 3.105972090946822e-05, "loss": 2.4483, "step": 217220 }, { "epoch": 0.38, "learning_rate": 3.1058848969541395e-05, "loss": 2.3856, "step": 217230 }, { "epoch": 0.38, "learning_rate": 3.105797702961457e-05, "loss": 2.3673, "step": 217240 }, { "epoch": 0.38, "learning_rate": 3.105710508968774e-05, "loss": 2.3923, "step": 217250 }, { "epoch": 0.38, "learning_rate": 3.105623314976091e-05, "loss": 2.5076, "step": 217260 }, { "epoch": 0.38, "learning_rate": 3.105536120983409e-05, "loss": 2.4024, "step": 217270 }, { "epoch": 0.38, "learning_rate": 3.105448926990726e-05, "loss": 2.2455, "step": 217280 }, { "epoch": 0.38, "learning_rate": 3.105361732998043e-05, "loss": 2.308, "step": 217290 }, { "epoch": 0.38, "learning_rate": 3.105274539005361e-05, "loss": 2.4372, "step": 217300 }, { "epoch": 0.38, "learning_rate": 3.1051873450126786e-05, "loss": 2.5045, "step": 217310 }, { "epoch": 0.38, "learning_rate": 3.1051001510199956e-05, "loss": 2.5027, "step": 217320 }, { "epoch": 0.38, "learning_rate": 3.1050129570273126e-05, "loss": 2.4675, "step": 217330 }, { "epoch": 0.38, "learning_rate": 3.1049257630346304e-05, "loss": 2.4286, "step": 217340 }, { "epoch": 0.38, "learning_rate": 3.1048385690419474e-05, "loss": 2.2834, "step": 217350 }, { "epoch": 0.38, "learning_rate": 3.1047513750492644e-05, "loss": 2.462, "step": 217360 }, { "epoch": 0.38, "learning_rate": 3.104664181056582e-05, "loss": 2.4126, "step": 217370 }, { "epoch": 0.38, "learning_rate": 3.1045769870639e-05, "loss": 2.4038, "step": 217380 }, { "epoch": 0.38, "learning_rate": 3.104489793071217e-05, "loss": 2.2262, "step": 217390 }, { "epoch": 0.38, "learning_rate": 3.104402599078534e-05, "loss": 2.3882, "step": 217400 }, { "epoch": 0.38, "learning_rate": 3.1043154050858517e-05, "loss": 2.4242, "step": 217410 }, { "epoch": 0.38, "learning_rate": 3.104228211093169e-05, "loss": 2.4444, "step": 217420 }, { "epoch": 0.38, "learning_rate": 3.104141017100486e-05, "loss": 2.4527, "step": 217430 }, { "epoch": 0.38, "learning_rate": 3.1040538231078034e-05, "loss": 2.415, "step": 217440 }, { "epoch": 0.38, "learning_rate": 3.1039666291151205e-05, "loss": 2.3243, "step": 217450 }, { "epoch": 0.38, "learning_rate": 3.103879435122438e-05, "loss": 2.4649, "step": 217460 }, { "epoch": 0.38, "learning_rate": 3.103792241129755e-05, "loss": 2.3634, "step": 217470 }, { "epoch": 0.38, "learning_rate": 3.103705047137073e-05, "loss": 2.4255, "step": 217480 }, { "epoch": 0.38, "learning_rate": 3.10361785314439e-05, "loss": 2.4614, "step": 217490 }, { "epoch": 0.38, "learning_rate": 3.103530659151707e-05, "loss": 2.3921, "step": 217500 }, { "epoch": 0.38, "learning_rate": 3.103443465159024e-05, "loss": 2.3534, "step": 217510 }, { "epoch": 0.38, "learning_rate": 3.103356271166342e-05, "loss": 2.3606, "step": 217520 }, { "epoch": 0.38, "learning_rate": 3.1032690771736595e-05, "loss": 2.4702, "step": 217530 }, { "epoch": 0.38, "learning_rate": 3.1031818831809765e-05, "loss": 2.425, "step": 217540 }, { "epoch": 0.38, "learning_rate": 3.103094689188294e-05, "loss": 2.343, "step": 217550 }, { "epoch": 0.38, "learning_rate": 3.103007495195611e-05, "loss": 2.3816, "step": 217560 }, { "epoch": 0.38, "learning_rate": 3.102920301202928e-05, "loss": 2.4141, "step": 217570 }, { "epoch": 0.38, "learning_rate": 3.1028331072102454e-05, "loss": 2.5183, "step": 217580 }, { "epoch": 0.38, "learning_rate": 3.102745913217563e-05, "loss": 2.4164, "step": 217590 }, { "epoch": 0.38, "learning_rate": 3.10265871922488e-05, "loss": 2.4842, "step": 217600 }, { "epoch": 0.38, "learning_rate": 3.102571525232198e-05, "loss": 2.4135, "step": 217610 }, { "epoch": 0.38, "learning_rate": 3.102484331239515e-05, "loss": 2.3785, "step": 217620 }, { "epoch": 0.38, "learning_rate": 3.1023971372468326e-05, "loss": 2.4552, "step": 217630 }, { "epoch": 0.38, "learning_rate": 3.1023099432541496e-05, "loss": 2.3639, "step": 217640 }, { "epoch": 0.38, "learning_rate": 3.102222749261467e-05, "loss": 2.3514, "step": 217650 }, { "epoch": 0.38, "learning_rate": 3.1021355552687844e-05, "loss": 2.4046, "step": 217660 }, { "epoch": 0.38, "learning_rate": 3.1020483612761014e-05, "loss": 2.3926, "step": 217670 }, { "epoch": 0.38, "learning_rate": 3.101961167283419e-05, "loss": 2.4305, "step": 217680 }, { "epoch": 0.38, "learning_rate": 3.101873973290736e-05, "loss": 2.4456, "step": 217690 }, { "epoch": 0.38, "learning_rate": 3.101786779298054e-05, "loss": 2.2949, "step": 217700 }, { "epoch": 0.38, "learning_rate": 3.101699585305371e-05, "loss": 2.4623, "step": 217710 }, { "epoch": 0.38, "learning_rate": 3.101612391312688e-05, "loss": 2.4671, "step": 217720 }, { "epoch": 0.38, "learning_rate": 3.101525197320006e-05, "loss": 2.3806, "step": 217730 }, { "epoch": 0.38, "learning_rate": 3.101438003327323e-05, "loss": 2.3919, "step": 217740 }, { "epoch": 0.38, "learning_rate": 3.1013508093346404e-05, "loss": 2.4277, "step": 217750 }, { "epoch": 0.38, "learning_rate": 3.1012636153419575e-05, "loss": 2.3928, "step": 217760 }, { "epoch": 0.38, "learning_rate": 3.101176421349275e-05, "loss": 2.418, "step": 217770 }, { "epoch": 0.38, "learning_rate": 3.101089227356592e-05, "loss": 2.4941, "step": 217780 }, { "epoch": 0.38, "learning_rate": 3.101002033363909e-05, "loss": 2.4664, "step": 217790 }, { "epoch": 0.38, "learning_rate": 3.100914839371227e-05, "loss": 2.3574, "step": 217800 }, { "epoch": 0.38, "learning_rate": 3.100827645378544e-05, "loss": 2.3739, "step": 217810 }, { "epoch": 0.38, "learning_rate": 3.100740451385861e-05, "loss": 2.485, "step": 217820 }, { "epoch": 0.38, "learning_rate": 3.100653257393179e-05, "loss": 2.4637, "step": 217830 }, { "epoch": 0.38, "learning_rate": 3.1005660634004965e-05, "loss": 2.417, "step": 217840 }, { "epoch": 0.38, "learning_rate": 3.1004788694078135e-05, "loss": 2.3139, "step": 217850 }, { "epoch": 0.38, "learning_rate": 3.1003916754151306e-05, "loss": 2.4225, "step": 217860 }, { "epoch": 0.38, "learning_rate": 3.100304481422448e-05, "loss": 2.3242, "step": 217870 }, { "epoch": 0.38, "learning_rate": 3.100217287429765e-05, "loss": 2.4239, "step": 217880 }, { "epoch": 0.38, "learning_rate": 3.1001300934370824e-05, "loss": 2.4307, "step": 217890 }, { "epoch": 0.38, "learning_rate": 3.1000428994444e-05, "loss": 2.3686, "step": 217900 }, { "epoch": 0.38, "learning_rate": 3.099955705451718e-05, "loss": 2.4157, "step": 217910 }, { "epoch": 0.38, "learning_rate": 3.099868511459035e-05, "loss": 2.4049, "step": 217920 }, { "epoch": 0.38, "learning_rate": 3.099781317466352e-05, "loss": 2.4367, "step": 217930 }, { "epoch": 0.38, "learning_rate": 3.0996941234736696e-05, "loss": 2.4497, "step": 217940 }, { "epoch": 0.38, "learning_rate": 3.0996069294809866e-05, "loss": 2.3944, "step": 217950 }, { "epoch": 0.38, "learning_rate": 3.0995197354883037e-05, "loss": 2.4804, "step": 217960 }, { "epoch": 0.38, "learning_rate": 3.099432541495621e-05, "loss": 2.4756, "step": 217970 }, { "epoch": 0.38, "learning_rate": 3.099345347502939e-05, "loss": 2.5773, "step": 217980 }, { "epoch": 0.38, "learning_rate": 3.099258153510256e-05, "loss": 2.3881, "step": 217990 }, { "epoch": 0.38, "learning_rate": 3.099170959517573e-05, "loss": 2.4306, "step": 218000 }, { "epoch": 0.38, "learning_rate": 3.099083765524891e-05, "loss": 2.4765, "step": 218010 }, { "epoch": 0.38, "learning_rate": 3.098996571532208e-05, "loss": 2.4428, "step": 218020 }, { "epoch": 0.38, "learning_rate": 3.098909377539525e-05, "loss": 2.4398, "step": 218030 }, { "epoch": 0.38, "learning_rate": 3.098822183546842e-05, "loss": 2.469, "step": 218040 }, { "epoch": 0.38, "learning_rate": 3.0987349895541604e-05, "loss": 2.4706, "step": 218050 }, { "epoch": 0.38, "learning_rate": 3.0986477955614774e-05, "loss": 2.3556, "step": 218060 }, { "epoch": 0.38, "learning_rate": 3.0985606015687945e-05, "loss": 2.3839, "step": 218070 }, { "epoch": 0.38, "learning_rate": 3.0984734075761115e-05, "loss": 2.4811, "step": 218080 }, { "epoch": 0.38, "learning_rate": 3.098386213583429e-05, "loss": 2.4567, "step": 218090 }, { "epoch": 0.38, "learning_rate": 3.098299019590746e-05, "loss": 2.3146, "step": 218100 }, { "epoch": 0.38, "learning_rate": 3.098211825598063e-05, "loss": 2.4289, "step": 218110 }, { "epoch": 0.38, "learning_rate": 3.098124631605381e-05, "loss": 2.3726, "step": 218120 }, { "epoch": 0.38, "learning_rate": 3.098037437612699e-05, "loss": 2.4561, "step": 218130 }, { "epoch": 0.38, "learning_rate": 3.097950243620016e-05, "loss": 2.3417, "step": 218140 }, { "epoch": 0.38, "learning_rate": 3.097863049627333e-05, "loss": 2.3546, "step": 218150 }, { "epoch": 0.38, "learning_rate": 3.0977758556346505e-05, "loss": 2.3691, "step": 218160 }, { "epoch": 0.38, "learning_rate": 3.0976886616419676e-05, "loss": 2.4856, "step": 218170 }, { "epoch": 0.38, "learning_rate": 3.0976014676492846e-05, "loss": 2.5545, "step": 218180 }, { "epoch": 0.38, "learning_rate": 3.097514273656602e-05, "loss": 2.4226, "step": 218190 }, { "epoch": 0.38, "learning_rate": 3.09742707966392e-05, "loss": 2.4539, "step": 218200 }, { "epoch": 0.38, "learning_rate": 3.097339885671237e-05, "loss": 2.4321, "step": 218210 }, { "epoch": 0.38, "learning_rate": 3.097252691678554e-05, "loss": 2.303, "step": 218220 }, { "epoch": 0.38, "learning_rate": 3.097165497685872e-05, "loss": 2.4495, "step": 218230 }, { "epoch": 0.38, "learning_rate": 3.097078303693189e-05, "loss": 2.518, "step": 218240 }, { "epoch": 0.38, "learning_rate": 3.096991109700506e-05, "loss": 2.45, "step": 218250 }, { "epoch": 0.38, "learning_rate": 3.0969039157078236e-05, "loss": 2.4445, "step": 218260 }, { "epoch": 0.38, "learning_rate": 3.0968167217151407e-05, "loss": 2.3831, "step": 218270 }, { "epoch": 0.38, "learning_rate": 3.0967295277224584e-05, "loss": 2.3795, "step": 218280 }, { "epoch": 0.38, "learning_rate": 3.0966423337297754e-05, "loss": 2.3446, "step": 218290 }, { "epoch": 0.38, "learning_rate": 3.096555139737093e-05, "loss": 2.3345, "step": 218300 }, { "epoch": 0.38, "learning_rate": 3.09646794574441e-05, "loss": 2.3919, "step": 218310 }, { "epoch": 0.38, "learning_rate": 3.096380751751727e-05, "loss": 2.397, "step": 218320 }, { "epoch": 0.38, "learning_rate": 3.096293557759045e-05, "loss": 2.4504, "step": 218330 }, { "epoch": 0.38, "learning_rate": 3.096206363766362e-05, "loss": 2.3957, "step": 218340 }, { "epoch": 0.38, "learning_rate": 3.09611916977368e-05, "loss": 2.4119, "step": 218350 }, { "epoch": 0.38, "learning_rate": 3.096031975780997e-05, "loss": 2.4082, "step": 218360 }, { "epoch": 0.38, "learning_rate": 3.0959447817883144e-05, "loss": 2.4047, "step": 218370 }, { "epoch": 0.38, "learning_rate": 3.0958575877956315e-05, "loss": 2.3311, "step": 218380 }, { "epoch": 0.38, "learning_rate": 3.0957703938029485e-05, "loss": 2.3955, "step": 218390 }, { "epoch": 0.38, "learning_rate": 3.095683199810266e-05, "loss": 2.3495, "step": 218400 }, { "epoch": 0.38, "learning_rate": 3.095596005817583e-05, "loss": 2.4512, "step": 218410 }, { "epoch": 0.38, "learning_rate": 3.095508811824901e-05, "loss": 2.4399, "step": 218420 }, { "epoch": 0.38, "learning_rate": 3.095421617832218e-05, "loss": 2.3573, "step": 218430 }, { "epoch": 0.38, "learning_rate": 3.095334423839536e-05, "loss": 2.3385, "step": 218440 }, { "epoch": 0.38, "learning_rate": 3.095247229846853e-05, "loss": 2.4026, "step": 218450 }, { "epoch": 0.38, "learning_rate": 3.09516003585417e-05, "loss": 2.4856, "step": 218460 }, { "epoch": 0.38, "learning_rate": 3.095072841861487e-05, "loss": 2.3993, "step": 218470 }, { "epoch": 0.38, "learning_rate": 3.0949856478688046e-05, "loss": 2.439, "step": 218480 }, { "epoch": 0.38, "learning_rate": 3.0948984538761216e-05, "loss": 2.4042, "step": 218490 }, { "epoch": 0.38, "learning_rate": 3.094811259883439e-05, "loss": 2.4398, "step": 218500 }, { "epoch": 0.38, "learning_rate": 3.094724065890757e-05, "loss": 2.4334, "step": 218510 }, { "epoch": 0.38, "learning_rate": 3.094636871898074e-05, "loss": 2.4154, "step": 218520 }, { "epoch": 0.38, "learning_rate": 3.094549677905391e-05, "loss": 2.4137, "step": 218530 }, { "epoch": 0.38, "learning_rate": 3.094462483912708e-05, "loss": 2.4037, "step": 218540 }, { "epoch": 0.38, "learning_rate": 3.094375289920026e-05, "loss": 2.3949, "step": 218550 }, { "epoch": 0.38, "learning_rate": 3.094288095927343e-05, "loss": 2.4996, "step": 218560 }, { "epoch": 0.38, "learning_rate": 3.0942009019346606e-05, "loss": 2.4877, "step": 218570 }, { "epoch": 0.38, "learning_rate": 3.0941137079419776e-05, "loss": 2.4115, "step": 218580 }, { "epoch": 0.38, "learning_rate": 3.0940265139492954e-05, "loss": 2.3796, "step": 218590 }, { "epoch": 0.38, "learning_rate": 3.0939393199566124e-05, "loss": 2.5107, "step": 218600 }, { "epoch": 0.38, "learning_rate": 3.0938521259639294e-05, "loss": 2.3803, "step": 218610 }, { "epoch": 0.38, "learning_rate": 3.093764931971247e-05, "loss": 2.2734, "step": 218620 }, { "epoch": 0.38, "learning_rate": 3.093677737978564e-05, "loss": 2.4496, "step": 218630 }, { "epoch": 0.38, "learning_rate": 3.093590543985881e-05, "loss": 2.4128, "step": 218640 }, { "epoch": 0.38, "learning_rate": 3.093503349993199e-05, "loss": 2.3573, "step": 218650 }, { "epoch": 0.38, "learning_rate": 3.0934161560005167e-05, "loss": 2.4494, "step": 218660 }, { "epoch": 0.38, "learning_rate": 3.093328962007834e-05, "loss": 2.4519, "step": 218670 }, { "epoch": 0.38, "learning_rate": 3.093241768015151e-05, "loss": 2.5883, "step": 218680 }, { "epoch": 0.38, "learning_rate": 3.0931545740224685e-05, "loss": 2.4336, "step": 218690 }, { "epoch": 0.38, "learning_rate": 3.0930673800297855e-05, "loss": 2.2765, "step": 218700 }, { "epoch": 0.38, "learning_rate": 3.0929801860371025e-05, "loss": 2.4942, "step": 218710 }, { "epoch": 0.38, "learning_rate": 3.09289299204442e-05, "loss": 2.3079, "step": 218720 }, { "epoch": 0.38, "learning_rate": 3.092805798051738e-05, "loss": 2.3511, "step": 218730 }, { "epoch": 0.38, "learning_rate": 3.092718604059055e-05, "loss": 2.5402, "step": 218740 }, { "epoch": 0.38, "learning_rate": 3.092631410066372e-05, "loss": 2.3192, "step": 218750 }, { "epoch": 0.38, "learning_rate": 3.09254421607369e-05, "loss": 2.3571, "step": 218760 }, { "epoch": 0.38, "learning_rate": 3.092457022081007e-05, "loss": 2.3554, "step": 218770 }, { "epoch": 0.38, "learning_rate": 3.092369828088324e-05, "loss": 2.2394, "step": 218780 }, { "epoch": 0.38, "learning_rate": 3.0922826340956415e-05, "loss": 2.4372, "step": 218790 }, { "epoch": 0.38, "learning_rate": 3.092195440102959e-05, "loss": 2.3665, "step": 218800 }, { "epoch": 0.38, "learning_rate": 3.092108246110276e-05, "loss": 2.4756, "step": 218810 }, { "epoch": 0.38, "learning_rate": 3.092021052117593e-05, "loss": 2.3534, "step": 218820 }, { "epoch": 0.38, "learning_rate": 3.091933858124911e-05, "loss": 2.4686, "step": 218830 }, { "epoch": 0.38, "learning_rate": 3.091846664132228e-05, "loss": 2.4002, "step": 218840 }, { "epoch": 0.38, "learning_rate": 3.091759470139545e-05, "loss": 2.3567, "step": 218850 }, { "epoch": 0.38, "learning_rate": 3.091672276146862e-05, "loss": 2.3728, "step": 218860 }, { "epoch": 0.38, "learning_rate": 3.0915850821541806e-05, "loss": 2.3398, "step": 218870 }, { "epoch": 0.38, "learning_rate": 3.0914978881614976e-05, "loss": 2.339, "step": 218880 }, { "epoch": 0.38, "learning_rate": 3.0914106941688146e-05, "loss": 2.4888, "step": 218890 }, { "epoch": 0.38, "learning_rate": 3.0913235001761324e-05, "loss": 2.4843, "step": 218900 }, { "epoch": 0.38, "learning_rate": 3.0912363061834494e-05, "loss": 2.542, "step": 218910 }, { "epoch": 0.38, "learning_rate": 3.0911491121907664e-05, "loss": 2.4153, "step": 218920 }, { "epoch": 0.38, "learning_rate": 3.0910619181980835e-05, "loss": 2.3253, "step": 218930 }, { "epoch": 0.38, "learning_rate": 3.090974724205401e-05, "loss": 2.4235, "step": 218940 }, { "epoch": 0.38, "learning_rate": 3.090887530212719e-05, "loss": 2.4738, "step": 218950 }, { "epoch": 0.38, "learning_rate": 3.090800336220036e-05, "loss": 2.4123, "step": 218960 }, { "epoch": 0.38, "learning_rate": 3.090713142227353e-05, "loss": 2.3408, "step": 218970 }, { "epoch": 0.38, "learning_rate": 3.090625948234671e-05, "loss": 2.3451, "step": 218980 }, { "epoch": 0.38, "learning_rate": 3.090538754241988e-05, "loss": 2.2698, "step": 218990 }, { "epoch": 0.38, "learning_rate": 3.090451560249305e-05, "loss": 2.4378, "step": 219000 }, { "epoch": 0.38, "learning_rate": 3.0903643662566225e-05, "loss": 2.4308, "step": 219010 }, { "epoch": 0.38, "learning_rate": 3.09027717226394e-05, "loss": 2.2904, "step": 219020 }, { "epoch": 0.38, "learning_rate": 3.090189978271257e-05, "loss": 2.4327, "step": 219030 }, { "epoch": 0.38, "learning_rate": 3.090102784278574e-05, "loss": 2.2951, "step": 219040 }, { "epoch": 0.38, "learning_rate": 3.090015590285892e-05, "loss": 2.3841, "step": 219050 }, { "epoch": 0.38, "learning_rate": 3.089928396293209e-05, "loss": 2.2962, "step": 219060 }, { "epoch": 0.38, "learning_rate": 3.089841202300526e-05, "loss": 2.4271, "step": 219070 }, { "epoch": 0.38, "learning_rate": 3.089754008307844e-05, "loss": 2.3686, "step": 219080 }, { "epoch": 0.38, "learning_rate": 3.0896668143151615e-05, "loss": 2.4467, "step": 219090 }, { "epoch": 0.38, "learning_rate": 3.0895796203224785e-05, "loss": 2.3321, "step": 219100 }, { "epoch": 0.38, "learning_rate": 3.0894924263297956e-05, "loss": 2.449, "step": 219110 }, { "epoch": 0.38, "learning_rate": 3.089405232337113e-05, "loss": 2.3713, "step": 219120 }, { "epoch": 0.38, "learning_rate": 3.08931803834443e-05, "loss": 2.4259, "step": 219130 }, { "epoch": 0.38, "learning_rate": 3.0892308443517474e-05, "loss": 2.4179, "step": 219140 }, { "epoch": 0.38, "learning_rate": 3.089143650359065e-05, "loss": 2.4932, "step": 219150 }, { "epoch": 0.38, "learning_rate": 3.089056456366382e-05, "loss": 2.3979, "step": 219160 }, { "epoch": 0.38, "learning_rate": 3.0889692623737e-05, "loss": 2.3317, "step": 219170 }, { "epoch": 0.38, "learning_rate": 3.088882068381017e-05, "loss": 2.4597, "step": 219180 }, { "epoch": 0.38, "learning_rate": 3.0887948743883346e-05, "loss": 2.304, "step": 219190 }, { "epoch": 0.38, "learning_rate": 3.0887076803956516e-05, "loss": 2.388, "step": 219200 }, { "epoch": 0.38, "learning_rate": 3.088620486402969e-05, "loss": 2.3984, "step": 219210 }, { "epoch": 0.38, "learning_rate": 3.0885332924102864e-05, "loss": 2.4573, "step": 219220 }, { "epoch": 0.38, "learning_rate": 3.0884460984176034e-05, "loss": 2.3247, "step": 219230 }, { "epoch": 0.38, "learning_rate": 3.088358904424921e-05, "loss": 2.451, "step": 219240 }, { "epoch": 0.38, "learning_rate": 3.088271710432238e-05, "loss": 2.4613, "step": 219250 }, { "epoch": 0.38, "learning_rate": 3.088184516439556e-05, "loss": 2.5041, "step": 219260 }, { "epoch": 0.38, "learning_rate": 3.088097322446873e-05, "loss": 2.3757, "step": 219270 }, { "epoch": 0.38, "learning_rate": 3.08801012845419e-05, "loss": 2.3702, "step": 219280 }, { "epoch": 0.38, "learning_rate": 3.087922934461508e-05, "loss": 2.3216, "step": 219290 }, { "epoch": 0.38, "learning_rate": 3.087835740468825e-05, "loss": 2.3721, "step": 219300 }, { "epoch": 0.38, "learning_rate": 3.087748546476142e-05, "loss": 2.3188, "step": 219310 }, { "epoch": 0.38, "learning_rate": 3.0876613524834595e-05, "loss": 2.4671, "step": 219320 }, { "epoch": 0.38, "learning_rate": 3.087574158490777e-05, "loss": 2.4944, "step": 219330 }, { "epoch": 0.38, "learning_rate": 3.087486964498094e-05, "loss": 2.5027, "step": 219340 }, { "epoch": 0.38, "learning_rate": 3.087399770505411e-05, "loss": 2.3971, "step": 219350 }, { "epoch": 0.38, "learning_rate": 3.087312576512729e-05, "loss": 2.3181, "step": 219360 }, { "epoch": 0.38, "learning_rate": 3.087225382520046e-05, "loss": 2.401, "step": 219370 }, { "epoch": 0.38, "learning_rate": 3.087138188527363e-05, "loss": 2.3652, "step": 219380 }, { "epoch": 0.38, "learning_rate": 3.087050994534681e-05, "loss": 2.4736, "step": 219390 }, { "epoch": 0.38, "learning_rate": 3.0869638005419985e-05, "loss": 2.3452, "step": 219400 }, { "epoch": 0.38, "learning_rate": 3.0868766065493155e-05, "loss": 2.4165, "step": 219410 }, { "epoch": 0.38, "learning_rate": 3.0867894125566326e-05, "loss": 2.416, "step": 219420 }, { "epoch": 0.38, "learning_rate": 3.0867022185639496e-05, "loss": 2.3319, "step": 219430 }, { "epoch": 0.38, "learning_rate": 3.086615024571267e-05, "loss": 2.3446, "step": 219440 }, { "epoch": 0.38, "learning_rate": 3.0865278305785844e-05, "loss": 2.3673, "step": 219450 }, { "epoch": 0.38, "learning_rate": 3.0864406365859014e-05, "loss": 2.3972, "step": 219460 }, { "epoch": 0.38, "learning_rate": 3.08635344259322e-05, "loss": 2.3483, "step": 219470 }, { "epoch": 0.38, "learning_rate": 3.086266248600537e-05, "loss": 2.3019, "step": 219480 }, { "epoch": 0.38, "learning_rate": 3.086179054607854e-05, "loss": 2.4144, "step": 219490 }, { "epoch": 0.38, "learning_rate": 3.086091860615171e-05, "loss": 2.3565, "step": 219500 }, { "epoch": 0.38, "learning_rate": 3.0860046666224886e-05, "loss": 2.2501, "step": 219510 }, { "epoch": 0.38, "learning_rate": 3.0859174726298057e-05, "loss": 2.3973, "step": 219520 }, { "epoch": 0.38, "learning_rate": 3.085830278637123e-05, "loss": 2.4944, "step": 219530 }, { "epoch": 0.38, "learning_rate": 3.0857430846444404e-05, "loss": 2.4709, "step": 219540 }, { "epoch": 0.38, "learning_rate": 3.085655890651758e-05, "loss": 2.4557, "step": 219550 }, { "epoch": 0.38, "learning_rate": 3.085568696659075e-05, "loss": 2.4846, "step": 219560 }, { "epoch": 0.38, "learning_rate": 3.085481502666392e-05, "loss": 2.4258, "step": 219570 }, { "epoch": 0.38, "learning_rate": 3.08539430867371e-05, "loss": 2.4485, "step": 219580 }, { "epoch": 0.38, "learning_rate": 3.085307114681027e-05, "loss": 2.4369, "step": 219590 }, { "epoch": 0.38, "learning_rate": 3.085219920688344e-05, "loss": 2.4114, "step": 219600 }, { "epoch": 0.38, "learning_rate": 3.085132726695662e-05, "loss": 2.3056, "step": 219610 }, { "epoch": 0.38, "learning_rate": 3.0850455327029794e-05, "loss": 2.3453, "step": 219620 }, { "epoch": 0.38, "learning_rate": 3.0849583387102965e-05, "loss": 2.507, "step": 219630 }, { "epoch": 0.38, "learning_rate": 3.0848711447176135e-05, "loss": 2.453, "step": 219640 }, { "epoch": 0.38, "learning_rate": 3.084783950724931e-05, "loss": 2.3168, "step": 219650 }, { "epoch": 0.38, "learning_rate": 3.084696756732248e-05, "loss": 2.3585, "step": 219660 }, { "epoch": 0.38, "learning_rate": 3.084609562739565e-05, "loss": 2.4609, "step": 219670 }, { "epoch": 0.38, "learning_rate": 3.084522368746883e-05, "loss": 2.4161, "step": 219680 }, { "epoch": 0.38, "learning_rate": 3.084435174754201e-05, "loss": 2.3752, "step": 219690 }, { "epoch": 0.38, "learning_rate": 3.084347980761518e-05, "loss": 2.4033, "step": 219700 }, { "epoch": 0.38, "learning_rate": 3.084260786768835e-05, "loss": 2.4724, "step": 219710 }, { "epoch": 0.38, "learning_rate": 3.0841735927761525e-05, "loss": 2.4783, "step": 219720 }, { "epoch": 0.38, "learning_rate": 3.0840863987834696e-05, "loss": 2.5021, "step": 219730 }, { "epoch": 0.38, "learning_rate": 3.0839992047907866e-05, "loss": 2.4954, "step": 219740 }, { "epoch": 0.38, "learning_rate": 3.083912010798104e-05, "loss": 2.3791, "step": 219750 }, { "epoch": 0.38, "learning_rate": 3.083824816805422e-05, "loss": 2.3617, "step": 219760 }, { "epoch": 0.38, "learning_rate": 3.083737622812739e-05, "loss": 2.4164, "step": 219770 }, { "epoch": 0.38, "learning_rate": 3.083650428820056e-05, "loss": 2.3965, "step": 219780 }, { "epoch": 0.38, "learning_rate": 3.083563234827374e-05, "loss": 2.4316, "step": 219790 }, { "epoch": 0.38, "learning_rate": 3.083476040834691e-05, "loss": 2.3516, "step": 219800 }, { "epoch": 0.38, "learning_rate": 3.083388846842008e-05, "loss": 2.4541, "step": 219810 }, { "epoch": 0.38, "learning_rate": 3.083301652849325e-05, "loss": 2.4653, "step": 219820 }, { "epoch": 0.38, "learning_rate": 3.0832144588566427e-05, "loss": 2.3306, "step": 219830 }, { "epoch": 0.38, "learning_rate": 3.0831272648639604e-05, "loss": 2.4571, "step": 219840 }, { "epoch": 0.38, "learning_rate": 3.0830400708712774e-05, "loss": 2.3896, "step": 219850 }, { "epoch": 0.38, "learning_rate": 3.082952876878595e-05, "loss": 2.4494, "step": 219860 }, { "epoch": 0.38, "learning_rate": 3.082865682885912e-05, "loss": 2.3522, "step": 219870 }, { "epoch": 0.38, "learning_rate": 3.082778488893229e-05, "loss": 2.4299, "step": 219880 }, { "epoch": 0.38, "learning_rate": 3.082691294900546e-05, "loss": 2.3781, "step": 219890 }, { "epoch": 0.38, "learning_rate": 3.082604100907864e-05, "loss": 2.422, "step": 219900 }, { "epoch": 0.38, "learning_rate": 3.082516906915182e-05, "loss": 2.4191, "step": 219910 }, { "epoch": 0.38, "learning_rate": 3.082429712922499e-05, "loss": 2.3743, "step": 219920 }, { "epoch": 0.38, "learning_rate": 3.082342518929816e-05, "loss": 2.3307, "step": 219930 }, { "epoch": 0.38, "learning_rate": 3.0822553249371335e-05, "loss": 2.3893, "step": 219940 }, { "epoch": 0.38, "learning_rate": 3.0821681309444505e-05, "loss": 2.4206, "step": 219950 }, { "epoch": 0.38, "learning_rate": 3.0820809369517675e-05, "loss": 2.3648, "step": 219960 }, { "epoch": 0.38, "learning_rate": 3.081993742959085e-05, "loss": 2.3318, "step": 219970 }, { "epoch": 0.38, "learning_rate": 3.081906548966402e-05, "loss": 2.3309, "step": 219980 }, { "epoch": 0.38, "learning_rate": 3.08181935497372e-05, "loss": 2.3593, "step": 219990 }, { "epoch": 0.38, "learning_rate": 3.081732160981037e-05, "loss": 2.4683, "step": 220000 }, { "epoch": 0.38, "learning_rate": 3.081644966988355e-05, "loss": 2.3946, "step": 220010 }, { "epoch": 0.38, "learning_rate": 3.081557772995672e-05, "loss": 2.3775, "step": 220020 }, { "epoch": 0.38, "learning_rate": 3.081470579002989e-05, "loss": 2.434, "step": 220030 }, { "epoch": 0.38, "learning_rate": 3.0813833850103066e-05, "loss": 2.3122, "step": 220040 }, { "epoch": 0.38, "learning_rate": 3.0812961910176236e-05, "loss": 2.4275, "step": 220050 }, { "epoch": 0.38, "learning_rate": 3.081208997024941e-05, "loss": 2.4542, "step": 220060 }, { "epoch": 0.38, "learning_rate": 3.0811218030322583e-05, "loss": 2.4001, "step": 220070 }, { "epoch": 0.38, "learning_rate": 3.081034609039576e-05, "loss": 2.4276, "step": 220080 }, { "epoch": 0.38, "learning_rate": 3.080947415046893e-05, "loss": 2.4589, "step": 220090 }, { "epoch": 0.38, "learning_rate": 3.08086022105421e-05, "loss": 2.4639, "step": 220100 }, { "epoch": 0.38, "learning_rate": 3.080773027061528e-05, "loss": 2.4465, "step": 220110 }, { "epoch": 0.38, "learning_rate": 3.080685833068845e-05, "loss": 2.3854, "step": 220120 }, { "epoch": 0.38, "learning_rate": 3.080598639076162e-05, "loss": 2.3576, "step": 220130 }, { "epoch": 0.38, "learning_rate": 3.0805114450834796e-05, "loss": 2.4477, "step": 220140 }, { "epoch": 0.38, "learning_rate": 3.0804242510907974e-05, "loss": 2.3764, "step": 220150 }, { "epoch": 0.38, "learning_rate": 3.0803370570981144e-05, "loss": 2.4282, "step": 220160 }, { "epoch": 0.38, "learning_rate": 3.0802498631054314e-05, "loss": 2.4217, "step": 220170 }, { "epoch": 0.38, "learning_rate": 3.080162669112749e-05, "loss": 2.4261, "step": 220180 }, { "epoch": 0.38, "learning_rate": 3.080075475120066e-05, "loss": 2.4379, "step": 220190 }, { "epoch": 0.38, "learning_rate": 3.079988281127383e-05, "loss": 2.5129, "step": 220200 }, { "epoch": 0.38, "learning_rate": 3.079901087134701e-05, "loss": 2.4443, "step": 220210 }, { "epoch": 0.38, "learning_rate": 3.0798138931420187e-05, "loss": 2.3999, "step": 220220 }, { "epoch": 0.38, "learning_rate": 3.079726699149336e-05, "loss": 2.4491, "step": 220230 }, { "epoch": 0.38, "learning_rate": 3.079639505156653e-05, "loss": 2.4375, "step": 220240 }, { "epoch": 0.38, "learning_rate": 3.0795523111639705e-05, "loss": 2.2736, "step": 220250 }, { "epoch": 0.38, "learning_rate": 3.0794651171712875e-05, "loss": 2.482, "step": 220260 }, { "epoch": 0.38, "learning_rate": 3.0793779231786045e-05, "loss": 2.5344, "step": 220270 }, { "epoch": 0.38, "learning_rate": 3.079290729185922e-05, "loss": 2.3401, "step": 220280 }, { "epoch": 0.38, "learning_rate": 3.07920353519324e-05, "loss": 2.6185, "step": 220290 }, { "epoch": 0.38, "learning_rate": 3.079116341200557e-05, "loss": 2.4605, "step": 220300 }, { "epoch": 0.38, "learning_rate": 3.079029147207874e-05, "loss": 2.3403, "step": 220310 }, { "epoch": 0.38, "learning_rate": 3.078941953215191e-05, "loss": 2.5613, "step": 220320 }, { "epoch": 0.38, "learning_rate": 3.078854759222509e-05, "loss": 2.4331, "step": 220330 }, { "epoch": 0.38, "learning_rate": 3.078767565229826e-05, "loss": 2.3263, "step": 220340 }, { "epoch": 0.38, "learning_rate": 3.078680371237143e-05, "loss": 2.3976, "step": 220350 }, { "epoch": 0.38, "learning_rate": 3.078593177244461e-05, "loss": 2.3361, "step": 220360 }, { "epoch": 0.38, "learning_rate": 3.078505983251778e-05, "loss": 2.5645, "step": 220370 }, { "epoch": 0.38, "learning_rate": 3.078418789259095e-05, "loss": 2.265, "step": 220380 }, { "epoch": 0.38, "learning_rate": 3.0783315952664124e-05, "loss": 2.3827, "step": 220390 }, { "epoch": 0.38, "learning_rate": 3.07824440127373e-05, "loss": 2.4246, "step": 220400 }, { "epoch": 0.38, "learning_rate": 3.078157207281047e-05, "loss": 2.3858, "step": 220410 }, { "epoch": 0.38, "learning_rate": 3.078070013288364e-05, "loss": 2.4091, "step": 220420 }, { "epoch": 0.38, "learning_rate": 3.077982819295682e-05, "loss": 2.2833, "step": 220430 }, { "epoch": 0.38, "learning_rate": 3.0778956253029996e-05, "loss": 2.4121, "step": 220440 }, { "epoch": 0.38, "learning_rate": 3.0778084313103166e-05, "loss": 2.3893, "step": 220450 }, { "epoch": 0.38, "learning_rate": 3.077721237317634e-05, "loss": 2.3872, "step": 220460 }, { "epoch": 0.38, "learning_rate": 3.0776340433249514e-05, "loss": 2.3849, "step": 220470 }, { "epoch": 0.38, "learning_rate": 3.0775468493322684e-05, "loss": 2.3256, "step": 220480 }, { "epoch": 0.38, "learning_rate": 3.0774596553395855e-05, "loss": 2.4281, "step": 220490 }, { "epoch": 0.38, "learning_rate": 3.077372461346903e-05, "loss": 2.3624, "step": 220500 }, { "epoch": 0.38, "learning_rate": 3.077285267354221e-05, "loss": 2.4482, "step": 220510 }, { "epoch": 0.38, "learning_rate": 3.077198073361538e-05, "loss": 2.4134, "step": 220520 }, { "epoch": 0.38, "learning_rate": 3.077110879368855e-05, "loss": 2.4123, "step": 220530 }, { "epoch": 0.38, "learning_rate": 3.077023685376173e-05, "loss": 2.4431, "step": 220540 }, { "epoch": 0.38, "learning_rate": 3.07693649138349e-05, "loss": 2.4778, "step": 220550 }, { "epoch": 0.38, "learning_rate": 3.076849297390807e-05, "loss": 2.4132, "step": 220560 }, { "epoch": 0.38, "learning_rate": 3.0767621033981245e-05, "loss": 2.4273, "step": 220570 }, { "epoch": 0.38, "learning_rate": 3.076674909405442e-05, "loss": 2.4297, "step": 220580 }, { "epoch": 0.38, "learning_rate": 3.076587715412759e-05, "loss": 2.405, "step": 220590 }, { "epoch": 0.38, "learning_rate": 3.076500521420076e-05, "loss": 2.4745, "step": 220600 }, { "epoch": 0.38, "learning_rate": 3.076413327427394e-05, "loss": 2.3984, "step": 220610 }, { "epoch": 0.38, "learning_rate": 3.076326133434711e-05, "loss": 2.4243, "step": 220620 }, { "epoch": 0.38, "learning_rate": 3.076238939442028e-05, "loss": 2.3327, "step": 220630 }, { "epoch": 0.38, "learning_rate": 3.076151745449346e-05, "loss": 2.4472, "step": 220640 }, { "epoch": 0.38, "learning_rate": 3.076064551456663e-05, "loss": 2.4225, "step": 220650 }, { "epoch": 0.38, "learning_rate": 3.0759773574639805e-05, "loss": 2.3931, "step": 220660 }, { "epoch": 0.38, "learning_rate": 3.0758901634712976e-05, "loss": 2.4382, "step": 220670 }, { "epoch": 0.38, "learning_rate": 3.075802969478615e-05, "loss": 2.4582, "step": 220680 }, { "epoch": 0.38, "learning_rate": 3.075715775485932e-05, "loss": 2.4426, "step": 220690 }, { "epoch": 0.38, "learning_rate": 3.0756285814932494e-05, "loss": 2.2736, "step": 220700 }, { "epoch": 0.38, "learning_rate": 3.075541387500567e-05, "loss": 2.4874, "step": 220710 }, { "epoch": 0.38, "learning_rate": 3.075454193507884e-05, "loss": 2.5076, "step": 220720 }, { "epoch": 0.38, "learning_rate": 3.075366999515202e-05, "loss": 2.5026, "step": 220730 }, { "epoch": 0.38, "learning_rate": 3.075279805522519e-05, "loss": 2.5884, "step": 220740 }, { "epoch": 0.38, "learning_rate": 3.0751926115298366e-05, "loss": 2.2963, "step": 220750 }, { "epoch": 0.38, "learning_rate": 3.0751054175371536e-05, "loss": 2.4193, "step": 220760 }, { "epoch": 0.38, "learning_rate": 3.075018223544471e-05, "loss": 2.2332, "step": 220770 }, { "epoch": 0.39, "learning_rate": 3.074931029551788e-05, "loss": 2.4148, "step": 220780 }, { "epoch": 0.39, "learning_rate": 3.0748438355591054e-05, "loss": 2.5514, "step": 220790 }, { "epoch": 0.39, "learning_rate": 3.0747566415664225e-05, "loss": 2.2729, "step": 220800 }, { "epoch": 0.39, "learning_rate": 3.07466944757374e-05, "loss": 2.4196, "step": 220810 }, { "epoch": 0.39, "learning_rate": 3.074582253581058e-05, "loss": 2.3122, "step": 220820 }, { "epoch": 0.39, "learning_rate": 3.074495059588375e-05, "loss": 2.3815, "step": 220830 }, { "epoch": 0.39, "learning_rate": 3.074407865595692e-05, "loss": 2.4283, "step": 220840 }, { "epoch": 0.39, "learning_rate": 3.074320671603009e-05, "loss": 2.4718, "step": 220850 }, { "epoch": 0.39, "learning_rate": 3.074233477610327e-05, "loss": 2.4984, "step": 220860 }, { "epoch": 0.39, "learning_rate": 3.074146283617644e-05, "loss": 2.3594, "step": 220870 }, { "epoch": 0.39, "learning_rate": 3.0740590896249615e-05, "loss": 2.4588, "step": 220880 }, { "epoch": 0.39, "learning_rate": 3.0739718956322785e-05, "loss": 2.3204, "step": 220890 }, { "epoch": 0.39, "learning_rate": 3.073884701639596e-05, "loss": 2.3925, "step": 220900 }, { "epoch": 0.39, "learning_rate": 3.073797507646913e-05, "loss": 2.3953, "step": 220910 }, { "epoch": 0.39, "learning_rate": 3.07371031365423e-05, "loss": 2.3742, "step": 220920 }, { "epoch": 0.39, "learning_rate": 3.073623119661548e-05, "loss": 2.5209, "step": 220930 }, { "epoch": 0.39, "learning_rate": 3.073535925668865e-05, "loss": 2.4091, "step": 220940 }, { "epoch": 0.39, "learning_rate": 3.073448731676183e-05, "loss": 2.4941, "step": 220950 }, { "epoch": 0.39, "learning_rate": 3.0733615376835e-05, "loss": 2.3396, "step": 220960 }, { "epoch": 0.39, "learning_rate": 3.0732743436908175e-05, "loss": 2.4468, "step": 220970 }, { "epoch": 0.39, "learning_rate": 3.0731871496981346e-05, "loss": 2.306, "step": 220980 }, { "epoch": 0.39, "learning_rate": 3.0730999557054516e-05, "loss": 2.4959, "step": 220990 }, { "epoch": 0.39, "learning_rate": 3.073012761712769e-05, "loss": 2.3464, "step": 221000 }, { "epoch": 0.39, "learning_rate": 3.0729255677200864e-05, "loss": 2.3416, "step": 221010 }, { "epoch": 0.39, "learning_rate": 3.0728383737274034e-05, "loss": 2.2784, "step": 221020 }, { "epoch": 0.39, "learning_rate": 3.072751179734721e-05, "loss": 2.329, "step": 221030 }, { "epoch": 0.39, "learning_rate": 3.072663985742039e-05, "loss": 2.4687, "step": 221040 }, { "epoch": 0.39, "learning_rate": 3.072576791749356e-05, "loss": 2.4926, "step": 221050 }, { "epoch": 0.39, "learning_rate": 3.072489597756673e-05, "loss": 2.287, "step": 221060 }, { "epoch": 0.39, "learning_rate": 3.0724024037639906e-05, "loss": 2.4409, "step": 221070 }, { "epoch": 0.39, "learning_rate": 3.0723152097713077e-05, "loss": 2.4169, "step": 221080 }, { "epoch": 0.39, "learning_rate": 3.072228015778625e-05, "loss": 2.33, "step": 221090 }, { "epoch": 0.39, "learning_rate": 3.0721408217859424e-05, "loss": 2.4557, "step": 221100 }, { "epoch": 0.39, "learning_rate": 3.07205362779326e-05, "loss": 2.4461, "step": 221110 }, { "epoch": 0.39, "learning_rate": 3.071966433800577e-05, "loss": 2.4407, "step": 221120 }, { "epoch": 0.39, "learning_rate": 3.071879239807894e-05, "loss": 2.343, "step": 221130 }, { "epoch": 0.39, "learning_rate": 3.071792045815212e-05, "loss": 2.4102, "step": 221140 }, { "epoch": 0.39, "learning_rate": 3.071704851822529e-05, "loss": 2.4164, "step": 221150 }, { "epoch": 0.39, "learning_rate": 3.071617657829846e-05, "loss": 2.4123, "step": 221160 }, { "epoch": 0.39, "learning_rate": 3.071530463837163e-05, "loss": 2.5312, "step": 221170 }, { "epoch": 0.39, "learning_rate": 3.0714432698444814e-05, "loss": 2.5306, "step": 221180 }, { "epoch": 0.39, "learning_rate": 3.0713560758517985e-05, "loss": 2.405, "step": 221190 }, { "epoch": 0.39, "learning_rate": 3.0712688818591155e-05, "loss": 2.2547, "step": 221200 }, { "epoch": 0.39, "learning_rate": 3.071181687866433e-05, "loss": 2.4021, "step": 221210 }, { "epoch": 0.39, "learning_rate": 3.07109449387375e-05, "loss": 2.4599, "step": 221220 }, { "epoch": 0.39, "learning_rate": 3.071007299881067e-05, "loss": 2.3919, "step": 221230 }, { "epoch": 0.39, "learning_rate": 3.070920105888384e-05, "loss": 2.5551, "step": 221240 }, { "epoch": 0.39, "learning_rate": 3.070832911895703e-05, "loss": 2.4523, "step": 221250 }, { "epoch": 0.39, "learning_rate": 3.07074571790302e-05, "loss": 2.3258, "step": 221260 }, { "epoch": 0.39, "learning_rate": 3.070658523910337e-05, "loss": 2.2031, "step": 221270 }, { "epoch": 0.39, "learning_rate": 3.070571329917654e-05, "loss": 2.4316, "step": 221280 }, { "epoch": 0.39, "learning_rate": 3.0704841359249716e-05, "loss": 2.5034, "step": 221290 }, { "epoch": 0.39, "learning_rate": 3.0703969419322886e-05, "loss": 2.3911, "step": 221300 }, { "epoch": 0.39, "learning_rate": 3.0703097479396056e-05, "loss": 2.3742, "step": 221310 }, { "epoch": 0.39, "learning_rate": 3.0702225539469234e-05, "loss": 2.3617, "step": 221320 }, { "epoch": 0.39, "learning_rate": 3.070135359954241e-05, "loss": 2.4834, "step": 221330 }, { "epoch": 0.39, "learning_rate": 3.070048165961558e-05, "loss": 2.3477, "step": 221340 }, { "epoch": 0.39, "learning_rate": 3.069960971968875e-05, "loss": 2.386, "step": 221350 }, { "epoch": 0.39, "learning_rate": 3.069873777976193e-05, "loss": 2.4411, "step": 221360 }, { "epoch": 0.39, "learning_rate": 3.06978658398351e-05, "loss": 2.3036, "step": 221370 }, { "epoch": 0.39, "learning_rate": 3.069699389990827e-05, "loss": 2.4537, "step": 221380 }, { "epoch": 0.39, "learning_rate": 3.0696121959981447e-05, "loss": 2.4622, "step": 221390 }, { "epoch": 0.39, "learning_rate": 3.0695250020054624e-05, "loss": 2.3244, "step": 221400 }, { "epoch": 0.39, "learning_rate": 3.0694378080127794e-05, "loss": 2.3704, "step": 221410 }, { "epoch": 0.39, "learning_rate": 3.0693506140200964e-05, "loss": 2.4831, "step": 221420 }, { "epoch": 0.39, "learning_rate": 3.069263420027414e-05, "loss": 2.4986, "step": 221430 }, { "epoch": 0.39, "learning_rate": 3.069176226034731e-05, "loss": 2.4865, "step": 221440 }, { "epoch": 0.39, "learning_rate": 3.069089032042048e-05, "loss": 2.2011, "step": 221450 }, { "epoch": 0.39, "learning_rate": 3.069001838049366e-05, "loss": 2.448, "step": 221460 }, { "epoch": 0.39, "learning_rate": 3.068914644056683e-05, "loss": 2.5187, "step": 221470 }, { "epoch": 0.39, "learning_rate": 3.068827450064001e-05, "loss": 2.4738, "step": 221480 }, { "epoch": 0.39, "learning_rate": 3.068740256071318e-05, "loss": 2.3584, "step": 221490 }, { "epoch": 0.39, "learning_rate": 3.0686530620786355e-05, "loss": 2.2956, "step": 221500 }, { "epoch": 0.39, "learning_rate": 3.0685658680859525e-05, "loss": 2.4209, "step": 221510 }, { "epoch": 0.39, "learning_rate": 3.0684786740932695e-05, "loss": 2.3908, "step": 221520 }, { "epoch": 0.39, "learning_rate": 3.068391480100587e-05, "loss": 2.4011, "step": 221530 }, { "epoch": 0.39, "learning_rate": 3.068304286107904e-05, "loss": 2.5407, "step": 221540 }, { "epoch": 0.39, "learning_rate": 3.068217092115222e-05, "loss": 2.419, "step": 221550 }, { "epoch": 0.39, "learning_rate": 3.068129898122539e-05, "loss": 2.389, "step": 221560 }, { "epoch": 0.39, "learning_rate": 3.068042704129857e-05, "loss": 2.2761, "step": 221570 }, { "epoch": 0.39, "learning_rate": 3.067955510137174e-05, "loss": 2.3897, "step": 221580 }, { "epoch": 0.39, "learning_rate": 3.067868316144491e-05, "loss": 2.4084, "step": 221590 }, { "epoch": 0.39, "learning_rate": 3.0677811221518086e-05, "loss": 2.4065, "step": 221600 }, { "epoch": 0.39, "learning_rate": 3.0676939281591256e-05, "loss": 2.4565, "step": 221610 }, { "epoch": 0.39, "learning_rate": 3.067606734166443e-05, "loss": 2.4221, "step": 221620 }, { "epoch": 0.39, "learning_rate": 3.0675195401737603e-05, "loss": 2.4128, "step": 221630 }, { "epoch": 0.39, "learning_rate": 3.067432346181078e-05, "loss": 2.4099, "step": 221640 }, { "epoch": 0.39, "learning_rate": 3.067345152188395e-05, "loss": 2.3207, "step": 221650 }, { "epoch": 0.39, "learning_rate": 3.067257958195712e-05, "loss": 2.3479, "step": 221660 }, { "epoch": 0.39, "learning_rate": 3.067170764203029e-05, "loss": 2.3407, "step": 221670 }, { "epoch": 0.39, "learning_rate": 3.067083570210347e-05, "loss": 2.4024, "step": 221680 }, { "epoch": 0.39, "learning_rate": 3.066996376217664e-05, "loss": 2.3508, "step": 221690 }, { "epoch": 0.39, "learning_rate": 3.0669091822249816e-05, "loss": 2.3865, "step": 221700 }, { "epoch": 0.39, "learning_rate": 3.0668219882322994e-05, "loss": 2.3508, "step": 221710 }, { "epoch": 0.39, "learning_rate": 3.0667347942396164e-05, "loss": 2.3831, "step": 221720 }, { "epoch": 0.39, "learning_rate": 3.0666476002469334e-05, "loss": 2.4501, "step": 221730 }, { "epoch": 0.39, "learning_rate": 3.0665604062542505e-05, "loss": 2.4623, "step": 221740 }, { "epoch": 0.39, "learning_rate": 3.066473212261568e-05, "loss": 2.4777, "step": 221750 }, { "epoch": 0.39, "learning_rate": 3.066386018268885e-05, "loss": 2.3716, "step": 221760 }, { "epoch": 0.39, "learning_rate": 3.066298824276203e-05, "loss": 2.4841, "step": 221770 }, { "epoch": 0.39, "learning_rate": 3.06621163028352e-05, "loss": 2.4094, "step": 221780 }, { "epoch": 0.39, "learning_rate": 3.066124436290838e-05, "loss": 2.3743, "step": 221790 }, { "epoch": 0.39, "learning_rate": 3.066037242298155e-05, "loss": 2.4228, "step": 221800 }, { "epoch": 0.39, "learning_rate": 3.065950048305472e-05, "loss": 2.3512, "step": 221810 }, { "epoch": 0.39, "learning_rate": 3.0658628543127895e-05, "loss": 2.4001, "step": 221820 }, { "epoch": 0.39, "learning_rate": 3.0657756603201065e-05, "loss": 2.4233, "step": 221830 }, { "epoch": 0.39, "learning_rate": 3.0656884663274236e-05, "loss": 2.4672, "step": 221840 }, { "epoch": 0.39, "learning_rate": 3.065601272334741e-05, "loss": 2.5508, "step": 221850 }, { "epoch": 0.39, "learning_rate": 3.065514078342059e-05, "loss": 2.4285, "step": 221860 }, { "epoch": 0.39, "learning_rate": 3.065426884349376e-05, "loss": 2.3135, "step": 221870 }, { "epoch": 0.39, "learning_rate": 3.065339690356693e-05, "loss": 2.4251, "step": 221880 }, { "epoch": 0.39, "learning_rate": 3.065252496364011e-05, "loss": 2.4781, "step": 221890 }, { "epoch": 0.39, "learning_rate": 3.065165302371328e-05, "loss": 2.4958, "step": 221900 }, { "epoch": 0.39, "learning_rate": 3.065078108378645e-05, "loss": 2.3911, "step": 221910 }, { "epoch": 0.39, "learning_rate": 3.0649909143859626e-05, "loss": 2.3769, "step": 221920 }, { "epoch": 0.39, "learning_rate": 3.06490372039328e-05, "loss": 2.379, "step": 221930 }, { "epoch": 0.39, "learning_rate": 3.064816526400597e-05, "loss": 2.3222, "step": 221940 }, { "epoch": 0.39, "learning_rate": 3.0647293324079144e-05, "loss": 2.3922, "step": 221950 }, { "epoch": 0.39, "learning_rate": 3.064642138415232e-05, "loss": 2.4247, "step": 221960 }, { "epoch": 0.39, "learning_rate": 3.064554944422549e-05, "loss": 2.4008, "step": 221970 }, { "epoch": 0.39, "learning_rate": 3.064467750429866e-05, "loss": 2.3837, "step": 221980 }, { "epoch": 0.39, "learning_rate": 3.064380556437184e-05, "loss": 2.392, "step": 221990 }, { "epoch": 0.39, "learning_rate": 3.0642933624445016e-05, "loss": 2.4082, "step": 222000 }, { "epoch": 0.39, "learning_rate": 3.0642061684518186e-05, "loss": 2.4928, "step": 222010 }, { "epoch": 0.39, "learning_rate": 3.064118974459136e-05, "loss": 2.3022, "step": 222020 }, { "epoch": 0.39, "learning_rate": 3.0640317804664534e-05, "loss": 2.3594, "step": 222030 }, { "epoch": 0.39, "learning_rate": 3.0639445864737704e-05, "loss": 2.4334, "step": 222040 }, { "epoch": 0.39, "learning_rate": 3.0638573924810875e-05, "loss": 2.3963, "step": 222050 }, { "epoch": 0.39, "learning_rate": 3.063770198488405e-05, "loss": 2.4585, "step": 222060 }, { "epoch": 0.39, "learning_rate": 3.063683004495723e-05, "loss": 2.3863, "step": 222070 }, { "epoch": 0.39, "learning_rate": 3.06359581050304e-05, "loss": 2.4689, "step": 222080 }, { "epoch": 0.39, "learning_rate": 3.063508616510357e-05, "loss": 2.3479, "step": 222090 }, { "epoch": 0.39, "learning_rate": 3.063421422517675e-05, "loss": 2.338, "step": 222100 }, { "epoch": 0.39, "learning_rate": 3.063334228524992e-05, "loss": 2.4688, "step": 222110 }, { "epoch": 0.39, "learning_rate": 3.063247034532309e-05, "loss": 2.3733, "step": 222120 }, { "epoch": 0.39, "learning_rate": 3.063159840539626e-05, "loss": 2.4046, "step": 222130 }, { "epoch": 0.39, "learning_rate": 3.063072646546944e-05, "loss": 2.2712, "step": 222140 }, { "epoch": 0.39, "learning_rate": 3.062985452554261e-05, "loss": 2.4299, "step": 222150 }, { "epoch": 0.39, "learning_rate": 3.062898258561578e-05, "loss": 2.4678, "step": 222160 }, { "epoch": 0.39, "learning_rate": 3.062811064568896e-05, "loss": 2.4169, "step": 222170 }, { "epoch": 0.39, "learning_rate": 3.062723870576213e-05, "loss": 2.3934, "step": 222180 }, { "epoch": 0.39, "learning_rate": 3.06263667658353e-05, "loss": 2.2935, "step": 222190 }, { "epoch": 0.39, "learning_rate": 3.062549482590847e-05, "loss": 2.3706, "step": 222200 }, { "epoch": 0.39, "learning_rate": 3.062462288598165e-05, "loss": 2.4223, "step": 222210 }, { "epoch": 0.39, "learning_rate": 3.0623750946054825e-05, "loss": 2.4367, "step": 222220 }, { "epoch": 0.39, "learning_rate": 3.0622879006127996e-05, "loss": 2.4341, "step": 222230 }, { "epoch": 0.39, "learning_rate": 3.0622007066201166e-05, "loss": 2.4594, "step": 222240 }, { "epoch": 0.39, "learning_rate": 3.062113512627434e-05, "loss": 2.2921, "step": 222250 }, { "epoch": 0.39, "learning_rate": 3.0620263186347514e-05, "loss": 2.3994, "step": 222260 }, { "epoch": 0.39, "learning_rate": 3.0619391246420684e-05, "loss": 2.3272, "step": 222270 }, { "epoch": 0.39, "learning_rate": 3.061851930649386e-05, "loss": 2.4161, "step": 222280 }, { "epoch": 0.39, "learning_rate": 3.061764736656704e-05, "loss": 2.3757, "step": 222290 }, { "epoch": 0.39, "learning_rate": 3.061677542664021e-05, "loss": 2.4055, "step": 222300 }, { "epoch": 0.39, "learning_rate": 3.061590348671338e-05, "loss": 2.3691, "step": 222310 }, { "epoch": 0.39, "learning_rate": 3.0615031546786556e-05, "loss": 2.3895, "step": 222320 }, { "epoch": 0.39, "learning_rate": 3.061415960685973e-05, "loss": 2.4458, "step": 222330 }, { "epoch": 0.39, "learning_rate": 3.06132876669329e-05, "loss": 2.2778, "step": 222340 }, { "epoch": 0.39, "learning_rate": 3.0612415727006074e-05, "loss": 2.3017, "step": 222350 }, { "epoch": 0.39, "learning_rate": 3.0611543787079245e-05, "loss": 2.3786, "step": 222360 }, { "epoch": 0.39, "learning_rate": 3.061067184715242e-05, "loss": 2.3347, "step": 222370 }, { "epoch": 0.39, "learning_rate": 3.060979990722559e-05, "loss": 2.5736, "step": 222380 }, { "epoch": 0.39, "learning_rate": 3.060892796729877e-05, "loss": 2.3233, "step": 222390 }, { "epoch": 0.39, "learning_rate": 3.060805602737194e-05, "loss": 2.3949, "step": 222400 }, { "epoch": 0.39, "learning_rate": 3.060718408744511e-05, "loss": 2.4063, "step": 222410 }, { "epoch": 0.39, "learning_rate": 3.060631214751829e-05, "loss": 2.3705, "step": 222420 }, { "epoch": 0.39, "learning_rate": 3.060544020759146e-05, "loss": 2.408, "step": 222430 }, { "epoch": 0.39, "learning_rate": 3.0604568267664635e-05, "loss": 2.3447, "step": 222440 }, { "epoch": 0.39, "learning_rate": 3.0603696327737805e-05, "loss": 2.4829, "step": 222450 }, { "epoch": 0.39, "learning_rate": 3.060282438781098e-05, "loss": 2.3946, "step": 222460 }, { "epoch": 0.39, "learning_rate": 3.060195244788415e-05, "loss": 2.3973, "step": 222470 }, { "epoch": 0.39, "learning_rate": 3.060108050795732e-05, "loss": 2.4347, "step": 222480 }, { "epoch": 0.39, "learning_rate": 3.06002085680305e-05, "loss": 2.3386, "step": 222490 }, { "epoch": 0.39, "learning_rate": 3.059933662810367e-05, "loss": 2.4312, "step": 222500 }, { "epoch": 0.39, "learning_rate": 3.059846468817684e-05, "loss": 2.4465, "step": 222510 }, { "epoch": 0.39, "learning_rate": 3.059759274825002e-05, "loss": 2.3666, "step": 222520 }, { "epoch": 0.39, "learning_rate": 3.0596720808323195e-05, "loss": 2.3695, "step": 222530 }, { "epoch": 0.39, "learning_rate": 3.0595848868396366e-05, "loss": 2.3584, "step": 222540 }, { "epoch": 0.39, "learning_rate": 3.0594976928469536e-05, "loss": 2.4464, "step": 222550 }, { "epoch": 0.39, "learning_rate": 3.059410498854271e-05, "loss": 2.4993, "step": 222560 }, { "epoch": 0.39, "learning_rate": 3.0593233048615884e-05, "loss": 2.419, "step": 222570 }, { "epoch": 0.39, "learning_rate": 3.0592361108689054e-05, "loss": 2.3024, "step": 222580 }, { "epoch": 0.39, "learning_rate": 3.059148916876223e-05, "loss": 2.4065, "step": 222590 }, { "epoch": 0.39, "learning_rate": 3.059061722883541e-05, "loss": 2.4622, "step": 222600 }, { "epoch": 0.39, "learning_rate": 3.058974528890858e-05, "loss": 2.4306, "step": 222610 }, { "epoch": 0.39, "learning_rate": 3.058887334898175e-05, "loss": 2.4311, "step": 222620 }, { "epoch": 0.39, "learning_rate": 3.058800140905492e-05, "loss": 2.4826, "step": 222630 }, { "epoch": 0.39, "learning_rate": 3.05871294691281e-05, "loss": 2.5891, "step": 222640 }, { "epoch": 0.39, "learning_rate": 3.058625752920127e-05, "loss": 2.5458, "step": 222650 }, { "epoch": 0.39, "learning_rate": 3.058538558927444e-05, "loss": 2.4952, "step": 222660 }, { "epoch": 0.39, "learning_rate": 3.058451364934762e-05, "loss": 2.3108, "step": 222670 }, { "epoch": 0.39, "learning_rate": 3.058364170942079e-05, "loss": 2.4945, "step": 222680 }, { "epoch": 0.39, "learning_rate": 3.058276976949396e-05, "loss": 2.3559, "step": 222690 }, { "epoch": 0.39, "learning_rate": 3.058189782956713e-05, "loss": 2.4597, "step": 222700 }, { "epoch": 0.39, "learning_rate": 3.058102588964031e-05, "loss": 2.2791, "step": 222710 }, { "epoch": 0.39, "learning_rate": 3.058015394971348e-05, "loss": 2.3924, "step": 222720 }, { "epoch": 0.39, "learning_rate": 3.057928200978665e-05, "loss": 2.366, "step": 222730 }, { "epoch": 0.39, "learning_rate": 3.057841006985983e-05, "loss": 2.3724, "step": 222740 }, { "epoch": 0.39, "learning_rate": 3.0577538129933005e-05, "loss": 2.3295, "step": 222750 }, { "epoch": 0.39, "learning_rate": 3.0576666190006175e-05, "loss": 2.366, "step": 222760 }, { "epoch": 0.39, "learning_rate": 3.0575794250079345e-05, "loss": 2.4688, "step": 222770 }, { "epoch": 0.39, "learning_rate": 3.057492231015252e-05, "loss": 2.3258, "step": 222780 }, { "epoch": 0.39, "learning_rate": 3.057405037022569e-05, "loss": 2.4736, "step": 222790 }, { "epoch": 0.39, "learning_rate": 3.0573178430298863e-05, "loss": 2.3895, "step": 222800 }, { "epoch": 0.39, "learning_rate": 3.057230649037204e-05, "loss": 2.5169, "step": 222810 }, { "epoch": 0.39, "learning_rate": 3.057143455044522e-05, "loss": 2.5234, "step": 222820 }, { "epoch": 0.39, "learning_rate": 3.057056261051839e-05, "loss": 2.5532, "step": 222830 }, { "epoch": 0.39, "learning_rate": 3.056969067059156e-05, "loss": 2.4576, "step": 222840 }, { "epoch": 0.39, "learning_rate": 3.0568818730664736e-05, "loss": 2.5279, "step": 222850 }, { "epoch": 0.39, "learning_rate": 3.0567946790737906e-05, "loss": 2.4529, "step": 222860 }, { "epoch": 0.39, "learning_rate": 3.0567074850811076e-05, "loss": 2.4246, "step": 222870 }, { "epoch": 0.39, "learning_rate": 3.0566202910884254e-05, "loss": 2.4192, "step": 222880 }, { "epoch": 0.39, "learning_rate": 3.056533097095743e-05, "loss": 2.4604, "step": 222890 }, { "epoch": 0.39, "learning_rate": 3.05644590310306e-05, "loss": 2.4744, "step": 222900 }, { "epoch": 0.39, "learning_rate": 3.056358709110377e-05, "loss": 2.3649, "step": 222910 }, { "epoch": 0.39, "learning_rate": 3.056271515117695e-05, "loss": 2.3258, "step": 222920 }, { "epoch": 0.39, "learning_rate": 3.056184321125012e-05, "loss": 2.4366, "step": 222930 }, { "epoch": 0.39, "learning_rate": 3.056097127132329e-05, "loss": 2.3586, "step": 222940 }, { "epoch": 0.39, "learning_rate": 3.0560099331396467e-05, "loss": 2.2794, "step": 222950 }, { "epoch": 0.39, "learning_rate": 3.0559227391469644e-05, "loss": 2.5327, "step": 222960 }, { "epoch": 0.39, "learning_rate": 3.0558355451542814e-05, "loss": 2.4295, "step": 222970 }, { "epoch": 0.39, "learning_rate": 3.0557483511615984e-05, "loss": 2.4375, "step": 222980 }, { "epoch": 0.39, "learning_rate": 3.055661157168916e-05, "loss": 2.4149, "step": 222990 }, { "epoch": 0.39, "learning_rate": 3.055573963176233e-05, "loss": 2.4145, "step": 223000 }, { "epoch": 0.39, "learning_rate": 3.05548676918355e-05, "loss": 2.4226, "step": 223010 }, { "epoch": 0.39, "learning_rate": 3.055399575190867e-05, "loss": 2.2988, "step": 223020 }, { "epoch": 0.39, "learning_rate": 3.055312381198185e-05, "loss": 2.3995, "step": 223030 }, { "epoch": 0.39, "learning_rate": 3.055225187205503e-05, "loss": 2.4747, "step": 223040 }, { "epoch": 0.39, "learning_rate": 3.05513799321282e-05, "loss": 2.3891, "step": 223050 }, { "epoch": 0.39, "learning_rate": 3.0550507992201375e-05, "loss": 2.4762, "step": 223060 }, { "epoch": 0.39, "learning_rate": 3.0549636052274545e-05, "loss": 2.4388, "step": 223070 }, { "epoch": 0.39, "learning_rate": 3.0548764112347715e-05, "loss": 2.4034, "step": 223080 }, { "epoch": 0.39, "learning_rate": 3.0547892172420886e-05, "loss": 2.478, "step": 223090 }, { "epoch": 0.39, "learning_rate": 3.054702023249406e-05, "loss": 2.4125, "step": 223100 }, { "epoch": 0.39, "learning_rate": 3.054614829256724e-05, "loss": 2.4514, "step": 223110 }, { "epoch": 0.39, "learning_rate": 3.054527635264041e-05, "loss": 2.4435, "step": 223120 }, { "epoch": 0.39, "learning_rate": 3.054440441271358e-05, "loss": 2.4117, "step": 223130 }, { "epoch": 0.39, "learning_rate": 3.054353247278676e-05, "loss": 2.3401, "step": 223140 }, { "epoch": 0.39, "learning_rate": 3.054266053285993e-05, "loss": 2.3627, "step": 223150 }, { "epoch": 0.39, "learning_rate": 3.05417885929331e-05, "loss": 2.3614, "step": 223160 }, { "epoch": 0.39, "learning_rate": 3.0540916653006276e-05, "loss": 2.4348, "step": 223170 }, { "epoch": 0.39, "learning_rate": 3.0540044713079446e-05, "loss": 2.3159, "step": 223180 }, { "epoch": 0.39, "learning_rate": 3.0539172773152623e-05, "loss": 2.418, "step": 223190 }, { "epoch": 0.39, "learning_rate": 3.0538300833225794e-05, "loss": 2.312, "step": 223200 }, { "epoch": 0.39, "learning_rate": 3.053742889329897e-05, "loss": 2.3073, "step": 223210 }, { "epoch": 0.39, "learning_rate": 3.053655695337214e-05, "loss": 2.3813, "step": 223220 }, { "epoch": 0.39, "learning_rate": 3.053568501344531e-05, "loss": 2.5441, "step": 223230 }, { "epoch": 0.39, "learning_rate": 3.053481307351849e-05, "loss": 2.3519, "step": 223240 }, { "epoch": 0.39, "learning_rate": 3.053394113359166e-05, "loss": 2.4459, "step": 223250 }, { "epoch": 0.39, "learning_rate": 3.0533069193664836e-05, "loss": 2.4116, "step": 223260 }, { "epoch": 0.39, "learning_rate": 3.053219725373801e-05, "loss": 2.3573, "step": 223270 }, { "epoch": 0.39, "learning_rate": 3.0531325313811184e-05, "loss": 2.3721, "step": 223280 }, { "epoch": 0.39, "learning_rate": 3.0530453373884354e-05, "loss": 2.4026, "step": 223290 }, { "epoch": 0.39, "learning_rate": 3.0529581433957525e-05, "loss": 2.4285, "step": 223300 }, { "epoch": 0.39, "learning_rate": 3.05287094940307e-05, "loss": 2.4622, "step": 223310 }, { "epoch": 0.39, "learning_rate": 3.052783755410387e-05, "loss": 2.296, "step": 223320 }, { "epoch": 0.39, "learning_rate": 3.052696561417704e-05, "loss": 2.4715, "step": 223330 }, { "epoch": 0.39, "learning_rate": 3.052609367425022e-05, "loss": 2.3671, "step": 223340 }, { "epoch": 0.39, "learning_rate": 3.05252217343234e-05, "loss": 2.4405, "step": 223350 }, { "epoch": 0.39, "learning_rate": 3.052434979439657e-05, "loss": 2.4298, "step": 223360 }, { "epoch": 0.39, "learning_rate": 3.052347785446974e-05, "loss": 2.3613, "step": 223370 }, { "epoch": 0.39, "learning_rate": 3.0522605914542915e-05, "loss": 2.3121, "step": 223380 }, { "epoch": 0.39, "learning_rate": 3.0521733974616085e-05, "loss": 2.507, "step": 223390 }, { "epoch": 0.39, "learning_rate": 3.0520862034689256e-05, "loss": 2.4568, "step": 223400 }, { "epoch": 0.39, "learning_rate": 3.051999009476243e-05, "loss": 2.4652, "step": 223410 }, { "epoch": 0.39, "learning_rate": 3.051911815483561e-05, "loss": 2.457, "step": 223420 }, { "epoch": 0.39, "learning_rate": 3.051824621490878e-05, "loss": 2.4217, "step": 223430 }, { "epoch": 0.39, "learning_rate": 3.051737427498195e-05, "loss": 2.4825, "step": 223440 }, { "epoch": 0.39, "learning_rate": 3.0516502335055125e-05, "loss": 2.4418, "step": 223450 }, { "epoch": 0.39, "learning_rate": 3.05156303951283e-05, "loss": 2.4847, "step": 223460 }, { "epoch": 0.39, "learning_rate": 3.051475845520147e-05, "loss": 2.451, "step": 223470 }, { "epoch": 0.39, "learning_rate": 3.051388651527465e-05, "loss": 2.4539, "step": 223480 }, { "epoch": 0.39, "learning_rate": 3.051301457534782e-05, "loss": 2.4833, "step": 223490 }, { "epoch": 0.39, "learning_rate": 3.0512142635420993e-05, "loss": 2.4762, "step": 223500 }, { "epoch": 0.39, "learning_rate": 3.0511270695494164e-05, "loss": 2.5384, "step": 223510 }, { "epoch": 0.39, "learning_rate": 3.0510398755567338e-05, "loss": 2.3898, "step": 223520 }, { "epoch": 0.39, "learning_rate": 3.050952681564051e-05, "loss": 2.3615, "step": 223530 }, { "epoch": 0.39, "learning_rate": 3.0508654875713682e-05, "loss": 2.5305, "step": 223540 }, { "epoch": 0.39, "learning_rate": 3.0507782935786855e-05, "loss": 2.3582, "step": 223550 }, { "epoch": 0.39, "learning_rate": 3.0506910995860033e-05, "loss": 2.4266, "step": 223560 }, { "epoch": 0.39, "learning_rate": 3.0506039055933206e-05, "loss": 2.4302, "step": 223570 }, { "epoch": 0.39, "learning_rate": 3.0505167116006377e-05, "loss": 2.4313, "step": 223580 }, { "epoch": 0.39, "learning_rate": 3.050429517607955e-05, "loss": 2.3129, "step": 223590 }, { "epoch": 0.39, "learning_rate": 3.0503423236152724e-05, "loss": 2.3591, "step": 223600 }, { "epoch": 0.39, "learning_rate": 3.0502551296225895e-05, "loss": 2.3533, "step": 223610 }, { "epoch": 0.39, "learning_rate": 3.050167935629907e-05, "loss": 2.469, "step": 223620 }, { "epoch": 0.39, "learning_rate": 3.0500807416372246e-05, "loss": 2.4861, "step": 223630 }, { "epoch": 0.39, "learning_rate": 3.049993547644542e-05, "loss": 2.5584, "step": 223640 }, { "epoch": 0.39, "learning_rate": 3.049906353651859e-05, "loss": 2.328, "step": 223650 }, { "epoch": 0.39, "learning_rate": 3.0498191596591764e-05, "loss": 2.3163, "step": 223660 }, { "epoch": 0.39, "learning_rate": 3.0497319656664934e-05, "loss": 2.538, "step": 223670 }, { "epoch": 0.39, "learning_rate": 3.0496447716738108e-05, "loss": 2.4525, "step": 223680 }, { "epoch": 0.39, "learning_rate": 3.049557577681128e-05, "loss": 2.4103, "step": 223690 }, { "epoch": 0.39, "learning_rate": 3.0494703836884452e-05, "loss": 2.3033, "step": 223700 }, { "epoch": 0.39, "learning_rate": 3.0493831896957632e-05, "loss": 2.4561, "step": 223710 }, { "epoch": 0.39, "learning_rate": 3.0492959957030803e-05, "loss": 2.4589, "step": 223720 }, { "epoch": 0.39, "learning_rate": 3.0492088017103977e-05, "loss": 2.3911, "step": 223730 }, { "epoch": 0.39, "learning_rate": 3.0491216077177147e-05, "loss": 2.333, "step": 223740 }, { "epoch": 0.39, "learning_rate": 3.049034413725032e-05, "loss": 2.3813, "step": 223750 }, { "epoch": 0.39, "learning_rate": 3.0489472197323494e-05, "loss": 2.4733, "step": 223760 }, { "epoch": 0.39, "learning_rate": 3.0488600257396665e-05, "loss": 2.3541, "step": 223770 }, { "epoch": 0.39, "learning_rate": 3.0487728317469842e-05, "loss": 2.3023, "step": 223780 }, { "epoch": 0.39, "learning_rate": 3.0486856377543016e-05, "loss": 2.4737, "step": 223790 }, { "epoch": 0.39, "learning_rate": 3.048598443761619e-05, "loss": 2.3829, "step": 223800 }, { "epoch": 0.39, "learning_rate": 3.048511249768936e-05, "loss": 2.373, "step": 223810 }, { "epoch": 0.39, "learning_rate": 3.0484240557762534e-05, "loss": 2.3517, "step": 223820 }, { "epoch": 0.39, "learning_rate": 3.0483368617835707e-05, "loss": 2.3613, "step": 223830 }, { "epoch": 0.39, "learning_rate": 3.0482496677908878e-05, "loss": 2.3077, "step": 223840 }, { "epoch": 0.39, "learning_rate": 3.048162473798205e-05, "loss": 2.3338, "step": 223850 }, { "epoch": 0.39, "learning_rate": 3.048075279805523e-05, "loss": 2.4736, "step": 223860 }, { "epoch": 0.39, "learning_rate": 3.0479880858128403e-05, "loss": 2.3867, "step": 223870 }, { "epoch": 0.39, "learning_rate": 3.0479008918201573e-05, "loss": 2.2507, "step": 223880 }, { "epoch": 0.39, "learning_rate": 3.0478136978274747e-05, "loss": 2.4674, "step": 223890 }, { "epoch": 0.39, "learning_rate": 3.0477265038347917e-05, "loss": 2.4195, "step": 223900 }, { "epoch": 0.39, "learning_rate": 3.047639309842109e-05, "loss": 2.4562, "step": 223910 }, { "epoch": 0.39, "learning_rate": 3.0475521158494265e-05, "loss": 2.456, "step": 223920 }, { "epoch": 0.39, "learning_rate": 3.0474649218567442e-05, "loss": 2.4344, "step": 223930 }, { "epoch": 0.39, "learning_rate": 3.0473777278640616e-05, "loss": 2.2654, "step": 223940 }, { "epoch": 0.39, "learning_rate": 3.0472905338713786e-05, "loss": 2.4089, "step": 223950 }, { "epoch": 0.39, "learning_rate": 3.047203339878696e-05, "loss": 2.4577, "step": 223960 }, { "epoch": 0.39, "learning_rate": 3.047116145886013e-05, "loss": 2.4172, "step": 223970 }, { "epoch": 0.39, "learning_rate": 3.0470289518933304e-05, "loss": 2.3651, "step": 223980 }, { "epoch": 0.39, "learning_rate": 3.0469417579006478e-05, "loss": 2.416, "step": 223990 }, { "epoch": 0.39, "learning_rate": 3.0468545639079655e-05, "loss": 2.3133, "step": 224000 }, { "epoch": 0.39, "learning_rate": 3.0467673699152825e-05, "loss": 2.4263, "step": 224010 }, { "epoch": 0.39, "learning_rate": 3.0466801759226e-05, "loss": 2.3929, "step": 224020 }, { "epoch": 0.39, "learning_rate": 3.0465929819299173e-05, "loss": 2.4045, "step": 224030 }, { "epoch": 0.39, "learning_rate": 3.0465057879372343e-05, "loss": 2.5087, "step": 224040 }, { "epoch": 0.39, "learning_rate": 3.0464185939445517e-05, "loss": 2.4582, "step": 224050 }, { "epoch": 0.39, "learning_rate": 3.0463313999518687e-05, "loss": 2.4727, "step": 224060 }, { "epoch": 0.39, "learning_rate": 3.046244205959186e-05, "loss": 2.3833, "step": 224070 }, { "epoch": 0.39, "learning_rate": 3.0461570119665038e-05, "loss": 2.3472, "step": 224080 }, { "epoch": 0.39, "learning_rate": 3.0460698179738212e-05, "loss": 2.3551, "step": 224090 }, { "epoch": 0.39, "learning_rate": 3.0459826239811386e-05, "loss": 2.4509, "step": 224100 }, { "epoch": 0.39, "learning_rate": 3.0458954299884556e-05, "loss": 2.5285, "step": 224110 }, { "epoch": 0.39, "learning_rate": 3.045808235995773e-05, "loss": 2.4375, "step": 224120 }, { "epoch": 0.39, "learning_rate": 3.04572104200309e-05, "loss": 2.4441, "step": 224130 }, { "epoch": 0.39, "learning_rate": 3.0456338480104074e-05, "loss": 2.457, "step": 224140 }, { "epoch": 0.39, "learning_rate": 3.045546654017725e-05, "loss": 2.331, "step": 224150 }, { "epoch": 0.39, "learning_rate": 3.0454594600250425e-05, "loss": 2.3595, "step": 224160 }, { "epoch": 0.39, "learning_rate": 3.0453722660323595e-05, "loss": 2.3277, "step": 224170 }, { "epoch": 0.39, "learning_rate": 3.045285072039677e-05, "loss": 2.5035, "step": 224180 }, { "epoch": 0.39, "learning_rate": 3.0451978780469943e-05, "loss": 2.3812, "step": 224190 }, { "epoch": 0.39, "learning_rate": 3.0451106840543113e-05, "loss": 2.4589, "step": 224200 }, { "epoch": 0.39, "learning_rate": 3.0450234900616287e-05, "loss": 2.3239, "step": 224210 }, { "epoch": 0.39, "learning_rate": 3.044936296068946e-05, "loss": 2.3871, "step": 224220 }, { "epoch": 0.39, "learning_rate": 3.0448491020762638e-05, "loss": 2.4165, "step": 224230 }, { "epoch": 0.39, "learning_rate": 3.044761908083581e-05, "loss": 2.4241, "step": 224240 }, { "epoch": 0.39, "learning_rate": 3.0446747140908982e-05, "loss": 2.4613, "step": 224250 }, { "epoch": 0.39, "learning_rate": 3.0445875200982156e-05, "loss": 2.5357, "step": 224260 }, { "epoch": 0.39, "learning_rate": 3.0445003261055326e-05, "loss": 2.4357, "step": 224270 }, { "epoch": 0.39, "learning_rate": 3.04441313211285e-05, "loss": 2.3581, "step": 224280 }, { "epoch": 0.39, "learning_rate": 3.044325938120167e-05, "loss": 2.3635, "step": 224290 }, { "epoch": 0.39, "learning_rate": 3.044238744127485e-05, "loss": 2.4138, "step": 224300 }, { "epoch": 0.39, "learning_rate": 3.044151550134802e-05, "loss": 2.4075, "step": 224310 }, { "epoch": 0.39, "learning_rate": 3.0440643561421195e-05, "loss": 2.3921, "step": 224320 }, { "epoch": 0.39, "learning_rate": 3.043977162149437e-05, "loss": 2.4025, "step": 224330 }, { "epoch": 0.39, "learning_rate": 3.043889968156754e-05, "loss": 2.3086, "step": 224340 }, { "epoch": 0.39, "learning_rate": 3.0438027741640713e-05, "loss": 2.4293, "step": 224350 }, { "epoch": 0.39, "learning_rate": 3.0437155801713883e-05, "loss": 2.3729, "step": 224360 }, { "epoch": 0.39, "learning_rate": 3.0436283861787057e-05, "loss": 2.4959, "step": 224370 }, { "epoch": 0.39, "learning_rate": 3.0435411921860234e-05, "loss": 2.4225, "step": 224380 }, { "epoch": 0.39, "learning_rate": 3.0434539981933408e-05, "loss": 2.4875, "step": 224390 }, { "epoch": 0.39, "learning_rate": 3.043366804200658e-05, "loss": 2.3085, "step": 224400 }, { "epoch": 0.39, "learning_rate": 3.0432796102079752e-05, "loss": 2.4603, "step": 224410 }, { "epoch": 0.39, "learning_rate": 3.0431924162152926e-05, "loss": 2.3421, "step": 224420 }, { "epoch": 0.39, "learning_rate": 3.0431052222226096e-05, "loss": 2.338, "step": 224430 }, { "epoch": 0.39, "learning_rate": 3.043018028229927e-05, "loss": 2.3099, "step": 224440 }, { "epoch": 0.39, "learning_rate": 3.0429308342372447e-05, "loss": 2.3849, "step": 224450 }, { "epoch": 0.39, "learning_rate": 3.042843640244562e-05, "loss": 2.4955, "step": 224460 }, { "epoch": 0.39, "learning_rate": 3.042756446251879e-05, "loss": 2.4066, "step": 224470 }, { "epoch": 0.39, "learning_rate": 3.0426692522591965e-05, "loss": 2.3765, "step": 224480 }, { "epoch": 0.39, "learning_rate": 3.042582058266514e-05, "loss": 2.4109, "step": 224490 }, { "epoch": 0.39, "learning_rate": 3.042494864273831e-05, "loss": 2.3649, "step": 224500 }, { "epoch": 0.39, "learning_rate": 3.0424076702811483e-05, "loss": 2.3534, "step": 224510 }, { "epoch": 0.39, "learning_rate": 3.0423204762884654e-05, "loss": 2.2608, "step": 224520 }, { "epoch": 0.39, "learning_rate": 3.0422332822957834e-05, "loss": 2.3556, "step": 224530 }, { "epoch": 0.39, "learning_rate": 3.0421460883031004e-05, "loss": 2.4663, "step": 224540 }, { "epoch": 0.39, "learning_rate": 3.0420588943104178e-05, "loss": 2.4336, "step": 224550 }, { "epoch": 0.39, "learning_rate": 3.0419717003177352e-05, "loss": 2.3585, "step": 224560 }, { "epoch": 0.39, "learning_rate": 3.0418845063250522e-05, "loss": 2.3702, "step": 224570 }, { "epoch": 0.39, "learning_rate": 3.0417973123323696e-05, "loss": 2.433, "step": 224580 }, { "epoch": 0.39, "learning_rate": 3.0417101183396867e-05, "loss": 2.4577, "step": 224590 }, { "epoch": 0.39, "learning_rate": 3.0416229243470047e-05, "loss": 2.5034, "step": 224600 }, { "epoch": 0.39, "learning_rate": 3.0415357303543217e-05, "loss": 2.3944, "step": 224610 }, { "epoch": 0.39, "learning_rate": 3.041448536361639e-05, "loss": 2.4049, "step": 224620 }, { "epoch": 0.39, "learning_rate": 3.041361342368956e-05, "loss": 2.4554, "step": 224630 }, { "epoch": 0.39, "learning_rate": 3.0412741483762735e-05, "loss": 2.4048, "step": 224640 }, { "epoch": 0.39, "learning_rate": 3.041186954383591e-05, "loss": 2.4401, "step": 224650 }, { "epoch": 0.39, "learning_rate": 3.041099760390908e-05, "loss": 2.466, "step": 224660 }, { "epoch": 0.39, "learning_rate": 3.041012566398226e-05, "loss": 2.4611, "step": 224670 }, { "epoch": 0.39, "learning_rate": 3.040925372405543e-05, "loss": 2.3315, "step": 224680 }, { "epoch": 0.39, "learning_rate": 3.0408381784128604e-05, "loss": 2.4321, "step": 224690 }, { "epoch": 0.39, "learning_rate": 3.0407509844201775e-05, "loss": 2.3306, "step": 224700 }, { "epoch": 0.39, "learning_rate": 3.040663790427495e-05, "loss": 2.4858, "step": 224710 }, { "epoch": 0.39, "learning_rate": 3.0405765964348122e-05, "loss": 2.4007, "step": 224720 }, { "epoch": 0.39, "learning_rate": 3.0404894024421293e-05, "loss": 2.4416, "step": 224730 }, { "epoch": 0.39, "learning_rate": 3.0404022084494466e-05, "loss": 2.2938, "step": 224740 }, { "epoch": 0.39, "learning_rate": 3.0403150144567643e-05, "loss": 2.4451, "step": 224750 }, { "epoch": 0.39, "learning_rate": 3.0402278204640817e-05, "loss": 2.39, "step": 224760 }, { "epoch": 0.39, "learning_rate": 3.0401406264713988e-05, "loss": 2.4063, "step": 224770 }, { "epoch": 0.39, "learning_rate": 3.040053432478716e-05, "loss": 2.3804, "step": 224780 }, { "epoch": 0.39, "learning_rate": 3.0399662384860332e-05, "loss": 2.4216, "step": 224790 }, { "epoch": 0.39, "learning_rate": 3.0398790444933506e-05, "loss": 2.4603, "step": 224800 }, { "epoch": 0.39, "learning_rate": 3.039791850500668e-05, "loss": 2.2757, "step": 224810 }, { "epoch": 0.39, "learning_rate": 3.0397046565079856e-05, "loss": 2.3136, "step": 224820 }, { "epoch": 0.39, "learning_rate": 3.039617462515303e-05, "loss": 2.2087, "step": 224830 }, { "epoch": 0.39, "learning_rate": 3.03953026852262e-05, "loss": 2.4292, "step": 224840 }, { "epoch": 0.39, "learning_rate": 3.0394430745299374e-05, "loss": 2.3943, "step": 224850 }, { "epoch": 0.39, "learning_rate": 3.0393558805372545e-05, "loss": 2.4521, "step": 224860 }, { "epoch": 0.39, "learning_rate": 3.039268686544572e-05, "loss": 2.3748, "step": 224870 }, { "epoch": 0.39, "learning_rate": 3.0391814925518892e-05, "loss": 2.4587, "step": 224880 }, { "epoch": 0.39, "learning_rate": 3.0390942985592063e-05, "loss": 2.4099, "step": 224890 }, { "epoch": 0.39, "learning_rate": 3.039007104566524e-05, "loss": 2.331, "step": 224900 }, { "epoch": 0.39, "learning_rate": 3.0389199105738414e-05, "loss": 2.4216, "step": 224910 }, { "epoch": 0.39, "learning_rate": 3.0388327165811587e-05, "loss": 2.3948, "step": 224920 }, { "epoch": 0.39, "learning_rate": 3.0387455225884758e-05, "loss": 2.4289, "step": 224930 }, { "epoch": 0.39, "learning_rate": 3.038658328595793e-05, "loss": 2.4261, "step": 224940 }, { "epoch": 0.39, "learning_rate": 3.0385711346031105e-05, "loss": 2.4071, "step": 224950 }, { "epoch": 0.39, "learning_rate": 3.0384839406104276e-05, "loss": 2.4271, "step": 224960 }, { "epoch": 0.39, "learning_rate": 3.0383967466177453e-05, "loss": 2.385, "step": 224970 }, { "epoch": 0.39, "learning_rate": 3.0383095526250627e-05, "loss": 2.3996, "step": 224980 }, { "epoch": 0.39, "learning_rate": 3.03822235863238e-05, "loss": 2.3187, "step": 224990 }, { "epoch": 0.39, "learning_rate": 3.038135164639697e-05, "loss": 2.439, "step": 225000 }, { "epoch": 0.39, "learning_rate": 3.0380479706470145e-05, "loss": 2.407, "step": 225010 }, { "epoch": 0.39, "learning_rate": 3.0379607766543315e-05, "loss": 2.3839, "step": 225020 }, { "epoch": 0.39, "learning_rate": 3.037873582661649e-05, "loss": 2.3971, "step": 225030 }, { "epoch": 0.39, "learning_rate": 3.0377863886689662e-05, "loss": 2.4273, "step": 225040 }, { "epoch": 0.39, "learning_rate": 3.037699194676284e-05, "loss": 2.4419, "step": 225050 }, { "epoch": 0.39, "learning_rate": 3.0376120006836013e-05, "loss": 2.3896, "step": 225060 }, { "epoch": 0.39, "learning_rate": 3.0375248066909184e-05, "loss": 2.396, "step": 225070 }, { "epoch": 0.39, "learning_rate": 3.0374376126982358e-05, "loss": 2.3742, "step": 225080 }, { "epoch": 0.39, "learning_rate": 3.0373504187055528e-05, "loss": 2.3891, "step": 225090 }, { "epoch": 0.39, "learning_rate": 3.0372632247128702e-05, "loss": 2.4581, "step": 225100 }, { "epoch": 0.39, "learning_rate": 3.0371760307201875e-05, "loss": 2.3533, "step": 225110 }, { "epoch": 0.39, "learning_rate": 3.0370888367275053e-05, "loss": 2.3648, "step": 225120 }, { "epoch": 0.39, "learning_rate": 3.0370016427348223e-05, "loss": 2.4385, "step": 225130 }, { "epoch": 0.39, "learning_rate": 3.0369144487421397e-05, "loss": 2.4161, "step": 225140 }, { "epoch": 0.39, "learning_rate": 3.036827254749457e-05, "loss": 2.3423, "step": 225150 }, { "epoch": 0.39, "learning_rate": 3.036740060756774e-05, "loss": 2.4703, "step": 225160 }, { "epoch": 0.39, "learning_rate": 3.0366528667640915e-05, "loss": 2.434, "step": 225170 }, { "epoch": 0.39, "learning_rate": 3.036565672771409e-05, "loss": 2.335, "step": 225180 }, { "epoch": 0.39, "learning_rate": 3.036478478778726e-05, "loss": 2.5369, "step": 225190 }, { "epoch": 0.39, "learning_rate": 3.0363912847860436e-05, "loss": 2.3544, "step": 225200 }, { "epoch": 0.39, "learning_rate": 3.036304090793361e-05, "loss": 2.3824, "step": 225210 }, { "epoch": 0.39, "learning_rate": 3.0362168968006784e-05, "loss": 2.4065, "step": 225220 }, { "epoch": 0.39, "learning_rate": 3.0361297028079954e-05, "loss": 2.4106, "step": 225230 }, { "epoch": 0.39, "learning_rate": 3.0360425088153128e-05, "loss": 2.3614, "step": 225240 }, { "epoch": 0.39, "learning_rate": 3.0359553148226298e-05, "loss": 2.3389, "step": 225250 }, { "epoch": 0.39, "learning_rate": 3.0358681208299472e-05, "loss": 2.3719, "step": 225260 }, { "epoch": 0.39, "learning_rate": 3.035780926837265e-05, "loss": 2.4818, "step": 225270 }, { "epoch": 0.39, "learning_rate": 3.0356937328445823e-05, "loss": 2.3403, "step": 225280 }, { "epoch": 0.39, "learning_rate": 3.0356065388518997e-05, "loss": 2.3899, "step": 225290 }, { "epoch": 0.39, "learning_rate": 3.0355193448592167e-05, "loss": 2.3989, "step": 225300 }, { "epoch": 0.39, "learning_rate": 3.035432150866534e-05, "loss": 2.3347, "step": 225310 }, { "epoch": 0.39, "learning_rate": 3.035344956873851e-05, "loss": 2.3262, "step": 225320 }, { "epoch": 0.39, "learning_rate": 3.0352577628811685e-05, "loss": 2.3127, "step": 225330 }, { "epoch": 0.39, "learning_rate": 3.0351705688884862e-05, "loss": 2.2784, "step": 225340 }, { "epoch": 0.39, "learning_rate": 3.0350833748958036e-05, "loss": 2.6192, "step": 225350 }, { "epoch": 0.39, "learning_rate": 3.0349961809031206e-05, "loss": 2.4833, "step": 225360 }, { "epoch": 0.39, "learning_rate": 3.034908986910438e-05, "loss": 2.4617, "step": 225370 }, { "epoch": 0.39, "learning_rate": 3.0348217929177554e-05, "loss": 2.4573, "step": 225380 }, { "epoch": 0.39, "learning_rate": 3.0347345989250724e-05, "loss": 2.4162, "step": 225390 }, { "epoch": 0.39, "learning_rate": 3.0346474049323898e-05, "loss": 2.4023, "step": 225400 }, { "epoch": 0.39, "learning_rate": 3.0345602109397068e-05, "loss": 2.3175, "step": 225410 }, { "epoch": 0.39, "learning_rate": 3.034473016947025e-05, "loss": 2.2769, "step": 225420 }, { "epoch": 0.39, "learning_rate": 3.034385822954342e-05, "loss": 2.4227, "step": 225430 }, { "epoch": 0.39, "learning_rate": 3.0342986289616593e-05, "loss": 2.3806, "step": 225440 }, { "epoch": 0.39, "learning_rate": 3.0342114349689767e-05, "loss": 2.4387, "step": 225450 }, { "epoch": 0.39, "learning_rate": 3.0341242409762937e-05, "loss": 2.4675, "step": 225460 }, { "epoch": 0.39, "learning_rate": 3.034037046983611e-05, "loss": 2.5192, "step": 225470 }, { "epoch": 0.39, "learning_rate": 3.033949852990928e-05, "loss": 2.3135, "step": 225480 }, { "epoch": 0.39, "learning_rate": 3.0338626589982462e-05, "loss": 2.5263, "step": 225490 }, { "epoch": 0.39, "learning_rate": 3.0337754650055632e-05, "loss": 2.3496, "step": 225500 }, { "epoch": 0.39, "learning_rate": 3.0336882710128806e-05, "loss": 2.3435, "step": 225510 }, { "epoch": 0.39, "learning_rate": 3.0336010770201976e-05, "loss": 2.535, "step": 225520 }, { "epoch": 0.39, "learning_rate": 3.033513883027515e-05, "loss": 2.3788, "step": 225530 }, { "epoch": 0.39, "learning_rate": 3.0334266890348324e-05, "loss": 2.3515, "step": 225540 }, { "epoch": 0.39, "learning_rate": 3.0333394950421494e-05, "loss": 2.436, "step": 225550 }, { "epoch": 0.39, "learning_rate": 3.0332523010494668e-05, "loss": 2.409, "step": 225560 }, { "epoch": 0.39, "learning_rate": 3.0331651070567845e-05, "loss": 2.3702, "step": 225570 }, { "epoch": 0.39, "learning_rate": 3.033077913064102e-05, "loss": 2.4116, "step": 225580 }, { "epoch": 0.39, "learning_rate": 3.032990719071419e-05, "loss": 2.4258, "step": 225590 }, { "epoch": 0.39, "learning_rate": 3.0329035250787363e-05, "loss": 2.2385, "step": 225600 }, { "epoch": 0.39, "learning_rate": 3.0328163310860537e-05, "loss": 2.373, "step": 225610 }, { "epoch": 0.39, "learning_rate": 3.0327291370933707e-05, "loss": 2.4491, "step": 225620 }, { "epoch": 0.39, "learning_rate": 3.032641943100688e-05, "loss": 2.4426, "step": 225630 }, { "epoch": 0.39, "learning_rate": 3.0325547491080058e-05, "loss": 2.4065, "step": 225640 }, { "epoch": 0.39, "learning_rate": 3.0324675551153232e-05, "loss": 2.4683, "step": 225650 }, { "epoch": 0.39, "learning_rate": 3.0323803611226402e-05, "loss": 2.4709, "step": 225660 }, { "epoch": 0.39, "learning_rate": 3.0322931671299576e-05, "loss": 2.4263, "step": 225670 }, { "epoch": 0.39, "learning_rate": 3.032205973137275e-05, "loss": 2.349, "step": 225680 }, { "epoch": 0.39, "learning_rate": 3.032118779144592e-05, "loss": 2.3099, "step": 225690 }, { "epoch": 0.39, "learning_rate": 3.0320315851519094e-05, "loss": 2.4268, "step": 225700 }, { "epoch": 0.39, "learning_rate": 3.0319443911592264e-05, "loss": 2.322, "step": 225710 }, { "epoch": 0.39, "learning_rate": 3.0318571971665445e-05, "loss": 2.4065, "step": 225720 }, { "epoch": 0.39, "learning_rate": 3.0317700031738615e-05, "loss": 2.4813, "step": 225730 }, { "epoch": 0.39, "learning_rate": 3.031682809181179e-05, "loss": 2.4266, "step": 225740 }, { "epoch": 0.39, "learning_rate": 3.031595615188496e-05, "loss": 2.412, "step": 225750 }, { "epoch": 0.39, "learning_rate": 3.0315084211958133e-05, "loss": 2.3982, "step": 225760 }, { "epoch": 0.39, "learning_rate": 3.0314212272031307e-05, "loss": 2.3671, "step": 225770 }, { "epoch": 0.39, "learning_rate": 3.0313340332104477e-05, "loss": 2.4319, "step": 225780 }, { "epoch": 0.39, "learning_rate": 3.0312468392177658e-05, "loss": 2.4439, "step": 225790 }, { "epoch": 0.39, "learning_rate": 3.031159645225083e-05, "loss": 2.4768, "step": 225800 }, { "epoch": 0.39, "learning_rate": 3.0310724512324002e-05, "loss": 2.4285, "step": 225810 }, { "epoch": 0.39, "learning_rate": 3.0309852572397172e-05, "loss": 2.4034, "step": 225820 }, { "epoch": 0.39, "learning_rate": 3.0308980632470346e-05, "loss": 2.4057, "step": 225830 }, { "epoch": 0.39, "learning_rate": 3.030810869254352e-05, "loss": 2.3801, "step": 225840 }, { "epoch": 0.39, "learning_rate": 3.030723675261669e-05, "loss": 2.3933, "step": 225850 }, { "epoch": 0.39, "learning_rate": 3.0306364812689864e-05, "loss": 2.5, "step": 225860 }, { "epoch": 0.39, "learning_rate": 3.030549287276304e-05, "loss": 2.3594, "step": 225870 }, { "epoch": 0.39, "learning_rate": 3.0304620932836215e-05, "loss": 2.3141, "step": 225880 }, { "epoch": 0.39, "learning_rate": 3.0303748992909385e-05, "loss": 2.3865, "step": 225890 }, { "epoch": 0.39, "learning_rate": 3.030287705298256e-05, "loss": 2.4548, "step": 225900 }, { "epoch": 0.39, "learning_rate": 3.0302005113055733e-05, "loss": 2.3357, "step": 225910 }, { "epoch": 0.39, "learning_rate": 3.0301133173128903e-05, "loss": 2.3785, "step": 225920 }, { "epoch": 0.39, "learning_rate": 3.0300261233202077e-05, "loss": 2.4292, "step": 225930 }, { "epoch": 0.39, "learning_rate": 3.0299389293275254e-05, "loss": 2.3921, "step": 225940 }, { "epoch": 0.39, "learning_rate": 3.0298517353348428e-05, "loss": 2.4895, "step": 225950 }, { "epoch": 0.39, "learning_rate": 3.02976454134216e-05, "loss": 2.3358, "step": 225960 }, { "epoch": 0.39, "learning_rate": 3.0296773473494772e-05, "loss": 2.4065, "step": 225970 }, { "epoch": 0.39, "learning_rate": 3.0295901533567943e-05, "loss": 2.5033, "step": 225980 }, { "epoch": 0.39, "learning_rate": 3.0295029593641116e-05, "loss": 2.3803, "step": 225990 }, { "epoch": 0.39, "learning_rate": 3.029415765371429e-05, "loss": 2.3797, "step": 226000 }, { "epoch": 0.39, "learning_rate": 3.0293285713787467e-05, "loss": 2.3428, "step": 226010 }, { "epoch": 0.39, "learning_rate": 3.029241377386064e-05, "loss": 2.467, "step": 226020 }, { "epoch": 0.39, "learning_rate": 3.029154183393381e-05, "loss": 2.4685, "step": 226030 }, { "epoch": 0.39, "learning_rate": 3.0290669894006985e-05, "loss": 2.3942, "step": 226040 }, { "epoch": 0.39, "learning_rate": 3.0289797954080156e-05, "loss": 2.3762, "step": 226050 }, { "epoch": 0.39, "learning_rate": 3.028892601415333e-05, "loss": 2.4003, "step": 226060 }, { "epoch": 0.39, "learning_rate": 3.0288054074226503e-05, "loss": 2.43, "step": 226070 }, { "epoch": 0.39, "learning_rate": 3.0287182134299674e-05, "loss": 2.3512, "step": 226080 }, { "epoch": 0.39, "learning_rate": 3.028631019437285e-05, "loss": 2.4463, "step": 226090 }, { "epoch": 0.39, "learning_rate": 3.0285438254446025e-05, "loss": 2.4047, "step": 226100 }, { "epoch": 0.39, "learning_rate": 3.0284566314519198e-05, "loss": 2.4535, "step": 226110 }, { "epoch": 0.39, "learning_rate": 3.028369437459237e-05, "loss": 2.5024, "step": 226120 }, { "epoch": 0.39, "learning_rate": 3.0282822434665542e-05, "loss": 2.4391, "step": 226130 }, { "epoch": 0.39, "learning_rate": 3.0281950494738713e-05, "loss": 2.3483, "step": 226140 }, { "epoch": 0.39, "learning_rate": 3.0281078554811887e-05, "loss": 2.3273, "step": 226150 }, { "epoch": 0.39, "learning_rate": 3.0280206614885064e-05, "loss": 2.3908, "step": 226160 }, { "epoch": 0.39, "learning_rate": 3.0279334674958238e-05, "loss": 2.3576, "step": 226170 }, { "epoch": 0.39, "learning_rate": 3.027846273503141e-05, "loss": 2.4335, "step": 226180 }, { "epoch": 0.39, "learning_rate": 3.027759079510458e-05, "loss": 2.3814, "step": 226190 }, { "epoch": 0.39, "learning_rate": 3.0276718855177755e-05, "loss": 2.3871, "step": 226200 }, { "epoch": 0.39, "learning_rate": 3.0275846915250926e-05, "loss": 2.4505, "step": 226210 }, { "epoch": 0.39, "learning_rate": 3.02749749753241e-05, "loss": 2.4326, "step": 226220 }, { "epoch": 0.39, "learning_rate": 3.0274103035397273e-05, "loss": 2.4177, "step": 226230 }, { "epoch": 0.39, "learning_rate": 3.027323109547045e-05, "loss": 2.2896, "step": 226240 }, { "epoch": 0.39, "learning_rate": 3.027235915554362e-05, "loss": 2.432, "step": 226250 }, { "epoch": 0.39, "learning_rate": 3.0271487215616795e-05, "loss": 2.3497, "step": 226260 }, { "epoch": 0.39, "learning_rate": 3.027061527568997e-05, "loss": 2.3282, "step": 226270 }, { "epoch": 0.39, "learning_rate": 3.026974333576314e-05, "loss": 2.3653, "step": 226280 }, { "epoch": 0.39, "learning_rate": 3.0268871395836313e-05, "loss": 2.4103, "step": 226290 }, { "epoch": 0.39, "learning_rate": 3.0267999455909486e-05, "loss": 2.3864, "step": 226300 }, { "epoch": 0.39, "learning_rate": 3.0267127515982664e-05, "loss": 2.3398, "step": 226310 }, { "epoch": 0.39, "learning_rate": 3.0266255576055834e-05, "loss": 2.4603, "step": 226320 }, { "epoch": 0.39, "learning_rate": 3.0265383636129008e-05, "loss": 2.3761, "step": 226330 }, { "epoch": 0.39, "learning_rate": 3.026451169620218e-05, "loss": 2.3793, "step": 226340 }, { "epoch": 0.39, "learning_rate": 3.0263639756275352e-05, "loss": 2.3495, "step": 226350 }, { "epoch": 0.39, "learning_rate": 3.0262767816348526e-05, "loss": 2.4354, "step": 226360 }, { "epoch": 0.39, "learning_rate": 3.0261895876421696e-05, "loss": 2.3685, "step": 226370 }, { "epoch": 0.39, "learning_rate": 3.026102393649487e-05, "loss": 2.3611, "step": 226380 }, { "epoch": 0.39, "learning_rate": 3.0260151996568047e-05, "loss": 2.3234, "step": 226390 }, { "epoch": 0.39, "learning_rate": 3.025928005664122e-05, "loss": 2.3781, "step": 226400 }, { "epoch": 0.39, "learning_rate": 3.0258408116714394e-05, "loss": 2.3883, "step": 226410 }, { "epoch": 0.39, "learning_rate": 3.0257536176787565e-05, "loss": 2.2465, "step": 226420 }, { "epoch": 0.39, "learning_rate": 3.025666423686074e-05, "loss": 2.399, "step": 226430 }, { "epoch": 0.39, "learning_rate": 3.025579229693391e-05, "loss": 2.3755, "step": 226440 }, { "epoch": 0.39, "learning_rate": 3.0254920357007083e-05, "loss": 2.3924, "step": 226450 }, { "epoch": 0.39, "learning_rate": 3.025404841708026e-05, "loss": 2.4485, "step": 226460 }, { "epoch": 0.39, "learning_rate": 3.0253176477153434e-05, "loss": 2.3306, "step": 226470 }, { "epoch": 0.39, "learning_rate": 3.0252304537226604e-05, "loss": 2.4167, "step": 226480 }, { "epoch": 0.39, "learning_rate": 3.0251432597299778e-05, "loss": 2.3332, "step": 226490 }, { "epoch": 0.39, "learning_rate": 3.025056065737295e-05, "loss": 2.4247, "step": 226500 }, { "epoch": 0.4, "learning_rate": 3.0249688717446122e-05, "loss": 2.4381, "step": 226510 }, { "epoch": 0.4, "learning_rate": 3.0248816777519296e-05, "loss": 2.4718, "step": 226520 }, { "epoch": 0.4, "learning_rate": 3.0247944837592473e-05, "loss": 2.3527, "step": 226530 }, { "epoch": 0.4, "learning_rate": 3.0247072897665647e-05, "loss": 2.4868, "step": 226540 }, { "epoch": 0.4, "learning_rate": 3.0246200957738817e-05, "loss": 2.3517, "step": 226550 }, { "epoch": 0.4, "learning_rate": 3.024532901781199e-05, "loss": 2.3166, "step": 226560 }, { "epoch": 0.4, "learning_rate": 3.0244457077885165e-05, "loss": 2.4129, "step": 226570 }, { "epoch": 0.4, "learning_rate": 3.0243585137958335e-05, "loss": 2.4178, "step": 226580 }, { "epoch": 0.4, "learning_rate": 3.024271319803151e-05, "loss": 2.3208, "step": 226590 }, { "epoch": 0.4, "learning_rate": 3.024184125810468e-05, "loss": 2.3817, "step": 226600 }, { "epoch": 0.4, "learning_rate": 3.024096931817786e-05, "loss": 2.3739, "step": 226610 }, { "epoch": 0.4, "learning_rate": 3.024009737825103e-05, "loss": 2.5773, "step": 226620 }, { "epoch": 0.4, "learning_rate": 3.0239225438324204e-05, "loss": 2.323, "step": 226630 }, { "epoch": 0.4, "learning_rate": 3.0238353498397378e-05, "loss": 2.3837, "step": 226640 }, { "epoch": 0.4, "learning_rate": 3.0237481558470548e-05, "loss": 2.3738, "step": 226650 }, { "epoch": 0.4, "learning_rate": 3.0236609618543722e-05, "loss": 2.3874, "step": 226660 }, { "epoch": 0.4, "learning_rate": 3.0235737678616892e-05, "loss": 2.4332, "step": 226670 }, { "epoch": 0.4, "learning_rate": 3.0234865738690073e-05, "loss": 2.4773, "step": 226680 }, { "epoch": 0.4, "learning_rate": 3.0233993798763243e-05, "loss": 2.3665, "step": 226690 }, { "epoch": 0.4, "learning_rate": 3.0233121858836417e-05, "loss": 2.4199, "step": 226700 }, { "epoch": 0.4, "learning_rate": 3.0232249918909587e-05, "loss": 2.3063, "step": 226710 }, { "epoch": 0.4, "learning_rate": 3.023137797898276e-05, "loss": 2.4337, "step": 226720 }, { "epoch": 0.4, "learning_rate": 3.0230506039055935e-05, "loss": 2.3752, "step": 226730 }, { "epoch": 0.4, "learning_rate": 3.0229634099129105e-05, "loss": 2.3728, "step": 226740 }, { "epoch": 0.4, "learning_rate": 3.022876215920228e-05, "loss": 2.3931, "step": 226750 }, { "epoch": 0.4, "learning_rate": 3.0227890219275456e-05, "loss": 2.3843, "step": 226760 }, { "epoch": 0.4, "learning_rate": 3.022701827934863e-05, "loss": 2.4598, "step": 226770 }, { "epoch": 0.4, "learning_rate": 3.02261463394218e-05, "loss": 2.3631, "step": 226780 }, { "epoch": 0.4, "learning_rate": 3.0225274399494974e-05, "loss": 2.4687, "step": 226790 }, { "epoch": 0.4, "learning_rate": 3.0224402459568148e-05, "loss": 2.4595, "step": 226800 }, { "epoch": 0.4, "learning_rate": 3.0223530519641318e-05, "loss": 2.2797, "step": 226810 }, { "epoch": 0.4, "learning_rate": 3.0222658579714492e-05, "loss": 2.3264, "step": 226820 }, { "epoch": 0.4, "learning_rate": 3.022178663978767e-05, "loss": 2.4372, "step": 226830 }, { "epoch": 0.4, "learning_rate": 3.0220914699860843e-05, "loss": 2.366, "step": 226840 }, { "epoch": 0.4, "learning_rate": 3.0220042759934013e-05, "loss": 2.5229, "step": 226850 }, { "epoch": 0.4, "learning_rate": 3.0219170820007187e-05, "loss": 2.4639, "step": 226860 }, { "epoch": 0.4, "learning_rate": 3.0218298880080357e-05, "loss": 2.5099, "step": 226870 }, { "epoch": 0.4, "learning_rate": 3.021742694015353e-05, "loss": 2.3158, "step": 226880 }, { "epoch": 0.4, "learning_rate": 3.0216555000226705e-05, "loss": 2.5115, "step": 226890 }, { "epoch": 0.4, "learning_rate": 3.0215683060299875e-05, "loss": 2.2579, "step": 226900 }, { "epoch": 0.4, "learning_rate": 3.0214811120373056e-05, "loss": 2.4728, "step": 226910 }, { "epoch": 0.4, "learning_rate": 3.0213939180446226e-05, "loss": 2.414, "step": 226920 }, { "epoch": 0.4, "learning_rate": 3.02130672405194e-05, "loss": 2.2534, "step": 226930 }, { "epoch": 0.4, "learning_rate": 3.021219530059257e-05, "loss": 2.4101, "step": 226940 }, { "epoch": 0.4, "learning_rate": 3.0211323360665744e-05, "loss": 2.3455, "step": 226950 }, { "epoch": 0.4, "learning_rate": 3.0210451420738918e-05, "loss": 2.3973, "step": 226960 }, { "epoch": 0.4, "learning_rate": 3.0209579480812088e-05, "loss": 2.3894, "step": 226970 }, { "epoch": 0.4, "learning_rate": 3.0208707540885265e-05, "loss": 2.3961, "step": 226980 }, { "epoch": 0.4, "learning_rate": 3.020783560095844e-05, "loss": 2.318, "step": 226990 }, { "epoch": 0.4, "learning_rate": 3.0206963661031613e-05, "loss": 2.3494, "step": 227000 }, { "epoch": 0.4, "learning_rate": 3.0206091721104783e-05, "loss": 2.3643, "step": 227010 }, { "epoch": 0.4, "learning_rate": 3.0205219781177957e-05, "loss": 2.4532, "step": 227020 }, { "epoch": 0.4, "learning_rate": 3.020434784125113e-05, "loss": 2.3542, "step": 227030 }, { "epoch": 0.4, "learning_rate": 3.02034759013243e-05, "loss": 2.4696, "step": 227040 }, { "epoch": 0.4, "learning_rate": 3.0202603961397475e-05, "loss": 2.3853, "step": 227050 }, { "epoch": 0.4, "learning_rate": 3.0201732021470652e-05, "loss": 2.3982, "step": 227060 }, { "epoch": 0.4, "learning_rate": 3.0200860081543826e-05, "loss": 2.3299, "step": 227070 }, { "epoch": 0.4, "learning_rate": 3.0199988141616996e-05, "loss": 2.2973, "step": 227080 }, { "epoch": 0.4, "learning_rate": 3.019911620169017e-05, "loss": 2.2964, "step": 227090 }, { "epoch": 0.4, "learning_rate": 3.019824426176334e-05, "loss": 2.4338, "step": 227100 }, { "epoch": 0.4, "learning_rate": 3.0197372321836514e-05, "loss": 2.4077, "step": 227110 }, { "epoch": 0.4, "learning_rate": 3.0196500381909688e-05, "loss": 2.4755, "step": 227120 }, { "epoch": 0.4, "learning_rate": 3.0195628441982865e-05, "loss": 2.3625, "step": 227130 }, { "epoch": 0.4, "learning_rate": 3.019475650205604e-05, "loss": 2.3995, "step": 227140 }, { "epoch": 0.4, "learning_rate": 3.019388456212921e-05, "loss": 2.3064, "step": 227150 }, { "epoch": 0.4, "learning_rate": 3.0193012622202383e-05, "loss": 2.514, "step": 227160 }, { "epoch": 0.4, "learning_rate": 3.0192140682275554e-05, "loss": 2.4118, "step": 227170 }, { "epoch": 0.4, "learning_rate": 3.0191268742348727e-05, "loss": 2.4492, "step": 227180 }, { "epoch": 0.4, "learning_rate": 3.01903968024219e-05, "loss": 2.3609, "step": 227190 }, { "epoch": 0.4, "learning_rate": 3.0189524862495078e-05, "loss": 2.3885, "step": 227200 }, { "epoch": 0.4, "learning_rate": 3.018865292256825e-05, "loss": 2.299, "step": 227210 }, { "epoch": 0.4, "learning_rate": 3.0187780982641422e-05, "loss": 2.4592, "step": 227220 }, { "epoch": 0.4, "learning_rate": 3.0186909042714596e-05, "loss": 2.4248, "step": 227230 }, { "epoch": 0.4, "learning_rate": 3.0186037102787767e-05, "loss": 2.4355, "step": 227240 }, { "epoch": 0.4, "learning_rate": 3.018516516286094e-05, "loss": 2.3305, "step": 227250 }, { "epoch": 0.4, "learning_rate": 3.0184293222934114e-05, "loss": 2.2941, "step": 227260 }, { "epoch": 0.4, "learning_rate": 3.0183421283007284e-05, "loss": 2.3142, "step": 227270 }, { "epoch": 0.4, "learning_rate": 3.018254934308046e-05, "loss": 2.3326, "step": 227280 }, { "epoch": 0.4, "learning_rate": 3.0181677403153635e-05, "loss": 2.3414, "step": 227290 }, { "epoch": 0.4, "learning_rate": 3.018080546322681e-05, "loss": 2.432, "step": 227300 }, { "epoch": 0.4, "learning_rate": 3.017993352329998e-05, "loss": 2.4447, "step": 227310 }, { "epoch": 0.4, "learning_rate": 3.0179061583373153e-05, "loss": 2.4573, "step": 227320 }, { "epoch": 0.4, "learning_rate": 3.0178189643446324e-05, "loss": 2.3553, "step": 227330 }, { "epoch": 0.4, "learning_rate": 3.0177317703519497e-05, "loss": 2.3828, "step": 227340 }, { "epoch": 0.4, "learning_rate": 3.0176445763592675e-05, "loss": 2.3889, "step": 227350 }, { "epoch": 0.4, "learning_rate": 3.017557382366585e-05, "loss": 2.365, "step": 227360 }, { "epoch": 0.4, "learning_rate": 3.0174701883739022e-05, "loss": 2.3453, "step": 227370 }, { "epoch": 0.4, "learning_rate": 3.0173829943812193e-05, "loss": 2.4413, "step": 227380 }, { "epoch": 0.4, "learning_rate": 3.0172958003885366e-05, "loss": 2.2904, "step": 227390 }, { "epoch": 0.4, "learning_rate": 3.0172086063958537e-05, "loss": 2.444, "step": 227400 }, { "epoch": 0.4, "learning_rate": 3.017121412403171e-05, "loss": 2.4488, "step": 227410 }, { "epoch": 0.4, "learning_rate": 3.0170342184104884e-05, "loss": 2.3999, "step": 227420 }, { "epoch": 0.4, "learning_rate": 3.016947024417806e-05, "loss": 2.481, "step": 227430 }, { "epoch": 0.4, "learning_rate": 3.0168598304251232e-05, "loss": 2.4047, "step": 227440 }, { "epoch": 0.4, "learning_rate": 3.0167726364324406e-05, "loss": 2.4211, "step": 227450 }, { "epoch": 0.4, "learning_rate": 3.016685442439758e-05, "loss": 2.4031, "step": 227460 }, { "epoch": 0.4, "learning_rate": 3.016598248447075e-05, "loss": 2.4026, "step": 227470 }, { "epoch": 0.4, "learning_rate": 3.0165110544543923e-05, "loss": 2.3315, "step": 227480 }, { "epoch": 0.4, "learning_rate": 3.0164238604617094e-05, "loss": 2.6336, "step": 227490 }, { "epoch": 0.4, "learning_rate": 3.0163366664690274e-05, "loss": 2.3936, "step": 227500 }, { "epoch": 0.4, "learning_rate": 3.0162494724763445e-05, "loss": 2.4873, "step": 227510 }, { "epoch": 0.4, "learning_rate": 3.016162278483662e-05, "loss": 2.4723, "step": 227520 }, { "epoch": 0.4, "learning_rate": 3.0160750844909792e-05, "loss": 2.2936, "step": 227530 }, { "epoch": 0.4, "learning_rate": 3.0159878904982963e-05, "loss": 2.4943, "step": 227540 }, { "epoch": 0.4, "learning_rate": 3.0159006965056136e-05, "loss": 2.436, "step": 227550 }, { "epoch": 0.4, "learning_rate": 3.0158135025129307e-05, "loss": 2.3665, "step": 227560 }, { "epoch": 0.4, "learning_rate": 3.015726308520248e-05, "loss": 2.4892, "step": 227570 }, { "epoch": 0.4, "learning_rate": 3.0156391145275658e-05, "loss": 2.3677, "step": 227580 }, { "epoch": 0.4, "learning_rate": 3.015551920534883e-05, "loss": 2.3982, "step": 227590 }, { "epoch": 0.4, "learning_rate": 3.0154647265422002e-05, "loss": 2.3381, "step": 227600 }, { "epoch": 0.4, "learning_rate": 3.0153775325495176e-05, "loss": 2.3726, "step": 227610 }, { "epoch": 0.4, "learning_rate": 3.015290338556835e-05, "loss": 2.4701, "step": 227620 }, { "epoch": 0.4, "learning_rate": 3.015203144564152e-05, "loss": 2.3526, "step": 227630 }, { "epoch": 0.4, "learning_rate": 3.0151159505714694e-05, "loss": 2.3782, "step": 227640 }, { "epoch": 0.4, "learning_rate": 3.015028756578787e-05, "loss": 2.3786, "step": 227650 }, { "epoch": 0.4, "learning_rate": 3.0149415625861045e-05, "loss": 2.3287, "step": 227660 }, { "epoch": 0.4, "learning_rate": 3.0148543685934215e-05, "loss": 2.5151, "step": 227670 }, { "epoch": 0.4, "learning_rate": 3.014767174600739e-05, "loss": 2.4618, "step": 227680 }, { "epoch": 0.4, "learning_rate": 3.0146799806080562e-05, "loss": 2.4114, "step": 227690 }, { "epoch": 0.4, "learning_rate": 3.0145927866153733e-05, "loss": 2.4437, "step": 227700 }, { "epoch": 0.4, "learning_rate": 3.0145055926226907e-05, "loss": 2.3955, "step": 227710 }, { "epoch": 0.4, "learning_rate": 3.0144183986300077e-05, "loss": 2.3003, "step": 227720 }, { "epoch": 0.4, "learning_rate": 3.0143312046373258e-05, "loss": 2.4035, "step": 227730 }, { "epoch": 0.4, "learning_rate": 3.0142440106446428e-05, "loss": 2.4513, "step": 227740 }, { "epoch": 0.4, "learning_rate": 3.01415681665196e-05, "loss": 2.5157, "step": 227750 }, { "epoch": 0.4, "learning_rate": 3.0140696226592775e-05, "loss": 2.4375, "step": 227760 }, { "epoch": 0.4, "learning_rate": 3.0139824286665946e-05, "loss": 2.4091, "step": 227770 }, { "epoch": 0.4, "learning_rate": 3.013895234673912e-05, "loss": 2.3912, "step": 227780 }, { "epoch": 0.4, "learning_rate": 3.013808040681229e-05, "loss": 2.3237, "step": 227790 }, { "epoch": 0.4, "learning_rate": 3.013720846688547e-05, "loss": 2.4231, "step": 227800 }, { "epoch": 0.4, "learning_rate": 3.013633652695864e-05, "loss": 2.4252, "step": 227810 }, { "epoch": 0.4, "learning_rate": 3.0135464587031815e-05, "loss": 2.4417, "step": 227820 }, { "epoch": 0.4, "learning_rate": 3.0134592647104985e-05, "loss": 2.2845, "step": 227830 }, { "epoch": 0.4, "learning_rate": 3.013372070717816e-05, "loss": 2.3971, "step": 227840 }, { "epoch": 0.4, "learning_rate": 3.0132848767251333e-05, "loss": 2.5129, "step": 227850 }, { "epoch": 0.4, "learning_rate": 3.0131976827324503e-05, "loss": 2.3793, "step": 227860 }, { "epoch": 0.4, "learning_rate": 3.0131104887397684e-05, "loss": 2.3622, "step": 227870 }, { "epoch": 0.4, "learning_rate": 3.0130232947470854e-05, "loss": 2.387, "step": 227880 }, { "epoch": 0.4, "learning_rate": 3.0129361007544028e-05, "loss": 2.4549, "step": 227890 }, { "epoch": 0.4, "learning_rate": 3.0128489067617198e-05, "loss": 2.2664, "step": 227900 }, { "epoch": 0.4, "learning_rate": 3.0127617127690372e-05, "loss": 2.3122, "step": 227910 }, { "epoch": 0.4, "learning_rate": 3.0126745187763546e-05, "loss": 2.3408, "step": 227920 }, { "epoch": 0.4, "learning_rate": 3.0125873247836716e-05, "loss": 2.4657, "step": 227930 }, { "epoch": 0.4, "learning_rate": 3.012500130790989e-05, "loss": 2.3683, "step": 227940 }, { "epoch": 0.4, "learning_rate": 3.0124129367983067e-05, "loss": 2.3707, "step": 227950 }, { "epoch": 0.4, "learning_rate": 3.012325742805624e-05, "loss": 2.3308, "step": 227960 }, { "epoch": 0.4, "learning_rate": 3.012238548812941e-05, "loss": 2.4199, "step": 227970 }, { "epoch": 0.4, "learning_rate": 3.0121513548202585e-05, "loss": 2.3599, "step": 227980 }, { "epoch": 0.4, "learning_rate": 3.012064160827576e-05, "loss": 2.4091, "step": 227990 }, { "epoch": 0.4, "learning_rate": 3.011976966834893e-05, "loss": 2.3792, "step": 228000 }, { "epoch": 0.4, "learning_rate": 3.0118897728422103e-05, "loss": 2.3181, "step": 228010 }, { "epoch": 0.4, "learning_rate": 3.011802578849528e-05, "loss": 2.4577, "step": 228020 }, { "epoch": 0.4, "learning_rate": 3.0117153848568454e-05, "loss": 2.3489, "step": 228030 }, { "epoch": 0.4, "learning_rate": 3.0116281908641624e-05, "loss": 2.427, "step": 228040 }, { "epoch": 0.4, "learning_rate": 3.0115409968714798e-05, "loss": 2.3569, "step": 228050 }, { "epoch": 0.4, "learning_rate": 3.0114538028787968e-05, "loss": 2.4005, "step": 228060 }, { "epoch": 0.4, "learning_rate": 3.0113666088861142e-05, "loss": 2.4095, "step": 228070 }, { "epoch": 0.4, "learning_rate": 3.0112794148934316e-05, "loss": 2.4533, "step": 228080 }, { "epoch": 0.4, "learning_rate": 3.0111922209007486e-05, "loss": 2.4458, "step": 228090 }, { "epoch": 0.4, "learning_rate": 3.0111050269080667e-05, "loss": 2.3545, "step": 228100 }, { "epoch": 0.4, "learning_rate": 3.0110178329153837e-05, "loss": 2.4627, "step": 228110 }, { "epoch": 0.4, "learning_rate": 3.010930638922701e-05, "loss": 2.4283, "step": 228120 }, { "epoch": 0.4, "learning_rate": 3.010843444930018e-05, "loss": 2.4013, "step": 228130 }, { "epoch": 0.4, "learning_rate": 3.0107562509373355e-05, "loss": 2.5265, "step": 228140 }, { "epoch": 0.4, "learning_rate": 3.010669056944653e-05, "loss": 2.3931, "step": 228150 }, { "epoch": 0.4, "learning_rate": 3.01058186295197e-05, "loss": 2.4469, "step": 228160 }, { "epoch": 0.4, "learning_rate": 3.0104946689592876e-05, "loss": 2.3986, "step": 228170 }, { "epoch": 0.4, "learning_rate": 3.010407474966605e-05, "loss": 2.3571, "step": 228180 }, { "epoch": 0.4, "learning_rate": 3.0103202809739224e-05, "loss": 2.4391, "step": 228190 }, { "epoch": 0.4, "learning_rate": 3.0102330869812394e-05, "loss": 2.2686, "step": 228200 }, { "epoch": 0.4, "learning_rate": 3.0101458929885568e-05, "loss": 2.3176, "step": 228210 }, { "epoch": 0.4, "learning_rate": 3.010058698995874e-05, "loss": 2.3909, "step": 228220 }, { "epoch": 0.4, "learning_rate": 3.0099715050031912e-05, "loss": 2.4523, "step": 228230 }, { "epoch": 0.4, "learning_rate": 3.0098843110105086e-05, "loss": 2.3511, "step": 228240 }, { "epoch": 0.4, "learning_rate": 3.0097971170178263e-05, "loss": 2.4388, "step": 228250 }, { "epoch": 0.4, "learning_rate": 3.0097099230251437e-05, "loss": 2.4159, "step": 228260 }, { "epoch": 0.4, "learning_rate": 3.0096227290324607e-05, "loss": 2.4936, "step": 228270 }, { "epoch": 0.4, "learning_rate": 3.009535535039778e-05, "loss": 2.4067, "step": 228280 }, { "epoch": 0.4, "learning_rate": 3.009448341047095e-05, "loss": 2.4244, "step": 228290 }, { "epoch": 0.4, "learning_rate": 3.0093611470544125e-05, "loss": 2.4004, "step": 228300 }, { "epoch": 0.4, "learning_rate": 3.00927395306173e-05, "loss": 2.3827, "step": 228310 }, { "epoch": 0.4, "learning_rate": 3.0091867590690476e-05, "loss": 2.4014, "step": 228320 }, { "epoch": 0.4, "learning_rate": 3.0090995650763646e-05, "loss": 2.3108, "step": 228330 }, { "epoch": 0.4, "learning_rate": 3.009012371083682e-05, "loss": 2.3752, "step": 228340 }, { "epoch": 0.4, "learning_rate": 3.0089251770909994e-05, "loss": 2.383, "step": 228350 }, { "epoch": 0.4, "learning_rate": 3.0088379830983164e-05, "loss": 2.4643, "step": 228360 }, { "epoch": 0.4, "learning_rate": 3.0087507891056338e-05, "loss": 2.3931, "step": 228370 }, { "epoch": 0.4, "learning_rate": 3.0086635951129512e-05, "loss": 2.4844, "step": 228380 }, { "epoch": 0.4, "learning_rate": 3.008576401120269e-05, "loss": 2.3707, "step": 228390 }, { "epoch": 0.4, "learning_rate": 3.008489207127586e-05, "loss": 2.4261, "step": 228400 }, { "epoch": 0.4, "learning_rate": 3.0084020131349033e-05, "loss": 2.2833, "step": 228410 }, { "epoch": 0.4, "learning_rate": 3.0083148191422207e-05, "loss": 2.4031, "step": 228420 }, { "epoch": 0.4, "learning_rate": 3.0082276251495377e-05, "loss": 2.379, "step": 228430 }, { "epoch": 0.4, "learning_rate": 3.008140431156855e-05, "loss": 2.4282, "step": 228440 }, { "epoch": 0.4, "learning_rate": 3.008053237164172e-05, "loss": 2.4186, "step": 228450 }, { "epoch": 0.4, "learning_rate": 3.0079660431714895e-05, "loss": 2.4015, "step": 228460 }, { "epoch": 0.4, "learning_rate": 3.0078788491788072e-05, "loss": 2.3768, "step": 228470 }, { "epoch": 0.4, "learning_rate": 3.0077916551861246e-05, "loss": 2.4324, "step": 228480 }, { "epoch": 0.4, "learning_rate": 3.007704461193442e-05, "loss": 2.3539, "step": 228490 }, { "epoch": 0.4, "learning_rate": 3.007617267200759e-05, "loss": 2.4593, "step": 228500 }, { "epoch": 0.4, "learning_rate": 3.0075300732080764e-05, "loss": 2.3541, "step": 228510 }, { "epoch": 0.4, "learning_rate": 3.0074428792153935e-05, "loss": 2.4687, "step": 228520 }, { "epoch": 0.4, "learning_rate": 3.0073556852227108e-05, "loss": 2.2957, "step": 228530 }, { "epoch": 0.4, "learning_rate": 3.0072684912300285e-05, "loss": 2.3712, "step": 228540 }, { "epoch": 0.4, "learning_rate": 3.007181297237346e-05, "loss": 2.3883, "step": 228550 }, { "epoch": 0.4, "learning_rate": 3.007094103244663e-05, "loss": 2.3947, "step": 228560 }, { "epoch": 0.4, "learning_rate": 3.0070069092519803e-05, "loss": 2.5382, "step": 228570 }, { "epoch": 0.4, "learning_rate": 3.0069197152592977e-05, "loss": 2.4176, "step": 228580 }, { "epoch": 0.4, "learning_rate": 3.0068325212666148e-05, "loss": 2.3864, "step": 228590 }, { "epoch": 0.4, "learning_rate": 3.006745327273932e-05, "loss": 2.3765, "step": 228600 }, { "epoch": 0.4, "learning_rate": 3.0066581332812495e-05, "loss": 2.501, "step": 228610 }, { "epoch": 0.4, "learning_rate": 3.0065709392885672e-05, "loss": 2.4984, "step": 228620 }, { "epoch": 0.4, "learning_rate": 3.0064837452958843e-05, "loss": 2.3528, "step": 228630 }, { "epoch": 0.4, "learning_rate": 3.0063965513032016e-05, "loss": 2.4372, "step": 228640 }, { "epoch": 0.4, "learning_rate": 3.006309357310519e-05, "loss": 2.4225, "step": 228650 }, { "epoch": 0.4, "learning_rate": 3.006222163317836e-05, "loss": 2.319, "step": 228660 }, { "epoch": 0.4, "learning_rate": 3.0061349693251534e-05, "loss": 2.2999, "step": 228670 }, { "epoch": 0.4, "learning_rate": 3.0060477753324705e-05, "loss": 2.4998, "step": 228680 }, { "epoch": 0.4, "learning_rate": 3.0059605813397885e-05, "loss": 2.4799, "step": 228690 }, { "epoch": 0.4, "learning_rate": 3.0058733873471056e-05, "loss": 2.3579, "step": 228700 }, { "epoch": 0.4, "learning_rate": 3.005786193354423e-05, "loss": 2.3289, "step": 228710 }, { "epoch": 0.4, "learning_rate": 3.0056989993617403e-05, "loss": 2.4426, "step": 228720 }, { "epoch": 0.4, "learning_rate": 3.0056118053690574e-05, "loss": 2.2476, "step": 228730 }, { "epoch": 0.4, "learning_rate": 3.0055246113763747e-05, "loss": 2.3682, "step": 228740 }, { "epoch": 0.4, "learning_rate": 3.0054374173836918e-05, "loss": 2.4564, "step": 228750 }, { "epoch": 0.4, "learning_rate": 3.005350223391009e-05, "loss": 2.3832, "step": 228760 }, { "epoch": 0.4, "learning_rate": 3.005263029398327e-05, "loss": 2.2879, "step": 228770 }, { "epoch": 0.4, "learning_rate": 3.0051758354056442e-05, "loss": 2.3397, "step": 228780 }, { "epoch": 0.4, "learning_rate": 3.0050886414129613e-05, "loss": 2.3987, "step": 228790 }, { "epoch": 0.4, "learning_rate": 3.0050014474202787e-05, "loss": 2.4077, "step": 228800 }, { "epoch": 0.4, "learning_rate": 3.004914253427596e-05, "loss": 2.5326, "step": 228810 }, { "epoch": 0.4, "learning_rate": 3.004827059434913e-05, "loss": 2.3357, "step": 228820 }, { "epoch": 0.4, "learning_rate": 3.0047398654422304e-05, "loss": 2.3913, "step": 228830 }, { "epoch": 0.4, "learning_rate": 3.004652671449548e-05, "loss": 2.3902, "step": 228840 }, { "epoch": 0.4, "learning_rate": 3.0045654774568655e-05, "loss": 2.4817, "step": 228850 }, { "epoch": 0.4, "learning_rate": 3.0044782834641826e-05, "loss": 2.4754, "step": 228860 }, { "epoch": 0.4, "learning_rate": 3.0043910894715e-05, "loss": 2.4379, "step": 228870 }, { "epoch": 0.4, "learning_rate": 3.0043038954788173e-05, "loss": 2.3033, "step": 228880 }, { "epoch": 0.4, "learning_rate": 3.0042167014861344e-05, "loss": 2.4105, "step": 228890 }, { "epoch": 0.4, "learning_rate": 3.0041295074934517e-05, "loss": 2.5305, "step": 228900 }, { "epoch": 0.4, "learning_rate": 3.0040423135007688e-05, "loss": 2.3499, "step": 228910 }, { "epoch": 0.4, "learning_rate": 3.003955119508087e-05, "loss": 2.4149, "step": 228920 }, { "epoch": 0.4, "learning_rate": 3.003867925515404e-05, "loss": 2.4941, "step": 228930 }, { "epoch": 0.4, "learning_rate": 3.0037807315227213e-05, "loss": 2.2913, "step": 228940 }, { "epoch": 0.4, "learning_rate": 3.0036935375300383e-05, "loss": 2.3685, "step": 228950 }, { "epoch": 0.4, "learning_rate": 3.0036063435373557e-05, "loss": 2.4812, "step": 228960 }, { "epoch": 0.4, "learning_rate": 3.003519149544673e-05, "loss": 2.3526, "step": 228970 }, { "epoch": 0.4, "learning_rate": 3.00343195555199e-05, "loss": 2.4114, "step": 228980 }, { "epoch": 0.4, "learning_rate": 3.003344761559308e-05, "loss": 2.4372, "step": 228990 }, { "epoch": 0.4, "learning_rate": 3.0032575675666252e-05, "loss": 2.3688, "step": 229000 }, { "epoch": 0.4, "learning_rate": 3.0031703735739426e-05, "loss": 2.5684, "step": 229010 }, { "epoch": 0.4, "learning_rate": 3.0030831795812596e-05, "loss": 2.3578, "step": 229020 }, { "epoch": 0.4, "learning_rate": 3.002995985588577e-05, "loss": 2.4591, "step": 229030 }, { "epoch": 0.4, "learning_rate": 3.0029087915958943e-05, "loss": 2.4633, "step": 229040 }, { "epoch": 0.4, "learning_rate": 3.0028215976032114e-05, "loss": 2.4424, "step": 229050 }, { "epoch": 0.4, "learning_rate": 3.002734403610529e-05, "loss": 2.39, "step": 229060 }, { "epoch": 0.4, "learning_rate": 3.0026472096178465e-05, "loss": 2.36, "step": 229070 }, { "epoch": 0.4, "learning_rate": 3.002560015625164e-05, "loss": 2.3392, "step": 229080 }, { "epoch": 0.4, "learning_rate": 3.002472821632481e-05, "loss": 2.4401, "step": 229090 }, { "epoch": 0.4, "learning_rate": 3.0023856276397983e-05, "loss": 2.4074, "step": 229100 }, { "epoch": 0.4, "learning_rate": 3.0022984336471156e-05, "loss": 2.4014, "step": 229110 }, { "epoch": 0.4, "learning_rate": 3.0022112396544327e-05, "loss": 2.4165, "step": 229120 }, { "epoch": 0.4, "learning_rate": 3.00212404566175e-05, "loss": 2.3409, "step": 229130 }, { "epoch": 0.4, "learning_rate": 3.0020368516690678e-05, "loss": 2.5605, "step": 229140 }, { "epoch": 0.4, "learning_rate": 3.001949657676385e-05, "loss": 2.41, "step": 229150 }, { "epoch": 0.4, "learning_rate": 3.0018624636837022e-05, "loss": 2.413, "step": 229160 }, { "epoch": 0.4, "learning_rate": 3.0017752696910196e-05, "loss": 2.5036, "step": 229170 }, { "epoch": 0.4, "learning_rate": 3.0016880756983366e-05, "loss": 2.3787, "step": 229180 }, { "epoch": 0.4, "learning_rate": 3.001600881705654e-05, "loss": 2.372, "step": 229190 }, { "epoch": 0.4, "learning_rate": 3.0015136877129714e-05, "loss": 2.5239, "step": 229200 }, { "epoch": 0.4, "learning_rate": 3.001426493720289e-05, "loss": 2.4654, "step": 229210 }, { "epoch": 0.4, "learning_rate": 3.0013392997276065e-05, "loss": 2.3772, "step": 229220 }, { "epoch": 0.4, "learning_rate": 3.0012521057349235e-05, "loss": 2.3126, "step": 229230 }, { "epoch": 0.4, "learning_rate": 3.001164911742241e-05, "loss": 2.2879, "step": 229240 }, { "epoch": 0.4, "learning_rate": 3.001077717749558e-05, "loss": 2.3368, "step": 229250 }, { "epoch": 0.4, "learning_rate": 3.0009905237568753e-05, "loss": 2.5277, "step": 229260 }, { "epoch": 0.4, "learning_rate": 3.0009033297641927e-05, "loss": 2.3847, "step": 229270 }, { "epoch": 0.4, "learning_rate": 3.0008161357715097e-05, "loss": 2.3436, "step": 229280 }, { "epoch": 0.4, "learning_rate": 3.0007289417788274e-05, "loss": 2.3717, "step": 229290 }, { "epoch": 0.4, "learning_rate": 3.0006417477861448e-05, "loss": 2.3324, "step": 229300 }, { "epoch": 0.4, "learning_rate": 3.000554553793462e-05, "loss": 2.3799, "step": 229310 }, { "epoch": 0.4, "learning_rate": 3.0004673598007792e-05, "loss": 2.3948, "step": 229320 }, { "epoch": 0.4, "learning_rate": 3.0003801658080966e-05, "loss": 2.536, "step": 229330 }, { "epoch": 0.4, "learning_rate": 3.000292971815414e-05, "loss": 2.4389, "step": 229340 }, { "epoch": 0.4, "learning_rate": 3.000205777822731e-05, "loss": 2.3748, "step": 229350 }, { "epoch": 0.4, "learning_rate": 3.0001185838300487e-05, "loss": 2.4577, "step": 229360 }, { "epoch": 0.4, "learning_rate": 3.000031389837366e-05, "loss": 2.4191, "step": 229370 }, { "epoch": 0.4, "learning_rate": 2.9999441958446835e-05, "loss": 2.4343, "step": 229380 }, { "epoch": 0.4, "learning_rate": 2.9998570018520005e-05, "loss": 2.3488, "step": 229390 }, { "epoch": 0.4, "learning_rate": 2.999769807859318e-05, "loss": 2.3078, "step": 229400 }, { "epoch": 0.4, "learning_rate": 2.999682613866635e-05, "loss": 2.4495, "step": 229410 }, { "epoch": 0.4, "learning_rate": 2.9995954198739523e-05, "loss": 2.335, "step": 229420 }, { "epoch": 0.4, "learning_rate": 2.9995082258812697e-05, "loss": 2.3768, "step": 229430 }, { "epoch": 0.4, "learning_rate": 2.9994210318885874e-05, "loss": 2.4947, "step": 229440 }, { "epoch": 0.4, "learning_rate": 2.9993338378959048e-05, "loss": 2.5406, "step": 229450 }, { "epoch": 0.4, "learning_rate": 2.9992466439032218e-05, "loss": 2.3812, "step": 229460 }, { "epoch": 0.4, "learning_rate": 2.9991594499105392e-05, "loss": 2.311, "step": 229470 }, { "epoch": 0.4, "learning_rate": 2.9990722559178562e-05, "loss": 2.3023, "step": 229480 }, { "epoch": 0.4, "learning_rate": 2.9989850619251736e-05, "loss": 2.3307, "step": 229490 }, { "epoch": 0.4, "learning_rate": 2.998897867932491e-05, "loss": 2.4229, "step": 229500 }, { "epoch": 0.4, "learning_rate": 2.9988106739398087e-05, "loss": 2.3977, "step": 229510 }, { "epoch": 0.4, "learning_rate": 2.9987234799471257e-05, "loss": 2.4633, "step": 229520 }, { "epoch": 0.4, "learning_rate": 2.998636285954443e-05, "loss": 2.3847, "step": 229530 }, { "epoch": 0.4, "learning_rate": 2.9985490919617605e-05, "loss": 2.3912, "step": 229540 }, { "epoch": 0.4, "learning_rate": 2.9984618979690775e-05, "loss": 2.4079, "step": 229550 }, { "epoch": 0.4, "learning_rate": 2.998374703976395e-05, "loss": 2.4619, "step": 229560 }, { "epoch": 0.4, "learning_rate": 2.998287509983712e-05, "loss": 2.3957, "step": 229570 }, { "epoch": 0.4, "learning_rate": 2.9982003159910293e-05, "loss": 2.5016, "step": 229580 }, { "epoch": 0.4, "learning_rate": 2.998113121998347e-05, "loss": 2.4016, "step": 229590 }, { "epoch": 0.4, "learning_rate": 2.9980259280056644e-05, "loss": 2.3767, "step": 229600 }, { "epoch": 0.4, "learning_rate": 2.9979387340129818e-05, "loss": 2.3527, "step": 229610 }, { "epoch": 0.4, "learning_rate": 2.9978515400202988e-05, "loss": 2.461, "step": 229620 }, { "epoch": 0.4, "learning_rate": 2.9977643460276162e-05, "loss": 2.391, "step": 229630 }, { "epoch": 0.4, "learning_rate": 2.9976771520349332e-05, "loss": 2.4068, "step": 229640 }, { "epoch": 0.4, "learning_rate": 2.9975899580422506e-05, "loss": 2.2723, "step": 229650 }, { "epoch": 0.4, "learning_rate": 2.9975027640495683e-05, "loss": 2.4809, "step": 229660 }, { "epoch": 0.4, "learning_rate": 2.9974155700568857e-05, "loss": 2.418, "step": 229670 }, { "epoch": 0.4, "learning_rate": 2.9973283760642027e-05, "loss": 2.4203, "step": 229680 }, { "epoch": 0.4, "learning_rate": 2.99724118207152e-05, "loss": 2.4684, "step": 229690 }, { "epoch": 0.4, "learning_rate": 2.9971539880788375e-05, "loss": 2.3469, "step": 229700 }, { "epoch": 0.4, "learning_rate": 2.9970667940861545e-05, "loss": 2.3692, "step": 229710 }, { "epoch": 0.4, "learning_rate": 2.996979600093472e-05, "loss": 2.4128, "step": 229720 }, { "epoch": 0.4, "learning_rate": 2.9968924061007896e-05, "loss": 2.3543, "step": 229730 }, { "epoch": 0.4, "learning_rate": 2.996805212108107e-05, "loss": 2.2687, "step": 229740 }, { "epoch": 0.4, "learning_rate": 2.996718018115424e-05, "loss": 2.5014, "step": 229750 }, { "epoch": 0.4, "learning_rate": 2.9966308241227414e-05, "loss": 2.4241, "step": 229760 }, { "epoch": 0.4, "learning_rate": 2.9965436301300588e-05, "loss": 2.3707, "step": 229770 }, { "epoch": 0.4, "learning_rate": 2.996456436137376e-05, "loss": 2.4863, "step": 229780 }, { "epoch": 0.4, "learning_rate": 2.9963692421446932e-05, "loss": 2.368, "step": 229790 }, { "epoch": 0.4, "learning_rate": 2.9962820481520103e-05, "loss": 2.3334, "step": 229800 }, { "epoch": 0.4, "learning_rate": 2.9961948541593283e-05, "loss": 2.3477, "step": 229810 }, { "epoch": 0.4, "learning_rate": 2.9961076601666453e-05, "loss": 2.3531, "step": 229820 }, { "epoch": 0.4, "learning_rate": 2.9960204661739627e-05, "loss": 2.41, "step": 229830 }, { "epoch": 0.4, "learning_rate": 2.99593327218128e-05, "loss": 2.3816, "step": 229840 }, { "epoch": 0.4, "learning_rate": 2.995846078188597e-05, "loss": 2.5305, "step": 229850 }, { "epoch": 0.4, "learning_rate": 2.9957588841959145e-05, "loss": 2.4658, "step": 229860 }, { "epoch": 0.4, "learning_rate": 2.9956716902032316e-05, "loss": 2.3685, "step": 229870 }, { "epoch": 0.4, "learning_rate": 2.9955844962105496e-05, "loss": 2.3428, "step": 229880 }, { "epoch": 0.4, "learning_rate": 2.9954973022178666e-05, "loss": 2.3708, "step": 229890 }, { "epoch": 0.4, "learning_rate": 2.995410108225184e-05, "loss": 2.3753, "step": 229900 }, { "epoch": 0.4, "learning_rate": 2.995322914232501e-05, "loss": 2.3653, "step": 229910 }, { "epoch": 0.4, "learning_rate": 2.9952357202398184e-05, "loss": 2.3553, "step": 229920 }, { "epoch": 0.4, "learning_rate": 2.9951485262471358e-05, "loss": 2.3571, "step": 229930 }, { "epoch": 0.4, "learning_rate": 2.995061332254453e-05, "loss": 2.3451, "step": 229940 }, { "epoch": 0.4, "learning_rate": 2.9949741382617702e-05, "loss": 2.4391, "step": 229950 }, { "epoch": 0.4, "learning_rate": 2.994886944269088e-05, "loss": 2.3115, "step": 229960 }, { "epoch": 0.4, "learning_rate": 2.9947997502764053e-05, "loss": 2.4255, "step": 229970 }, { "epoch": 0.4, "learning_rate": 2.9947125562837224e-05, "loss": 2.3074, "step": 229980 }, { "epoch": 0.4, "learning_rate": 2.9946253622910397e-05, "loss": 2.3355, "step": 229990 }, { "epoch": 0.4, "learning_rate": 2.994538168298357e-05, "loss": 2.4978, "step": 230000 }, { "epoch": 0.4, "learning_rate": 2.994450974305674e-05, "loss": 2.3777, "step": 230010 }, { "epoch": 0.4, "learning_rate": 2.9943637803129915e-05, "loss": 2.4549, "step": 230020 }, { "epoch": 0.4, "learning_rate": 2.9942765863203092e-05, "loss": 2.3007, "step": 230030 }, { "epoch": 0.4, "learning_rate": 2.9941893923276266e-05, "loss": 2.4542, "step": 230040 }, { "epoch": 0.4, "learning_rate": 2.9941021983349437e-05, "loss": 2.4662, "step": 230050 }, { "epoch": 0.4, "learning_rate": 2.994015004342261e-05, "loss": 2.2724, "step": 230060 }, { "epoch": 0.4, "learning_rate": 2.9939278103495784e-05, "loss": 2.3585, "step": 230070 }, { "epoch": 0.4, "learning_rate": 2.9938406163568955e-05, "loss": 2.5, "step": 230080 }, { "epoch": 0.4, "learning_rate": 2.9937534223642128e-05, "loss": 2.4529, "step": 230090 }, { "epoch": 0.4, "learning_rate": 2.99366622837153e-05, "loss": 2.3394, "step": 230100 }, { "epoch": 0.4, "learning_rate": 2.993579034378848e-05, "loss": 2.3968, "step": 230110 }, { "epoch": 0.4, "learning_rate": 2.993491840386165e-05, "loss": 2.3874, "step": 230120 }, { "epoch": 0.4, "learning_rate": 2.9934046463934823e-05, "loss": 2.323, "step": 230130 }, { "epoch": 0.4, "learning_rate": 2.9933174524007994e-05, "loss": 2.3708, "step": 230140 }, { "epoch": 0.4, "learning_rate": 2.9932302584081168e-05, "loss": 2.3648, "step": 230150 }, { "epoch": 0.4, "learning_rate": 2.993143064415434e-05, "loss": 2.3297, "step": 230160 }, { "epoch": 0.4, "learning_rate": 2.993055870422751e-05, "loss": 2.3563, "step": 230170 }, { "epoch": 0.4, "learning_rate": 2.9929686764300692e-05, "loss": 2.3346, "step": 230180 }, { "epoch": 0.4, "learning_rate": 2.9928814824373863e-05, "loss": 2.422, "step": 230190 }, { "epoch": 0.4, "learning_rate": 2.9927942884447036e-05, "loss": 2.3892, "step": 230200 }, { "epoch": 0.4, "learning_rate": 2.9927070944520207e-05, "loss": 2.3009, "step": 230210 }, { "epoch": 0.4, "learning_rate": 2.992619900459338e-05, "loss": 2.2901, "step": 230220 }, { "epoch": 0.4, "learning_rate": 2.9925327064666554e-05, "loss": 2.3236, "step": 230230 }, { "epoch": 0.4, "learning_rate": 2.9924455124739725e-05, "loss": 2.4039, "step": 230240 }, { "epoch": 0.4, "learning_rate": 2.99235831848129e-05, "loss": 2.4187, "step": 230250 }, { "epoch": 0.4, "learning_rate": 2.9922711244886076e-05, "loss": 2.3976, "step": 230260 }, { "epoch": 0.4, "learning_rate": 2.992183930495925e-05, "loss": 2.4796, "step": 230270 }, { "epoch": 0.4, "learning_rate": 2.992096736503242e-05, "loss": 2.4787, "step": 230280 }, { "epoch": 0.4, "learning_rate": 2.9920095425105594e-05, "loss": 2.3778, "step": 230290 }, { "epoch": 0.4, "learning_rate": 2.9919223485178764e-05, "loss": 2.3789, "step": 230300 }, { "epoch": 0.4, "learning_rate": 2.9918351545251938e-05, "loss": 2.4116, "step": 230310 }, { "epoch": 0.4, "learning_rate": 2.991747960532511e-05, "loss": 2.4378, "step": 230320 }, { "epoch": 0.4, "learning_rate": 2.991660766539829e-05, "loss": 2.3434, "step": 230330 }, { "epoch": 0.4, "learning_rate": 2.9915735725471462e-05, "loss": 2.3771, "step": 230340 }, { "epoch": 0.4, "learning_rate": 2.9914863785544633e-05, "loss": 2.4692, "step": 230350 }, { "epoch": 0.4, "learning_rate": 2.9913991845617807e-05, "loss": 2.3964, "step": 230360 }, { "epoch": 0.4, "learning_rate": 2.9913119905690977e-05, "loss": 2.4336, "step": 230370 }, { "epoch": 0.4, "learning_rate": 2.991224796576415e-05, "loss": 2.4879, "step": 230380 }, { "epoch": 0.4, "learning_rate": 2.9911376025837324e-05, "loss": 2.3746, "step": 230390 }, { "epoch": 0.4, "learning_rate": 2.99105040859105e-05, "loss": 2.3379, "step": 230400 }, { "epoch": 0.4, "learning_rate": 2.9909632145983672e-05, "loss": 2.321, "step": 230410 }, { "epoch": 0.4, "learning_rate": 2.9908760206056846e-05, "loss": 2.3469, "step": 230420 }, { "epoch": 0.4, "learning_rate": 2.990788826613002e-05, "loss": 2.2469, "step": 230430 }, { "epoch": 0.4, "learning_rate": 2.990701632620319e-05, "loss": 2.2498, "step": 230440 }, { "epoch": 0.4, "learning_rate": 2.9906144386276364e-05, "loss": 2.4172, "step": 230450 }, { "epoch": 0.4, "learning_rate": 2.9905272446349537e-05, "loss": 2.3781, "step": 230460 }, { "epoch": 0.4, "learning_rate": 2.9904400506422708e-05, "loss": 2.3695, "step": 230470 }, { "epoch": 0.4, "learning_rate": 2.9903528566495885e-05, "loss": 2.4668, "step": 230480 }, { "epoch": 0.4, "learning_rate": 2.990265662656906e-05, "loss": 2.3288, "step": 230490 }, { "epoch": 0.4, "learning_rate": 2.9901784686642233e-05, "loss": 2.3539, "step": 230500 }, { "epoch": 0.4, "learning_rate": 2.9900912746715403e-05, "loss": 2.5015, "step": 230510 }, { "epoch": 0.4, "learning_rate": 2.9900040806788577e-05, "loss": 2.4994, "step": 230520 }, { "epoch": 0.4, "learning_rate": 2.9899168866861747e-05, "loss": 2.3228, "step": 230530 }, { "epoch": 0.4, "learning_rate": 2.989829692693492e-05, "loss": 2.4102, "step": 230540 }, { "epoch": 0.4, "learning_rate": 2.9897424987008098e-05, "loss": 2.4166, "step": 230550 }, { "epoch": 0.4, "learning_rate": 2.9896553047081272e-05, "loss": 2.418, "step": 230560 }, { "epoch": 0.4, "learning_rate": 2.9895681107154446e-05, "loss": 2.4007, "step": 230570 }, { "epoch": 0.4, "learning_rate": 2.9894809167227616e-05, "loss": 2.525, "step": 230580 }, { "epoch": 0.4, "learning_rate": 2.989393722730079e-05, "loss": 2.4292, "step": 230590 }, { "epoch": 0.4, "learning_rate": 2.989306528737396e-05, "loss": 2.4097, "step": 230600 }, { "epoch": 0.4, "learning_rate": 2.9892193347447134e-05, "loss": 2.3473, "step": 230610 }, { "epoch": 0.4, "learning_rate": 2.9891321407520308e-05, "loss": 2.4169, "step": 230620 }, { "epoch": 0.4, "learning_rate": 2.9890449467593485e-05, "loss": 2.4131, "step": 230630 }, { "epoch": 0.4, "learning_rate": 2.9889577527666655e-05, "loss": 2.4808, "step": 230640 }, { "epoch": 0.4, "learning_rate": 2.988870558773983e-05, "loss": 2.3472, "step": 230650 }, { "epoch": 0.4, "learning_rate": 2.9887833647813003e-05, "loss": 2.4317, "step": 230660 }, { "epoch": 0.4, "learning_rate": 2.9886961707886173e-05, "loss": 2.3459, "step": 230670 }, { "epoch": 0.4, "learning_rate": 2.9886089767959347e-05, "loss": 2.361, "step": 230680 }, { "epoch": 0.4, "learning_rate": 2.988521782803252e-05, "loss": 2.352, "step": 230690 }, { "epoch": 0.4, "learning_rate": 2.9884345888105698e-05, "loss": 2.3951, "step": 230700 }, { "epoch": 0.4, "learning_rate": 2.9883473948178868e-05, "loss": 2.3896, "step": 230710 }, { "epoch": 0.4, "learning_rate": 2.9882602008252042e-05, "loss": 2.3925, "step": 230720 }, { "epoch": 0.4, "learning_rate": 2.9881730068325216e-05, "loss": 2.3478, "step": 230730 }, { "epoch": 0.4, "learning_rate": 2.9880858128398386e-05, "loss": 2.4617, "step": 230740 }, { "epoch": 0.4, "learning_rate": 2.987998618847156e-05, "loss": 2.4918, "step": 230750 }, { "epoch": 0.4, "learning_rate": 2.987911424854473e-05, "loss": 2.3397, "step": 230760 }, { "epoch": 0.4, "learning_rate": 2.9878242308617904e-05, "loss": 2.3214, "step": 230770 }, { "epoch": 0.4, "learning_rate": 2.987737036869108e-05, "loss": 2.3959, "step": 230780 }, { "epoch": 0.4, "learning_rate": 2.9876498428764255e-05, "loss": 2.5179, "step": 230790 }, { "epoch": 0.4, "learning_rate": 2.987562648883743e-05, "loss": 2.402, "step": 230800 }, { "epoch": 0.4, "learning_rate": 2.98747545489106e-05, "loss": 2.4268, "step": 230810 }, { "epoch": 0.4, "learning_rate": 2.9873882608983773e-05, "loss": 2.4338, "step": 230820 }, { "epoch": 0.4, "learning_rate": 2.9873010669056943e-05, "loss": 2.3373, "step": 230830 }, { "epoch": 0.4, "learning_rate": 2.9872138729130117e-05, "loss": 2.2227, "step": 230840 }, { "epoch": 0.4, "learning_rate": 2.9871266789203294e-05, "loss": 2.3839, "step": 230850 }, { "epoch": 0.4, "learning_rate": 2.9870394849276468e-05, "loss": 2.2575, "step": 230860 }, { "epoch": 0.4, "learning_rate": 2.986952290934964e-05, "loss": 2.5047, "step": 230870 }, { "epoch": 0.4, "learning_rate": 2.9868650969422812e-05, "loss": 2.4687, "step": 230880 }, { "epoch": 0.4, "learning_rate": 2.9867779029495986e-05, "loss": 2.445, "step": 230890 }, { "epoch": 0.4, "learning_rate": 2.9866907089569156e-05, "loss": 2.4922, "step": 230900 }, { "epoch": 0.4, "learning_rate": 2.986603514964233e-05, "loss": 2.4281, "step": 230910 }, { "epoch": 0.4, "learning_rate": 2.9865163209715507e-05, "loss": 2.3408, "step": 230920 }, { "epoch": 0.4, "learning_rate": 2.986429126978868e-05, "loss": 2.3552, "step": 230930 }, { "epoch": 0.4, "learning_rate": 2.986341932986185e-05, "loss": 2.5562, "step": 230940 }, { "epoch": 0.4, "learning_rate": 2.9862547389935025e-05, "loss": 2.299, "step": 230950 }, { "epoch": 0.4, "learning_rate": 2.98616754500082e-05, "loss": 2.357, "step": 230960 }, { "epoch": 0.4, "learning_rate": 2.986080351008137e-05, "loss": 2.4147, "step": 230970 }, { "epoch": 0.4, "learning_rate": 2.9859931570154543e-05, "loss": 2.4306, "step": 230980 }, { "epoch": 0.4, "learning_rate": 2.9859059630227713e-05, "loss": 2.4869, "step": 230990 }, { "epoch": 0.4, "learning_rate": 2.9858187690300894e-05, "loss": 2.4109, "step": 231000 }, { "epoch": 0.4, "learning_rate": 2.9857315750374064e-05, "loss": 2.391, "step": 231010 }, { "epoch": 0.4, "learning_rate": 2.9856443810447238e-05, "loss": 2.4216, "step": 231020 }, { "epoch": 0.4, "learning_rate": 2.9855571870520412e-05, "loss": 2.2887, "step": 231030 }, { "epoch": 0.4, "learning_rate": 2.9854699930593582e-05, "loss": 2.362, "step": 231040 }, { "epoch": 0.4, "learning_rate": 2.9853827990666756e-05, "loss": 2.4044, "step": 231050 }, { "epoch": 0.4, "learning_rate": 2.9852956050739926e-05, "loss": 2.3729, "step": 231060 }, { "epoch": 0.4, "learning_rate": 2.9852084110813107e-05, "loss": 2.3427, "step": 231070 }, { "epoch": 0.4, "learning_rate": 2.9851212170886277e-05, "loss": 2.3985, "step": 231080 }, { "epoch": 0.4, "learning_rate": 2.985034023095945e-05, "loss": 2.4428, "step": 231090 }, { "epoch": 0.4, "learning_rate": 2.984946829103262e-05, "loss": 2.357, "step": 231100 }, { "epoch": 0.4, "learning_rate": 2.9848596351105795e-05, "loss": 2.3619, "step": 231110 }, { "epoch": 0.4, "learning_rate": 2.984772441117897e-05, "loss": 2.3417, "step": 231120 }, { "epoch": 0.4, "learning_rate": 2.984685247125214e-05, "loss": 2.4973, "step": 231130 }, { "epoch": 0.4, "learning_rate": 2.9845980531325313e-05, "loss": 2.2356, "step": 231140 }, { "epoch": 0.4, "learning_rate": 2.984510859139849e-05, "loss": 2.4192, "step": 231150 }, { "epoch": 0.4, "learning_rate": 2.9844236651471664e-05, "loss": 2.3558, "step": 231160 }, { "epoch": 0.4, "learning_rate": 2.9843364711544834e-05, "loss": 2.3991, "step": 231170 }, { "epoch": 0.4, "learning_rate": 2.9842492771618008e-05, "loss": 2.3005, "step": 231180 }, { "epoch": 0.4, "learning_rate": 2.9841620831691182e-05, "loss": 2.3912, "step": 231190 }, { "epoch": 0.4, "learning_rate": 2.9840748891764352e-05, "loss": 2.4654, "step": 231200 }, { "epoch": 0.4, "learning_rate": 2.9839876951837526e-05, "loss": 2.4095, "step": 231210 }, { "epoch": 0.4, "learning_rate": 2.9839005011910703e-05, "loss": 2.4597, "step": 231220 }, { "epoch": 0.4, "learning_rate": 2.9838133071983877e-05, "loss": 2.2971, "step": 231230 }, { "epoch": 0.4, "learning_rate": 2.9837261132057047e-05, "loss": 2.3373, "step": 231240 }, { "epoch": 0.4, "learning_rate": 2.983638919213022e-05, "loss": 2.2804, "step": 231250 }, { "epoch": 0.4, "learning_rate": 2.983551725220339e-05, "loss": 2.3311, "step": 231260 }, { "epoch": 0.4, "learning_rate": 2.9834645312276565e-05, "loss": 2.4305, "step": 231270 }, { "epoch": 0.4, "learning_rate": 2.983377337234974e-05, "loss": 2.4089, "step": 231280 }, { "epoch": 0.4, "learning_rate": 2.983290143242291e-05, "loss": 2.4755, "step": 231290 }, { "epoch": 0.4, "learning_rate": 2.983202949249609e-05, "loss": 2.3235, "step": 231300 }, { "epoch": 0.4, "learning_rate": 2.983115755256926e-05, "loss": 2.3228, "step": 231310 }, { "epoch": 0.4, "learning_rate": 2.9830285612642434e-05, "loss": 2.4026, "step": 231320 }, { "epoch": 0.4, "learning_rate": 2.9829413672715605e-05, "loss": 2.5069, "step": 231330 }, { "epoch": 0.4, "learning_rate": 2.982854173278878e-05, "loss": 2.3467, "step": 231340 }, { "epoch": 0.4, "learning_rate": 2.9827669792861952e-05, "loss": 2.3507, "step": 231350 }, { "epoch": 0.4, "learning_rate": 2.9826797852935123e-05, "loss": 2.5256, "step": 231360 }, { "epoch": 0.4, "learning_rate": 2.98259259130083e-05, "loss": 2.4744, "step": 231370 }, { "epoch": 0.4, "learning_rate": 2.9825053973081473e-05, "loss": 2.4307, "step": 231380 }, { "epoch": 0.4, "learning_rate": 2.9824182033154647e-05, "loss": 2.4986, "step": 231390 }, { "epoch": 0.4, "learning_rate": 2.9823310093227818e-05, "loss": 2.4659, "step": 231400 }, { "epoch": 0.4, "learning_rate": 2.982243815330099e-05, "loss": 2.3549, "step": 231410 }, { "epoch": 0.4, "learning_rate": 2.9821566213374165e-05, "loss": 2.3863, "step": 231420 }, { "epoch": 0.4, "learning_rate": 2.9820694273447336e-05, "loss": 2.3983, "step": 231430 }, { "epoch": 0.4, "learning_rate": 2.981982233352051e-05, "loss": 2.3269, "step": 231440 }, { "epoch": 0.4, "learning_rate": 2.9818950393593686e-05, "loss": 2.351, "step": 231450 }, { "epoch": 0.4, "learning_rate": 2.981807845366686e-05, "loss": 2.3511, "step": 231460 }, { "epoch": 0.4, "learning_rate": 2.981720651374003e-05, "loss": 2.4358, "step": 231470 }, { "epoch": 0.4, "learning_rate": 2.9816334573813204e-05, "loss": 2.369, "step": 231480 }, { "epoch": 0.4, "learning_rate": 2.9815462633886375e-05, "loss": 2.5157, "step": 231490 }, { "epoch": 0.4, "learning_rate": 2.981459069395955e-05, "loss": 2.3762, "step": 231500 }, { "epoch": 0.4, "learning_rate": 2.9813718754032722e-05, "loss": 2.4582, "step": 231510 }, { "epoch": 0.4, "learning_rate": 2.98128468141059e-05, "loss": 2.3831, "step": 231520 }, { "epoch": 0.4, "learning_rate": 2.9811974874179073e-05, "loss": 2.4322, "step": 231530 }, { "epoch": 0.4, "learning_rate": 2.9811102934252244e-05, "loss": 2.2944, "step": 231540 }, { "epoch": 0.4, "learning_rate": 2.9810230994325417e-05, "loss": 2.4614, "step": 231550 }, { "epoch": 0.4, "learning_rate": 2.9809359054398588e-05, "loss": 2.4199, "step": 231560 }, { "epoch": 0.4, "learning_rate": 2.980848711447176e-05, "loss": 2.4346, "step": 231570 }, { "epoch": 0.4, "learning_rate": 2.9807615174544935e-05, "loss": 2.3539, "step": 231580 }, { "epoch": 0.4, "learning_rate": 2.9806743234618112e-05, "loss": 2.4582, "step": 231590 }, { "epoch": 0.4, "learning_rate": 2.9805871294691283e-05, "loss": 2.5053, "step": 231600 }, { "epoch": 0.4, "learning_rate": 2.9804999354764457e-05, "loss": 2.3914, "step": 231610 }, { "epoch": 0.4, "learning_rate": 2.980412741483763e-05, "loss": 2.3949, "step": 231620 }, { "epoch": 0.4, "learning_rate": 2.98032554749108e-05, "loss": 2.2505, "step": 231630 }, { "epoch": 0.4, "learning_rate": 2.9802383534983975e-05, "loss": 2.3573, "step": 231640 }, { "epoch": 0.4, "learning_rate": 2.980151159505715e-05, "loss": 2.3877, "step": 231650 }, { "epoch": 0.4, "learning_rate": 2.980063965513032e-05, "loss": 2.4372, "step": 231660 }, { "epoch": 0.4, "learning_rate": 2.9799767715203496e-05, "loss": 2.3378, "step": 231670 }, { "epoch": 0.4, "learning_rate": 2.979889577527667e-05, "loss": 2.3575, "step": 231680 }, { "epoch": 0.4, "learning_rate": 2.9798023835349843e-05, "loss": 2.3293, "step": 231690 }, { "epoch": 0.4, "learning_rate": 2.9797151895423014e-05, "loss": 2.4183, "step": 231700 }, { "epoch": 0.4, "learning_rate": 2.9796279955496188e-05, "loss": 2.2318, "step": 231710 }, { "epoch": 0.4, "learning_rate": 2.9795408015569358e-05, "loss": 2.3539, "step": 231720 }, { "epoch": 0.4, "learning_rate": 2.9794536075642532e-05, "loss": 2.405, "step": 231730 }, { "epoch": 0.4, "learning_rate": 2.979366413571571e-05, "loss": 2.3797, "step": 231740 }, { "epoch": 0.4, "learning_rate": 2.9792792195788883e-05, "loss": 2.4393, "step": 231750 }, { "epoch": 0.4, "learning_rate": 2.9791920255862056e-05, "loss": 2.5018, "step": 231760 }, { "epoch": 0.4, "learning_rate": 2.9791048315935227e-05, "loss": 2.4739, "step": 231770 }, { "epoch": 0.4, "learning_rate": 2.97901763760084e-05, "loss": 2.4121, "step": 231780 }, { "epoch": 0.4, "learning_rate": 2.978930443608157e-05, "loss": 2.4645, "step": 231790 }, { "epoch": 0.4, "learning_rate": 2.9788432496154745e-05, "loss": 2.3552, "step": 231800 }, { "epoch": 0.4, "learning_rate": 2.978756055622792e-05, "loss": 2.4189, "step": 231810 }, { "epoch": 0.4, "learning_rate": 2.9786688616301096e-05, "loss": 2.4269, "step": 231820 }, { "epoch": 0.4, "learning_rate": 2.9785816676374266e-05, "loss": 2.4539, "step": 231830 }, { "epoch": 0.4, "learning_rate": 2.978494473644744e-05, "loss": 2.3633, "step": 231840 }, { "epoch": 0.4, "learning_rate": 2.9784072796520614e-05, "loss": 2.4301, "step": 231850 }, { "epoch": 0.4, "learning_rate": 2.9783200856593784e-05, "loss": 2.2732, "step": 231860 }, { "epoch": 0.4, "learning_rate": 2.9782328916666958e-05, "loss": 2.3595, "step": 231870 }, { "epoch": 0.4, "learning_rate": 2.9781456976740128e-05, "loss": 2.2825, "step": 231880 }, { "epoch": 0.4, "learning_rate": 2.978058503681331e-05, "loss": 2.3809, "step": 231890 }, { "epoch": 0.4, "learning_rate": 2.977971309688648e-05, "loss": 2.39, "step": 231900 }, { "epoch": 0.4, "learning_rate": 2.9778841156959653e-05, "loss": 2.4304, "step": 231910 }, { "epoch": 0.4, "learning_rate": 2.9777969217032827e-05, "loss": 2.3699, "step": 231920 }, { "epoch": 0.4, "learning_rate": 2.9777097277105997e-05, "loss": 2.4104, "step": 231930 }, { "epoch": 0.4, "learning_rate": 2.977622533717917e-05, "loss": 2.4074, "step": 231940 }, { "epoch": 0.4, "learning_rate": 2.977535339725234e-05, "loss": 2.4415, "step": 231950 }, { "epoch": 0.4, "learning_rate": 2.9774481457325515e-05, "loss": 2.4815, "step": 231960 }, { "epoch": 0.4, "learning_rate": 2.9773609517398692e-05, "loss": 2.5069, "step": 231970 }, { "epoch": 0.4, "learning_rate": 2.9772737577471866e-05, "loss": 2.3322, "step": 231980 }, { "epoch": 0.4, "learning_rate": 2.9771865637545036e-05, "loss": 2.3969, "step": 231990 }, { "epoch": 0.4, "learning_rate": 2.977099369761821e-05, "loss": 2.4008, "step": 232000 }, { "epoch": 0.4, "learning_rate": 2.9770121757691384e-05, "loss": 2.3191, "step": 232010 }, { "epoch": 0.4, "learning_rate": 2.9769249817764554e-05, "loss": 2.4005, "step": 232020 }, { "epoch": 0.4, "learning_rate": 2.9768377877837728e-05, "loss": 2.3146, "step": 232030 }, { "epoch": 0.4, "learning_rate": 2.9767505937910905e-05, "loss": 2.3899, "step": 232040 }, { "epoch": 0.4, "learning_rate": 2.976663399798408e-05, "loss": 2.4567, "step": 232050 }, { "epoch": 0.4, "learning_rate": 2.976576205805725e-05, "loss": 2.4565, "step": 232060 }, { "epoch": 0.4, "learning_rate": 2.9764890118130423e-05, "loss": 2.3935, "step": 232070 }, { "epoch": 0.4, "learning_rate": 2.9764018178203597e-05, "loss": 2.4386, "step": 232080 }, { "epoch": 0.4, "learning_rate": 2.9763146238276767e-05, "loss": 2.3994, "step": 232090 }, { "epoch": 0.4, "learning_rate": 2.976227429834994e-05, "loss": 2.3637, "step": 232100 }, { "epoch": 0.4, "learning_rate": 2.976140235842311e-05, "loss": 2.4205, "step": 232110 }, { "epoch": 0.4, "learning_rate": 2.9760530418496292e-05, "loss": 2.4104, "step": 232120 }, { "epoch": 0.4, "learning_rate": 2.9759658478569462e-05, "loss": 2.3465, "step": 232130 }, { "epoch": 0.4, "learning_rate": 2.9758786538642636e-05, "loss": 2.4043, "step": 232140 }, { "epoch": 0.4, "learning_rate": 2.975791459871581e-05, "loss": 2.3848, "step": 232150 }, { "epoch": 0.4, "learning_rate": 2.975704265878898e-05, "loss": 2.3846, "step": 232160 }, { "epoch": 0.4, "learning_rate": 2.9756170718862154e-05, "loss": 2.4007, "step": 232170 }, { "epoch": 0.4, "learning_rate": 2.9755298778935324e-05, "loss": 2.2471, "step": 232180 }, { "epoch": 0.4, "learning_rate": 2.9754426839008505e-05, "loss": 2.3616, "step": 232190 }, { "epoch": 0.4, "learning_rate": 2.9753554899081675e-05, "loss": 2.3497, "step": 232200 }, { "epoch": 0.4, "learning_rate": 2.975268295915485e-05, "loss": 2.3027, "step": 232210 }, { "epoch": 0.4, "learning_rate": 2.975181101922802e-05, "loss": 2.3087, "step": 232220 }, { "epoch": 0.4, "learning_rate": 2.9750939079301193e-05, "loss": 2.4973, "step": 232230 }, { "epoch": 0.4, "learning_rate": 2.9750067139374367e-05, "loss": 2.3185, "step": 232240 }, { "epoch": 0.41, "learning_rate": 2.9749195199447537e-05, "loss": 2.3104, "step": 232250 }, { "epoch": 0.41, "learning_rate": 2.9748323259520718e-05, "loss": 2.3617, "step": 232260 }, { "epoch": 0.41, "learning_rate": 2.9747451319593888e-05, "loss": 2.3295, "step": 232270 }, { "epoch": 0.41, "learning_rate": 2.9746579379667062e-05, "loss": 2.3568, "step": 232280 }, { "epoch": 0.41, "learning_rate": 2.9745707439740232e-05, "loss": 2.4768, "step": 232290 }, { "epoch": 0.41, "learning_rate": 2.9744835499813406e-05, "loss": 2.4529, "step": 232300 }, { "epoch": 0.41, "learning_rate": 2.974396355988658e-05, "loss": 2.4966, "step": 232310 }, { "epoch": 0.41, "learning_rate": 2.974309161995975e-05, "loss": 2.3394, "step": 232320 }, { "epoch": 0.41, "learning_rate": 2.9742219680032924e-05, "loss": 2.3647, "step": 232330 }, { "epoch": 0.41, "learning_rate": 2.97413477401061e-05, "loss": 2.3572, "step": 232340 }, { "epoch": 0.41, "learning_rate": 2.9740475800179275e-05, "loss": 2.3668, "step": 232350 }, { "epoch": 0.41, "learning_rate": 2.9739603860252445e-05, "loss": 2.5187, "step": 232360 }, { "epoch": 0.41, "learning_rate": 2.973873192032562e-05, "loss": 2.4372, "step": 232370 }, { "epoch": 0.41, "learning_rate": 2.9737859980398793e-05, "loss": 2.3871, "step": 232380 }, { "epoch": 0.41, "learning_rate": 2.9736988040471963e-05, "loss": 2.3562, "step": 232390 }, { "epoch": 0.41, "learning_rate": 2.9736116100545137e-05, "loss": 2.3976, "step": 232400 }, { "epoch": 0.41, "learning_rate": 2.9735244160618314e-05, "loss": 2.4743, "step": 232410 }, { "epoch": 0.41, "learning_rate": 2.9734372220691488e-05, "loss": 2.4963, "step": 232420 }, { "epoch": 0.41, "learning_rate": 2.973350028076466e-05, "loss": 2.404, "step": 232430 }, { "epoch": 0.41, "learning_rate": 2.9732628340837832e-05, "loss": 2.5043, "step": 232440 }, { "epoch": 0.41, "learning_rate": 2.9731756400911002e-05, "loss": 2.3465, "step": 232450 }, { "epoch": 0.41, "learning_rate": 2.9730884460984176e-05, "loss": 2.4492, "step": 232460 }, { "epoch": 0.41, "learning_rate": 2.973001252105735e-05, "loss": 2.4737, "step": 232470 }, { "epoch": 0.41, "learning_rate": 2.972914058113052e-05, "loss": 2.4531, "step": 232480 }, { "epoch": 0.41, "learning_rate": 2.97282686412037e-05, "loss": 2.4255, "step": 232490 }, { "epoch": 0.41, "learning_rate": 2.972739670127687e-05, "loss": 2.4134, "step": 232500 }, { "epoch": 0.41, "learning_rate": 2.9726524761350045e-05, "loss": 2.4101, "step": 232510 }, { "epoch": 0.41, "learning_rate": 2.9725652821423215e-05, "loss": 2.4663, "step": 232520 }, { "epoch": 0.41, "learning_rate": 2.972478088149639e-05, "loss": 2.3292, "step": 232530 }, { "epoch": 0.41, "learning_rate": 2.9723908941569563e-05, "loss": 2.2617, "step": 232540 }, { "epoch": 0.41, "learning_rate": 2.9723037001642733e-05, "loss": 2.3854, "step": 232550 }, { "epoch": 0.41, "learning_rate": 2.972216506171591e-05, "loss": 2.3261, "step": 232560 }, { "epoch": 0.41, "learning_rate": 2.9721293121789084e-05, "loss": 2.3862, "step": 232570 }, { "epoch": 0.41, "learning_rate": 2.9720421181862258e-05, "loss": 2.4385, "step": 232580 }, { "epoch": 0.41, "learning_rate": 2.971954924193543e-05, "loss": 2.318, "step": 232590 }, { "epoch": 0.41, "learning_rate": 2.9718677302008602e-05, "loss": 2.3195, "step": 232600 }, { "epoch": 0.41, "learning_rate": 2.9717805362081773e-05, "loss": 2.3718, "step": 232610 }, { "epoch": 0.41, "learning_rate": 2.9716933422154946e-05, "loss": 2.3789, "step": 232620 }, { "epoch": 0.41, "learning_rate": 2.971606148222812e-05, "loss": 2.4465, "step": 232630 }, { "epoch": 0.41, "learning_rate": 2.9715189542301297e-05, "loss": 2.5131, "step": 232640 }, { "epoch": 0.41, "learning_rate": 2.971431760237447e-05, "loss": 2.4977, "step": 232650 }, { "epoch": 0.41, "learning_rate": 2.971344566244764e-05, "loss": 2.4002, "step": 232660 }, { "epoch": 0.41, "learning_rate": 2.9712573722520815e-05, "loss": 2.4592, "step": 232670 }, { "epoch": 0.41, "learning_rate": 2.9711701782593986e-05, "loss": 2.4945, "step": 232680 }, { "epoch": 0.41, "learning_rate": 2.971082984266716e-05, "loss": 2.3709, "step": 232690 }, { "epoch": 0.41, "learning_rate": 2.9709957902740333e-05, "loss": 2.4394, "step": 232700 }, { "epoch": 0.41, "learning_rate": 2.970908596281351e-05, "loss": 2.4716, "step": 232710 }, { "epoch": 0.41, "learning_rate": 2.970821402288668e-05, "loss": 2.4003, "step": 232720 }, { "epoch": 0.41, "learning_rate": 2.9707342082959854e-05, "loss": 2.4783, "step": 232730 }, { "epoch": 0.41, "learning_rate": 2.9706470143033028e-05, "loss": 2.34, "step": 232740 }, { "epoch": 0.41, "learning_rate": 2.97055982031062e-05, "loss": 2.3739, "step": 232750 }, { "epoch": 0.41, "learning_rate": 2.9704726263179372e-05, "loss": 2.4218, "step": 232760 }, { "epoch": 0.41, "learning_rate": 2.9703854323252546e-05, "loss": 2.4219, "step": 232770 }, { "epoch": 0.41, "learning_rate": 2.9702982383325723e-05, "loss": 2.5032, "step": 232780 }, { "epoch": 0.41, "learning_rate": 2.9702110443398894e-05, "loss": 2.225, "step": 232790 }, { "epoch": 0.41, "learning_rate": 2.9701238503472067e-05, "loss": 2.3975, "step": 232800 }, { "epoch": 0.41, "learning_rate": 2.970036656354524e-05, "loss": 2.4107, "step": 232810 }, { "epoch": 0.41, "learning_rate": 2.969949462361841e-05, "loss": 2.4141, "step": 232820 }, { "epoch": 0.41, "learning_rate": 2.9698622683691585e-05, "loss": 2.4452, "step": 232830 }, { "epoch": 0.41, "learning_rate": 2.9697750743764756e-05, "loss": 2.5351, "step": 232840 }, { "epoch": 0.41, "learning_rate": 2.969687880383793e-05, "loss": 2.2805, "step": 232850 }, { "epoch": 0.41, "learning_rate": 2.9696006863911107e-05, "loss": 2.4724, "step": 232860 }, { "epoch": 0.41, "learning_rate": 2.969513492398428e-05, "loss": 2.4018, "step": 232870 }, { "epoch": 0.41, "learning_rate": 2.9694262984057454e-05, "loss": 2.3756, "step": 232880 }, { "epoch": 0.41, "learning_rate": 2.9693391044130625e-05, "loss": 2.3385, "step": 232890 }, { "epoch": 0.41, "learning_rate": 2.96925191042038e-05, "loss": 2.3627, "step": 232900 }, { "epoch": 0.41, "learning_rate": 2.969164716427697e-05, "loss": 2.3977, "step": 232910 }, { "epoch": 0.41, "learning_rate": 2.9690775224350143e-05, "loss": 2.244, "step": 232920 }, { "epoch": 0.41, "learning_rate": 2.968990328442332e-05, "loss": 2.3146, "step": 232930 }, { "epoch": 0.41, "learning_rate": 2.9689031344496493e-05, "loss": 2.4781, "step": 232940 }, { "epoch": 0.41, "learning_rate": 2.9688159404569664e-05, "loss": 2.4355, "step": 232950 }, { "epoch": 0.41, "learning_rate": 2.9687287464642838e-05, "loss": 2.5337, "step": 232960 }, { "epoch": 0.41, "learning_rate": 2.968641552471601e-05, "loss": 2.4296, "step": 232970 }, { "epoch": 0.41, "learning_rate": 2.9685543584789182e-05, "loss": 2.3877, "step": 232980 }, { "epoch": 0.41, "learning_rate": 2.9684671644862356e-05, "loss": 2.3443, "step": 232990 }, { "epoch": 0.41, "learning_rate": 2.968379970493553e-05, "loss": 2.3289, "step": 233000 }, { "epoch": 0.41, "learning_rate": 2.9682927765008706e-05, "loss": 2.4002, "step": 233010 }, { "epoch": 0.41, "learning_rate": 2.9682055825081877e-05, "loss": 2.4719, "step": 233020 }, { "epoch": 0.41, "learning_rate": 2.968118388515505e-05, "loss": 2.3914, "step": 233030 }, { "epoch": 0.41, "learning_rate": 2.9680311945228224e-05, "loss": 2.5329, "step": 233040 }, { "epoch": 0.41, "learning_rate": 2.9679440005301395e-05, "loss": 2.4657, "step": 233050 }, { "epoch": 0.41, "learning_rate": 2.967856806537457e-05, "loss": 2.418, "step": 233060 }, { "epoch": 0.41, "learning_rate": 2.967769612544774e-05, "loss": 2.2901, "step": 233070 }, { "epoch": 0.41, "learning_rate": 2.967682418552092e-05, "loss": 2.3669, "step": 233080 }, { "epoch": 0.41, "learning_rate": 2.967595224559409e-05, "loss": 2.3624, "step": 233090 }, { "epoch": 0.41, "learning_rate": 2.9675080305667264e-05, "loss": 2.3629, "step": 233100 }, { "epoch": 0.41, "learning_rate": 2.9674208365740437e-05, "loss": 2.4021, "step": 233110 }, { "epoch": 0.41, "learning_rate": 2.9673336425813608e-05, "loss": 2.2978, "step": 233120 }, { "epoch": 0.41, "learning_rate": 2.967246448588678e-05, "loss": 2.453, "step": 233130 }, { "epoch": 0.41, "learning_rate": 2.9671592545959952e-05, "loss": 2.4268, "step": 233140 }, { "epoch": 0.41, "learning_rate": 2.9670720606033126e-05, "loss": 2.4048, "step": 233150 }, { "epoch": 0.41, "learning_rate": 2.9669848666106303e-05, "loss": 2.4796, "step": 233160 }, { "epoch": 0.41, "learning_rate": 2.9668976726179477e-05, "loss": 2.3157, "step": 233170 }, { "epoch": 0.41, "learning_rate": 2.9668104786252647e-05, "loss": 2.2492, "step": 233180 }, { "epoch": 0.41, "learning_rate": 2.966723284632582e-05, "loss": 2.4996, "step": 233190 }, { "epoch": 0.41, "learning_rate": 2.9666360906398995e-05, "loss": 2.3948, "step": 233200 }, { "epoch": 0.41, "learning_rate": 2.9665488966472165e-05, "loss": 2.4068, "step": 233210 }, { "epoch": 0.41, "learning_rate": 2.966461702654534e-05, "loss": 2.4175, "step": 233220 }, { "epoch": 0.41, "learning_rate": 2.9663745086618516e-05, "loss": 2.4709, "step": 233230 }, { "epoch": 0.41, "learning_rate": 2.966287314669169e-05, "loss": 2.3847, "step": 233240 }, { "epoch": 0.41, "learning_rate": 2.966200120676486e-05, "loss": 2.333, "step": 233250 }, { "epoch": 0.41, "learning_rate": 2.9661129266838034e-05, "loss": 2.4185, "step": 233260 }, { "epoch": 0.41, "learning_rate": 2.9660257326911208e-05, "loss": 2.4615, "step": 233270 }, { "epoch": 0.41, "learning_rate": 2.9659385386984378e-05, "loss": 2.347, "step": 233280 }, { "epoch": 0.41, "learning_rate": 2.9658513447057552e-05, "loss": 2.3577, "step": 233290 }, { "epoch": 0.41, "learning_rate": 2.9657641507130722e-05, "loss": 2.4092, "step": 233300 }, { "epoch": 0.41, "learning_rate": 2.9656769567203903e-05, "loss": 2.4222, "step": 233310 }, { "epoch": 0.41, "learning_rate": 2.9655897627277073e-05, "loss": 2.4685, "step": 233320 }, { "epoch": 0.41, "learning_rate": 2.9655025687350247e-05, "loss": 2.3828, "step": 233330 }, { "epoch": 0.41, "learning_rate": 2.9654153747423417e-05, "loss": 2.388, "step": 233340 }, { "epoch": 0.41, "learning_rate": 2.965328180749659e-05, "loss": 2.4207, "step": 233350 }, { "epoch": 0.41, "learning_rate": 2.9652409867569765e-05, "loss": 2.4461, "step": 233360 }, { "epoch": 0.41, "learning_rate": 2.9651537927642935e-05, "loss": 2.4066, "step": 233370 }, { "epoch": 0.41, "learning_rate": 2.9650665987716116e-05, "loss": 2.4639, "step": 233380 }, { "epoch": 0.41, "learning_rate": 2.9649794047789286e-05, "loss": 2.3624, "step": 233390 }, { "epoch": 0.41, "learning_rate": 2.964892210786246e-05, "loss": 2.4013, "step": 233400 }, { "epoch": 0.41, "learning_rate": 2.964805016793563e-05, "loss": 2.3587, "step": 233410 }, { "epoch": 0.41, "learning_rate": 2.9647178228008804e-05, "loss": 2.3012, "step": 233420 }, { "epoch": 0.41, "learning_rate": 2.9646306288081978e-05, "loss": 2.3997, "step": 233430 }, { "epoch": 0.41, "learning_rate": 2.9645434348155148e-05, "loss": 2.2657, "step": 233440 }, { "epoch": 0.41, "learning_rate": 2.9644562408228325e-05, "loss": 2.4237, "step": 233450 }, { "epoch": 0.41, "learning_rate": 2.96436904683015e-05, "loss": 2.4603, "step": 233460 }, { "epoch": 0.41, "learning_rate": 2.9642818528374673e-05, "loss": 2.3181, "step": 233470 }, { "epoch": 0.41, "learning_rate": 2.9641946588447843e-05, "loss": 2.3892, "step": 233480 }, { "epoch": 0.41, "learning_rate": 2.9641074648521017e-05, "loss": 2.3856, "step": 233490 }, { "epoch": 0.41, "learning_rate": 2.964020270859419e-05, "loss": 2.462, "step": 233500 }, { "epoch": 0.41, "learning_rate": 2.963933076866736e-05, "loss": 2.4495, "step": 233510 }, { "epoch": 0.41, "learning_rate": 2.9638458828740535e-05, "loss": 2.437, "step": 233520 }, { "epoch": 0.41, "learning_rate": 2.9637586888813712e-05, "loss": 2.3672, "step": 233530 }, { "epoch": 0.41, "learning_rate": 2.9636714948886886e-05, "loss": 2.4906, "step": 233540 }, { "epoch": 0.41, "learning_rate": 2.9635843008960056e-05, "loss": 2.318, "step": 233550 }, { "epoch": 0.41, "learning_rate": 2.963497106903323e-05, "loss": 2.451, "step": 233560 }, { "epoch": 0.41, "learning_rate": 2.96340991291064e-05, "loss": 2.336, "step": 233570 }, { "epoch": 0.41, "learning_rate": 2.9633227189179574e-05, "loss": 2.4885, "step": 233580 }, { "epoch": 0.41, "learning_rate": 2.9632355249252748e-05, "loss": 2.3822, "step": 233590 }, { "epoch": 0.41, "learning_rate": 2.9631483309325925e-05, "loss": 2.3679, "step": 233600 }, { "epoch": 0.41, "learning_rate": 2.96306113693991e-05, "loss": 2.2957, "step": 233610 }, { "epoch": 0.41, "learning_rate": 2.962973942947227e-05, "loss": 2.3134, "step": 233620 }, { "epoch": 0.41, "learning_rate": 2.9628867489545443e-05, "loss": 2.4471, "step": 233630 }, { "epoch": 0.41, "learning_rate": 2.9627995549618613e-05, "loss": 2.4624, "step": 233640 }, { "epoch": 0.41, "learning_rate": 2.9627123609691787e-05, "loss": 2.4666, "step": 233650 }, { "epoch": 0.41, "learning_rate": 2.962625166976496e-05, "loss": 2.3422, "step": 233660 }, { "epoch": 0.41, "learning_rate": 2.962537972983813e-05, "loss": 2.4098, "step": 233670 }, { "epoch": 0.41, "learning_rate": 2.962450778991131e-05, "loss": 2.399, "step": 233680 }, { "epoch": 0.41, "learning_rate": 2.9623635849984482e-05, "loss": 2.378, "step": 233690 }, { "epoch": 0.41, "learning_rate": 2.9622763910057656e-05, "loss": 2.3559, "step": 233700 }, { "epoch": 0.41, "learning_rate": 2.9621891970130826e-05, "loss": 2.421, "step": 233710 }, { "epoch": 0.41, "learning_rate": 2.9621020030204e-05, "loss": 2.473, "step": 233720 }, { "epoch": 0.41, "learning_rate": 2.9620148090277174e-05, "loss": 2.4666, "step": 233730 }, { "epoch": 0.41, "learning_rate": 2.9619276150350344e-05, "loss": 2.3793, "step": 233740 }, { "epoch": 0.41, "learning_rate": 2.961840421042352e-05, "loss": 2.2496, "step": 233750 }, { "epoch": 0.41, "learning_rate": 2.9617532270496695e-05, "loss": 2.3586, "step": 233760 }, { "epoch": 0.41, "learning_rate": 2.961666033056987e-05, "loss": 2.3318, "step": 233770 }, { "epoch": 0.41, "learning_rate": 2.961578839064304e-05, "loss": 2.3702, "step": 233780 }, { "epoch": 0.41, "learning_rate": 2.9614916450716213e-05, "loss": 2.3867, "step": 233790 }, { "epoch": 0.41, "learning_rate": 2.9614044510789383e-05, "loss": 2.4584, "step": 233800 }, { "epoch": 0.41, "learning_rate": 2.9613172570862557e-05, "loss": 2.5695, "step": 233810 }, { "epoch": 0.41, "learning_rate": 2.961230063093573e-05, "loss": 2.3707, "step": 233820 }, { "epoch": 0.41, "learning_rate": 2.9611428691008908e-05, "loss": 2.372, "step": 233830 }, { "epoch": 0.41, "learning_rate": 2.9610556751082082e-05, "loss": 2.3405, "step": 233840 }, { "epoch": 0.41, "learning_rate": 2.9609684811155252e-05, "loss": 2.429, "step": 233850 }, { "epoch": 0.41, "learning_rate": 2.9608812871228426e-05, "loss": 2.5022, "step": 233860 }, { "epoch": 0.41, "learning_rate": 2.9607940931301596e-05, "loss": 2.3545, "step": 233870 }, { "epoch": 0.41, "learning_rate": 2.960706899137477e-05, "loss": 2.3677, "step": 233880 }, { "epoch": 0.41, "learning_rate": 2.9606197051447944e-05, "loss": 2.3394, "step": 233890 }, { "epoch": 0.41, "learning_rate": 2.960532511152112e-05, "loss": 2.3345, "step": 233900 }, { "epoch": 0.41, "learning_rate": 2.960445317159429e-05, "loss": 2.2831, "step": 233910 }, { "epoch": 0.41, "learning_rate": 2.9603581231667465e-05, "loss": 2.2499, "step": 233920 }, { "epoch": 0.41, "learning_rate": 2.960270929174064e-05, "loss": 2.2572, "step": 233930 }, { "epoch": 0.41, "learning_rate": 2.960183735181381e-05, "loss": 2.3456, "step": 233940 }, { "epoch": 0.41, "learning_rate": 2.9600965411886983e-05, "loss": 2.3693, "step": 233950 }, { "epoch": 0.41, "learning_rate": 2.9600093471960154e-05, "loss": 2.4423, "step": 233960 }, { "epoch": 0.41, "learning_rate": 2.9599221532033327e-05, "loss": 2.3689, "step": 233970 }, { "epoch": 0.41, "learning_rate": 2.9598349592106505e-05, "loss": 2.4394, "step": 233980 }, { "epoch": 0.41, "learning_rate": 2.959747765217968e-05, "loss": 2.4189, "step": 233990 }, { "epoch": 0.41, "learning_rate": 2.9596605712252852e-05, "loss": 2.2991, "step": 234000 }, { "epoch": 0.41, "learning_rate": 2.9595733772326022e-05, "loss": 2.355, "step": 234010 }, { "epoch": 0.41, "learning_rate": 2.9594861832399196e-05, "loss": 2.3971, "step": 234020 }, { "epoch": 0.41, "learning_rate": 2.9593989892472367e-05, "loss": 2.3868, "step": 234030 }, { "epoch": 0.41, "learning_rate": 2.959311795254554e-05, "loss": 2.4157, "step": 234040 }, { "epoch": 0.41, "learning_rate": 2.9592246012618718e-05, "loss": 2.3994, "step": 234050 }, { "epoch": 0.41, "learning_rate": 2.959137407269189e-05, "loss": 2.4444, "step": 234060 }, { "epoch": 0.41, "learning_rate": 2.9590502132765062e-05, "loss": 2.3647, "step": 234070 }, { "epoch": 0.41, "learning_rate": 2.9589630192838235e-05, "loss": 2.4066, "step": 234080 }, { "epoch": 0.41, "learning_rate": 2.958875825291141e-05, "loss": 2.3599, "step": 234090 }, { "epoch": 0.41, "learning_rate": 2.958788631298458e-05, "loss": 2.4739, "step": 234100 }, { "epoch": 0.41, "learning_rate": 2.9587014373057753e-05, "loss": 2.5006, "step": 234110 }, { "epoch": 0.41, "learning_rate": 2.958614243313093e-05, "loss": 2.3361, "step": 234120 }, { "epoch": 0.41, "learning_rate": 2.9585270493204104e-05, "loss": 2.408, "step": 234130 }, { "epoch": 0.41, "learning_rate": 2.9584398553277275e-05, "loss": 2.2921, "step": 234140 }, { "epoch": 0.41, "learning_rate": 2.958352661335045e-05, "loss": 2.3878, "step": 234150 }, { "epoch": 0.41, "learning_rate": 2.9582654673423622e-05, "loss": 2.4109, "step": 234160 }, { "epoch": 0.41, "learning_rate": 2.9581782733496793e-05, "loss": 2.3528, "step": 234170 }, { "epoch": 0.41, "learning_rate": 2.9580910793569966e-05, "loss": 2.3969, "step": 234180 }, { "epoch": 0.41, "learning_rate": 2.9580038853643137e-05, "loss": 2.4039, "step": 234190 }, { "epoch": 0.41, "learning_rate": 2.9579166913716317e-05, "loss": 2.4285, "step": 234200 }, { "epoch": 0.41, "learning_rate": 2.9578294973789488e-05, "loss": 2.2862, "step": 234210 }, { "epoch": 0.41, "learning_rate": 2.957742303386266e-05, "loss": 2.3507, "step": 234220 }, { "epoch": 0.41, "learning_rate": 2.9576551093935835e-05, "loss": 2.4598, "step": 234230 }, { "epoch": 0.41, "learning_rate": 2.9575679154009006e-05, "loss": 2.3721, "step": 234240 }, { "epoch": 0.41, "learning_rate": 2.957480721408218e-05, "loss": 2.3358, "step": 234250 }, { "epoch": 0.41, "learning_rate": 2.957393527415535e-05, "loss": 2.3672, "step": 234260 }, { "epoch": 0.41, "learning_rate": 2.957306333422853e-05, "loss": 2.4097, "step": 234270 }, { "epoch": 0.41, "learning_rate": 2.95721913943017e-05, "loss": 2.452, "step": 234280 }, { "epoch": 0.41, "learning_rate": 2.9571319454374874e-05, "loss": 2.3986, "step": 234290 }, { "epoch": 0.41, "learning_rate": 2.9570447514448045e-05, "loss": 2.3206, "step": 234300 }, { "epoch": 0.41, "learning_rate": 2.956957557452122e-05, "loss": 2.3782, "step": 234310 }, { "epoch": 0.41, "learning_rate": 2.9568703634594392e-05, "loss": 2.3263, "step": 234320 }, { "epoch": 0.41, "learning_rate": 2.9567831694667563e-05, "loss": 2.3769, "step": 234330 }, { "epoch": 0.41, "learning_rate": 2.9566959754740737e-05, "loss": 2.2547, "step": 234340 }, { "epoch": 0.41, "learning_rate": 2.9566087814813914e-05, "loss": 2.4158, "step": 234350 }, { "epoch": 0.41, "learning_rate": 2.9565215874887087e-05, "loss": 2.4831, "step": 234360 }, { "epoch": 0.41, "learning_rate": 2.9564343934960258e-05, "loss": 2.4046, "step": 234370 }, { "epoch": 0.41, "learning_rate": 2.956347199503343e-05, "loss": 2.476, "step": 234380 }, { "epoch": 0.41, "learning_rate": 2.9562600055106605e-05, "loss": 2.4372, "step": 234390 }, { "epoch": 0.41, "learning_rate": 2.9561728115179776e-05, "loss": 2.4252, "step": 234400 }, { "epoch": 0.41, "learning_rate": 2.956085617525295e-05, "loss": 2.3569, "step": 234410 }, { "epoch": 0.41, "learning_rate": 2.9559984235326127e-05, "loss": 2.3998, "step": 234420 }, { "epoch": 0.41, "learning_rate": 2.95591122953993e-05, "loss": 2.3969, "step": 234430 }, { "epoch": 0.41, "learning_rate": 2.955824035547247e-05, "loss": 2.4176, "step": 234440 }, { "epoch": 0.41, "learning_rate": 2.9557368415545645e-05, "loss": 2.3537, "step": 234450 }, { "epoch": 0.41, "learning_rate": 2.955649647561882e-05, "loss": 2.401, "step": 234460 }, { "epoch": 0.41, "learning_rate": 2.955562453569199e-05, "loss": 2.4148, "step": 234470 }, { "epoch": 0.41, "learning_rate": 2.9554752595765163e-05, "loss": 2.3824, "step": 234480 }, { "epoch": 0.41, "learning_rate": 2.9553880655838333e-05, "loss": 2.4048, "step": 234490 }, { "epoch": 0.41, "learning_rate": 2.9553008715911513e-05, "loss": 2.4588, "step": 234500 }, { "epoch": 0.41, "learning_rate": 2.9552136775984684e-05, "loss": 2.4158, "step": 234510 }, { "epoch": 0.41, "learning_rate": 2.9551264836057858e-05, "loss": 2.3219, "step": 234520 }, { "epoch": 0.41, "learning_rate": 2.9550392896131028e-05, "loss": 2.52, "step": 234530 }, { "epoch": 0.41, "learning_rate": 2.9549520956204202e-05, "loss": 2.4422, "step": 234540 }, { "epoch": 0.41, "learning_rate": 2.9548649016277376e-05, "loss": 2.3634, "step": 234550 }, { "epoch": 0.41, "learning_rate": 2.9547777076350546e-05, "loss": 2.4873, "step": 234560 }, { "epoch": 0.41, "learning_rate": 2.9546905136423726e-05, "loss": 2.4685, "step": 234570 }, { "epoch": 0.41, "learning_rate": 2.9546033196496897e-05, "loss": 2.4227, "step": 234580 }, { "epoch": 0.41, "learning_rate": 2.954516125657007e-05, "loss": 2.3557, "step": 234590 }, { "epoch": 0.41, "learning_rate": 2.954428931664324e-05, "loss": 2.3568, "step": 234600 }, { "epoch": 0.41, "learning_rate": 2.9543417376716415e-05, "loss": 2.3512, "step": 234610 }, { "epoch": 0.41, "learning_rate": 2.954254543678959e-05, "loss": 2.3824, "step": 234620 }, { "epoch": 0.41, "learning_rate": 2.954167349686276e-05, "loss": 2.3547, "step": 234630 }, { "epoch": 0.41, "learning_rate": 2.9540801556935933e-05, "loss": 2.483, "step": 234640 }, { "epoch": 0.41, "learning_rate": 2.953992961700911e-05, "loss": 2.4763, "step": 234650 }, { "epoch": 0.41, "learning_rate": 2.9539057677082284e-05, "loss": 2.3554, "step": 234660 }, { "epoch": 0.41, "learning_rate": 2.9538185737155454e-05, "loss": 2.4865, "step": 234670 }, { "epoch": 0.41, "learning_rate": 2.9537313797228628e-05, "loss": 2.3278, "step": 234680 }, { "epoch": 0.41, "learning_rate": 2.9536441857301798e-05, "loss": 2.3791, "step": 234690 }, { "epoch": 0.41, "learning_rate": 2.9535569917374972e-05, "loss": 2.2929, "step": 234700 }, { "epoch": 0.41, "learning_rate": 2.9534697977448146e-05, "loss": 2.441, "step": 234710 }, { "epoch": 0.41, "learning_rate": 2.9533826037521323e-05, "loss": 2.4053, "step": 234720 }, { "epoch": 0.41, "learning_rate": 2.9532954097594497e-05, "loss": 2.3983, "step": 234730 }, { "epoch": 0.41, "learning_rate": 2.9532082157667667e-05, "loss": 2.5164, "step": 234740 }, { "epoch": 0.41, "learning_rate": 2.953121021774084e-05, "loss": 2.3957, "step": 234750 }, { "epoch": 0.41, "learning_rate": 2.953033827781401e-05, "loss": 2.2731, "step": 234760 }, { "epoch": 0.41, "learning_rate": 2.9529466337887185e-05, "loss": 2.4944, "step": 234770 }, { "epoch": 0.41, "learning_rate": 2.952859439796036e-05, "loss": 2.2288, "step": 234780 }, { "epoch": 0.41, "learning_rate": 2.9527722458033536e-05, "loss": 2.3233, "step": 234790 }, { "epoch": 0.41, "learning_rate": 2.9526850518106706e-05, "loss": 2.3926, "step": 234800 }, { "epoch": 0.41, "learning_rate": 2.952597857817988e-05, "loss": 2.255, "step": 234810 }, { "epoch": 0.41, "learning_rate": 2.9525106638253054e-05, "loss": 2.423, "step": 234820 }, { "epoch": 0.41, "learning_rate": 2.9524234698326224e-05, "loss": 2.4449, "step": 234830 }, { "epoch": 0.41, "learning_rate": 2.9523362758399398e-05, "loss": 2.32, "step": 234840 }, { "epoch": 0.41, "learning_rate": 2.9522490818472572e-05, "loss": 2.3395, "step": 234850 }, { "epoch": 0.41, "learning_rate": 2.9521618878545742e-05, "loss": 2.4355, "step": 234860 }, { "epoch": 0.41, "learning_rate": 2.952074693861892e-05, "loss": 2.3701, "step": 234870 }, { "epoch": 0.41, "learning_rate": 2.9519874998692093e-05, "loss": 2.2632, "step": 234880 }, { "epoch": 0.41, "learning_rate": 2.9519003058765267e-05, "loss": 2.4041, "step": 234890 }, { "epoch": 0.41, "learning_rate": 2.9518131118838437e-05, "loss": 2.3449, "step": 234900 }, { "epoch": 0.41, "learning_rate": 2.951725917891161e-05, "loss": 2.4732, "step": 234910 }, { "epoch": 0.41, "learning_rate": 2.951638723898478e-05, "loss": 2.3266, "step": 234920 }, { "epoch": 0.41, "learning_rate": 2.9515515299057955e-05, "loss": 2.421, "step": 234930 }, { "epoch": 0.41, "learning_rate": 2.9514643359131132e-05, "loss": 2.2991, "step": 234940 }, { "epoch": 0.41, "learning_rate": 2.9513771419204306e-05, "loss": 2.3633, "step": 234950 }, { "epoch": 0.41, "learning_rate": 2.951289947927748e-05, "loss": 2.4084, "step": 234960 }, { "epoch": 0.41, "learning_rate": 2.951202753935065e-05, "loss": 2.325, "step": 234970 }, { "epoch": 0.41, "learning_rate": 2.9511155599423824e-05, "loss": 2.4805, "step": 234980 }, { "epoch": 0.41, "learning_rate": 2.9510283659496994e-05, "loss": 2.33, "step": 234990 }, { "epoch": 0.41, "learning_rate": 2.9509411719570168e-05, "loss": 2.4136, "step": 235000 }, { "epoch": 0.41, "learning_rate": 2.9508539779643342e-05, "loss": 2.4063, "step": 235010 }, { "epoch": 0.41, "learning_rate": 2.950766783971652e-05, "loss": 2.3702, "step": 235020 }, { "epoch": 0.41, "learning_rate": 2.950679589978969e-05, "loss": 2.4129, "step": 235030 }, { "epoch": 0.41, "learning_rate": 2.9505923959862863e-05, "loss": 2.3539, "step": 235040 }, { "epoch": 0.41, "learning_rate": 2.9505052019936037e-05, "loss": 2.4322, "step": 235050 }, { "epoch": 0.41, "learning_rate": 2.9504180080009207e-05, "loss": 2.3004, "step": 235060 }, { "epoch": 0.41, "learning_rate": 2.950330814008238e-05, "loss": 2.2658, "step": 235070 }, { "epoch": 0.41, "learning_rate": 2.9502436200155555e-05, "loss": 2.3656, "step": 235080 }, { "epoch": 0.41, "learning_rate": 2.9501564260228732e-05, "loss": 2.3173, "step": 235090 }, { "epoch": 0.41, "learning_rate": 2.9500692320301902e-05, "loss": 2.3968, "step": 235100 }, { "epoch": 0.41, "learning_rate": 2.9499820380375076e-05, "loss": 2.3676, "step": 235110 }, { "epoch": 0.41, "learning_rate": 2.949894844044825e-05, "loss": 2.3349, "step": 235120 }, { "epoch": 0.41, "learning_rate": 2.949807650052142e-05, "loss": 2.42, "step": 235130 }, { "epoch": 0.41, "learning_rate": 2.9497204560594594e-05, "loss": 2.4713, "step": 235140 }, { "epoch": 0.41, "learning_rate": 2.9496332620667764e-05, "loss": 2.4617, "step": 235150 }, { "epoch": 0.41, "learning_rate": 2.9495460680740938e-05, "loss": 2.3466, "step": 235160 }, { "epoch": 0.41, "learning_rate": 2.9494588740814115e-05, "loss": 2.3872, "step": 235170 }, { "epoch": 0.41, "learning_rate": 2.949371680088729e-05, "loss": 2.6229, "step": 235180 }, { "epoch": 0.41, "learning_rate": 2.9492844860960463e-05, "loss": 2.5272, "step": 235190 }, { "epoch": 0.41, "learning_rate": 2.9491972921033633e-05, "loss": 2.4356, "step": 235200 }, { "epoch": 0.41, "learning_rate": 2.9491100981106807e-05, "loss": 2.4239, "step": 235210 }, { "epoch": 0.41, "learning_rate": 2.9490229041179977e-05, "loss": 2.2739, "step": 235220 }, { "epoch": 0.41, "learning_rate": 2.948935710125315e-05, "loss": 2.3398, "step": 235230 }, { "epoch": 0.41, "learning_rate": 2.948848516132633e-05, "loss": 2.4946, "step": 235240 }, { "epoch": 0.41, "learning_rate": 2.9487613221399502e-05, "loss": 2.3601, "step": 235250 }, { "epoch": 0.41, "learning_rate": 2.9486741281472673e-05, "loss": 2.4343, "step": 235260 }, { "epoch": 0.41, "learning_rate": 2.9485869341545846e-05, "loss": 2.43, "step": 235270 }, { "epoch": 0.41, "learning_rate": 2.948499740161902e-05, "loss": 2.3123, "step": 235280 }, { "epoch": 0.41, "learning_rate": 2.948412546169219e-05, "loss": 2.4382, "step": 235290 }, { "epoch": 0.41, "learning_rate": 2.9483253521765364e-05, "loss": 2.3458, "step": 235300 }, { "epoch": 0.41, "learning_rate": 2.948238158183854e-05, "loss": 2.4602, "step": 235310 }, { "epoch": 0.41, "learning_rate": 2.9481509641911715e-05, "loss": 2.3824, "step": 235320 }, { "epoch": 0.41, "learning_rate": 2.9480637701984886e-05, "loss": 2.3487, "step": 235330 }, { "epoch": 0.41, "learning_rate": 2.947976576205806e-05, "loss": 2.3962, "step": 235340 }, { "epoch": 0.41, "learning_rate": 2.9478893822131233e-05, "loss": 2.4352, "step": 235350 }, { "epoch": 0.41, "learning_rate": 2.9478021882204403e-05, "loss": 2.3684, "step": 235360 }, { "epoch": 0.41, "learning_rate": 2.9477149942277577e-05, "loss": 2.4329, "step": 235370 }, { "epoch": 0.41, "learning_rate": 2.9476278002350748e-05, "loss": 2.2928, "step": 235380 }, { "epoch": 0.41, "learning_rate": 2.9475406062423928e-05, "loss": 2.4479, "step": 235390 }, { "epoch": 0.41, "learning_rate": 2.94745341224971e-05, "loss": 2.457, "step": 235400 }, { "epoch": 0.41, "learning_rate": 2.9473662182570272e-05, "loss": 2.3817, "step": 235410 }, { "epoch": 0.41, "learning_rate": 2.9472790242643443e-05, "loss": 2.5211, "step": 235420 }, { "epoch": 0.41, "learning_rate": 2.9471918302716617e-05, "loss": 2.4398, "step": 235430 }, { "epoch": 0.41, "learning_rate": 2.947104636278979e-05, "loss": 2.375, "step": 235440 }, { "epoch": 0.41, "learning_rate": 2.947017442286296e-05, "loss": 2.5181, "step": 235450 }, { "epoch": 0.41, "learning_rate": 2.946930248293614e-05, "loss": 2.47, "step": 235460 }, { "epoch": 0.41, "learning_rate": 2.946843054300931e-05, "loss": 2.3759, "step": 235470 }, { "epoch": 0.41, "learning_rate": 2.9467558603082485e-05, "loss": 2.4283, "step": 235480 }, { "epoch": 0.41, "learning_rate": 2.9466686663155656e-05, "loss": 2.4469, "step": 235490 }, { "epoch": 0.41, "learning_rate": 2.946581472322883e-05, "loss": 2.3151, "step": 235500 }, { "epoch": 0.41, "learning_rate": 2.9464942783302003e-05, "loss": 2.3652, "step": 235510 }, { "epoch": 0.41, "learning_rate": 2.9464070843375174e-05, "loss": 2.3782, "step": 235520 }, { "epoch": 0.41, "learning_rate": 2.9463198903448347e-05, "loss": 2.4485, "step": 235530 }, { "epoch": 0.41, "learning_rate": 2.9462326963521525e-05, "loss": 2.3142, "step": 235540 }, { "epoch": 0.41, "learning_rate": 2.94614550235947e-05, "loss": 2.2824, "step": 235550 }, { "epoch": 0.41, "learning_rate": 2.946058308366787e-05, "loss": 2.4601, "step": 235560 }, { "epoch": 0.41, "learning_rate": 2.9459711143741043e-05, "loss": 2.2625, "step": 235570 }, { "epoch": 0.41, "learning_rate": 2.9458839203814216e-05, "loss": 2.4156, "step": 235580 }, { "epoch": 0.41, "learning_rate": 2.9457967263887387e-05, "loss": 2.3631, "step": 235590 }, { "epoch": 0.41, "learning_rate": 2.945709532396056e-05, "loss": 2.3686, "step": 235600 }, { "epoch": 0.41, "learning_rate": 2.9456223384033738e-05, "loss": 2.2936, "step": 235610 }, { "epoch": 0.41, "learning_rate": 2.945535144410691e-05, "loss": 2.3095, "step": 235620 }, { "epoch": 0.41, "learning_rate": 2.9454479504180082e-05, "loss": 2.2928, "step": 235630 }, { "epoch": 0.41, "learning_rate": 2.9453607564253256e-05, "loss": 2.4402, "step": 235640 }, { "epoch": 0.41, "learning_rate": 2.9452735624326426e-05, "loss": 2.4739, "step": 235650 }, { "epoch": 0.41, "learning_rate": 2.94518636843996e-05, "loss": 2.5571, "step": 235660 }, { "epoch": 0.41, "learning_rate": 2.9450991744472773e-05, "loss": 2.2897, "step": 235670 }, { "epoch": 0.41, "learning_rate": 2.9450119804545944e-05, "loss": 2.4955, "step": 235680 }, { "epoch": 0.41, "learning_rate": 2.9449247864619124e-05, "loss": 2.3325, "step": 235690 }, { "epoch": 0.41, "learning_rate": 2.9448375924692295e-05, "loss": 2.5032, "step": 235700 }, { "epoch": 0.41, "learning_rate": 2.944750398476547e-05, "loss": 2.3842, "step": 235710 }, { "epoch": 0.41, "learning_rate": 2.944663204483864e-05, "loss": 2.3237, "step": 235720 }, { "epoch": 0.41, "learning_rate": 2.9445760104911813e-05, "loss": 2.3979, "step": 235730 }, { "epoch": 0.41, "learning_rate": 2.9444888164984986e-05, "loss": 2.3975, "step": 235740 }, { "epoch": 0.41, "learning_rate": 2.9444016225058157e-05, "loss": 2.4317, "step": 235750 }, { "epoch": 0.41, "learning_rate": 2.9443144285131334e-05, "loss": 2.2487, "step": 235760 }, { "epoch": 0.41, "learning_rate": 2.9442272345204508e-05, "loss": 2.4143, "step": 235770 }, { "epoch": 0.41, "learning_rate": 2.944140040527768e-05, "loss": 2.4529, "step": 235780 }, { "epoch": 0.41, "learning_rate": 2.9440528465350852e-05, "loss": 2.3522, "step": 235790 }, { "epoch": 0.41, "learning_rate": 2.9439656525424026e-05, "loss": 2.4838, "step": 235800 }, { "epoch": 0.41, "learning_rate": 2.94387845854972e-05, "loss": 2.3905, "step": 235810 }, { "epoch": 0.41, "learning_rate": 2.943791264557037e-05, "loss": 2.3377, "step": 235820 }, { "epoch": 0.41, "learning_rate": 2.9437040705643544e-05, "loss": 2.3223, "step": 235830 }, { "epoch": 0.41, "learning_rate": 2.943616876571672e-05, "loss": 2.3337, "step": 235840 }, { "epoch": 0.41, "learning_rate": 2.9435296825789895e-05, "loss": 2.3394, "step": 235850 }, { "epoch": 0.41, "learning_rate": 2.9434424885863065e-05, "loss": 2.4904, "step": 235860 }, { "epoch": 0.41, "learning_rate": 2.943355294593624e-05, "loss": 2.4398, "step": 235870 }, { "epoch": 0.41, "learning_rate": 2.943268100600941e-05, "loss": 2.4717, "step": 235880 }, { "epoch": 0.41, "learning_rate": 2.9431809066082583e-05, "loss": 2.4286, "step": 235890 }, { "epoch": 0.41, "learning_rate": 2.9430937126155757e-05, "loss": 2.4394, "step": 235900 }, { "epoch": 0.41, "learning_rate": 2.9430065186228934e-05, "loss": 2.3964, "step": 235910 }, { "epoch": 0.41, "learning_rate": 2.9429193246302108e-05, "loss": 2.3184, "step": 235920 }, { "epoch": 0.41, "learning_rate": 2.9428321306375278e-05, "loss": 2.3735, "step": 235930 }, { "epoch": 0.41, "learning_rate": 2.942744936644845e-05, "loss": 2.4144, "step": 235940 }, { "epoch": 0.41, "learning_rate": 2.9426577426521622e-05, "loss": 2.3835, "step": 235950 }, { "epoch": 0.41, "learning_rate": 2.9425705486594796e-05, "loss": 2.2854, "step": 235960 }, { "epoch": 0.41, "learning_rate": 2.942483354666797e-05, "loss": 2.363, "step": 235970 }, { "epoch": 0.41, "learning_rate": 2.9423961606741147e-05, "loss": 2.4019, "step": 235980 }, { "epoch": 0.41, "learning_rate": 2.9423089666814317e-05, "loss": 2.3689, "step": 235990 }, { "epoch": 0.41, "learning_rate": 2.942221772688749e-05, "loss": 2.4048, "step": 236000 }, { "epoch": 0.41, "learning_rate": 2.9421345786960665e-05, "loss": 2.4043, "step": 236010 }, { "epoch": 0.41, "learning_rate": 2.9420473847033835e-05, "loss": 2.3788, "step": 236020 }, { "epoch": 0.41, "learning_rate": 2.941960190710701e-05, "loss": 2.4901, "step": 236030 }, { "epoch": 0.41, "learning_rate": 2.941872996718018e-05, "loss": 2.382, "step": 236040 }, { "epoch": 0.41, "learning_rate": 2.9417858027253353e-05, "loss": 2.3533, "step": 236050 }, { "epoch": 0.41, "learning_rate": 2.941698608732653e-05, "loss": 2.3853, "step": 236060 }, { "epoch": 0.41, "learning_rate": 2.9416114147399704e-05, "loss": 2.474, "step": 236070 }, { "epoch": 0.41, "learning_rate": 2.9415242207472878e-05, "loss": 2.4072, "step": 236080 }, { "epoch": 0.41, "learning_rate": 2.9414370267546048e-05, "loss": 2.3214, "step": 236090 }, { "epoch": 0.41, "learning_rate": 2.9413498327619222e-05, "loss": 2.3831, "step": 236100 }, { "epoch": 0.41, "learning_rate": 2.9412626387692392e-05, "loss": 2.3469, "step": 236110 }, { "epoch": 0.41, "learning_rate": 2.9411754447765566e-05, "loss": 2.5003, "step": 236120 }, { "epoch": 0.41, "learning_rate": 2.9410882507838743e-05, "loss": 2.5013, "step": 236130 }, { "epoch": 0.41, "learning_rate": 2.9410010567911917e-05, "loss": 2.4922, "step": 236140 }, { "epoch": 0.41, "learning_rate": 2.9409138627985087e-05, "loss": 2.3403, "step": 236150 }, { "epoch": 0.41, "learning_rate": 2.940826668805826e-05, "loss": 2.3666, "step": 236160 }, { "epoch": 0.41, "learning_rate": 2.9407394748131435e-05, "loss": 2.3742, "step": 236170 }, { "epoch": 0.41, "learning_rate": 2.9406522808204605e-05, "loss": 2.3755, "step": 236180 }, { "epoch": 0.41, "learning_rate": 2.940565086827778e-05, "loss": 2.3174, "step": 236190 }, { "epoch": 0.41, "learning_rate": 2.9404778928350953e-05, "loss": 2.3187, "step": 236200 }, { "epoch": 0.41, "learning_rate": 2.940390698842413e-05, "loss": 2.4722, "step": 236210 }, { "epoch": 0.41, "learning_rate": 2.94030350484973e-05, "loss": 2.4563, "step": 236220 }, { "epoch": 0.41, "learning_rate": 2.9402163108570474e-05, "loss": 2.4057, "step": 236230 }, { "epoch": 0.41, "learning_rate": 2.9401291168643648e-05, "loss": 2.3461, "step": 236240 }, { "epoch": 0.41, "learning_rate": 2.9400419228716818e-05, "loss": 2.3573, "step": 236250 }, { "epoch": 0.41, "learning_rate": 2.9399547288789992e-05, "loss": 2.4001, "step": 236260 }, { "epoch": 0.41, "learning_rate": 2.9398675348863162e-05, "loss": 2.3258, "step": 236270 }, { "epoch": 0.41, "learning_rate": 2.9397803408936343e-05, "loss": 2.3592, "step": 236280 }, { "epoch": 0.41, "learning_rate": 2.9396931469009513e-05, "loss": 2.4474, "step": 236290 }, { "epoch": 0.41, "learning_rate": 2.9396059529082687e-05, "loss": 2.3023, "step": 236300 }, { "epoch": 0.41, "learning_rate": 2.939518758915586e-05, "loss": 2.3694, "step": 236310 }, { "epoch": 0.41, "learning_rate": 2.939431564922903e-05, "loss": 2.3935, "step": 236320 }, { "epoch": 0.41, "learning_rate": 2.9393443709302205e-05, "loss": 2.3885, "step": 236330 }, { "epoch": 0.41, "learning_rate": 2.9392571769375375e-05, "loss": 2.2771, "step": 236340 }, { "epoch": 0.41, "learning_rate": 2.939169982944855e-05, "loss": 2.3316, "step": 236350 }, { "epoch": 0.41, "learning_rate": 2.9390827889521726e-05, "loss": 2.4624, "step": 236360 }, { "epoch": 0.41, "learning_rate": 2.93899559495949e-05, "loss": 2.338, "step": 236370 }, { "epoch": 0.41, "learning_rate": 2.938908400966807e-05, "loss": 2.3712, "step": 236380 }, { "epoch": 0.41, "learning_rate": 2.9388212069741244e-05, "loss": 2.425, "step": 236390 }, { "epoch": 0.41, "learning_rate": 2.9387340129814418e-05, "loss": 2.45, "step": 236400 }, { "epoch": 0.41, "learning_rate": 2.938646818988759e-05, "loss": 2.3967, "step": 236410 }, { "epoch": 0.41, "learning_rate": 2.9385596249960762e-05, "loss": 2.4948, "step": 236420 }, { "epoch": 0.41, "learning_rate": 2.938472431003394e-05, "loss": 2.4723, "step": 236430 }, { "epoch": 0.41, "learning_rate": 2.9383852370107113e-05, "loss": 2.417, "step": 236440 }, { "epoch": 0.41, "learning_rate": 2.9382980430180283e-05, "loss": 2.2689, "step": 236450 }, { "epoch": 0.41, "learning_rate": 2.9382108490253457e-05, "loss": 2.2028, "step": 236460 }, { "epoch": 0.41, "learning_rate": 2.938123655032663e-05, "loss": 2.4457, "step": 236470 }, { "epoch": 0.41, "learning_rate": 2.93803646103998e-05, "loss": 2.3357, "step": 236480 }, { "epoch": 0.41, "learning_rate": 2.9379492670472975e-05, "loss": 2.4153, "step": 236490 }, { "epoch": 0.41, "learning_rate": 2.9378620730546146e-05, "loss": 2.3187, "step": 236500 }, { "epoch": 0.41, "learning_rate": 2.9377748790619326e-05, "loss": 2.4323, "step": 236510 }, { "epoch": 0.41, "learning_rate": 2.9376876850692496e-05, "loss": 2.4039, "step": 236520 }, { "epoch": 0.41, "learning_rate": 2.937600491076567e-05, "loss": 2.2963, "step": 236530 }, { "epoch": 0.41, "learning_rate": 2.9375132970838844e-05, "loss": 2.4163, "step": 236540 }, { "epoch": 0.41, "learning_rate": 2.9374261030912014e-05, "loss": 2.4503, "step": 236550 }, { "epoch": 0.41, "learning_rate": 2.9373389090985188e-05, "loss": 2.371, "step": 236560 }, { "epoch": 0.41, "learning_rate": 2.937251715105836e-05, "loss": 2.4097, "step": 236570 }, { "epoch": 0.41, "learning_rate": 2.937164521113154e-05, "loss": 2.4088, "step": 236580 }, { "epoch": 0.41, "learning_rate": 2.937077327120471e-05, "loss": 2.4245, "step": 236590 }, { "epoch": 0.41, "learning_rate": 2.9369901331277883e-05, "loss": 2.3989, "step": 236600 }, { "epoch": 0.41, "learning_rate": 2.9369029391351054e-05, "loss": 2.4816, "step": 236610 }, { "epoch": 0.41, "learning_rate": 2.9368157451424227e-05, "loss": 2.4096, "step": 236620 }, { "epoch": 0.41, "learning_rate": 2.93672855114974e-05, "loss": 2.5361, "step": 236630 }, { "epoch": 0.41, "learning_rate": 2.936641357157057e-05, "loss": 2.4331, "step": 236640 }, { "epoch": 0.41, "learning_rate": 2.9365541631643752e-05, "loss": 2.4104, "step": 236650 }, { "epoch": 0.41, "learning_rate": 2.9364669691716922e-05, "loss": 2.3751, "step": 236660 }, { "epoch": 0.41, "learning_rate": 2.9363797751790096e-05, "loss": 2.3968, "step": 236670 }, { "epoch": 0.41, "learning_rate": 2.9362925811863267e-05, "loss": 2.3548, "step": 236680 }, { "epoch": 0.41, "learning_rate": 2.936205387193644e-05, "loss": 2.4794, "step": 236690 }, { "epoch": 0.41, "learning_rate": 2.9361181932009614e-05, "loss": 2.4413, "step": 236700 }, { "epoch": 0.41, "learning_rate": 2.9360309992082785e-05, "loss": 2.4248, "step": 236710 }, { "epoch": 0.41, "learning_rate": 2.9359438052155958e-05, "loss": 2.5247, "step": 236720 }, { "epoch": 0.41, "learning_rate": 2.9358566112229135e-05, "loss": 2.419, "step": 236730 }, { "epoch": 0.41, "learning_rate": 2.935769417230231e-05, "loss": 2.4375, "step": 236740 }, { "epoch": 0.41, "learning_rate": 2.935682223237548e-05, "loss": 2.4782, "step": 236750 }, { "epoch": 0.41, "learning_rate": 2.9355950292448653e-05, "loss": 2.5053, "step": 236760 }, { "epoch": 0.41, "learning_rate": 2.9355078352521824e-05, "loss": 2.3042, "step": 236770 }, { "epoch": 0.41, "learning_rate": 2.9354206412594998e-05, "loss": 2.4659, "step": 236780 }, { "epoch": 0.41, "learning_rate": 2.935333447266817e-05, "loss": 2.3824, "step": 236790 }, { "epoch": 0.41, "learning_rate": 2.935246253274135e-05, "loss": 2.466, "step": 236800 }, { "epoch": 0.41, "learning_rate": 2.9351590592814522e-05, "loss": 2.3871, "step": 236810 }, { "epoch": 0.41, "learning_rate": 2.9350718652887693e-05, "loss": 2.3095, "step": 236820 }, { "epoch": 0.41, "learning_rate": 2.9349846712960866e-05, "loss": 2.3974, "step": 236830 }, { "epoch": 0.41, "learning_rate": 2.9348974773034037e-05, "loss": 2.3956, "step": 236840 }, { "epoch": 0.41, "learning_rate": 2.934810283310721e-05, "loss": 2.2888, "step": 236850 }, { "epoch": 0.41, "learning_rate": 2.9347230893180384e-05, "loss": 2.3868, "step": 236860 }, { "epoch": 0.41, "learning_rate": 2.9346358953253555e-05, "loss": 2.4271, "step": 236870 }, { "epoch": 0.41, "learning_rate": 2.9345487013326732e-05, "loss": 2.3831, "step": 236880 }, { "epoch": 0.41, "learning_rate": 2.9344615073399906e-05, "loss": 2.2806, "step": 236890 }, { "epoch": 0.41, "learning_rate": 2.934374313347308e-05, "loss": 2.2106, "step": 236900 }, { "epoch": 0.41, "learning_rate": 2.934287119354625e-05, "loss": 2.5218, "step": 236910 }, { "epoch": 0.41, "learning_rate": 2.9341999253619424e-05, "loss": 2.3455, "step": 236920 }, { "epoch": 0.41, "learning_rate": 2.9341127313692597e-05, "loss": 2.2995, "step": 236930 }, { "epoch": 0.41, "learning_rate": 2.9340255373765768e-05, "loss": 2.4892, "step": 236940 }, { "epoch": 0.41, "learning_rate": 2.9339383433838945e-05, "loss": 2.3813, "step": 236950 }, { "epoch": 0.41, "learning_rate": 2.933851149391212e-05, "loss": 2.4378, "step": 236960 }, { "epoch": 0.41, "learning_rate": 2.9337639553985292e-05, "loss": 2.3774, "step": 236970 }, { "epoch": 0.41, "learning_rate": 2.9336767614058463e-05, "loss": 2.3287, "step": 236980 }, { "epoch": 0.41, "learning_rate": 2.9335895674131637e-05, "loss": 2.4332, "step": 236990 }, { "epoch": 0.41, "learning_rate": 2.9335023734204807e-05, "loss": 2.2918, "step": 237000 }, { "epoch": 0.41, "learning_rate": 2.933415179427798e-05, "loss": 2.4609, "step": 237010 }, { "epoch": 0.41, "learning_rate": 2.9333279854351154e-05, "loss": 2.4278, "step": 237020 }, { "epoch": 0.41, "learning_rate": 2.933240791442433e-05, "loss": 2.4239, "step": 237030 }, { "epoch": 0.41, "learning_rate": 2.9331535974497505e-05, "loss": 2.4249, "step": 237040 }, { "epoch": 0.41, "learning_rate": 2.9330664034570676e-05, "loss": 2.3649, "step": 237050 }, { "epoch": 0.41, "learning_rate": 2.932979209464385e-05, "loss": 2.3927, "step": 237060 }, { "epoch": 0.41, "learning_rate": 2.932892015471702e-05, "loss": 2.3161, "step": 237070 }, { "epoch": 0.41, "learning_rate": 2.9328048214790194e-05, "loss": 2.3861, "step": 237080 }, { "epoch": 0.41, "learning_rate": 2.9327176274863367e-05, "loss": 2.4218, "step": 237090 }, { "epoch": 0.41, "learning_rate": 2.9326304334936545e-05, "loss": 2.381, "step": 237100 }, { "epoch": 0.41, "learning_rate": 2.9325432395009715e-05, "loss": 2.4393, "step": 237110 }, { "epoch": 0.41, "learning_rate": 2.932456045508289e-05, "loss": 2.3374, "step": 237120 }, { "epoch": 0.41, "learning_rate": 2.9323688515156063e-05, "loss": 2.3187, "step": 237130 }, { "epoch": 0.41, "learning_rate": 2.9322816575229233e-05, "loss": 2.5044, "step": 237140 }, { "epoch": 0.41, "learning_rate": 2.9321944635302407e-05, "loss": 2.4001, "step": 237150 }, { "epoch": 0.41, "learning_rate": 2.932107269537558e-05, "loss": 2.3035, "step": 237160 }, { "epoch": 0.41, "learning_rate": 2.9320200755448758e-05, "loss": 2.4837, "step": 237170 }, { "epoch": 0.41, "learning_rate": 2.9319328815521928e-05, "loss": 2.4393, "step": 237180 }, { "epoch": 0.41, "learning_rate": 2.9318456875595102e-05, "loss": 2.3699, "step": 237190 }, { "epoch": 0.41, "learning_rate": 2.9317584935668276e-05, "loss": 2.4046, "step": 237200 }, { "epoch": 0.41, "learning_rate": 2.9316712995741446e-05, "loss": 2.4905, "step": 237210 }, { "epoch": 0.41, "learning_rate": 2.931584105581462e-05, "loss": 2.3552, "step": 237220 }, { "epoch": 0.41, "learning_rate": 2.931496911588779e-05, "loss": 2.3985, "step": 237230 }, { "epoch": 0.41, "learning_rate": 2.9314097175960964e-05, "loss": 2.3754, "step": 237240 }, { "epoch": 0.41, "learning_rate": 2.931322523603414e-05, "loss": 2.4035, "step": 237250 }, { "epoch": 0.41, "learning_rate": 2.9312353296107315e-05, "loss": 2.4221, "step": 237260 }, { "epoch": 0.41, "learning_rate": 2.931148135618049e-05, "loss": 2.3712, "step": 237270 }, { "epoch": 0.41, "learning_rate": 2.931060941625366e-05, "loss": 2.3144, "step": 237280 }, { "epoch": 0.41, "learning_rate": 2.9309737476326833e-05, "loss": 2.3994, "step": 237290 }, { "epoch": 0.41, "learning_rate": 2.9308865536400003e-05, "loss": 2.3494, "step": 237300 }, { "epoch": 0.41, "learning_rate": 2.9307993596473177e-05, "loss": 2.3443, "step": 237310 }, { "epoch": 0.41, "learning_rate": 2.9307121656546354e-05, "loss": 2.4817, "step": 237320 }, { "epoch": 0.41, "learning_rate": 2.9306249716619528e-05, "loss": 2.4217, "step": 237330 }, { "epoch": 0.41, "learning_rate": 2.9305377776692698e-05, "loss": 2.2881, "step": 237340 }, { "epoch": 0.41, "learning_rate": 2.9304505836765872e-05, "loss": 2.3443, "step": 237350 }, { "epoch": 0.41, "learning_rate": 2.9303633896839046e-05, "loss": 2.33, "step": 237360 }, { "epoch": 0.41, "learning_rate": 2.9302761956912216e-05, "loss": 2.3148, "step": 237370 }, { "epoch": 0.41, "learning_rate": 2.930189001698539e-05, "loss": 2.4183, "step": 237380 }, { "epoch": 0.41, "learning_rate": 2.930101807705856e-05, "loss": 2.3629, "step": 237390 }, { "epoch": 0.41, "learning_rate": 2.930014613713174e-05, "loss": 2.328, "step": 237400 }, { "epoch": 0.41, "learning_rate": 2.929927419720491e-05, "loss": 2.4122, "step": 237410 }, { "epoch": 0.41, "learning_rate": 2.9298402257278085e-05, "loss": 2.3661, "step": 237420 }, { "epoch": 0.41, "learning_rate": 2.929753031735126e-05, "loss": 2.3692, "step": 237430 }, { "epoch": 0.41, "learning_rate": 2.929665837742443e-05, "loss": 2.3147, "step": 237440 }, { "epoch": 0.41, "learning_rate": 2.9295786437497603e-05, "loss": 2.3919, "step": 237450 }, { "epoch": 0.41, "learning_rate": 2.9294914497570773e-05, "loss": 2.4541, "step": 237460 }, { "epoch": 0.41, "learning_rate": 2.9294042557643954e-05, "loss": 2.2652, "step": 237470 }, { "epoch": 0.41, "learning_rate": 2.9293170617717124e-05, "loss": 2.3913, "step": 237480 }, { "epoch": 0.41, "learning_rate": 2.9292298677790298e-05, "loss": 2.4, "step": 237490 }, { "epoch": 0.41, "learning_rate": 2.9291426737863468e-05, "loss": 2.3718, "step": 237500 }, { "epoch": 0.41, "learning_rate": 2.9290554797936642e-05, "loss": 2.3493, "step": 237510 }, { "epoch": 0.41, "learning_rate": 2.9289682858009816e-05, "loss": 2.3376, "step": 237520 }, { "epoch": 0.41, "learning_rate": 2.9288810918082986e-05, "loss": 2.4232, "step": 237530 }, { "epoch": 0.41, "learning_rate": 2.928793897815616e-05, "loss": 2.5617, "step": 237540 }, { "epoch": 0.41, "learning_rate": 2.9287067038229337e-05, "loss": 2.3158, "step": 237550 }, { "epoch": 0.41, "learning_rate": 2.928619509830251e-05, "loss": 2.3896, "step": 237560 }, { "epoch": 0.41, "learning_rate": 2.928532315837568e-05, "loss": 2.3799, "step": 237570 }, { "epoch": 0.41, "learning_rate": 2.9284451218448855e-05, "loss": 2.3308, "step": 237580 }, { "epoch": 0.41, "learning_rate": 2.928357927852203e-05, "loss": 2.4216, "step": 237590 }, { "epoch": 0.41, "learning_rate": 2.92827073385952e-05, "loss": 2.3383, "step": 237600 }, { "epoch": 0.41, "learning_rate": 2.9281835398668373e-05, "loss": 2.3547, "step": 237610 }, { "epoch": 0.41, "learning_rate": 2.928096345874155e-05, "loss": 2.4319, "step": 237620 }, { "epoch": 0.41, "learning_rate": 2.9280091518814724e-05, "loss": 2.4224, "step": 237630 }, { "epoch": 0.41, "learning_rate": 2.9279219578887894e-05, "loss": 2.4205, "step": 237640 }, { "epoch": 0.41, "learning_rate": 2.9278347638961068e-05, "loss": 2.3139, "step": 237650 }, { "epoch": 0.41, "learning_rate": 2.9277475699034242e-05, "loss": 2.3994, "step": 237660 }, { "epoch": 0.41, "learning_rate": 2.9276603759107412e-05, "loss": 2.3822, "step": 237670 }, { "epoch": 0.41, "learning_rate": 2.9275731819180586e-05, "loss": 2.5138, "step": 237680 }, { "epoch": 0.41, "learning_rate": 2.9274859879253756e-05, "loss": 2.4465, "step": 237690 }, { "epoch": 0.41, "learning_rate": 2.9273987939326937e-05, "loss": 2.3314, "step": 237700 }, { "epoch": 0.41, "learning_rate": 2.9273115999400107e-05, "loss": 2.4248, "step": 237710 }, { "epoch": 0.41, "learning_rate": 2.927224405947328e-05, "loss": 2.4055, "step": 237720 }, { "epoch": 0.41, "learning_rate": 2.927137211954645e-05, "loss": 2.4205, "step": 237730 }, { "epoch": 0.41, "learning_rate": 2.9270500179619625e-05, "loss": 2.4611, "step": 237740 }, { "epoch": 0.41, "learning_rate": 2.92696282396928e-05, "loss": 2.3047, "step": 237750 }, { "epoch": 0.41, "learning_rate": 2.926875629976597e-05, "loss": 2.5047, "step": 237760 }, { "epoch": 0.41, "learning_rate": 2.926788435983915e-05, "loss": 2.2291, "step": 237770 }, { "epoch": 0.41, "learning_rate": 2.926701241991232e-05, "loss": 2.4082, "step": 237780 }, { "epoch": 0.41, "learning_rate": 2.9266140479985494e-05, "loss": 2.2968, "step": 237790 }, { "epoch": 0.41, "learning_rate": 2.9265268540058664e-05, "loss": 2.4294, "step": 237800 }, { "epoch": 0.41, "learning_rate": 2.9264396600131838e-05, "loss": 2.39, "step": 237810 }, { "epoch": 0.41, "learning_rate": 2.9263524660205012e-05, "loss": 2.4464, "step": 237820 }, { "epoch": 0.41, "learning_rate": 2.9262652720278182e-05, "loss": 2.4251, "step": 237830 }, { "epoch": 0.41, "learning_rate": 2.926178078035136e-05, "loss": 2.3756, "step": 237840 }, { "epoch": 0.41, "learning_rate": 2.9260908840424533e-05, "loss": 2.4473, "step": 237850 }, { "epoch": 0.41, "learning_rate": 2.9260036900497707e-05, "loss": 2.3588, "step": 237860 }, { "epoch": 0.41, "learning_rate": 2.9259164960570877e-05, "loss": 2.3602, "step": 237870 }, { "epoch": 0.41, "learning_rate": 2.925829302064405e-05, "loss": 2.3947, "step": 237880 }, { "epoch": 0.41, "learning_rate": 2.9257421080717225e-05, "loss": 2.3711, "step": 237890 }, { "epoch": 0.41, "learning_rate": 2.9256549140790395e-05, "loss": 2.3412, "step": 237900 }, { "epoch": 0.41, "learning_rate": 2.925567720086357e-05, "loss": 2.368, "step": 237910 }, { "epoch": 0.41, "learning_rate": 2.9254805260936746e-05, "loss": 2.4569, "step": 237920 }, { "epoch": 0.41, "learning_rate": 2.925393332100992e-05, "loss": 2.4088, "step": 237930 }, { "epoch": 0.41, "learning_rate": 2.925306138108309e-05, "loss": 2.438, "step": 237940 }, { "epoch": 0.41, "learning_rate": 2.9252189441156264e-05, "loss": 2.3205, "step": 237950 }, { "epoch": 0.41, "learning_rate": 2.9251317501229435e-05, "loss": 2.3804, "step": 237960 }, { "epoch": 0.41, "learning_rate": 2.925044556130261e-05, "loss": 2.3843, "step": 237970 }, { "epoch": 0.42, "learning_rate": 2.9249573621375782e-05, "loss": 2.4832, "step": 237980 }, { "epoch": 0.42, "learning_rate": 2.924870168144896e-05, "loss": 2.3415, "step": 237990 }, { "epoch": 0.42, "learning_rate": 2.9247829741522133e-05, "loss": 2.3879, "step": 238000 }, { "epoch": 0.42, "learning_rate": 2.9246957801595303e-05, "loss": 2.437, "step": 238010 }, { "epoch": 0.42, "learning_rate": 2.9246085861668477e-05, "loss": 2.4185, "step": 238020 }, { "epoch": 0.42, "learning_rate": 2.9245213921741648e-05, "loss": 2.3437, "step": 238030 }, { "epoch": 0.42, "learning_rate": 2.924434198181482e-05, "loss": 2.2486, "step": 238040 }, { "epoch": 0.42, "learning_rate": 2.9243470041887995e-05, "loss": 2.3235, "step": 238050 }, { "epoch": 0.42, "learning_rate": 2.9242598101961166e-05, "loss": 2.3867, "step": 238060 }, { "epoch": 0.42, "learning_rate": 2.9241726162034343e-05, "loss": 2.3513, "step": 238070 }, { "epoch": 0.42, "learning_rate": 2.9240854222107516e-05, "loss": 2.4442, "step": 238080 }, { "epoch": 0.42, "learning_rate": 2.923998228218069e-05, "loss": 2.422, "step": 238090 }, { "epoch": 0.42, "learning_rate": 2.923911034225386e-05, "loss": 2.4632, "step": 238100 }, { "epoch": 0.42, "learning_rate": 2.9238238402327034e-05, "loss": 2.3991, "step": 238110 }, { "epoch": 0.42, "learning_rate": 2.9237366462400205e-05, "loss": 2.3726, "step": 238120 }, { "epoch": 0.42, "learning_rate": 2.923649452247338e-05, "loss": 2.5, "step": 238130 }, { "epoch": 0.42, "learning_rate": 2.9235622582546556e-05, "loss": 2.3964, "step": 238140 }, { "epoch": 0.42, "learning_rate": 2.923475064261973e-05, "loss": 2.3241, "step": 238150 }, { "epoch": 0.42, "learning_rate": 2.9233878702692903e-05, "loss": 2.4459, "step": 238160 }, { "epoch": 0.42, "learning_rate": 2.9233006762766074e-05, "loss": 2.5051, "step": 238170 }, { "epoch": 0.42, "learning_rate": 2.9232134822839247e-05, "loss": 2.3571, "step": 238180 }, { "epoch": 0.42, "learning_rate": 2.9231262882912418e-05, "loss": 2.4574, "step": 238190 }, { "epoch": 0.42, "learning_rate": 2.923039094298559e-05, "loss": 2.2677, "step": 238200 }, { "epoch": 0.42, "learning_rate": 2.9229519003058765e-05, "loss": 2.3521, "step": 238210 }, { "epoch": 0.42, "learning_rate": 2.9228647063131942e-05, "loss": 2.4982, "step": 238220 }, { "epoch": 0.42, "learning_rate": 2.9227775123205113e-05, "loss": 2.373, "step": 238230 }, { "epoch": 0.42, "learning_rate": 2.9226903183278287e-05, "loss": 2.341, "step": 238240 }, { "epoch": 0.42, "learning_rate": 2.922603124335146e-05, "loss": 2.4684, "step": 238250 }, { "epoch": 0.42, "learning_rate": 2.922515930342463e-05, "loss": 2.4095, "step": 238260 }, { "epoch": 0.42, "learning_rate": 2.9224287363497805e-05, "loss": 2.311, "step": 238270 }, { "epoch": 0.42, "learning_rate": 2.9223415423570978e-05, "loss": 2.3428, "step": 238280 }, { "epoch": 0.42, "learning_rate": 2.9222543483644155e-05, "loss": 2.437, "step": 238290 }, { "epoch": 0.42, "learning_rate": 2.9221671543717326e-05, "loss": 2.3692, "step": 238300 }, { "epoch": 0.42, "learning_rate": 2.92207996037905e-05, "loss": 2.2942, "step": 238310 }, { "epoch": 0.42, "learning_rate": 2.9219927663863673e-05, "loss": 2.4719, "step": 238320 }, { "epoch": 0.42, "learning_rate": 2.9219055723936844e-05, "loss": 2.3067, "step": 238330 }, { "epoch": 0.42, "learning_rate": 2.9218183784010018e-05, "loss": 2.4313, "step": 238340 }, { "epoch": 0.42, "learning_rate": 2.9217311844083188e-05, "loss": 2.3465, "step": 238350 }, { "epoch": 0.42, "learning_rate": 2.921643990415636e-05, "loss": 2.3753, "step": 238360 }, { "epoch": 0.42, "learning_rate": 2.921556796422954e-05, "loss": 2.293, "step": 238370 }, { "epoch": 0.42, "learning_rate": 2.9214696024302713e-05, "loss": 2.4028, "step": 238380 }, { "epoch": 0.42, "learning_rate": 2.9213824084375886e-05, "loss": 2.2972, "step": 238390 }, { "epoch": 0.42, "learning_rate": 2.9212952144449057e-05, "loss": 2.4677, "step": 238400 }, { "epoch": 0.42, "learning_rate": 2.921208020452223e-05, "loss": 2.3901, "step": 238410 }, { "epoch": 0.42, "learning_rate": 2.92112082645954e-05, "loss": 2.4534, "step": 238420 }, { "epoch": 0.42, "learning_rate": 2.9210336324668575e-05, "loss": 2.4185, "step": 238430 }, { "epoch": 0.42, "learning_rate": 2.9209464384741752e-05, "loss": 2.4077, "step": 238440 }, { "epoch": 0.42, "learning_rate": 2.9208592444814926e-05, "loss": 2.3722, "step": 238450 }, { "epoch": 0.42, "learning_rate": 2.9207720504888096e-05, "loss": 2.4618, "step": 238460 }, { "epoch": 0.42, "learning_rate": 2.920684856496127e-05, "loss": 2.3831, "step": 238470 }, { "epoch": 0.42, "learning_rate": 2.9205976625034444e-05, "loss": 2.4038, "step": 238480 }, { "epoch": 0.42, "learning_rate": 2.9205104685107614e-05, "loss": 2.4305, "step": 238490 }, { "epoch": 0.42, "learning_rate": 2.9204232745180788e-05, "loss": 2.4499, "step": 238500 }, { "epoch": 0.42, "learning_rate": 2.9203360805253965e-05, "loss": 2.3322, "step": 238510 }, { "epoch": 0.42, "learning_rate": 2.920248886532714e-05, "loss": 2.3466, "step": 238520 }, { "epoch": 0.42, "learning_rate": 2.920161692540031e-05, "loss": 2.378, "step": 238530 }, { "epoch": 0.42, "learning_rate": 2.9200744985473483e-05, "loss": 2.4425, "step": 238540 }, { "epoch": 0.42, "learning_rate": 2.9199873045546657e-05, "loss": 2.3472, "step": 238550 }, { "epoch": 0.42, "learning_rate": 2.9199001105619827e-05, "loss": 2.4893, "step": 238560 }, { "epoch": 0.42, "learning_rate": 2.9198129165693e-05, "loss": 2.3195, "step": 238570 }, { "epoch": 0.42, "learning_rate": 2.919725722576617e-05, "loss": 2.4792, "step": 238580 }, { "epoch": 0.42, "learning_rate": 2.919638528583935e-05, "loss": 2.4492, "step": 238590 }, { "epoch": 0.42, "learning_rate": 2.9195513345912522e-05, "loss": 2.3127, "step": 238600 }, { "epoch": 0.42, "learning_rate": 2.9194641405985696e-05, "loss": 2.3265, "step": 238610 }, { "epoch": 0.42, "learning_rate": 2.919376946605887e-05, "loss": 2.4, "step": 238620 }, { "epoch": 0.42, "learning_rate": 2.919289752613204e-05, "loss": 2.4229, "step": 238630 }, { "epoch": 0.42, "learning_rate": 2.9192025586205214e-05, "loss": 2.4685, "step": 238640 }, { "epoch": 0.42, "learning_rate": 2.9191153646278384e-05, "loss": 2.5046, "step": 238650 }, { "epoch": 0.42, "learning_rate": 2.9190281706351565e-05, "loss": 2.5483, "step": 238660 }, { "epoch": 0.42, "learning_rate": 2.9189409766424735e-05, "loss": 2.2917, "step": 238670 }, { "epoch": 0.42, "learning_rate": 2.918853782649791e-05, "loss": 2.4847, "step": 238680 }, { "epoch": 0.42, "learning_rate": 2.918766588657108e-05, "loss": 2.3472, "step": 238690 }, { "epoch": 0.42, "learning_rate": 2.9186793946644253e-05, "loss": 2.4718, "step": 238700 }, { "epoch": 0.42, "learning_rate": 2.9185922006717427e-05, "loss": 2.4393, "step": 238710 }, { "epoch": 0.42, "learning_rate": 2.9185050066790597e-05, "loss": 2.3681, "step": 238720 }, { "epoch": 0.42, "learning_rate": 2.918417812686377e-05, "loss": 2.36, "step": 238730 }, { "epoch": 0.42, "learning_rate": 2.9183306186936948e-05, "loss": 2.4042, "step": 238740 }, { "epoch": 0.42, "learning_rate": 2.9182434247010122e-05, "loss": 2.3747, "step": 238750 }, { "epoch": 0.42, "learning_rate": 2.9181562307083292e-05, "loss": 2.385, "step": 238760 }, { "epoch": 0.42, "learning_rate": 2.9180690367156466e-05, "loss": 2.4182, "step": 238770 }, { "epoch": 0.42, "learning_rate": 2.917981842722964e-05, "loss": 2.3819, "step": 238780 }, { "epoch": 0.42, "learning_rate": 2.917894648730281e-05, "loss": 2.4402, "step": 238790 }, { "epoch": 0.42, "learning_rate": 2.9178074547375984e-05, "loss": 2.3862, "step": 238800 }, { "epoch": 0.42, "learning_rate": 2.917720260744916e-05, "loss": 2.4354, "step": 238810 }, { "epoch": 0.42, "learning_rate": 2.9176330667522335e-05, "loss": 2.4346, "step": 238820 }, { "epoch": 0.42, "learning_rate": 2.9175458727595505e-05, "loss": 2.4086, "step": 238830 }, { "epoch": 0.42, "learning_rate": 2.917458678766868e-05, "loss": 2.2857, "step": 238840 }, { "epoch": 0.42, "learning_rate": 2.917371484774185e-05, "loss": 2.3502, "step": 238850 }, { "epoch": 0.42, "learning_rate": 2.9172842907815023e-05, "loss": 2.4347, "step": 238860 }, { "epoch": 0.42, "learning_rate": 2.9171970967888197e-05, "loss": 2.2518, "step": 238870 }, { "epoch": 0.42, "learning_rate": 2.9171099027961367e-05, "loss": 2.4405, "step": 238880 }, { "epoch": 0.42, "learning_rate": 2.9170227088034548e-05, "loss": 2.3944, "step": 238890 }, { "epoch": 0.42, "learning_rate": 2.9169355148107718e-05, "loss": 2.4256, "step": 238900 }, { "epoch": 0.42, "learning_rate": 2.9168483208180892e-05, "loss": 2.4276, "step": 238910 }, { "epoch": 0.42, "learning_rate": 2.9167611268254062e-05, "loss": 2.4906, "step": 238920 }, { "epoch": 0.42, "learning_rate": 2.9166739328327236e-05, "loss": 2.4043, "step": 238930 }, { "epoch": 0.42, "learning_rate": 2.916586738840041e-05, "loss": 2.2642, "step": 238940 }, { "epoch": 0.42, "learning_rate": 2.916499544847358e-05, "loss": 2.4363, "step": 238950 }, { "epoch": 0.42, "learning_rate": 2.9164123508546757e-05, "loss": 2.4167, "step": 238960 }, { "epoch": 0.42, "learning_rate": 2.916325156861993e-05, "loss": 2.2866, "step": 238970 }, { "epoch": 0.42, "learning_rate": 2.9162379628693105e-05, "loss": 2.3342, "step": 238980 }, { "epoch": 0.42, "learning_rate": 2.9161507688766275e-05, "loss": 2.4198, "step": 238990 }, { "epoch": 0.42, "learning_rate": 2.916063574883945e-05, "loss": 2.3961, "step": 239000 }, { "epoch": 0.42, "learning_rate": 2.9159763808912623e-05, "loss": 2.3733, "step": 239010 }, { "epoch": 0.42, "learning_rate": 2.9158891868985793e-05, "loss": 2.2849, "step": 239020 }, { "epoch": 0.42, "learning_rate": 2.9158019929058967e-05, "loss": 2.3816, "step": 239030 }, { "epoch": 0.42, "learning_rate": 2.9157147989132144e-05, "loss": 2.2625, "step": 239040 }, { "epoch": 0.42, "learning_rate": 2.9156276049205318e-05, "loss": 2.3739, "step": 239050 }, { "epoch": 0.42, "learning_rate": 2.9155404109278488e-05, "loss": 2.4938, "step": 239060 }, { "epoch": 0.42, "learning_rate": 2.9154532169351662e-05, "loss": 2.3295, "step": 239070 }, { "epoch": 0.42, "learning_rate": 2.9153660229424832e-05, "loss": 2.4174, "step": 239080 }, { "epoch": 0.42, "learning_rate": 2.9152788289498006e-05, "loss": 2.348, "step": 239090 }, { "epoch": 0.42, "learning_rate": 2.915191634957118e-05, "loss": 2.3729, "step": 239100 }, { "epoch": 0.42, "learning_rate": 2.9151044409644357e-05, "loss": 2.5517, "step": 239110 }, { "epoch": 0.42, "learning_rate": 2.915017246971753e-05, "loss": 2.3401, "step": 239120 }, { "epoch": 0.42, "learning_rate": 2.91493005297907e-05, "loss": 2.3624, "step": 239130 }, { "epoch": 0.42, "learning_rate": 2.9148428589863875e-05, "loss": 2.3888, "step": 239140 }, { "epoch": 0.42, "learning_rate": 2.9147556649937045e-05, "loss": 2.2736, "step": 239150 }, { "epoch": 0.42, "learning_rate": 2.914668471001022e-05, "loss": 2.4588, "step": 239160 }, { "epoch": 0.42, "learning_rate": 2.9145812770083393e-05, "loss": 2.3848, "step": 239170 }, { "epoch": 0.42, "learning_rate": 2.914494083015657e-05, "loss": 2.3441, "step": 239180 }, { "epoch": 0.42, "learning_rate": 2.914406889022974e-05, "loss": 2.3476, "step": 239190 }, { "epoch": 0.42, "learning_rate": 2.9143196950302914e-05, "loss": 2.3834, "step": 239200 }, { "epoch": 0.42, "learning_rate": 2.9142325010376088e-05, "loss": 2.4691, "step": 239210 }, { "epoch": 0.42, "learning_rate": 2.914145307044926e-05, "loss": 2.3655, "step": 239220 }, { "epoch": 0.42, "learning_rate": 2.9140581130522432e-05, "loss": 2.417, "step": 239230 }, { "epoch": 0.42, "learning_rate": 2.9139709190595606e-05, "loss": 2.4124, "step": 239240 }, { "epoch": 0.42, "learning_rate": 2.9138837250668776e-05, "loss": 2.4806, "step": 239250 }, { "epoch": 0.42, "learning_rate": 2.9137965310741954e-05, "loss": 2.3046, "step": 239260 }, { "epoch": 0.42, "learning_rate": 2.9137093370815127e-05, "loss": 2.405, "step": 239270 }, { "epoch": 0.42, "learning_rate": 2.91362214308883e-05, "loss": 2.284, "step": 239280 }, { "epoch": 0.42, "learning_rate": 2.913534949096147e-05, "loss": 2.3905, "step": 239290 }, { "epoch": 0.42, "learning_rate": 2.9134477551034645e-05, "loss": 2.3945, "step": 239300 }, { "epoch": 0.42, "learning_rate": 2.9133605611107816e-05, "loss": 2.4368, "step": 239310 }, { "epoch": 0.42, "learning_rate": 2.913273367118099e-05, "loss": 2.3966, "step": 239320 }, { "epoch": 0.42, "learning_rate": 2.9131861731254167e-05, "loss": 2.4935, "step": 239330 }, { "epoch": 0.42, "learning_rate": 2.913098979132734e-05, "loss": 2.4395, "step": 239340 }, { "epoch": 0.42, "learning_rate": 2.9130117851400514e-05, "loss": 2.3837, "step": 239350 }, { "epoch": 0.42, "learning_rate": 2.9129245911473684e-05, "loss": 2.3037, "step": 239360 }, { "epoch": 0.42, "learning_rate": 2.9128373971546858e-05, "loss": 2.337, "step": 239370 }, { "epoch": 0.42, "learning_rate": 2.912750203162003e-05, "loss": 2.3917, "step": 239380 }, { "epoch": 0.42, "learning_rate": 2.9126630091693202e-05, "loss": 2.401, "step": 239390 }, { "epoch": 0.42, "learning_rate": 2.9125758151766376e-05, "loss": 2.4685, "step": 239400 }, { "epoch": 0.42, "learning_rate": 2.9124886211839553e-05, "loss": 2.3237, "step": 239410 }, { "epoch": 0.42, "learning_rate": 2.9124014271912724e-05, "loss": 2.3475, "step": 239420 }, { "epoch": 0.42, "learning_rate": 2.9123142331985897e-05, "loss": 2.3358, "step": 239430 }, { "epoch": 0.42, "learning_rate": 2.912227039205907e-05, "loss": 2.3515, "step": 239440 }, { "epoch": 0.42, "learning_rate": 2.912139845213224e-05, "loss": 2.4703, "step": 239450 }, { "epoch": 0.42, "learning_rate": 2.9120526512205415e-05, "loss": 2.4485, "step": 239460 }, { "epoch": 0.42, "learning_rate": 2.9119654572278586e-05, "loss": 2.2462, "step": 239470 }, { "epoch": 0.42, "learning_rate": 2.9118782632351766e-05, "loss": 2.4112, "step": 239480 }, { "epoch": 0.42, "learning_rate": 2.9117910692424937e-05, "loss": 2.4307, "step": 239490 }, { "epoch": 0.42, "learning_rate": 2.911703875249811e-05, "loss": 2.3161, "step": 239500 }, { "epoch": 0.42, "learning_rate": 2.9116166812571284e-05, "loss": 2.457, "step": 239510 }, { "epoch": 0.42, "learning_rate": 2.9115294872644455e-05, "loss": 2.3689, "step": 239520 }, { "epoch": 0.42, "learning_rate": 2.911442293271763e-05, "loss": 2.4055, "step": 239530 }, { "epoch": 0.42, "learning_rate": 2.91135509927908e-05, "loss": 2.4109, "step": 239540 }, { "epoch": 0.42, "learning_rate": 2.9112679052863973e-05, "loss": 2.3062, "step": 239550 }, { "epoch": 0.42, "learning_rate": 2.911180711293715e-05, "loss": 2.3764, "step": 239560 }, { "epoch": 0.42, "learning_rate": 2.9110935173010323e-05, "loss": 2.4595, "step": 239570 }, { "epoch": 0.42, "learning_rate": 2.9110063233083494e-05, "loss": 2.354, "step": 239580 }, { "epoch": 0.42, "learning_rate": 2.9109191293156668e-05, "loss": 2.4047, "step": 239590 }, { "epoch": 0.42, "learning_rate": 2.910831935322984e-05, "loss": 2.4392, "step": 239600 }, { "epoch": 0.42, "learning_rate": 2.9107447413303012e-05, "loss": 2.3576, "step": 239610 }, { "epoch": 0.42, "learning_rate": 2.9106575473376186e-05, "loss": 2.3663, "step": 239620 }, { "epoch": 0.42, "learning_rate": 2.9105703533449363e-05, "loss": 2.4206, "step": 239630 }, { "epoch": 0.42, "learning_rate": 2.9104831593522536e-05, "loss": 2.4841, "step": 239640 }, { "epoch": 0.42, "learning_rate": 2.9103959653595707e-05, "loss": 2.3819, "step": 239650 }, { "epoch": 0.42, "learning_rate": 2.910308771366888e-05, "loss": 2.3399, "step": 239660 }, { "epoch": 0.42, "learning_rate": 2.9102215773742054e-05, "loss": 2.3748, "step": 239670 }, { "epoch": 0.42, "learning_rate": 2.9101343833815225e-05, "loss": 2.4261, "step": 239680 }, { "epoch": 0.42, "learning_rate": 2.91004718938884e-05, "loss": 2.3549, "step": 239690 }, { "epoch": 0.42, "learning_rate": 2.9099599953961576e-05, "loss": 2.3646, "step": 239700 }, { "epoch": 0.42, "learning_rate": 2.909872801403475e-05, "loss": 2.4632, "step": 239710 }, { "epoch": 0.42, "learning_rate": 2.909785607410792e-05, "loss": 2.3731, "step": 239720 }, { "epoch": 0.42, "learning_rate": 2.9096984134181094e-05, "loss": 2.3874, "step": 239730 }, { "epoch": 0.42, "learning_rate": 2.9096112194254267e-05, "loss": 2.4158, "step": 239740 }, { "epoch": 0.42, "learning_rate": 2.9095240254327438e-05, "loss": 2.2808, "step": 239750 }, { "epoch": 0.42, "learning_rate": 2.909436831440061e-05, "loss": 2.441, "step": 239760 }, { "epoch": 0.42, "learning_rate": 2.9093496374473782e-05, "loss": 2.3754, "step": 239770 }, { "epoch": 0.42, "learning_rate": 2.9092624434546962e-05, "loss": 2.3066, "step": 239780 }, { "epoch": 0.42, "learning_rate": 2.9091752494620133e-05, "loss": 2.3698, "step": 239790 }, { "epoch": 0.42, "learning_rate": 2.9090880554693307e-05, "loss": 2.3503, "step": 239800 }, { "epoch": 0.42, "learning_rate": 2.9090008614766477e-05, "loss": 2.4087, "step": 239810 }, { "epoch": 0.42, "learning_rate": 2.908913667483965e-05, "loss": 2.3628, "step": 239820 }, { "epoch": 0.42, "learning_rate": 2.9088264734912825e-05, "loss": 2.4483, "step": 239830 }, { "epoch": 0.42, "learning_rate": 2.9087392794985995e-05, "loss": 2.3699, "step": 239840 }, { "epoch": 0.42, "learning_rate": 2.9086520855059175e-05, "loss": 2.4233, "step": 239850 }, { "epoch": 0.42, "learning_rate": 2.9085648915132346e-05, "loss": 2.3676, "step": 239860 }, { "epoch": 0.42, "learning_rate": 2.908477697520552e-05, "loss": 2.3782, "step": 239870 }, { "epoch": 0.42, "learning_rate": 2.908390503527869e-05, "loss": 2.2704, "step": 239880 }, { "epoch": 0.42, "learning_rate": 2.9083033095351864e-05, "loss": 2.4395, "step": 239890 }, { "epoch": 0.42, "learning_rate": 2.9082161155425038e-05, "loss": 2.2844, "step": 239900 }, { "epoch": 0.42, "learning_rate": 2.9081289215498208e-05, "loss": 2.1865, "step": 239910 }, { "epoch": 0.42, "learning_rate": 2.908041727557138e-05, "loss": 2.4691, "step": 239920 }, { "epoch": 0.42, "learning_rate": 2.907954533564456e-05, "loss": 2.4039, "step": 239930 }, { "epoch": 0.42, "learning_rate": 2.9078673395717733e-05, "loss": 2.3618, "step": 239940 }, { "epoch": 0.42, "learning_rate": 2.9077801455790903e-05, "loss": 2.3784, "step": 239950 }, { "epoch": 0.42, "learning_rate": 2.9076929515864077e-05, "loss": 2.4692, "step": 239960 }, { "epoch": 0.42, "learning_rate": 2.907605757593725e-05, "loss": 2.3593, "step": 239970 }, { "epoch": 0.42, "learning_rate": 2.907518563601042e-05, "loss": 2.4526, "step": 239980 }, { "epoch": 0.42, "learning_rate": 2.9074313696083595e-05, "loss": 2.3641, "step": 239990 }, { "epoch": 0.42, "learning_rate": 2.9073441756156772e-05, "loss": 2.3669, "step": 240000 }, { "epoch": 0.42, "learning_rate": 2.9072569816229946e-05, "loss": 2.4356, "step": 240010 }, { "epoch": 0.42, "learning_rate": 2.9071697876303116e-05, "loss": 2.3789, "step": 240020 }, { "epoch": 0.42, "learning_rate": 2.907082593637629e-05, "loss": 2.2849, "step": 240030 }, { "epoch": 0.42, "learning_rate": 2.906995399644946e-05, "loss": 2.346, "step": 240040 }, { "epoch": 0.42, "learning_rate": 2.9069082056522634e-05, "loss": 2.4042, "step": 240050 }, { "epoch": 0.42, "learning_rate": 2.9068210116595808e-05, "loss": 2.426, "step": 240060 }, { "epoch": 0.42, "learning_rate": 2.9067338176668978e-05, "loss": 2.3516, "step": 240070 }, { "epoch": 0.42, "learning_rate": 2.906646623674216e-05, "loss": 2.3219, "step": 240080 }, { "epoch": 0.42, "learning_rate": 2.906559429681533e-05, "loss": 2.3432, "step": 240090 }, { "epoch": 0.42, "learning_rate": 2.9064722356888503e-05, "loss": 2.3158, "step": 240100 }, { "epoch": 0.42, "learning_rate": 2.9063850416961673e-05, "loss": 2.4156, "step": 240110 }, { "epoch": 0.42, "learning_rate": 2.9062978477034847e-05, "loss": 2.3767, "step": 240120 }, { "epoch": 0.42, "learning_rate": 2.906210653710802e-05, "loss": 2.3017, "step": 240130 }, { "epoch": 0.42, "learning_rate": 2.906123459718119e-05, "loss": 2.5153, "step": 240140 }, { "epoch": 0.42, "learning_rate": 2.9060362657254368e-05, "loss": 2.4824, "step": 240150 }, { "epoch": 0.42, "learning_rate": 2.9059490717327542e-05, "loss": 2.3451, "step": 240160 }, { "epoch": 0.42, "learning_rate": 2.9058618777400716e-05, "loss": 2.2553, "step": 240170 }, { "epoch": 0.42, "learning_rate": 2.9057746837473886e-05, "loss": 2.349, "step": 240180 }, { "epoch": 0.42, "learning_rate": 2.905687489754706e-05, "loss": 2.3836, "step": 240190 }, { "epoch": 0.42, "learning_rate": 2.905600295762023e-05, "loss": 2.4297, "step": 240200 }, { "epoch": 0.42, "learning_rate": 2.9055131017693404e-05, "loss": 2.4146, "step": 240210 }, { "epoch": 0.42, "learning_rate": 2.9054259077766578e-05, "loss": 2.3766, "step": 240220 }, { "epoch": 0.42, "learning_rate": 2.9053387137839755e-05, "loss": 2.2934, "step": 240230 }, { "epoch": 0.42, "learning_rate": 2.905251519791293e-05, "loss": 2.3753, "step": 240240 }, { "epoch": 0.42, "learning_rate": 2.90516432579861e-05, "loss": 2.3743, "step": 240250 }, { "epoch": 0.42, "learning_rate": 2.9050771318059273e-05, "loss": 2.3056, "step": 240260 }, { "epoch": 0.42, "learning_rate": 2.9049899378132443e-05, "loss": 2.4693, "step": 240270 }, { "epoch": 0.42, "learning_rate": 2.9049027438205617e-05, "loss": 2.2917, "step": 240280 }, { "epoch": 0.42, "learning_rate": 2.904815549827879e-05, "loss": 2.2688, "step": 240290 }, { "epoch": 0.42, "learning_rate": 2.9047283558351968e-05, "loss": 2.4809, "step": 240300 }, { "epoch": 0.42, "learning_rate": 2.904641161842514e-05, "loss": 2.3358, "step": 240310 }, { "epoch": 0.42, "learning_rate": 2.9045539678498312e-05, "loss": 2.4659, "step": 240320 }, { "epoch": 0.42, "learning_rate": 2.9044667738571486e-05, "loss": 2.3836, "step": 240330 }, { "epoch": 0.42, "learning_rate": 2.9043795798644656e-05, "loss": 2.3633, "step": 240340 }, { "epoch": 0.42, "learning_rate": 2.904292385871783e-05, "loss": 2.2431, "step": 240350 }, { "epoch": 0.42, "learning_rate": 2.9042051918791004e-05, "loss": 2.3358, "step": 240360 }, { "epoch": 0.42, "learning_rate": 2.904117997886418e-05, "loss": 2.3386, "step": 240370 }, { "epoch": 0.42, "learning_rate": 2.904030803893735e-05, "loss": 2.3953, "step": 240380 }, { "epoch": 0.42, "learning_rate": 2.9039436099010525e-05, "loss": 2.3352, "step": 240390 }, { "epoch": 0.42, "learning_rate": 2.90385641590837e-05, "loss": 2.4012, "step": 240400 }, { "epoch": 0.42, "learning_rate": 2.903769221915687e-05, "loss": 2.3989, "step": 240410 }, { "epoch": 0.42, "learning_rate": 2.9036820279230043e-05, "loss": 2.3692, "step": 240420 }, { "epoch": 0.42, "learning_rate": 2.9035948339303213e-05, "loss": 2.3177, "step": 240430 }, { "epoch": 0.42, "learning_rate": 2.9035076399376387e-05, "loss": 2.3806, "step": 240440 }, { "epoch": 0.42, "learning_rate": 2.9034204459449564e-05, "loss": 2.4321, "step": 240450 }, { "epoch": 0.42, "learning_rate": 2.9033332519522738e-05, "loss": 2.3518, "step": 240460 }, { "epoch": 0.42, "learning_rate": 2.9032460579595912e-05, "loss": 2.4407, "step": 240470 }, { "epoch": 0.42, "learning_rate": 2.9031588639669082e-05, "loss": 2.3587, "step": 240480 }, { "epoch": 0.42, "learning_rate": 2.9030716699742256e-05, "loss": 2.4474, "step": 240490 }, { "epoch": 0.42, "learning_rate": 2.9029844759815426e-05, "loss": 2.4228, "step": 240500 }, { "epoch": 0.42, "learning_rate": 2.90289728198886e-05, "loss": 2.3481, "step": 240510 }, { "epoch": 0.42, "learning_rate": 2.9028100879961777e-05, "loss": 2.3818, "step": 240520 }, { "epoch": 0.42, "learning_rate": 2.902722894003495e-05, "loss": 2.2582, "step": 240530 }, { "epoch": 0.42, "learning_rate": 2.902635700010812e-05, "loss": 2.4116, "step": 240540 }, { "epoch": 0.42, "learning_rate": 2.9025485060181295e-05, "loss": 2.4131, "step": 240550 }, { "epoch": 0.42, "learning_rate": 2.902461312025447e-05, "loss": 2.4273, "step": 240560 }, { "epoch": 0.42, "learning_rate": 2.902374118032764e-05, "loss": 2.418, "step": 240570 }, { "epoch": 0.42, "learning_rate": 2.9022869240400813e-05, "loss": 2.3828, "step": 240580 }, { "epoch": 0.42, "learning_rate": 2.9021997300473987e-05, "loss": 2.3458, "step": 240590 }, { "epoch": 0.42, "learning_rate": 2.9021125360547164e-05, "loss": 2.366, "step": 240600 }, { "epoch": 0.42, "learning_rate": 2.9020253420620335e-05, "loss": 2.4555, "step": 240610 }, { "epoch": 0.42, "learning_rate": 2.901938148069351e-05, "loss": 2.4137, "step": 240620 }, { "epoch": 0.42, "learning_rate": 2.9018509540766682e-05, "loss": 2.1648, "step": 240630 }, { "epoch": 0.42, "learning_rate": 2.9017637600839852e-05, "loss": 2.2962, "step": 240640 }, { "epoch": 0.42, "learning_rate": 2.9016765660913026e-05, "loss": 2.4545, "step": 240650 }, { "epoch": 0.42, "learning_rate": 2.9015893720986197e-05, "loss": 2.5402, "step": 240660 }, { "epoch": 0.42, "learning_rate": 2.9015021781059377e-05, "loss": 2.4916, "step": 240670 }, { "epoch": 0.42, "learning_rate": 2.9014149841132548e-05, "loss": 2.2588, "step": 240680 }, { "epoch": 0.42, "learning_rate": 2.901327790120572e-05, "loss": 2.4678, "step": 240690 }, { "epoch": 0.42, "learning_rate": 2.9012405961278895e-05, "loss": 2.3103, "step": 240700 }, { "epoch": 0.42, "learning_rate": 2.9011534021352065e-05, "loss": 2.3152, "step": 240710 }, { "epoch": 0.42, "learning_rate": 2.901066208142524e-05, "loss": 2.4707, "step": 240720 }, { "epoch": 0.42, "learning_rate": 2.900979014149841e-05, "loss": 2.3653, "step": 240730 }, { "epoch": 0.42, "learning_rate": 2.9008918201571583e-05, "loss": 2.4509, "step": 240740 }, { "epoch": 0.42, "learning_rate": 2.900804626164476e-05, "loss": 2.4814, "step": 240750 }, { "epoch": 0.42, "learning_rate": 2.9007174321717934e-05, "loss": 2.4015, "step": 240760 }, { "epoch": 0.42, "learning_rate": 2.9006302381791105e-05, "loss": 2.3491, "step": 240770 }, { "epoch": 0.42, "learning_rate": 2.900543044186428e-05, "loss": 2.3451, "step": 240780 }, { "epoch": 0.42, "learning_rate": 2.9004558501937452e-05, "loss": 2.4359, "step": 240790 }, { "epoch": 0.42, "learning_rate": 2.9003686562010623e-05, "loss": 2.3662, "step": 240800 }, { "epoch": 0.42, "learning_rate": 2.9002814622083796e-05, "loss": 2.3246, "step": 240810 }, { "epoch": 0.42, "learning_rate": 2.9001942682156974e-05, "loss": 2.4025, "step": 240820 }, { "epoch": 0.42, "learning_rate": 2.9001070742230147e-05, "loss": 2.4356, "step": 240830 }, { "epoch": 0.42, "learning_rate": 2.9000198802303318e-05, "loss": 2.4912, "step": 240840 }, { "epoch": 0.42, "learning_rate": 2.899932686237649e-05, "loss": 2.4188, "step": 240850 }, { "epoch": 0.42, "learning_rate": 2.8998454922449665e-05, "loss": 2.3095, "step": 240860 }, { "epoch": 0.42, "learning_rate": 2.8997582982522836e-05, "loss": 2.5075, "step": 240870 }, { "epoch": 0.42, "learning_rate": 2.899671104259601e-05, "loss": 2.4123, "step": 240880 }, { "epoch": 0.42, "learning_rate": 2.899583910266918e-05, "loss": 2.431, "step": 240890 }, { "epoch": 0.42, "learning_rate": 2.899496716274236e-05, "loss": 2.4141, "step": 240900 }, { "epoch": 0.42, "learning_rate": 2.899409522281553e-05, "loss": 2.3895, "step": 240910 }, { "epoch": 0.42, "learning_rate": 2.8993223282888704e-05, "loss": 2.5775, "step": 240920 }, { "epoch": 0.42, "learning_rate": 2.8992351342961875e-05, "loss": 2.3259, "step": 240930 }, { "epoch": 0.42, "learning_rate": 2.899147940303505e-05, "loss": 2.2832, "step": 240940 }, { "epoch": 0.42, "learning_rate": 2.8990607463108222e-05, "loss": 2.3756, "step": 240950 }, { "epoch": 0.42, "learning_rate": 2.8989735523181393e-05, "loss": 2.3944, "step": 240960 }, { "epoch": 0.42, "learning_rate": 2.8988863583254573e-05, "loss": 2.4668, "step": 240970 }, { "epoch": 0.42, "learning_rate": 2.8987991643327744e-05, "loss": 2.4354, "step": 240980 }, { "epoch": 0.42, "learning_rate": 2.8987119703400917e-05, "loss": 2.355, "step": 240990 }, { "epoch": 0.42, "learning_rate": 2.8986247763474088e-05, "loss": 2.2255, "step": 241000 }, { "epoch": 0.42, "learning_rate": 2.898537582354726e-05, "loss": 2.382, "step": 241010 }, { "epoch": 0.42, "learning_rate": 2.8984503883620435e-05, "loss": 2.396, "step": 241020 }, { "epoch": 0.42, "learning_rate": 2.8983631943693606e-05, "loss": 2.4144, "step": 241030 }, { "epoch": 0.42, "learning_rate": 2.8982760003766783e-05, "loss": 2.3581, "step": 241040 }, { "epoch": 0.42, "learning_rate": 2.8981888063839957e-05, "loss": 2.4143, "step": 241050 }, { "epoch": 0.42, "learning_rate": 2.898101612391313e-05, "loss": 2.3001, "step": 241060 }, { "epoch": 0.42, "learning_rate": 2.89801441839863e-05, "loss": 2.4422, "step": 241070 }, { "epoch": 0.42, "learning_rate": 2.8979272244059475e-05, "loss": 2.4038, "step": 241080 }, { "epoch": 0.42, "learning_rate": 2.897840030413265e-05, "loss": 2.4836, "step": 241090 }, { "epoch": 0.42, "learning_rate": 2.897752836420582e-05, "loss": 2.392, "step": 241100 }, { "epoch": 0.42, "learning_rate": 2.8976656424278993e-05, "loss": 2.311, "step": 241110 }, { "epoch": 0.42, "learning_rate": 2.897578448435217e-05, "loss": 2.4834, "step": 241120 }, { "epoch": 0.42, "learning_rate": 2.8974912544425343e-05, "loss": 2.4569, "step": 241130 }, { "epoch": 0.42, "learning_rate": 2.8974040604498514e-05, "loss": 2.3939, "step": 241140 }, { "epoch": 0.42, "learning_rate": 2.8973168664571688e-05, "loss": 2.3777, "step": 241150 }, { "epoch": 0.42, "learning_rate": 2.8972296724644858e-05, "loss": 2.4384, "step": 241160 }, { "epoch": 0.42, "learning_rate": 2.8971424784718032e-05, "loss": 2.4686, "step": 241170 }, { "epoch": 0.42, "learning_rate": 2.8970552844791206e-05, "loss": 2.3907, "step": 241180 }, { "epoch": 0.42, "learning_rate": 2.8969680904864383e-05, "loss": 2.3792, "step": 241190 }, { "epoch": 0.42, "learning_rate": 2.8968808964937556e-05, "loss": 2.3587, "step": 241200 }, { "epoch": 0.42, "learning_rate": 2.8967937025010727e-05, "loss": 2.3305, "step": 241210 }, { "epoch": 0.42, "learning_rate": 2.89670650850839e-05, "loss": 2.3412, "step": 241220 }, { "epoch": 0.42, "learning_rate": 2.896619314515707e-05, "loss": 2.4129, "step": 241230 }, { "epoch": 0.42, "learning_rate": 2.8965321205230245e-05, "loss": 2.5495, "step": 241240 }, { "epoch": 0.42, "learning_rate": 2.896444926530342e-05, "loss": 2.2836, "step": 241250 }, { "epoch": 0.42, "learning_rate": 2.896357732537659e-05, "loss": 2.3903, "step": 241260 }, { "epoch": 0.42, "learning_rate": 2.8962705385449766e-05, "loss": 2.3419, "step": 241270 }, { "epoch": 0.42, "learning_rate": 2.896183344552294e-05, "loss": 2.3215, "step": 241280 }, { "epoch": 0.42, "learning_rate": 2.8960961505596114e-05, "loss": 2.3772, "step": 241290 }, { "epoch": 0.42, "learning_rate": 2.8960089565669284e-05, "loss": 2.4587, "step": 241300 }, { "epoch": 0.42, "learning_rate": 2.8959217625742458e-05, "loss": 2.4961, "step": 241310 }, { "epoch": 0.42, "learning_rate": 2.895834568581563e-05, "loss": 2.4115, "step": 241320 }, { "epoch": 0.42, "learning_rate": 2.8957473745888802e-05, "loss": 2.3678, "step": 241330 }, { "epoch": 0.42, "learning_rate": 2.895660180596198e-05, "loss": 2.4734, "step": 241340 }, { "epoch": 0.42, "learning_rate": 2.8955729866035153e-05, "loss": 2.3316, "step": 241350 }, { "epoch": 0.42, "learning_rate": 2.8954857926108327e-05, "loss": 2.4115, "step": 241360 }, { "epoch": 0.42, "learning_rate": 2.8953985986181497e-05, "loss": 2.3587, "step": 241370 }, { "epoch": 0.42, "learning_rate": 2.895311404625467e-05, "loss": 2.452, "step": 241380 }, { "epoch": 0.42, "learning_rate": 2.895224210632784e-05, "loss": 2.4767, "step": 241390 }, { "epoch": 0.42, "learning_rate": 2.8951370166401015e-05, "loss": 2.4583, "step": 241400 }, { "epoch": 0.42, "learning_rate": 2.895049822647419e-05, "loss": 2.4032, "step": 241410 }, { "epoch": 0.42, "learning_rate": 2.8949626286547366e-05, "loss": 2.4183, "step": 241420 }, { "epoch": 0.42, "learning_rate": 2.894875434662054e-05, "loss": 2.4216, "step": 241430 }, { "epoch": 0.42, "learning_rate": 2.894788240669371e-05, "loss": 2.4068, "step": 241440 }, { "epoch": 0.42, "learning_rate": 2.8947010466766884e-05, "loss": 2.3032, "step": 241450 }, { "epoch": 0.42, "learning_rate": 2.8946138526840054e-05, "loss": 2.3408, "step": 241460 }, { "epoch": 0.42, "learning_rate": 2.8945266586913228e-05, "loss": 2.3889, "step": 241470 }, { "epoch": 0.42, "learning_rate": 2.8944394646986402e-05, "loss": 2.3249, "step": 241480 }, { "epoch": 0.42, "learning_rate": 2.894352270705958e-05, "loss": 2.4366, "step": 241490 }, { "epoch": 0.42, "learning_rate": 2.894265076713275e-05, "loss": 2.4657, "step": 241500 }, { "epoch": 0.42, "learning_rate": 2.8941778827205923e-05, "loss": 2.1678, "step": 241510 }, { "epoch": 0.42, "learning_rate": 2.8940906887279097e-05, "loss": 2.3895, "step": 241520 }, { "epoch": 0.42, "learning_rate": 2.8940034947352267e-05, "loss": 2.4347, "step": 241530 }, { "epoch": 0.42, "learning_rate": 2.893916300742544e-05, "loss": 2.324, "step": 241540 }, { "epoch": 0.42, "learning_rate": 2.893829106749861e-05, "loss": 2.3881, "step": 241550 }, { "epoch": 0.42, "learning_rate": 2.8937419127571792e-05, "loss": 2.4041, "step": 241560 }, { "epoch": 0.42, "learning_rate": 2.8936547187644962e-05, "loss": 2.3731, "step": 241570 }, { "epoch": 0.42, "learning_rate": 2.8935675247718136e-05, "loss": 2.3649, "step": 241580 }, { "epoch": 0.42, "learning_rate": 2.893480330779131e-05, "loss": 2.3051, "step": 241590 }, { "epoch": 0.42, "learning_rate": 2.893393136786448e-05, "loss": 2.3653, "step": 241600 }, { "epoch": 0.42, "learning_rate": 2.8933059427937654e-05, "loss": 2.4003, "step": 241610 }, { "epoch": 0.42, "learning_rate": 2.8932187488010824e-05, "loss": 2.2698, "step": 241620 }, { "epoch": 0.42, "learning_rate": 2.8931315548083998e-05, "loss": 2.4317, "step": 241630 }, { "epoch": 0.42, "learning_rate": 2.8930443608157175e-05, "loss": 2.3491, "step": 241640 }, { "epoch": 0.42, "learning_rate": 2.892957166823035e-05, "loss": 2.2708, "step": 241650 }, { "epoch": 0.42, "learning_rate": 2.892869972830352e-05, "loss": 2.4342, "step": 241660 }, { "epoch": 0.42, "learning_rate": 2.8927827788376693e-05, "loss": 2.2411, "step": 241670 }, { "epoch": 0.42, "learning_rate": 2.8926955848449867e-05, "loss": 2.2845, "step": 241680 }, { "epoch": 0.42, "learning_rate": 2.8926083908523037e-05, "loss": 2.3812, "step": 241690 }, { "epoch": 0.42, "learning_rate": 2.892521196859621e-05, "loss": 2.3819, "step": 241700 }, { "epoch": 0.42, "learning_rate": 2.8924340028669388e-05, "loss": 2.3931, "step": 241710 }, { "epoch": 0.42, "learning_rate": 2.8923468088742562e-05, "loss": 2.3681, "step": 241720 }, { "epoch": 0.42, "learning_rate": 2.8922596148815732e-05, "loss": 2.3741, "step": 241730 }, { "epoch": 0.42, "learning_rate": 2.8921724208888906e-05, "loss": 2.4586, "step": 241740 }, { "epoch": 0.42, "learning_rate": 2.892085226896208e-05, "loss": 2.473, "step": 241750 }, { "epoch": 0.42, "learning_rate": 2.891998032903525e-05, "loss": 2.4593, "step": 241760 }, { "epoch": 0.42, "learning_rate": 2.8919108389108424e-05, "loss": 2.391, "step": 241770 }, { "epoch": 0.42, "learning_rate": 2.8918236449181594e-05, "loss": 2.3853, "step": 241780 }, { "epoch": 0.42, "learning_rate": 2.8917364509254775e-05, "loss": 2.3438, "step": 241790 }, { "epoch": 0.42, "learning_rate": 2.8916492569327945e-05, "loss": 2.2576, "step": 241800 }, { "epoch": 0.42, "learning_rate": 2.891562062940112e-05, "loss": 2.4046, "step": 241810 }, { "epoch": 0.42, "learning_rate": 2.8914748689474293e-05, "loss": 2.4632, "step": 241820 }, { "epoch": 0.42, "learning_rate": 2.8913876749547463e-05, "loss": 2.5135, "step": 241830 }, { "epoch": 0.42, "learning_rate": 2.8913004809620637e-05, "loss": 2.3869, "step": 241840 }, { "epoch": 0.42, "learning_rate": 2.8912132869693807e-05, "loss": 2.4262, "step": 241850 }, { "epoch": 0.42, "learning_rate": 2.8911260929766988e-05, "loss": 2.323, "step": 241860 }, { "epoch": 0.42, "learning_rate": 2.891038898984016e-05, "loss": 2.3039, "step": 241870 }, { "epoch": 0.42, "learning_rate": 2.8909517049913332e-05, "loss": 2.3628, "step": 241880 }, { "epoch": 0.42, "learning_rate": 2.8908645109986503e-05, "loss": 2.3529, "step": 241890 }, { "epoch": 0.42, "learning_rate": 2.8907773170059676e-05, "loss": 2.3706, "step": 241900 }, { "epoch": 0.42, "learning_rate": 2.890690123013285e-05, "loss": 2.4442, "step": 241910 }, { "epoch": 0.42, "learning_rate": 2.890602929020602e-05, "loss": 2.384, "step": 241920 }, { "epoch": 0.42, "learning_rate": 2.8905157350279194e-05, "loss": 2.3146, "step": 241930 }, { "epoch": 0.42, "learning_rate": 2.890428541035237e-05, "loss": 2.4703, "step": 241940 }, { "epoch": 0.42, "learning_rate": 2.8903413470425545e-05, "loss": 2.3793, "step": 241950 }, { "epoch": 0.42, "learning_rate": 2.8902541530498716e-05, "loss": 2.2795, "step": 241960 }, { "epoch": 0.42, "learning_rate": 2.890166959057189e-05, "loss": 2.454, "step": 241970 }, { "epoch": 0.42, "learning_rate": 2.8900797650645063e-05, "loss": 2.4617, "step": 241980 }, { "epoch": 0.42, "learning_rate": 2.8899925710718233e-05, "loss": 2.3187, "step": 241990 }, { "epoch": 0.42, "learning_rate": 2.8899053770791407e-05, "loss": 2.3894, "step": 242000 }, { "epoch": 0.42, "learning_rate": 2.8898181830864584e-05, "loss": 2.4151, "step": 242010 }, { "epoch": 0.42, "learning_rate": 2.8897309890937758e-05, "loss": 2.3255, "step": 242020 }, { "epoch": 0.42, "learning_rate": 2.889643795101093e-05, "loss": 2.4189, "step": 242030 }, { "epoch": 0.42, "learning_rate": 2.8895566011084102e-05, "loss": 2.46, "step": 242040 }, { "epoch": 0.42, "learning_rate": 2.8894694071157276e-05, "loss": 2.5091, "step": 242050 }, { "epoch": 0.42, "learning_rate": 2.8893822131230446e-05, "loss": 2.2513, "step": 242060 }, { "epoch": 0.42, "learning_rate": 2.889295019130362e-05, "loss": 2.3531, "step": 242070 }, { "epoch": 0.42, "learning_rate": 2.889207825137679e-05, "loss": 2.401, "step": 242080 }, { "epoch": 0.42, "learning_rate": 2.889120631144997e-05, "loss": 2.5523, "step": 242090 }, { "epoch": 0.42, "learning_rate": 2.889033437152314e-05, "loss": 2.3241, "step": 242100 }, { "epoch": 0.42, "learning_rate": 2.8889462431596315e-05, "loss": 2.4944, "step": 242110 }, { "epoch": 0.42, "learning_rate": 2.8888590491669486e-05, "loss": 2.4952, "step": 242120 }, { "epoch": 0.42, "learning_rate": 2.888771855174266e-05, "loss": 2.3205, "step": 242130 }, { "epoch": 0.42, "learning_rate": 2.8886846611815833e-05, "loss": 2.3551, "step": 242140 }, { "epoch": 0.42, "learning_rate": 2.8885974671889004e-05, "loss": 2.338, "step": 242150 }, { "epoch": 0.42, "learning_rate": 2.8885102731962184e-05, "loss": 2.4834, "step": 242160 }, { "epoch": 0.42, "learning_rate": 2.8884230792035355e-05, "loss": 2.3835, "step": 242170 }, { "epoch": 0.42, "learning_rate": 2.888335885210853e-05, "loss": 2.3037, "step": 242180 }, { "epoch": 0.42, "learning_rate": 2.88824869121817e-05, "loss": 2.3879, "step": 242190 }, { "epoch": 0.42, "learning_rate": 2.8881614972254872e-05, "loss": 2.2975, "step": 242200 }, { "epoch": 0.42, "learning_rate": 2.8880743032328046e-05, "loss": 2.263, "step": 242210 }, { "epoch": 0.42, "learning_rate": 2.8879871092401217e-05, "loss": 2.4665, "step": 242220 }, { "epoch": 0.42, "learning_rate": 2.8878999152474394e-05, "loss": 2.3564, "step": 242230 }, { "epoch": 0.42, "learning_rate": 2.8878127212547568e-05, "loss": 2.4907, "step": 242240 }, { "epoch": 0.42, "learning_rate": 2.887725527262074e-05, "loss": 2.4327, "step": 242250 }, { "epoch": 0.42, "learning_rate": 2.8876383332693912e-05, "loss": 2.3898, "step": 242260 }, { "epoch": 0.42, "learning_rate": 2.8875511392767085e-05, "loss": 2.4311, "step": 242270 }, { "epoch": 0.42, "learning_rate": 2.8874639452840256e-05, "loss": 2.3433, "step": 242280 }, { "epoch": 0.42, "learning_rate": 2.887376751291343e-05, "loss": 2.4013, "step": 242290 }, { "epoch": 0.42, "learning_rate": 2.8872895572986603e-05, "loss": 2.3672, "step": 242300 }, { "epoch": 0.42, "learning_rate": 2.887202363305978e-05, "loss": 2.3554, "step": 242310 }, { "epoch": 0.42, "learning_rate": 2.8871151693132954e-05, "loss": 2.3816, "step": 242320 }, { "epoch": 0.42, "learning_rate": 2.8870279753206125e-05, "loss": 2.4294, "step": 242330 }, { "epoch": 0.42, "learning_rate": 2.88694078132793e-05, "loss": 2.2984, "step": 242340 }, { "epoch": 0.42, "learning_rate": 2.886853587335247e-05, "loss": 2.4283, "step": 242350 }, { "epoch": 0.42, "learning_rate": 2.8867663933425643e-05, "loss": 2.4723, "step": 242360 }, { "epoch": 0.42, "learning_rate": 2.8866791993498816e-05, "loss": 2.2865, "step": 242370 }, { "epoch": 0.42, "learning_rate": 2.8865920053571994e-05, "loss": 2.3549, "step": 242380 }, { "epoch": 0.42, "learning_rate": 2.8865048113645164e-05, "loss": 2.4292, "step": 242390 }, { "epoch": 0.42, "learning_rate": 2.8864176173718338e-05, "loss": 2.3625, "step": 242400 }, { "epoch": 0.42, "learning_rate": 2.886330423379151e-05, "loss": 2.4159, "step": 242410 }, { "epoch": 0.42, "learning_rate": 2.8862432293864682e-05, "loss": 2.3699, "step": 242420 }, { "epoch": 0.42, "learning_rate": 2.8861560353937856e-05, "loss": 2.3532, "step": 242430 }, { "epoch": 0.42, "learning_rate": 2.886068841401103e-05, "loss": 2.386, "step": 242440 }, { "epoch": 0.42, "learning_rate": 2.88598164740842e-05, "loss": 2.3499, "step": 242450 }, { "epoch": 0.42, "learning_rate": 2.8858944534157377e-05, "loss": 2.3977, "step": 242460 }, { "epoch": 0.42, "learning_rate": 2.885807259423055e-05, "loss": 2.421, "step": 242470 }, { "epoch": 0.42, "learning_rate": 2.8857200654303724e-05, "loss": 2.4267, "step": 242480 }, { "epoch": 0.42, "learning_rate": 2.8856328714376895e-05, "loss": 2.3816, "step": 242490 }, { "epoch": 0.42, "learning_rate": 2.885545677445007e-05, "loss": 2.3375, "step": 242500 }, { "epoch": 0.42, "learning_rate": 2.885458483452324e-05, "loss": 2.2383, "step": 242510 }, { "epoch": 0.42, "learning_rate": 2.8853712894596413e-05, "loss": 2.2448, "step": 242520 }, { "epoch": 0.42, "learning_rate": 2.885284095466959e-05, "loss": 2.3694, "step": 242530 }, { "epoch": 0.42, "learning_rate": 2.8851969014742764e-05, "loss": 2.4244, "step": 242540 }, { "epoch": 0.42, "learning_rate": 2.8851097074815937e-05, "loss": 2.4918, "step": 242550 }, { "epoch": 0.42, "learning_rate": 2.8850225134889108e-05, "loss": 2.5298, "step": 242560 }, { "epoch": 0.42, "learning_rate": 2.884935319496228e-05, "loss": 2.384, "step": 242570 }, { "epoch": 0.42, "learning_rate": 2.8848481255035452e-05, "loss": 2.447, "step": 242580 }, { "epoch": 0.42, "learning_rate": 2.8847609315108626e-05, "loss": 2.3172, "step": 242590 }, { "epoch": 0.42, "learning_rate": 2.88467373751818e-05, "loss": 2.2151, "step": 242600 }, { "epoch": 0.42, "learning_rate": 2.8845865435254977e-05, "loss": 2.3292, "step": 242610 }, { "epoch": 0.42, "learning_rate": 2.8844993495328147e-05, "loss": 2.3937, "step": 242620 }, { "epoch": 0.42, "learning_rate": 2.884412155540132e-05, "loss": 2.2716, "step": 242630 }, { "epoch": 0.42, "learning_rate": 2.8843249615474495e-05, "loss": 2.4902, "step": 242640 }, { "epoch": 0.42, "learning_rate": 2.8842377675547665e-05, "loss": 2.3741, "step": 242650 }, { "epoch": 0.42, "learning_rate": 2.884150573562084e-05, "loss": 2.4248, "step": 242660 }, { "epoch": 0.42, "learning_rate": 2.8840633795694013e-05, "loss": 2.3473, "step": 242670 }, { "epoch": 0.42, "learning_rate": 2.883976185576719e-05, "loss": 2.3329, "step": 242680 }, { "epoch": 0.42, "learning_rate": 2.883888991584036e-05, "loss": 2.2839, "step": 242690 }, { "epoch": 0.42, "learning_rate": 2.8838017975913534e-05, "loss": 2.3774, "step": 242700 }, { "epoch": 0.42, "learning_rate": 2.8837146035986708e-05, "loss": 2.2626, "step": 242710 }, { "epoch": 0.42, "learning_rate": 2.8836274096059878e-05, "loss": 2.2615, "step": 242720 }, { "epoch": 0.42, "learning_rate": 2.8835402156133052e-05, "loss": 2.3267, "step": 242730 }, { "epoch": 0.42, "learning_rate": 2.8834530216206222e-05, "loss": 2.4299, "step": 242740 }, { "epoch": 0.42, "learning_rate": 2.8833658276279396e-05, "loss": 2.3517, "step": 242750 }, { "epoch": 0.42, "learning_rate": 2.8832786336352573e-05, "loss": 2.2856, "step": 242760 }, { "epoch": 0.42, "learning_rate": 2.8831914396425747e-05, "loss": 2.3651, "step": 242770 }, { "epoch": 0.42, "learning_rate": 2.883104245649892e-05, "loss": 2.4572, "step": 242780 }, { "epoch": 0.42, "learning_rate": 2.883017051657209e-05, "loss": 2.339, "step": 242790 }, { "epoch": 0.42, "learning_rate": 2.8829298576645265e-05, "loss": 2.4179, "step": 242800 }, { "epoch": 0.42, "learning_rate": 2.8828426636718435e-05, "loss": 2.3583, "step": 242810 }, { "epoch": 0.42, "learning_rate": 2.882755469679161e-05, "loss": 2.3792, "step": 242820 }, { "epoch": 0.42, "learning_rate": 2.8826682756864786e-05, "loss": 2.4316, "step": 242830 }, { "epoch": 0.42, "learning_rate": 2.882581081693796e-05, "loss": 2.4264, "step": 242840 }, { "epoch": 0.42, "learning_rate": 2.882493887701113e-05, "loss": 2.3819, "step": 242850 }, { "epoch": 0.42, "learning_rate": 2.8824066937084304e-05, "loss": 2.4002, "step": 242860 }, { "epoch": 0.42, "learning_rate": 2.8823194997157478e-05, "loss": 2.4763, "step": 242870 }, { "epoch": 0.42, "learning_rate": 2.8822323057230648e-05, "loss": 2.408, "step": 242880 }, { "epoch": 0.42, "learning_rate": 2.8821451117303822e-05, "loss": 2.3874, "step": 242890 }, { "epoch": 0.42, "learning_rate": 2.8820579177377e-05, "loss": 2.262, "step": 242900 }, { "epoch": 0.42, "learning_rate": 2.8819707237450173e-05, "loss": 2.3515, "step": 242910 }, { "epoch": 0.42, "learning_rate": 2.8818835297523343e-05, "loss": 2.5326, "step": 242920 }, { "epoch": 0.42, "learning_rate": 2.8817963357596517e-05, "loss": 2.5119, "step": 242930 }, { "epoch": 0.42, "learning_rate": 2.881709141766969e-05, "loss": 2.4481, "step": 242940 }, { "epoch": 0.42, "learning_rate": 2.881621947774286e-05, "loss": 2.4358, "step": 242950 }, { "epoch": 0.42, "learning_rate": 2.8815347537816035e-05, "loss": 2.339, "step": 242960 }, { "epoch": 0.42, "learning_rate": 2.8814475597889205e-05, "loss": 2.2429, "step": 242970 }, { "epoch": 0.42, "learning_rate": 2.8813603657962386e-05, "loss": 2.4893, "step": 242980 }, { "epoch": 0.42, "learning_rate": 2.8812731718035556e-05, "loss": 2.3094, "step": 242990 }, { "epoch": 0.42, "learning_rate": 2.881185977810873e-05, "loss": 2.2788, "step": 243000 }, { "epoch": 0.42, "learning_rate": 2.88109878381819e-05, "loss": 2.3976, "step": 243010 }, { "epoch": 0.42, "learning_rate": 2.8810115898255074e-05, "loss": 2.2593, "step": 243020 }, { "epoch": 0.42, "learning_rate": 2.8809243958328248e-05, "loss": 2.3883, "step": 243030 }, { "epoch": 0.42, "learning_rate": 2.880837201840142e-05, "loss": 2.391, "step": 243040 }, { "epoch": 0.42, "learning_rate": 2.88075000784746e-05, "loss": 2.4815, "step": 243050 }, { "epoch": 0.42, "learning_rate": 2.880662813854777e-05, "loss": 2.5227, "step": 243060 }, { "epoch": 0.42, "learning_rate": 2.8805756198620943e-05, "loss": 2.4929, "step": 243070 }, { "epoch": 0.42, "learning_rate": 2.8804884258694113e-05, "loss": 2.3404, "step": 243080 }, { "epoch": 0.42, "learning_rate": 2.8804012318767287e-05, "loss": 2.3832, "step": 243090 }, { "epoch": 0.42, "learning_rate": 2.880314037884046e-05, "loss": 2.3447, "step": 243100 }, { "epoch": 0.42, "learning_rate": 2.880226843891363e-05, "loss": 2.3747, "step": 243110 }, { "epoch": 0.42, "learning_rate": 2.8801396498986805e-05, "loss": 2.4929, "step": 243120 }, { "epoch": 0.42, "learning_rate": 2.8800524559059982e-05, "loss": 2.417, "step": 243130 }, { "epoch": 0.42, "learning_rate": 2.8799652619133156e-05, "loss": 2.4128, "step": 243140 }, { "epoch": 0.42, "learning_rate": 2.8798780679206326e-05, "loss": 2.2712, "step": 243150 }, { "epoch": 0.42, "learning_rate": 2.87979087392795e-05, "loss": 2.2602, "step": 243160 }, { "epoch": 0.42, "learning_rate": 2.8797036799352674e-05, "loss": 2.2729, "step": 243170 }, { "epoch": 0.42, "learning_rate": 2.8796164859425844e-05, "loss": 2.4664, "step": 243180 }, { "epoch": 0.42, "learning_rate": 2.8795292919499018e-05, "loss": 2.3744, "step": 243190 }, { "epoch": 0.42, "learning_rate": 2.8794420979572195e-05, "loss": 2.352, "step": 243200 }, { "epoch": 0.42, "learning_rate": 2.879354903964537e-05, "loss": 2.372, "step": 243210 }, { "epoch": 0.42, "learning_rate": 2.879267709971854e-05, "loss": 2.3551, "step": 243220 }, { "epoch": 0.42, "learning_rate": 2.8791805159791713e-05, "loss": 2.3261, "step": 243230 }, { "epoch": 0.42, "learning_rate": 2.8790933219864884e-05, "loss": 2.4232, "step": 243240 }, { "epoch": 0.42, "learning_rate": 2.8790061279938057e-05, "loss": 2.3877, "step": 243250 }, { "epoch": 0.42, "learning_rate": 2.878918934001123e-05, "loss": 2.3462, "step": 243260 }, { "epoch": 0.42, "learning_rate": 2.87883174000844e-05, "loss": 2.3924, "step": 243270 }, { "epoch": 0.42, "learning_rate": 2.8787445460157582e-05, "loss": 2.3917, "step": 243280 }, { "epoch": 0.42, "learning_rate": 2.8786573520230752e-05, "loss": 2.5033, "step": 243290 }, { "epoch": 0.42, "learning_rate": 2.8785701580303926e-05, "loss": 2.4202, "step": 243300 }, { "epoch": 0.42, "learning_rate": 2.8784829640377097e-05, "loss": 2.3099, "step": 243310 }, { "epoch": 0.42, "learning_rate": 2.878395770045027e-05, "loss": 2.3687, "step": 243320 }, { "epoch": 0.42, "learning_rate": 2.8783085760523444e-05, "loss": 2.3328, "step": 243330 }, { "epoch": 0.42, "learning_rate": 2.8782213820596614e-05, "loss": 2.3834, "step": 243340 }, { "epoch": 0.42, "learning_rate": 2.878134188066979e-05, "loss": 2.2959, "step": 243350 }, { "epoch": 0.42, "learning_rate": 2.8780469940742965e-05, "loss": 2.4275, "step": 243360 }, { "epoch": 0.42, "learning_rate": 2.877959800081614e-05, "loss": 2.3651, "step": 243370 }, { "epoch": 0.42, "learning_rate": 2.877872606088931e-05, "loss": 2.361, "step": 243380 }, { "epoch": 0.42, "learning_rate": 2.8777854120962483e-05, "loss": 2.387, "step": 243390 }, { "epoch": 0.42, "learning_rate": 2.8776982181035657e-05, "loss": 2.3448, "step": 243400 }, { "epoch": 0.42, "learning_rate": 2.8776110241108827e-05, "loss": 2.3447, "step": 243410 }, { "epoch": 0.42, "learning_rate": 2.8775238301182e-05, "loss": 2.404, "step": 243420 }, { "epoch": 0.42, "learning_rate": 2.877436636125518e-05, "loss": 2.3214, "step": 243430 }, { "epoch": 0.42, "learning_rate": 2.8773494421328352e-05, "loss": 2.397, "step": 243440 }, { "epoch": 0.42, "learning_rate": 2.8772622481401523e-05, "loss": 2.3086, "step": 243450 }, { "epoch": 0.42, "learning_rate": 2.8771750541474696e-05, "loss": 2.3473, "step": 243460 }, { "epoch": 0.42, "learning_rate": 2.8770878601547867e-05, "loss": 2.2899, "step": 243470 }, { "epoch": 0.42, "learning_rate": 2.877000666162104e-05, "loss": 2.3985, "step": 243480 }, { "epoch": 0.42, "learning_rate": 2.8769134721694214e-05, "loss": 2.4717, "step": 243490 }, { "epoch": 0.42, "learning_rate": 2.876826278176739e-05, "loss": 2.5098, "step": 243500 }, { "epoch": 0.42, "learning_rate": 2.8767390841840565e-05, "loss": 2.4205, "step": 243510 }, { "epoch": 0.42, "learning_rate": 2.8766518901913736e-05, "loss": 2.33, "step": 243520 }, { "epoch": 0.42, "learning_rate": 2.876564696198691e-05, "loss": 2.302, "step": 243530 }, { "epoch": 0.42, "learning_rate": 2.876477502206008e-05, "loss": 2.3307, "step": 243540 }, { "epoch": 0.42, "learning_rate": 2.8763903082133253e-05, "loss": 2.3921, "step": 243550 }, { "epoch": 0.42, "learning_rate": 2.8763031142206427e-05, "loss": 2.385, "step": 243560 }, { "epoch": 0.42, "learning_rate": 2.8762159202279604e-05, "loss": 2.422, "step": 243570 }, { "epoch": 0.42, "learning_rate": 2.8761287262352775e-05, "loss": 2.272, "step": 243580 }, { "epoch": 0.42, "learning_rate": 2.876041532242595e-05, "loss": 2.3894, "step": 243590 }, { "epoch": 0.42, "learning_rate": 2.8759543382499122e-05, "loss": 2.3781, "step": 243600 }, { "epoch": 0.42, "learning_rate": 2.8758671442572293e-05, "loss": 2.486, "step": 243610 }, { "epoch": 0.42, "learning_rate": 2.8757799502645466e-05, "loss": 2.377, "step": 243620 }, { "epoch": 0.42, "learning_rate": 2.8756927562718637e-05, "loss": 2.3293, "step": 243630 }, { "epoch": 0.42, "learning_rate": 2.875605562279181e-05, "loss": 2.4007, "step": 243640 }, { "epoch": 0.42, "learning_rate": 2.8755183682864988e-05, "loss": 2.2327, "step": 243650 }, { "epoch": 0.42, "learning_rate": 2.875431174293816e-05, "loss": 2.4741, "step": 243660 }, { "epoch": 0.42, "learning_rate": 2.8753439803011335e-05, "loss": 2.4451, "step": 243670 }, { "epoch": 0.42, "learning_rate": 2.8752567863084506e-05, "loss": 2.3866, "step": 243680 }, { "epoch": 0.42, "learning_rate": 2.875169592315768e-05, "loss": 2.4598, "step": 243690 }, { "epoch": 0.42, "learning_rate": 2.875082398323085e-05, "loss": 2.4917, "step": 243700 }, { "epoch": 0.43, "learning_rate": 2.8749952043304024e-05, "loss": 2.2569, "step": 243710 }, { "epoch": 0.43, "learning_rate": 2.87490801033772e-05, "loss": 2.355, "step": 243720 }, { "epoch": 0.43, "learning_rate": 2.8748208163450375e-05, "loss": 2.3995, "step": 243730 }, { "epoch": 0.43, "learning_rate": 2.8747336223523545e-05, "loss": 2.4082, "step": 243740 }, { "epoch": 0.43, "learning_rate": 2.874646428359672e-05, "loss": 2.3837, "step": 243750 }, { "epoch": 0.43, "learning_rate": 2.8745592343669892e-05, "loss": 2.2877, "step": 243760 }, { "epoch": 0.43, "learning_rate": 2.8744720403743063e-05, "loss": 2.4297, "step": 243770 }, { "epoch": 0.43, "learning_rate": 2.8743848463816237e-05, "loss": 2.3633, "step": 243780 }, { "epoch": 0.43, "learning_rate": 2.874297652388941e-05, "loss": 2.3723, "step": 243790 }, { "epoch": 0.43, "learning_rate": 2.8742104583962588e-05, "loss": 2.4662, "step": 243800 }, { "epoch": 0.43, "learning_rate": 2.8741232644035758e-05, "loss": 2.3443, "step": 243810 }, { "epoch": 0.43, "learning_rate": 2.8740360704108932e-05, "loss": 2.3372, "step": 243820 }, { "epoch": 0.43, "learning_rate": 2.8739488764182105e-05, "loss": 2.4123, "step": 243830 }, { "epoch": 0.43, "learning_rate": 2.8738616824255276e-05, "loss": 2.5435, "step": 243840 }, { "epoch": 0.43, "learning_rate": 2.873774488432845e-05, "loss": 2.428, "step": 243850 }, { "epoch": 0.43, "learning_rate": 2.873687294440162e-05, "loss": 2.5078, "step": 243860 }, { "epoch": 0.43, "learning_rate": 2.87360010044748e-05, "loss": 2.3218, "step": 243870 }, { "epoch": 0.43, "learning_rate": 2.873512906454797e-05, "loss": 2.4922, "step": 243880 }, { "epoch": 0.43, "learning_rate": 2.8734257124621145e-05, "loss": 2.2812, "step": 243890 }, { "epoch": 0.43, "learning_rate": 2.873338518469432e-05, "loss": 2.3141, "step": 243900 }, { "epoch": 0.43, "learning_rate": 2.873251324476749e-05, "loss": 2.3125, "step": 243910 }, { "epoch": 0.43, "learning_rate": 2.8731641304840663e-05, "loss": 2.389, "step": 243920 }, { "epoch": 0.43, "learning_rate": 2.8730769364913833e-05, "loss": 2.4683, "step": 243930 }, { "epoch": 0.43, "learning_rate": 2.8729897424987007e-05, "loss": 2.3818, "step": 243940 }, { "epoch": 0.43, "learning_rate": 2.8729025485060184e-05, "loss": 2.3475, "step": 243950 }, { "epoch": 0.43, "learning_rate": 2.8728153545133358e-05, "loss": 2.4741, "step": 243960 }, { "epoch": 0.43, "learning_rate": 2.8727281605206528e-05, "loss": 2.4408, "step": 243970 }, { "epoch": 0.43, "learning_rate": 2.8726409665279702e-05, "loss": 2.5526, "step": 243980 }, { "epoch": 0.43, "learning_rate": 2.8725537725352876e-05, "loss": 2.4844, "step": 243990 }, { "epoch": 0.43, "learning_rate": 2.8724665785426046e-05, "loss": 2.3131, "step": 244000 }, { "epoch": 0.43, "learning_rate": 2.872379384549922e-05, "loss": 2.3365, "step": 244010 }, { "epoch": 0.43, "learning_rate": 2.8722921905572397e-05, "loss": 2.3863, "step": 244020 }, { "epoch": 0.43, "learning_rate": 2.872204996564557e-05, "loss": 2.3975, "step": 244030 }, { "epoch": 0.43, "learning_rate": 2.872117802571874e-05, "loss": 2.4345, "step": 244040 }, { "epoch": 0.43, "learning_rate": 2.8720306085791915e-05, "loss": 2.3679, "step": 244050 }, { "epoch": 0.43, "learning_rate": 2.871943414586509e-05, "loss": 2.3484, "step": 244060 }, { "epoch": 0.43, "learning_rate": 2.871856220593826e-05, "loss": 2.3087, "step": 244070 }, { "epoch": 0.43, "learning_rate": 2.8717690266011433e-05, "loss": 2.2959, "step": 244080 }, { "epoch": 0.43, "learning_rate": 2.871681832608461e-05, "loss": 2.5016, "step": 244090 }, { "epoch": 0.43, "learning_rate": 2.8715946386157784e-05, "loss": 2.446, "step": 244100 }, { "epoch": 0.43, "learning_rate": 2.8715074446230954e-05, "loss": 2.3425, "step": 244110 }, { "epoch": 0.43, "learning_rate": 2.8714202506304128e-05, "loss": 2.3637, "step": 244120 }, { "epoch": 0.43, "learning_rate": 2.87133305663773e-05, "loss": 2.3208, "step": 244130 }, { "epoch": 0.43, "learning_rate": 2.8712458626450472e-05, "loss": 2.2981, "step": 244140 }, { "epoch": 0.43, "learning_rate": 2.8711586686523646e-05, "loss": 2.4238, "step": 244150 }, { "epoch": 0.43, "learning_rate": 2.8710714746596816e-05, "loss": 2.3327, "step": 244160 }, { "epoch": 0.43, "learning_rate": 2.8709842806669997e-05, "loss": 2.4794, "step": 244170 }, { "epoch": 0.43, "learning_rate": 2.8708970866743167e-05, "loss": 2.35, "step": 244180 }, { "epoch": 0.43, "learning_rate": 2.870809892681634e-05, "loss": 2.3804, "step": 244190 }, { "epoch": 0.43, "learning_rate": 2.870722698688951e-05, "loss": 2.4817, "step": 244200 }, { "epoch": 0.43, "learning_rate": 2.8706355046962685e-05, "loss": 2.4568, "step": 244210 }, { "epoch": 0.43, "learning_rate": 2.870548310703586e-05, "loss": 2.3968, "step": 244220 }, { "epoch": 0.43, "learning_rate": 2.870461116710903e-05, "loss": 2.4747, "step": 244230 }, { "epoch": 0.43, "learning_rate": 2.870373922718221e-05, "loss": 2.4147, "step": 244240 }, { "epoch": 0.43, "learning_rate": 2.870286728725538e-05, "loss": 2.3786, "step": 244250 }, { "epoch": 0.43, "learning_rate": 2.8701995347328554e-05, "loss": 2.4033, "step": 244260 }, { "epoch": 0.43, "learning_rate": 2.8701123407401724e-05, "loss": 2.35, "step": 244270 }, { "epoch": 0.43, "learning_rate": 2.8700251467474898e-05, "loss": 2.4449, "step": 244280 }, { "epoch": 0.43, "learning_rate": 2.8699379527548072e-05, "loss": 2.3394, "step": 244290 }, { "epoch": 0.43, "learning_rate": 2.8698507587621242e-05, "loss": 2.4428, "step": 244300 }, { "epoch": 0.43, "learning_rate": 2.8697635647694416e-05, "loss": 2.3809, "step": 244310 }, { "epoch": 0.43, "learning_rate": 2.8696763707767593e-05, "loss": 2.303, "step": 244320 }, { "epoch": 0.43, "learning_rate": 2.8695891767840767e-05, "loss": 2.3261, "step": 244330 }, { "epoch": 0.43, "learning_rate": 2.8695019827913937e-05, "loss": 2.3751, "step": 244340 }, { "epoch": 0.43, "learning_rate": 2.869414788798711e-05, "loss": 2.344, "step": 244350 }, { "epoch": 0.43, "learning_rate": 2.869327594806028e-05, "loss": 2.2781, "step": 244360 }, { "epoch": 0.43, "learning_rate": 2.8692404008133455e-05, "loss": 2.1759, "step": 244370 }, { "epoch": 0.43, "learning_rate": 2.869153206820663e-05, "loss": 2.2733, "step": 244380 }, { "epoch": 0.43, "learning_rate": 2.8690660128279806e-05, "loss": 2.3764, "step": 244390 }, { "epoch": 0.43, "learning_rate": 2.868978818835298e-05, "loss": 2.3409, "step": 244400 }, { "epoch": 0.43, "learning_rate": 2.868891624842615e-05, "loss": 2.5366, "step": 244410 }, { "epoch": 0.43, "learning_rate": 2.8688044308499324e-05, "loss": 2.4427, "step": 244420 }, { "epoch": 0.43, "learning_rate": 2.8687172368572494e-05, "loss": 2.422, "step": 244430 }, { "epoch": 0.43, "learning_rate": 2.8686300428645668e-05, "loss": 2.4382, "step": 244440 }, { "epoch": 0.43, "learning_rate": 2.8685428488718842e-05, "loss": 2.4329, "step": 244450 }, { "epoch": 0.43, "learning_rate": 2.8684556548792012e-05, "loss": 2.3787, "step": 244460 }, { "epoch": 0.43, "learning_rate": 2.868368460886519e-05, "loss": 2.4584, "step": 244470 }, { "epoch": 0.43, "learning_rate": 2.8682812668938363e-05, "loss": 2.343, "step": 244480 }, { "epoch": 0.43, "learning_rate": 2.8681940729011537e-05, "loss": 2.3098, "step": 244490 }, { "epoch": 0.43, "learning_rate": 2.8681068789084707e-05, "loss": 2.4451, "step": 244500 }, { "epoch": 0.43, "learning_rate": 2.868019684915788e-05, "loss": 2.4524, "step": 244510 }, { "epoch": 0.43, "learning_rate": 2.8679324909231055e-05, "loss": 2.2532, "step": 244520 }, { "epoch": 0.43, "learning_rate": 2.8678452969304225e-05, "loss": 2.3947, "step": 244530 }, { "epoch": 0.43, "learning_rate": 2.8677581029377403e-05, "loss": 2.3974, "step": 244540 }, { "epoch": 0.43, "learning_rate": 2.8676709089450576e-05, "loss": 2.2899, "step": 244550 }, { "epoch": 0.43, "learning_rate": 2.867583714952375e-05, "loss": 2.3319, "step": 244560 }, { "epoch": 0.43, "learning_rate": 2.867496520959692e-05, "loss": 2.3784, "step": 244570 }, { "epoch": 0.43, "learning_rate": 2.8674093269670094e-05, "loss": 2.3137, "step": 244580 }, { "epoch": 0.43, "learning_rate": 2.8673221329743265e-05, "loss": 2.3874, "step": 244590 }, { "epoch": 0.43, "learning_rate": 2.867234938981644e-05, "loss": 2.514, "step": 244600 }, { "epoch": 0.43, "learning_rate": 2.8671477449889612e-05, "loss": 2.4534, "step": 244610 }, { "epoch": 0.43, "learning_rate": 2.867060550996279e-05, "loss": 2.4049, "step": 244620 }, { "epoch": 0.43, "learning_rate": 2.8669733570035963e-05, "loss": 2.454, "step": 244630 }, { "epoch": 0.43, "learning_rate": 2.8668861630109133e-05, "loss": 2.3701, "step": 244640 }, { "epoch": 0.43, "learning_rate": 2.8667989690182307e-05, "loss": 2.4076, "step": 244650 }, { "epoch": 0.43, "learning_rate": 2.8667117750255478e-05, "loss": 2.5464, "step": 244660 }, { "epoch": 0.43, "learning_rate": 2.866624581032865e-05, "loss": 2.3694, "step": 244670 }, { "epoch": 0.43, "learning_rate": 2.8665373870401825e-05, "loss": 2.1961, "step": 244680 }, { "epoch": 0.43, "learning_rate": 2.8664501930475002e-05, "loss": 2.3195, "step": 244690 }, { "epoch": 0.43, "learning_rate": 2.8663629990548173e-05, "loss": 2.2084, "step": 244700 }, { "epoch": 0.43, "learning_rate": 2.8662758050621346e-05, "loss": 2.5108, "step": 244710 }, { "epoch": 0.43, "learning_rate": 2.866188611069452e-05, "loss": 2.4287, "step": 244720 }, { "epoch": 0.43, "learning_rate": 2.866101417076769e-05, "loss": 2.4373, "step": 244730 }, { "epoch": 0.43, "learning_rate": 2.8660142230840864e-05, "loss": 2.4274, "step": 244740 }, { "epoch": 0.43, "learning_rate": 2.8659270290914038e-05, "loss": 2.3805, "step": 244750 }, { "epoch": 0.43, "learning_rate": 2.8658398350987215e-05, "loss": 2.3345, "step": 244760 }, { "epoch": 0.43, "learning_rate": 2.8657526411060386e-05, "loss": 2.3844, "step": 244770 }, { "epoch": 0.43, "learning_rate": 2.865665447113356e-05, "loss": 2.4139, "step": 244780 }, { "epoch": 0.43, "learning_rate": 2.8655782531206733e-05, "loss": 2.4192, "step": 244790 }, { "epoch": 0.43, "learning_rate": 2.8654910591279904e-05, "loss": 2.3867, "step": 244800 }, { "epoch": 0.43, "learning_rate": 2.8654038651353077e-05, "loss": 2.3812, "step": 244810 }, { "epoch": 0.43, "learning_rate": 2.8653166711426248e-05, "loss": 2.3663, "step": 244820 }, { "epoch": 0.43, "learning_rate": 2.865229477149942e-05, "loss": 2.3667, "step": 244830 }, { "epoch": 0.43, "learning_rate": 2.86514228315726e-05, "loss": 2.3643, "step": 244840 }, { "epoch": 0.43, "learning_rate": 2.8650550891645772e-05, "loss": 2.365, "step": 244850 }, { "epoch": 0.43, "learning_rate": 2.8649678951718946e-05, "loss": 2.3812, "step": 244860 }, { "epoch": 0.43, "learning_rate": 2.8648807011792117e-05, "loss": 2.2818, "step": 244870 }, { "epoch": 0.43, "learning_rate": 2.864793507186529e-05, "loss": 2.3547, "step": 244880 }, { "epoch": 0.43, "learning_rate": 2.864706313193846e-05, "loss": 2.4103, "step": 244890 }, { "epoch": 0.43, "learning_rate": 2.8646191192011635e-05, "loss": 2.3453, "step": 244900 }, { "epoch": 0.43, "learning_rate": 2.864531925208481e-05, "loss": 2.3509, "step": 244910 }, { "epoch": 0.43, "learning_rate": 2.8644447312157985e-05, "loss": 2.3677, "step": 244920 }, { "epoch": 0.43, "learning_rate": 2.8643575372231156e-05, "loss": 2.3724, "step": 244930 }, { "epoch": 0.43, "learning_rate": 2.864270343230433e-05, "loss": 2.5169, "step": 244940 }, { "epoch": 0.43, "learning_rate": 2.8641831492377503e-05, "loss": 2.3966, "step": 244950 }, { "epoch": 0.43, "learning_rate": 2.8640959552450674e-05, "loss": 2.2184, "step": 244960 }, { "epoch": 0.43, "learning_rate": 2.8640087612523848e-05, "loss": 2.341, "step": 244970 }, { "epoch": 0.43, "learning_rate": 2.8639215672597018e-05, "loss": 2.4406, "step": 244980 }, { "epoch": 0.43, "learning_rate": 2.86383437326702e-05, "loss": 2.2794, "step": 244990 }, { "epoch": 0.43, "learning_rate": 2.863747179274337e-05, "loss": 2.3613, "step": 245000 }, { "epoch": 0.43, "learning_rate": 2.8636599852816543e-05, "loss": 2.4719, "step": 245010 }, { "epoch": 0.43, "learning_rate": 2.8635727912889716e-05, "loss": 2.323, "step": 245020 }, { "epoch": 0.43, "learning_rate": 2.8634855972962887e-05, "loss": 2.4129, "step": 245030 }, { "epoch": 0.43, "learning_rate": 2.863398403303606e-05, "loss": 2.2737, "step": 245040 }, { "epoch": 0.43, "learning_rate": 2.863311209310923e-05, "loss": 2.4593, "step": 245050 }, { "epoch": 0.43, "learning_rate": 2.863224015318241e-05, "loss": 2.5225, "step": 245060 }, { "epoch": 0.43, "learning_rate": 2.8631368213255582e-05, "loss": 2.3856, "step": 245070 }, { "epoch": 0.43, "learning_rate": 2.8630496273328756e-05, "loss": 2.3508, "step": 245080 }, { "epoch": 0.43, "learning_rate": 2.8629624333401926e-05, "loss": 2.3612, "step": 245090 }, { "epoch": 0.43, "learning_rate": 2.86287523934751e-05, "loss": 2.3273, "step": 245100 }, { "epoch": 0.43, "learning_rate": 2.8627880453548274e-05, "loss": 2.4202, "step": 245110 }, { "epoch": 0.43, "learning_rate": 2.8627008513621444e-05, "loss": 2.4248, "step": 245120 }, { "epoch": 0.43, "learning_rate": 2.8626136573694618e-05, "loss": 2.3357, "step": 245130 }, { "epoch": 0.43, "learning_rate": 2.8625264633767795e-05, "loss": 2.3336, "step": 245140 }, { "epoch": 0.43, "learning_rate": 2.862439269384097e-05, "loss": 2.3837, "step": 245150 }, { "epoch": 0.43, "learning_rate": 2.862352075391414e-05, "loss": 2.3691, "step": 245160 }, { "epoch": 0.43, "learning_rate": 2.8622648813987313e-05, "loss": 2.4129, "step": 245170 }, { "epoch": 0.43, "learning_rate": 2.8621776874060487e-05, "loss": 2.449, "step": 245180 }, { "epoch": 0.43, "learning_rate": 2.8620904934133657e-05, "loss": 2.2806, "step": 245190 }, { "epoch": 0.43, "learning_rate": 2.862003299420683e-05, "loss": 2.3603, "step": 245200 }, { "epoch": 0.43, "learning_rate": 2.8619161054280008e-05, "loss": 2.3466, "step": 245210 }, { "epoch": 0.43, "learning_rate": 2.861828911435318e-05, "loss": 2.2745, "step": 245220 }, { "epoch": 0.43, "learning_rate": 2.8617417174426352e-05, "loss": 2.3912, "step": 245230 }, { "epoch": 0.43, "learning_rate": 2.8616545234499526e-05, "loss": 2.4375, "step": 245240 }, { "epoch": 0.43, "learning_rate": 2.86156732945727e-05, "loss": 2.3684, "step": 245250 }, { "epoch": 0.43, "learning_rate": 2.861480135464587e-05, "loss": 2.44, "step": 245260 }, { "epoch": 0.43, "learning_rate": 2.8613929414719044e-05, "loss": 2.3516, "step": 245270 }, { "epoch": 0.43, "learning_rate": 2.8613057474792214e-05, "loss": 2.2466, "step": 245280 }, { "epoch": 0.43, "learning_rate": 2.8612185534865395e-05, "loss": 2.5626, "step": 245290 }, { "epoch": 0.43, "learning_rate": 2.8611313594938565e-05, "loss": 2.3116, "step": 245300 }, { "epoch": 0.43, "learning_rate": 2.861044165501174e-05, "loss": 2.3261, "step": 245310 }, { "epoch": 0.43, "learning_rate": 2.860956971508491e-05, "loss": 2.4273, "step": 245320 }, { "epoch": 0.43, "learning_rate": 2.8608697775158083e-05, "loss": 2.2773, "step": 245330 }, { "epoch": 0.43, "learning_rate": 2.8607825835231257e-05, "loss": 2.3581, "step": 245340 }, { "epoch": 0.43, "learning_rate": 2.8606953895304427e-05, "loss": 2.4054, "step": 245350 }, { "epoch": 0.43, "learning_rate": 2.8606081955377608e-05, "loss": 2.2441, "step": 245360 }, { "epoch": 0.43, "learning_rate": 2.8605210015450778e-05, "loss": 2.4066, "step": 245370 }, { "epoch": 0.43, "learning_rate": 2.8604338075523952e-05, "loss": 2.3905, "step": 245380 }, { "epoch": 0.43, "learning_rate": 2.8603466135597122e-05, "loss": 2.4322, "step": 245390 }, { "epoch": 0.43, "learning_rate": 2.8602594195670296e-05, "loss": 2.2582, "step": 245400 }, { "epoch": 0.43, "learning_rate": 2.860172225574347e-05, "loss": 2.3232, "step": 245410 }, { "epoch": 0.43, "learning_rate": 2.860085031581664e-05, "loss": 2.3879, "step": 245420 }, { "epoch": 0.43, "learning_rate": 2.8599978375889817e-05, "loss": 2.3019, "step": 245430 }, { "epoch": 0.43, "learning_rate": 2.859910643596299e-05, "loss": 2.1526, "step": 245440 }, { "epoch": 0.43, "learning_rate": 2.8598234496036165e-05, "loss": 2.3872, "step": 245450 }, { "epoch": 0.43, "learning_rate": 2.8597362556109335e-05, "loss": 2.3229, "step": 245460 }, { "epoch": 0.43, "learning_rate": 2.859649061618251e-05, "loss": 2.4571, "step": 245470 }, { "epoch": 0.43, "learning_rate": 2.8595618676255683e-05, "loss": 2.3602, "step": 245480 }, { "epoch": 0.43, "learning_rate": 2.8594746736328853e-05, "loss": 2.4445, "step": 245490 }, { "epoch": 0.43, "learning_rate": 2.8593874796402027e-05, "loss": 2.294, "step": 245500 }, { "epoch": 0.43, "learning_rate": 2.8593002856475204e-05, "loss": 2.408, "step": 245510 }, { "epoch": 0.43, "learning_rate": 2.8592130916548378e-05, "loss": 2.4139, "step": 245520 }, { "epoch": 0.43, "learning_rate": 2.8591258976621548e-05, "loss": 2.3671, "step": 245530 }, { "epoch": 0.43, "learning_rate": 2.8590387036694722e-05, "loss": 2.3951, "step": 245540 }, { "epoch": 0.43, "learning_rate": 2.8589515096767892e-05, "loss": 2.2899, "step": 245550 }, { "epoch": 0.43, "learning_rate": 2.8588643156841066e-05, "loss": 2.3811, "step": 245560 }, { "epoch": 0.43, "learning_rate": 2.858777121691424e-05, "loss": 2.4457, "step": 245570 }, { "epoch": 0.43, "learning_rate": 2.8586899276987417e-05, "loss": 2.2992, "step": 245580 }, { "epoch": 0.43, "learning_rate": 2.858602733706059e-05, "loss": 2.3177, "step": 245590 }, { "epoch": 0.43, "learning_rate": 2.858515539713376e-05, "loss": 2.4617, "step": 245600 }, { "epoch": 0.43, "learning_rate": 2.8584283457206935e-05, "loss": 2.359, "step": 245610 }, { "epoch": 0.43, "learning_rate": 2.8583411517280105e-05, "loss": 2.3159, "step": 245620 }, { "epoch": 0.43, "learning_rate": 2.858253957735328e-05, "loss": 2.3328, "step": 245630 }, { "epoch": 0.43, "learning_rate": 2.8581667637426453e-05, "loss": 2.3006, "step": 245640 }, { "epoch": 0.43, "learning_rate": 2.8580795697499623e-05, "loss": 2.3202, "step": 245650 }, { "epoch": 0.43, "learning_rate": 2.85799237575728e-05, "loss": 2.1917, "step": 245660 }, { "epoch": 0.43, "learning_rate": 2.8579051817645974e-05, "loss": 2.3469, "step": 245670 }, { "epoch": 0.43, "learning_rate": 2.8578179877719148e-05, "loss": 2.4715, "step": 245680 }, { "epoch": 0.43, "learning_rate": 2.8577307937792318e-05, "loss": 2.3354, "step": 245690 }, { "epoch": 0.43, "learning_rate": 2.8576435997865492e-05, "loss": 2.3257, "step": 245700 }, { "epoch": 0.43, "learning_rate": 2.8575564057938662e-05, "loss": 2.3769, "step": 245710 }, { "epoch": 0.43, "learning_rate": 2.8574692118011836e-05, "loss": 2.3835, "step": 245720 }, { "epoch": 0.43, "learning_rate": 2.8573820178085013e-05, "loss": 2.4494, "step": 245730 }, { "epoch": 0.43, "learning_rate": 2.8572948238158187e-05, "loss": 2.3979, "step": 245740 }, { "epoch": 0.43, "learning_rate": 2.857207629823136e-05, "loss": 2.4004, "step": 245750 }, { "epoch": 0.43, "learning_rate": 2.857120435830453e-05, "loss": 2.3302, "step": 245760 }, { "epoch": 0.43, "learning_rate": 2.8570332418377705e-05, "loss": 2.3137, "step": 245770 }, { "epoch": 0.43, "learning_rate": 2.8569460478450875e-05, "loss": 2.3733, "step": 245780 }, { "epoch": 0.43, "learning_rate": 2.856858853852405e-05, "loss": 2.3152, "step": 245790 }, { "epoch": 0.43, "learning_rate": 2.8567716598597223e-05, "loss": 2.4759, "step": 245800 }, { "epoch": 0.43, "learning_rate": 2.85668446586704e-05, "loss": 2.4111, "step": 245810 }, { "epoch": 0.43, "learning_rate": 2.856597271874357e-05, "loss": 2.3235, "step": 245820 }, { "epoch": 0.43, "learning_rate": 2.8565100778816744e-05, "loss": 2.2963, "step": 245830 }, { "epoch": 0.43, "learning_rate": 2.8564228838889918e-05, "loss": 2.3509, "step": 245840 }, { "epoch": 0.43, "learning_rate": 2.856335689896309e-05, "loss": 2.5217, "step": 245850 }, { "epoch": 0.43, "learning_rate": 2.8562484959036262e-05, "loss": 2.4098, "step": 245860 }, { "epoch": 0.43, "learning_rate": 2.8561613019109436e-05, "loss": 2.366, "step": 245870 }, { "epoch": 0.43, "learning_rate": 2.8560741079182613e-05, "loss": 2.3873, "step": 245880 }, { "epoch": 0.43, "learning_rate": 2.8559869139255784e-05, "loss": 2.3782, "step": 245890 }, { "epoch": 0.43, "learning_rate": 2.8558997199328957e-05, "loss": 2.2906, "step": 245900 }, { "epoch": 0.43, "learning_rate": 2.855812525940213e-05, "loss": 2.3531, "step": 245910 }, { "epoch": 0.43, "learning_rate": 2.85572533194753e-05, "loss": 2.4112, "step": 245920 }, { "epoch": 0.43, "learning_rate": 2.8556381379548475e-05, "loss": 2.4118, "step": 245930 }, { "epoch": 0.43, "learning_rate": 2.8555509439621646e-05, "loss": 2.3564, "step": 245940 }, { "epoch": 0.43, "learning_rate": 2.8554637499694826e-05, "loss": 2.4667, "step": 245950 }, { "epoch": 0.43, "learning_rate": 2.8553765559767997e-05, "loss": 2.4213, "step": 245960 }, { "epoch": 0.43, "learning_rate": 2.855289361984117e-05, "loss": 2.3991, "step": 245970 }, { "epoch": 0.43, "learning_rate": 2.8552021679914344e-05, "loss": 2.4328, "step": 245980 }, { "epoch": 0.43, "learning_rate": 2.8551149739987514e-05, "loss": 2.294, "step": 245990 }, { "epoch": 0.43, "learning_rate": 2.8550277800060688e-05, "loss": 2.3862, "step": 246000 }, { "epoch": 0.43, "learning_rate": 2.854940586013386e-05, "loss": 2.3631, "step": 246010 }, { "epoch": 0.43, "learning_rate": 2.8548533920207032e-05, "loss": 2.3904, "step": 246020 }, { "epoch": 0.43, "learning_rate": 2.854766198028021e-05, "loss": 2.3509, "step": 246030 }, { "epoch": 0.43, "learning_rate": 2.8546790040353383e-05, "loss": 2.3014, "step": 246040 }, { "epoch": 0.43, "learning_rate": 2.8545918100426554e-05, "loss": 2.3454, "step": 246050 }, { "epoch": 0.43, "learning_rate": 2.8545046160499727e-05, "loss": 2.4714, "step": 246060 }, { "epoch": 0.43, "learning_rate": 2.85441742205729e-05, "loss": 2.4039, "step": 246070 }, { "epoch": 0.43, "learning_rate": 2.854330228064607e-05, "loss": 2.3748, "step": 246080 }, { "epoch": 0.43, "learning_rate": 2.8542430340719245e-05, "loss": 2.4107, "step": 246090 }, { "epoch": 0.43, "learning_rate": 2.8541558400792423e-05, "loss": 2.3621, "step": 246100 }, { "epoch": 0.43, "learning_rate": 2.8540686460865596e-05, "loss": 2.4451, "step": 246110 }, { "epoch": 0.43, "learning_rate": 2.8539814520938767e-05, "loss": 2.3735, "step": 246120 }, { "epoch": 0.43, "learning_rate": 2.853894258101194e-05, "loss": 2.3675, "step": 246130 }, { "epoch": 0.43, "learning_rate": 2.8538070641085114e-05, "loss": 2.4945, "step": 246140 }, { "epoch": 0.43, "learning_rate": 2.8537198701158285e-05, "loss": 2.4685, "step": 246150 }, { "epoch": 0.43, "learning_rate": 2.853632676123146e-05, "loss": 2.4322, "step": 246160 }, { "epoch": 0.43, "learning_rate": 2.853545482130463e-05, "loss": 2.3231, "step": 246170 }, { "epoch": 0.43, "learning_rate": 2.853458288137781e-05, "loss": 2.3617, "step": 246180 }, { "epoch": 0.43, "learning_rate": 2.853371094145098e-05, "loss": 2.4968, "step": 246190 }, { "epoch": 0.43, "learning_rate": 2.8532839001524153e-05, "loss": 2.3979, "step": 246200 }, { "epoch": 0.43, "learning_rate": 2.8531967061597327e-05, "loss": 2.4505, "step": 246210 }, { "epoch": 0.43, "learning_rate": 2.8531095121670498e-05, "loss": 2.4659, "step": 246220 }, { "epoch": 0.43, "learning_rate": 2.853022318174367e-05, "loss": 2.3657, "step": 246230 }, { "epoch": 0.43, "learning_rate": 2.8529351241816842e-05, "loss": 2.3808, "step": 246240 }, { "epoch": 0.43, "learning_rate": 2.8528479301890022e-05, "loss": 2.3541, "step": 246250 }, { "epoch": 0.43, "learning_rate": 2.8527607361963193e-05, "loss": 2.4519, "step": 246260 }, { "epoch": 0.43, "learning_rate": 2.8526735422036366e-05, "loss": 2.2436, "step": 246270 }, { "epoch": 0.43, "learning_rate": 2.8525863482109537e-05, "loss": 2.4062, "step": 246280 }, { "epoch": 0.43, "learning_rate": 2.852499154218271e-05, "loss": 2.4275, "step": 246290 }, { "epoch": 0.43, "learning_rate": 2.8524119602255884e-05, "loss": 2.3935, "step": 246300 }, { "epoch": 0.43, "learning_rate": 2.8523247662329055e-05, "loss": 2.356, "step": 246310 }, { "epoch": 0.43, "learning_rate": 2.852237572240223e-05, "loss": 2.3472, "step": 246320 }, { "epoch": 0.43, "learning_rate": 2.8521503782475406e-05, "loss": 2.346, "step": 246330 }, { "epoch": 0.43, "learning_rate": 2.852063184254858e-05, "loss": 2.4861, "step": 246340 }, { "epoch": 0.43, "learning_rate": 2.851975990262175e-05, "loss": 2.3553, "step": 246350 }, { "epoch": 0.43, "learning_rate": 2.8518887962694924e-05, "loss": 2.3715, "step": 246360 }, { "epoch": 0.43, "learning_rate": 2.8518016022768097e-05, "loss": 2.2936, "step": 246370 }, { "epoch": 0.43, "learning_rate": 2.8517144082841268e-05, "loss": 2.4267, "step": 246380 }, { "epoch": 0.43, "learning_rate": 2.851627214291444e-05, "loss": 2.3603, "step": 246390 }, { "epoch": 0.43, "learning_rate": 2.851540020298762e-05, "loss": 2.4139, "step": 246400 }, { "epoch": 0.43, "learning_rate": 2.8514528263060792e-05, "loss": 2.2985, "step": 246410 }, { "epoch": 0.43, "learning_rate": 2.8513656323133963e-05, "loss": 2.5067, "step": 246420 }, { "epoch": 0.43, "learning_rate": 2.8512784383207137e-05, "loss": 2.359, "step": 246430 }, { "epoch": 0.43, "learning_rate": 2.8511912443280307e-05, "loss": 2.392, "step": 246440 }, { "epoch": 0.43, "learning_rate": 2.851104050335348e-05, "loss": 2.4611, "step": 246450 }, { "epoch": 0.43, "learning_rate": 2.8510168563426655e-05, "loss": 2.337, "step": 246460 }, { "epoch": 0.43, "learning_rate": 2.8509296623499825e-05, "loss": 2.3506, "step": 246470 }, { "epoch": 0.43, "learning_rate": 2.8508424683573005e-05, "loss": 2.446, "step": 246480 }, { "epoch": 0.43, "learning_rate": 2.8507552743646176e-05, "loss": 2.3342, "step": 246490 }, { "epoch": 0.43, "learning_rate": 2.850668080371935e-05, "loss": 2.431, "step": 246500 }, { "epoch": 0.43, "learning_rate": 2.850580886379252e-05, "loss": 2.259, "step": 246510 }, { "epoch": 0.43, "learning_rate": 2.8504936923865694e-05, "loss": 2.3228, "step": 246520 }, { "epoch": 0.43, "learning_rate": 2.8504064983938868e-05, "loss": 2.4769, "step": 246530 }, { "epoch": 0.43, "learning_rate": 2.8503193044012038e-05, "loss": 2.4144, "step": 246540 }, { "epoch": 0.43, "learning_rate": 2.8502321104085215e-05, "loss": 2.4424, "step": 246550 }, { "epoch": 0.43, "learning_rate": 2.850144916415839e-05, "loss": 2.4265, "step": 246560 }, { "epoch": 0.43, "learning_rate": 2.8500577224231563e-05, "loss": 2.4053, "step": 246570 }, { "epoch": 0.43, "learning_rate": 2.8499705284304733e-05, "loss": 2.4265, "step": 246580 }, { "epoch": 0.43, "learning_rate": 2.8498833344377907e-05, "loss": 2.453, "step": 246590 }, { "epoch": 0.43, "learning_rate": 2.849796140445108e-05, "loss": 2.4088, "step": 246600 }, { "epoch": 0.43, "learning_rate": 2.849708946452425e-05, "loss": 2.3816, "step": 246610 }, { "epoch": 0.43, "learning_rate": 2.8496217524597428e-05, "loss": 2.4214, "step": 246620 }, { "epoch": 0.43, "learning_rate": 2.8495345584670602e-05, "loss": 2.3285, "step": 246630 }, { "epoch": 0.43, "learning_rate": 2.8494473644743776e-05, "loss": 2.3287, "step": 246640 }, { "epoch": 0.43, "learning_rate": 2.8493601704816946e-05, "loss": 2.3505, "step": 246650 }, { "epoch": 0.43, "learning_rate": 2.849272976489012e-05, "loss": 2.3778, "step": 246660 }, { "epoch": 0.43, "learning_rate": 2.849185782496329e-05, "loss": 2.3955, "step": 246670 }, { "epoch": 0.43, "learning_rate": 2.8490985885036464e-05, "loss": 2.352, "step": 246680 }, { "epoch": 0.43, "learning_rate": 2.8490113945109638e-05, "loss": 2.3233, "step": 246690 }, { "epoch": 0.43, "learning_rate": 2.8489242005182815e-05, "loss": 2.4982, "step": 246700 }, { "epoch": 0.43, "learning_rate": 2.848837006525599e-05, "loss": 2.4446, "step": 246710 }, { "epoch": 0.43, "learning_rate": 2.848749812532916e-05, "loss": 2.3796, "step": 246720 }, { "epoch": 0.43, "learning_rate": 2.8486626185402333e-05, "loss": 2.3838, "step": 246730 }, { "epoch": 0.43, "learning_rate": 2.8485754245475503e-05, "loss": 2.3252, "step": 246740 }, { "epoch": 0.43, "learning_rate": 2.8484882305548677e-05, "loss": 2.3377, "step": 246750 }, { "epoch": 0.43, "learning_rate": 2.848401036562185e-05, "loss": 2.3469, "step": 246760 }, { "epoch": 0.43, "learning_rate": 2.8483138425695028e-05, "loss": 2.4251, "step": 246770 }, { "epoch": 0.43, "learning_rate": 2.8482266485768198e-05, "loss": 2.3938, "step": 246780 }, { "epoch": 0.43, "learning_rate": 2.8481394545841372e-05, "loss": 2.3894, "step": 246790 }, { "epoch": 0.43, "learning_rate": 2.8480522605914546e-05, "loss": 2.3409, "step": 246800 }, { "epoch": 0.43, "learning_rate": 2.8479650665987716e-05, "loss": 2.4042, "step": 246810 }, { "epoch": 0.43, "learning_rate": 2.847877872606089e-05, "loss": 2.3666, "step": 246820 }, { "epoch": 0.43, "learning_rate": 2.8477906786134064e-05, "loss": 2.3685, "step": 246830 }, { "epoch": 0.43, "learning_rate": 2.8477034846207234e-05, "loss": 2.4069, "step": 246840 }, { "epoch": 0.43, "learning_rate": 2.847616290628041e-05, "loss": 2.3832, "step": 246850 }, { "epoch": 0.43, "learning_rate": 2.8475290966353585e-05, "loss": 2.4186, "step": 246860 }, { "epoch": 0.43, "learning_rate": 2.847441902642676e-05, "loss": 2.4157, "step": 246870 }, { "epoch": 0.43, "learning_rate": 2.847354708649993e-05, "loss": 2.355, "step": 246880 }, { "epoch": 0.43, "learning_rate": 2.8472675146573103e-05, "loss": 2.3311, "step": 246890 }, { "epoch": 0.43, "learning_rate": 2.8471803206646273e-05, "loss": 2.2961, "step": 246900 }, { "epoch": 0.43, "learning_rate": 2.8470931266719447e-05, "loss": 2.3866, "step": 246910 }, { "epoch": 0.43, "learning_rate": 2.8470059326792624e-05, "loss": 2.4452, "step": 246920 }, { "epoch": 0.43, "learning_rate": 2.8469187386865798e-05, "loss": 2.351, "step": 246930 }, { "epoch": 0.43, "learning_rate": 2.8468315446938972e-05, "loss": 2.395, "step": 246940 }, { "epoch": 0.43, "learning_rate": 2.8467443507012142e-05, "loss": 2.3455, "step": 246950 }, { "epoch": 0.43, "learning_rate": 2.8466571567085316e-05, "loss": 2.2824, "step": 246960 }, { "epoch": 0.43, "learning_rate": 2.8465699627158486e-05, "loss": 2.3906, "step": 246970 }, { "epoch": 0.43, "learning_rate": 2.846482768723166e-05, "loss": 2.316, "step": 246980 }, { "epoch": 0.43, "learning_rate": 2.8463955747304834e-05, "loss": 2.3936, "step": 246990 }, { "epoch": 0.43, "learning_rate": 2.846308380737801e-05, "loss": 2.3979, "step": 247000 }, { "epoch": 0.43, "learning_rate": 2.846221186745118e-05, "loss": 2.3305, "step": 247010 }, { "epoch": 0.43, "learning_rate": 2.8461339927524355e-05, "loss": 2.3954, "step": 247020 }, { "epoch": 0.43, "learning_rate": 2.846046798759753e-05, "loss": 2.4613, "step": 247030 }, { "epoch": 0.43, "learning_rate": 2.84595960476707e-05, "loss": 2.337, "step": 247040 }, { "epoch": 0.43, "learning_rate": 2.8458724107743873e-05, "loss": 2.345, "step": 247050 }, { "epoch": 0.43, "learning_rate": 2.8457852167817043e-05, "loss": 2.3961, "step": 247060 }, { "epoch": 0.43, "learning_rate": 2.8456980227890224e-05, "loss": 2.5158, "step": 247070 }, { "epoch": 0.43, "learning_rate": 2.8456108287963394e-05, "loss": 2.3591, "step": 247080 }, { "epoch": 0.43, "learning_rate": 2.8455236348036568e-05, "loss": 2.3727, "step": 247090 }, { "epoch": 0.43, "learning_rate": 2.8454364408109742e-05, "loss": 2.3069, "step": 247100 }, { "epoch": 0.43, "learning_rate": 2.8453492468182912e-05, "loss": 2.3783, "step": 247110 }, { "epoch": 0.43, "learning_rate": 2.8452620528256086e-05, "loss": 2.42, "step": 247120 }, { "epoch": 0.43, "learning_rate": 2.8451748588329256e-05, "loss": 2.3585, "step": 247130 }, { "epoch": 0.43, "learning_rate": 2.845087664840243e-05, "loss": 2.2831, "step": 247140 }, { "epoch": 0.43, "learning_rate": 2.8450004708475607e-05, "loss": 2.3898, "step": 247150 }, { "epoch": 0.43, "learning_rate": 2.844913276854878e-05, "loss": 2.3134, "step": 247160 }, { "epoch": 0.43, "learning_rate": 2.844826082862195e-05, "loss": 2.3582, "step": 247170 }, { "epoch": 0.43, "learning_rate": 2.8447388888695125e-05, "loss": 2.2181, "step": 247180 }, { "epoch": 0.43, "learning_rate": 2.84465169487683e-05, "loss": 2.3148, "step": 247190 }, { "epoch": 0.43, "learning_rate": 2.844564500884147e-05, "loss": 2.3315, "step": 247200 }, { "epoch": 0.43, "learning_rate": 2.8444773068914643e-05, "loss": 2.3988, "step": 247210 }, { "epoch": 0.43, "learning_rate": 2.844390112898782e-05, "loss": 2.4284, "step": 247220 }, { "epoch": 0.43, "learning_rate": 2.8443029189060994e-05, "loss": 2.3869, "step": 247230 }, { "epoch": 0.43, "learning_rate": 2.8442157249134165e-05, "loss": 2.4832, "step": 247240 }, { "epoch": 0.43, "learning_rate": 2.8441285309207338e-05, "loss": 2.3316, "step": 247250 }, { "epoch": 0.43, "learning_rate": 2.8440413369280512e-05, "loss": 2.4013, "step": 247260 }, { "epoch": 0.43, "learning_rate": 2.8439541429353682e-05, "loss": 2.3485, "step": 247270 }, { "epoch": 0.43, "learning_rate": 2.8438669489426856e-05, "loss": 2.3558, "step": 247280 }, { "epoch": 0.43, "learning_rate": 2.8437797549500033e-05, "loss": 2.4394, "step": 247290 }, { "epoch": 0.43, "learning_rate": 2.8436925609573207e-05, "loss": 2.3872, "step": 247300 }, { "epoch": 0.43, "learning_rate": 2.8436053669646378e-05, "loss": 2.402, "step": 247310 }, { "epoch": 0.43, "learning_rate": 2.843518172971955e-05, "loss": 2.3365, "step": 247320 }, { "epoch": 0.43, "learning_rate": 2.8434309789792725e-05, "loss": 2.3707, "step": 247330 }, { "epoch": 0.43, "learning_rate": 2.8433437849865895e-05, "loss": 2.4207, "step": 247340 }, { "epoch": 0.43, "learning_rate": 2.843256590993907e-05, "loss": 2.4339, "step": 247350 }, { "epoch": 0.43, "learning_rate": 2.843169397001224e-05, "loss": 2.373, "step": 247360 }, { "epoch": 0.43, "learning_rate": 2.843082203008542e-05, "loss": 2.3579, "step": 247370 }, { "epoch": 0.43, "learning_rate": 2.842995009015859e-05, "loss": 2.3893, "step": 247380 }, { "epoch": 0.43, "learning_rate": 2.8429078150231764e-05, "loss": 2.3315, "step": 247390 }, { "epoch": 0.43, "learning_rate": 2.8428206210304935e-05, "loss": 2.345, "step": 247400 }, { "epoch": 0.43, "learning_rate": 2.842733427037811e-05, "loss": 2.4022, "step": 247410 }, { "epoch": 0.43, "learning_rate": 2.8426462330451282e-05, "loss": 2.3633, "step": 247420 }, { "epoch": 0.43, "learning_rate": 2.8425590390524453e-05, "loss": 2.4421, "step": 247430 }, { "epoch": 0.43, "learning_rate": 2.8424718450597633e-05, "loss": 2.4681, "step": 247440 }, { "epoch": 0.43, "learning_rate": 2.8423846510670804e-05, "loss": 2.4905, "step": 247450 }, { "epoch": 0.43, "learning_rate": 2.8422974570743977e-05, "loss": 2.406, "step": 247460 }, { "epoch": 0.43, "learning_rate": 2.8422102630817148e-05, "loss": 2.3654, "step": 247470 }, { "epoch": 0.43, "learning_rate": 2.842123069089032e-05, "loss": 2.3935, "step": 247480 }, { "epoch": 0.43, "learning_rate": 2.8420358750963495e-05, "loss": 2.3913, "step": 247490 }, { "epoch": 0.43, "learning_rate": 2.8419486811036666e-05, "loss": 2.3924, "step": 247500 }, { "epoch": 0.43, "learning_rate": 2.841861487110984e-05, "loss": 2.3949, "step": 247510 }, { "epoch": 0.43, "learning_rate": 2.8417742931183017e-05, "loss": 2.3842, "step": 247520 }, { "epoch": 0.43, "learning_rate": 2.841687099125619e-05, "loss": 2.4553, "step": 247530 }, { "epoch": 0.43, "learning_rate": 2.841599905132936e-05, "loss": 2.3899, "step": 247540 }, { "epoch": 0.43, "learning_rate": 2.8415127111402534e-05, "loss": 2.5026, "step": 247550 }, { "epoch": 0.43, "learning_rate": 2.8414255171475708e-05, "loss": 2.4101, "step": 247560 }, { "epoch": 0.43, "learning_rate": 2.841338323154888e-05, "loss": 2.3494, "step": 247570 }, { "epoch": 0.43, "learning_rate": 2.8412511291622052e-05, "loss": 2.4109, "step": 247580 }, { "epoch": 0.43, "learning_rate": 2.841163935169523e-05, "loss": 2.5008, "step": 247590 }, { "epoch": 0.43, "learning_rate": 2.8410767411768403e-05, "loss": 2.3658, "step": 247600 }, { "epoch": 0.43, "learning_rate": 2.8409895471841574e-05, "loss": 2.393, "step": 247610 }, { "epoch": 0.43, "learning_rate": 2.8409023531914747e-05, "loss": 2.3815, "step": 247620 }, { "epoch": 0.43, "learning_rate": 2.8408151591987918e-05, "loss": 2.2829, "step": 247630 }, { "epoch": 0.43, "learning_rate": 2.840727965206109e-05, "loss": 2.3521, "step": 247640 }, { "epoch": 0.43, "learning_rate": 2.8406407712134265e-05, "loss": 2.321, "step": 247650 }, { "epoch": 0.43, "learning_rate": 2.8405535772207436e-05, "loss": 2.3331, "step": 247660 }, { "epoch": 0.43, "learning_rate": 2.8404663832280616e-05, "loss": 2.4419, "step": 247670 }, { "epoch": 0.43, "learning_rate": 2.8403791892353787e-05, "loss": 2.404, "step": 247680 }, { "epoch": 0.43, "learning_rate": 2.840291995242696e-05, "loss": 2.3056, "step": 247690 }, { "epoch": 0.43, "learning_rate": 2.840204801250013e-05, "loss": 2.4164, "step": 247700 }, { "epoch": 0.43, "learning_rate": 2.8401176072573305e-05, "loss": 2.369, "step": 247710 }, { "epoch": 0.43, "learning_rate": 2.840030413264648e-05, "loss": 2.5083, "step": 247720 }, { "epoch": 0.43, "learning_rate": 2.839943219271965e-05, "loss": 2.4005, "step": 247730 }, { "epoch": 0.43, "learning_rate": 2.8398560252792826e-05, "loss": 2.3664, "step": 247740 }, { "epoch": 0.43, "learning_rate": 2.8397688312866e-05, "loss": 2.3989, "step": 247750 }, { "epoch": 0.43, "learning_rate": 2.8396816372939173e-05, "loss": 2.4617, "step": 247760 }, { "epoch": 0.43, "learning_rate": 2.8395944433012344e-05, "loss": 2.4553, "step": 247770 }, { "epoch": 0.43, "learning_rate": 2.8395072493085518e-05, "loss": 2.3548, "step": 247780 }, { "epoch": 0.43, "learning_rate": 2.8394200553158688e-05, "loss": 2.3612, "step": 247790 }, { "epoch": 0.43, "learning_rate": 2.8393328613231862e-05, "loss": 2.4687, "step": 247800 }, { "epoch": 0.43, "learning_rate": 2.839245667330504e-05, "loss": 2.3697, "step": 247810 }, { "epoch": 0.43, "learning_rate": 2.8391584733378213e-05, "loss": 2.3686, "step": 247820 }, { "epoch": 0.43, "learning_rate": 2.8390712793451386e-05, "loss": 2.5143, "step": 247830 }, { "epoch": 0.43, "learning_rate": 2.8389840853524557e-05, "loss": 2.3993, "step": 247840 }, { "epoch": 0.43, "learning_rate": 2.838896891359773e-05, "loss": 2.3793, "step": 247850 }, { "epoch": 0.43, "learning_rate": 2.83880969736709e-05, "loss": 2.3831, "step": 247860 }, { "epoch": 0.43, "learning_rate": 2.8387225033744075e-05, "loss": 2.3943, "step": 247870 }, { "epoch": 0.43, "learning_rate": 2.838635309381725e-05, "loss": 2.4123, "step": 247880 }, { "epoch": 0.43, "learning_rate": 2.8385481153890426e-05, "loss": 2.3444, "step": 247890 }, { "epoch": 0.43, "learning_rate": 2.8384609213963596e-05, "loss": 2.5063, "step": 247900 }, { "epoch": 0.43, "learning_rate": 2.838373727403677e-05, "loss": 2.4652, "step": 247910 }, { "epoch": 0.43, "learning_rate": 2.8382865334109944e-05, "loss": 2.3035, "step": 247920 }, { "epoch": 0.43, "learning_rate": 2.8381993394183114e-05, "loss": 2.5045, "step": 247930 }, { "epoch": 0.43, "learning_rate": 2.8381121454256288e-05, "loss": 2.5161, "step": 247940 }, { "epoch": 0.43, "learning_rate": 2.838024951432946e-05, "loss": 2.442, "step": 247950 }, { "epoch": 0.43, "learning_rate": 2.837937757440264e-05, "loss": 2.4643, "step": 247960 }, { "epoch": 0.43, "learning_rate": 2.837850563447581e-05, "loss": 2.4149, "step": 247970 }, { "epoch": 0.43, "learning_rate": 2.8377633694548983e-05, "loss": 2.32, "step": 247980 }, { "epoch": 0.43, "learning_rate": 2.8376761754622157e-05, "loss": 2.3077, "step": 247990 }, { "epoch": 0.43, "learning_rate": 2.8375889814695327e-05, "loss": 2.3522, "step": 248000 }, { "epoch": 0.43, "learning_rate": 2.83750178747685e-05, "loss": 2.4452, "step": 248010 }, { "epoch": 0.43, "learning_rate": 2.837414593484167e-05, "loss": 2.3612, "step": 248020 }, { "epoch": 0.43, "learning_rate": 2.8373273994914845e-05, "loss": 2.4995, "step": 248030 }, { "epoch": 0.43, "learning_rate": 2.8372402054988022e-05, "loss": 2.3867, "step": 248040 }, { "epoch": 0.43, "learning_rate": 2.8371530115061196e-05, "loss": 2.386, "step": 248050 }, { "epoch": 0.43, "learning_rate": 2.837065817513437e-05, "loss": 2.479, "step": 248060 }, { "epoch": 0.43, "learning_rate": 2.836978623520754e-05, "loss": 2.4566, "step": 248070 }, { "epoch": 0.43, "learning_rate": 2.8368914295280714e-05, "loss": 2.3765, "step": 248080 }, { "epoch": 0.43, "learning_rate": 2.8368042355353884e-05, "loss": 2.3941, "step": 248090 }, { "epoch": 0.43, "learning_rate": 2.8367170415427058e-05, "loss": 2.5683, "step": 248100 }, { "epoch": 0.43, "learning_rate": 2.8366298475500235e-05, "loss": 2.3681, "step": 248110 }, { "epoch": 0.43, "learning_rate": 2.836542653557341e-05, "loss": 2.397, "step": 248120 }, { "epoch": 0.43, "learning_rate": 2.836455459564658e-05, "loss": 2.4261, "step": 248130 }, { "epoch": 0.43, "learning_rate": 2.8363682655719753e-05, "loss": 2.3197, "step": 248140 }, { "epoch": 0.43, "learning_rate": 2.8362810715792927e-05, "loss": 2.4592, "step": 248150 }, { "epoch": 0.43, "learning_rate": 2.8361938775866097e-05, "loss": 2.3454, "step": 248160 }, { "epoch": 0.43, "learning_rate": 2.836106683593927e-05, "loss": 2.4207, "step": 248170 }, { "epoch": 0.43, "learning_rate": 2.8360194896012445e-05, "loss": 2.3068, "step": 248180 }, { "epoch": 0.43, "learning_rate": 2.8359322956085622e-05, "loss": 2.4476, "step": 248190 }, { "epoch": 0.43, "learning_rate": 2.8358451016158792e-05, "loss": 2.4316, "step": 248200 }, { "epoch": 0.43, "learning_rate": 2.8357579076231966e-05, "loss": 2.4903, "step": 248210 }, { "epoch": 0.43, "learning_rate": 2.835670713630514e-05, "loss": 2.399, "step": 248220 }, { "epoch": 0.43, "learning_rate": 2.835583519637831e-05, "loss": 2.3034, "step": 248230 }, { "epoch": 0.43, "learning_rate": 2.8354963256451484e-05, "loss": 2.3937, "step": 248240 }, { "epoch": 0.43, "learning_rate": 2.8354091316524654e-05, "loss": 2.4275, "step": 248250 }, { "epoch": 0.43, "learning_rate": 2.8353219376597835e-05, "loss": 2.3094, "step": 248260 }, { "epoch": 0.43, "learning_rate": 2.8352347436671005e-05, "loss": 2.5134, "step": 248270 }, { "epoch": 0.43, "learning_rate": 2.835147549674418e-05, "loss": 2.3144, "step": 248280 }, { "epoch": 0.43, "learning_rate": 2.8350603556817353e-05, "loss": 2.3895, "step": 248290 }, { "epoch": 0.43, "learning_rate": 2.8349731616890523e-05, "loss": 2.429, "step": 248300 }, { "epoch": 0.43, "learning_rate": 2.8348859676963697e-05, "loss": 2.4318, "step": 248310 }, { "epoch": 0.43, "learning_rate": 2.8347987737036867e-05, "loss": 2.3973, "step": 248320 }, { "epoch": 0.43, "learning_rate": 2.834711579711004e-05, "loss": 2.3875, "step": 248330 }, { "epoch": 0.43, "learning_rate": 2.8346243857183218e-05, "loss": 2.4332, "step": 248340 }, { "epoch": 0.43, "learning_rate": 2.8345371917256392e-05, "loss": 2.4313, "step": 248350 }, { "epoch": 0.43, "learning_rate": 2.8344499977329562e-05, "loss": 2.3162, "step": 248360 }, { "epoch": 0.43, "learning_rate": 2.8343628037402736e-05, "loss": 2.2923, "step": 248370 }, { "epoch": 0.43, "learning_rate": 2.834275609747591e-05, "loss": 2.2926, "step": 248380 }, { "epoch": 0.43, "learning_rate": 2.834188415754908e-05, "loss": 2.477, "step": 248390 }, { "epoch": 0.43, "learning_rate": 2.8341012217622254e-05, "loss": 2.4268, "step": 248400 }, { "epoch": 0.43, "learning_rate": 2.834014027769543e-05, "loss": 2.272, "step": 248410 }, { "epoch": 0.43, "learning_rate": 2.8339268337768605e-05, "loss": 2.3832, "step": 248420 }, { "epoch": 0.43, "learning_rate": 2.8338396397841775e-05, "loss": 2.4697, "step": 248430 }, { "epoch": 0.43, "learning_rate": 2.833752445791495e-05, "loss": 2.3767, "step": 248440 }, { "epoch": 0.43, "learning_rate": 2.8336652517988123e-05, "loss": 2.402, "step": 248450 }, { "epoch": 0.43, "learning_rate": 2.8335780578061293e-05, "loss": 2.4095, "step": 248460 }, { "epoch": 0.43, "learning_rate": 2.8334908638134467e-05, "loss": 2.4492, "step": 248470 }, { "epoch": 0.43, "learning_rate": 2.8334036698207644e-05, "loss": 2.3899, "step": 248480 }, { "epoch": 0.43, "learning_rate": 2.8333164758280818e-05, "loss": 2.3423, "step": 248490 }, { "epoch": 0.43, "learning_rate": 2.833229281835399e-05, "loss": 2.2997, "step": 248500 }, { "epoch": 0.43, "learning_rate": 2.8331420878427162e-05, "loss": 2.3794, "step": 248510 }, { "epoch": 0.43, "learning_rate": 2.8330548938500333e-05, "loss": 2.3663, "step": 248520 }, { "epoch": 0.43, "learning_rate": 2.8329676998573506e-05, "loss": 2.4387, "step": 248530 }, { "epoch": 0.43, "learning_rate": 2.832880505864668e-05, "loss": 2.3133, "step": 248540 }, { "epoch": 0.43, "learning_rate": 2.832793311871985e-05, "loss": 2.3398, "step": 248550 }, { "epoch": 0.43, "learning_rate": 2.832706117879303e-05, "loss": 2.4907, "step": 248560 }, { "epoch": 0.43, "learning_rate": 2.83261892388662e-05, "loss": 2.3282, "step": 248570 }, { "epoch": 0.43, "learning_rate": 2.8325317298939375e-05, "loss": 2.3631, "step": 248580 }, { "epoch": 0.43, "learning_rate": 2.8324445359012546e-05, "loss": 2.4429, "step": 248590 }, { "epoch": 0.43, "learning_rate": 2.832357341908572e-05, "loss": 2.5103, "step": 248600 }, { "epoch": 0.43, "learning_rate": 2.8322701479158893e-05, "loss": 2.3561, "step": 248610 }, { "epoch": 0.43, "learning_rate": 2.8321829539232063e-05, "loss": 2.3621, "step": 248620 }, { "epoch": 0.43, "learning_rate": 2.832095759930524e-05, "loss": 2.3646, "step": 248630 }, { "epoch": 0.43, "learning_rate": 2.8320085659378414e-05, "loss": 2.3799, "step": 248640 }, { "epoch": 0.43, "learning_rate": 2.8319213719451588e-05, "loss": 2.3734, "step": 248650 }, { "epoch": 0.43, "learning_rate": 2.831834177952476e-05, "loss": 2.4498, "step": 248660 }, { "epoch": 0.43, "learning_rate": 2.8317469839597932e-05, "loss": 2.3996, "step": 248670 }, { "epoch": 0.43, "learning_rate": 2.8316597899671106e-05, "loss": 2.365, "step": 248680 }, { "epoch": 0.43, "learning_rate": 2.8315725959744276e-05, "loss": 2.3475, "step": 248690 }, { "epoch": 0.43, "learning_rate": 2.831485401981745e-05, "loss": 2.4035, "step": 248700 }, { "epoch": 0.43, "learning_rate": 2.8313982079890627e-05, "loss": 2.3927, "step": 248710 }, { "epoch": 0.43, "learning_rate": 2.83131101399638e-05, "loss": 2.3642, "step": 248720 }, { "epoch": 0.43, "learning_rate": 2.831223820003697e-05, "loss": 2.4836, "step": 248730 }, { "epoch": 0.43, "learning_rate": 2.8311366260110145e-05, "loss": 2.3605, "step": 248740 }, { "epoch": 0.43, "learning_rate": 2.8310494320183316e-05, "loss": 2.5012, "step": 248750 }, { "epoch": 0.43, "learning_rate": 2.830962238025649e-05, "loss": 2.3535, "step": 248760 }, { "epoch": 0.43, "learning_rate": 2.8308750440329663e-05, "loss": 2.3435, "step": 248770 }, { "epoch": 0.43, "learning_rate": 2.830787850040284e-05, "loss": 2.2883, "step": 248780 }, { "epoch": 0.43, "learning_rate": 2.8307006560476014e-05, "loss": 2.4659, "step": 248790 }, { "epoch": 0.43, "learning_rate": 2.8306134620549185e-05, "loss": 2.4712, "step": 248800 }, { "epoch": 0.43, "learning_rate": 2.830526268062236e-05, "loss": 2.4074, "step": 248810 }, { "epoch": 0.43, "learning_rate": 2.830439074069553e-05, "loss": 2.455, "step": 248820 }, { "epoch": 0.43, "learning_rate": 2.8303518800768702e-05, "loss": 2.4181, "step": 248830 }, { "epoch": 0.43, "learning_rate": 2.8302646860841876e-05, "loss": 2.3692, "step": 248840 }, { "epoch": 0.43, "learning_rate": 2.8301774920915047e-05, "loss": 2.2579, "step": 248850 }, { "epoch": 0.43, "learning_rate": 2.8300902980988224e-05, "loss": 2.3381, "step": 248860 }, { "epoch": 0.43, "learning_rate": 2.8300031041061398e-05, "loss": 2.3975, "step": 248870 }, { "epoch": 0.43, "learning_rate": 2.829915910113457e-05, "loss": 2.4753, "step": 248880 }, { "epoch": 0.43, "learning_rate": 2.829828716120774e-05, "loss": 2.3337, "step": 248890 }, { "epoch": 0.43, "learning_rate": 2.8297415221280915e-05, "loss": 2.3176, "step": 248900 }, { "epoch": 0.43, "learning_rate": 2.829654328135409e-05, "loss": 2.3428, "step": 248910 }, { "epoch": 0.43, "learning_rate": 2.829567134142726e-05, "loss": 2.3428, "step": 248920 }, { "epoch": 0.43, "learning_rate": 2.8294799401500437e-05, "loss": 2.2915, "step": 248930 }, { "epoch": 0.43, "learning_rate": 2.829392746157361e-05, "loss": 2.4295, "step": 248940 }, { "epoch": 0.43, "learning_rate": 2.8293055521646784e-05, "loss": 2.4371, "step": 248950 }, { "epoch": 0.43, "learning_rate": 2.8292183581719955e-05, "loss": 2.297, "step": 248960 }, { "epoch": 0.43, "learning_rate": 2.829131164179313e-05, "loss": 2.2187, "step": 248970 }, { "epoch": 0.43, "learning_rate": 2.82904397018663e-05, "loss": 2.4937, "step": 248980 }, { "epoch": 0.43, "learning_rate": 2.8289567761939473e-05, "loss": 2.4701, "step": 248990 }, { "epoch": 0.43, "learning_rate": 2.8288695822012646e-05, "loss": 2.2846, "step": 249000 }, { "epoch": 0.43, "learning_rate": 2.8287823882085824e-05, "loss": 2.458, "step": 249010 }, { "epoch": 0.43, "learning_rate": 2.8286951942158997e-05, "loss": 2.344, "step": 249020 }, { "epoch": 0.43, "learning_rate": 2.8286080002232168e-05, "loss": 2.4567, "step": 249030 }, { "epoch": 0.43, "learning_rate": 2.828520806230534e-05, "loss": 2.47, "step": 249040 }, { "epoch": 0.43, "learning_rate": 2.8284336122378512e-05, "loss": 2.5644, "step": 249050 }, { "epoch": 0.43, "learning_rate": 2.8283464182451686e-05, "loss": 2.3866, "step": 249060 }, { "epoch": 0.43, "learning_rate": 2.828259224252486e-05, "loss": 2.4076, "step": 249070 }, { "epoch": 0.43, "learning_rate": 2.8281720302598037e-05, "loss": 2.398, "step": 249080 }, { "epoch": 0.43, "learning_rate": 2.8280848362671207e-05, "loss": 2.4526, "step": 249090 }, { "epoch": 0.43, "learning_rate": 2.827997642274438e-05, "loss": 2.4631, "step": 249100 }, { "epoch": 0.43, "learning_rate": 2.8279104482817554e-05, "loss": 2.3608, "step": 249110 }, { "epoch": 0.43, "learning_rate": 2.8278232542890725e-05, "loss": 2.4666, "step": 249120 }, { "epoch": 0.43, "learning_rate": 2.82773606029639e-05, "loss": 2.431, "step": 249130 }, { "epoch": 0.43, "learning_rate": 2.827648866303707e-05, "loss": 2.3059, "step": 249140 }, { "epoch": 0.43, "learning_rate": 2.827561672311025e-05, "loss": 2.3784, "step": 249150 }, { "epoch": 0.43, "learning_rate": 2.827474478318342e-05, "loss": 2.3872, "step": 249160 }, { "epoch": 0.43, "learning_rate": 2.8273872843256594e-05, "loss": 2.4111, "step": 249170 }, { "epoch": 0.43, "learning_rate": 2.8273000903329767e-05, "loss": 2.4353, "step": 249180 }, { "epoch": 0.43, "learning_rate": 2.8272128963402938e-05, "loss": 2.3155, "step": 249190 }, { "epoch": 0.43, "learning_rate": 2.827125702347611e-05, "loss": 2.3918, "step": 249200 }, { "epoch": 0.43, "learning_rate": 2.8270385083549282e-05, "loss": 2.325, "step": 249210 }, { "epoch": 0.43, "learning_rate": 2.8269513143622456e-05, "loss": 2.4625, "step": 249220 }, { "epoch": 0.43, "learning_rate": 2.8268641203695633e-05, "loss": 2.3801, "step": 249230 }, { "epoch": 0.43, "learning_rate": 2.8267769263768807e-05, "loss": 2.4026, "step": 249240 }, { "epoch": 0.43, "learning_rate": 2.8266897323841977e-05, "loss": 2.3312, "step": 249250 }, { "epoch": 0.43, "learning_rate": 2.826602538391515e-05, "loss": 2.4112, "step": 249260 }, { "epoch": 0.43, "learning_rate": 2.8265153443988325e-05, "loss": 2.3629, "step": 249270 }, { "epoch": 0.43, "learning_rate": 2.8264281504061495e-05, "loss": 2.4734, "step": 249280 }, { "epoch": 0.43, "learning_rate": 2.826340956413467e-05, "loss": 2.2905, "step": 249290 }, { "epoch": 0.43, "learning_rate": 2.8262537624207846e-05, "loss": 2.3896, "step": 249300 }, { "epoch": 0.43, "learning_rate": 2.826166568428102e-05, "loss": 2.3844, "step": 249310 }, { "epoch": 0.43, "learning_rate": 2.826079374435419e-05, "loss": 2.3669, "step": 249320 }, { "epoch": 0.43, "learning_rate": 2.8259921804427364e-05, "loss": 2.335, "step": 249330 }, { "epoch": 0.43, "learning_rate": 2.8259049864500538e-05, "loss": 2.3055, "step": 249340 }, { "epoch": 0.43, "learning_rate": 2.8258177924573708e-05, "loss": 2.4332, "step": 249350 }, { "epoch": 0.43, "learning_rate": 2.8257305984646882e-05, "loss": 2.5294, "step": 249360 }, { "epoch": 0.43, "learning_rate": 2.8256434044720052e-05, "loss": 2.4437, "step": 249370 }, { "epoch": 0.43, "learning_rate": 2.8255562104793233e-05, "loss": 2.5043, "step": 249380 }, { "epoch": 0.43, "learning_rate": 2.8254690164866403e-05, "loss": 2.3785, "step": 249390 }, { "epoch": 0.43, "learning_rate": 2.8253818224939577e-05, "loss": 2.5137, "step": 249400 }, { "epoch": 0.43, "learning_rate": 2.825294628501275e-05, "loss": 2.384, "step": 249410 }, { "epoch": 0.43, "learning_rate": 2.825207434508592e-05, "loss": 2.413, "step": 249420 }, { "epoch": 0.43, "learning_rate": 2.8251202405159095e-05, "loss": 2.3799, "step": 249430 }, { "epoch": 0.43, "learning_rate": 2.8250330465232265e-05, "loss": 2.3674, "step": 249440 }, { "epoch": 0.44, "learning_rate": 2.8249458525305446e-05, "loss": 2.3922, "step": 249450 }, { "epoch": 0.44, "learning_rate": 2.8248586585378616e-05, "loss": 2.4736, "step": 249460 }, { "epoch": 0.44, "learning_rate": 2.824771464545179e-05, "loss": 2.3516, "step": 249470 }, { "epoch": 0.44, "learning_rate": 2.824684270552496e-05, "loss": 2.4209, "step": 249480 }, { "epoch": 0.44, "learning_rate": 2.8245970765598134e-05, "loss": 2.3157, "step": 249490 }, { "epoch": 0.44, "learning_rate": 2.8245098825671308e-05, "loss": 2.3629, "step": 249500 }, { "epoch": 0.44, "learning_rate": 2.8244226885744478e-05, "loss": 2.3229, "step": 249510 }, { "epoch": 0.44, "learning_rate": 2.8243354945817652e-05, "loss": 2.3577, "step": 249520 }, { "epoch": 0.44, "learning_rate": 2.824248300589083e-05, "loss": 2.429, "step": 249530 }, { "epoch": 0.44, "learning_rate": 2.8241611065964003e-05, "loss": 2.3918, "step": 249540 }, { "epoch": 0.44, "learning_rate": 2.8240739126037173e-05, "loss": 2.4326, "step": 249550 }, { "epoch": 0.44, "learning_rate": 2.8239867186110347e-05, "loss": 2.3339, "step": 249560 }, { "epoch": 0.44, "learning_rate": 2.823899524618352e-05, "loss": 2.38, "step": 249570 }, { "epoch": 0.44, "learning_rate": 2.823812330625669e-05, "loss": 2.3335, "step": 249580 }, { "epoch": 0.44, "learning_rate": 2.8237251366329865e-05, "loss": 2.3282, "step": 249590 }, { "epoch": 0.44, "learning_rate": 2.8236379426403042e-05, "loss": 2.3702, "step": 249600 }, { "epoch": 0.44, "learning_rate": 2.8235507486476216e-05, "loss": 2.4401, "step": 249610 }, { "epoch": 0.44, "learning_rate": 2.8234635546549386e-05, "loss": 2.5287, "step": 249620 }, { "epoch": 0.44, "learning_rate": 2.823376360662256e-05, "loss": 2.4044, "step": 249630 }, { "epoch": 0.44, "learning_rate": 2.8232891666695734e-05, "loss": 2.3797, "step": 249640 }, { "epoch": 0.44, "learning_rate": 2.8232019726768904e-05, "loss": 2.3912, "step": 249650 }, { "epoch": 0.44, "learning_rate": 2.8231147786842078e-05, "loss": 2.2302, "step": 249660 }, { "epoch": 0.44, "learning_rate": 2.823027584691525e-05, "loss": 2.4194, "step": 249670 }, { "epoch": 0.44, "learning_rate": 2.822940390698843e-05, "loss": 2.3336, "step": 249680 }, { "epoch": 0.44, "learning_rate": 2.82285319670616e-05, "loss": 2.3014, "step": 249690 }, { "epoch": 0.44, "learning_rate": 2.8227660027134773e-05, "loss": 2.3539, "step": 249700 }, { "epoch": 0.44, "learning_rate": 2.8226788087207943e-05, "loss": 2.4192, "step": 249710 }, { "epoch": 0.44, "learning_rate": 2.8225916147281117e-05, "loss": 2.409, "step": 249720 }, { "epoch": 0.44, "learning_rate": 2.822504420735429e-05, "loss": 2.3183, "step": 249730 }, { "epoch": 0.44, "learning_rate": 2.822417226742746e-05, "loss": 2.365, "step": 249740 }, { "epoch": 0.44, "learning_rate": 2.8223300327500642e-05, "loss": 2.3742, "step": 249750 }, { "epoch": 0.44, "learning_rate": 2.8222428387573812e-05, "loss": 2.4174, "step": 249760 }, { "epoch": 0.44, "learning_rate": 2.8221556447646986e-05, "loss": 2.3699, "step": 249770 }, { "epoch": 0.44, "learning_rate": 2.8220684507720156e-05, "loss": 2.4081, "step": 249780 }, { "epoch": 0.44, "learning_rate": 2.821981256779333e-05, "loss": 2.4019, "step": 249790 }, { "epoch": 0.44, "learning_rate": 2.8218940627866504e-05, "loss": 2.3005, "step": 249800 }, { "epoch": 0.44, "learning_rate": 2.8218068687939674e-05, "loss": 2.3798, "step": 249810 }, { "epoch": 0.44, "learning_rate": 2.821719674801285e-05, "loss": 2.275, "step": 249820 }, { "epoch": 0.44, "learning_rate": 2.8216324808086025e-05, "loss": 2.3642, "step": 249830 }, { "epoch": 0.44, "learning_rate": 2.82154528681592e-05, "loss": 2.2631, "step": 249840 }, { "epoch": 0.44, "learning_rate": 2.821458092823237e-05, "loss": 2.3691, "step": 249850 }, { "epoch": 0.44, "learning_rate": 2.8213708988305543e-05, "loss": 2.3994, "step": 249860 }, { "epoch": 0.44, "learning_rate": 2.8212837048378714e-05, "loss": 2.3554, "step": 249870 }, { "epoch": 0.44, "learning_rate": 2.8211965108451887e-05, "loss": 2.223, "step": 249880 }, { "epoch": 0.44, "learning_rate": 2.821109316852506e-05, "loss": 2.3068, "step": 249890 }, { "epoch": 0.44, "learning_rate": 2.8210221228598238e-05, "loss": 2.3744, "step": 249900 }, { "epoch": 0.44, "learning_rate": 2.8209349288671412e-05, "loss": 2.4611, "step": 249910 }, { "epoch": 0.44, "learning_rate": 2.8208477348744582e-05, "loss": 2.4337, "step": 249920 }, { "epoch": 0.44, "learning_rate": 2.8207605408817756e-05, "loss": 2.3842, "step": 249930 }, { "epoch": 0.44, "learning_rate": 2.8206733468890927e-05, "loss": 2.4696, "step": 249940 }, { "epoch": 0.44, "learning_rate": 2.82058615289641e-05, "loss": 2.3131, "step": 249950 }, { "epoch": 0.44, "learning_rate": 2.8204989589037274e-05, "loss": 2.3421, "step": 249960 }, { "epoch": 0.44, "learning_rate": 2.820411764911045e-05, "loss": 2.3899, "step": 249970 }, { "epoch": 0.44, "learning_rate": 2.820324570918362e-05, "loss": 2.3702, "step": 249980 }, { "epoch": 0.44, "learning_rate": 2.8202373769256795e-05, "loss": 2.3528, "step": 249990 }, { "epoch": 0.44, "learning_rate": 2.820150182932997e-05, "loss": 2.4109, "step": 250000 }, { "epoch": 0.44, "learning_rate": 2.820062988940314e-05, "loss": 2.4066, "step": 250010 }, { "epoch": 0.44, "learning_rate": 2.8199757949476313e-05, "loss": 2.3437, "step": 250020 }, { "epoch": 0.44, "learning_rate": 2.8198886009549487e-05, "loss": 2.4409, "step": 250030 }, { "epoch": 0.44, "learning_rate": 2.8198014069622657e-05, "loss": 2.4333, "step": 250040 }, { "epoch": 0.44, "learning_rate": 2.8197142129695835e-05, "loss": 2.3758, "step": 250050 }, { "epoch": 0.44, "learning_rate": 2.819627018976901e-05, "loss": 2.4991, "step": 250060 }, { "epoch": 0.44, "learning_rate": 2.8195398249842182e-05, "loss": 2.3851, "step": 250070 }, { "epoch": 0.44, "learning_rate": 2.8194526309915353e-05, "loss": 2.4059, "step": 250080 }, { "epoch": 0.44, "learning_rate": 2.8193654369988526e-05, "loss": 2.3711, "step": 250090 }, { "epoch": 0.44, "learning_rate": 2.8192782430061697e-05, "loss": 2.283, "step": 250100 }, { "epoch": 0.44, "learning_rate": 2.819191049013487e-05, "loss": 2.3302, "step": 250110 }, { "epoch": 0.44, "learning_rate": 2.8191038550208048e-05, "loss": 2.3547, "step": 250120 }, { "epoch": 0.44, "learning_rate": 2.819016661028122e-05, "loss": 2.3298, "step": 250130 }, { "epoch": 0.44, "learning_rate": 2.8189294670354395e-05, "loss": 2.3518, "step": 250140 }, { "epoch": 0.44, "learning_rate": 2.8188422730427566e-05, "loss": 2.4255, "step": 250150 }, { "epoch": 0.44, "learning_rate": 2.818755079050074e-05, "loss": 2.4486, "step": 250160 }, { "epoch": 0.44, "learning_rate": 2.818667885057391e-05, "loss": 2.3114, "step": 250170 }, { "epoch": 0.44, "learning_rate": 2.8185806910647083e-05, "loss": 2.4562, "step": 250180 }, { "epoch": 0.44, "learning_rate": 2.8184934970720257e-05, "loss": 2.3166, "step": 250190 }, { "epoch": 0.44, "learning_rate": 2.8184063030793434e-05, "loss": 2.2788, "step": 250200 }, { "epoch": 0.44, "learning_rate": 2.8183191090866605e-05, "loss": 2.3477, "step": 250210 }, { "epoch": 0.44, "learning_rate": 2.818231915093978e-05, "loss": 2.3876, "step": 250220 }, { "epoch": 0.44, "learning_rate": 2.8181447211012952e-05, "loss": 2.3946, "step": 250230 }, { "epoch": 0.44, "learning_rate": 2.8180575271086123e-05, "loss": 2.3983, "step": 250240 }, { "epoch": 0.44, "learning_rate": 2.8179703331159296e-05, "loss": 2.3794, "step": 250250 }, { "epoch": 0.44, "learning_rate": 2.817883139123247e-05, "loss": 2.3631, "step": 250260 }, { "epoch": 0.44, "learning_rate": 2.8177959451305647e-05, "loss": 2.3901, "step": 250270 }, { "epoch": 0.44, "learning_rate": 2.8177087511378818e-05, "loss": 2.4371, "step": 250280 }, { "epoch": 0.44, "learning_rate": 2.817621557145199e-05, "loss": 2.3947, "step": 250290 }, { "epoch": 0.44, "learning_rate": 2.8175343631525165e-05, "loss": 2.3943, "step": 250300 }, { "epoch": 0.44, "learning_rate": 2.8174471691598336e-05, "loss": 2.4379, "step": 250310 }, { "epoch": 0.44, "learning_rate": 2.817359975167151e-05, "loss": 2.3251, "step": 250320 }, { "epoch": 0.44, "learning_rate": 2.817272781174468e-05, "loss": 2.4425, "step": 250330 }, { "epoch": 0.44, "learning_rate": 2.817185587181786e-05, "loss": 2.5714, "step": 250340 }, { "epoch": 0.44, "learning_rate": 2.817098393189103e-05, "loss": 2.1696, "step": 250350 }, { "epoch": 0.44, "learning_rate": 2.8170111991964205e-05, "loss": 2.4102, "step": 250360 }, { "epoch": 0.44, "learning_rate": 2.816924005203738e-05, "loss": 2.4223, "step": 250370 }, { "epoch": 0.44, "learning_rate": 2.816836811211055e-05, "loss": 2.3931, "step": 250380 }, { "epoch": 0.44, "learning_rate": 2.8167496172183722e-05, "loss": 2.4592, "step": 250390 }, { "epoch": 0.44, "learning_rate": 2.8166624232256893e-05, "loss": 2.3698, "step": 250400 }, { "epoch": 0.44, "learning_rate": 2.8165752292330067e-05, "loss": 2.4895, "step": 250410 }, { "epoch": 0.44, "learning_rate": 2.8164880352403244e-05, "loss": 2.316, "step": 250420 }, { "epoch": 0.44, "learning_rate": 2.8164008412476418e-05, "loss": 2.4881, "step": 250430 }, { "epoch": 0.44, "learning_rate": 2.8163136472549588e-05, "loss": 2.389, "step": 250440 }, { "epoch": 0.44, "learning_rate": 2.8162264532622762e-05, "loss": 2.4297, "step": 250450 }, { "epoch": 0.44, "learning_rate": 2.8161392592695935e-05, "loss": 2.3178, "step": 250460 }, { "epoch": 0.44, "learning_rate": 2.8160520652769106e-05, "loss": 2.3214, "step": 250470 }, { "epoch": 0.44, "learning_rate": 2.815964871284228e-05, "loss": 2.3869, "step": 250480 }, { "epoch": 0.44, "learning_rate": 2.8158776772915457e-05, "loss": 2.3227, "step": 250490 }, { "epoch": 0.44, "learning_rate": 2.815790483298863e-05, "loss": 2.3362, "step": 250500 }, { "epoch": 0.44, "learning_rate": 2.81570328930618e-05, "loss": 2.3021, "step": 250510 }, { "epoch": 0.44, "learning_rate": 2.8156160953134975e-05, "loss": 2.4497, "step": 250520 }, { "epoch": 0.44, "learning_rate": 2.815528901320815e-05, "loss": 2.3597, "step": 250530 }, { "epoch": 0.44, "learning_rate": 2.815441707328132e-05, "loss": 2.4744, "step": 250540 }, { "epoch": 0.44, "learning_rate": 2.8153545133354493e-05, "loss": 2.3717, "step": 250550 }, { "epoch": 0.44, "learning_rate": 2.8152673193427663e-05, "loss": 2.4429, "step": 250560 }, { "epoch": 0.44, "learning_rate": 2.8151801253500844e-05, "loss": 2.4086, "step": 250570 }, { "epoch": 0.44, "learning_rate": 2.8150929313574014e-05, "loss": 2.4956, "step": 250580 }, { "epoch": 0.44, "learning_rate": 2.8150057373647188e-05, "loss": 2.4202, "step": 250590 }, { "epoch": 0.44, "learning_rate": 2.8149185433720358e-05, "loss": 2.4012, "step": 250600 }, { "epoch": 0.44, "learning_rate": 2.8148313493793532e-05, "loss": 2.4827, "step": 250610 }, { "epoch": 0.44, "learning_rate": 2.8147441553866706e-05, "loss": 2.3177, "step": 250620 }, { "epoch": 0.44, "learning_rate": 2.8146569613939876e-05, "loss": 2.4161, "step": 250630 }, { "epoch": 0.44, "learning_rate": 2.8145697674013057e-05, "loss": 2.4524, "step": 250640 }, { "epoch": 0.44, "learning_rate": 2.8144825734086227e-05, "loss": 2.2542, "step": 250650 }, { "epoch": 0.44, "learning_rate": 2.81439537941594e-05, "loss": 2.3453, "step": 250660 }, { "epoch": 0.44, "learning_rate": 2.814308185423257e-05, "loss": 2.3545, "step": 250670 }, { "epoch": 0.44, "learning_rate": 2.8142209914305745e-05, "loss": 2.4145, "step": 250680 }, { "epoch": 0.44, "learning_rate": 2.814133797437892e-05, "loss": 2.4047, "step": 250690 }, { "epoch": 0.44, "learning_rate": 2.814046603445209e-05, "loss": 2.24, "step": 250700 }, { "epoch": 0.44, "learning_rate": 2.8139594094525263e-05, "loss": 2.3585, "step": 250710 }, { "epoch": 0.44, "learning_rate": 2.813872215459844e-05, "loss": 2.336, "step": 250720 }, { "epoch": 0.44, "learning_rate": 2.8137850214671614e-05, "loss": 2.4156, "step": 250730 }, { "epoch": 0.44, "learning_rate": 2.8136978274744784e-05, "loss": 2.3499, "step": 250740 }, { "epoch": 0.44, "learning_rate": 2.8136106334817958e-05, "loss": 2.3701, "step": 250750 }, { "epoch": 0.44, "learning_rate": 2.813523439489113e-05, "loss": 2.3332, "step": 250760 }, { "epoch": 0.44, "learning_rate": 2.8134362454964302e-05, "loss": 2.3162, "step": 250770 }, { "epoch": 0.44, "learning_rate": 2.8133490515037476e-05, "loss": 2.3157, "step": 250780 }, { "epoch": 0.44, "learning_rate": 2.8132618575110653e-05, "loss": 2.3869, "step": 250790 }, { "epoch": 0.44, "learning_rate": 2.8131746635183827e-05, "loss": 2.3601, "step": 250800 }, { "epoch": 0.44, "learning_rate": 2.8130874695256997e-05, "loss": 2.4291, "step": 250810 }, { "epoch": 0.44, "learning_rate": 2.813000275533017e-05, "loss": 2.4127, "step": 250820 }, { "epoch": 0.44, "learning_rate": 2.812913081540334e-05, "loss": 2.3183, "step": 250830 }, { "epoch": 0.44, "learning_rate": 2.8128258875476515e-05, "loss": 2.4982, "step": 250840 }, { "epoch": 0.44, "learning_rate": 2.812738693554969e-05, "loss": 2.4576, "step": 250850 }, { "epoch": 0.44, "learning_rate": 2.812651499562286e-05, "loss": 2.4828, "step": 250860 }, { "epoch": 0.44, "learning_rate": 2.812564305569604e-05, "loss": 2.5099, "step": 250870 }, { "epoch": 0.44, "learning_rate": 2.812477111576921e-05, "loss": 2.3744, "step": 250880 }, { "epoch": 0.44, "learning_rate": 2.8123899175842384e-05, "loss": 2.3456, "step": 250890 }, { "epoch": 0.44, "learning_rate": 2.8123027235915554e-05, "loss": 2.3745, "step": 250900 }, { "epoch": 0.44, "learning_rate": 2.8122155295988728e-05, "loss": 2.3907, "step": 250910 }, { "epoch": 0.44, "learning_rate": 2.8121283356061902e-05, "loss": 2.3744, "step": 250920 }, { "epoch": 0.44, "learning_rate": 2.8120411416135072e-05, "loss": 2.3239, "step": 250930 }, { "epoch": 0.44, "learning_rate": 2.811953947620825e-05, "loss": 2.3716, "step": 250940 }, { "epoch": 0.44, "learning_rate": 2.8118667536281423e-05, "loss": 2.3529, "step": 250950 }, { "epoch": 0.44, "learning_rate": 2.8117795596354597e-05, "loss": 2.3612, "step": 250960 }, { "epoch": 0.44, "learning_rate": 2.8116923656427767e-05, "loss": 2.2948, "step": 250970 }, { "epoch": 0.44, "learning_rate": 2.811605171650094e-05, "loss": 2.3537, "step": 250980 }, { "epoch": 0.44, "learning_rate": 2.8115179776574115e-05, "loss": 2.3536, "step": 250990 }, { "epoch": 0.44, "learning_rate": 2.8114307836647285e-05, "loss": 2.3416, "step": 251000 }, { "epoch": 0.44, "learning_rate": 2.8113435896720462e-05, "loss": 2.2796, "step": 251010 }, { "epoch": 0.44, "learning_rate": 2.8112563956793636e-05, "loss": 2.1598, "step": 251020 }, { "epoch": 0.44, "learning_rate": 2.811169201686681e-05, "loss": 2.3941, "step": 251030 }, { "epoch": 0.44, "learning_rate": 2.811082007693998e-05, "loss": 2.4109, "step": 251040 }, { "epoch": 0.44, "learning_rate": 2.8109948137013154e-05, "loss": 2.3269, "step": 251050 }, { "epoch": 0.44, "learning_rate": 2.8109076197086324e-05, "loss": 2.4919, "step": 251060 }, { "epoch": 0.44, "learning_rate": 2.8108204257159498e-05, "loss": 2.3991, "step": 251070 }, { "epoch": 0.44, "learning_rate": 2.8107332317232672e-05, "loss": 2.3607, "step": 251080 }, { "epoch": 0.44, "learning_rate": 2.810646037730585e-05, "loss": 2.3327, "step": 251090 }, { "epoch": 0.44, "learning_rate": 2.8105588437379023e-05, "loss": 2.4526, "step": 251100 }, { "epoch": 0.44, "learning_rate": 2.8104716497452193e-05, "loss": 2.4055, "step": 251110 }, { "epoch": 0.44, "learning_rate": 2.8103844557525367e-05, "loss": 2.4559, "step": 251120 }, { "epoch": 0.44, "learning_rate": 2.8102972617598537e-05, "loss": 2.3667, "step": 251130 }, { "epoch": 0.44, "learning_rate": 2.810210067767171e-05, "loss": 2.2985, "step": 251140 }, { "epoch": 0.44, "learning_rate": 2.8101228737744885e-05, "loss": 2.4075, "step": 251150 }, { "epoch": 0.44, "learning_rate": 2.8100356797818062e-05, "loss": 2.4902, "step": 251160 }, { "epoch": 0.44, "learning_rate": 2.8099484857891232e-05, "loss": 2.3624, "step": 251170 }, { "epoch": 0.44, "learning_rate": 2.8098612917964406e-05, "loss": 2.3139, "step": 251180 }, { "epoch": 0.44, "learning_rate": 2.809774097803758e-05, "loss": 2.4476, "step": 251190 }, { "epoch": 0.44, "learning_rate": 2.809686903811075e-05, "loss": 2.406, "step": 251200 }, { "epoch": 0.44, "learning_rate": 2.8095997098183924e-05, "loss": 2.4883, "step": 251210 }, { "epoch": 0.44, "learning_rate": 2.8095125158257095e-05, "loss": 2.4377, "step": 251220 }, { "epoch": 0.44, "learning_rate": 2.809425321833027e-05, "loss": 2.3754, "step": 251230 }, { "epoch": 0.44, "learning_rate": 2.8093381278403445e-05, "loss": 2.3678, "step": 251240 }, { "epoch": 0.44, "learning_rate": 2.809250933847662e-05, "loss": 2.4361, "step": 251250 }, { "epoch": 0.44, "learning_rate": 2.8091637398549793e-05, "loss": 2.4963, "step": 251260 }, { "epoch": 0.44, "learning_rate": 2.8090765458622963e-05, "loss": 2.3533, "step": 251270 }, { "epoch": 0.44, "learning_rate": 2.8089893518696137e-05, "loss": 2.3312, "step": 251280 }, { "epoch": 0.44, "learning_rate": 2.8089021578769308e-05, "loss": 2.3356, "step": 251290 }, { "epoch": 0.44, "learning_rate": 2.808814963884248e-05, "loss": 2.4532, "step": 251300 }, { "epoch": 0.44, "learning_rate": 2.808727769891566e-05, "loss": 2.4308, "step": 251310 }, { "epoch": 0.44, "learning_rate": 2.8086405758988832e-05, "loss": 2.4363, "step": 251320 }, { "epoch": 0.44, "learning_rate": 2.8085533819062003e-05, "loss": 2.3676, "step": 251330 }, { "epoch": 0.44, "learning_rate": 2.8084661879135176e-05, "loss": 2.3274, "step": 251340 }, { "epoch": 0.44, "learning_rate": 2.808378993920835e-05, "loss": 2.4045, "step": 251350 }, { "epoch": 0.44, "learning_rate": 2.808291799928152e-05, "loss": 2.3822, "step": 251360 }, { "epoch": 0.44, "learning_rate": 2.8082046059354694e-05, "loss": 2.3902, "step": 251370 }, { "epoch": 0.44, "learning_rate": 2.8081174119427868e-05, "loss": 2.411, "step": 251380 }, { "epoch": 0.44, "learning_rate": 2.8080302179501045e-05, "loss": 2.4034, "step": 251390 }, { "epoch": 0.44, "learning_rate": 2.8079430239574216e-05, "loss": 2.2519, "step": 251400 }, { "epoch": 0.44, "learning_rate": 2.807855829964739e-05, "loss": 2.3523, "step": 251410 }, { "epoch": 0.44, "learning_rate": 2.8077686359720563e-05, "loss": 2.3418, "step": 251420 }, { "epoch": 0.44, "learning_rate": 2.8076814419793734e-05, "loss": 2.3161, "step": 251430 }, { "epoch": 0.44, "learning_rate": 2.8075942479866907e-05, "loss": 2.4225, "step": 251440 }, { "epoch": 0.44, "learning_rate": 2.8075070539940078e-05, "loss": 2.3955, "step": 251450 }, { "epoch": 0.44, "learning_rate": 2.8074198600013258e-05, "loss": 2.2751, "step": 251460 }, { "epoch": 0.44, "learning_rate": 2.807332666008643e-05, "loss": 2.4628, "step": 251470 }, { "epoch": 0.44, "learning_rate": 2.8072454720159602e-05, "loss": 2.2813, "step": 251480 }, { "epoch": 0.44, "learning_rate": 2.8071582780232776e-05, "loss": 2.4014, "step": 251490 }, { "epoch": 0.44, "learning_rate": 2.8070710840305947e-05, "loss": 2.324, "step": 251500 }, { "epoch": 0.44, "learning_rate": 2.806983890037912e-05, "loss": 2.4562, "step": 251510 }, { "epoch": 0.44, "learning_rate": 2.806896696045229e-05, "loss": 2.4011, "step": 251520 }, { "epoch": 0.44, "learning_rate": 2.8068095020525464e-05, "loss": 2.3785, "step": 251530 }, { "epoch": 0.44, "learning_rate": 2.806722308059864e-05, "loss": 2.43, "step": 251540 }, { "epoch": 0.44, "learning_rate": 2.8066351140671815e-05, "loss": 2.4289, "step": 251550 }, { "epoch": 0.44, "learning_rate": 2.8065479200744986e-05, "loss": 2.3036, "step": 251560 }, { "epoch": 0.44, "learning_rate": 2.806460726081816e-05, "loss": 2.234, "step": 251570 }, { "epoch": 0.44, "learning_rate": 2.8063735320891333e-05, "loss": 2.4378, "step": 251580 }, { "epoch": 0.44, "learning_rate": 2.8062863380964504e-05, "loss": 2.4778, "step": 251590 }, { "epoch": 0.44, "learning_rate": 2.8061991441037677e-05, "loss": 2.2756, "step": 251600 }, { "epoch": 0.44, "learning_rate": 2.8061119501110855e-05, "loss": 2.4013, "step": 251610 }, { "epoch": 0.44, "learning_rate": 2.806024756118403e-05, "loss": 2.4779, "step": 251620 }, { "epoch": 0.44, "learning_rate": 2.80593756212572e-05, "loss": 2.4289, "step": 251630 }, { "epoch": 0.44, "learning_rate": 2.8058503681330373e-05, "loss": 2.4476, "step": 251640 }, { "epoch": 0.44, "learning_rate": 2.8057631741403546e-05, "loss": 2.3937, "step": 251650 }, { "epoch": 0.44, "learning_rate": 2.8056759801476717e-05, "loss": 2.2632, "step": 251660 }, { "epoch": 0.44, "learning_rate": 2.805588786154989e-05, "loss": 2.4158, "step": 251670 }, { "epoch": 0.44, "learning_rate": 2.8055015921623068e-05, "loss": 2.4459, "step": 251680 }, { "epoch": 0.44, "learning_rate": 2.805414398169624e-05, "loss": 2.3605, "step": 251690 }, { "epoch": 0.44, "learning_rate": 2.8053272041769412e-05, "loss": 2.4386, "step": 251700 }, { "epoch": 0.44, "learning_rate": 2.8052400101842586e-05, "loss": 2.5348, "step": 251710 }, { "epoch": 0.44, "learning_rate": 2.805152816191576e-05, "loss": 2.2894, "step": 251720 }, { "epoch": 0.44, "learning_rate": 2.805065622198893e-05, "loss": 2.4002, "step": 251730 }, { "epoch": 0.44, "learning_rate": 2.8049784282062103e-05, "loss": 2.41, "step": 251740 }, { "epoch": 0.44, "learning_rate": 2.8048912342135274e-05, "loss": 2.3929, "step": 251750 }, { "epoch": 0.44, "learning_rate": 2.8048040402208454e-05, "loss": 2.3957, "step": 251760 }, { "epoch": 0.44, "learning_rate": 2.8047168462281625e-05, "loss": 2.3754, "step": 251770 }, { "epoch": 0.44, "learning_rate": 2.80462965223548e-05, "loss": 2.2663, "step": 251780 }, { "epoch": 0.44, "learning_rate": 2.804542458242797e-05, "loss": 2.263, "step": 251790 }, { "epoch": 0.44, "learning_rate": 2.8044552642501143e-05, "loss": 2.4132, "step": 251800 }, { "epoch": 0.44, "learning_rate": 2.8043680702574316e-05, "loss": 2.348, "step": 251810 }, { "epoch": 0.44, "learning_rate": 2.8042808762647487e-05, "loss": 2.313, "step": 251820 }, { "epoch": 0.44, "learning_rate": 2.8041936822720667e-05, "loss": 2.354, "step": 251830 }, { "epoch": 0.44, "learning_rate": 2.8041064882793838e-05, "loss": 2.3332, "step": 251840 }, { "epoch": 0.44, "learning_rate": 2.804019294286701e-05, "loss": 2.3926, "step": 251850 }, { "epoch": 0.44, "learning_rate": 2.8039321002940182e-05, "loss": 2.3949, "step": 251860 }, { "epoch": 0.44, "learning_rate": 2.8038449063013356e-05, "loss": 2.4041, "step": 251870 }, { "epoch": 0.44, "learning_rate": 2.803757712308653e-05, "loss": 2.4173, "step": 251880 }, { "epoch": 0.44, "learning_rate": 2.80367051831597e-05, "loss": 2.3757, "step": 251890 }, { "epoch": 0.44, "learning_rate": 2.8035833243232874e-05, "loss": 2.3737, "step": 251900 }, { "epoch": 0.44, "learning_rate": 2.803496130330605e-05, "loss": 2.4748, "step": 251910 }, { "epoch": 0.44, "learning_rate": 2.8034089363379225e-05, "loss": 2.1998, "step": 251920 }, { "epoch": 0.44, "learning_rate": 2.8033217423452395e-05, "loss": 2.3128, "step": 251930 }, { "epoch": 0.44, "learning_rate": 2.803234548352557e-05, "loss": 2.3982, "step": 251940 }, { "epoch": 0.44, "learning_rate": 2.803147354359874e-05, "loss": 2.4231, "step": 251950 }, { "epoch": 0.44, "learning_rate": 2.8030601603671913e-05, "loss": 2.3601, "step": 251960 }, { "epoch": 0.44, "learning_rate": 2.8029729663745087e-05, "loss": 2.3963, "step": 251970 }, { "epoch": 0.44, "learning_rate": 2.8028857723818264e-05, "loss": 2.4489, "step": 251980 }, { "epoch": 0.44, "learning_rate": 2.8027985783891438e-05, "loss": 2.3805, "step": 251990 }, { "epoch": 0.44, "learning_rate": 2.8027113843964608e-05, "loss": 2.3272, "step": 252000 }, { "epoch": 0.44, "learning_rate": 2.8026241904037782e-05, "loss": 2.4034, "step": 252010 }, { "epoch": 0.44, "learning_rate": 2.8025369964110952e-05, "loss": 2.3077, "step": 252020 }, { "epoch": 0.44, "learning_rate": 2.8024498024184126e-05, "loss": 2.4061, "step": 252030 }, { "epoch": 0.44, "learning_rate": 2.80236260842573e-05, "loss": 2.4026, "step": 252040 }, { "epoch": 0.44, "learning_rate": 2.802275414433047e-05, "loss": 2.3885, "step": 252050 }, { "epoch": 0.44, "learning_rate": 2.8021882204403647e-05, "loss": 2.4024, "step": 252060 }, { "epoch": 0.44, "learning_rate": 2.802101026447682e-05, "loss": 2.5136, "step": 252070 }, { "epoch": 0.44, "learning_rate": 2.8020138324549995e-05, "loss": 2.3906, "step": 252080 }, { "epoch": 0.44, "learning_rate": 2.8019266384623165e-05, "loss": 2.3702, "step": 252090 }, { "epoch": 0.44, "learning_rate": 2.801839444469634e-05, "loss": 2.3901, "step": 252100 }, { "epoch": 0.44, "learning_rate": 2.8017522504769513e-05, "loss": 2.3298, "step": 252110 }, { "epoch": 0.44, "learning_rate": 2.8016650564842683e-05, "loss": 2.456, "step": 252120 }, { "epoch": 0.44, "learning_rate": 2.801577862491586e-05, "loss": 2.4105, "step": 252130 }, { "epoch": 0.44, "learning_rate": 2.8014906684989034e-05, "loss": 2.3389, "step": 252140 }, { "epoch": 0.44, "learning_rate": 2.8014034745062208e-05, "loss": 2.2879, "step": 252150 }, { "epoch": 0.44, "learning_rate": 2.8013162805135378e-05, "loss": 2.3225, "step": 252160 }, { "epoch": 0.44, "learning_rate": 2.8012290865208552e-05, "loss": 2.3801, "step": 252170 }, { "epoch": 0.44, "learning_rate": 2.8011418925281722e-05, "loss": 2.5363, "step": 252180 }, { "epoch": 0.44, "learning_rate": 2.8010546985354896e-05, "loss": 2.3707, "step": 252190 }, { "epoch": 0.44, "learning_rate": 2.8009675045428073e-05, "loss": 2.2859, "step": 252200 }, { "epoch": 0.44, "learning_rate": 2.8008803105501247e-05, "loss": 2.2788, "step": 252210 }, { "epoch": 0.44, "learning_rate": 2.800793116557442e-05, "loss": 2.3235, "step": 252220 }, { "epoch": 0.44, "learning_rate": 2.800705922564759e-05, "loss": 2.3716, "step": 252230 }, { "epoch": 0.44, "learning_rate": 2.8006187285720765e-05, "loss": 2.3452, "step": 252240 }, { "epoch": 0.44, "learning_rate": 2.8005315345793935e-05, "loss": 2.3842, "step": 252250 }, { "epoch": 0.44, "learning_rate": 2.800444340586711e-05, "loss": 2.4005, "step": 252260 }, { "epoch": 0.44, "learning_rate": 2.8003571465940283e-05, "loss": 2.3521, "step": 252270 }, { "epoch": 0.44, "learning_rate": 2.800269952601346e-05, "loss": 2.3703, "step": 252280 }, { "epoch": 0.44, "learning_rate": 2.800182758608663e-05, "loss": 2.4675, "step": 252290 }, { "epoch": 0.44, "learning_rate": 2.8000955646159804e-05, "loss": 2.404, "step": 252300 }, { "epoch": 0.44, "learning_rate": 2.8000083706232978e-05, "loss": 2.4154, "step": 252310 }, { "epoch": 0.44, "learning_rate": 2.7999211766306148e-05, "loss": 2.3558, "step": 252320 }, { "epoch": 0.44, "learning_rate": 2.7998339826379322e-05, "loss": 2.4599, "step": 252330 }, { "epoch": 0.44, "learning_rate": 2.7997467886452496e-05, "loss": 2.337, "step": 252340 }, { "epoch": 0.44, "learning_rate": 2.7996595946525673e-05, "loss": 2.2892, "step": 252350 }, { "epoch": 0.44, "learning_rate": 2.7995724006598843e-05, "loss": 2.4715, "step": 252360 }, { "epoch": 0.44, "learning_rate": 2.7994852066672017e-05, "loss": 2.2382, "step": 252370 }, { "epoch": 0.44, "learning_rate": 2.799398012674519e-05, "loss": 2.4403, "step": 252380 }, { "epoch": 0.44, "learning_rate": 2.799310818681836e-05, "loss": 2.2983, "step": 252390 }, { "epoch": 0.44, "learning_rate": 2.7992236246891535e-05, "loss": 2.4681, "step": 252400 }, { "epoch": 0.44, "learning_rate": 2.7991364306964705e-05, "loss": 2.3082, "step": 252410 }, { "epoch": 0.44, "learning_rate": 2.799049236703788e-05, "loss": 2.4649, "step": 252420 }, { "epoch": 0.44, "learning_rate": 2.7989620427111056e-05, "loss": 2.3244, "step": 252430 }, { "epoch": 0.44, "learning_rate": 2.798874848718423e-05, "loss": 2.4487, "step": 252440 }, { "epoch": 0.44, "learning_rate": 2.7987876547257404e-05, "loss": 2.3717, "step": 252450 }, { "epoch": 0.44, "learning_rate": 2.7987004607330574e-05, "loss": 2.3927, "step": 252460 }, { "epoch": 0.44, "learning_rate": 2.7986132667403748e-05, "loss": 2.4354, "step": 252470 }, { "epoch": 0.44, "learning_rate": 2.798526072747692e-05, "loss": 2.4476, "step": 252480 }, { "epoch": 0.44, "learning_rate": 2.7984388787550092e-05, "loss": 2.3703, "step": 252490 }, { "epoch": 0.44, "learning_rate": 2.798351684762327e-05, "loss": 2.4411, "step": 252500 }, { "epoch": 0.44, "learning_rate": 2.7982644907696443e-05, "loss": 2.4613, "step": 252510 }, { "epoch": 0.44, "learning_rate": 2.7981772967769613e-05, "loss": 2.3301, "step": 252520 }, { "epoch": 0.44, "learning_rate": 2.7980901027842787e-05, "loss": 2.4951, "step": 252530 }, { "epoch": 0.44, "learning_rate": 2.798002908791596e-05, "loss": 2.3589, "step": 252540 }, { "epoch": 0.44, "learning_rate": 2.797915714798913e-05, "loss": 2.3965, "step": 252550 }, { "epoch": 0.44, "learning_rate": 2.7978285208062305e-05, "loss": 2.303, "step": 252560 }, { "epoch": 0.44, "learning_rate": 2.7977413268135476e-05, "loss": 2.2844, "step": 252570 }, { "epoch": 0.44, "learning_rate": 2.7976541328208656e-05, "loss": 2.3835, "step": 252580 }, { "epoch": 0.44, "learning_rate": 2.7975669388281826e-05, "loss": 2.3843, "step": 252590 }, { "epoch": 0.44, "learning_rate": 2.7974797448355e-05, "loss": 2.3619, "step": 252600 }, { "epoch": 0.44, "learning_rate": 2.7973925508428174e-05, "loss": 2.3819, "step": 252610 }, { "epoch": 0.44, "learning_rate": 2.7973053568501344e-05, "loss": 2.3811, "step": 252620 }, { "epoch": 0.44, "learning_rate": 2.7972181628574518e-05, "loss": 2.4021, "step": 252630 }, { "epoch": 0.44, "learning_rate": 2.797130968864769e-05, "loss": 2.381, "step": 252640 }, { "epoch": 0.44, "learning_rate": 2.797043774872087e-05, "loss": 2.4214, "step": 252650 }, { "epoch": 0.44, "learning_rate": 2.796956580879404e-05, "loss": 2.4281, "step": 252660 }, { "epoch": 0.44, "learning_rate": 2.7968693868867213e-05, "loss": 2.5293, "step": 252670 }, { "epoch": 0.44, "learning_rate": 2.7967821928940384e-05, "loss": 2.4871, "step": 252680 }, { "epoch": 0.44, "learning_rate": 2.7966949989013557e-05, "loss": 2.3632, "step": 252690 }, { "epoch": 0.44, "learning_rate": 2.796607804908673e-05, "loss": 2.433, "step": 252700 }, { "epoch": 0.44, "learning_rate": 2.79652061091599e-05, "loss": 2.2376, "step": 252710 }, { "epoch": 0.44, "learning_rate": 2.7964334169233075e-05, "loss": 2.4449, "step": 252720 }, { "epoch": 0.44, "learning_rate": 2.7963462229306252e-05, "loss": 2.3139, "step": 252730 }, { "epoch": 0.44, "learning_rate": 2.7962590289379426e-05, "loss": 2.3087, "step": 252740 }, { "epoch": 0.44, "learning_rate": 2.7961718349452597e-05, "loss": 2.3744, "step": 252750 }, { "epoch": 0.44, "learning_rate": 2.796084640952577e-05, "loss": 2.2595, "step": 252760 }, { "epoch": 0.44, "learning_rate": 2.7959974469598944e-05, "loss": 2.4185, "step": 252770 }, { "epoch": 0.44, "learning_rate": 2.7959102529672115e-05, "loss": 2.4459, "step": 252780 }, { "epoch": 0.44, "learning_rate": 2.795823058974529e-05, "loss": 2.3861, "step": 252790 }, { "epoch": 0.44, "learning_rate": 2.7957358649818466e-05, "loss": 2.2961, "step": 252800 }, { "epoch": 0.44, "learning_rate": 2.795648670989164e-05, "loss": 2.4259, "step": 252810 }, { "epoch": 0.44, "learning_rate": 2.795561476996481e-05, "loss": 2.3727, "step": 252820 }, { "epoch": 0.44, "learning_rate": 2.7954742830037983e-05, "loss": 2.3013, "step": 252830 }, { "epoch": 0.44, "learning_rate": 2.7953870890111157e-05, "loss": 2.455, "step": 252840 }, { "epoch": 0.44, "learning_rate": 2.7952998950184328e-05, "loss": 2.3217, "step": 252850 }, { "epoch": 0.44, "learning_rate": 2.79521270102575e-05, "loss": 2.3621, "step": 252860 }, { "epoch": 0.44, "learning_rate": 2.795125507033068e-05, "loss": 2.4164, "step": 252870 }, { "epoch": 0.44, "learning_rate": 2.7950383130403852e-05, "loss": 2.3609, "step": 252880 }, { "epoch": 0.44, "learning_rate": 2.7949511190477023e-05, "loss": 2.2224, "step": 252890 }, { "epoch": 0.44, "learning_rate": 2.7948639250550196e-05, "loss": 2.4953, "step": 252900 }, { "epoch": 0.44, "learning_rate": 2.7947767310623367e-05, "loss": 2.3584, "step": 252910 }, { "epoch": 0.44, "learning_rate": 2.794689537069654e-05, "loss": 2.2805, "step": 252920 }, { "epoch": 0.44, "learning_rate": 2.7946023430769714e-05, "loss": 2.3276, "step": 252930 }, { "epoch": 0.44, "learning_rate": 2.7945151490842885e-05, "loss": 2.3945, "step": 252940 }, { "epoch": 0.44, "learning_rate": 2.7944279550916065e-05, "loss": 2.3548, "step": 252950 }, { "epoch": 0.44, "learning_rate": 2.7943407610989236e-05, "loss": 2.4061, "step": 252960 }, { "epoch": 0.44, "learning_rate": 2.794253567106241e-05, "loss": 2.3883, "step": 252970 }, { "epoch": 0.44, "learning_rate": 2.794166373113558e-05, "loss": 2.4618, "step": 252980 }, { "epoch": 0.44, "learning_rate": 2.7940791791208754e-05, "loss": 2.3111, "step": 252990 }, { "epoch": 0.44, "learning_rate": 2.7939919851281927e-05, "loss": 2.4725, "step": 253000 }, { "epoch": 0.44, "learning_rate": 2.7939047911355098e-05, "loss": 2.4055, "step": 253010 }, { "epoch": 0.44, "learning_rate": 2.7938175971428275e-05, "loss": 2.3291, "step": 253020 }, { "epoch": 0.44, "learning_rate": 2.793730403150145e-05, "loss": 2.3875, "step": 253030 }, { "epoch": 0.44, "learning_rate": 2.7936432091574622e-05, "loss": 2.3455, "step": 253040 }, { "epoch": 0.44, "learning_rate": 2.7935560151647793e-05, "loss": 2.2478, "step": 253050 }, { "epoch": 0.44, "learning_rate": 2.7934688211720967e-05, "loss": 2.2531, "step": 253060 }, { "epoch": 0.44, "learning_rate": 2.793381627179414e-05, "loss": 2.4143, "step": 253070 }, { "epoch": 0.44, "learning_rate": 2.793294433186731e-05, "loss": 2.4918, "step": 253080 }, { "epoch": 0.44, "learning_rate": 2.7932072391940484e-05, "loss": 2.3475, "step": 253090 }, { "epoch": 0.44, "learning_rate": 2.793120045201366e-05, "loss": 2.4201, "step": 253100 }, { "epoch": 0.44, "learning_rate": 2.7930328512086835e-05, "loss": 2.3384, "step": 253110 }, { "epoch": 0.44, "learning_rate": 2.7929456572160006e-05, "loss": 2.4081, "step": 253120 }, { "epoch": 0.44, "learning_rate": 2.792858463223318e-05, "loss": 2.3123, "step": 253130 }, { "epoch": 0.44, "learning_rate": 2.792771269230635e-05, "loss": 2.4216, "step": 253140 }, { "epoch": 0.44, "learning_rate": 2.7926840752379524e-05, "loss": 2.4099, "step": 253150 }, { "epoch": 0.44, "learning_rate": 2.7925968812452697e-05, "loss": 2.4541, "step": 253160 }, { "epoch": 0.44, "learning_rate": 2.7925096872525875e-05, "loss": 2.3362, "step": 253170 }, { "epoch": 0.44, "learning_rate": 2.792422493259905e-05, "loss": 2.3136, "step": 253180 }, { "epoch": 0.44, "learning_rate": 2.792335299267222e-05, "loss": 2.3909, "step": 253190 }, { "epoch": 0.44, "learning_rate": 2.7922481052745393e-05, "loss": 2.2755, "step": 253200 }, { "epoch": 0.44, "learning_rate": 2.7921609112818563e-05, "loss": 2.3424, "step": 253210 }, { "epoch": 0.44, "learning_rate": 2.7920737172891737e-05, "loss": 2.253, "step": 253220 }, { "epoch": 0.44, "learning_rate": 2.791986523296491e-05, "loss": 2.4602, "step": 253230 }, { "epoch": 0.44, "learning_rate": 2.791899329303808e-05, "loss": 2.2618, "step": 253240 }, { "epoch": 0.44, "learning_rate": 2.7918121353111258e-05, "loss": 2.3649, "step": 253250 }, { "epoch": 0.44, "learning_rate": 2.7917249413184432e-05, "loss": 2.3618, "step": 253260 }, { "epoch": 0.44, "learning_rate": 2.7916377473257606e-05, "loss": 2.3909, "step": 253270 }, { "epoch": 0.44, "learning_rate": 2.7915505533330776e-05, "loss": 2.3346, "step": 253280 }, { "epoch": 0.44, "learning_rate": 2.791463359340395e-05, "loss": 2.3196, "step": 253290 }, { "epoch": 0.44, "learning_rate": 2.791376165347712e-05, "loss": 2.3897, "step": 253300 }, { "epoch": 0.44, "learning_rate": 2.7912889713550294e-05, "loss": 2.2841, "step": 253310 }, { "epoch": 0.44, "learning_rate": 2.791201777362347e-05, "loss": 2.5143, "step": 253320 }, { "epoch": 0.44, "learning_rate": 2.7911145833696645e-05, "loss": 2.3907, "step": 253330 }, { "epoch": 0.44, "learning_rate": 2.791027389376982e-05, "loss": 2.4014, "step": 253340 }, { "epoch": 0.44, "learning_rate": 2.790940195384299e-05, "loss": 2.3574, "step": 253350 }, { "epoch": 0.44, "learning_rate": 2.7908530013916163e-05, "loss": 2.3802, "step": 253360 }, { "epoch": 0.44, "learning_rate": 2.7907658073989333e-05, "loss": 2.4666, "step": 253370 }, { "epoch": 0.44, "learning_rate": 2.7906786134062507e-05, "loss": 2.2977, "step": 253380 }, { "epoch": 0.44, "learning_rate": 2.790591419413568e-05, "loss": 2.325, "step": 253390 }, { "epoch": 0.44, "learning_rate": 2.7905042254208858e-05, "loss": 2.3386, "step": 253400 }, { "epoch": 0.44, "learning_rate": 2.7904170314282028e-05, "loss": 2.4159, "step": 253410 }, { "epoch": 0.44, "learning_rate": 2.7903298374355202e-05, "loss": 2.3303, "step": 253420 }, { "epoch": 0.44, "learning_rate": 2.7902426434428376e-05, "loss": 2.43, "step": 253430 }, { "epoch": 0.44, "learning_rate": 2.7901554494501546e-05, "loss": 2.345, "step": 253440 }, { "epoch": 0.44, "learning_rate": 2.790068255457472e-05, "loss": 2.4161, "step": 253450 }, { "epoch": 0.44, "learning_rate": 2.7899810614647894e-05, "loss": 2.4638, "step": 253460 }, { "epoch": 0.44, "learning_rate": 2.789893867472107e-05, "loss": 2.4566, "step": 253470 }, { "epoch": 0.44, "learning_rate": 2.789806673479424e-05, "loss": 2.3846, "step": 253480 }, { "epoch": 0.44, "learning_rate": 2.7897194794867415e-05, "loss": 2.4392, "step": 253490 }, { "epoch": 0.44, "learning_rate": 2.789632285494059e-05, "loss": 2.3946, "step": 253500 }, { "epoch": 0.44, "learning_rate": 2.789545091501376e-05, "loss": 2.3398, "step": 253510 }, { "epoch": 0.44, "learning_rate": 2.7894578975086933e-05, "loss": 2.2993, "step": 253520 }, { "epoch": 0.44, "learning_rate": 2.7893707035160103e-05, "loss": 2.3719, "step": 253530 }, { "epoch": 0.44, "learning_rate": 2.7892835095233284e-05, "loss": 2.3123, "step": 253540 }, { "epoch": 0.44, "learning_rate": 2.7891963155306454e-05, "loss": 2.4793, "step": 253550 }, { "epoch": 0.44, "learning_rate": 2.7891091215379628e-05, "loss": 2.4993, "step": 253560 }, { "epoch": 0.44, "learning_rate": 2.7890219275452802e-05, "loss": 2.4228, "step": 253570 }, { "epoch": 0.44, "learning_rate": 2.7889347335525972e-05, "loss": 2.4126, "step": 253580 }, { "epoch": 0.44, "learning_rate": 2.7888475395599146e-05, "loss": 2.4234, "step": 253590 }, { "epoch": 0.44, "learning_rate": 2.7887603455672316e-05, "loss": 2.4589, "step": 253600 }, { "epoch": 0.44, "learning_rate": 2.788673151574549e-05, "loss": 2.4502, "step": 253610 }, { "epoch": 0.44, "learning_rate": 2.7885859575818667e-05, "loss": 2.4486, "step": 253620 }, { "epoch": 0.44, "learning_rate": 2.788498763589184e-05, "loss": 2.3778, "step": 253630 }, { "epoch": 0.44, "learning_rate": 2.788411569596501e-05, "loss": 2.3555, "step": 253640 }, { "epoch": 0.44, "learning_rate": 2.7883243756038185e-05, "loss": 2.2546, "step": 253650 }, { "epoch": 0.44, "learning_rate": 2.788237181611136e-05, "loss": 2.371, "step": 253660 }, { "epoch": 0.44, "learning_rate": 2.788149987618453e-05, "loss": 2.2535, "step": 253670 }, { "epoch": 0.44, "learning_rate": 2.7880627936257703e-05, "loss": 2.2754, "step": 253680 }, { "epoch": 0.44, "learning_rate": 2.787975599633088e-05, "loss": 2.4369, "step": 253690 }, { "epoch": 0.44, "learning_rate": 2.7878884056404054e-05, "loss": 2.4667, "step": 253700 }, { "epoch": 0.44, "learning_rate": 2.7878012116477224e-05, "loss": 2.3364, "step": 253710 }, { "epoch": 0.44, "learning_rate": 2.7877140176550398e-05, "loss": 2.3633, "step": 253720 }, { "epoch": 0.44, "learning_rate": 2.7876268236623572e-05, "loss": 2.4322, "step": 253730 }, { "epoch": 0.44, "learning_rate": 2.7875396296696742e-05, "loss": 2.4737, "step": 253740 }, { "epoch": 0.44, "learning_rate": 2.7874524356769916e-05, "loss": 2.3413, "step": 253750 }, { "epoch": 0.44, "learning_rate": 2.7873652416843086e-05, "loss": 2.4138, "step": 253760 }, { "epoch": 0.44, "learning_rate": 2.7872780476916267e-05, "loss": 2.2766, "step": 253770 }, { "epoch": 0.44, "learning_rate": 2.7871908536989437e-05, "loss": 2.3735, "step": 253780 }, { "epoch": 0.44, "learning_rate": 2.787103659706261e-05, "loss": 2.3712, "step": 253790 }, { "epoch": 0.44, "learning_rate": 2.7870164657135785e-05, "loss": 2.3357, "step": 253800 }, { "epoch": 0.44, "learning_rate": 2.7869292717208955e-05, "loss": 2.4494, "step": 253810 }, { "epoch": 0.44, "learning_rate": 2.786842077728213e-05, "loss": 2.3612, "step": 253820 }, { "epoch": 0.44, "learning_rate": 2.78675488373553e-05, "loss": 2.4451, "step": 253830 }, { "epoch": 0.44, "learning_rate": 2.786667689742848e-05, "loss": 2.2992, "step": 253840 }, { "epoch": 0.44, "learning_rate": 2.786580495750165e-05, "loss": 2.379, "step": 253850 }, { "epoch": 0.44, "learning_rate": 2.7864933017574824e-05, "loss": 2.299, "step": 253860 }, { "epoch": 0.44, "learning_rate": 2.7864061077647995e-05, "loss": 2.4501, "step": 253870 }, { "epoch": 0.44, "learning_rate": 2.7863189137721168e-05, "loss": 2.3457, "step": 253880 }, { "epoch": 0.44, "learning_rate": 2.7862317197794342e-05, "loss": 2.3343, "step": 253890 }, { "epoch": 0.44, "learning_rate": 2.7861445257867512e-05, "loss": 2.4601, "step": 253900 }, { "epoch": 0.44, "learning_rate": 2.7860573317940686e-05, "loss": 2.3991, "step": 253910 }, { "epoch": 0.44, "learning_rate": 2.7859701378013863e-05, "loss": 2.3811, "step": 253920 }, { "epoch": 0.44, "learning_rate": 2.7858829438087037e-05, "loss": 2.477, "step": 253930 }, { "epoch": 0.44, "learning_rate": 2.7857957498160208e-05, "loss": 2.3679, "step": 253940 }, { "epoch": 0.44, "learning_rate": 2.785708555823338e-05, "loss": 2.3116, "step": 253950 }, { "epoch": 0.44, "learning_rate": 2.7856213618306555e-05, "loss": 2.3504, "step": 253960 }, { "epoch": 0.44, "learning_rate": 2.7855341678379725e-05, "loss": 2.4954, "step": 253970 }, { "epoch": 0.44, "learning_rate": 2.78544697384529e-05, "loss": 2.3926, "step": 253980 }, { "epoch": 0.44, "learning_rate": 2.7853597798526076e-05, "loss": 2.3871, "step": 253990 }, { "epoch": 0.44, "learning_rate": 2.785272585859925e-05, "loss": 2.3618, "step": 254000 }, { "epoch": 0.44, "learning_rate": 2.785185391867242e-05, "loss": 2.4318, "step": 254010 }, { "epoch": 0.44, "learning_rate": 2.7850981978745594e-05, "loss": 2.2959, "step": 254020 }, { "epoch": 0.44, "learning_rate": 2.7850110038818765e-05, "loss": 2.2827, "step": 254030 }, { "epoch": 0.44, "learning_rate": 2.784923809889194e-05, "loss": 2.4988, "step": 254040 }, { "epoch": 0.44, "learning_rate": 2.7848366158965112e-05, "loss": 2.4331, "step": 254050 }, { "epoch": 0.44, "learning_rate": 2.7847494219038283e-05, "loss": 2.4791, "step": 254060 }, { "epoch": 0.44, "learning_rate": 2.7846622279111463e-05, "loss": 2.2758, "step": 254070 }, { "epoch": 0.44, "learning_rate": 2.7845750339184634e-05, "loss": 2.4256, "step": 254080 }, { "epoch": 0.44, "learning_rate": 2.7844878399257807e-05, "loss": 2.351, "step": 254090 }, { "epoch": 0.44, "learning_rate": 2.7844006459330978e-05, "loss": 2.2288, "step": 254100 }, { "epoch": 0.44, "learning_rate": 2.784313451940415e-05, "loss": 2.4971, "step": 254110 }, { "epoch": 0.44, "learning_rate": 2.7842262579477325e-05, "loss": 2.3977, "step": 254120 }, { "epoch": 0.44, "learning_rate": 2.7841390639550496e-05, "loss": 2.3597, "step": 254130 }, { "epoch": 0.44, "learning_rate": 2.7840518699623673e-05, "loss": 2.3695, "step": 254140 }, { "epoch": 0.44, "learning_rate": 2.7839646759696847e-05, "loss": 2.2908, "step": 254150 }, { "epoch": 0.44, "learning_rate": 2.783877481977002e-05, "loss": 2.3935, "step": 254160 }, { "epoch": 0.44, "learning_rate": 2.783790287984319e-05, "loss": 2.4235, "step": 254170 }, { "epoch": 0.44, "learning_rate": 2.7837030939916364e-05, "loss": 2.454, "step": 254180 }, { "epoch": 0.44, "learning_rate": 2.7836158999989538e-05, "loss": 2.4713, "step": 254190 }, { "epoch": 0.44, "learning_rate": 2.783528706006271e-05, "loss": 2.419, "step": 254200 }, { "epoch": 0.44, "learning_rate": 2.7834415120135886e-05, "loss": 2.243, "step": 254210 }, { "epoch": 0.44, "learning_rate": 2.783354318020906e-05, "loss": 2.2918, "step": 254220 }, { "epoch": 0.44, "learning_rate": 2.7832671240282233e-05, "loss": 2.3447, "step": 254230 }, { "epoch": 0.44, "learning_rate": 2.7831799300355404e-05, "loss": 2.4251, "step": 254240 }, { "epoch": 0.44, "learning_rate": 2.7830927360428577e-05, "loss": 2.4489, "step": 254250 }, { "epoch": 0.44, "learning_rate": 2.7830055420501748e-05, "loss": 2.3353, "step": 254260 }, { "epoch": 0.44, "learning_rate": 2.782918348057492e-05, "loss": 2.4211, "step": 254270 }, { "epoch": 0.44, "learning_rate": 2.7828311540648095e-05, "loss": 2.4775, "step": 254280 }, { "epoch": 0.44, "learning_rate": 2.7827439600721273e-05, "loss": 2.4081, "step": 254290 }, { "epoch": 0.44, "learning_rate": 2.7826567660794446e-05, "loss": 2.3604, "step": 254300 }, { "epoch": 0.44, "learning_rate": 2.7825695720867617e-05, "loss": 2.3533, "step": 254310 }, { "epoch": 0.44, "learning_rate": 2.782482378094079e-05, "loss": 2.4634, "step": 254320 }, { "epoch": 0.44, "learning_rate": 2.782395184101396e-05, "loss": 2.4165, "step": 254330 }, { "epoch": 0.44, "learning_rate": 2.7823079901087135e-05, "loss": 2.3333, "step": 254340 }, { "epoch": 0.44, "learning_rate": 2.782220796116031e-05, "loss": 2.3115, "step": 254350 }, { "epoch": 0.44, "learning_rate": 2.7821336021233486e-05, "loss": 2.3354, "step": 254360 }, { "epoch": 0.44, "learning_rate": 2.7820464081306656e-05, "loss": 2.3869, "step": 254370 }, { "epoch": 0.44, "learning_rate": 2.781959214137983e-05, "loss": 2.3917, "step": 254380 }, { "epoch": 0.44, "learning_rate": 2.7818720201453003e-05, "loss": 2.4059, "step": 254390 }, { "epoch": 0.44, "learning_rate": 2.7817848261526174e-05, "loss": 2.4696, "step": 254400 }, { "epoch": 0.44, "learning_rate": 2.7816976321599348e-05, "loss": 2.4153, "step": 254410 }, { "epoch": 0.44, "learning_rate": 2.781610438167252e-05, "loss": 2.2645, "step": 254420 }, { "epoch": 0.44, "learning_rate": 2.7815232441745692e-05, "loss": 2.4301, "step": 254430 }, { "epoch": 0.44, "learning_rate": 2.781436050181887e-05, "loss": 2.4772, "step": 254440 }, { "epoch": 0.44, "learning_rate": 2.7813488561892043e-05, "loss": 2.2635, "step": 254450 }, { "epoch": 0.44, "learning_rate": 2.7812616621965216e-05, "loss": 2.4847, "step": 254460 }, { "epoch": 0.44, "learning_rate": 2.7811744682038387e-05, "loss": 2.466, "step": 254470 }, { "epoch": 0.44, "learning_rate": 2.781087274211156e-05, "loss": 2.2566, "step": 254480 }, { "epoch": 0.44, "learning_rate": 2.781000080218473e-05, "loss": 2.4071, "step": 254490 }, { "epoch": 0.44, "learning_rate": 2.7809128862257905e-05, "loss": 2.4377, "step": 254500 }, { "epoch": 0.44, "learning_rate": 2.7808256922331082e-05, "loss": 2.496, "step": 254510 }, { "epoch": 0.44, "learning_rate": 2.7807384982404256e-05, "loss": 2.3797, "step": 254520 }, { "epoch": 0.44, "learning_rate": 2.780651304247743e-05, "loss": 2.3672, "step": 254530 }, { "epoch": 0.44, "learning_rate": 2.78056411025506e-05, "loss": 2.4311, "step": 254540 }, { "epoch": 0.44, "learning_rate": 2.7804769162623774e-05, "loss": 2.5014, "step": 254550 }, { "epoch": 0.44, "learning_rate": 2.7803897222696944e-05, "loss": 2.4056, "step": 254560 }, { "epoch": 0.44, "learning_rate": 2.7803025282770118e-05, "loss": 2.3525, "step": 254570 }, { "epoch": 0.44, "learning_rate": 2.780215334284329e-05, "loss": 2.438, "step": 254580 }, { "epoch": 0.44, "learning_rate": 2.780128140291647e-05, "loss": 2.3297, "step": 254590 }, { "epoch": 0.44, "learning_rate": 2.780040946298964e-05, "loss": 2.4038, "step": 254600 }, { "epoch": 0.44, "learning_rate": 2.7799537523062813e-05, "loss": 2.4223, "step": 254610 }, { "epoch": 0.44, "learning_rate": 2.7798665583135987e-05, "loss": 2.2514, "step": 254620 }, { "epoch": 0.44, "learning_rate": 2.7797793643209157e-05, "loss": 2.3068, "step": 254630 }, { "epoch": 0.44, "learning_rate": 2.779692170328233e-05, "loss": 2.3871, "step": 254640 }, { "epoch": 0.44, "learning_rate": 2.77960497633555e-05, "loss": 2.4723, "step": 254650 }, { "epoch": 0.44, "learning_rate": 2.779517782342868e-05, "loss": 2.2598, "step": 254660 }, { "epoch": 0.44, "learning_rate": 2.7794305883501852e-05, "loss": 2.3702, "step": 254670 }, { "epoch": 0.44, "learning_rate": 2.7793433943575026e-05, "loss": 2.4173, "step": 254680 }, { "epoch": 0.44, "learning_rate": 2.77925620036482e-05, "loss": 2.4696, "step": 254690 }, { "epoch": 0.44, "learning_rate": 2.779169006372137e-05, "loss": 2.415, "step": 254700 }, { "epoch": 0.44, "learning_rate": 2.7790818123794544e-05, "loss": 2.297, "step": 254710 }, { "epoch": 0.44, "learning_rate": 2.7789946183867714e-05, "loss": 2.3732, "step": 254720 }, { "epoch": 0.44, "learning_rate": 2.7789074243940895e-05, "loss": 2.2799, "step": 254730 }, { "epoch": 0.44, "learning_rate": 2.7788202304014065e-05, "loss": 2.4427, "step": 254740 }, { "epoch": 0.44, "learning_rate": 2.778733036408724e-05, "loss": 2.3389, "step": 254750 }, { "epoch": 0.44, "learning_rate": 2.778645842416041e-05, "loss": 2.3127, "step": 254760 }, { "epoch": 0.44, "learning_rate": 2.7785586484233583e-05, "loss": 2.3231, "step": 254770 }, { "epoch": 0.44, "learning_rate": 2.7784714544306757e-05, "loss": 2.4384, "step": 254780 }, { "epoch": 0.44, "learning_rate": 2.7783842604379927e-05, "loss": 2.3482, "step": 254790 }, { "epoch": 0.44, "learning_rate": 2.77829706644531e-05, "loss": 2.3672, "step": 254800 }, { "epoch": 0.44, "learning_rate": 2.7782098724526278e-05, "loss": 2.3287, "step": 254810 }, { "epoch": 0.44, "learning_rate": 2.7781226784599452e-05, "loss": 2.3299, "step": 254820 }, { "epoch": 0.44, "learning_rate": 2.7780354844672622e-05, "loss": 2.4149, "step": 254830 }, { "epoch": 0.44, "learning_rate": 2.7779482904745796e-05, "loss": 2.453, "step": 254840 }, { "epoch": 0.44, "learning_rate": 2.777861096481897e-05, "loss": 2.3995, "step": 254850 }, { "epoch": 0.44, "learning_rate": 2.777773902489214e-05, "loss": 2.3704, "step": 254860 }, { "epoch": 0.44, "learning_rate": 2.7776867084965314e-05, "loss": 2.3278, "step": 254870 }, { "epoch": 0.44, "learning_rate": 2.777599514503849e-05, "loss": 2.306, "step": 254880 }, { "epoch": 0.44, "learning_rate": 2.7775123205111665e-05, "loss": 2.3666, "step": 254890 }, { "epoch": 0.44, "learning_rate": 2.7774251265184835e-05, "loss": 2.448, "step": 254900 }, { "epoch": 0.44, "learning_rate": 2.777337932525801e-05, "loss": 2.2609, "step": 254910 }, { "epoch": 0.44, "learning_rate": 2.7772507385331183e-05, "loss": 2.3974, "step": 254920 }, { "epoch": 0.44, "learning_rate": 2.7771635445404353e-05, "loss": 2.4358, "step": 254930 }, { "epoch": 0.44, "learning_rate": 2.7770763505477527e-05, "loss": 2.3303, "step": 254940 }, { "epoch": 0.44, "learning_rate": 2.7769891565550697e-05, "loss": 2.4265, "step": 254950 }, { "epoch": 0.44, "learning_rate": 2.7769019625623878e-05, "loss": 2.3487, "step": 254960 }, { "epoch": 0.44, "learning_rate": 2.7768147685697048e-05, "loss": 2.4594, "step": 254970 }, { "epoch": 0.44, "learning_rate": 2.7767275745770222e-05, "loss": 2.3718, "step": 254980 }, { "epoch": 0.44, "learning_rate": 2.7766403805843392e-05, "loss": 2.3995, "step": 254990 }, { "epoch": 0.44, "learning_rate": 2.7765531865916566e-05, "loss": 2.3212, "step": 255000 }, { "epoch": 0.44, "learning_rate": 2.776465992598974e-05, "loss": 2.4538, "step": 255010 }, { "epoch": 0.44, "learning_rate": 2.776378798606291e-05, "loss": 2.3578, "step": 255020 }, { "epoch": 0.44, "learning_rate": 2.776291604613609e-05, "loss": 2.275, "step": 255030 }, { "epoch": 0.44, "learning_rate": 2.776204410620926e-05, "loss": 2.4287, "step": 255040 }, { "epoch": 0.44, "learning_rate": 2.7761172166282435e-05, "loss": 2.4343, "step": 255050 }, { "epoch": 0.44, "learning_rate": 2.7760300226355605e-05, "loss": 2.4222, "step": 255060 }, { "epoch": 0.44, "learning_rate": 2.775942828642878e-05, "loss": 2.2925, "step": 255070 }, { "epoch": 0.44, "learning_rate": 2.7758556346501953e-05, "loss": 2.4017, "step": 255080 }, { "epoch": 0.44, "learning_rate": 2.7757684406575123e-05, "loss": 2.3306, "step": 255090 }, { "epoch": 0.44, "learning_rate": 2.7756812466648297e-05, "loss": 2.2624, "step": 255100 }, { "epoch": 0.44, "learning_rate": 2.7755940526721474e-05, "loss": 2.3064, "step": 255110 }, { "epoch": 0.44, "learning_rate": 2.7755068586794648e-05, "loss": 2.3719, "step": 255120 }, { "epoch": 0.44, "learning_rate": 2.775419664686782e-05, "loss": 2.4286, "step": 255130 }, { "epoch": 0.44, "learning_rate": 2.7753324706940992e-05, "loss": 2.3838, "step": 255140 }, { "epoch": 0.44, "learning_rate": 2.7752452767014166e-05, "loss": 2.4506, "step": 255150 }, { "epoch": 0.44, "learning_rate": 2.7751580827087336e-05, "loss": 2.5364, "step": 255160 }, { "epoch": 0.44, "learning_rate": 2.775070888716051e-05, "loss": 2.3726, "step": 255170 }, { "epoch": 0.45, "learning_rate": 2.7749836947233687e-05, "loss": 2.3261, "step": 255180 }, { "epoch": 0.45, "learning_rate": 2.774896500730686e-05, "loss": 2.3038, "step": 255190 }, { "epoch": 0.45, "learning_rate": 2.774809306738003e-05, "loss": 2.384, "step": 255200 }, { "epoch": 0.45, "learning_rate": 2.7747221127453205e-05, "loss": 2.4188, "step": 255210 }, { "epoch": 0.45, "learning_rate": 2.7746349187526376e-05, "loss": 2.265, "step": 255220 }, { "epoch": 0.45, "learning_rate": 2.774547724759955e-05, "loss": 2.2837, "step": 255230 }, { "epoch": 0.45, "learning_rate": 2.7744605307672723e-05, "loss": 2.3142, "step": 255240 }, { "epoch": 0.45, "learning_rate": 2.7743733367745893e-05, "loss": 2.4188, "step": 255250 }, { "epoch": 0.45, "learning_rate": 2.7742861427819074e-05, "loss": 2.4214, "step": 255260 }, { "epoch": 0.45, "learning_rate": 2.7741989487892244e-05, "loss": 2.4173, "step": 255270 }, { "epoch": 0.45, "learning_rate": 2.7741117547965418e-05, "loss": 2.3916, "step": 255280 }, { "epoch": 0.45, "learning_rate": 2.774024560803859e-05, "loss": 2.2544, "step": 255290 }, { "epoch": 0.45, "learning_rate": 2.7739373668111762e-05, "loss": 2.4617, "step": 255300 }, { "epoch": 0.45, "learning_rate": 2.7738501728184936e-05, "loss": 2.3542, "step": 255310 }, { "epoch": 0.45, "learning_rate": 2.7737629788258106e-05, "loss": 2.383, "step": 255320 }, { "epoch": 0.45, "learning_rate": 2.7736757848331284e-05, "loss": 2.3188, "step": 255330 }, { "epoch": 0.45, "learning_rate": 2.7735885908404457e-05, "loss": 2.3992, "step": 255340 }, { "epoch": 0.45, "learning_rate": 2.773501396847763e-05, "loss": 2.4868, "step": 255350 }, { "epoch": 0.45, "learning_rate": 2.77341420285508e-05, "loss": 2.4145, "step": 255360 }, { "epoch": 0.45, "learning_rate": 2.7733270088623975e-05, "loss": 2.387, "step": 255370 }, { "epoch": 0.45, "learning_rate": 2.7732398148697146e-05, "loss": 2.177, "step": 255380 }, { "epoch": 0.45, "learning_rate": 2.773152620877032e-05, "loss": 2.4626, "step": 255390 }, { "epoch": 0.45, "learning_rate": 2.7730654268843497e-05, "loss": 2.3987, "step": 255400 }, { "epoch": 0.45, "learning_rate": 2.772978232891667e-05, "loss": 2.4662, "step": 255410 }, { "epoch": 0.45, "learning_rate": 2.7728910388989844e-05, "loss": 2.361, "step": 255420 }, { "epoch": 0.45, "learning_rate": 2.7728038449063015e-05, "loss": 2.2769, "step": 255430 }, { "epoch": 0.45, "learning_rate": 2.7727166509136188e-05, "loss": 2.4207, "step": 255440 }, { "epoch": 0.45, "learning_rate": 2.772629456920936e-05, "loss": 2.3307, "step": 255450 }, { "epoch": 0.45, "learning_rate": 2.7725422629282532e-05, "loss": 2.3883, "step": 255460 }, { "epoch": 0.45, "learning_rate": 2.7724550689355706e-05, "loss": 2.3068, "step": 255470 }, { "epoch": 0.45, "learning_rate": 2.7723678749428883e-05, "loss": 2.3547, "step": 255480 }, { "epoch": 0.45, "learning_rate": 2.7722806809502054e-05, "loss": 2.3186, "step": 255490 }, { "epoch": 0.45, "learning_rate": 2.7721934869575228e-05, "loss": 2.3235, "step": 255500 }, { "epoch": 0.45, "learning_rate": 2.77210629296484e-05, "loss": 2.415, "step": 255510 }, { "epoch": 0.45, "learning_rate": 2.772019098972157e-05, "loss": 2.4369, "step": 255520 }, { "epoch": 0.45, "learning_rate": 2.7719319049794745e-05, "loss": 2.4112, "step": 255530 }, { "epoch": 0.45, "learning_rate": 2.771844710986792e-05, "loss": 2.3755, "step": 255540 }, { "epoch": 0.45, "learning_rate": 2.7717575169941096e-05, "loss": 2.3892, "step": 255550 }, { "epoch": 0.45, "learning_rate": 2.7716703230014267e-05, "loss": 2.4331, "step": 255560 }, { "epoch": 0.45, "learning_rate": 2.771583129008744e-05, "loss": 2.3771, "step": 255570 }, { "epoch": 0.45, "learning_rate": 2.7714959350160614e-05, "loss": 2.3788, "step": 255580 }, { "epoch": 0.45, "learning_rate": 2.7714087410233785e-05, "loss": 2.303, "step": 255590 }, { "epoch": 0.45, "learning_rate": 2.771321547030696e-05, "loss": 2.3653, "step": 255600 }, { "epoch": 0.45, "learning_rate": 2.771234353038013e-05, "loss": 2.3513, "step": 255610 }, { "epoch": 0.45, "learning_rate": 2.7711471590453303e-05, "loss": 2.4204, "step": 255620 }, { "epoch": 0.45, "learning_rate": 2.771059965052648e-05, "loss": 2.3672, "step": 255630 }, { "epoch": 0.45, "learning_rate": 2.7709727710599654e-05, "loss": 2.4254, "step": 255640 }, { "epoch": 0.45, "learning_rate": 2.7708855770672827e-05, "loss": 2.3851, "step": 255650 }, { "epoch": 0.45, "learning_rate": 2.7707983830745998e-05, "loss": 2.4203, "step": 255660 }, { "epoch": 0.45, "learning_rate": 2.770711189081917e-05, "loss": 2.4277, "step": 255670 }, { "epoch": 0.45, "learning_rate": 2.7706239950892342e-05, "loss": 2.3575, "step": 255680 }, { "epoch": 0.45, "learning_rate": 2.7705368010965516e-05, "loss": 2.4017, "step": 255690 }, { "epoch": 0.45, "learning_rate": 2.7704496071038693e-05, "loss": 2.4569, "step": 255700 }, { "epoch": 0.45, "learning_rate": 2.7703624131111867e-05, "loss": 2.392, "step": 255710 }, { "epoch": 0.45, "learning_rate": 2.7702752191185037e-05, "loss": 2.3708, "step": 255720 }, { "epoch": 0.45, "learning_rate": 2.770188025125821e-05, "loss": 2.4555, "step": 255730 }, { "epoch": 0.45, "learning_rate": 2.7701008311331384e-05, "loss": 2.3402, "step": 255740 }, { "epoch": 0.45, "learning_rate": 2.7700136371404555e-05, "loss": 2.3395, "step": 255750 }, { "epoch": 0.45, "learning_rate": 2.769926443147773e-05, "loss": 2.3709, "step": 255760 }, { "epoch": 0.45, "learning_rate": 2.7698392491550902e-05, "loss": 2.3854, "step": 255770 }, { "epoch": 0.45, "learning_rate": 2.769752055162408e-05, "loss": 2.2644, "step": 255780 }, { "epoch": 0.45, "learning_rate": 2.769664861169725e-05, "loss": 2.499, "step": 255790 }, { "epoch": 0.45, "learning_rate": 2.7695776671770424e-05, "loss": 2.3663, "step": 255800 }, { "epoch": 0.45, "learning_rate": 2.7694904731843597e-05, "loss": 2.376, "step": 255810 }, { "epoch": 0.45, "learning_rate": 2.7694032791916768e-05, "loss": 2.4105, "step": 255820 }, { "epoch": 0.45, "learning_rate": 2.769316085198994e-05, "loss": 2.4572, "step": 255830 }, { "epoch": 0.45, "learning_rate": 2.7692288912063112e-05, "loss": 2.3715, "step": 255840 }, { "epoch": 0.45, "learning_rate": 2.7691416972136293e-05, "loss": 2.5044, "step": 255850 }, { "epoch": 0.45, "learning_rate": 2.7690545032209463e-05, "loss": 2.34, "step": 255860 }, { "epoch": 0.45, "learning_rate": 2.7689673092282637e-05, "loss": 2.2933, "step": 255870 }, { "epoch": 0.45, "learning_rate": 2.768880115235581e-05, "loss": 2.3849, "step": 255880 }, { "epoch": 0.45, "learning_rate": 2.768792921242898e-05, "loss": 2.3227, "step": 255890 }, { "epoch": 0.45, "learning_rate": 2.7687057272502155e-05, "loss": 2.3589, "step": 255900 }, { "epoch": 0.45, "learning_rate": 2.7686185332575325e-05, "loss": 2.3998, "step": 255910 }, { "epoch": 0.45, "learning_rate": 2.76853133926485e-05, "loss": 2.4371, "step": 255920 }, { "epoch": 0.45, "learning_rate": 2.7684441452721676e-05, "loss": 2.3606, "step": 255930 }, { "epoch": 0.45, "learning_rate": 2.768356951279485e-05, "loss": 2.3365, "step": 255940 }, { "epoch": 0.45, "learning_rate": 2.768269757286802e-05, "loss": 2.367, "step": 255950 }, { "epoch": 0.45, "learning_rate": 2.7681825632941194e-05, "loss": 2.4008, "step": 255960 }, { "epoch": 0.45, "learning_rate": 2.7680953693014368e-05, "loss": 2.2758, "step": 255970 }, { "epoch": 0.45, "learning_rate": 2.7680081753087538e-05, "loss": 2.3095, "step": 255980 }, { "epoch": 0.45, "learning_rate": 2.7679209813160712e-05, "loss": 2.3736, "step": 255990 }, { "epoch": 0.45, "learning_rate": 2.767833787323389e-05, "loss": 2.3646, "step": 256000 }, { "epoch": 0.89, "learning_rate": 5.354931866614118e-06, "loss": 2.3582, "step": 256010 }, { "epoch": 0.89, "learning_rate": 5.353187986760464e-06, "loss": 2.3675, "step": 256020 }, { "epoch": 0.89, "learning_rate": 5.351444106906811e-06, "loss": 2.4478, "step": 256030 }, { "epoch": 0.89, "learning_rate": 5.349700227053157e-06, "loss": 2.4297, "step": 256040 }, { "epoch": 0.89, "learning_rate": 5.347956347199504e-06, "loss": 2.4002, "step": 256050 }, { "epoch": 0.89, "learning_rate": 5.34621246734585e-06, "loss": 2.3831, "step": 256060 }, { "epoch": 0.89, "learning_rate": 5.344468587492196e-06, "loss": 2.3242, "step": 256070 }, { "epoch": 0.89, "learning_rate": 5.342724707638542e-06, "loss": 2.3855, "step": 256080 }, { "epoch": 0.89, "learning_rate": 5.34098082778489e-06, "loss": 2.3627, "step": 256090 }, { "epoch": 0.89, "learning_rate": 5.339236947931236e-06, "loss": 2.3849, "step": 256100 }, { "epoch": 0.89, "learning_rate": 5.337493068077582e-06, "loss": 2.4403, "step": 256110 }, { "epoch": 0.89, "learning_rate": 5.335749188223928e-06, "loss": 2.4415, "step": 256120 }, { "epoch": 0.89, "learning_rate": 5.334005308370275e-06, "loss": 2.3887, "step": 256130 }, { "epoch": 0.89, "learning_rate": 5.332261428516621e-06, "loss": 2.455, "step": 256140 }, { "epoch": 0.89, "learning_rate": 5.330517548662967e-06, "loss": 2.3745, "step": 256150 }, { "epoch": 0.89, "learning_rate": 5.328773668809314e-06, "loss": 2.4248, "step": 256160 }, { "epoch": 0.89, "learning_rate": 5.327029788955661e-06, "loss": 2.3738, "step": 256170 }, { "epoch": 0.89, "learning_rate": 5.325285909102007e-06, "loss": 2.3599, "step": 256180 }, { "epoch": 0.89, "learning_rate": 5.323542029248353e-06, "loss": 2.3814, "step": 256190 }, { "epoch": 0.89, "learning_rate": 5.321798149394699e-06, "loss": 2.3544, "step": 256200 }, { "epoch": 0.89, "learning_rate": 5.320054269541046e-06, "loss": 2.342, "step": 256210 }, { "epoch": 0.89, "learning_rate": 5.318310389687392e-06, "loss": 2.3765, "step": 256220 }, { "epoch": 0.89, "learning_rate": 5.316566509833739e-06, "loss": 2.4637, "step": 256230 }, { "epoch": 0.89, "learning_rate": 5.314822629980085e-06, "loss": 2.2951, "step": 256240 }, { "epoch": 0.89, "learning_rate": 5.313078750126432e-06, "loss": 2.3562, "step": 256250 }, { "epoch": 0.89, "learning_rate": 5.311334870272778e-06, "loss": 2.3041, "step": 256260 }, { "epoch": 0.89, "learning_rate": 5.309590990419124e-06, "loss": 2.342, "step": 256270 }, { "epoch": 0.89, "learning_rate": 5.30784711056547e-06, "loss": 2.3967, "step": 256280 }, { "epoch": 0.89, "learning_rate": 5.306103230711818e-06, "loss": 2.3413, "step": 256290 }, { "epoch": 0.89, "learning_rate": 5.3043593508581635e-06, "loss": 2.3959, "step": 256300 }, { "epoch": 0.89, "learning_rate": 5.30261547100451e-06, "loss": 2.4433, "step": 256310 }, { "epoch": 0.89, "learning_rate": 5.300871591150856e-06, "loss": 2.3768, "step": 256320 }, { "epoch": 0.89, "learning_rate": 5.299127711297203e-06, "loss": 2.2736, "step": 256330 }, { "epoch": 0.89, "learning_rate": 5.297383831443549e-06, "loss": 2.4386, "step": 256340 }, { "epoch": 0.89, "learning_rate": 5.295639951589895e-06, "loss": 2.3786, "step": 256350 }, { "epoch": 0.89, "learning_rate": 5.293896071736242e-06, "loss": 2.3633, "step": 256360 }, { "epoch": 0.89, "learning_rate": 5.292152191882589e-06, "loss": 2.3843, "step": 256370 }, { "epoch": 0.89, "learning_rate": 5.2904083120289345e-06, "loss": 2.424, "step": 256380 }, { "epoch": 0.89, "learning_rate": 5.288664432175281e-06, "loss": 2.375, "step": 256390 }, { "epoch": 0.89, "learning_rate": 5.286920552321627e-06, "loss": 2.2736, "step": 256400 }, { "epoch": 0.89, "learning_rate": 5.285176672467974e-06, "loss": 2.4225, "step": 256410 }, { "epoch": 0.89, "learning_rate": 5.28343279261432e-06, "loss": 2.3215, "step": 256420 }, { "epoch": 0.89, "learning_rate": 5.281688912760667e-06, "loss": 2.3795, "step": 256430 }, { "epoch": 0.89, "learning_rate": 5.279945032907013e-06, "loss": 2.3795, "step": 256440 }, { "epoch": 0.89, "learning_rate": 5.27820115305336e-06, "loss": 2.338, "step": 256450 }, { "epoch": 0.89, "learning_rate": 5.2764572731997055e-06, "loss": 2.3321, "step": 256460 }, { "epoch": 0.89, "learning_rate": 5.274713393346052e-06, "loss": 2.4215, "step": 256470 }, { "epoch": 0.89, "learning_rate": 5.272969513492398e-06, "loss": 2.4639, "step": 256480 }, { "epoch": 0.89, "learning_rate": 5.271225633638746e-06, "loss": 2.3912, "step": 256490 }, { "epoch": 0.89, "learning_rate": 5.2694817537850914e-06, "loss": 2.3259, "step": 256500 }, { "epoch": 0.89, "learning_rate": 5.267737873931438e-06, "loss": 2.319, "step": 256510 }, { "epoch": 0.89, "learning_rate": 5.265993994077784e-06, "loss": 2.3882, "step": 256520 }, { "epoch": 0.89, "learning_rate": 5.264250114224131e-06, "loss": 2.3908, "step": 256530 }, { "epoch": 0.89, "learning_rate": 5.2625062343704765e-06, "loss": 2.4055, "step": 256540 }, { "epoch": 0.89, "learning_rate": 5.260762354516823e-06, "loss": 2.3113, "step": 256550 }, { "epoch": 0.89, "learning_rate": 5.25901847466317e-06, "loss": 2.3672, "step": 256560 }, { "epoch": 0.89, "learning_rate": 5.257274594809517e-06, "loss": 2.3848, "step": 256570 }, { "epoch": 0.89, "learning_rate": 5.2555307149558624e-06, "loss": 2.4087, "step": 256580 }, { "epoch": 0.89, "learning_rate": 5.253786835102209e-06, "loss": 2.329, "step": 256590 }, { "epoch": 0.89, "learning_rate": 5.252042955248555e-06, "loss": 2.3174, "step": 256600 }, { "epoch": 0.89, "learning_rate": 5.250299075394902e-06, "loss": 2.3467, "step": 256610 }, { "epoch": 0.9, "learning_rate": 5.2485551955412475e-06, "loss": 2.3472, "step": 256620 }, { "epoch": 0.9, "learning_rate": 5.246811315687595e-06, "loss": 2.2868, "step": 256630 }, { "epoch": 0.9, "learning_rate": 5.245067435833941e-06, "loss": 2.3208, "step": 256640 }, { "epoch": 0.9, "learning_rate": 5.243323555980288e-06, "loss": 2.3691, "step": 256650 }, { "epoch": 0.9, "learning_rate": 5.2415796761266334e-06, "loss": 2.4033, "step": 256660 }, { "epoch": 0.9, "learning_rate": 5.23983579627298e-06, "loss": 2.3467, "step": 256670 }, { "epoch": 0.9, "learning_rate": 5.238091916419326e-06, "loss": 2.371, "step": 256680 }, { "epoch": 0.9, "learning_rate": 5.2363480365656735e-06, "loss": 2.3569, "step": 256690 }, { "epoch": 0.9, "learning_rate": 5.234604156712019e-06, "loss": 2.3565, "step": 256700 }, { "epoch": 0.9, "learning_rate": 5.232860276858366e-06, "loss": 2.3014, "step": 256710 }, { "epoch": 0.9, "learning_rate": 5.231116397004712e-06, "loss": 2.3847, "step": 256720 }, { "epoch": 0.9, "learning_rate": 5.229372517151059e-06, "loss": 2.339, "step": 256730 }, { "epoch": 0.9, "learning_rate": 5.2276286372974044e-06, "loss": 2.3468, "step": 256740 }, { "epoch": 0.9, "learning_rate": 5.225884757443751e-06, "loss": 2.3991, "step": 256750 }, { "epoch": 0.9, "learning_rate": 5.224140877590098e-06, "loss": 2.3706, "step": 256760 }, { "epoch": 0.9, "learning_rate": 5.2223969977364445e-06, "loss": 2.3427, "step": 256770 }, { "epoch": 0.9, "learning_rate": 5.22065311788279e-06, "loss": 2.3872, "step": 256780 }, { "epoch": 0.9, "learning_rate": 5.218909238029137e-06, "loss": 2.3275, "step": 256790 }, { "epoch": 0.9, "learning_rate": 5.217165358175483e-06, "loss": 2.3744, "step": 256800 }, { "epoch": 0.9, "learning_rate": 5.21542147832183e-06, "loss": 2.369, "step": 256810 }, { "epoch": 0.9, "learning_rate": 5.2136775984681754e-06, "loss": 2.3179, "step": 256820 }, { "epoch": 0.9, "learning_rate": 5.211933718614523e-06, "loss": 2.362, "step": 256830 }, { "epoch": 0.9, "learning_rate": 5.210189838760869e-06, "loss": 2.3696, "step": 256840 }, { "epoch": 0.9, "learning_rate": 5.2084459589072155e-06, "loss": 2.3714, "step": 256850 }, { "epoch": 0.9, "learning_rate": 5.206702079053561e-06, "loss": 2.3509, "step": 256860 }, { "epoch": 0.9, "learning_rate": 5.204958199199908e-06, "loss": 2.3564, "step": 256870 }, { "epoch": 0.9, "learning_rate": 5.203214319346254e-06, "loss": 2.3223, "step": 256880 }, { "epoch": 0.9, "learning_rate": 5.2014704394926014e-06, "loss": 2.3757, "step": 256890 }, { "epoch": 0.9, "learning_rate": 5.199726559638947e-06, "loss": 2.3983, "step": 256900 }, { "epoch": 0.9, "learning_rate": 5.197982679785294e-06, "loss": 2.367, "step": 256910 }, { "epoch": 0.9, "learning_rate": 5.19623879993164e-06, "loss": 2.3722, "step": 256920 }, { "epoch": 0.9, "learning_rate": 5.1944949200779865e-06, "loss": 2.2908, "step": 256930 }, { "epoch": 0.9, "learning_rate": 5.192751040224332e-06, "loss": 2.4104, "step": 256940 }, { "epoch": 0.9, "learning_rate": 5.191007160370679e-06, "loss": 2.3264, "step": 256950 }, { "epoch": 0.9, "learning_rate": 5.189263280517026e-06, "loss": 2.3562, "step": 256960 }, { "epoch": 0.9, "learning_rate": 5.1875194006633724e-06, "loss": 2.305, "step": 256970 }, { "epoch": 0.9, "learning_rate": 5.185775520809718e-06, "loss": 2.4383, "step": 256980 }, { "epoch": 0.9, "learning_rate": 5.184031640956065e-06, "loss": 2.2791, "step": 256990 }, { "epoch": 0.9, "learning_rate": 5.182287761102411e-06, "loss": 2.4113, "step": 257000 }, { "epoch": 0.9, "learning_rate": 5.1805438812487575e-06, "loss": 2.3209, "step": 257010 }, { "epoch": 0.9, "learning_rate": 5.178800001395104e-06, "loss": 2.427, "step": 257020 }, { "epoch": 0.9, "learning_rate": 5.177056121541451e-06, "loss": 2.4318, "step": 257030 }, { "epoch": 0.9, "learning_rate": 5.175312241687797e-06, "loss": 2.3616, "step": 257040 }, { "epoch": 0.9, "learning_rate": 5.1735683618341434e-06, "loss": 2.3726, "step": 257050 }, { "epoch": 0.9, "learning_rate": 5.171824481980489e-06, "loss": 2.4024, "step": 257060 }, { "epoch": 0.9, "learning_rate": 5.170080602126836e-06, "loss": 2.3935, "step": 257070 }, { "epoch": 0.9, "learning_rate": 5.168336722273182e-06, "loss": 2.3543, "step": 257080 }, { "epoch": 0.9, "learning_rate": 5.166592842419529e-06, "loss": 2.318, "step": 257090 }, { "epoch": 0.9, "learning_rate": 5.164848962565875e-06, "loss": 2.3125, "step": 257100 }, { "epoch": 0.9, "learning_rate": 5.163105082712222e-06, "loss": 2.3714, "step": 257110 }, { "epoch": 0.9, "learning_rate": 5.161361202858568e-06, "loss": 2.3635, "step": 257120 }, { "epoch": 0.9, "learning_rate": 5.1596173230049144e-06, "loss": 2.39, "step": 257130 }, { "epoch": 0.9, "learning_rate": 5.15787344315126e-06, "loss": 2.3963, "step": 257140 }, { "epoch": 0.9, "learning_rate": 5.156129563297607e-06, "loss": 2.3936, "step": 257150 }, { "epoch": 0.9, "learning_rate": 5.154385683443954e-06, "loss": 2.4016, "step": 257160 }, { "epoch": 0.9, "learning_rate": 5.1526418035903e-06, "loss": 2.2812, "step": 257170 }, { "epoch": 0.9, "learning_rate": 5.150897923736646e-06, "loss": 2.3631, "step": 257180 }, { "epoch": 0.9, "learning_rate": 5.149154043882993e-06, "loss": 2.4348, "step": 257190 }, { "epoch": 0.9, "learning_rate": 5.147410164029339e-06, "loss": 2.3934, "step": 257200 }, { "epoch": 0.9, "learning_rate": 5.1456662841756854e-06, "loss": 2.3166, "step": 257210 }, { "epoch": 0.9, "learning_rate": 5.143922404322032e-06, "loss": 2.3631, "step": 257220 }, { "epoch": 0.9, "learning_rate": 5.142178524468379e-06, "loss": 2.4293, "step": 257230 }, { "epoch": 0.9, "learning_rate": 5.140434644614725e-06, "loss": 2.3747, "step": 257240 }, { "epoch": 0.9, "learning_rate": 5.138690764761071e-06, "loss": 2.3977, "step": 257250 }, { "epoch": 0.9, "learning_rate": 5.136946884907417e-06, "loss": 2.2926, "step": 257260 }, { "epoch": 0.9, "learning_rate": 5.135203005053764e-06, "loss": 2.323, "step": 257270 }, { "epoch": 0.9, "learning_rate": 5.133459125200111e-06, "loss": 2.376, "step": 257280 }, { "epoch": 0.9, "learning_rate": 5.131715245346457e-06, "loss": 2.3071, "step": 257290 }, { "epoch": 0.9, "learning_rate": 5.129971365492803e-06, "loss": 2.2773, "step": 257300 }, { "epoch": 0.9, "learning_rate": 5.12822748563915e-06, "loss": 2.3829, "step": 257310 }, { "epoch": 0.9, "learning_rate": 5.126483605785496e-06, "loss": 2.41, "step": 257320 }, { "epoch": 0.9, "learning_rate": 5.124739725931842e-06, "loss": 2.3027, "step": 257330 }, { "epoch": 0.9, "learning_rate": 5.122995846078188e-06, "loss": 2.2588, "step": 257340 }, { "epoch": 0.9, "learning_rate": 5.121251966224535e-06, "loss": 2.2358, "step": 257350 }, { "epoch": 0.9, "learning_rate": 5.119508086370882e-06, "loss": 2.3593, "step": 257360 }, { "epoch": 0.9, "learning_rate": 5.117764206517228e-06, "loss": 2.3454, "step": 257370 }, { "epoch": 0.9, "learning_rate": 5.116020326663574e-06, "loss": 2.3462, "step": 257380 }, { "epoch": 0.9, "learning_rate": 5.114276446809921e-06, "loss": 2.4014, "step": 257390 }, { "epoch": 0.9, "learning_rate": 5.112532566956267e-06, "loss": 2.2754, "step": 257400 }, { "epoch": 0.9, "learning_rate": 5.110788687102613e-06, "loss": 2.3404, "step": 257410 }, { "epoch": 0.9, "learning_rate": 5.10904480724896e-06, "loss": 2.3427, "step": 257420 }, { "epoch": 0.9, "learning_rate": 5.107300927395307e-06, "loss": 2.3379, "step": 257430 }, { "epoch": 0.9, "learning_rate": 5.105557047541653e-06, "loss": 2.3091, "step": 257440 }, { "epoch": 0.9, "learning_rate": 5.103813167687999e-06, "loss": 2.3933, "step": 257450 }, { "epoch": 0.9, "learning_rate": 5.102069287834345e-06, "loss": 2.3192, "step": 257460 }, { "epoch": 0.9, "learning_rate": 5.100325407980692e-06, "loss": 2.4396, "step": 257470 }, { "epoch": 0.9, "learning_rate": 5.0985815281270385e-06, "loss": 2.3595, "step": 257480 }, { "epoch": 0.9, "learning_rate": 5.096837648273385e-06, "loss": 2.3795, "step": 257490 }, { "epoch": 0.9, "learning_rate": 5.095093768419731e-06, "loss": 2.393, "step": 257500 }, { "epoch": 0.9, "learning_rate": 5.093349888566078e-06, "loss": 2.4275, "step": 257510 }, { "epoch": 0.9, "learning_rate": 5.091606008712424e-06, "loss": 2.4011, "step": 257520 }, { "epoch": 0.9, "learning_rate": 5.08986212885877e-06, "loss": 2.3176, "step": 257530 }, { "epoch": 0.9, "learning_rate": 5.088118249005117e-06, "loss": 2.4229, "step": 257540 }, { "epoch": 0.9, "learning_rate": 5.086374369151463e-06, "loss": 2.2913, "step": 257550 }, { "epoch": 0.9, "learning_rate": 5.0846304892978095e-06, "loss": 2.3762, "step": 257560 }, { "epoch": 0.9, "learning_rate": 5.082886609444156e-06, "loss": 2.3367, "step": 257570 }, { "epoch": 0.9, "learning_rate": 5.081142729590502e-06, "loss": 2.3427, "step": 257580 }, { "epoch": 0.9, "learning_rate": 5.079398849736849e-06, "loss": 2.4109, "step": 257590 }, { "epoch": 0.9, "learning_rate": 5.0776549698831955e-06, "loss": 2.3766, "step": 257600 }, { "epoch": 0.9, "learning_rate": 5.075911090029541e-06, "loss": 2.3605, "step": 257610 }, { "epoch": 0.9, "learning_rate": 5.074167210175888e-06, "loss": 2.2901, "step": 257620 }, { "epoch": 0.9, "learning_rate": 5.072423330322235e-06, "loss": 2.2964, "step": 257630 }, { "epoch": 0.9, "learning_rate": 5.0706794504685805e-06, "loss": 2.3229, "step": 257640 }, { "epoch": 0.9, "learning_rate": 5.068935570614927e-06, "loss": 2.3524, "step": 257650 }, { "epoch": 0.9, "learning_rate": 5.067191690761273e-06, "loss": 2.3766, "step": 257660 }, { "epoch": 0.9, "learning_rate": 5.06544781090762e-06, "loss": 2.3261, "step": 257670 }, { "epoch": 0.9, "learning_rate": 5.0637039310539665e-06, "loss": 2.3511, "step": 257680 }, { "epoch": 0.9, "learning_rate": 5.061960051200313e-06, "loss": 2.4216, "step": 257690 }, { "epoch": 0.9, "learning_rate": 5.060216171346659e-06, "loss": 2.4148, "step": 257700 }, { "epoch": 0.9, "learning_rate": 5.058472291493006e-06, "loss": 2.321, "step": 257710 }, { "epoch": 0.9, "learning_rate": 5.0567284116393515e-06, "loss": 2.3601, "step": 257720 }, { "epoch": 0.9, "learning_rate": 5.054984531785698e-06, "loss": 2.3226, "step": 257730 }, { "epoch": 0.9, "learning_rate": 5.053240651932045e-06, "loss": 2.4482, "step": 257740 }, { "epoch": 0.9, "learning_rate": 5.051496772078391e-06, "loss": 2.4066, "step": 257750 }, { "epoch": 0.9, "learning_rate": 5.0497528922247375e-06, "loss": 2.4, "step": 257760 }, { "epoch": 0.9, "learning_rate": 5.048009012371084e-06, "loss": 2.4275, "step": 257770 }, { "epoch": 0.9, "learning_rate": 5.04626513251743e-06, "loss": 2.2931, "step": 257780 }, { "epoch": 0.9, "learning_rate": 5.044521252663777e-06, "loss": 2.2831, "step": 257790 }, { "epoch": 0.9, "learning_rate": 5.042777372810123e-06, "loss": 2.3071, "step": 257800 }, { "epoch": 0.9, "learning_rate": 5.041033492956469e-06, "loss": 2.3743, "step": 257810 }, { "epoch": 0.9, "learning_rate": 5.039289613102816e-06, "loss": 2.3105, "step": 257820 }, { "epoch": 0.9, "learning_rate": 5.037545733249163e-06, "loss": 2.381, "step": 257830 }, { "epoch": 0.9, "learning_rate": 5.0358018533955085e-06, "loss": 2.306, "step": 257840 }, { "epoch": 0.9, "learning_rate": 5.034057973541855e-06, "loss": 2.4386, "step": 257850 }, { "epoch": 0.9, "learning_rate": 5.032314093688202e-06, "loss": 2.2909, "step": 257860 }, { "epoch": 0.9, "learning_rate": 5.030570213834548e-06, "loss": 2.3403, "step": 257870 }, { "epoch": 0.9, "learning_rate": 5.028826333980894e-06, "loss": 2.4475, "step": 257880 }, { "epoch": 0.9, "learning_rate": 5.027082454127241e-06, "loss": 2.3357, "step": 257890 }, { "epoch": 0.9, "learning_rate": 5.025338574273587e-06, "loss": 2.4035, "step": 257900 }, { "epoch": 0.9, "learning_rate": 5.023594694419934e-06, "loss": 2.4184, "step": 257910 }, { "epoch": 0.9, "learning_rate": 5.0218508145662795e-06, "loss": 2.3988, "step": 257920 }, { "epoch": 0.9, "learning_rate": 5.020106934712626e-06, "loss": 2.3095, "step": 257930 }, { "epoch": 0.9, "learning_rate": 5.018363054858973e-06, "loss": 2.3571, "step": 257940 }, { "epoch": 0.9, "learning_rate": 5.016619175005319e-06, "loss": 2.2416, "step": 257950 }, { "epoch": 0.9, "learning_rate": 5.014875295151665e-06, "loss": 2.371, "step": 257960 }, { "epoch": 0.9, "learning_rate": 5.013131415298012e-06, "loss": 2.3062, "step": 257970 }, { "epoch": 0.9, "learning_rate": 5.011387535444358e-06, "loss": 2.383, "step": 257980 }, { "epoch": 0.9, "learning_rate": 5.009643655590705e-06, "loss": 2.3184, "step": 257990 }, { "epoch": 0.9, "learning_rate": 5.007899775737051e-06, "loss": 2.4382, "step": 258000 }, { "epoch": 0.9, "learning_rate": 5.006155895883397e-06, "loss": 2.37, "step": 258010 }, { "epoch": 0.9, "learning_rate": 5.004412016029744e-06, "loss": 2.3484, "step": 258020 }, { "epoch": 0.9, "learning_rate": 5.0026681361760905e-06, "loss": 2.3196, "step": 258030 }, { "epoch": 0.9, "learning_rate": 5.000924256322436e-06, "loss": 2.2903, "step": 258040 }, { "epoch": 0.9, "learning_rate": 4.999180376468783e-06, "loss": 2.4194, "step": 258050 }, { "epoch": 0.9, "learning_rate": 4.99743649661513e-06, "loss": 2.3215, "step": 258060 }, { "epoch": 0.9, "learning_rate": 4.995692616761476e-06, "loss": 2.3148, "step": 258070 }, { "epoch": 0.9, "learning_rate": 4.993948736907822e-06, "loss": 2.4586, "step": 258080 }, { "epoch": 0.9, "learning_rate": 4.992204857054169e-06, "loss": 2.3239, "step": 258090 }, { "epoch": 0.9, "learning_rate": 4.990460977200515e-06, "loss": 2.3785, "step": 258100 }, { "epoch": 0.9, "learning_rate": 4.9887170973468615e-06, "loss": 2.3849, "step": 258110 }, { "epoch": 0.9, "learning_rate": 4.986973217493208e-06, "loss": 2.31, "step": 258120 }, { "epoch": 0.9, "learning_rate": 4.985229337639554e-06, "loss": 2.3325, "step": 258130 }, { "epoch": 0.9, "learning_rate": 4.983485457785901e-06, "loss": 2.3265, "step": 258140 }, { "epoch": 0.9, "learning_rate": 4.981741577932247e-06, "loss": 2.3174, "step": 258150 }, { "epoch": 0.9, "learning_rate": 4.979997698078593e-06, "loss": 2.3649, "step": 258160 }, { "epoch": 0.9, "learning_rate": 4.97825381822494e-06, "loss": 2.3315, "step": 258170 }, { "epoch": 0.9, "learning_rate": 4.976509938371286e-06, "loss": 2.3052, "step": 258180 }, { "epoch": 0.9, "learning_rate": 4.9747660585176325e-06, "loss": 2.2661, "step": 258190 }, { "epoch": 0.9, "learning_rate": 4.973022178663979e-06, "loss": 2.4095, "step": 258200 }, { "epoch": 0.9, "learning_rate": 4.971278298810325e-06, "loss": 2.3187, "step": 258210 }, { "epoch": 0.9, "learning_rate": 4.969534418956672e-06, "loss": 2.3892, "step": 258220 }, { "epoch": 0.9, "learning_rate": 4.9677905391030185e-06, "loss": 2.3149, "step": 258230 }, { "epoch": 0.9, "learning_rate": 4.966046659249364e-06, "loss": 2.3179, "step": 258240 }, { "epoch": 0.9, "learning_rate": 4.964302779395711e-06, "loss": 2.2662, "step": 258250 }, { "epoch": 0.9, "learning_rate": 4.962558899542058e-06, "loss": 2.3628, "step": 258260 }, { "epoch": 0.9, "learning_rate": 4.9608150196884035e-06, "loss": 2.3899, "step": 258270 }, { "epoch": 0.9, "learning_rate": 4.95907113983475e-06, "loss": 2.3703, "step": 258280 }, { "epoch": 0.9, "learning_rate": 4.957327259981097e-06, "loss": 2.3522, "step": 258290 }, { "epoch": 0.9, "learning_rate": 4.955583380127443e-06, "loss": 2.3157, "step": 258300 }, { "epoch": 0.9, "learning_rate": 4.9538395002737895e-06, "loss": 2.3566, "step": 258310 }, { "epoch": 0.9, "learning_rate": 4.952095620420136e-06, "loss": 2.3547, "step": 258320 }, { "epoch": 0.9, "learning_rate": 4.950351740566482e-06, "loss": 2.343, "step": 258330 }, { "epoch": 0.9, "learning_rate": 4.948607860712829e-06, "loss": 2.4028, "step": 258340 }, { "epoch": 0.9, "learning_rate": 4.9468639808591745e-06, "loss": 2.388, "step": 258350 }, { "epoch": 0.9, "learning_rate": 4.945120101005521e-06, "loss": 2.3604, "step": 258360 }, { "epoch": 0.9, "learning_rate": 4.943376221151868e-06, "loss": 2.3053, "step": 258370 }, { "epoch": 0.9, "learning_rate": 4.941632341298215e-06, "loss": 2.3987, "step": 258380 }, { "epoch": 0.9, "learning_rate": 4.9398884614445605e-06, "loss": 2.2759, "step": 258390 }, { "epoch": 0.9, "learning_rate": 4.938144581590907e-06, "loss": 2.3716, "step": 258400 }, { "epoch": 0.9, "learning_rate": 4.936400701737253e-06, "loss": 2.3781, "step": 258410 }, { "epoch": 0.9, "learning_rate": 4.9346568218836e-06, "loss": 2.3589, "step": 258420 }, { "epoch": 0.9, "learning_rate": 4.932912942029946e-06, "loss": 2.3636, "step": 258430 }, { "epoch": 0.9, "learning_rate": 4.931169062176292e-06, "loss": 2.3523, "step": 258440 }, { "epoch": 0.9, "learning_rate": 4.929425182322639e-06, "loss": 2.3438, "step": 258450 }, { "epoch": 0.9, "learning_rate": 4.927681302468986e-06, "loss": 2.3194, "step": 258460 }, { "epoch": 0.9, "learning_rate": 4.9259374226153315e-06, "loss": 2.4383, "step": 258470 }, { "epoch": 0.9, "learning_rate": 4.924193542761678e-06, "loss": 2.2923, "step": 258480 }, { "epoch": 0.9, "learning_rate": 4.922449662908025e-06, "loss": 2.3405, "step": 258490 }, { "epoch": 0.9, "learning_rate": 4.920705783054371e-06, "loss": 2.2166, "step": 258500 }, { "epoch": 0.9, "learning_rate": 4.918961903200717e-06, "loss": 2.4169, "step": 258510 }, { "epoch": 0.9, "learning_rate": 4.917218023347064e-06, "loss": 2.3162, "step": 258520 }, { "epoch": 0.9, "learning_rate": 4.91547414349341e-06, "loss": 2.2827, "step": 258530 }, { "epoch": 0.9, "learning_rate": 4.913730263639757e-06, "loss": 2.3291, "step": 258540 }, { "epoch": 0.9, "learning_rate": 4.9119863837861025e-06, "loss": 2.4561, "step": 258550 }, { "epoch": 0.9, "learning_rate": 4.910242503932449e-06, "loss": 2.3809, "step": 258560 }, { "epoch": 0.9, "learning_rate": 4.908498624078796e-06, "loss": 2.2839, "step": 258570 }, { "epoch": 0.9, "learning_rate": 4.9067547442251425e-06, "loss": 2.2899, "step": 258580 }, { "epoch": 0.9, "learning_rate": 4.905010864371488e-06, "loss": 2.3067, "step": 258590 }, { "epoch": 0.9, "learning_rate": 4.903266984517835e-06, "loss": 2.3839, "step": 258600 }, { "epoch": 0.9, "learning_rate": 4.901523104664181e-06, "loss": 2.3496, "step": 258610 }, { "epoch": 0.9, "learning_rate": 4.899779224810528e-06, "loss": 2.364, "step": 258620 }, { "epoch": 0.9, "learning_rate": 4.898035344956874e-06, "loss": 2.4226, "step": 258630 }, { "epoch": 0.9, "learning_rate": 4.896291465103221e-06, "loss": 2.3899, "step": 258640 }, { "epoch": 0.9, "learning_rate": 4.894547585249567e-06, "loss": 2.476, "step": 258650 }, { "epoch": 0.9, "learning_rate": 4.8928037053959135e-06, "loss": 2.3479, "step": 258660 }, { "epoch": 0.9, "learning_rate": 4.891059825542259e-06, "loss": 2.3859, "step": 258670 }, { "epoch": 0.9, "learning_rate": 4.889315945688606e-06, "loss": 2.4304, "step": 258680 }, { "epoch": 0.9, "learning_rate": 4.887572065834953e-06, "loss": 2.4256, "step": 258690 }, { "epoch": 0.9, "learning_rate": 4.885828185981299e-06, "loss": 2.4201, "step": 258700 }, { "epoch": 0.9, "learning_rate": 4.884084306127645e-06, "loss": 2.3957, "step": 258710 }, { "epoch": 0.9, "learning_rate": 4.882340426273992e-06, "loss": 2.3624, "step": 258720 }, { "epoch": 0.9, "learning_rate": 4.880596546420338e-06, "loss": 2.439, "step": 258730 }, { "epoch": 0.9, "learning_rate": 4.8788526665666845e-06, "loss": 2.3351, "step": 258740 }, { "epoch": 0.9, "learning_rate": 4.87710878671303e-06, "loss": 2.2996, "step": 258750 }, { "epoch": 0.9, "learning_rate": 4.875364906859377e-06, "loss": 2.3144, "step": 258760 }, { "epoch": 0.9, "learning_rate": 4.873621027005724e-06, "loss": 2.3907, "step": 258770 }, { "epoch": 0.9, "learning_rate": 4.8718771471520705e-06, "loss": 2.3612, "step": 258780 }, { "epoch": 0.9, "learning_rate": 4.870133267298416e-06, "loss": 2.3395, "step": 258790 }, { "epoch": 0.9, "learning_rate": 4.868389387444763e-06, "loss": 2.477, "step": 258800 }, { "epoch": 0.9, "learning_rate": 4.866645507591109e-06, "loss": 2.318, "step": 258810 }, { "epoch": 0.9, "learning_rate": 4.8649016277374555e-06, "loss": 2.3336, "step": 258820 }, { "epoch": 0.9, "learning_rate": 4.863157747883802e-06, "loss": 2.4125, "step": 258830 }, { "epoch": 0.9, "learning_rate": 4.861413868030149e-06, "loss": 2.3609, "step": 258840 }, { "epoch": 0.9, "learning_rate": 4.859669988176495e-06, "loss": 2.1989, "step": 258850 }, { "epoch": 0.9, "learning_rate": 4.8579261083228415e-06, "loss": 2.3615, "step": 258860 }, { "epoch": 0.9, "learning_rate": 4.856182228469187e-06, "loss": 2.3676, "step": 258870 }, { "epoch": 0.9, "learning_rate": 4.854438348615534e-06, "loss": 2.3706, "step": 258880 }, { "epoch": 0.9, "learning_rate": 4.852694468761881e-06, "loss": 2.3481, "step": 258890 }, { "epoch": 0.9, "learning_rate": 4.850950588908227e-06, "loss": 2.3869, "step": 258900 }, { "epoch": 0.9, "learning_rate": 4.849206709054573e-06, "loss": 2.2858, "step": 258910 }, { "epoch": 0.9, "learning_rate": 4.84746282920092e-06, "loss": 2.3335, "step": 258920 }, { "epoch": 0.9, "learning_rate": 4.845718949347266e-06, "loss": 2.2927, "step": 258930 }, { "epoch": 0.9, "learning_rate": 4.8439750694936125e-06, "loss": 2.3189, "step": 258940 }, { "epoch": 0.9, "learning_rate": 4.842231189639959e-06, "loss": 2.4216, "step": 258950 }, { "epoch": 0.9, "learning_rate": 4.840487309786305e-06, "loss": 2.3337, "step": 258960 }, { "epoch": 0.9, "learning_rate": 4.838743429932652e-06, "loss": 2.3331, "step": 258970 }, { "epoch": 0.9, "learning_rate": 4.836999550078998e-06, "loss": 2.3653, "step": 258980 }, { "epoch": 0.9, "learning_rate": 4.835255670225344e-06, "loss": 2.3374, "step": 258990 }, { "epoch": 0.9, "learning_rate": 4.833511790371691e-06, "loss": 2.3544, "step": 259000 }, { "epoch": 0.9, "learning_rate": 4.831767910518037e-06, "loss": 2.366, "step": 259010 }, { "epoch": 0.9, "learning_rate": 4.8300240306643835e-06, "loss": 2.2731, "step": 259020 }, { "epoch": 0.9, "learning_rate": 4.82828015081073e-06, "loss": 2.3712, "step": 259030 }, { "epoch": 0.9, "learning_rate": 4.826536270957077e-06, "loss": 2.3226, "step": 259040 }, { "epoch": 0.9, "learning_rate": 4.824792391103423e-06, "loss": 2.4115, "step": 259050 }, { "epoch": 0.9, "learning_rate": 4.823048511249769e-06, "loss": 2.2428, "step": 259060 }, { "epoch": 0.9, "learning_rate": 4.821304631396115e-06, "loss": 2.3345, "step": 259070 }, { "epoch": 0.9, "learning_rate": 4.819560751542462e-06, "loss": 2.3343, "step": 259080 }, { "epoch": 0.9, "learning_rate": 4.817816871688809e-06, "loss": 2.3191, "step": 259090 }, { "epoch": 0.9, "learning_rate": 4.816072991835155e-06, "loss": 2.4026, "step": 259100 }, { "epoch": 0.9, "learning_rate": 4.814329111981501e-06, "loss": 2.3822, "step": 259110 }, { "epoch": 0.9, "learning_rate": 4.812585232127848e-06, "loss": 2.3576, "step": 259120 }, { "epoch": 0.9, "learning_rate": 4.810841352274194e-06, "loss": 2.4168, "step": 259130 }, { "epoch": 0.9, "learning_rate": 4.80909747242054e-06, "loss": 2.4301, "step": 259140 }, { "epoch": 0.9, "learning_rate": 4.807353592566887e-06, "loss": 2.3942, "step": 259150 }, { "epoch": 0.9, "learning_rate": 4.805609712713234e-06, "loss": 2.3377, "step": 259160 }, { "epoch": 0.9, "learning_rate": 4.80386583285958e-06, "loss": 2.3486, "step": 259170 }, { "epoch": 0.9, "learning_rate": 4.802121953005926e-06, "loss": 2.3803, "step": 259180 }, { "epoch": 0.9, "learning_rate": 4.800378073152272e-06, "loss": 2.2363, "step": 259190 }, { "epoch": 0.9, "learning_rate": 4.798634193298619e-06, "loss": 2.3449, "step": 259200 }, { "epoch": 0.9, "learning_rate": 4.796890313444965e-06, "loss": 2.3832, "step": 259210 }, { "epoch": 0.9, "learning_rate": 4.795146433591312e-06, "loss": 2.3288, "step": 259220 }, { "epoch": 0.9, "learning_rate": 4.793402553737658e-06, "loss": 2.3178, "step": 259230 }, { "epoch": 0.9, "learning_rate": 4.791658673884005e-06, "loss": 2.3917, "step": 259240 }, { "epoch": 0.9, "learning_rate": 4.789914794030351e-06, "loss": 2.2798, "step": 259250 }, { "epoch": 0.9, "learning_rate": 4.788170914176697e-06, "loss": 2.38, "step": 259260 }, { "epoch": 0.9, "learning_rate": 4.786427034323043e-06, "loss": 2.2874, "step": 259270 }, { "epoch": 0.9, "learning_rate": 4.78468315446939e-06, "loss": 2.3397, "step": 259280 }, { "epoch": 0.9, "learning_rate": 4.7829392746157366e-06, "loss": 2.3002, "step": 259290 }, { "epoch": 0.9, "learning_rate": 4.781195394762083e-06, "loss": 2.3662, "step": 259300 }, { "epoch": 0.9, "learning_rate": 4.779451514908429e-06, "loss": 2.3571, "step": 259310 }, { "epoch": 0.9, "learning_rate": 4.777707635054776e-06, "loss": 2.3193, "step": 259320 }, { "epoch": 0.9, "learning_rate": 4.775963755201122e-06, "loss": 2.3084, "step": 259330 }, { "epoch": 0.9, "learning_rate": 4.774219875347468e-06, "loss": 2.3055, "step": 259340 }, { "epoch": 0.9, "learning_rate": 4.772475995493815e-06, "loss": 2.3862, "step": 259350 }, { "epoch": 0.9, "learning_rate": 4.770732115640162e-06, "loss": 2.2909, "step": 259360 }, { "epoch": 0.9, "learning_rate": 4.7689882357865076e-06, "loss": 2.3637, "step": 259370 }, { "epoch": 0.9, "learning_rate": 4.767244355932854e-06, "loss": 2.3273, "step": 259380 }, { "epoch": 0.9, "learning_rate": 4.7655004760792e-06, "loss": 2.3745, "step": 259390 }, { "epoch": 0.9, "learning_rate": 4.763756596225547e-06, "loss": 2.344, "step": 259400 }, { "epoch": 0.9, "learning_rate": 4.762012716371893e-06, "loss": 2.3231, "step": 259410 }, { "epoch": 0.9, "learning_rate": 4.76026883651824e-06, "loss": 2.3984, "step": 259420 }, { "epoch": 0.9, "learning_rate": 4.758524956664586e-06, "loss": 2.387, "step": 259430 }, { "epoch": 0.9, "learning_rate": 4.756781076810933e-06, "loss": 2.302, "step": 259440 }, { "epoch": 0.9, "learning_rate": 4.7550371969572786e-06, "loss": 2.2626, "step": 259450 }, { "epoch": 0.9, "learning_rate": 4.753293317103625e-06, "loss": 2.3355, "step": 259460 }, { "epoch": 0.9, "learning_rate": 4.751549437249971e-06, "loss": 2.2764, "step": 259470 }, { "epoch": 0.91, "learning_rate": 4.749805557396318e-06, "loss": 2.3473, "step": 259480 }, { "epoch": 0.91, "learning_rate": 4.7480616775426645e-06, "loss": 2.2861, "step": 259490 }, { "epoch": 0.91, "learning_rate": 4.746317797689011e-06, "loss": 2.3256, "step": 259500 }, { "epoch": 0.91, "learning_rate": 4.744573917835357e-06, "loss": 2.3243, "step": 259510 }, { "epoch": 0.91, "learning_rate": 4.742830037981704e-06, "loss": 2.3573, "step": 259520 }, { "epoch": 0.91, "learning_rate": 4.7410861581280496e-06, "loss": 2.347, "step": 259530 }, { "epoch": 0.91, "learning_rate": 4.739342278274396e-06, "loss": 2.3069, "step": 259540 }, { "epoch": 0.91, "learning_rate": 4.737598398420743e-06, "loss": 2.3542, "step": 259550 }, { "epoch": 0.91, "learning_rate": 4.73585451856709e-06, "loss": 2.3488, "step": 259560 }, { "epoch": 0.91, "learning_rate": 4.7341106387134355e-06, "loss": 2.3554, "step": 259570 }, { "epoch": 0.91, "learning_rate": 4.732366758859782e-06, "loss": 2.4161, "step": 259580 }, { "epoch": 0.91, "learning_rate": 4.730622879006128e-06, "loss": 2.2804, "step": 259590 }, { "epoch": 0.91, "learning_rate": 4.728878999152475e-06, "loss": 2.2962, "step": 259600 }, { "epoch": 0.91, "learning_rate": 4.7271351192988206e-06, "loss": 2.2666, "step": 259610 }, { "epoch": 0.91, "learning_rate": 4.725391239445168e-06, "loss": 2.4088, "step": 259620 }, { "epoch": 0.91, "learning_rate": 4.723647359591514e-06, "loss": 2.3121, "step": 259630 }, { "epoch": 0.91, "learning_rate": 4.721903479737861e-06, "loss": 2.3308, "step": 259640 }, { "epoch": 0.91, "learning_rate": 4.7201595998842065e-06, "loss": 2.4001, "step": 259650 }, { "epoch": 0.91, "learning_rate": 4.718415720030553e-06, "loss": 2.3412, "step": 259660 }, { "epoch": 0.91, "learning_rate": 4.716671840176899e-06, "loss": 2.3498, "step": 259670 }, { "epoch": 0.91, "learning_rate": 4.714927960323246e-06, "loss": 2.3205, "step": 259680 }, { "epoch": 0.91, "learning_rate": 4.713184080469592e-06, "loss": 2.2944, "step": 259690 }, { "epoch": 0.91, "learning_rate": 4.711440200615939e-06, "loss": 2.3969, "step": 259700 }, { "epoch": 0.91, "learning_rate": 4.709696320762285e-06, "loss": 2.3272, "step": 259710 }, { "epoch": 0.91, "learning_rate": 4.707952440908632e-06, "loss": 2.3603, "step": 259720 }, { "epoch": 0.91, "learning_rate": 4.7062085610549775e-06, "loss": 2.3677, "step": 259730 }, { "epoch": 0.91, "learning_rate": 4.704464681201324e-06, "loss": 2.3242, "step": 259740 }, { "epoch": 0.91, "learning_rate": 4.702720801347671e-06, "loss": 2.2827, "step": 259750 }, { "epoch": 0.91, "learning_rate": 4.7009769214940176e-06, "loss": 2.3236, "step": 259760 }, { "epoch": 0.91, "learning_rate": 4.699233041640363e-06, "loss": 2.3765, "step": 259770 }, { "epoch": 0.91, "learning_rate": 4.69748916178671e-06, "loss": 2.3749, "step": 259780 }, { "epoch": 0.91, "learning_rate": 4.695745281933056e-06, "loss": 2.3496, "step": 259790 }, { "epoch": 0.91, "learning_rate": 4.694001402079403e-06, "loss": 2.3346, "step": 259800 }, { "epoch": 0.91, "learning_rate": 4.6922575222257485e-06, "loss": 2.3113, "step": 259810 }, { "epoch": 0.91, "learning_rate": 4.690513642372096e-06, "loss": 2.3166, "step": 259820 }, { "epoch": 0.91, "learning_rate": 4.688769762518442e-06, "loss": 2.328, "step": 259830 }, { "epoch": 0.91, "learning_rate": 4.6870258826647886e-06, "loss": 2.3098, "step": 259840 }, { "epoch": 0.91, "learning_rate": 4.685282002811134e-06, "loss": 2.3288, "step": 259850 }, { "epoch": 0.91, "learning_rate": 4.683538122957481e-06, "loss": 2.3503, "step": 259860 }, { "epoch": 0.91, "learning_rate": 4.681794243103827e-06, "loss": 2.3199, "step": 259870 }, { "epoch": 0.91, "learning_rate": 4.680050363250174e-06, "loss": 2.2534, "step": 259880 }, { "epoch": 0.91, "learning_rate": 4.67830648339652e-06, "loss": 2.3125, "step": 259890 }, { "epoch": 0.91, "learning_rate": 4.676562603542867e-06, "loss": 2.3054, "step": 259900 }, { "epoch": 0.91, "learning_rate": 4.674818723689213e-06, "loss": 2.3888, "step": 259910 }, { "epoch": 0.91, "learning_rate": 4.6730748438355596e-06, "loss": 2.304, "step": 259920 }, { "epoch": 0.91, "learning_rate": 4.671330963981905e-06, "loss": 2.3118, "step": 259930 }, { "epoch": 0.91, "learning_rate": 4.669587084128252e-06, "loss": 2.3723, "step": 259940 }, { "epoch": 0.91, "learning_rate": 4.667843204274599e-06, "loss": 2.3158, "step": 259950 }, { "epoch": 0.91, "learning_rate": 4.6660993244209455e-06, "loss": 2.4279, "step": 259960 }, { "epoch": 0.91, "learning_rate": 4.664355444567291e-06, "loss": 2.3485, "step": 259970 }, { "epoch": 0.91, "learning_rate": 4.662611564713638e-06, "loss": 2.3773, "step": 259980 }, { "epoch": 0.91, "learning_rate": 4.660867684859984e-06, "loss": 2.3709, "step": 259990 }, { "epoch": 0.91, "learning_rate": 4.6591238050063306e-06, "loss": 2.3385, "step": 260000 }, { "epoch": 0.91, "learning_rate": 4.657379925152676e-06, "loss": 2.3604, "step": 260010 }, { "epoch": 0.91, "learning_rate": 4.655636045299024e-06, "loss": 2.3301, "step": 260020 }, { "epoch": 0.91, "learning_rate": 4.65389216544537e-06, "loss": 2.4516, "step": 260030 }, { "epoch": 0.91, "learning_rate": 4.6521482855917165e-06, "loss": 2.2742, "step": 260040 }, { "epoch": 0.91, "learning_rate": 4.650404405738062e-06, "loss": 2.3722, "step": 260050 }, { "epoch": 0.91, "learning_rate": 4.648660525884409e-06, "loss": 2.2697, "step": 260060 }, { "epoch": 0.91, "learning_rate": 4.646916646030755e-06, "loss": 2.2789, "step": 260070 }, { "epoch": 0.91, "learning_rate": 4.6451727661771016e-06, "loss": 2.4295, "step": 260080 }, { "epoch": 0.91, "learning_rate": 4.643428886323448e-06, "loss": 2.3495, "step": 260090 }, { "epoch": 0.91, "learning_rate": 4.641685006469795e-06, "loss": 2.3177, "step": 260100 }, { "epoch": 0.91, "learning_rate": 4.639941126616141e-06, "loss": 2.3613, "step": 260110 }, { "epoch": 0.91, "learning_rate": 4.6381972467624875e-06, "loss": 2.32, "step": 260120 }, { "epoch": 0.91, "learning_rate": 4.636453366908833e-06, "loss": 2.3605, "step": 260130 }, { "epoch": 0.91, "learning_rate": 4.63470948705518e-06, "loss": 2.3197, "step": 260140 }, { "epoch": 0.91, "learning_rate": 4.632965607201527e-06, "loss": 2.3776, "step": 260150 }, { "epoch": 0.91, "learning_rate": 4.631221727347873e-06, "loss": 2.2885, "step": 260160 }, { "epoch": 0.91, "learning_rate": 4.629477847494219e-06, "loss": 2.3737, "step": 260170 }, { "epoch": 0.91, "learning_rate": 4.627733967640566e-06, "loss": 2.3868, "step": 260180 }, { "epoch": 0.91, "learning_rate": 4.625990087786912e-06, "loss": 2.379, "step": 260190 }, { "epoch": 0.91, "learning_rate": 4.6242462079332585e-06, "loss": 2.3408, "step": 260200 }, { "epoch": 0.91, "learning_rate": 4.622502328079604e-06, "loss": 2.4198, "step": 260210 }, { "epoch": 0.91, "learning_rate": 4.620758448225952e-06, "loss": 2.3695, "step": 260220 }, { "epoch": 0.91, "learning_rate": 4.619014568372298e-06, "loss": 2.3107, "step": 260230 }, { "epoch": 0.91, "learning_rate": 4.617270688518644e-06, "loss": 2.3492, "step": 260240 }, { "epoch": 0.91, "learning_rate": 4.61552680866499e-06, "loss": 2.3099, "step": 260250 }, { "epoch": 0.91, "learning_rate": 4.613782928811337e-06, "loss": 2.2823, "step": 260260 }, { "epoch": 0.91, "learning_rate": 4.612039048957683e-06, "loss": 2.3248, "step": 260270 }, { "epoch": 0.91, "learning_rate": 4.61029516910403e-06, "loss": 2.2684, "step": 260280 }, { "epoch": 0.91, "learning_rate": 4.608551289250376e-06, "loss": 2.2762, "step": 260290 }, { "epoch": 0.91, "learning_rate": 4.606807409396723e-06, "loss": 2.4043, "step": 260300 }, { "epoch": 0.91, "learning_rate": 4.605063529543069e-06, "loss": 2.3057, "step": 260310 }, { "epoch": 0.91, "learning_rate": 4.603319649689415e-06, "loss": 2.3005, "step": 260320 }, { "epoch": 0.91, "learning_rate": 4.601575769835761e-06, "loss": 2.4019, "step": 260330 }, { "epoch": 0.91, "learning_rate": 4.599831889982108e-06, "loss": 2.3825, "step": 260340 }, { "epoch": 0.91, "learning_rate": 4.598088010128455e-06, "loss": 2.3293, "step": 260350 }, { "epoch": 0.91, "learning_rate": 4.596344130274801e-06, "loss": 2.3561, "step": 260360 }, { "epoch": 0.91, "learning_rate": 4.594600250421147e-06, "loss": 2.357, "step": 260370 }, { "epoch": 0.91, "learning_rate": 4.592856370567494e-06, "loss": 2.364, "step": 260380 }, { "epoch": 0.91, "learning_rate": 4.59111249071384e-06, "loss": 2.3269, "step": 260390 }, { "epoch": 0.91, "learning_rate": 4.589368610860186e-06, "loss": 2.2807, "step": 260400 }, { "epoch": 0.91, "learning_rate": 4.587624731006532e-06, "loss": 2.3327, "step": 260410 }, { "epoch": 0.91, "learning_rate": 4.58588085115288e-06, "loss": 2.4024, "step": 260420 }, { "epoch": 0.91, "learning_rate": 4.584136971299226e-06, "loss": 2.3821, "step": 260430 }, { "epoch": 0.91, "learning_rate": 4.582393091445572e-06, "loss": 2.3248, "step": 260440 }, { "epoch": 0.91, "learning_rate": 4.580649211591918e-06, "loss": 2.3765, "step": 260450 }, { "epoch": 0.91, "learning_rate": 4.578905331738265e-06, "loss": 2.3548, "step": 260460 }, { "epoch": 0.91, "learning_rate": 4.577161451884611e-06, "loss": 2.3307, "step": 260470 }, { "epoch": 0.91, "learning_rate": 4.575417572030958e-06, "loss": 2.342, "step": 260480 }, { "epoch": 0.91, "learning_rate": 4.573673692177304e-06, "loss": 2.2877, "step": 260490 }, { "epoch": 0.91, "learning_rate": 4.571929812323651e-06, "loss": 2.4089, "step": 260500 }, { "epoch": 0.91, "learning_rate": 4.570185932469997e-06, "loss": 2.304, "step": 260510 }, { "epoch": 0.91, "learning_rate": 4.568442052616343e-06, "loss": 2.3102, "step": 260520 }, { "epoch": 0.91, "learning_rate": 4.566698172762689e-06, "loss": 2.3569, "step": 260530 }, { "epoch": 0.91, "learning_rate": 4.564954292909036e-06, "loss": 2.252, "step": 260540 }, { "epoch": 0.91, "learning_rate": 4.563210413055383e-06, "loss": 2.35, "step": 260550 }, { "epoch": 0.91, "learning_rate": 4.561466533201729e-06, "loss": 2.378, "step": 260560 }, { "epoch": 0.91, "learning_rate": 4.559722653348075e-06, "loss": 2.4026, "step": 260570 }, { "epoch": 0.91, "learning_rate": 4.557978773494422e-06, "loss": 2.3163, "step": 260580 }, { "epoch": 0.91, "learning_rate": 4.556234893640768e-06, "loss": 2.3541, "step": 260590 }, { "epoch": 0.91, "learning_rate": 4.554491013787114e-06, "loss": 2.391, "step": 260600 }, { "epoch": 0.91, "learning_rate": 4.55274713393346e-06, "loss": 2.3464, "step": 260610 }, { "epoch": 0.91, "learning_rate": 4.551003254079808e-06, "loss": 2.3818, "step": 260620 }, { "epoch": 0.91, "learning_rate": 4.549259374226154e-06, "loss": 2.3796, "step": 260630 }, { "epoch": 0.91, "learning_rate": 4.5475154943725e-06, "loss": 2.3831, "step": 260640 }, { "epoch": 0.91, "learning_rate": 4.545771614518846e-06, "loss": 2.3433, "step": 260650 }, { "epoch": 0.91, "learning_rate": 4.544027734665193e-06, "loss": 2.3453, "step": 260660 }, { "epoch": 0.91, "learning_rate": 4.542283854811539e-06, "loss": 2.311, "step": 260670 }, { "epoch": 0.91, "learning_rate": 4.540539974957886e-06, "loss": 2.3437, "step": 260680 }, { "epoch": 0.91, "learning_rate": 4.538796095104232e-06, "loss": 2.3625, "step": 260690 }, { "epoch": 0.91, "learning_rate": 4.537052215250579e-06, "loss": 2.3099, "step": 260700 }, { "epoch": 0.91, "learning_rate": 4.535308335396925e-06, "loss": 2.3377, "step": 260710 }, { "epoch": 0.91, "learning_rate": 4.533564455543271e-06, "loss": 2.2412, "step": 260720 }, { "epoch": 0.91, "learning_rate": 4.531820575689617e-06, "loss": 2.324, "step": 260730 }, { "epoch": 0.91, "learning_rate": 4.530076695835964e-06, "loss": 2.3278, "step": 260740 }, { "epoch": 0.91, "learning_rate": 4.5283328159823105e-06, "loss": 2.3289, "step": 260750 }, { "epoch": 0.91, "learning_rate": 4.526588936128657e-06, "loss": 2.3259, "step": 260760 }, { "epoch": 0.91, "learning_rate": 4.524845056275003e-06, "loss": 2.3945, "step": 260770 }, { "epoch": 0.91, "learning_rate": 4.52310117642135e-06, "loss": 2.3433, "step": 260780 }, { "epoch": 0.91, "learning_rate": 4.521357296567696e-06, "loss": 2.3382, "step": 260790 }, { "epoch": 0.91, "learning_rate": 4.519613416714042e-06, "loss": 2.4201, "step": 260800 }, { "epoch": 0.91, "learning_rate": 4.517869536860388e-06, "loss": 2.3666, "step": 260810 }, { "epoch": 0.91, "learning_rate": 4.516125657006736e-06, "loss": 2.3214, "step": 260820 }, { "epoch": 0.91, "learning_rate": 4.5143817771530815e-06, "loss": 2.2794, "step": 260830 }, { "epoch": 0.91, "learning_rate": 4.512637897299428e-06, "loss": 2.357, "step": 260840 }, { "epoch": 0.91, "learning_rate": 4.510894017445774e-06, "loss": 2.3853, "step": 260850 }, { "epoch": 0.91, "learning_rate": 4.509150137592121e-06, "loss": 2.3714, "step": 260860 }, { "epoch": 0.91, "learning_rate": 4.507406257738467e-06, "loss": 2.3579, "step": 260870 }, { "epoch": 0.91, "learning_rate": 4.505662377884814e-06, "loss": 2.313, "step": 260880 }, { "epoch": 0.91, "learning_rate": 4.50391849803116e-06, "loss": 2.313, "step": 260890 }, { "epoch": 0.91, "learning_rate": 4.502174618177507e-06, "loss": 2.3379, "step": 260900 }, { "epoch": 0.91, "learning_rate": 4.5004307383238525e-06, "loss": 2.3111, "step": 260910 }, { "epoch": 0.91, "learning_rate": 4.498686858470199e-06, "loss": 2.3886, "step": 260920 }, { "epoch": 0.91, "learning_rate": 4.496942978616545e-06, "loss": 2.3052, "step": 260930 }, { "epoch": 0.91, "learning_rate": 4.495199098762892e-06, "loss": 2.3363, "step": 260940 }, { "epoch": 0.91, "learning_rate": 4.4934552189092384e-06, "loss": 2.3539, "step": 260950 }, { "epoch": 0.91, "learning_rate": 4.491711339055585e-06, "loss": 2.4119, "step": 260960 }, { "epoch": 0.91, "learning_rate": 4.489967459201931e-06, "loss": 2.4119, "step": 260970 }, { "epoch": 0.91, "learning_rate": 4.488223579348278e-06, "loss": 2.3076, "step": 260980 }, { "epoch": 0.91, "learning_rate": 4.4864796994946235e-06, "loss": 2.3235, "step": 260990 }, { "epoch": 0.91, "learning_rate": 4.48473581964097e-06, "loss": 2.3114, "step": 261000 }, { "epoch": 0.91, "learning_rate": 4.482991939787316e-06, "loss": 2.3767, "step": 261010 }, { "epoch": 0.91, "learning_rate": 4.481248059933664e-06, "loss": 2.3676, "step": 261020 }, { "epoch": 0.91, "learning_rate": 4.4795041800800094e-06, "loss": 2.3877, "step": 261030 }, { "epoch": 0.91, "learning_rate": 4.477760300226356e-06, "loss": 2.3391, "step": 261040 }, { "epoch": 0.91, "learning_rate": 4.476016420372702e-06, "loss": 2.3292, "step": 261050 }, { "epoch": 0.91, "learning_rate": 4.474272540519049e-06, "loss": 2.3391, "step": 261060 }, { "epoch": 0.91, "learning_rate": 4.4725286606653945e-06, "loss": 2.3339, "step": 261070 }, { "epoch": 0.91, "learning_rate": 4.470784780811742e-06, "loss": 2.315, "step": 261080 }, { "epoch": 0.91, "learning_rate": 4.469040900958088e-06, "loss": 2.4257, "step": 261090 }, { "epoch": 0.91, "learning_rate": 4.467297021104435e-06, "loss": 2.4444, "step": 261100 }, { "epoch": 0.91, "learning_rate": 4.4655531412507804e-06, "loss": 2.3276, "step": 261110 }, { "epoch": 0.91, "learning_rate": 4.463809261397127e-06, "loss": 2.3242, "step": 261120 }, { "epoch": 0.91, "learning_rate": 4.462065381543473e-06, "loss": 2.3685, "step": 261130 }, { "epoch": 0.91, "learning_rate": 4.46032150168982e-06, "loss": 2.3212, "step": 261140 }, { "epoch": 0.91, "learning_rate": 4.458577621836166e-06, "loss": 2.2812, "step": 261150 }, { "epoch": 0.91, "learning_rate": 4.456833741982513e-06, "loss": 2.3493, "step": 261160 }, { "epoch": 0.91, "learning_rate": 4.455089862128859e-06, "loss": 2.3546, "step": 261170 }, { "epoch": 0.91, "learning_rate": 4.453345982275206e-06, "loss": 2.3377, "step": 261180 }, { "epoch": 0.91, "learning_rate": 4.4516021024215514e-06, "loss": 2.3374, "step": 261190 }, { "epoch": 0.91, "learning_rate": 4.449858222567898e-06, "loss": 2.3196, "step": 261200 }, { "epoch": 0.91, "learning_rate": 4.448114342714244e-06, "loss": 2.3462, "step": 261210 }, { "epoch": 0.91, "learning_rate": 4.4463704628605915e-06, "loss": 2.298, "step": 261220 }, { "epoch": 0.91, "learning_rate": 4.444626583006937e-06, "loss": 2.3123, "step": 261230 }, { "epoch": 0.91, "learning_rate": 4.442882703153284e-06, "loss": 2.2913, "step": 261240 }, { "epoch": 0.91, "learning_rate": 4.44113882329963e-06, "loss": 2.4587, "step": 261250 }, { "epoch": 0.91, "learning_rate": 4.439394943445977e-06, "loss": 2.3478, "step": 261260 }, { "epoch": 0.91, "learning_rate": 4.4376510635923224e-06, "loss": 2.4092, "step": 261270 }, { "epoch": 0.91, "learning_rate": 4.43590718373867e-06, "loss": 2.2167, "step": 261280 }, { "epoch": 0.91, "learning_rate": 4.434163303885016e-06, "loss": 2.3615, "step": 261290 }, { "epoch": 0.91, "learning_rate": 4.4324194240313625e-06, "loss": 2.3824, "step": 261300 }, { "epoch": 0.91, "learning_rate": 4.430675544177708e-06, "loss": 2.3713, "step": 261310 }, { "epoch": 0.91, "learning_rate": 4.428931664324055e-06, "loss": 2.276, "step": 261320 }, { "epoch": 0.91, "learning_rate": 4.427187784470401e-06, "loss": 2.4067, "step": 261330 }, { "epoch": 0.91, "learning_rate": 4.425443904616748e-06, "loss": 2.3517, "step": 261340 }, { "epoch": 0.91, "learning_rate": 4.423700024763094e-06, "loss": 2.4016, "step": 261350 }, { "epoch": 0.91, "learning_rate": 4.421956144909441e-06, "loss": 2.2991, "step": 261360 }, { "epoch": 0.91, "learning_rate": 4.420212265055787e-06, "loss": 2.4047, "step": 261370 }, { "epoch": 0.91, "learning_rate": 4.4184683852021335e-06, "loss": 2.3304, "step": 261380 }, { "epoch": 0.91, "learning_rate": 4.416724505348479e-06, "loss": 2.3652, "step": 261390 }, { "epoch": 0.91, "learning_rate": 4.414980625494826e-06, "loss": 2.298, "step": 261400 }, { "epoch": 0.91, "learning_rate": 4.413236745641172e-06, "loss": 2.2839, "step": 261410 }, { "epoch": 0.91, "learning_rate": 4.4114928657875194e-06, "loss": 2.3403, "step": 261420 }, { "epoch": 0.91, "learning_rate": 4.409748985933865e-06, "loss": 2.3475, "step": 261430 }, { "epoch": 0.91, "learning_rate": 4.408005106080212e-06, "loss": 2.354, "step": 261440 }, { "epoch": 0.91, "learning_rate": 4.406261226226558e-06, "loss": 2.3663, "step": 261450 }, { "epoch": 0.91, "learning_rate": 4.4045173463729045e-06, "loss": 2.3451, "step": 261460 }, { "epoch": 0.91, "learning_rate": 4.40277346651925e-06, "loss": 2.3453, "step": 261470 }, { "epoch": 0.91, "learning_rate": 4.401029586665598e-06, "loss": 2.2611, "step": 261480 }, { "epoch": 0.91, "learning_rate": 4.399285706811944e-06, "loss": 2.3622, "step": 261490 }, { "epoch": 0.91, "learning_rate": 4.3975418269582904e-06, "loss": 2.3723, "step": 261500 }, { "epoch": 0.91, "learning_rate": 4.395797947104636e-06, "loss": 2.405, "step": 261510 }, { "epoch": 0.91, "learning_rate": 4.394054067250983e-06, "loss": 2.3213, "step": 261520 }, { "epoch": 0.91, "learning_rate": 4.392310187397329e-06, "loss": 2.3396, "step": 261530 }, { "epoch": 0.91, "learning_rate": 4.3905663075436755e-06, "loss": 2.3476, "step": 261540 }, { "epoch": 0.91, "learning_rate": 4.388822427690022e-06, "loss": 2.2973, "step": 261550 }, { "epoch": 0.91, "learning_rate": 4.387078547836369e-06, "loss": 2.3766, "step": 261560 }, { "epoch": 0.91, "learning_rate": 4.385334667982715e-06, "loss": 2.3364, "step": 261570 }, { "epoch": 0.91, "learning_rate": 4.3835907881290614e-06, "loss": 2.3679, "step": 261580 }, { "epoch": 0.91, "learning_rate": 4.381846908275407e-06, "loss": 2.3401, "step": 261590 }, { "epoch": 0.91, "learning_rate": 4.380103028421754e-06, "loss": 2.2747, "step": 261600 }, { "epoch": 0.91, "learning_rate": 4.3783591485681e-06, "loss": 2.3274, "step": 261610 }, { "epoch": 0.91, "learning_rate": 4.376615268714447e-06, "loss": 2.31, "step": 261620 }, { "epoch": 0.91, "learning_rate": 4.374871388860793e-06, "loss": 2.2706, "step": 261630 }, { "epoch": 0.91, "learning_rate": 4.37312750900714e-06, "loss": 2.3479, "step": 261640 }, { "epoch": 0.91, "learning_rate": 4.371383629153486e-06, "loss": 2.3413, "step": 261650 }, { "epoch": 0.91, "learning_rate": 4.3696397492998324e-06, "loss": 2.3022, "step": 261660 }, { "epoch": 0.91, "learning_rate": 4.367895869446178e-06, "loss": 2.3131, "step": 261670 }, { "epoch": 0.91, "learning_rate": 4.366151989592526e-06, "loss": 2.3363, "step": 261680 }, { "epoch": 0.91, "learning_rate": 4.364408109738872e-06, "loss": 2.2983, "step": 261690 }, { "epoch": 0.91, "learning_rate": 4.362664229885218e-06, "loss": 2.3433, "step": 261700 }, { "epoch": 0.91, "learning_rate": 4.360920350031564e-06, "loss": 2.273, "step": 261710 }, { "epoch": 0.91, "learning_rate": 4.359176470177911e-06, "loss": 2.3276, "step": 261720 }, { "epoch": 0.91, "learning_rate": 4.357432590324257e-06, "loss": 2.353, "step": 261730 }, { "epoch": 0.91, "learning_rate": 4.3556887104706034e-06, "loss": 2.393, "step": 261740 }, { "epoch": 0.91, "learning_rate": 4.35394483061695e-06, "loss": 2.3849, "step": 261750 }, { "epoch": 0.91, "learning_rate": 4.352200950763297e-06, "loss": 2.381, "step": 261760 }, { "epoch": 0.91, "learning_rate": 4.350457070909643e-06, "loss": 2.2692, "step": 261770 }, { "epoch": 0.91, "learning_rate": 4.348713191055989e-06, "loss": 2.3841, "step": 261780 }, { "epoch": 0.91, "learning_rate": 4.346969311202335e-06, "loss": 2.4188, "step": 261790 }, { "epoch": 0.91, "learning_rate": 4.345225431348682e-06, "loss": 2.3197, "step": 261800 }, { "epoch": 0.91, "learning_rate": 4.343481551495029e-06, "loss": 2.3346, "step": 261810 }, { "epoch": 0.91, "learning_rate": 4.341737671641375e-06, "loss": 2.2451, "step": 261820 }, { "epoch": 0.91, "learning_rate": 4.339993791787721e-06, "loss": 2.3623, "step": 261830 }, { "epoch": 0.91, "learning_rate": 4.338249911934068e-06, "loss": 2.304, "step": 261840 }, { "epoch": 0.91, "learning_rate": 4.336506032080414e-06, "loss": 2.2794, "step": 261850 }, { "epoch": 0.91, "learning_rate": 4.33476215222676e-06, "loss": 2.2622, "step": 261860 }, { "epoch": 0.91, "learning_rate": 4.333018272373106e-06, "loss": 2.3138, "step": 261870 }, { "epoch": 0.91, "learning_rate": 4.331274392519454e-06, "loss": 2.3613, "step": 261880 }, { "epoch": 0.91, "learning_rate": 4.3295305126658e-06, "loss": 2.2685, "step": 261890 }, { "epoch": 0.91, "learning_rate": 4.327786632812146e-06, "loss": 2.4418, "step": 261900 }, { "epoch": 0.91, "learning_rate": 4.326042752958492e-06, "loss": 2.2911, "step": 261910 }, { "epoch": 0.91, "learning_rate": 4.324298873104839e-06, "loss": 2.3926, "step": 261920 }, { "epoch": 0.91, "learning_rate": 4.322554993251185e-06, "loss": 2.3643, "step": 261930 }, { "epoch": 0.91, "learning_rate": 4.320811113397531e-06, "loss": 2.3188, "step": 261940 }, { "epoch": 0.91, "learning_rate": 4.319067233543878e-06, "loss": 2.3055, "step": 261950 }, { "epoch": 0.91, "learning_rate": 4.317323353690225e-06, "loss": 2.2993, "step": 261960 }, { "epoch": 0.91, "learning_rate": 4.315579473836571e-06, "loss": 2.3079, "step": 261970 }, { "epoch": 0.91, "learning_rate": 4.313835593982917e-06, "loss": 2.3523, "step": 261980 }, { "epoch": 0.91, "learning_rate": 4.312091714129263e-06, "loss": 2.426, "step": 261990 }, { "epoch": 0.91, "learning_rate": 4.31034783427561e-06, "loss": 2.3084, "step": 262000 }, { "epoch": 0.91, "learning_rate": 4.3086039544219565e-06, "loss": 2.2874, "step": 262010 }, { "epoch": 0.91, "learning_rate": 4.306860074568303e-06, "loss": 2.3822, "step": 262020 }, { "epoch": 0.91, "learning_rate": 4.305116194714649e-06, "loss": 2.3283, "step": 262030 }, { "epoch": 0.91, "learning_rate": 4.303372314860996e-06, "loss": 2.3627, "step": 262040 }, { "epoch": 0.91, "learning_rate": 4.301628435007342e-06, "loss": 2.3847, "step": 262050 }, { "epoch": 0.91, "learning_rate": 4.299884555153688e-06, "loss": 2.2688, "step": 262060 }, { "epoch": 0.91, "learning_rate": 4.298140675300034e-06, "loss": 2.2977, "step": 262070 }, { "epoch": 0.91, "learning_rate": 4.296396795446382e-06, "loss": 2.3685, "step": 262080 }, { "epoch": 0.91, "learning_rate": 4.2946529155927275e-06, "loss": 2.373, "step": 262090 }, { "epoch": 0.91, "learning_rate": 4.292909035739074e-06, "loss": 2.3827, "step": 262100 }, { "epoch": 0.91, "learning_rate": 4.29116515588542e-06, "loss": 2.3523, "step": 262110 }, { "epoch": 0.91, "learning_rate": 4.289421276031767e-06, "loss": 2.3233, "step": 262120 }, { "epoch": 0.91, "learning_rate": 4.287677396178113e-06, "loss": 2.3269, "step": 262130 }, { "epoch": 0.91, "learning_rate": 4.285933516324459e-06, "loss": 2.3678, "step": 262140 }, { "epoch": 0.91, "learning_rate": 4.284189636470806e-06, "loss": 2.4086, "step": 262150 }, { "epoch": 0.91, "learning_rate": 4.282445756617153e-06, "loss": 2.2079, "step": 262160 }, { "epoch": 0.91, "learning_rate": 4.2807018767634985e-06, "loss": 2.3446, "step": 262170 }, { "epoch": 0.91, "learning_rate": 4.278957996909845e-06, "loss": 2.3763, "step": 262180 }, { "epoch": 0.91, "learning_rate": 4.277214117056191e-06, "loss": 2.3336, "step": 262190 }, { "epoch": 0.91, "learning_rate": 4.275470237202538e-06, "loss": 2.3154, "step": 262200 }, { "epoch": 0.91, "learning_rate": 4.2737263573488845e-06, "loss": 2.278, "step": 262210 }, { "epoch": 0.91, "learning_rate": 4.271982477495231e-06, "loss": 2.2952, "step": 262220 }, { "epoch": 0.91, "learning_rate": 4.270238597641577e-06, "loss": 2.3589, "step": 262230 }, { "epoch": 0.91, "learning_rate": 4.268494717787924e-06, "loss": 2.349, "step": 262240 }, { "epoch": 0.91, "learning_rate": 4.2667508379342695e-06, "loss": 2.362, "step": 262250 }, { "epoch": 0.91, "learning_rate": 4.265006958080616e-06, "loss": 2.3746, "step": 262260 }, { "epoch": 0.91, "learning_rate": 4.263263078226962e-06, "loss": 2.3487, "step": 262270 }, { "epoch": 0.91, "learning_rate": 4.26151919837331e-06, "loss": 2.3763, "step": 262280 }, { "epoch": 0.91, "learning_rate": 4.2597753185196555e-06, "loss": 2.4307, "step": 262290 }, { "epoch": 0.91, "learning_rate": 4.258031438666002e-06, "loss": 2.3624, "step": 262300 }, { "epoch": 0.91, "learning_rate": 4.256287558812348e-06, "loss": 2.2976, "step": 262310 }, { "epoch": 0.91, "learning_rate": 4.254543678958695e-06, "loss": 2.3364, "step": 262320 }, { "epoch": 0.91, "learning_rate": 4.2527997991050405e-06, "loss": 2.3508, "step": 262330 }, { "epoch": 0.91, "learning_rate": 4.251055919251387e-06, "loss": 2.3981, "step": 262340 }, { "epoch": 0.92, "learning_rate": 4.249312039397734e-06, "loss": 2.295, "step": 262350 }, { "epoch": 0.92, "learning_rate": 4.247568159544081e-06, "loss": 2.2969, "step": 262360 }, { "epoch": 0.92, "learning_rate": 4.2458242796904265e-06, "loss": 2.3194, "step": 262370 }, { "epoch": 0.92, "learning_rate": 4.244080399836773e-06, "loss": 2.3122, "step": 262380 }, { "epoch": 0.92, "learning_rate": 4.242336519983119e-06, "loss": 2.3445, "step": 262390 }, { "epoch": 0.92, "learning_rate": 4.240592640129466e-06, "loss": 2.3949, "step": 262400 }, { "epoch": 0.92, "learning_rate": 4.238848760275812e-06, "loss": 2.3354, "step": 262410 }, { "epoch": 0.92, "learning_rate": 4.237104880422159e-06, "loss": 2.3003, "step": 262420 }, { "epoch": 0.92, "learning_rate": 4.235361000568505e-06, "loss": 2.3792, "step": 262430 }, { "epoch": 0.92, "learning_rate": 4.233617120714852e-06, "loss": 2.3225, "step": 262440 }, { "epoch": 0.92, "learning_rate": 4.2318732408611975e-06, "loss": 2.3339, "step": 262450 }, { "epoch": 0.92, "learning_rate": 4.230129361007544e-06, "loss": 2.2889, "step": 262460 }, { "epoch": 0.92, "learning_rate": 4.22838548115389e-06, "loss": 2.3707, "step": 262470 }, { "epoch": 0.92, "learning_rate": 4.2266416013002375e-06, "loss": 2.3939, "step": 262480 }, { "epoch": 0.92, "learning_rate": 4.224897721446583e-06, "loss": 2.2476, "step": 262490 }, { "epoch": 0.92, "learning_rate": 4.22315384159293e-06, "loss": 2.3301, "step": 262500 }, { "epoch": 0.92, "learning_rate": 4.221409961739276e-06, "loss": 2.3652, "step": 262510 }, { "epoch": 0.92, "learning_rate": 4.219666081885623e-06, "loss": 2.317, "step": 262520 }, { "epoch": 0.92, "learning_rate": 4.2179222020319685e-06, "loss": 2.3256, "step": 262530 }, { "epoch": 0.92, "learning_rate": 4.216178322178315e-06, "loss": 2.3805, "step": 262540 }, { "epoch": 0.92, "learning_rate": 4.214434442324662e-06, "loss": 2.3207, "step": 262550 }, { "epoch": 0.92, "learning_rate": 4.2126905624710085e-06, "loss": 2.3011, "step": 262560 }, { "epoch": 0.92, "learning_rate": 4.210946682617354e-06, "loss": 2.3197, "step": 262570 }, { "epoch": 0.92, "learning_rate": 4.209202802763701e-06, "loss": 2.3412, "step": 262580 }, { "epoch": 0.92, "learning_rate": 4.207458922910047e-06, "loss": 2.3246, "step": 262590 }, { "epoch": 0.92, "learning_rate": 4.205715043056394e-06, "loss": 2.4308, "step": 262600 }, { "epoch": 0.92, "learning_rate": 4.20397116320274e-06, "loss": 2.3343, "step": 262610 }, { "epoch": 0.92, "learning_rate": 4.202227283349087e-06, "loss": 2.2681, "step": 262620 }, { "epoch": 0.92, "learning_rate": 4.200483403495433e-06, "loss": 2.3522, "step": 262630 }, { "epoch": 0.92, "learning_rate": 4.1987395236417795e-06, "loss": 2.3777, "step": 262640 }, { "epoch": 0.92, "learning_rate": 4.196995643788125e-06, "loss": 2.2508, "step": 262650 }, { "epoch": 0.92, "learning_rate": 4.195251763934472e-06, "loss": 2.3712, "step": 262660 }, { "epoch": 0.92, "learning_rate": 4.193507884080818e-06, "loss": 2.2993, "step": 262670 }, { "epoch": 0.92, "learning_rate": 4.1917640042271655e-06, "loss": 2.343, "step": 262680 }, { "epoch": 0.92, "learning_rate": 4.190020124373511e-06, "loss": 2.3114, "step": 262690 }, { "epoch": 0.92, "learning_rate": 4.188276244519858e-06, "loss": 2.4111, "step": 262700 }, { "epoch": 0.92, "learning_rate": 4.186532364666204e-06, "loss": 2.3451, "step": 262710 }, { "epoch": 0.92, "learning_rate": 4.1847884848125505e-06, "loss": 2.3228, "step": 262720 }, { "epoch": 0.92, "learning_rate": 4.183044604958896e-06, "loss": 2.2874, "step": 262730 }, { "epoch": 0.92, "learning_rate": 4.181300725105243e-06, "loss": 2.3102, "step": 262740 }, { "epoch": 0.92, "learning_rate": 4.17955684525159e-06, "loss": 2.3469, "step": 262750 }, { "epoch": 0.92, "learning_rate": 4.1778129653979365e-06, "loss": 2.3682, "step": 262760 }, { "epoch": 0.92, "learning_rate": 4.176069085544282e-06, "loss": 2.3497, "step": 262770 }, { "epoch": 0.92, "learning_rate": 4.174325205690629e-06, "loss": 2.3546, "step": 262780 }, { "epoch": 0.92, "learning_rate": 4.172581325836975e-06, "loss": 2.4529, "step": 262790 }, { "epoch": 0.92, "learning_rate": 4.1708374459833215e-06, "loss": 2.2522, "step": 262800 }, { "epoch": 0.92, "learning_rate": 4.169093566129668e-06, "loss": 2.3059, "step": 262810 }, { "epoch": 0.92, "learning_rate": 4.167349686276015e-06, "loss": 2.4088, "step": 262820 }, { "epoch": 0.92, "learning_rate": 4.165605806422361e-06, "loss": 2.3307, "step": 262830 }, { "epoch": 0.92, "learning_rate": 4.1638619265687075e-06, "loss": 2.3656, "step": 262840 }, { "epoch": 0.92, "learning_rate": 4.162118046715053e-06, "loss": 2.3476, "step": 262850 }, { "epoch": 0.92, "learning_rate": 4.1603741668614e-06, "loss": 2.3334, "step": 262860 }, { "epoch": 0.92, "learning_rate": 4.158630287007746e-06, "loss": 2.2638, "step": 262870 }, { "epoch": 0.92, "learning_rate": 4.156886407154093e-06, "loss": 2.3666, "step": 262880 }, { "epoch": 0.92, "learning_rate": 4.155142527300439e-06, "loss": 2.3872, "step": 262890 }, { "epoch": 0.92, "learning_rate": 4.153398647446786e-06, "loss": 2.3207, "step": 262900 }, { "epoch": 0.92, "learning_rate": 4.151654767593132e-06, "loss": 2.3152, "step": 262910 }, { "epoch": 0.92, "learning_rate": 4.1499108877394785e-06, "loss": 2.3927, "step": 262920 }, { "epoch": 0.92, "learning_rate": 4.148167007885824e-06, "loss": 2.3011, "step": 262930 }, { "epoch": 0.92, "learning_rate": 4.146423128032171e-06, "loss": 2.3237, "step": 262940 }, { "epoch": 0.92, "learning_rate": 4.144679248178518e-06, "loss": 2.298, "step": 262950 }, { "epoch": 0.92, "learning_rate": 4.142935368324864e-06, "loss": 2.3313, "step": 262960 }, { "epoch": 0.92, "learning_rate": 4.14119148847121e-06, "loss": 2.3022, "step": 262970 }, { "epoch": 0.92, "learning_rate": 4.139447608617557e-06, "loss": 2.362, "step": 262980 }, { "epoch": 0.92, "learning_rate": 4.137703728763903e-06, "loss": 2.3583, "step": 262990 }, { "epoch": 0.92, "learning_rate": 4.1359598489102495e-06, "loss": 2.3251, "step": 263000 }, { "epoch": 0.92, "learning_rate": 4.134215969056596e-06, "loss": 2.3248, "step": 263010 }, { "epoch": 0.92, "learning_rate": 4.132472089202943e-06, "loss": 2.3606, "step": 263020 }, { "epoch": 0.92, "learning_rate": 4.130728209349289e-06, "loss": 2.3407, "step": 263030 }, { "epoch": 0.92, "learning_rate": 4.128984329495635e-06, "loss": 2.3262, "step": 263040 }, { "epoch": 0.92, "learning_rate": 4.127240449641981e-06, "loss": 2.2578, "step": 263050 }, { "epoch": 0.92, "learning_rate": 4.125496569788328e-06, "loss": 2.2956, "step": 263060 }, { "epoch": 0.92, "learning_rate": 4.123752689934674e-06, "loss": 2.2981, "step": 263070 }, { "epoch": 0.92, "learning_rate": 4.122008810081021e-06, "loss": 2.3968, "step": 263080 }, { "epoch": 0.92, "learning_rate": 4.120264930227367e-06, "loss": 2.369, "step": 263090 }, { "epoch": 0.92, "learning_rate": 4.118521050373714e-06, "loss": 2.3547, "step": 263100 }, { "epoch": 0.92, "learning_rate": 4.11677717052006e-06, "loss": 2.3972, "step": 263110 }, { "epoch": 0.92, "learning_rate": 4.115033290666406e-06, "loss": 2.337, "step": 263120 }, { "epoch": 0.92, "learning_rate": 4.113289410812752e-06, "loss": 2.3151, "step": 263130 }, { "epoch": 0.92, "learning_rate": 4.1115455309591e-06, "loss": 2.3547, "step": 263140 }, { "epoch": 0.92, "learning_rate": 4.109801651105446e-06, "loss": 2.2942, "step": 263150 }, { "epoch": 0.92, "learning_rate": 4.108057771251792e-06, "loss": 2.3708, "step": 263160 }, { "epoch": 0.92, "learning_rate": 4.106313891398138e-06, "loss": 2.3687, "step": 263170 }, { "epoch": 0.92, "learning_rate": 4.104570011544485e-06, "loss": 2.4522, "step": 263180 }, { "epoch": 0.92, "learning_rate": 4.102826131690831e-06, "loss": 2.323, "step": 263190 }, { "epoch": 0.92, "learning_rate": 4.101082251837177e-06, "loss": 2.4175, "step": 263200 }, { "epoch": 0.92, "learning_rate": 4.099338371983524e-06, "loss": 2.3018, "step": 263210 }, { "epoch": 0.92, "learning_rate": 4.097594492129871e-06, "loss": 2.3607, "step": 263220 }, { "epoch": 0.92, "learning_rate": 4.095850612276217e-06, "loss": 2.4167, "step": 263230 }, { "epoch": 0.92, "learning_rate": 4.094106732422563e-06, "loss": 2.3524, "step": 263240 }, { "epoch": 0.92, "learning_rate": 4.092362852568909e-06, "loss": 2.3222, "step": 263250 }, { "epoch": 0.92, "learning_rate": 4.090618972715256e-06, "loss": 2.2791, "step": 263260 }, { "epoch": 0.92, "learning_rate": 4.088875092861602e-06, "loss": 2.2899, "step": 263270 }, { "epoch": 0.92, "learning_rate": 4.087131213007949e-06, "loss": 2.3866, "step": 263280 }, { "epoch": 0.92, "learning_rate": 4.085387333154295e-06, "loss": 2.3387, "step": 263290 }, { "epoch": 0.92, "learning_rate": 4.083643453300642e-06, "loss": 2.3567, "step": 263300 }, { "epoch": 0.92, "learning_rate": 4.081899573446988e-06, "loss": 2.3763, "step": 263310 }, { "epoch": 0.92, "learning_rate": 4.080155693593334e-06, "loss": 2.2517, "step": 263320 }, { "epoch": 0.92, "learning_rate": 4.07841181373968e-06, "loss": 2.2759, "step": 263330 }, { "epoch": 0.92, "learning_rate": 4.076667933886028e-06, "loss": 2.364, "step": 263340 }, { "epoch": 0.92, "learning_rate": 4.0749240540323736e-06, "loss": 2.2959, "step": 263350 }, { "epoch": 0.92, "learning_rate": 4.07318017417872e-06, "loss": 2.323, "step": 263360 }, { "epoch": 0.92, "learning_rate": 4.071436294325066e-06, "loss": 2.4053, "step": 263370 }, { "epoch": 0.92, "learning_rate": 4.069692414471413e-06, "loss": 2.2993, "step": 263380 }, { "epoch": 0.92, "learning_rate": 4.067948534617759e-06, "loss": 2.3092, "step": 263390 }, { "epoch": 0.92, "learning_rate": 4.066204654764105e-06, "loss": 2.3892, "step": 263400 }, { "epoch": 0.92, "learning_rate": 4.064460774910452e-06, "loss": 2.3259, "step": 263410 }, { "epoch": 0.92, "learning_rate": 4.062716895056799e-06, "loss": 2.3431, "step": 263420 }, { "epoch": 0.92, "learning_rate": 4.0609730152031446e-06, "loss": 2.3555, "step": 263430 }, { "epoch": 0.92, "learning_rate": 4.059229135349491e-06, "loss": 2.2619, "step": 263440 }, { "epoch": 0.92, "learning_rate": 4.057485255495837e-06, "loss": 2.343, "step": 263450 }, { "epoch": 0.92, "learning_rate": 4.055741375642184e-06, "loss": 2.3969, "step": 263460 }, { "epoch": 0.92, "learning_rate": 4.05399749578853e-06, "loss": 2.3697, "step": 263470 }, { "epoch": 0.92, "learning_rate": 4.052253615934877e-06, "loss": 2.392, "step": 263480 }, { "epoch": 0.92, "learning_rate": 4.050509736081223e-06, "loss": 2.3866, "step": 263490 }, { "epoch": 0.92, "learning_rate": 4.04876585622757e-06, "loss": 2.3541, "step": 263500 }, { "epoch": 0.92, "learning_rate": 4.0470219763739156e-06, "loss": 2.4105, "step": 263510 }, { "epoch": 0.92, "learning_rate": 4.045278096520262e-06, "loss": 2.365, "step": 263520 }, { "epoch": 0.92, "learning_rate": 4.043534216666608e-06, "loss": 2.2937, "step": 263530 }, { "epoch": 0.92, "learning_rate": 4.041790336812956e-06, "loss": 2.301, "step": 263540 }, { "epoch": 0.92, "learning_rate": 4.0400464569593015e-06, "loss": 2.429, "step": 263550 }, { "epoch": 0.92, "learning_rate": 4.038302577105648e-06, "loss": 2.3045, "step": 263560 }, { "epoch": 0.92, "learning_rate": 4.036558697251994e-06, "loss": 2.3929, "step": 263570 }, { "epoch": 0.92, "learning_rate": 4.034814817398341e-06, "loss": 2.284, "step": 263580 }, { "epoch": 0.92, "learning_rate": 4.0330709375446866e-06, "loss": 2.3486, "step": 263590 }, { "epoch": 0.92, "learning_rate": 4.031327057691033e-06, "loss": 2.3002, "step": 263600 }, { "epoch": 0.92, "learning_rate": 4.02958317783738e-06, "loss": 2.379, "step": 263610 }, { "epoch": 0.92, "learning_rate": 4.027839297983727e-06, "loss": 2.3479, "step": 263620 }, { "epoch": 0.92, "learning_rate": 4.0260954181300725e-06, "loss": 2.3824, "step": 263630 }, { "epoch": 0.92, "learning_rate": 4.024351538276419e-06, "loss": 2.286, "step": 263640 }, { "epoch": 0.92, "learning_rate": 4.022607658422765e-06, "loss": 2.3857, "step": 263650 }, { "epoch": 0.92, "learning_rate": 4.020863778569112e-06, "loss": 2.2697, "step": 263660 }, { "epoch": 0.92, "learning_rate": 4.0191198987154576e-06, "loss": 2.3455, "step": 263670 }, { "epoch": 0.92, "learning_rate": 4.017376018861805e-06, "loss": 2.3881, "step": 263680 }, { "epoch": 0.92, "learning_rate": 4.015632139008151e-06, "loss": 2.3679, "step": 263690 }, { "epoch": 0.92, "learning_rate": 4.013888259154498e-06, "loss": 2.3713, "step": 263700 }, { "epoch": 0.92, "learning_rate": 4.0121443793008435e-06, "loss": 2.3311, "step": 263710 }, { "epoch": 0.92, "learning_rate": 4.01040049944719e-06, "loss": 2.363, "step": 263720 }, { "epoch": 0.92, "learning_rate": 4.008656619593536e-06, "loss": 2.3296, "step": 263730 }, { "epoch": 0.92, "learning_rate": 4.0069127397398836e-06, "loss": 2.3856, "step": 263740 }, { "epoch": 0.92, "learning_rate": 4.005168859886229e-06, "loss": 2.3504, "step": 263750 }, { "epoch": 0.92, "learning_rate": 4.003424980032576e-06, "loss": 2.339, "step": 263760 }, { "epoch": 0.92, "learning_rate": 4.001681100178922e-06, "loss": 2.2964, "step": 263770 }, { "epoch": 0.92, "learning_rate": 3.999937220325269e-06, "loss": 2.3172, "step": 263780 }, { "epoch": 0.92, "learning_rate": 3.9981933404716145e-06, "loss": 2.4197, "step": 263790 }, { "epoch": 0.92, "learning_rate": 3.996449460617961e-06, "loss": 2.3102, "step": 263800 }, { "epoch": 0.92, "learning_rate": 3.994705580764308e-06, "loss": 2.3635, "step": 263810 }, { "epoch": 0.92, "learning_rate": 3.9929617009106546e-06, "loss": 2.3284, "step": 263820 }, { "epoch": 0.92, "learning_rate": 3.991217821057e-06, "loss": 2.3255, "step": 263830 }, { "epoch": 0.92, "learning_rate": 3.989473941203347e-06, "loss": 2.3468, "step": 263840 }, { "epoch": 0.92, "learning_rate": 3.987730061349693e-06, "loss": 2.3376, "step": 263850 }, { "epoch": 0.92, "learning_rate": 3.98598618149604e-06, "loss": 2.3345, "step": 263860 }, { "epoch": 0.92, "learning_rate": 3.9842423016423855e-06, "loss": 2.3419, "step": 263870 }, { "epoch": 0.92, "learning_rate": 3.982498421788733e-06, "loss": 2.3282, "step": 263880 }, { "epoch": 0.92, "learning_rate": 3.980754541935079e-06, "loss": 2.4248, "step": 263890 }, { "epoch": 0.92, "learning_rate": 3.9790106620814256e-06, "loss": 2.3664, "step": 263900 }, { "epoch": 0.92, "learning_rate": 3.977266782227771e-06, "loss": 2.3357, "step": 263910 }, { "epoch": 0.92, "learning_rate": 3.975522902374118e-06, "loss": 2.3747, "step": 263920 }, { "epoch": 0.92, "learning_rate": 3.973779022520464e-06, "loss": 2.2631, "step": 263930 }, { "epoch": 0.92, "learning_rate": 3.9720351426668115e-06, "loss": 2.3886, "step": 263940 }, { "epoch": 0.92, "learning_rate": 3.970291262813157e-06, "loss": 2.3887, "step": 263950 }, { "epoch": 0.92, "learning_rate": 3.968547382959504e-06, "loss": 2.2767, "step": 263960 }, { "epoch": 0.92, "learning_rate": 3.96680350310585e-06, "loss": 2.3866, "step": 263970 }, { "epoch": 0.92, "learning_rate": 3.9650596232521966e-06, "loss": 2.3092, "step": 263980 }, { "epoch": 0.92, "learning_rate": 3.963315743398542e-06, "loss": 2.4075, "step": 263990 }, { "epoch": 0.92, "learning_rate": 3.961571863544889e-06, "loss": 2.3982, "step": 264000 }, { "epoch": 0.92, "learning_rate": 3.959827983691236e-06, "loss": 2.3446, "step": 264010 }, { "epoch": 0.92, "learning_rate": 3.9580841038375825e-06, "loss": 2.3195, "step": 264020 }, { "epoch": 0.92, "learning_rate": 3.956340223983928e-06, "loss": 2.2972, "step": 264030 }, { "epoch": 0.92, "learning_rate": 3.954596344130275e-06, "loss": 2.297, "step": 264040 }, { "epoch": 0.92, "learning_rate": 3.952852464276621e-06, "loss": 2.3672, "step": 264050 }, { "epoch": 0.92, "learning_rate": 3.9511085844229676e-06, "loss": 2.3288, "step": 264060 }, { "epoch": 0.92, "learning_rate": 3.949364704569314e-06, "loss": 2.3565, "step": 264070 }, { "epoch": 0.92, "learning_rate": 3.947620824715661e-06, "loss": 2.3376, "step": 264080 }, { "epoch": 0.92, "learning_rate": 3.945876944862007e-06, "loss": 2.3769, "step": 264090 }, { "epoch": 0.92, "learning_rate": 3.9441330650083535e-06, "loss": 2.3342, "step": 264100 }, { "epoch": 0.92, "learning_rate": 3.942389185154699e-06, "loss": 2.3069, "step": 264110 }, { "epoch": 0.92, "learning_rate": 3.940645305301046e-06, "loss": 2.3067, "step": 264120 }, { "epoch": 0.92, "learning_rate": 3.938901425447393e-06, "loss": 2.3776, "step": 264130 }, { "epoch": 0.92, "learning_rate": 3.937157545593739e-06, "loss": 2.337, "step": 264140 }, { "epoch": 0.92, "learning_rate": 3.935413665740085e-06, "loss": 2.3644, "step": 264150 }, { "epoch": 0.92, "learning_rate": 3.933669785886432e-06, "loss": 2.3487, "step": 264160 }, { "epoch": 0.92, "learning_rate": 3.931925906032778e-06, "loss": 2.3456, "step": 264170 }, { "epoch": 0.92, "learning_rate": 3.9301820261791245e-06, "loss": 2.3403, "step": 264180 }, { "epoch": 0.92, "learning_rate": 3.92843814632547e-06, "loss": 2.396, "step": 264190 }, { "epoch": 0.92, "learning_rate": 3.926694266471817e-06, "loss": 2.2129, "step": 264200 }, { "epoch": 0.92, "learning_rate": 3.924950386618164e-06, "loss": 2.2855, "step": 264210 }, { "epoch": 0.92, "learning_rate": 3.92320650676451e-06, "loss": 2.3927, "step": 264220 }, { "epoch": 0.92, "learning_rate": 3.921462626910856e-06, "loss": 2.3499, "step": 264230 }, { "epoch": 0.92, "learning_rate": 3.919718747057203e-06, "loss": 2.3283, "step": 264240 }, { "epoch": 0.92, "learning_rate": 3.917974867203549e-06, "loss": 2.3078, "step": 264250 }, { "epoch": 0.92, "learning_rate": 3.9162309873498955e-06, "loss": 2.3415, "step": 264260 }, { "epoch": 0.92, "learning_rate": 3.914487107496242e-06, "loss": 2.3633, "step": 264270 }, { "epoch": 0.92, "learning_rate": 3.912743227642589e-06, "loss": 2.3757, "step": 264280 }, { "epoch": 0.92, "learning_rate": 3.910999347788935e-06, "loss": 2.3602, "step": 264290 }, { "epoch": 0.92, "learning_rate": 3.909255467935281e-06, "loss": 2.3647, "step": 264300 }, { "epoch": 0.92, "learning_rate": 3.907511588081627e-06, "loss": 2.2689, "step": 264310 }, { "epoch": 0.92, "learning_rate": 3.905767708227974e-06, "loss": 2.4001, "step": 264320 }, { "epoch": 0.92, "learning_rate": 3.904023828374321e-06, "loss": 2.3542, "step": 264330 }, { "epoch": 0.92, "learning_rate": 3.902279948520667e-06, "loss": 2.3069, "step": 264340 }, { "epoch": 0.92, "learning_rate": 3.900536068667013e-06, "loss": 2.3367, "step": 264350 }, { "epoch": 0.92, "learning_rate": 3.89879218881336e-06, "loss": 2.3844, "step": 264360 }, { "epoch": 0.92, "learning_rate": 3.897048308959706e-06, "loss": 2.3939, "step": 264370 }, { "epoch": 0.92, "learning_rate": 3.895304429106052e-06, "loss": 2.3652, "step": 264380 }, { "epoch": 0.92, "learning_rate": 3.893560549252399e-06, "loss": 2.2973, "step": 264390 }, { "epoch": 0.92, "learning_rate": 3.891816669398745e-06, "loss": 2.3474, "step": 264400 }, { "epoch": 0.92, "learning_rate": 3.890072789545092e-06, "loss": 2.4206, "step": 264410 }, { "epoch": 0.92, "learning_rate": 3.888328909691438e-06, "loss": 2.4373, "step": 264420 }, { "epoch": 0.92, "learning_rate": 3.886585029837784e-06, "loss": 2.3135, "step": 264430 }, { "epoch": 0.92, "learning_rate": 3.884841149984131e-06, "loss": 2.3615, "step": 264440 }, { "epoch": 0.92, "learning_rate": 3.883097270130477e-06, "loss": 2.3445, "step": 264450 }, { "epoch": 0.92, "learning_rate": 3.881353390276823e-06, "loss": 2.3221, "step": 264460 }, { "epoch": 0.92, "learning_rate": 3.87960951042317e-06, "loss": 2.394, "step": 264470 }, { "epoch": 0.92, "learning_rate": 3.877865630569517e-06, "loss": 2.3942, "step": 264480 }, { "epoch": 0.92, "learning_rate": 3.876121750715863e-06, "loss": 2.3397, "step": 264490 }, { "epoch": 0.92, "learning_rate": 3.874377870862209e-06, "loss": 2.3002, "step": 264500 }, { "epoch": 0.92, "learning_rate": 3.872633991008555e-06, "loss": 2.3428, "step": 264510 }, { "epoch": 0.92, "learning_rate": 3.870890111154902e-06, "loss": 2.3871, "step": 264520 }, { "epoch": 0.92, "learning_rate": 3.8691462313012486e-06, "loss": 2.437, "step": 264530 }, { "epoch": 0.92, "learning_rate": 3.867402351447595e-06, "loss": 2.4295, "step": 264540 }, { "epoch": 0.92, "learning_rate": 3.865658471593941e-06, "loss": 2.2996, "step": 264550 }, { "epoch": 0.92, "learning_rate": 3.863914591740288e-06, "loss": 2.3448, "step": 264560 }, { "epoch": 0.92, "learning_rate": 3.862170711886634e-06, "loss": 2.2866, "step": 264570 }, { "epoch": 0.92, "learning_rate": 3.86042683203298e-06, "loss": 2.2855, "step": 264580 }, { "epoch": 0.92, "learning_rate": 3.858682952179327e-06, "loss": 2.3627, "step": 264590 }, { "epoch": 0.92, "learning_rate": 3.856939072325673e-06, "loss": 2.3843, "step": 264600 }, { "epoch": 0.92, "learning_rate": 3.8551951924720196e-06, "loss": 2.3303, "step": 264610 }, { "epoch": 0.92, "learning_rate": 3.853451312618366e-06, "loss": 2.3055, "step": 264620 }, { "epoch": 0.92, "learning_rate": 3.851707432764712e-06, "loss": 2.3088, "step": 264630 }, { "epoch": 0.92, "learning_rate": 3.849963552911059e-06, "loss": 2.2491, "step": 264640 }, { "epoch": 0.92, "learning_rate": 3.8482196730574055e-06, "loss": 2.3449, "step": 264650 }, { "epoch": 0.92, "learning_rate": 3.846475793203751e-06, "loss": 2.3297, "step": 264660 }, { "epoch": 0.92, "learning_rate": 3.844731913350098e-06, "loss": 2.3287, "step": 264670 }, { "epoch": 0.92, "learning_rate": 3.842988033496445e-06, "loss": 2.2553, "step": 264680 }, { "epoch": 0.92, "learning_rate": 3.8412441536427906e-06, "loss": 2.3409, "step": 264690 }, { "epoch": 0.92, "learning_rate": 3.839500273789137e-06, "loss": 2.3573, "step": 264700 }, { "epoch": 0.92, "learning_rate": 3.837756393935483e-06, "loss": 2.4352, "step": 264710 }, { "epoch": 0.92, "learning_rate": 3.83601251408183e-06, "loss": 2.311, "step": 264720 }, { "epoch": 0.92, "learning_rate": 3.8342686342281765e-06, "loss": 2.3182, "step": 264730 }, { "epoch": 0.92, "learning_rate": 3.832524754374523e-06, "loss": 2.3018, "step": 264740 }, { "epoch": 0.92, "learning_rate": 3.830780874520869e-06, "loss": 2.3917, "step": 264750 }, { "epoch": 0.92, "learning_rate": 3.829036994667216e-06, "loss": 2.3459, "step": 264760 }, { "epoch": 0.92, "learning_rate": 3.8272931148135616e-06, "loss": 2.3704, "step": 264770 }, { "epoch": 0.92, "learning_rate": 3.825549234959908e-06, "loss": 2.3504, "step": 264780 }, { "epoch": 0.92, "learning_rate": 3.823805355106255e-06, "loss": 2.3117, "step": 264790 }, { "epoch": 0.92, "learning_rate": 3.822061475252601e-06, "loss": 2.3467, "step": 264800 }, { "epoch": 0.92, "learning_rate": 3.8203175953989475e-06, "loss": 2.364, "step": 264810 }, { "epoch": 0.92, "learning_rate": 3.818573715545294e-06, "loss": 2.3797, "step": 264820 }, { "epoch": 0.92, "learning_rate": 3.81682983569164e-06, "loss": 2.282, "step": 264830 }, { "epoch": 0.92, "learning_rate": 3.815085955837987e-06, "loss": 2.4325, "step": 264840 }, { "epoch": 0.92, "learning_rate": 3.813342075984333e-06, "loss": 2.2678, "step": 264850 }, { "epoch": 0.92, "learning_rate": 3.8115981961306793e-06, "loss": 2.2071, "step": 264860 }, { "epoch": 0.92, "learning_rate": 3.8098543162770264e-06, "loss": 2.398, "step": 264870 }, { "epoch": 0.92, "learning_rate": 3.8081104364233727e-06, "loss": 2.3185, "step": 264880 }, { "epoch": 0.92, "learning_rate": 3.806366556569719e-06, "loss": 2.3444, "step": 264890 }, { "epoch": 0.92, "learning_rate": 3.804622676716065e-06, "loss": 2.3493, "step": 264900 }, { "epoch": 0.92, "learning_rate": 3.8028787968624115e-06, "loss": 2.4137, "step": 264910 }, { "epoch": 0.92, "learning_rate": 3.8011349170087577e-06, "loss": 2.3469, "step": 264920 }, { "epoch": 0.92, "learning_rate": 3.799391037155104e-06, "loss": 2.3415, "step": 264930 }, { "epoch": 0.92, "learning_rate": 3.797647157301451e-06, "loss": 2.3261, "step": 264940 }, { "epoch": 0.92, "learning_rate": 3.7959032774477974e-06, "loss": 2.413, "step": 264950 }, { "epoch": 0.92, "learning_rate": 3.7941593975941437e-06, "loss": 2.304, "step": 264960 }, { "epoch": 0.92, "learning_rate": 3.79241551774049e-06, "loss": 2.4432, "step": 264970 }, { "epoch": 0.92, "learning_rate": 3.790671637886836e-06, "loss": 2.3121, "step": 264980 }, { "epoch": 0.92, "learning_rate": 3.7889277580331825e-06, "loss": 2.3189, "step": 264990 }, { "epoch": 0.92, "learning_rate": 3.7871838781795287e-06, "loss": 2.3617, "step": 265000 }, { "epoch": 0.92, "learning_rate": 3.785439998325876e-06, "loss": 2.311, "step": 265010 }, { "epoch": 0.92, "learning_rate": 3.783696118472222e-06, "loss": 2.303, "step": 265020 }, { "epoch": 0.92, "learning_rate": 3.7819522386185684e-06, "loss": 2.3111, "step": 265030 }, { "epoch": 0.92, "learning_rate": 3.7802083587649147e-06, "loss": 2.3427, "step": 265040 }, { "epoch": 0.92, "learning_rate": 3.778464478911261e-06, "loss": 2.2758, "step": 265050 }, { "epoch": 0.92, "learning_rate": 3.776720599057607e-06, "loss": 2.3577, "step": 265060 }, { "epoch": 0.92, "learning_rate": 3.7749767192039543e-06, "loss": 2.3736, "step": 265070 }, { "epoch": 0.92, "learning_rate": 3.7732328393503006e-06, "loss": 2.3013, "step": 265080 }, { "epoch": 0.92, "learning_rate": 3.771488959496647e-06, "loss": 2.3529, "step": 265090 }, { "epoch": 0.92, "learning_rate": 3.769745079642993e-06, "loss": 2.362, "step": 265100 }, { "epoch": 0.92, "learning_rate": 3.7680011997893394e-06, "loss": 2.2488, "step": 265110 }, { "epoch": 0.92, "learning_rate": 3.7662573199356857e-06, "loss": 2.2634, "step": 265120 }, { "epoch": 0.92, "learning_rate": 3.764513440082032e-06, "loss": 2.4154, "step": 265130 }, { "epoch": 0.92, "learning_rate": 3.762769560228379e-06, "loss": 2.3629, "step": 265140 }, { "epoch": 0.92, "learning_rate": 3.7610256803747253e-06, "loss": 2.4116, "step": 265150 }, { "epoch": 0.92, "learning_rate": 3.7592818005210716e-06, "loss": 2.2957, "step": 265160 }, { "epoch": 0.92, "learning_rate": 3.757537920667418e-06, "loss": 2.3014, "step": 265170 }, { "epoch": 0.92, "learning_rate": 3.755794040813764e-06, "loss": 2.3475, "step": 265180 }, { "epoch": 0.92, "learning_rate": 3.7540501609601104e-06, "loss": 2.39, "step": 265190 }, { "epoch": 0.92, "learning_rate": 3.7523062811064567e-06, "loss": 2.3508, "step": 265200 }, { "epoch": 0.92, "learning_rate": 3.7505624012528038e-06, "loss": 2.2954, "step": 265210 }, { "epoch": 0.93, "learning_rate": 3.74881852139915e-06, "loss": 2.302, "step": 265220 }, { "epoch": 0.93, "learning_rate": 3.7470746415454963e-06, "loss": 2.3256, "step": 265230 }, { "epoch": 0.93, "learning_rate": 3.7453307616918426e-06, "loss": 2.3226, "step": 265240 }, { "epoch": 0.93, "learning_rate": 3.743586881838189e-06, "loss": 2.292, "step": 265250 }, { "epoch": 0.93, "learning_rate": 3.741843001984535e-06, "loss": 2.3923, "step": 265260 }, { "epoch": 0.93, "learning_rate": 3.7400991221308822e-06, "loss": 2.2258, "step": 265270 }, { "epoch": 0.93, "learning_rate": 3.7383552422772285e-06, "loss": 2.3653, "step": 265280 }, { "epoch": 0.93, "learning_rate": 3.7366113624235748e-06, "loss": 2.2834, "step": 265290 }, { "epoch": 0.93, "learning_rate": 3.734867482569921e-06, "loss": 2.2833, "step": 265300 }, { "epoch": 0.93, "learning_rate": 3.7331236027162673e-06, "loss": 2.2791, "step": 265310 }, { "epoch": 0.93, "learning_rate": 3.7313797228626136e-06, "loss": 2.3695, "step": 265320 }, { "epoch": 0.93, "learning_rate": 3.72963584300896e-06, "loss": 2.3274, "step": 265330 }, { "epoch": 0.93, "learning_rate": 3.727891963155307e-06, "loss": 2.3903, "step": 265340 }, { "epoch": 0.93, "learning_rate": 3.7261480833016532e-06, "loss": 2.3072, "step": 265350 }, { "epoch": 0.93, "learning_rate": 3.7244042034479995e-06, "loss": 2.322, "step": 265360 }, { "epoch": 0.93, "learning_rate": 3.7226603235943458e-06, "loss": 2.3224, "step": 265370 }, { "epoch": 0.93, "learning_rate": 3.720916443740692e-06, "loss": 2.371, "step": 265380 }, { "epoch": 0.93, "learning_rate": 3.7191725638870383e-06, "loss": 2.3756, "step": 265390 }, { "epoch": 0.93, "learning_rate": 3.7174286840333846e-06, "loss": 2.3078, "step": 265400 }, { "epoch": 0.93, "learning_rate": 3.7156848041797317e-06, "loss": 2.3213, "step": 265410 }, { "epoch": 0.93, "learning_rate": 3.713940924326078e-06, "loss": 2.3089, "step": 265420 }, { "epoch": 0.93, "learning_rate": 3.7121970444724242e-06, "loss": 2.2647, "step": 265430 }, { "epoch": 0.93, "learning_rate": 3.7104531646187705e-06, "loss": 2.3231, "step": 265440 }, { "epoch": 0.93, "learning_rate": 3.7087092847651168e-06, "loss": 2.3257, "step": 265450 }, { "epoch": 0.93, "learning_rate": 3.706965404911463e-06, "loss": 2.2734, "step": 265460 }, { "epoch": 0.93, "learning_rate": 3.70522152505781e-06, "loss": 2.3316, "step": 265470 }, { "epoch": 0.93, "learning_rate": 3.7034776452041564e-06, "loss": 2.3, "step": 265480 }, { "epoch": 0.93, "learning_rate": 3.7017337653505027e-06, "loss": 2.4456, "step": 265490 }, { "epoch": 0.93, "learning_rate": 3.699989885496849e-06, "loss": 2.335, "step": 265500 }, { "epoch": 0.93, "learning_rate": 3.6982460056431952e-06, "loss": 2.3089, "step": 265510 }, { "epoch": 0.93, "learning_rate": 3.6965021257895415e-06, "loss": 2.3952, "step": 265520 }, { "epoch": 0.93, "learning_rate": 3.6947582459358878e-06, "loss": 2.253, "step": 265530 }, { "epoch": 0.93, "learning_rate": 3.693014366082235e-06, "loss": 2.4005, "step": 265540 }, { "epoch": 0.93, "learning_rate": 3.691270486228581e-06, "loss": 2.3434, "step": 265550 }, { "epoch": 0.93, "learning_rate": 3.6895266063749274e-06, "loss": 2.3186, "step": 265560 }, { "epoch": 0.93, "learning_rate": 3.6877827265212737e-06, "loss": 2.3589, "step": 265570 }, { "epoch": 0.93, "learning_rate": 3.68603884666762e-06, "loss": 2.4055, "step": 265580 }, { "epoch": 0.93, "learning_rate": 3.6842949668139662e-06, "loss": 2.3037, "step": 265590 }, { "epoch": 0.93, "learning_rate": 3.6825510869603125e-06, "loss": 2.3587, "step": 265600 }, { "epoch": 0.93, "learning_rate": 3.6808072071066596e-06, "loss": 2.343, "step": 265610 }, { "epoch": 0.93, "learning_rate": 3.679063327253006e-06, "loss": 2.3881, "step": 265620 }, { "epoch": 0.93, "learning_rate": 3.677319447399352e-06, "loss": 2.3408, "step": 265630 }, { "epoch": 0.93, "learning_rate": 3.6755755675456984e-06, "loss": 2.3956, "step": 265640 }, { "epoch": 0.93, "learning_rate": 3.6738316876920447e-06, "loss": 2.3293, "step": 265650 }, { "epoch": 0.93, "learning_rate": 3.672087807838391e-06, "loss": 2.2661, "step": 265660 }, { "epoch": 0.93, "learning_rate": 3.670343927984738e-06, "loss": 2.3063, "step": 265670 }, { "epoch": 0.93, "learning_rate": 3.6686000481310844e-06, "loss": 2.3874, "step": 265680 }, { "epoch": 0.93, "learning_rate": 3.6668561682774306e-06, "loss": 2.3332, "step": 265690 }, { "epoch": 0.93, "learning_rate": 3.665112288423777e-06, "loss": 2.2872, "step": 265700 }, { "epoch": 0.93, "learning_rate": 3.663368408570123e-06, "loss": 2.3892, "step": 265710 }, { "epoch": 0.93, "learning_rate": 3.6616245287164694e-06, "loss": 2.2746, "step": 265720 }, { "epoch": 0.93, "learning_rate": 3.6598806488628157e-06, "loss": 2.3146, "step": 265730 }, { "epoch": 0.93, "learning_rate": 3.658136769009163e-06, "loss": 2.3466, "step": 265740 }, { "epoch": 0.93, "learning_rate": 3.656392889155509e-06, "loss": 2.3252, "step": 265750 }, { "epoch": 0.93, "learning_rate": 3.6546490093018554e-06, "loss": 2.3822, "step": 265760 }, { "epoch": 0.93, "learning_rate": 3.6529051294482016e-06, "loss": 2.3106, "step": 265770 }, { "epoch": 0.93, "learning_rate": 3.651161249594548e-06, "loss": 2.2679, "step": 265780 }, { "epoch": 0.93, "learning_rate": 3.649417369740894e-06, "loss": 2.2942, "step": 265790 }, { "epoch": 0.93, "learning_rate": 3.6476734898872404e-06, "loss": 2.3782, "step": 265800 }, { "epoch": 0.93, "learning_rate": 3.6459296100335876e-06, "loss": 2.3444, "step": 265810 }, { "epoch": 0.93, "learning_rate": 3.644185730179934e-06, "loss": 2.3393, "step": 265820 }, { "epoch": 0.93, "learning_rate": 3.64244185032628e-06, "loss": 2.3585, "step": 265830 }, { "epoch": 0.93, "learning_rate": 3.6406979704726264e-06, "loss": 2.4124, "step": 265840 }, { "epoch": 0.93, "learning_rate": 3.6389540906189726e-06, "loss": 2.3652, "step": 265850 }, { "epoch": 0.93, "learning_rate": 3.637210210765319e-06, "loss": 2.276, "step": 265860 }, { "epoch": 0.93, "learning_rate": 3.635466330911666e-06, "loss": 2.2848, "step": 265870 }, { "epoch": 0.93, "learning_rate": 3.6337224510580123e-06, "loss": 2.3276, "step": 265880 }, { "epoch": 0.93, "learning_rate": 3.6319785712043586e-06, "loss": 2.2898, "step": 265890 }, { "epoch": 0.93, "learning_rate": 3.630234691350705e-06, "loss": 2.281, "step": 265900 }, { "epoch": 0.93, "learning_rate": 3.628490811497051e-06, "loss": 2.3182, "step": 265910 }, { "epoch": 0.93, "learning_rate": 3.6267469316433974e-06, "loss": 2.3461, "step": 265920 }, { "epoch": 0.93, "learning_rate": 3.6250030517897436e-06, "loss": 2.3638, "step": 265930 }, { "epoch": 0.93, "learning_rate": 3.6232591719360907e-06, "loss": 2.2368, "step": 265940 }, { "epoch": 0.93, "learning_rate": 3.621515292082437e-06, "loss": 2.3, "step": 265950 }, { "epoch": 0.93, "learning_rate": 3.6197714122287833e-06, "loss": 2.3248, "step": 265960 }, { "epoch": 0.93, "learning_rate": 3.6180275323751296e-06, "loss": 2.3465, "step": 265970 }, { "epoch": 0.93, "learning_rate": 3.616283652521476e-06, "loss": 2.3111, "step": 265980 }, { "epoch": 0.93, "learning_rate": 3.614539772667822e-06, "loss": 2.4125, "step": 265990 }, { "epoch": 0.93, "learning_rate": 3.6127958928141692e-06, "loss": 2.1898, "step": 266000 }, { "epoch": 0.93, "learning_rate": 3.6110520129605155e-06, "loss": 2.3098, "step": 266010 }, { "epoch": 0.93, "learning_rate": 3.6093081331068618e-06, "loss": 2.2912, "step": 266020 }, { "epoch": 0.93, "learning_rate": 3.607564253253208e-06, "loss": 2.4039, "step": 266030 }, { "epoch": 0.93, "learning_rate": 3.6058203733995543e-06, "loss": 2.4078, "step": 266040 }, { "epoch": 0.93, "learning_rate": 3.6040764935459006e-06, "loss": 2.2981, "step": 266050 }, { "epoch": 0.93, "learning_rate": 3.602332613692247e-06, "loss": 2.3001, "step": 266060 }, { "epoch": 0.93, "learning_rate": 3.600588733838594e-06, "loss": 2.3784, "step": 266070 }, { "epoch": 0.93, "learning_rate": 3.5988448539849402e-06, "loss": 2.3399, "step": 266080 }, { "epoch": 0.93, "learning_rate": 3.5971009741312865e-06, "loss": 2.3308, "step": 266090 }, { "epoch": 0.93, "learning_rate": 3.5953570942776328e-06, "loss": 2.3592, "step": 266100 }, { "epoch": 0.93, "learning_rate": 3.593613214423979e-06, "loss": 2.3796, "step": 266110 }, { "epoch": 0.93, "learning_rate": 3.5918693345703253e-06, "loss": 2.3688, "step": 266120 }, { "epoch": 0.93, "learning_rate": 3.5901254547166716e-06, "loss": 2.3245, "step": 266130 }, { "epoch": 0.93, "learning_rate": 3.5883815748630187e-06, "loss": 2.2686, "step": 266140 }, { "epoch": 0.93, "learning_rate": 3.586637695009365e-06, "loss": 2.3073, "step": 266150 }, { "epoch": 0.93, "learning_rate": 3.5848938151557112e-06, "loss": 2.2903, "step": 266160 }, { "epoch": 0.93, "learning_rate": 3.5831499353020575e-06, "loss": 2.2968, "step": 266170 }, { "epoch": 0.93, "learning_rate": 3.5814060554484038e-06, "loss": 2.3731, "step": 266180 }, { "epoch": 0.93, "learning_rate": 3.57966217559475e-06, "loss": 2.4027, "step": 266190 }, { "epoch": 0.93, "learning_rate": 3.577918295741097e-06, "loss": 2.2898, "step": 266200 }, { "epoch": 0.93, "learning_rate": 3.5761744158874434e-06, "loss": 2.3542, "step": 266210 }, { "epoch": 0.93, "learning_rate": 3.5744305360337897e-06, "loss": 2.3173, "step": 266220 }, { "epoch": 0.93, "learning_rate": 3.572686656180136e-06, "loss": 2.3923, "step": 266230 }, { "epoch": 0.93, "learning_rate": 3.5709427763264822e-06, "loss": 2.3336, "step": 266240 }, { "epoch": 0.93, "learning_rate": 3.5691988964728285e-06, "loss": 2.3609, "step": 266250 }, { "epoch": 0.93, "learning_rate": 3.5674550166191748e-06, "loss": 2.3022, "step": 266260 }, { "epoch": 0.93, "learning_rate": 3.565711136765522e-06, "loss": 2.4148, "step": 266270 }, { "epoch": 0.93, "learning_rate": 3.563967256911868e-06, "loss": 2.3909, "step": 266280 }, { "epoch": 0.93, "learning_rate": 3.5622233770582144e-06, "loss": 2.2906, "step": 266290 }, { "epoch": 0.93, "learning_rate": 3.5604794972045607e-06, "loss": 2.2873, "step": 266300 }, { "epoch": 0.93, "learning_rate": 3.558735617350907e-06, "loss": 2.3069, "step": 266310 }, { "epoch": 0.93, "learning_rate": 3.5569917374972532e-06, "loss": 2.3801, "step": 266320 }, { "epoch": 0.93, "learning_rate": 3.5552478576435995e-06, "loss": 2.3356, "step": 266330 }, { "epoch": 0.93, "learning_rate": 3.5535039777899466e-06, "loss": 2.3705, "step": 266340 }, { "epoch": 0.93, "learning_rate": 3.551760097936293e-06, "loss": 2.249, "step": 266350 }, { "epoch": 0.93, "learning_rate": 3.550016218082639e-06, "loss": 2.353, "step": 266360 }, { "epoch": 0.93, "learning_rate": 3.5482723382289854e-06, "loss": 2.319, "step": 266370 }, { "epoch": 0.93, "learning_rate": 3.5465284583753317e-06, "loss": 2.3714, "step": 266380 }, { "epoch": 0.93, "learning_rate": 3.544784578521678e-06, "loss": 2.2841, "step": 266390 }, { "epoch": 0.93, "learning_rate": 3.543040698668025e-06, "loss": 2.2804, "step": 266400 }, { "epoch": 0.93, "learning_rate": 3.5412968188143713e-06, "loss": 2.3125, "step": 266410 }, { "epoch": 0.93, "learning_rate": 3.5395529389607176e-06, "loss": 2.4291, "step": 266420 }, { "epoch": 0.93, "learning_rate": 3.537809059107064e-06, "loss": 2.3824, "step": 266430 }, { "epoch": 0.93, "learning_rate": 3.53606517925341e-06, "loss": 2.3229, "step": 266440 }, { "epoch": 0.93, "learning_rate": 3.5343212993997564e-06, "loss": 2.4473, "step": 266450 }, { "epoch": 0.93, "learning_rate": 3.5325774195461027e-06, "loss": 2.2893, "step": 266460 }, { "epoch": 0.93, "learning_rate": 3.53083353969245e-06, "loss": 2.383, "step": 266470 }, { "epoch": 0.93, "learning_rate": 3.529089659838796e-06, "loss": 2.299, "step": 266480 }, { "epoch": 0.93, "learning_rate": 3.5273457799851423e-06, "loss": 2.3111, "step": 266490 }, { "epoch": 0.93, "learning_rate": 3.5256019001314886e-06, "loss": 2.2211, "step": 266500 }, { "epoch": 0.93, "learning_rate": 3.523858020277835e-06, "loss": 2.3219, "step": 266510 }, { "epoch": 0.93, "learning_rate": 3.522114140424181e-06, "loss": 2.3303, "step": 266520 }, { "epoch": 0.93, "learning_rate": 3.5203702605705274e-06, "loss": 2.3204, "step": 266530 }, { "epoch": 0.93, "learning_rate": 3.5186263807168745e-06, "loss": 2.3362, "step": 266540 }, { "epoch": 0.93, "learning_rate": 3.516882500863221e-06, "loss": 2.3666, "step": 266550 }, { "epoch": 0.93, "learning_rate": 3.515138621009567e-06, "loss": 2.3897, "step": 266560 }, { "epoch": 0.93, "learning_rate": 3.5133947411559133e-06, "loss": 2.3146, "step": 266570 }, { "epoch": 0.93, "learning_rate": 3.5116508613022596e-06, "loss": 2.363, "step": 266580 }, { "epoch": 0.93, "learning_rate": 3.509906981448606e-06, "loss": 2.3554, "step": 266590 }, { "epoch": 0.93, "learning_rate": 3.508163101594953e-06, "loss": 2.3614, "step": 266600 }, { "epoch": 0.93, "learning_rate": 3.5064192217412993e-06, "loss": 2.3096, "step": 266610 }, { "epoch": 0.93, "learning_rate": 3.5046753418876455e-06, "loss": 2.345, "step": 266620 }, { "epoch": 0.93, "learning_rate": 3.502931462033992e-06, "loss": 2.3429, "step": 266630 }, { "epoch": 0.93, "learning_rate": 3.501187582180338e-06, "loss": 2.3769, "step": 266640 }, { "epoch": 0.93, "learning_rate": 3.4994437023266843e-06, "loss": 2.3159, "step": 266650 }, { "epoch": 0.93, "learning_rate": 3.4976998224730306e-06, "loss": 2.3686, "step": 266660 }, { "epoch": 0.93, "learning_rate": 3.4959559426193777e-06, "loss": 2.3115, "step": 266670 }, { "epoch": 0.93, "learning_rate": 3.494212062765724e-06, "loss": 2.4107, "step": 266680 }, { "epoch": 0.93, "learning_rate": 3.4924681829120703e-06, "loss": 2.4326, "step": 266690 }, { "epoch": 0.93, "learning_rate": 3.4907243030584165e-06, "loss": 2.2815, "step": 266700 }, { "epoch": 0.93, "learning_rate": 3.488980423204763e-06, "loss": 2.3355, "step": 266710 }, { "epoch": 0.93, "learning_rate": 3.487236543351109e-06, "loss": 2.263, "step": 266720 }, { "epoch": 0.93, "learning_rate": 3.4854926634974553e-06, "loss": 2.2563, "step": 266730 }, { "epoch": 0.93, "learning_rate": 3.4837487836438025e-06, "loss": 2.3375, "step": 266740 }, { "epoch": 0.93, "learning_rate": 3.4820049037901487e-06, "loss": 2.3437, "step": 266750 }, { "epoch": 0.93, "learning_rate": 3.480261023936495e-06, "loss": 2.3592, "step": 266760 }, { "epoch": 0.93, "learning_rate": 3.4785171440828413e-06, "loss": 2.3706, "step": 266770 }, { "epoch": 0.93, "learning_rate": 3.4767732642291875e-06, "loss": 2.2843, "step": 266780 }, { "epoch": 0.93, "learning_rate": 3.475029384375534e-06, "loss": 2.3018, "step": 266790 }, { "epoch": 0.93, "learning_rate": 3.473285504521881e-06, "loss": 2.3706, "step": 266800 }, { "epoch": 0.93, "learning_rate": 3.471541624668227e-06, "loss": 2.3475, "step": 266810 }, { "epoch": 0.93, "learning_rate": 3.4697977448145735e-06, "loss": 2.3033, "step": 266820 }, { "epoch": 0.93, "learning_rate": 3.4680538649609197e-06, "loss": 2.3763, "step": 266830 }, { "epoch": 0.93, "learning_rate": 3.466309985107266e-06, "loss": 2.3745, "step": 266840 }, { "epoch": 0.93, "learning_rate": 3.4645661052536123e-06, "loss": 2.3273, "step": 266850 }, { "epoch": 0.93, "learning_rate": 3.4628222253999585e-06, "loss": 2.3591, "step": 266860 }, { "epoch": 0.93, "learning_rate": 3.4610783455463057e-06, "loss": 2.2275, "step": 266870 }, { "epoch": 0.93, "learning_rate": 3.459334465692652e-06, "loss": 2.3162, "step": 266880 }, { "epoch": 0.93, "learning_rate": 3.457590585838998e-06, "loss": 2.2853, "step": 266890 }, { "epoch": 0.93, "learning_rate": 3.4558467059853445e-06, "loss": 2.3643, "step": 266900 }, { "epoch": 0.93, "learning_rate": 3.4541028261316907e-06, "loss": 2.3028, "step": 266910 }, { "epoch": 0.93, "learning_rate": 3.452358946278037e-06, "loss": 2.3613, "step": 266920 }, { "epoch": 0.93, "learning_rate": 3.4506150664243833e-06, "loss": 2.2521, "step": 266930 }, { "epoch": 0.93, "learning_rate": 3.4488711865707304e-06, "loss": 2.3243, "step": 266940 }, { "epoch": 0.93, "learning_rate": 3.4471273067170767e-06, "loss": 2.3382, "step": 266950 }, { "epoch": 0.93, "learning_rate": 3.445383426863423e-06, "loss": 2.3688, "step": 266960 }, { "epoch": 0.93, "learning_rate": 3.443639547009769e-06, "loss": 2.2794, "step": 266970 }, { "epoch": 0.93, "learning_rate": 3.4418956671561155e-06, "loss": 2.3549, "step": 266980 }, { "epoch": 0.93, "learning_rate": 3.4401517873024617e-06, "loss": 2.4083, "step": 266990 }, { "epoch": 0.93, "learning_rate": 3.438407907448809e-06, "loss": 2.3066, "step": 267000 }, { "epoch": 0.93, "learning_rate": 3.436664027595155e-06, "loss": 2.2904, "step": 267010 }, { "epoch": 0.93, "learning_rate": 3.4349201477415014e-06, "loss": 2.3522, "step": 267020 }, { "epoch": 0.93, "learning_rate": 3.4331762678878477e-06, "loss": 2.344, "step": 267030 }, { "epoch": 0.93, "learning_rate": 3.431432388034194e-06, "loss": 2.3757, "step": 267040 }, { "epoch": 0.93, "learning_rate": 3.42968850818054e-06, "loss": 2.3024, "step": 267050 }, { "epoch": 0.93, "learning_rate": 3.4279446283268865e-06, "loss": 2.3597, "step": 267060 }, { "epoch": 0.93, "learning_rate": 3.4262007484732336e-06, "loss": 2.3522, "step": 267070 }, { "epoch": 0.93, "learning_rate": 3.42445686861958e-06, "loss": 2.4137, "step": 267080 }, { "epoch": 0.93, "learning_rate": 3.422712988765926e-06, "loss": 2.3719, "step": 267090 }, { "epoch": 0.93, "learning_rate": 3.4209691089122724e-06, "loss": 2.3035, "step": 267100 }, { "epoch": 0.93, "learning_rate": 3.4192252290586187e-06, "loss": 2.3632, "step": 267110 }, { "epoch": 0.93, "learning_rate": 3.417481349204965e-06, "loss": 2.3134, "step": 267120 }, { "epoch": 0.93, "learning_rate": 3.415737469351311e-06, "loss": 2.335, "step": 267130 }, { "epoch": 0.93, "learning_rate": 3.4139935894976583e-06, "loss": 2.3303, "step": 267140 }, { "epoch": 0.93, "learning_rate": 3.4122497096440046e-06, "loss": 2.318, "step": 267150 }, { "epoch": 0.93, "learning_rate": 3.410505829790351e-06, "loss": 2.2738, "step": 267160 }, { "epoch": 0.93, "learning_rate": 3.408761949936697e-06, "loss": 2.3255, "step": 267170 }, { "epoch": 0.93, "learning_rate": 3.4070180700830434e-06, "loss": 2.322, "step": 267180 }, { "epoch": 0.93, "learning_rate": 3.4052741902293897e-06, "loss": 2.358, "step": 267190 }, { "epoch": 0.93, "learning_rate": 3.4035303103757368e-06, "loss": 2.2675, "step": 267200 }, { "epoch": 0.93, "learning_rate": 3.401786430522083e-06, "loss": 2.226, "step": 267210 }, { "epoch": 0.93, "learning_rate": 3.4000425506684293e-06, "loss": 2.2367, "step": 267220 }, { "epoch": 0.93, "learning_rate": 3.3982986708147756e-06, "loss": 2.3331, "step": 267230 }, { "epoch": 0.93, "learning_rate": 3.396554790961122e-06, "loss": 2.2976, "step": 267240 }, { "epoch": 0.93, "learning_rate": 3.394810911107468e-06, "loss": 2.3992, "step": 267250 }, { "epoch": 0.93, "learning_rate": 3.3930670312538144e-06, "loss": 2.3074, "step": 267260 }, { "epoch": 0.93, "learning_rate": 3.3913231514001615e-06, "loss": 2.3595, "step": 267270 }, { "epoch": 0.93, "learning_rate": 3.3895792715465078e-06, "loss": 2.311, "step": 267280 }, { "epoch": 0.93, "learning_rate": 3.387835391692854e-06, "loss": 2.3818, "step": 267290 }, { "epoch": 0.93, "learning_rate": 3.3860915118392003e-06, "loss": 2.289, "step": 267300 }, { "epoch": 0.93, "learning_rate": 3.3843476319855466e-06, "loss": 2.3316, "step": 267310 }, { "epoch": 0.93, "learning_rate": 3.382603752131893e-06, "loss": 2.2752, "step": 267320 }, { "epoch": 0.93, "learning_rate": 3.38085987227824e-06, "loss": 2.2869, "step": 267330 }, { "epoch": 0.93, "learning_rate": 3.3791159924245862e-06, "loss": 2.3024, "step": 267340 }, { "epoch": 0.93, "learning_rate": 3.3773721125709325e-06, "loss": 2.3786, "step": 267350 }, { "epoch": 0.93, "learning_rate": 3.3756282327172788e-06, "loss": 2.2741, "step": 267360 }, { "epoch": 0.93, "learning_rate": 3.373884352863625e-06, "loss": 2.3737, "step": 267370 }, { "epoch": 0.93, "learning_rate": 3.3721404730099713e-06, "loss": 2.3043, "step": 267380 }, { "epoch": 0.93, "learning_rate": 3.3703965931563176e-06, "loss": 2.3322, "step": 267390 }, { "epoch": 0.93, "learning_rate": 3.3686527133026647e-06, "loss": 2.3883, "step": 267400 }, { "epoch": 0.93, "learning_rate": 3.366908833449011e-06, "loss": 2.3329, "step": 267410 }, { "epoch": 0.93, "learning_rate": 3.3651649535953572e-06, "loss": 2.3555, "step": 267420 }, { "epoch": 0.93, "learning_rate": 3.3634210737417035e-06, "loss": 2.356, "step": 267430 }, { "epoch": 0.93, "learning_rate": 3.3616771938880498e-06, "loss": 2.3098, "step": 267440 }, { "epoch": 0.93, "learning_rate": 3.359933314034396e-06, "loss": 2.2992, "step": 267450 }, { "epoch": 0.93, "learning_rate": 3.3581894341807427e-06, "loss": 2.3365, "step": 267460 }, { "epoch": 0.93, "learning_rate": 3.3564455543270894e-06, "loss": 2.345, "step": 267470 }, { "epoch": 0.93, "learning_rate": 3.3547016744734357e-06, "loss": 2.3076, "step": 267480 }, { "epoch": 0.93, "learning_rate": 3.352957794619782e-06, "loss": 2.3383, "step": 267490 }, { "epoch": 0.93, "learning_rate": 3.3512139147661282e-06, "loss": 2.3646, "step": 267500 }, { "epoch": 0.93, "learning_rate": 3.3494700349124745e-06, "loss": 2.3481, "step": 267510 }, { "epoch": 0.93, "learning_rate": 3.3477261550588208e-06, "loss": 2.3944, "step": 267520 }, { "epoch": 0.93, "learning_rate": 3.345982275205168e-06, "loss": 2.3985, "step": 267530 }, { "epoch": 0.93, "learning_rate": 3.344238395351514e-06, "loss": 2.2963, "step": 267540 }, { "epoch": 0.93, "learning_rate": 3.3424945154978604e-06, "loss": 2.2761, "step": 267550 }, { "epoch": 0.93, "learning_rate": 3.3407506356442067e-06, "loss": 2.2863, "step": 267560 }, { "epoch": 0.93, "learning_rate": 3.339006755790553e-06, "loss": 2.2918, "step": 267570 }, { "epoch": 0.93, "learning_rate": 3.3372628759368992e-06, "loss": 2.3587, "step": 267580 }, { "epoch": 0.93, "learning_rate": 3.335518996083246e-06, "loss": 2.3693, "step": 267590 }, { "epoch": 0.93, "learning_rate": 3.3337751162295926e-06, "loss": 2.3696, "step": 267600 }, { "epoch": 0.93, "learning_rate": 3.332031236375939e-06, "loss": 2.3348, "step": 267610 }, { "epoch": 0.93, "learning_rate": 3.330287356522285e-06, "loss": 2.2981, "step": 267620 }, { "epoch": 0.93, "learning_rate": 3.3285434766686314e-06, "loss": 2.3229, "step": 267630 }, { "epoch": 0.93, "learning_rate": 3.3267995968149777e-06, "loss": 2.2666, "step": 267640 }, { "epoch": 0.93, "learning_rate": 3.325055716961324e-06, "loss": 2.3446, "step": 267650 }, { "epoch": 0.93, "learning_rate": 3.3233118371076707e-06, "loss": 2.3567, "step": 267660 }, { "epoch": 0.93, "learning_rate": 3.3215679572540174e-06, "loss": 2.3447, "step": 267670 }, { "epoch": 0.93, "learning_rate": 3.3198240774003636e-06, "loss": 2.2937, "step": 267680 }, { "epoch": 0.93, "learning_rate": 3.31808019754671e-06, "loss": 2.3696, "step": 267690 }, { "epoch": 0.93, "learning_rate": 3.316336317693056e-06, "loss": 2.2323, "step": 267700 }, { "epoch": 0.93, "learning_rate": 3.3145924378394024e-06, "loss": 2.3762, "step": 267710 }, { "epoch": 0.93, "learning_rate": 3.312848557985749e-06, "loss": 2.346, "step": 267720 }, { "epoch": 0.93, "learning_rate": 3.311104678132096e-06, "loss": 2.3333, "step": 267730 }, { "epoch": 0.93, "learning_rate": 3.309360798278442e-06, "loss": 2.3027, "step": 267740 }, { "epoch": 0.93, "learning_rate": 3.3076169184247884e-06, "loss": 2.2835, "step": 267750 }, { "epoch": 0.93, "learning_rate": 3.3058730385711346e-06, "loss": 2.3054, "step": 267760 }, { "epoch": 0.93, "learning_rate": 3.304129158717481e-06, "loss": 2.3485, "step": 267770 }, { "epoch": 0.93, "learning_rate": 3.302385278863827e-06, "loss": 2.2954, "step": 267780 }, { "epoch": 0.93, "learning_rate": 3.300641399010174e-06, "loss": 2.3449, "step": 267790 }, { "epoch": 0.93, "learning_rate": 3.2988975191565206e-06, "loss": 2.3644, "step": 267800 }, { "epoch": 0.93, "learning_rate": 3.297153639302867e-06, "loss": 2.3879, "step": 267810 }, { "epoch": 0.93, "learning_rate": 3.295409759449213e-06, "loss": 2.3376, "step": 267820 }, { "epoch": 0.93, "learning_rate": 3.2936658795955594e-06, "loss": 2.3645, "step": 267830 }, { "epoch": 0.93, "learning_rate": 3.2919219997419056e-06, "loss": 2.3407, "step": 267840 }, { "epoch": 0.93, "learning_rate": 3.2901781198882523e-06, "loss": 2.3452, "step": 267850 }, { "epoch": 0.93, "learning_rate": 3.2884342400345986e-06, "loss": 2.3048, "step": 267860 }, { "epoch": 0.93, "learning_rate": 3.2866903601809453e-06, "loss": 2.4246, "step": 267870 }, { "epoch": 0.93, "learning_rate": 3.2849464803272916e-06, "loss": 2.2928, "step": 267880 }, { "epoch": 0.93, "learning_rate": 3.283202600473638e-06, "loss": 2.3369, "step": 267890 }, { "epoch": 0.93, "learning_rate": 3.281458720619984e-06, "loss": 2.3034, "step": 267900 }, { "epoch": 0.93, "learning_rate": 3.2797148407663304e-06, "loss": 2.3432, "step": 267910 }, { "epoch": 0.93, "learning_rate": 3.277970960912677e-06, "loss": 2.3047, "step": 267920 }, { "epoch": 0.93, "learning_rate": 3.2762270810590237e-06, "loss": 2.2404, "step": 267930 }, { "epoch": 0.93, "learning_rate": 3.27448320120537e-06, "loss": 2.2812, "step": 267940 }, { "epoch": 0.93, "learning_rate": 3.2727393213517163e-06, "loss": 2.3261, "step": 267950 }, { "epoch": 0.93, "learning_rate": 3.2709954414980626e-06, "loss": 2.376, "step": 267960 }, { "epoch": 0.93, "learning_rate": 3.269251561644409e-06, "loss": 2.2771, "step": 267970 }, { "epoch": 0.93, "learning_rate": 3.2675076817907555e-06, "loss": 2.3382, "step": 267980 }, { "epoch": 0.93, "learning_rate": 3.2657638019371018e-06, "loss": 2.3275, "step": 267990 }, { "epoch": 0.93, "learning_rate": 3.2640199220834485e-06, "loss": 2.3548, "step": 268000 }, { "epoch": 0.93, "learning_rate": 3.2622760422297947e-06, "loss": 2.3071, "step": 268010 }, { "epoch": 0.93, "learning_rate": 3.260532162376141e-06, "loss": 2.4043, "step": 268020 }, { "epoch": 0.93, "learning_rate": 3.2587882825224873e-06, "loss": 2.3464, "step": 268030 }, { "epoch": 0.93, "learning_rate": 3.2570444026688336e-06, "loss": 2.3215, "step": 268040 }, { "epoch": 0.93, "learning_rate": 3.2553005228151802e-06, "loss": 2.3359, "step": 268050 }, { "epoch": 0.93, "learning_rate": 3.2535566429615265e-06, "loss": 2.3352, "step": 268060 }, { "epoch": 0.93, "learning_rate": 3.251812763107873e-06, "loss": 2.3163, "step": 268070 }, { "epoch": 0.93, "learning_rate": 3.2500688832542195e-06, "loss": 2.296, "step": 268080 }, { "epoch": 0.94, "learning_rate": 3.2483250034005657e-06, "loss": 2.2871, "step": 268090 }, { "epoch": 0.94, "learning_rate": 3.246581123546912e-06, "loss": 2.4058, "step": 268100 }, { "epoch": 0.94, "learning_rate": 3.2448372436932587e-06, "loss": 2.3273, "step": 268110 }, { "epoch": 0.94, "learning_rate": 3.243093363839605e-06, "loss": 2.3632, "step": 268120 }, { "epoch": 0.94, "learning_rate": 3.2413494839859517e-06, "loss": 2.3912, "step": 268130 }, { "epoch": 0.94, "learning_rate": 3.239605604132298e-06, "loss": 2.3127, "step": 268140 }, { "epoch": 0.94, "learning_rate": 3.237861724278644e-06, "loss": 2.2076, "step": 268150 }, { "epoch": 0.94, "learning_rate": 3.2361178444249905e-06, "loss": 2.3005, "step": 268160 }, { "epoch": 0.94, "learning_rate": 3.2343739645713367e-06, "loss": 2.3812, "step": 268170 }, { "epoch": 0.94, "learning_rate": 3.2326300847176834e-06, "loss": 2.3721, "step": 268180 }, { "epoch": 0.94, "learning_rate": 3.2308862048640297e-06, "loss": 2.3867, "step": 268190 }, { "epoch": 0.94, "learning_rate": 3.2291423250103764e-06, "loss": 2.2818, "step": 268200 }, { "epoch": 0.94, "learning_rate": 3.2273984451567227e-06, "loss": 2.3186, "step": 268210 }, { "epoch": 0.94, "learning_rate": 3.225654565303069e-06, "loss": 2.3183, "step": 268220 }, { "epoch": 0.94, "learning_rate": 3.2239106854494152e-06, "loss": 2.283, "step": 268230 }, { "epoch": 0.94, "learning_rate": 3.222166805595762e-06, "loss": 2.3152, "step": 268240 }, { "epoch": 0.94, "learning_rate": 3.220422925742108e-06, "loss": 2.2902, "step": 268250 }, { "epoch": 0.94, "learning_rate": 3.2186790458884544e-06, "loss": 2.3699, "step": 268260 }, { "epoch": 0.94, "learning_rate": 3.216935166034801e-06, "loss": 2.3356, "step": 268270 }, { "epoch": 0.94, "learning_rate": 3.2151912861811474e-06, "loss": 2.3143, "step": 268280 }, { "epoch": 0.94, "learning_rate": 3.2134474063274937e-06, "loss": 2.3904, "step": 268290 }, { "epoch": 0.94, "learning_rate": 3.21170352647384e-06, "loss": 2.3018, "step": 268300 }, { "epoch": 0.94, "learning_rate": 3.2099596466201866e-06, "loss": 2.3431, "step": 268310 }, { "epoch": 0.94, "learning_rate": 3.208215766766533e-06, "loss": 2.2835, "step": 268320 }, { "epoch": 0.94, "learning_rate": 3.2064718869128796e-06, "loss": 2.3903, "step": 268330 }, { "epoch": 0.94, "learning_rate": 3.204728007059226e-06, "loss": 2.2608, "step": 268340 }, { "epoch": 0.94, "learning_rate": 3.202984127205572e-06, "loss": 2.3174, "step": 268350 }, { "epoch": 0.94, "learning_rate": 3.2012402473519184e-06, "loss": 2.3496, "step": 268360 }, { "epoch": 0.94, "learning_rate": 3.199496367498265e-06, "loss": 2.3752, "step": 268370 }, { "epoch": 0.94, "learning_rate": 3.1977524876446114e-06, "loss": 2.3236, "step": 268380 }, { "epoch": 0.94, "learning_rate": 3.1960086077909576e-06, "loss": 2.3275, "step": 268390 }, { "epoch": 0.94, "learning_rate": 3.1942647279373043e-06, "loss": 2.3365, "step": 268400 }, { "epoch": 0.94, "learning_rate": 3.1925208480836506e-06, "loss": 2.3484, "step": 268410 }, { "epoch": 0.94, "learning_rate": 3.190776968229997e-06, "loss": 2.3008, "step": 268420 }, { "epoch": 0.94, "learning_rate": 3.189033088376343e-06, "loss": 2.3974, "step": 268430 }, { "epoch": 0.94, "learning_rate": 3.18728920852269e-06, "loss": 2.3647, "step": 268440 }, { "epoch": 0.94, "learning_rate": 3.185545328669036e-06, "loss": 2.3493, "step": 268450 }, { "epoch": 0.94, "learning_rate": 3.1838014488153824e-06, "loss": 2.4011, "step": 268460 }, { "epoch": 0.94, "learning_rate": 3.182057568961729e-06, "loss": 2.3831, "step": 268470 }, { "epoch": 0.94, "learning_rate": 3.1803136891080753e-06, "loss": 2.3335, "step": 268480 }, { "epoch": 0.94, "learning_rate": 3.1785698092544216e-06, "loss": 2.3677, "step": 268490 }, { "epoch": 0.94, "learning_rate": 3.1768259294007683e-06, "loss": 2.2806, "step": 268500 }, { "epoch": 0.94, "learning_rate": 3.1750820495471146e-06, "loss": 2.274, "step": 268510 }, { "epoch": 0.94, "learning_rate": 3.173338169693461e-06, "loss": 2.3286, "step": 268520 }, { "epoch": 0.94, "learning_rate": 3.1715942898398075e-06, "loss": 2.3776, "step": 268530 }, { "epoch": 0.94, "learning_rate": 3.169850409986154e-06, "loss": 2.296, "step": 268540 }, { "epoch": 0.94, "learning_rate": 3.1681065301325e-06, "loss": 2.3454, "step": 268550 }, { "epoch": 0.94, "learning_rate": 3.1663626502788463e-06, "loss": 2.3205, "step": 268560 }, { "epoch": 0.94, "learning_rate": 3.164618770425193e-06, "loss": 2.3179, "step": 268570 }, { "epoch": 0.94, "learning_rate": 3.1628748905715393e-06, "loss": 2.2403, "step": 268580 }, { "epoch": 0.94, "learning_rate": 3.1611310107178856e-06, "loss": 2.2327, "step": 268590 }, { "epoch": 0.94, "learning_rate": 3.1593871308642323e-06, "loss": 2.3172, "step": 268600 }, { "epoch": 0.94, "learning_rate": 3.1576432510105785e-06, "loss": 2.3386, "step": 268610 }, { "epoch": 0.94, "learning_rate": 3.155899371156925e-06, "loss": 2.4413, "step": 268620 }, { "epoch": 0.94, "learning_rate": 3.1541554913032715e-06, "loss": 2.3189, "step": 268630 }, { "epoch": 0.94, "learning_rate": 3.1524116114496178e-06, "loss": 2.2961, "step": 268640 }, { "epoch": 0.94, "learning_rate": 3.150667731595964e-06, "loss": 2.4254, "step": 268650 }, { "epoch": 0.94, "learning_rate": 3.1489238517423103e-06, "loss": 2.3424, "step": 268660 }, { "epoch": 0.94, "learning_rate": 3.147179971888657e-06, "loss": 2.34, "step": 268670 }, { "epoch": 0.94, "learning_rate": 3.1454360920350033e-06, "loss": 2.3444, "step": 268680 }, { "epoch": 0.94, "learning_rate": 3.1436922121813495e-06, "loss": 2.4197, "step": 268690 }, { "epoch": 0.94, "learning_rate": 3.1419483323276962e-06, "loss": 2.2884, "step": 268700 }, { "epoch": 0.94, "learning_rate": 3.1402044524740425e-06, "loss": 2.3535, "step": 268710 }, { "epoch": 0.94, "learning_rate": 3.1384605726203888e-06, "loss": 2.2627, "step": 268720 }, { "epoch": 0.94, "learning_rate": 3.1367166927667355e-06, "loss": 2.313, "step": 268730 }, { "epoch": 0.94, "learning_rate": 3.1349728129130817e-06, "loss": 2.2839, "step": 268740 }, { "epoch": 0.94, "learning_rate": 3.133228933059428e-06, "loss": 2.3278, "step": 268750 }, { "epoch": 0.94, "learning_rate": 3.1314850532057747e-06, "loss": 2.3351, "step": 268760 }, { "epoch": 0.94, "learning_rate": 3.129741173352121e-06, "loss": 2.3313, "step": 268770 }, { "epoch": 0.94, "learning_rate": 3.1279972934984672e-06, "loss": 2.328, "step": 268780 }, { "epoch": 0.94, "learning_rate": 3.1262534136448135e-06, "loss": 2.3402, "step": 268790 }, { "epoch": 0.94, "learning_rate": 3.12450953379116e-06, "loss": 2.3378, "step": 268800 }, { "epoch": 0.94, "learning_rate": 3.1227656539375065e-06, "loss": 2.3087, "step": 268810 }, { "epoch": 0.94, "learning_rate": 3.121021774083853e-06, "loss": 2.299, "step": 268820 }, { "epoch": 0.94, "learning_rate": 3.1192778942301994e-06, "loss": 2.3322, "step": 268830 }, { "epoch": 0.94, "learning_rate": 3.1175340143765457e-06, "loss": 2.3527, "step": 268840 }, { "epoch": 0.94, "learning_rate": 3.115790134522892e-06, "loss": 2.3992, "step": 268850 }, { "epoch": 0.94, "learning_rate": 3.1140462546692386e-06, "loss": 2.3188, "step": 268860 }, { "epoch": 0.94, "learning_rate": 3.112302374815585e-06, "loss": 2.2936, "step": 268870 }, { "epoch": 0.94, "learning_rate": 3.110558494961931e-06, "loss": 2.2889, "step": 268880 }, { "epoch": 0.94, "learning_rate": 3.108814615108278e-06, "loss": 2.4106, "step": 268890 }, { "epoch": 0.94, "learning_rate": 3.107070735254624e-06, "loss": 2.4032, "step": 268900 }, { "epoch": 0.94, "learning_rate": 3.1053268554009704e-06, "loss": 2.3112, "step": 268910 }, { "epoch": 0.94, "learning_rate": 3.103582975547317e-06, "loss": 2.2897, "step": 268920 }, { "epoch": 0.94, "learning_rate": 3.1018390956936634e-06, "loss": 2.2743, "step": 268930 }, { "epoch": 0.94, "learning_rate": 3.1000952158400096e-06, "loss": 2.2386, "step": 268940 }, { "epoch": 0.94, "learning_rate": 3.0983513359863563e-06, "loss": 2.3569, "step": 268950 }, { "epoch": 0.94, "learning_rate": 3.0966074561327026e-06, "loss": 2.301, "step": 268960 }, { "epoch": 0.94, "learning_rate": 3.094863576279049e-06, "loss": 2.3022, "step": 268970 }, { "epoch": 0.94, "learning_rate": 3.093119696425395e-06, "loss": 2.2962, "step": 268980 }, { "epoch": 0.94, "learning_rate": 3.091375816571742e-06, "loss": 2.4098, "step": 268990 }, { "epoch": 0.94, "learning_rate": 3.089631936718088e-06, "loss": 2.3266, "step": 269000 }, { "epoch": 0.94, "learning_rate": 3.0878880568644344e-06, "loss": 2.3752, "step": 269010 }, { "epoch": 0.94, "learning_rate": 3.086144177010781e-06, "loss": 2.4, "step": 269020 }, { "epoch": 0.94, "learning_rate": 3.0844002971571273e-06, "loss": 2.3554, "step": 269030 }, { "epoch": 0.94, "learning_rate": 3.0826564173034736e-06, "loss": 2.3156, "step": 269040 }, { "epoch": 0.94, "learning_rate": 3.0809125374498203e-06, "loss": 2.3556, "step": 269050 }, { "epoch": 0.94, "learning_rate": 3.0791686575961666e-06, "loss": 2.2963, "step": 269060 }, { "epoch": 0.94, "learning_rate": 3.077424777742513e-06, "loss": 2.3522, "step": 269070 }, { "epoch": 0.94, "learning_rate": 3.0756808978888595e-06, "loss": 2.2944, "step": 269080 }, { "epoch": 0.94, "learning_rate": 3.073937018035206e-06, "loss": 2.29, "step": 269090 }, { "epoch": 0.94, "learning_rate": 3.072193138181552e-06, "loss": 2.4056, "step": 269100 }, { "epoch": 0.94, "learning_rate": 3.0704492583278983e-06, "loss": 2.3714, "step": 269110 }, { "epoch": 0.94, "learning_rate": 3.068705378474245e-06, "loss": 2.2994, "step": 269120 }, { "epoch": 0.94, "learning_rate": 3.0669614986205913e-06, "loss": 2.436, "step": 269130 }, { "epoch": 0.94, "learning_rate": 3.0652176187669376e-06, "loss": 2.3371, "step": 269140 }, { "epoch": 0.94, "learning_rate": 3.0634737389132843e-06, "loss": 2.3262, "step": 269150 }, { "epoch": 0.94, "learning_rate": 3.0617298590596305e-06, "loss": 2.3707, "step": 269160 }, { "epoch": 0.94, "learning_rate": 3.059985979205977e-06, "loss": 2.28, "step": 269170 }, { "epoch": 0.94, "learning_rate": 3.0582420993523235e-06, "loss": 2.3005, "step": 269180 }, { "epoch": 0.94, "learning_rate": 3.0564982194986698e-06, "loss": 2.3709, "step": 269190 }, { "epoch": 0.94, "learning_rate": 3.054754339645016e-06, "loss": 2.3341, "step": 269200 }, { "epoch": 0.94, "learning_rate": 3.0530104597913627e-06, "loss": 2.3063, "step": 269210 }, { "epoch": 0.94, "learning_rate": 3.051266579937709e-06, "loss": 2.35, "step": 269220 }, { "epoch": 0.94, "learning_rate": 3.0495227000840553e-06, "loss": 2.3585, "step": 269230 }, { "epoch": 0.94, "learning_rate": 3.0477788202304015e-06, "loss": 2.3599, "step": 269240 }, { "epoch": 0.94, "learning_rate": 3.0460349403767482e-06, "loss": 2.275, "step": 269250 }, { "epoch": 0.94, "learning_rate": 3.0442910605230945e-06, "loss": 2.3699, "step": 269260 }, { "epoch": 0.94, "learning_rate": 3.0425471806694408e-06, "loss": 2.257, "step": 269270 }, { "epoch": 0.94, "learning_rate": 3.0408033008157875e-06, "loss": 2.3226, "step": 269280 }, { "epoch": 0.94, "learning_rate": 3.0390594209621337e-06, "loss": 2.3167, "step": 269290 }, { "epoch": 0.94, "learning_rate": 3.03731554110848e-06, "loss": 2.3049, "step": 269300 }, { "epoch": 0.94, "learning_rate": 3.0355716612548267e-06, "loss": 2.3278, "step": 269310 }, { "epoch": 0.94, "learning_rate": 3.033827781401173e-06, "loss": 2.3351, "step": 269320 }, { "epoch": 0.94, "learning_rate": 3.0320839015475192e-06, "loss": 2.3905, "step": 269330 }, { "epoch": 0.94, "learning_rate": 3.0303400216938655e-06, "loss": 2.317, "step": 269340 }, { "epoch": 0.94, "learning_rate": 3.028596141840212e-06, "loss": 2.3319, "step": 269350 }, { "epoch": 0.94, "learning_rate": 3.0268522619865585e-06, "loss": 2.3439, "step": 269360 }, { "epoch": 0.94, "learning_rate": 3.0251083821329047e-06, "loss": 2.3149, "step": 269370 }, { "epoch": 0.94, "learning_rate": 3.0233645022792514e-06, "loss": 2.35, "step": 269380 }, { "epoch": 0.94, "learning_rate": 3.0216206224255977e-06, "loss": 2.3662, "step": 269390 }, { "epoch": 0.94, "learning_rate": 3.019876742571944e-06, "loss": 2.3149, "step": 269400 }, { "epoch": 0.94, "learning_rate": 3.0181328627182907e-06, "loss": 2.2984, "step": 269410 }, { "epoch": 0.94, "learning_rate": 3.016388982864637e-06, "loss": 2.2738, "step": 269420 }, { "epoch": 0.94, "learning_rate": 3.014645103010983e-06, "loss": 2.2756, "step": 269430 }, { "epoch": 0.94, "learning_rate": 3.0129012231573295e-06, "loss": 2.2727, "step": 269440 }, { "epoch": 0.94, "learning_rate": 3.011157343303676e-06, "loss": 2.2752, "step": 269450 }, { "epoch": 0.94, "learning_rate": 3.0094134634500224e-06, "loss": 2.3502, "step": 269460 }, { "epoch": 0.94, "learning_rate": 3.0076695835963687e-06, "loss": 2.3799, "step": 269470 }, { "epoch": 0.94, "learning_rate": 3.0059257037427154e-06, "loss": 2.3095, "step": 269480 }, { "epoch": 0.94, "learning_rate": 3.0041818238890617e-06, "loss": 2.3235, "step": 269490 }, { "epoch": 0.94, "learning_rate": 3.002437944035408e-06, "loss": 2.3587, "step": 269500 }, { "epoch": 0.94, "learning_rate": 3.0006940641817546e-06, "loss": 2.2959, "step": 269510 }, { "epoch": 0.94, "learning_rate": 2.998950184328101e-06, "loss": 2.2488, "step": 269520 }, { "epoch": 0.94, "learning_rate": 2.997206304474447e-06, "loss": 2.4415, "step": 269530 }, { "epoch": 0.94, "learning_rate": 2.9954624246207934e-06, "loss": 2.3114, "step": 269540 }, { "epoch": 0.94, "learning_rate": 2.99371854476714e-06, "loss": 2.3242, "step": 269550 }, { "epoch": 0.94, "learning_rate": 2.9919746649134864e-06, "loss": 2.2573, "step": 269560 }, { "epoch": 0.94, "learning_rate": 2.9902307850598327e-06, "loss": 2.3017, "step": 269570 }, { "epoch": 0.94, "learning_rate": 2.9884869052061794e-06, "loss": 2.3151, "step": 269580 }, { "epoch": 0.94, "learning_rate": 2.9867430253525256e-06, "loss": 2.2936, "step": 269590 }, { "epoch": 0.94, "learning_rate": 2.984999145498872e-06, "loss": 2.2979, "step": 269600 }, { "epoch": 0.94, "learning_rate": 2.9832552656452186e-06, "loss": 2.2841, "step": 269610 }, { "epoch": 0.94, "learning_rate": 2.981511385791565e-06, "loss": 2.3825, "step": 269620 }, { "epoch": 0.94, "learning_rate": 2.979767505937911e-06, "loss": 2.3372, "step": 269630 }, { "epoch": 0.94, "learning_rate": 2.9780236260842574e-06, "loss": 2.4489, "step": 269640 }, { "epoch": 0.94, "learning_rate": 2.976279746230604e-06, "loss": 2.2436, "step": 269650 }, { "epoch": 0.94, "learning_rate": 2.9745358663769504e-06, "loss": 2.2951, "step": 269660 }, { "epoch": 0.94, "learning_rate": 2.9727919865232966e-06, "loss": 2.4182, "step": 269670 }, { "epoch": 0.94, "learning_rate": 2.9710481066696433e-06, "loss": 2.2777, "step": 269680 }, { "epoch": 0.94, "learning_rate": 2.9693042268159896e-06, "loss": 2.3449, "step": 269690 }, { "epoch": 0.94, "learning_rate": 2.967560346962336e-06, "loss": 2.4102, "step": 269700 }, { "epoch": 0.94, "learning_rate": 2.9658164671086825e-06, "loss": 2.2411, "step": 269710 }, { "epoch": 0.94, "learning_rate": 2.964072587255029e-06, "loss": 2.2837, "step": 269720 }, { "epoch": 0.94, "learning_rate": 2.962328707401375e-06, "loss": 2.3396, "step": 269730 }, { "epoch": 0.94, "learning_rate": 2.9605848275477214e-06, "loss": 2.3519, "step": 269740 }, { "epoch": 0.94, "learning_rate": 2.958840947694068e-06, "loss": 2.3368, "step": 269750 }, { "epoch": 0.94, "learning_rate": 2.9570970678404143e-06, "loss": 2.3734, "step": 269760 }, { "epoch": 0.94, "learning_rate": 2.9553531879867606e-06, "loss": 2.3449, "step": 269770 }, { "epoch": 0.94, "learning_rate": 2.9536093081331073e-06, "loss": 2.3784, "step": 269780 }, { "epoch": 0.94, "learning_rate": 2.9518654282794535e-06, "loss": 2.2199, "step": 269790 }, { "epoch": 0.94, "learning_rate": 2.9501215484258e-06, "loss": 2.2989, "step": 269800 }, { "epoch": 0.94, "learning_rate": 2.9483776685721465e-06, "loss": 2.3559, "step": 269810 }, { "epoch": 0.94, "learning_rate": 2.9466337887184928e-06, "loss": 2.3124, "step": 269820 }, { "epoch": 0.94, "learning_rate": 2.944889908864839e-06, "loss": 2.3662, "step": 269830 }, { "epoch": 0.94, "learning_rate": 2.9431460290111853e-06, "loss": 2.2884, "step": 269840 }, { "epoch": 0.94, "learning_rate": 2.941402149157532e-06, "loss": 2.3413, "step": 269850 }, { "epoch": 0.94, "learning_rate": 2.9396582693038783e-06, "loss": 2.2455, "step": 269860 }, { "epoch": 0.94, "learning_rate": 2.9379143894502245e-06, "loss": 2.3433, "step": 269870 }, { "epoch": 0.94, "learning_rate": 2.9361705095965712e-06, "loss": 2.3557, "step": 269880 }, { "epoch": 0.94, "learning_rate": 2.9344266297429175e-06, "loss": 2.3348, "step": 269890 }, { "epoch": 0.94, "learning_rate": 2.9326827498892638e-06, "loss": 2.3514, "step": 269900 }, { "epoch": 0.94, "learning_rate": 2.9309388700356105e-06, "loss": 2.3032, "step": 269910 }, { "epoch": 0.94, "learning_rate": 2.9291949901819567e-06, "loss": 2.3114, "step": 269920 }, { "epoch": 0.94, "learning_rate": 2.927451110328303e-06, "loss": 2.3436, "step": 269930 }, { "epoch": 0.94, "learning_rate": 2.9257072304746493e-06, "loss": 2.3158, "step": 269940 }, { "epoch": 0.94, "learning_rate": 2.923963350620996e-06, "loss": 2.2469, "step": 269950 }, { "epoch": 0.94, "learning_rate": 2.9222194707673422e-06, "loss": 2.2406, "step": 269960 }, { "epoch": 0.94, "learning_rate": 2.9204755909136885e-06, "loss": 2.4245, "step": 269970 }, { "epoch": 0.94, "learning_rate": 2.918731711060035e-06, "loss": 2.3021, "step": 269980 }, { "epoch": 0.94, "learning_rate": 2.9169878312063815e-06, "loss": 2.3799, "step": 269990 }, { "epoch": 0.94, "learning_rate": 2.9152439513527277e-06, "loss": 2.3248, "step": 270000 }, { "epoch": 0.94, "learning_rate": 2.9135000714990744e-06, "loss": 2.3114, "step": 270010 }, { "epoch": 0.94, "learning_rate": 2.9117561916454207e-06, "loss": 2.3445, "step": 270020 }, { "epoch": 0.94, "learning_rate": 2.910012311791767e-06, "loss": 2.325, "step": 270030 }, { "epoch": 0.94, "learning_rate": 2.9082684319381132e-06, "loss": 2.3891, "step": 270040 }, { "epoch": 0.94, "learning_rate": 2.90652455208446e-06, "loss": 2.2664, "step": 270050 }, { "epoch": 0.94, "learning_rate": 2.904780672230806e-06, "loss": 2.4291, "step": 270060 }, { "epoch": 0.94, "learning_rate": 2.9030367923771525e-06, "loss": 2.2906, "step": 270070 }, { "epoch": 0.94, "learning_rate": 2.901292912523499e-06, "loss": 2.2769, "step": 270080 }, { "epoch": 0.94, "learning_rate": 2.8995490326698454e-06, "loss": 2.3497, "step": 270090 }, { "epoch": 0.94, "learning_rate": 2.8978051528161917e-06, "loss": 2.2963, "step": 270100 }, { "epoch": 0.94, "learning_rate": 2.8960612729625384e-06, "loss": 2.3283, "step": 270110 }, { "epoch": 0.94, "learning_rate": 2.8943173931088847e-06, "loss": 2.3653, "step": 270120 }, { "epoch": 0.94, "learning_rate": 2.892573513255231e-06, "loss": 2.3887, "step": 270130 }, { "epoch": 0.94, "learning_rate": 2.8908296334015776e-06, "loss": 2.3836, "step": 270140 }, { "epoch": 0.94, "learning_rate": 2.889085753547924e-06, "loss": 2.3385, "step": 270150 }, { "epoch": 0.94, "learning_rate": 2.88734187369427e-06, "loss": 2.3122, "step": 270160 }, { "epoch": 0.94, "learning_rate": 2.8855979938406164e-06, "loss": 2.3411, "step": 270170 }, { "epoch": 0.94, "learning_rate": 2.883854113986963e-06, "loss": 2.3776, "step": 270180 }, { "epoch": 0.94, "learning_rate": 2.8821102341333094e-06, "loss": 2.3298, "step": 270190 }, { "epoch": 0.94, "learning_rate": 2.8803663542796557e-06, "loss": 2.3978, "step": 270200 }, { "epoch": 0.94, "learning_rate": 2.8786224744260024e-06, "loss": 2.3419, "step": 270210 }, { "epoch": 0.94, "learning_rate": 2.8768785945723486e-06, "loss": 2.2454, "step": 270220 }, { "epoch": 0.94, "learning_rate": 2.875134714718695e-06, "loss": 2.4229, "step": 270230 }, { "epoch": 0.94, "learning_rate": 2.8733908348650416e-06, "loss": 2.3243, "step": 270240 }, { "epoch": 0.94, "learning_rate": 2.871646955011388e-06, "loss": 2.4248, "step": 270250 }, { "epoch": 0.94, "learning_rate": 2.869903075157734e-06, "loss": 2.3533, "step": 270260 }, { "epoch": 0.94, "learning_rate": 2.8681591953040804e-06, "loss": 2.3551, "step": 270270 }, { "epoch": 0.94, "learning_rate": 2.866415315450427e-06, "loss": 2.3305, "step": 270280 }, { "epoch": 0.94, "learning_rate": 2.8646714355967734e-06, "loss": 2.3669, "step": 270290 }, { "epoch": 0.94, "learning_rate": 2.8629275557431196e-06, "loss": 2.345, "step": 270300 }, { "epoch": 0.94, "learning_rate": 2.8611836758894663e-06, "loss": 2.3724, "step": 270310 }, { "epoch": 0.94, "learning_rate": 2.8594397960358126e-06, "loss": 2.3107, "step": 270320 }, { "epoch": 0.94, "learning_rate": 2.857695916182159e-06, "loss": 2.2408, "step": 270330 }, { "epoch": 0.94, "learning_rate": 2.8559520363285056e-06, "loss": 2.4362, "step": 270340 }, { "epoch": 0.94, "learning_rate": 2.854208156474852e-06, "loss": 2.3744, "step": 270350 }, { "epoch": 0.94, "learning_rate": 2.852464276621198e-06, "loss": 2.4255, "step": 270360 }, { "epoch": 0.94, "learning_rate": 2.8507203967675444e-06, "loss": 2.3815, "step": 270370 }, { "epoch": 0.94, "learning_rate": 2.848976516913891e-06, "loss": 2.3253, "step": 270380 }, { "epoch": 0.94, "learning_rate": 2.8472326370602373e-06, "loss": 2.3254, "step": 270390 }, { "epoch": 0.94, "learning_rate": 2.8454887572065836e-06, "loss": 2.3259, "step": 270400 }, { "epoch": 0.94, "learning_rate": 2.8437448773529303e-06, "loss": 2.3337, "step": 270410 }, { "epoch": 0.94, "learning_rate": 2.8420009974992766e-06, "loss": 2.3464, "step": 270420 }, { "epoch": 0.94, "learning_rate": 2.840257117645623e-06, "loss": 2.4134, "step": 270430 }, { "epoch": 0.94, "learning_rate": 2.8385132377919695e-06, "loss": 2.2933, "step": 270440 }, { "epoch": 0.94, "learning_rate": 2.836769357938316e-06, "loss": 2.3104, "step": 270450 }, { "epoch": 0.94, "learning_rate": 2.835025478084662e-06, "loss": 2.3252, "step": 270460 }, { "epoch": 0.94, "learning_rate": 2.8332815982310083e-06, "loss": 2.2065, "step": 270470 }, { "epoch": 0.94, "learning_rate": 2.831537718377355e-06, "loss": 2.3405, "step": 270480 }, { "epoch": 0.94, "learning_rate": 2.8297938385237013e-06, "loss": 2.298, "step": 270490 }, { "epoch": 0.94, "learning_rate": 2.8280499586700476e-06, "loss": 2.2619, "step": 270500 }, { "epoch": 0.94, "learning_rate": 2.8263060788163943e-06, "loss": 2.4311, "step": 270510 }, { "epoch": 0.94, "learning_rate": 2.8245621989627405e-06, "loss": 2.2746, "step": 270520 }, { "epoch": 0.94, "learning_rate": 2.822818319109087e-06, "loss": 2.3598, "step": 270530 }, { "epoch": 0.94, "learning_rate": 2.8210744392554335e-06, "loss": 2.313, "step": 270540 }, { "epoch": 0.94, "learning_rate": 2.8193305594017798e-06, "loss": 2.3221, "step": 270550 }, { "epoch": 0.94, "learning_rate": 2.817586679548126e-06, "loss": 2.2554, "step": 270560 }, { "epoch": 0.94, "learning_rate": 2.8158427996944723e-06, "loss": 2.394, "step": 270570 }, { "epoch": 0.94, "learning_rate": 2.814098919840819e-06, "loss": 2.3707, "step": 270580 }, { "epoch": 0.94, "learning_rate": 2.8123550399871653e-06, "loss": 2.3269, "step": 270590 }, { "epoch": 0.94, "learning_rate": 2.8106111601335115e-06, "loss": 2.304, "step": 270600 }, { "epoch": 0.94, "learning_rate": 2.8088672802798582e-06, "loss": 2.3656, "step": 270610 }, { "epoch": 0.94, "learning_rate": 2.8071234004262045e-06, "loss": 2.338, "step": 270620 }, { "epoch": 0.94, "learning_rate": 2.8053795205725508e-06, "loss": 2.3098, "step": 270630 }, { "epoch": 0.94, "learning_rate": 2.8036356407188974e-06, "loss": 2.2503, "step": 270640 }, { "epoch": 0.94, "learning_rate": 2.8018917608652437e-06, "loss": 2.3283, "step": 270650 }, { "epoch": 0.94, "learning_rate": 2.80014788101159e-06, "loss": 2.353, "step": 270660 }, { "epoch": 0.94, "learning_rate": 2.7984040011579363e-06, "loss": 2.3632, "step": 270670 }, { "epoch": 0.94, "learning_rate": 2.796660121304283e-06, "loss": 2.3495, "step": 270680 }, { "epoch": 0.94, "learning_rate": 2.7949162414506292e-06, "loss": 2.3278, "step": 270690 }, { "epoch": 0.94, "learning_rate": 2.7931723615969755e-06, "loss": 2.3607, "step": 270700 }, { "epoch": 0.94, "learning_rate": 2.791428481743322e-06, "loss": 2.3067, "step": 270710 }, { "epoch": 0.94, "learning_rate": 2.7896846018896684e-06, "loss": 2.3528, "step": 270720 }, { "epoch": 0.94, "learning_rate": 2.7879407220360147e-06, "loss": 2.2896, "step": 270730 }, { "epoch": 0.94, "learning_rate": 2.7861968421823614e-06, "loss": 2.3736, "step": 270740 }, { "epoch": 0.94, "learning_rate": 2.7844529623287077e-06, "loss": 2.3546, "step": 270750 }, { "epoch": 0.94, "learning_rate": 2.782709082475054e-06, "loss": 2.3095, "step": 270760 }, { "epoch": 0.94, "learning_rate": 2.7809652026214002e-06, "loss": 2.3289, "step": 270770 }, { "epoch": 0.94, "learning_rate": 2.779221322767747e-06, "loss": 2.3877, "step": 270780 }, { "epoch": 0.94, "learning_rate": 2.777477442914093e-06, "loss": 2.3596, "step": 270790 }, { "epoch": 0.94, "learning_rate": 2.7757335630604394e-06, "loss": 2.3212, "step": 270800 }, { "epoch": 0.94, "learning_rate": 2.773989683206786e-06, "loss": 2.3089, "step": 270810 }, { "epoch": 0.94, "learning_rate": 2.7722458033531324e-06, "loss": 2.316, "step": 270820 }, { "epoch": 0.94, "learning_rate": 2.7705019234994787e-06, "loss": 2.3183, "step": 270830 }, { "epoch": 0.94, "learning_rate": 2.7687580436458254e-06, "loss": 2.3197, "step": 270840 }, { "epoch": 0.94, "learning_rate": 2.7670141637921716e-06, "loss": 2.4082, "step": 270850 }, { "epoch": 0.94, "learning_rate": 2.765270283938518e-06, "loss": 2.2909, "step": 270860 }, { "epoch": 0.94, "learning_rate": 2.763526404084864e-06, "loss": 2.3013, "step": 270870 }, { "epoch": 0.94, "learning_rate": 2.761782524231211e-06, "loss": 2.3013, "step": 270880 }, { "epoch": 0.94, "learning_rate": 2.760038644377557e-06, "loss": 2.3941, "step": 270890 }, { "epoch": 0.94, "learning_rate": 2.7582947645239034e-06, "loss": 2.3225, "step": 270900 }, { "epoch": 0.94, "learning_rate": 2.75655088467025e-06, "loss": 2.3719, "step": 270910 }, { "epoch": 0.94, "learning_rate": 2.7548070048165964e-06, "loss": 2.3885, "step": 270920 }, { "epoch": 0.94, "learning_rate": 2.7530631249629426e-06, "loss": 2.3342, "step": 270930 }, { "epoch": 0.94, "learning_rate": 2.7513192451092893e-06, "loss": 2.3459, "step": 270940 }, { "epoch": 0.95, "learning_rate": 2.7495753652556356e-06, "loss": 2.2301, "step": 270950 }, { "epoch": 0.95, "learning_rate": 2.747831485401982e-06, "loss": 2.3882, "step": 270960 }, { "epoch": 0.95, "learning_rate": 2.746087605548328e-06, "loss": 2.3156, "step": 270970 }, { "epoch": 0.95, "learning_rate": 2.744343725694675e-06, "loss": 2.3097, "step": 270980 }, { "epoch": 0.95, "learning_rate": 2.742599845841021e-06, "loss": 2.2995, "step": 270990 }, { "epoch": 0.95, "learning_rate": 2.7408559659873674e-06, "loss": 2.37, "step": 271000 }, { "epoch": 0.95, "learning_rate": 2.739112086133714e-06, "loss": 2.2871, "step": 271010 }, { "epoch": 0.95, "learning_rate": 2.7373682062800603e-06, "loss": 2.3205, "step": 271020 }, { "epoch": 0.95, "learning_rate": 2.7356243264264066e-06, "loss": 2.3332, "step": 271030 }, { "epoch": 0.95, "learning_rate": 2.7338804465727533e-06, "loss": 2.3461, "step": 271040 }, { "epoch": 0.95, "learning_rate": 2.7321365667190996e-06, "loss": 2.3063, "step": 271050 }, { "epoch": 0.95, "learning_rate": 2.730392686865446e-06, "loss": 2.436, "step": 271060 }, { "epoch": 0.95, "learning_rate": 2.728648807011792e-06, "loss": 2.3583, "step": 271070 }, { "epoch": 0.95, "learning_rate": 2.726904927158139e-06, "loss": 2.3167, "step": 271080 }, { "epoch": 0.95, "learning_rate": 2.725161047304485e-06, "loss": 2.3398, "step": 271090 }, { "epoch": 0.95, "learning_rate": 2.7234171674508313e-06, "loss": 2.4425, "step": 271100 }, { "epoch": 0.95, "learning_rate": 2.721673287597178e-06, "loss": 2.35, "step": 271110 }, { "epoch": 0.95, "learning_rate": 2.7199294077435243e-06, "loss": 2.3008, "step": 271120 }, { "epoch": 0.95, "learning_rate": 2.7181855278898706e-06, "loss": 2.3306, "step": 271130 }, { "epoch": 0.95, "learning_rate": 2.7164416480362173e-06, "loss": 2.3078, "step": 271140 }, { "epoch": 0.95, "learning_rate": 2.7146977681825635e-06, "loss": 2.3845, "step": 271150 }, { "epoch": 0.95, "learning_rate": 2.71295388832891e-06, "loss": 2.3766, "step": 271160 }, { "epoch": 0.95, "learning_rate": 2.711210008475256e-06, "loss": 2.4144, "step": 271170 }, { "epoch": 0.95, "learning_rate": 2.7094661286216028e-06, "loss": 2.2634, "step": 271180 }, { "epoch": 0.95, "learning_rate": 2.707722248767949e-06, "loss": 2.4086, "step": 271190 }, { "epoch": 0.95, "learning_rate": 2.7059783689142953e-06, "loss": 2.3091, "step": 271200 }, { "epoch": 0.95, "learning_rate": 2.704234489060642e-06, "loss": 2.2234, "step": 271210 }, { "epoch": 0.95, "learning_rate": 2.7024906092069883e-06, "loss": 2.2804, "step": 271220 }, { "epoch": 0.95, "learning_rate": 2.7007467293533345e-06, "loss": 2.2997, "step": 271230 }, { "epoch": 0.95, "learning_rate": 2.6990028494996812e-06, "loss": 2.3765, "step": 271240 }, { "epoch": 0.95, "learning_rate": 2.6972589696460275e-06, "loss": 2.3811, "step": 271250 }, { "epoch": 0.95, "learning_rate": 2.6955150897923738e-06, "loss": 2.2881, "step": 271260 }, { "epoch": 0.95, "learning_rate": 2.69377120993872e-06, "loss": 2.3132, "step": 271270 }, { "epoch": 0.95, "learning_rate": 2.6920273300850667e-06, "loss": 2.245, "step": 271280 }, { "epoch": 0.95, "learning_rate": 2.690283450231413e-06, "loss": 2.3532, "step": 271290 }, { "epoch": 0.95, "learning_rate": 2.6885395703777593e-06, "loss": 2.335, "step": 271300 }, { "epoch": 0.95, "learning_rate": 2.686795690524106e-06, "loss": 2.3658, "step": 271310 }, { "epoch": 0.95, "learning_rate": 2.6850518106704522e-06, "loss": 2.3095, "step": 271320 }, { "epoch": 0.95, "learning_rate": 2.6833079308167985e-06, "loss": 2.2514, "step": 271330 }, { "epoch": 0.95, "learning_rate": 2.681564050963145e-06, "loss": 2.2628, "step": 271340 }, { "epoch": 0.95, "learning_rate": 2.6798201711094915e-06, "loss": 2.3305, "step": 271350 }, { "epoch": 0.95, "learning_rate": 2.6780762912558377e-06, "loss": 2.3406, "step": 271360 }, { "epoch": 0.95, "learning_rate": 2.676332411402184e-06, "loss": 2.3311, "step": 271370 }, { "epoch": 0.95, "learning_rate": 2.6745885315485307e-06, "loss": 2.3472, "step": 271380 }, { "epoch": 0.95, "learning_rate": 2.672844651694877e-06, "loss": 2.2616, "step": 271390 }, { "epoch": 0.95, "learning_rate": 2.6711007718412232e-06, "loss": 2.2225, "step": 271400 }, { "epoch": 0.95, "learning_rate": 2.66935689198757e-06, "loss": 2.2846, "step": 271410 }, { "epoch": 0.95, "learning_rate": 2.667613012133916e-06, "loss": 2.3027, "step": 271420 }, { "epoch": 0.95, "learning_rate": 2.6658691322802625e-06, "loss": 2.3747, "step": 271430 }, { "epoch": 0.95, "learning_rate": 2.664125252426609e-06, "loss": 2.3506, "step": 271440 }, { "epoch": 0.95, "learning_rate": 2.6623813725729554e-06, "loss": 2.3624, "step": 271450 }, { "epoch": 0.95, "learning_rate": 2.6606374927193017e-06, "loss": 2.3299, "step": 271460 }, { "epoch": 0.95, "learning_rate": 2.6588936128656484e-06, "loss": 2.3015, "step": 271470 }, { "epoch": 0.95, "learning_rate": 2.6571497330119947e-06, "loss": 2.2927, "step": 271480 }, { "epoch": 0.95, "learning_rate": 2.655405853158341e-06, "loss": 2.3088, "step": 271490 }, { "epoch": 0.95, "learning_rate": 2.653661973304687e-06, "loss": 2.3335, "step": 271500 }, { "epoch": 0.95, "learning_rate": 2.651918093451034e-06, "loss": 2.3003, "step": 271510 }, { "epoch": 0.95, "learning_rate": 2.65017421359738e-06, "loss": 2.2914, "step": 271520 }, { "epoch": 0.95, "learning_rate": 2.6484303337437264e-06, "loss": 2.2662, "step": 271530 }, { "epoch": 0.95, "learning_rate": 2.646686453890073e-06, "loss": 2.3501, "step": 271540 }, { "epoch": 0.95, "learning_rate": 2.6449425740364194e-06, "loss": 2.3654, "step": 271550 }, { "epoch": 0.95, "learning_rate": 2.6431986941827657e-06, "loss": 2.3714, "step": 271560 }, { "epoch": 0.95, "learning_rate": 2.6414548143291123e-06, "loss": 2.3575, "step": 271570 }, { "epoch": 0.95, "learning_rate": 2.6397109344754586e-06, "loss": 2.3583, "step": 271580 }, { "epoch": 0.95, "learning_rate": 2.637967054621805e-06, "loss": 2.3062, "step": 271590 }, { "epoch": 0.95, "learning_rate": 2.636223174768151e-06, "loss": 2.2755, "step": 271600 }, { "epoch": 0.95, "learning_rate": 2.634479294914498e-06, "loss": 2.3829, "step": 271610 }, { "epoch": 0.95, "learning_rate": 2.632735415060844e-06, "loss": 2.3207, "step": 271620 }, { "epoch": 0.95, "learning_rate": 2.6309915352071904e-06, "loss": 2.3587, "step": 271630 }, { "epoch": 0.95, "learning_rate": 2.629247655353537e-06, "loss": 2.3714, "step": 271640 }, { "epoch": 0.95, "learning_rate": 2.6275037754998833e-06, "loss": 2.2926, "step": 271650 }, { "epoch": 0.95, "learning_rate": 2.6257598956462296e-06, "loss": 2.2678, "step": 271660 }, { "epoch": 0.95, "learning_rate": 2.6240160157925763e-06, "loss": 2.2691, "step": 271670 }, { "epoch": 0.95, "learning_rate": 2.6222721359389226e-06, "loss": 2.298, "step": 271680 }, { "epoch": 0.95, "learning_rate": 2.620528256085269e-06, "loss": 2.3071, "step": 271690 }, { "epoch": 0.95, "learning_rate": 2.618784376231615e-06, "loss": 2.3615, "step": 271700 }, { "epoch": 0.95, "learning_rate": 2.617040496377962e-06, "loss": 2.3659, "step": 271710 }, { "epoch": 0.95, "learning_rate": 2.615296616524308e-06, "loss": 2.3277, "step": 271720 }, { "epoch": 0.95, "learning_rate": 2.6135527366706543e-06, "loss": 2.3123, "step": 271730 }, { "epoch": 0.95, "learning_rate": 2.611808856817001e-06, "loss": 2.3959, "step": 271740 }, { "epoch": 0.95, "learning_rate": 2.6100649769633473e-06, "loss": 2.3088, "step": 271750 }, { "epoch": 0.95, "learning_rate": 2.6083210971096936e-06, "loss": 2.3117, "step": 271760 }, { "epoch": 0.95, "learning_rate": 2.6065772172560403e-06, "loss": 2.3073, "step": 271770 }, { "epoch": 0.95, "learning_rate": 2.6048333374023865e-06, "loss": 2.2573, "step": 271780 }, { "epoch": 0.95, "learning_rate": 2.603089457548733e-06, "loss": 2.3664, "step": 271790 }, { "epoch": 0.95, "learning_rate": 2.601345577695079e-06, "loss": 2.2853, "step": 271800 }, { "epoch": 0.95, "learning_rate": 2.5996016978414258e-06, "loss": 2.3481, "step": 271810 }, { "epoch": 0.95, "learning_rate": 2.597857817987772e-06, "loss": 2.2707, "step": 271820 }, { "epoch": 0.95, "learning_rate": 2.5961139381341183e-06, "loss": 2.4036, "step": 271830 }, { "epoch": 0.95, "learning_rate": 2.594370058280465e-06, "loss": 2.306, "step": 271840 }, { "epoch": 0.95, "learning_rate": 2.5926261784268113e-06, "loss": 2.385, "step": 271850 }, { "epoch": 0.95, "learning_rate": 2.5908822985731575e-06, "loss": 2.2721, "step": 271860 }, { "epoch": 0.95, "learning_rate": 2.5891384187195042e-06, "loss": 2.4067, "step": 271870 }, { "epoch": 0.95, "learning_rate": 2.5873945388658505e-06, "loss": 2.2781, "step": 271880 }, { "epoch": 0.95, "learning_rate": 2.5856506590121968e-06, "loss": 2.3242, "step": 271890 }, { "epoch": 0.95, "learning_rate": 2.583906779158543e-06, "loss": 2.3422, "step": 271900 }, { "epoch": 0.95, "learning_rate": 2.5821628993048897e-06, "loss": 2.3681, "step": 271910 }, { "epoch": 0.95, "learning_rate": 2.580419019451236e-06, "loss": 2.3108, "step": 271920 }, { "epoch": 0.95, "learning_rate": 2.5786751395975823e-06, "loss": 2.2614, "step": 271930 }, { "epoch": 0.95, "learning_rate": 2.576931259743929e-06, "loss": 2.2715, "step": 271940 }, { "epoch": 0.95, "learning_rate": 2.5751873798902752e-06, "loss": 2.3854, "step": 271950 }, { "epoch": 0.95, "learning_rate": 2.5734435000366215e-06, "loss": 2.3528, "step": 271960 }, { "epoch": 0.95, "learning_rate": 2.571699620182968e-06, "loss": 2.2808, "step": 271970 }, { "epoch": 0.95, "learning_rate": 2.5699557403293145e-06, "loss": 2.359, "step": 271980 }, { "epoch": 0.95, "learning_rate": 2.5682118604756607e-06, "loss": 2.2917, "step": 271990 }, { "epoch": 0.95, "learning_rate": 2.566467980622007e-06, "loss": 2.3359, "step": 272000 }, { "epoch": 0.95, "learning_rate": 2.5647241007683537e-06, "loss": 2.3444, "step": 272010 }, { "epoch": 0.95, "learning_rate": 2.5629802209147e-06, "loss": 2.3435, "step": 272020 }, { "epoch": 0.95, "learning_rate": 2.5612363410610462e-06, "loss": 2.3013, "step": 272030 }, { "epoch": 0.95, "learning_rate": 2.559492461207393e-06, "loss": 2.2416, "step": 272040 }, { "epoch": 0.95, "learning_rate": 2.557748581353739e-06, "loss": 2.3011, "step": 272050 }, { "epoch": 0.95, "learning_rate": 2.5560047015000855e-06, "loss": 2.3393, "step": 272060 }, { "epoch": 0.95, "learning_rate": 2.554260821646432e-06, "loss": 2.389, "step": 272070 }, { "epoch": 0.95, "learning_rate": 2.5525169417927784e-06, "loss": 2.3676, "step": 272080 }, { "epoch": 0.95, "learning_rate": 2.5507730619391247e-06, "loss": 2.3476, "step": 272090 }, { "epoch": 0.95, "learning_rate": 2.549029182085471e-06, "loss": 2.3495, "step": 272100 }, { "epoch": 0.95, "learning_rate": 2.5472853022318177e-06, "loss": 2.3751, "step": 272110 }, { "epoch": 0.95, "learning_rate": 2.545541422378164e-06, "loss": 2.2783, "step": 272120 }, { "epoch": 0.95, "learning_rate": 2.54379754252451e-06, "loss": 2.2615, "step": 272130 }, { "epoch": 0.95, "learning_rate": 2.542053662670857e-06, "loss": 2.3595, "step": 272140 }, { "epoch": 0.95, "learning_rate": 2.540309782817203e-06, "loss": 2.4117, "step": 272150 }, { "epoch": 0.95, "learning_rate": 2.5385659029635494e-06, "loss": 2.3642, "step": 272160 }, { "epoch": 0.95, "learning_rate": 2.536822023109896e-06, "loss": 2.3899, "step": 272170 }, { "epoch": 0.95, "learning_rate": 2.5350781432562424e-06, "loss": 2.3652, "step": 272180 }, { "epoch": 0.95, "learning_rate": 2.5333342634025887e-06, "loss": 2.2997, "step": 272190 }, { "epoch": 0.95, "learning_rate": 2.531590383548935e-06, "loss": 2.3388, "step": 272200 }, { "epoch": 0.95, "learning_rate": 2.5298465036952816e-06, "loss": 2.3226, "step": 272210 }, { "epoch": 0.95, "learning_rate": 2.528102623841628e-06, "loss": 2.3382, "step": 272220 }, { "epoch": 0.95, "learning_rate": 2.526358743987974e-06, "loss": 2.3605, "step": 272230 }, { "epoch": 0.95, "learning_rate": 2.524614864134321e-06, "loss": 2.3148, "step": 272240 }, { "epoch": 0.95, "learning_rate": 2.522870984280667e-06, "loss": 2.342, "step": 272250 }, { "epoch": 0.95, "learning_rate": 2.5211271044270134e-06, "loss": 2.2945, "step": 272260 }, { "epoch": 0.95, "learning_rate": 2.51938322457336e-06, "loss": 2.2947, "step": 272270 }, { "epoch": 0.95, "learning_rate": 2.5176393447197064e-06, "loss": 2.3311, "step": 272280 }, { "epoch": 0.95, "learning_rate": 2.5158954648660526e-06, "loss": 2.4195, "step": 272290 }, { "epoch": 0.95, "learning_rate": 2.514151585012399e-06, "loss": 2.3283, "step": 272300 }, { "epoch": 0.95, "learning_rate": 2.5124077051587456e-06, "loss": 2.338, "step": 272310 }, { "epoch": 0.95, "learning_rate": 2.510663825305092e-06, "loss": 2.3117, "step": 272320 }, { "epoch": 0.95, "learning_rate": 2.508919945451438e-06, "loss": 2.3031, "step": 272330 }, { "epoch": 0.95, "learning_rate": 2.507176065597785e-06, "loss": 2.3144, "step": 272340 }, { "epoch": 0.95, "learning_rate": 2.505432185744131e-06, "loss": 2.2741, "step": 272350 }, { "epoch": 0.95, "learning_rate": 2.5036883058904774e-06, "loss": 2.4127, "step": 272360 }, { "epoch": 0.95, "learning_rate": 2.501944426036824e-06, "loss": 2.2104, "step": 272370 }, { "epoch": 0.95, "learning_rate": 2.5002005461831703e-06, "loss": 2.3148, "step": 272380 }, { "epoch": 0.95, "learning_rate": 2.4984566663295166e-06, "loss": 2.3321, "step": 272390 }, { "epoch": 0.95, "learning_rate": 2.496712786475863e-06, "loss": 2.272, "step": 272400 }, { "epoch": 0.95, "learning_rate": 2.4949689066222096e-06, "loss": 2.3213, "step": 272410 }, { "epoch": 0.95, "learning_rate": 2.493225026768556e-06, "loss": 2.2354, "step": 272420 }, { "epoch": 0.95, "learning_rate": 2.491481146914902e-06, "loss": 2.3524, "step": 272430 }, { "epoch": 0.95, "learning_rate": 2.4897372670612488e-06, "loss": 2.3168, "step": 272440 }, { "epoch": 0.95, "learning_rate": 2.487993387207595e-06, "loss": 2.2609, "step": 272450 }, { "epoch": 0.95, "learning_rate": 2.4862495073539413e-06, "loss": 2.2772, "step": 272460 }, { "epoch": 0.95, "learning_rate": 2.484505627500288e-06, "loss": 2.3916, "step": 272470 }, { "epoch": 0.95, "learning_rate": 2.4827617476466343e-06, "loss": 2.295, "step": 272480 }, { "epoch": 0.95, "learning_rate": 2.4810178677929806e-06, "loss": 2.3073, "step": 272490 }, { "epoch": 0.95, "learning_rate": 2.479273987939327e-06, "loss": 2.312, "step": 272500 }, { "epoch": 0.95, "learning_rate": 2.4775301080856735e-06, "loss": 2.3995, "step": 272510 }, { "epoch": 0.95, "learning_rate": 2.4757862282320198e-06, "loss": 2.3092, "step": 272520 }, { "epoch": 0.95, "learning_rate": 2.474042348378366e-06, "loss": 2.2973, "step": 272530 }, { "epoch": 0.95, "learning_rate": 2.4722984685247127e-06, "loss": 2.3502, "step": 272540 }, { "epoch": 0.95, "learning_rate": 2.470554588671059e-06, "loss": 2.3249, "step": 272550 }, { "epoch": 0.95, "learning_rate": 2.4688107088174053e-06, "loss": 2.3259, "step": 272560 }, { "epoch": 0.95, "learning_rate": 2.467066828963752e-06, "loss": 2.3198, "step": 272570 }, { "epoch": 0.95, "learning_rate": 2.4653229491100982e-06, "loss": 2.3808, "step": 272580 }, { "epoch": 0.95, "learning_rate": 2.4635790692564445e-06, "loss": 2.2741, "step": 272590 }, { "epoch": 0.95, "learning_rate": 2.4618351894027908e-06, "loss": 2.3257, "step": 272600 }, { "epoch": 0.95, "learning_rate": 2.4600913095491375e-06, "loss": 2.3466, "step": 272610 }, { "epoch": 0.95, "learning_rate": 2.4583474296954837e-06, "loss": 2.3634, "step": 272620 }, { "epoch": 0.95, "learning_rate": 2.45660354984183e-06, "loss": 2.232, "step": 272630 }, { "epoch": 0.95, "learning_rate": 2.4548596699881767e-06, "loss": 2.303, "step": 272640 }, { "epoch": 0.95, "learning_rate": 2.453115790134523e-06, "loss": 2.3257, "step": 272650 }, { "epoch": 0.95, "learning_rate": 2.4513719102808692e-06, "loss": 2.3724, "step": 272660 }, { "epoch": 0.95, "learning_rate": 2.449628030427216e-06, "loss": 2.297, "step": 272670 }, { "epoch": 0.95, "learning_rate": 2.4478841505735622e-06, "loss": 2.3563, "step": 272680 }, { "epoch": 0.95, "learning_rate": 2.4461402707199085e-06, "loss": 2.2821, "step": 272690 }, { "epoch": 0.95, "learning_rate": 2.4443963908662548e-06, "loss": 2.3591, "step": 272700 }, { "epoch": 0.95, "learning_rate": 2.4426525110126014e-06, "loss": 2.3441, "step": 272710 }, { "epoch": 0.95, "learning_rate": 2.4409086311589477e-06, "loss": 2.2619, "step": 272720 }, { "epoch": 0.95, "learning_rate": 2.439164751305294e-06, "loss": 2.3653, "step": 272730 }, { "epoch": 0.95, "learning_rate": 2.4374208714516407e-06, "loss": 2.326, "step": 272740 }, { "epoch": 0.95, "learning_rate": 2.435676991597987e-06, "loss": 2.3282, "step": 272750 }, { "epoch": 0.95, "learning_rate": 2.4339331117443332e-06, "loss": 2.2854, "step": 272760 }, { "epoch": 0.95, "learning_rate": 2.43218923189068e-06, "loss": 2.3457, "step": 272770 }, { "epoch": 0.95, "learning_rate": 2.430445352037026e-06, "loss": 2.3382, "step": 272780 }, { "epoch": 0.95, "learning_rate": 2.4287014721833724e-06, "loss": 2.2922, "step": 272790 }, { "epoch": 0.95, "learning_rate": 2.4269575923297187e-06, "loss": 2.3434, "step": 272800 }, { "epoch": 0.95, "learning_rate": 2.4252137124760654e-06, "loss": 2.3069, "step": 272810 }, { "epoch": 0.95, "learning_rate": 2.4234698326224117e-06, "loss": 2.3845, "step": 272820 }, { "epoch": 0.95, "learning_rate": 2.421725952768758e-06, "loss": 2.2586, "step": 272830 }, { "epoch": 0.95, "learning_rate": 2.4199820729151046e-06, "loss": 2.3446, "step": 272840 }, { "epoch": 0.95, "learning_rate": 2.418238193061451e-06, "loss": 2.4214, "step": 272850 }, { "epoch": 0.95, "learning_rate": 2.416494313207797e-06, "loss": 2.4293, "step": 272860 }, { "epoch": 0.95, "learning_rate": 2.414750433354144e-06, "loss": 2.3523, "step": 272870 }, { "epoch": 0.95, "learning_rate": 2.41300655350049e-06, "loss": 2.3879, "step": 272880 }, { "epoch": 0.95, "learning_rate": 2.4112626736468364e-06, "loss": 2.3195, "step": 272890 }, { "epoch": 0.95, "learning_rate": 2.409518793793183e-06, "loss": 2.3587, "step": 272900 }, { "epoch": 0.95, "learning_rate": 2.4077749139395294e-06, "loss": 2.2615, "step": 272910 }, { "epoch": 0.95, "learning_rate": 2.4060310340858756e-06, "loss": 2.3716, "step": 272920 }, { "epoch": 0.95, "learning_rate": 2.404287154232222e-06, "loss": 2.3153, "step": 272930 }, { "epoch": 0.95, "learning_rate": 2.4025432743785686e-06, "loss": 2.3802, "step": 272940 }, { "epoch": 0.95, "learning_rate": 2.400799394524915e-06, "loss": 2.4251, "step": 272950 }, { "epoch": 0.95, "learning_rate": 2.399055514671261e-06, "loss": 2.3143, "step": 272960 }, { "epoch": 0.95, "learning_rate": 2.397311634817608e-06, "loss": 2.2254, "step": 272970 }, { "epoch": 0.95, "learning_rate": 2.395567754963954e-06, "loss": 2.3321, "step": 272980 }, { "epoch": 0.95, "learning_rate": 2.3938238751103004e-06, "loss": 2.3005, "step": 272990 }, { "epoch": 0.95, "learning_rate": 2.392079995256647e-06, "loss": 2.2623, "step": 273000 }, { "epoch": 0.95, "learning_rate": 2.3903361154029933e-06, "loss": 2.3408, "step": 273010 }, { "epoch": 0.95, "learning_rate": 2.3885922355493396e-06, "loss": 2.3309, "step": 273020 }, { "epoch": 0.95, "learning_rate": 2.386848355695686e-06, "loss": 2.3185, "step": 273030 }, { "epoch": 0.95, "learning_rate": 2.3851044758420326e-06, "loss": 2.2923, "step": 273040 }, { "epoch": 0.95, "learning_rate": 2.383360595988379e-06, "loss": 2.3042, "step": 273050 }, { "epoch": 0.95, "learning_rate": 2.381616716134725e-06, "loss": 2.3723, "step": 273060 }, { "epoch": 0.95, "learning_rate": 2.379872836281072e-06, "loss": 2.3807, "step": 273070 }, { "epoch": 0.95, "learning_rate": 2.378128956427418e-06, "loss": 2.2967, "step": 273080 }, { "epoch": 0.95, "learning_rate": 2.3763850765737643e-06, "loss": 2.3268, "step": 273090 }, { "epoch": 0.95, "learning_rate": 2.374641196720111e-06, "loss": 2.3374, "step": 273100 }, { "epoch": 0.95, "learning_rate": 2.3728973168664573e-06, "loss": 2.2927, "step": 273110 }, { "epoch": 0.95, "learning_rate": 2.3711534370128036e-06, "loss": 2.3044, "step": 273120 }, { "epoch": 0.95, "learning_rate": 2.36940955715915e-06, "loss": 2.3669, "step": 273130 }, { "epoch": 0.95, "learning_rate": 2.3676656773054965e-06, "loss": 2.3811, "step": 273140 }, { "epoch": 0.95, "learning_rate": 2.365921797451843e-06, "loss": 2.2811, "step": 273150 }, { "epoch": 0.95, "learning_rate": 2.364177917598189e-06, "loss": 2.2704, "step": 273160 }, { "epoch": 0.95, "learning_rate": 2.3624340377445358e-06, "loss": 2.3885, "step": 273170 }, { "epoch": 0.95, "learning_rate": 2.360690157890882e-06, "loss": 2.3676, "step": 273180 }, { "epoch": 0.95, "learning_rate": 2.3589462780372283e-06, "loss": 2.3481, "step": 273190 }, { "epoch": 0.95, "learning_rate": 2.357202398183575e-06, "loss": 2.3718, "step": 273200 }, { "epoch": 0.95, "learning_rate": 2.3554585183299213e-06, "loss": 2.3371, "step": 273210 }, { "epoch": 0.95, "learning_rate": 2.3537146384762675e-06, "loss": 2.3233, "step": 273220 }, { "epoch": 0.95, "learning_rate": 2.351970758622614e-06, "loss": 2.3068, "step": 273230 }, { "epoch": 0.95, "learning_rate": 2.3502268787689605e-06, "loss": 2.3857, "step": 273240 }, { "epoch": 0.95, "learning_rate": 2.3484829989153068e-06, "loss": 2.3148, "step": 273250 }, { "epoch": 0.95, "learning_rate": 2.346739119061653e-06, "loss": 2.2558, "step": 273260 }, { "epoch": 0.95, "learning_rate": 2.3449952392079997e-06, "loss": 2.2878, "step": 273270 }, { "epoch": 0.95, "learning_rate": 2.343251359354346e-06, "loss": 2.3722, "step": 273280 }, { "epoch": 0.95, "learning_rate": 2.3415074795006923e-06, "loss": 2.3527, "step": 273290 }, { "epoch": 0.95, "learning_rate": 2.339763599647039e-06, "loss": 2.3057, "step": 273300 }, { "epoch": 0.95, "learning_rate": 2.3380197197933852e-06, "loss": 2.3358, "step": 273310 }, { "epoch": 0.95, "learning_rate": 2.3362758399397315e-06, "loss": 2.3571, "step": 273320 }, { "epoch": 0.95, "learning_rate": 2.3345319600860778e-06, "loss": 2.3242, "step": 273330 }, { "epoch": 0.95, "learning_rate": 2.3327880802324245e-06, "loss": 2.3866, "step": 273340 }, { "epoch": 0.95, "learning_rate": 2.3310442003787707e-06, "loss": 2.299, "step": 273350 }, { "epoch": 0.95, "learning_rate": 2.329300320525117e-06, "loss": 2.2989, "step": 273360 }, { "epoch": 0.95, "learning_rate": 2.3275564406714637e-06, "loss": 2.3507, "step": 273370 }, { "epoch": 0.95, "learning_rate": 2.32581256081781e-06, "loss": 2.3549, "step": 273380 }, { "epoch": 0.95, "learning_rate": 2.3240686809641562e-06, "loss": 2.3343, "step": 273390 }, { "epoch": 0.95, "learning_rate": 2.322324801110503e-06, "loss": 2.3567, "step": 273400 }, { "epoch": 0.95, "learning_rate": 2.320580921256849e-06, "loss": 2.3371, "step": 273410 }, { "epoch": 0.95, "learning_rate": 2.3188370414031955e-06, "loss": 2.4294, "step": 273420 }, { "epoch": 0.95, "learning_rate": 2.3170931615495417e-06, "loss": 2.3599, "step": 273430 }, { "epoch": 0.95, "learning_rate": 2.3153492816958884e-06, "loss": 2.3629, "step": 273440 }, { "epoch": 0.95, "learning_rate": 2.3136054018422347e-06, "loss": 2.3402, "step": 273450 }, { "epoch": 0.95, "learning_rate": 2.311861521988581e-06, "loss": 2.3366, "step": 273460 }, { "epoch": 0.95, "learning_rate": 2.3101176421349276e-06, "loss": 2.3377, "step": 273470 }, { "epoch": 0.95, "learning_rate": 2.308373762281274e-06, "loss": 2.3716, "step": 273480 }, { "epoch": 0.95, "learning_rate": 2.30662988242762e-06, "loss": 2.3096, "step": 273490 }, { "epoch": 0.95, "learning_rate": 2.304886002573967e-06, "loss": 2.313, "step": 273500 }, { "epoch": 0.95, "learning_rate": 2.303142122720313e-06, "loss": 2.4223, "step": 273510 }, { "epoch": 0.95, "learning_rate": 2.3013982428666594e-06, "loss": 2.3661, "step": 273520 }, { "epoch": 0.95, "learning_rate": 2.2996543630130057e-06, "loss": 2.3461, "step": 273530 }, { "epoch": 0.95, "learning_rate": 2.2979104831593524e-06, "loss": 2.3093, "step": 273540 }, { "epoch": 0.95, "learning_rate": 2.2961666033056986e-06, "loss": 2.312, "step": 273550 }, { "epoch": 0.95, "learning_rate": 2.294422723452045e-06, "loss": 2.3774, "step": 273560 }, { "epoch": 0.95, "learning_rate": 2.2926788435983916e-06, "loss": 2.2529, "step": 273570 }, { "epoch": 0.95, "learning_rate": 2.290934963744738e-06, "loss": 2.2894, "step": 273580 }, { "epoch": 0.95, "learning_rate": 2.289191083891084e-06, "loss": 2.3238, "step": 273590 }, { "epoch": 0.95, "learning_rate": 2.287447204037431e-06, "loss": 2.3109, "step": 273600 }, { "epoch": 0.95, "learning_rate": 2.285703324183777e-06, "loss": 2.27, "step": 273610 }, { "epoch": 0.95, "learning_rate": 2.2839594443301234e-06, "loss": 2.2857, "step": 273620 }, { "epoch": 0.95, "learning_rate": 2.2822155644764697e-06, "loss": 2.4713, "step": 273630 }, { "epoch": 0.95, "learning_rate": 2.2804716846228163e-06, "loss": 2.3202, "step": 273640 }, { "epoch": 0.95, "learning_rate": 2.2787278047691626e-06, "loss": 2.3176, "step": 273650 }, { "epoch": 0.95, "learning_rate": 2.276983924915509e-06, "loss": 2.3788, "step": 273660 }, { "epoch": 0.95, "learning_rate": 2.2752400450618556e-06, "loss": 2.3163, "step": 273670 }, { "epoch": 0.95, "learning_rate": 2.273496165208202e-06, "loss": 2.3158, "step": 273680 }, { "epoch": 0.95, "learning_rate": 2.271752285354548e-06, "loss": 2.336, "step": 273690 }, { "epoch": 0.95, "learning_rate": 2.270008405500895e-06, "loss": 2.3108, "step": 273700 }, { "epoch": 0.95, "learning_rate": 2.268264525647241e-06, "loss": 2.3647, "step": 273710 }, { "epoch": 0.95, "learning_rate": 2.2665206457935873e-06, "loss": 2.3096, "step": 273720 }, { "epoch": 0.95, "learning_rate": 2.2647767659399336e-06, "loss": 2.1996, "step": 273730 }, { "epoch": 0.95, "learning_rate": 2.2630328860862803e-06, "loss": 2.3169, "step": 273740 }, { "epoch": 0.95, "learning_rate": 2.2612890062326266e-06, "loss": 2.2509, "step": 273750 }, { "epoch": 0.95, "learning_rate": 2.259545126378973e-06, "loss": 2.3441, "step": 273760 }, { "epoch": 0.95, "learning_rate": 2.2578012465253195e-06, "loss": 2.3411, "step": 273770 }, { "epoch": 0.95, "learning_rate": 2.256057366671666e-06, "loss": 2.3465, "step": 273780 }, { "epoch": 0.95, "learning_rate": 2.254313486818012e-06, "loss": 2.3026, "step": 273790 }, { "epoch": 0.95, "learning_rate": 2.2525696069643588e-06, "loss": 2.3896, "step": 273800 }, { "epoch": 0.95, "learning_rate": 2.250825727110705e-06, "loss": 2.4198, "step": 273810 }, { "epoch": 0.96, "learning_rate": 2.2490818472570513e-06, "loss": 2.3355, "step": 273820 }, { "epoch": 0.96, "learning_rate": 2.2473379674033976e-06, "loss": 2.286, "step": 273830 }, { "epoch": 0.96, "learning_rate": 2.2455940875497443e-06, "loss": 2.3926, "step": 273840 }, { "epoch": 0.96, "learning_rate": 2.2438502076960905e-06, "loss": 2.3556, "step": 273850 }, { "epoch": 0.96, "learning_rate": 2.242106327842437e-06, "loss": 2.3667, "step": 273860 }, { "epoch": 0.96, "learning_rate": 2.2403624479887835e-06, "loss": 2.3031, "step": 273870 }, { "epoch": 0.96, "learning_rate": 2.2386185681351298e-06, "loss": 2.3479, "step": 273880 }, { "epoch": 0.96, "learning_rate": 2.236874688281476e-06, "loss": 2.3203, "step": 273890 }, { "epoch": 0.96, "learning_rate": 2.2351308084278227e-06, "loss": 2.2561, "step": 273900 }, { "epoch": 0.96, "learning_rate": 2.233386928574169e-06, "loss": 2.2922, "step": 273910 }, { "epoch": 0.96, "learning_rate": 2.2316430487205153e-06, "loss": 2.3061, "step": 273920 }, { "epoch": 0.96, "learning_rate": 2.2298991688668615e-06, "loss": 2.3525, "step": 273930 }, { "epoch": 0.96, "learning_rate": 2.2281552890132082e-06, "loss": 2.297, "step": 273940 }, { "epoch": 0.96, "learning_rate": 2.2264114091595545e-06, "loss": 2.2604, "step": 273950 }, { "epoch": 0.96, "learning_rate": 2.2246675293059008e-06, "loss": 2.3814, "step": 273960 }, { "epoch": 0.96, "learning_rate": 2.2229236494522475e-06, "loss": 2.3741, "step": 273970 }, { "epoch": 0.96, "learning_rate": 2.2211797695985937e-06, "loss": 2.308, "step": 273980 }, { "epoch": 0.96, "learning_rate": 2.21943588974494e-06, "loss": 2.3193, "step": 273990 }, { "epoch": 0.96, "learning_rate": 2.2176920098912867e-06, "loss": 2.3547, "step": 274000 }, { "epoch": 0.96, "learning_rate": 2.215948130037633e-06, "loss": 2.3183, "step": 274010 }, { "epoch": 0.96, "learning_rate": 2.2142042501839792e-06, "loss": 2.2997, "step": 274020 }, { "epoch": 0.96, "learning_rate": 2.2124603703303255e-06, "loss": 2.3355, "step": 274030 }, { "epoch": 0.96, "learning_rate": 2.210716490476672e-06, "loss": 2.3697, "step": 274040 }, { "epoch": 0.96, "learning_rate": 2.2089726106230185e-06, "loss": 2.3243, "step": 274050 }, { "epoch": 0.96, "learning_rate": 2.2072287307693647e-06, "loss": 2.3147, "step": 274060 }, { "epoch": 0.96, "learning_rate": 2.2054848509157114e-06, "loss": 2.261, "step": 274070 }, { "epoch": 0.96, "learning_rate": 2.2037409710620577e-06, "loss": 2.3387, "step": 274080 }, { "epoch": 0.96, "learning_rate": 2.201997091208404e-06, "loss": 2.3752, "step": 274090 }, { "epoch": 0.96, "learning_rate": 2.2002532113547507e-06, "loss": 2.3558, "step": 274100 }, { "epoch": 0.96, "learning_rate": 2.198509331501097e-06, "loss": 2.4127, "step": 274110 }, { "epoch": 0.96, "learning_rate": 2.196765451647443e-06, "loss": 2.2437, "step": 274120 }, { "epoch": 0.96, "learning_rate": 2.1950215717937895e-06, "loss": 2.3375, "step": 274130 }, { "epoch": 0.96, "learning_rate": 2.193277691940136e-06, "loss": 2.2846, "step": 274140 }, { "epoch": 0.96, "learning_rate": 2.1915338120864824e-06, "loss": 2.2826, "step": 274150 }, { "epoch": 0.96, "learning_rate": 2.1897899322328287e-06, "loss": 2.351, "step": 274160 }, { "epoch": 0.96, "learning_rate": 2.1880460523791754e-06, "loss": 2.3876, "step": 274170 }, { "epoch": 0.96, "learning_rate": 2.1863021725255217e-06, "loss": 2.3793, "step": 274180 }, { "epoch": 0.96, "learning_rate": 2.184558292671868e-06, "loss": 2.3074, "step": 274190 }, { "epoch": 0.96, "learning_rate": 2.1828144128182146e-06, "loss": 2.3653, "step": 274200 }, { "epoch": 0.96, "learning_rate": 2.181070532964561e-06, "loss": 2.3009, "step": 274210 }, { "epoch": 0.96, "learning_rate": 2.179326653110907e-06, "loss": 2.3164, "step": 274220 }, { "epoch": 0.96, "learning_rate": 2.1775827732572534e-06, "loss": 2.3166, "step": 274230 }, { "epoch": 0.96, "learning_rate": 2.1758388934036e-06, "loss": 2.3332, "step": 274240 }, { "epoch": 0.96, "learning_rate": 2.1740950135499464e-06, "loss": 2.3572, "step": 274250 }, { "epoch": 0.96, "learning_rate": 2.1723511336962927e-06, "loss": 2.3211, "step": 274260 }, { "epoch": 0.96, "learning_rate": 2.1706072538426394e-06, "loss": 2.4078, "step": 274270 }, { "epoch": 0.96, "learning_rate": 2.1688633739889856e-06, "loss": 2.2922, "step": 274280 }, { "epoch": 0.96, "learning_rate": 2.167119494135332e-06, "loss": 2.3202, "step": 274290 }, { "epoch": 0.96, "learning_rate": 2.1653756142816786e-06, "loss": 2.3592, "step": 274300 }, { "epoch": 0.96, "learning_rate": 2.163631734428025e-06, "loss": 2.3858, "step": 274310 }, { "epoch": 0.96, "learning_rate": 2.161887854574371e-06, "loss": 2.4393, "step": 274320 }, { "epoch": 0.96, "learning_rate": 2.160143974720718e-06, "loss": 2.298, "step": 274330 }, { "epoch": 0.96, "learning_rate": 2.158400094867064e-06, "loss": 2.4091, "step": 274340 }, { "epoch": 0.96, "learning_rate": 2.1566562150134104e-06, "loss": 2.3558, "step": 274350 }, { "epoch": 0.96, "learning_rate": 2.1549123351597566e-06, "loss": 2.298, "step": 274360 }, { "epoch": 0.96, "learning_rate": 2.1531684553061033e-06, "loss": 2.3073, "step": 274370 }, { "epoch": 0.96, "learning_rate": 2.1514245754524496e-06, "loss": 2.3828, "step": 274380 }, { "epoch": 0.96, "learning_rate": 2.149680695598796e-06, "loss": 2.3839, "step": 274390 }, { "epoch": 0.96, "learning_rate": 2.1479368157451425e-06, "loss": 2.3284, "step": 274400 }, { "epoch": 0.96, "learning_rate": 2.146192935891489e-06, "loss": 2.2772, "step": 274410 }, { "epoch": 0.96, "learning_rate": 2.144449056037835e-06, "loss": 2.3047, "step": 274420 }, { "epoch": 0.96, "learning_rate": 2.1427051761841818e-06, "loss": 2.2724, "step": 274430 }, { "epoch": 0.96, "learning_rate": 2.140961296330528e-06, "loss": 2.3424, "step": 274440 }, { "epoch": 0.96, "learning_rate": 2.1392174164768743e-06, "loss": 2.3322, "step": 274450 }, { "epoch": 0.96, "learning_rate": 2.1374735366232206e-06, "loss": 2.3172, "step": 274460 }, { "epoch": 0.96, "learning_rate": 2.1357296567695673e-06, "loss": 2.3071, "step": 274470 }, { "epoch": 0.96, "learning_rate": 2.1339857769159136e-06, "loss": 2.3887, "step": 274480 }, { "epoch": 0.96, "learning_rate": 2.13224189706226e-06, "loss": 2.3214, "step": 274490 }, { "epoch": 0.96, "learning_rate": 2.1304980172086065e-06, "loss": 2.3045, "step": 274500 }, { "epoch": 0.96, "learning_rate": 2.1287541373549528e-06, "loss": 2.396, "step": 274510 }, { "epoch": 0.96, "learning_rate": 2.127010257501299e-06, "loss": 2.3619, "step": 274520 }, { "epoch": 0.96, "learning_rate": 2.1252663776476457e-06, "loss": 2.3419, "step": 274530 }, { "epoch": 0.96, "learning_rate": 2.123522497793992e-06, "loss": 2.2917, "step": 274540 }, { "epoch": 0.96, "learning_rate": 2.1217786179403383e-06, "loss": 2.3453, "step": 274550 }, { "epoch": 0.96, "learning_rate": 2.1200347380866846e-06, "loss": 2.3359, "step": 274560 }, { "epoch": 0.96, "learning_rate": 2.1182908582330312e-06, "loss": 2.3889, "step": 274570 }, { "epoch": 0.96, "learning_rate": 2.1165469783793775e-06, "loss": 2.4124, "step": 274580 }, { "epoch": 0.96, "learning_rate": 2.1148030985257238e-06, "loss": 2.3087, "step": 274590 }, { "epoch": 0.96, "learning_rate": 2.1130592186720705e-06, "loss": 2.3771, "step": 274600 }, { "epoch": 0.96, "learning_rate": 2.1113153388184167e-06, "loss": 2.3879, "step": 274610 }, { "epoch": 0.96, "learning_rate": 2.109571458964763e-06, "loss": 2.2912, "step": 274620 }, { "epoch": 0.96, "learning_rate": 2.1078275791111097e-06, "loss": 2.2613, "step": 274630 }, { "epoch": 0.96, "learning_rate": 2.106083699257456e-06, "loss": 2.404, "step": 274640 }, { "epoch": 0.96, "learning_rate": 2.1043398194038022e-06, "loss": 2.3875, "step": 274650 }, { "epoch": 0.96, "learning_rate": 2.1025959395501485e-06, "loss": 2.3276, "step": 274660 }, { "epoch": 0.96, "learning_rate": 2.100852059696495e-06, "loss": 2.3156, "step": 274670 }, { "epoch": 0.96, "learning_rate": 2.0991081798428415e-06, "loss": 2.3283, "step": 274680 }, { "epoch": 0.96, "learning_rate": 2.0973642999891877e-06, "loss": 2.3721, "step": 274690 }, { "epoch": 0.96, "learning_rate": 2.0956204201355344e-06, "loss": 2.3503, "step": 274700 }, { "epoch": 0.96, "learning_rate": 2.0938765402818807e-06, "loss": 2.3894, "step": 274710 }, { "epoch": 0.96, "learning_rate": 2.092132660428227e-06, "loss": 2.3067, "step": 274720 }, { "epoch": 0.96, "learning_rate": 2.0903887805745737e-06, "loss": 2.3593, "step": 274730 }, { "epoch": 0.96, "learning_rate": 2.08864490072092e-06, "loss": 2.309, "step": 274740 }, { "epoch": 0.96, "learning_rate": 2.086901020867266e-06, "loss": 2.3897, "step": 274750 }, { "epoch": 0.96, "learning_rate": 2.0851571410136125e-06, "loss": 2.3265, "step": 274760 }, { "epoch": 0.96, "learning_rate": 2.083413261159959e-06, "loss": 2.3059, "step": 274770 }, { "epoch": 0.96, "learning_rate": 2.0816693813063054e-06, "loss": 2.3484, "step": 274780 }, { "epoch": 0.96, "learning_rate": 2.0799255014526517e-06, "loss": 2.1853, "step": 274790 }, { "epoch": 0.96, "learning_rate": 2.0781816215989984e-06, "loss": 2.2944, "step": 274800 }, { "epoch": 0.96, "learning_rate": 2.0764377417453447e-06, "loss": 2.3021, "step": 274810 }, { "epoch": 0.96, "learning_rate": 2.074693861891691e-06, "loss": 2.2836, "step": 274820 }, { "epoch": 0.96, "learning_rate": 2.0729499820380376e-06, "loss": 2.3293, "step": 274830 }, { "epoch": 0.96, "learning_rate": 2.071206102184384e-06, "loss": 2.2852, "step": 274840 }, { "epoch": 0.96, "learning_rate": 2.06946222233073e-06, "loss": 2.327, "step": 274850 }, { "epoch": 0.96, "learning_rate": 2.0677183424770764e-06, "loss": 2.3523, "step": 274860 }, { "epoch": 0.96, "learning_rate": 2.065974462623423e-06, "loss": 2.3128, "step": 274870 }, { "epoch": 0.96, "learning_rate": 2.0642305827697694e-06, "loss": 2.275, "step": 274880 }, { "epoch": 0.96, "learning_rate": 2.0624867029161157e-06, "loss": 2.3001, "step": 274890 }, { "epoch": 0.96, "learning_rate": 2.0607428230624624e-06, "loss": 2.3736, "step": 274900 }, { "epoch": 0.96, "learning_rate": 2.0589989432088086e-06, "loss": 2.2424, "step": 274910 }, { "epoch": 0.96, "learning_rate": 2.057255063355155e-06, "loss": 2.2527, "step": 274920 }, { "epoch": 0.96, "learning_rate": 2.0555111835015016e-06, "loss": 2.3981, "step": 274930 }, { "epoch": 0.96, "learning_rate": 2.053767303647848e-06, "loss": 2.3283, "step": 274940 }, { "epoch": 0.96, "learning_rate": 2.052023423794194e-06, "loss": 2.3447, "step": 274950 }, { "epoch": 0.96, "learning_rate": 2.0502795439405404e-06, "loss": 2.3548, "step": 274960 }, { "epoch": 0.96, "learning_rate": 2.048535664086887e-06, "loss": 2.255, "step": 274970 }, { "epoch": 0.96, "learning_rate": 2.0467917842332334e-06, "loss": 2.4082, "step": 274980 }, { "epoch": 0.96, "learning_rate": 2.0450479043795796e-06, "loss": 2.312, "step": 274990 }, { "epoch": 0.96, "learning_rate": 2.0433040245259263e-06, "loss": 2.3026, "step": 275000 }, { "epoch": 0.96, "learning_rate": 2.0415601446722726e-06, "loss": 2.2922, "step": 275010 }, { "epoch": 0.96, "learning_rate": 2.039816264818619e-06, "loss": 2.3222, "step": 275020 }, { "epoch": 0.96, "learning_rate": 2.0380723849649656e-06, "loss": 2.3625, "step": 275030 }, { "epoch": 0.96, "learning_rate": 2.036328505111312e-06, "loss": 2.3323, "step": 275040 }, { "epoch": 0.96, "learning_rate": 2.034584625257658e-06, "loss": 2.3488, "step": 275050 }, { "epoch": 0.96, "learning_rate": 2.032840745404005e-06, "loss": 2.3135, "step": 275060 }, { "epoch": 0.96, "learning_rate": 2.031096865550351e-06, "loss": 2.3037, "step": 275070 }, { "epoch": 0.96, "learning_rate": 2.0293529856966973e-06, "loss": 2.3385, "step": 275080 }, { "epoch": 0.96, "learning_rate": 2.0276091058430436e-06, "loss": 2.394, "step": 275090 }, { "epoch": 0.96, "learning_rate": 2.0258652259893903e-06, "loss": 2.3197, "step": 275100 }, { "epoch": 0.96, "learning_rate": 2.0241213461357366e-06, "loss": 2.3323, "step": 275110 }, { "epoch": 0.96, "learning_rate": 2.022377466282083e-06, "loss": 2.3382, "step": 275120 }, { "epoch": 0.96, "learning_rate": 2.0206335864284295e-06, "loss": 2.3887, "step": 275130 }, { "epoch": 0.96, "learning_rate": 2.018889706574776e-06, "loss": 2.3314, "step": 275140 }, { "epoch": 0.96, "learning_rate": 2.017145826721122e-06, "loss": 2.3205, "step": 275150 }, { "epoch": 0.96, "learning_rate": 2.0154019468674688e-06, "loss": 2.3327, "step": 275160 }, { "epoch": 0.96, "learning_rate": 2.013658067013815e-06, "loss": 2.3482, "step": 275170 }, { "epoch": 0.96, "learning_rate": 2.0119141871601613e-06, "loss": 2.3581, "step": 275180 }, { "epoch": 0.96, "learning_rate": 2.010170307306508e-06, "loss": 2.3118, "step": 275190 }, { "epoch": 0.96, "learning_rate": 2.0084264274528543e-06, "loss": 2.2349, "step": 275200 }, { "epoch": 0.96, "learning_rate": 2.0066825475992005e-06, "loss": 2.2948, "step": 275210 }, { "epoch": 0.96, "learning_rate": 2.0049386677455472e-06, "loss": 2.3567, "step": 275220 }, { "epoch": 0.96, "learning_rate": 2.0031947878918935e-06, "loss": 2.2716, "step": 275230 }, { "epoch": 0.96, "learning_rate": 2.0014509080382398e-06, "loss": 2.2971, "step": 275240 }, { "epoch": 0.96, "learning_rate": 1.999707028184586e-06, "loss": 2.3372, "step": 275250 }, { "epoch": 0.96, "learning_rate": 1.9979631483309327e-06, "loss": 2.3474, "step": 275260 }, { "epoch": 0.96, "learning_rate": 1.996219268477279e-06, "loss": 2.2739, "step": 275270 }, { "epoch": 0.96, "learning_rate": 1.9944753886236253e-06, "loss": 2.3179, "step": 275280 }, { "epoch": 0.96, "learning_rate": 1.992731508769972e-06, "loss": 2.2849, "step": 275290 }, { "epoch": 0.96, "learning_rate": 1.9909876289163182e-06, "loss": 2.3341, "step": 275300 }, { "epoch": 0.96, "learning_rate": 1.9892437490626645e-06, "loss": 2.2688, "step": 275310 }, { "epoch": 0.96, "learning_rate": 1.987499869209011e-06, "loss": 2.3151, "step": 275320 }, { "epoch": 0.96, "learning_rate": 1.9857559893553574e-06, "loss": 2.2506, "step": 275330 }, { "epoch": 0.96, "learning_rate": 1.9840121095017037e-06, "loss": 2.3954, "step": 275340 }, { "epoch": 0.96, "learning_rate": 1.9822682296480504e-06, "loss": 2.4046, "step": 275350 }, { "epoch": 0.96, "learning_rate": 1.9805243497943967e-06, "loss": 2.3448, "step": 275360 }, { "epoch": 0.96, "learning_rate": 1.978780469940743e-06, "loss": 2.3901, "step": 275370 }, { "epoch": 0.96, "learning_rate": 1.9770365900870892e-06, "loss": 2.3331, "step": 275380 }, { "epoch": 0.96, "learning_rate": 1.975292710233436e-06, "loss": 2.4041, "step": 275390 }, { "epoch": 0.96, "learning_rate": 1.973548830379782e-06, "loss": 2.3101, "step": 275400 }, { "epoch": 0.96, "learning_rate": 1.9718049505261285e-06, "loss": 2.3062, "step": 275410 }, { "epoch": 0.96, "learning_rate": 1.970061070672475e-06, "loss": 2.3676, "step": 275420 }, { "epoch": 0.96, "learning_rate": 1.9683171908188214e-06, "loss": 2.2438, "step": 275430 }, { "epoch": 0.96, "learning_rate": 1.9665733109651677e-06, "loss": 2.3814, "step": 275440 }, { "epoch": 0.96, "learning_rate": 1.9648294311115144e-06, "loss": 2.2665, "step": 275450 }, { "epoch": 0.96, "learning_rate": 1.9630855512578606e-06, "loss": 2.3347, "step": 275460 }, { "epoch": 0.96, "learning_rate": 1.961341671404207e-06, "loss": 2.309, "step": 275470 }, { "epoch": 0.96, "learning_rate": 1.9595977915505536e-06, "loss": 2.2642, "step": 275480 }, { "epoch": 0.96, "learning_rate": 1.9578539116969e-06, "loss": 2.3468, "step": 275490 }, { "epoch": 0.96, "learning_rate": 1.956110031843246e-06, "loss": 2.3683, "step": 275500 }, { "epoch": 0.96, "learning_rate": 1.9543661519895924e-06, "loss": 2.3313, "step": 275510 }, { "epoch": 0.96, "learning_rate": 1.952622272135939e-06, "loss": 2.3105, "step": 275520 }, { "epoch": 0.96, "learning_rate": 1.9508783922822854e-06, "loss": 2.411, "step": 275530 }, { "epoch": 0.96, "learning_rate": 1.9491345124286316e-06, "loss": 2.3335, "step": 275540 }, { "epoch": 0.96, "learning_rate": 1.9473906325749783e-06, "loss": 2.2698, "step": 275550 }, { "epoch": 0.96, "learning_rate": 1.9456467527213246e-06, "loss": 2.4546, "step": 275560 }, { "epoch": 0.96, "learning_rate": 1.943902872867671e-06, "loss": 2.3219, "step": 275570 }, { "epoch": 0.96, "learning_rate": 1.9421589930140176e-06, "loss": 2.3859, "step": 275580 }, { "epoch": 0.96, "learning_rate": 1.940415113160364e-06, "loss": 2.2927, "step": 275590 }, { "epoch": 0.96, "learning_rate": 1.93867123330671e-06, "loss": 2.3691, "step": 275600 }, { "epoch": 0.96, "learning_rate": 1.936927353453057e-06, "loss": 2.3029, "step": 275610 }, { "epoch": 0.96, "learning_rate": 1.935183473599403e-06, "loss": 2.3409, "step": 275620 }, { "epoch": 0.96, "learning_rate": 1.9334395937457493e-06, "loss": 2.3698, "step": 275630 }, { "epoch": 0.96, "learning_rate": 1.9316957138920956e-06, "loss": 2.3615, "step": 275640 }, { "epoch": 0.96, "learning_rate": 1.9299518340384423e-06, "loss": 2.3045, "step": 275650 }, { "epoch": 0.96, "learning_rate": 1.9282079541847886e-06, "loss": 2.3302, "step": 275660 }, { "epoch": 0.96, "learning_rate": 1.926464074331135e-06, "loss": 2.329, "step": 275670 }, { "epoch": 0.96, "learning_rate": 1.9247201944774815e-06, "loss": 2.3134, "step": 275680 }, { "epoch": 0.96, "learning_rate": 1.922976314623828e-06, "loss": 2.3282, "step": 275690 }, { "epoch": 0.96, "learning_rate": 1.921232434770174e-06, "loss": 2.2998, "step": 275700 }, { "epoch": 0.96, "learning_rate": 1.9194885549165208e-06, "loss": 2.2873, "step": 275710 }, { "epoch": 0.96, "learning_rate": 1.917744675062867e-06, "loss": 2.3491, "step": 275720 }, { "epoch": 0.96, "learning_rate": 1.9160007952092133e-06, "loss": 2.3489, "step": 275730 }, { "epoch": 0.96, "learning_rate": 1.91425691535556e-06, "loss": 2.337, "step": 275740 }, { "epoch": 0.96, "learning_rate": 1.9125130355019063e-06, "loss": 2.2839, "step": 275750 }, { "epoch": 0.96, "learning_rate": 1.9107691556482525e-06, "loss": 2.3607, "step": 275760 }, { "epoch": 0.96, "learning_rate": 1.909025275794599e-06, "loss": 2.235, "step": 275770 }, { "epoch": 0.96, "learning_rate": 1.9072813959409453e-06, "loss": 2.3272, "step": 275780 }, { "epoch": 0.96, "learning_rate": 1.9055375160872916e-06, "loss": 2.3307, "step": 275790 }, { "epoch": 0.96, "learning_rate": 1.9037936362336382e-06, "loss": 2.37, "step": 275800 }, { "epoch": 0.96, "learning_rate": 1.9020497563799845e-06, "loss": 2.2042, "step": 275810 }, { "epoch": 0.96, "learning_rate": 1.9003058765263308e-06, "loss": 2.3326, "step": 275820 }, { "epoch": 0.96, "learning_rate": 1.8985619966726775e-06, "loss": 2.3651, "step": 275830 }, { "epoch": 0.96, "learning_rate": 1.8968181168190237e-06, "loss": 2.3727, "step": 275840 }, { "epoch": 0.96, "learning_rate": 1.89507423696537e-06, "loss": 2.3866, "step": 275850 }, { "epoch": 0.96, "learning_rate": 1.8933303571117167e-06, "loss": 2.3295, "step": 275860 }, { "epoch": 0.96, "learning_rate": 1.891586477258063e-06, "loss": 2.3098, "step": 275870 }, { "epoch": 0.96, "learning_rate": 1.8898425974044092e-06, "loss": 2.3766, "step": 275880 }, { "epoch": 0.96, "learning_rate": 1.8880987175507555e-06, "loss": 2.2799, "step": 275890 }, { "epoch": 0.96, "learning_rate": 1.8863548376971022e-06, "loss": 2.3846, "step": 275900 }, { "epoch": 0.96, "learning_rate": 1.8846109578434485e-06, "loss": 2.3239, "step": 275910 }, { "epoch": 0.96, "learning_rate": 1.8828670779897947e-06, "loss": 2.3721, "step": 275920 }, { "epoch": 0.96, "learning_rate": 1.8811231981361414e-06, "loss": 2.3207, "step": 275930 }, { "epoch": 0.96, "learning_rate": 1.8793793182824877e-06, "loss": 2.3132, "step": 275940 }, { "epoch": 0.96, "learning_rate": 1.877635438428834e-06, "loss": 2.3017, "step": 275950 }, { "epoch": 0.96, "learning_rate": 1.8758915585751807e-06, "loss": 2.382, "step": 275960 }, { "epoch": 0.96, "learning_rate": 1.874147678721527e-06, "loss": 2.3504, "step": 275970 }, { "epoch": 0.96, "learning_rate": 1.8724037988678732e-06, "loss": 2.2937, "step": 275980 }, { "epoch": 0.96, "learning_rate": 1.8706599190142195e-06, "loss": 2.3851, "step": 275990 }, { "epoch": 0.96, "learning_rate": 1.8689160391605662e-06, "loss": 2.3471, "step": 276000 }, { "epoch": 0.96, "learning_rate": 1.8671721593069124e-06, "loss": 2.3789, "step": 276010 }, { "epoch": 0.96, "learning_rate": 1.8654282794532587e-06, "loss": 2.3189, "step": 276020 }, { "epoch": 0.96, "learning_rate": 1.8636843995996054e-06, "loss": 2.3399, "step": 276030 }, { "epoch": 0.96, "learning_rate": 1.8619405197459517e-06, "loss": 2.2782, "step": 276040 }, { "epoch": 0.96, "learning_rate": 1.860196639892298e-06, "loss": 2.3252, "step": 276050 }, { "epoch": 0.96, "learning_rate": 1.8584527600386446e-06, "loss": 2.3058, "step": 276060 }, { "epoch": 0.96, "learning_rate": 1.856708880184991e-06, "loss": 2.2655, "step": 276070 }, { "epoch": 0.96, "learning_rate": 1.8549650003313372e-06, "loss": 2.3606, "step": 276080 }, { "epoch": 0.96, "learning_rate": 1.8532211204776834e-06, "loss": 2.3828, "step": 276090 }, { "epoch": 0.96, "learning_rate": 1.8514772406240301e-06, "loss": 2.321, "step": 276100 }, { "epoch": 0.96, "learning_rate": 1.8497333607703764e-06, "loss": 2.3105, "step": 276110 }, { "epoch": 0.96, "learning_rate": 1.8479894809167227e-06, "loss": 2.4135, "step": 276120 }, { "epoch": 0.96, "learning_rate": 1.8462456010630694e-06, "loss": 2.2479, "step": 276130 }, { "epoch": 0.96, "learning_rate": 1.8445017212094156e-06, "loss": 2.3275, "step": 276140 }, { "epoch": 0.96, "learning_rate": 1.842757841355762e-06, "loss": 2.3251, "step": 276150 }, { "epoch": 0.96, "learning_rate": 1.8410139615021086e-06, "loss": 2.2878, "step": 276160 }, { "epoch": 0.96, "learning_rate": 1.8392700816484549e-06, "loss": 2.3252, "step": 276170 }, { "epoch": 0.96, "learning_rate": 1.8375262017948011e-06, "loss": 2.3657, "step": 276180 }, { "epoch": 0.96, "learning_rate": 1.8357823219411474e-06, "loss": 2.2991, "step": 276190 }, { "epoch": 0.96, "learning_rate": 1.834038442087494e-06, "loss": 2.3454, "step": 276200 }, { "epoch": 0.96, "learning_rate": 1.8322945622338404e-06, "loss": 2.3604, "step": 276210 }, { "epoch": 0.96, "learning_rate": 1.8305506823801866e-06, "loss": 2.3496, "step": 276220 }, { "epoch": 0.96, "learning_rate": 1.8288068025265333e-06, "loss": 2.3492, "step": 276230 }, { "epoch": 0.96, "learning_rate": 1.8270629226728796e-06, "loss": 2.3135, "step": 276240 }, { "epoch": 0.96, "learning_rate": 1.8253190428192259e-06, "loss": 2.3531, "step": 276250 }, { "epoch": 0.96, "learning_rate": 1.8235751629655726e-06, "loss": 2.2857, "step": 276260 }, { "epoch": 0.96, "learning_rate": 1.8218312831119188e-06, "loss": 2.3243, "step": 276270 }, { "epoch": 0.96, "learning_rate": 1.820087403258265e-06, "loss": 2.3525, "step": 276280 }, { "epoch": 0.96, "learning_rate": 1.8183435234046114e-06, "loss": 2.3343, "step": 276290 }, { "epoch": 0.96, "learning_rate": 1.816599643550958e-06, "loss": 2.3231, "step": 276300 }, { "epoch": 0.96, "learning_rate": 1.8148557636973043e-06, "loss": 2.374, "step": 276310 }, { "epoch": 0.96, "learning_rate": 1.8131118838436506e-06, "loss": 2.2764, "step": 276320 }, { "epoch": 0.96, "learning_rate": 1.8113680039899973e-06, "loss": 2.4468, "step": 276330 }, { "epoch": 0.96, "learning_rate": 1.8096241241363436e-06, "loss": 2.3348, "step": 276340 }, { "epoch": 0.96, "learning_rate": 1.8078802442826898e-06, "loss": 2.3468, "step": 276350 }, { "epoch": 0.96, "learning_rate": 1.8061363644290365e-06, "loss": 2.4003, "step": 276360 }, { "epoch": 0.96, "learning_rate": 1.8043924845753828e-06, "loss": 2.2987, "step": 276370 }, { "epoch": 0.96, "learning_rate": 1.802648604721729e-06, "loss": 2.364, "step": 276380 }, { "epoch": 0.96, "learning_rate": 1.8009047248680753e-06, "loss": 2.2562, "step": 276390 }, { "epoch": 0.96, "learning_rate": 1.799160845014422e-06, "loss": 2.3153, "step": 276400 }, { "epoch": 0.96, "learning_rate": 1.7974169651607683e-06, "loss": 2.3523, "step": 276410 }, { "epoch": 0.96, "learning_rate": 1.7956730853071146e-06, "loss": 2.4001, "step": 276420 }, { "epoch": 0.96, "learning_rate": 1.7939292054534613e-06, "loss": 2.3622, "step": 276430 }, { "epoch": 0.96, "learning_rate": 1.7921853255998075e-06, "loss": 2.3533, "step": 276440 }, { "epoch": 0.96, "learning_rate": 1.7904414457461538e-06, "loss": 2.3299, "step": 276450 }, { "epoch": 0.96, "learning_rate": 1.7886975658925005e-06, "loss": 2.4218, "step": 276460 }, { "epoch": 0.96, "learning_rate": 1.7869536860388468e-06, "loss": 2.3467, "step": 276470 }, { "epoch": 0.96, "learning_rate": 1.785209806185193e-06, "loss": 2.2999, "step": 276480 }, { "epoch": 0.96, "learning_rate": 1.7834659263315393e-06, "loss": 2.3576, "step": 276490 }, { "epoch": 0.96, "learning_rate": 1.781722046477886e-06, "loss": 2.323, "step": 276500 }, { "epoch": 0.96, "learning_rate": 1.7799781666242323e-06, "loss": 2.3741, "step": 276510 }, { "epoch": 0.96, "learning_rate": 1.7782342867705785e-06, "loss": 2.3608, "step": 276520 }, { "epoch": 0.96, "learning_rate": 1.7764904069169252e-06, "loss": 2.3261, "step": 276530 }, { "epoch": 0.96, "learning_rate": 1.7747465270632715e-06, "loss": 2.3398, "step": 276540 }, { "epoch": 0.96, "learning_rate": 1.7730026472096178e-06, "loss": 2.3549, "step": 276550 }, { "epoch": 0.96, "learning_rate": 1.7712587673559645e-06, "loss": 2.2308, "step": 276560 }, { "epoch": 0.96, "learning_rate": 1.7695148875023107e-06, "loss": 2.382, "step": 276570 }, { "epoch": 0.96, "learning_rate": 1.767771007648657e-06, "loss": 2.228, "step": 276580 }, { "epoch": 0.96, "learning_rate": 1.7660271277950033e-06, "loss": 2.2977, "step": 276590 }, { "epoch": 0.96, "learning_rate": 1.76428324794135e-06, "loss": 2.3622, "step": 276600 }, { "epoch": 0.96, "learning_rate": 1.7625393680876962e-06, "loss": 2.3321, "step": 276610 }, { "epoch": 0.96, "learning_rate": 1.7607954882340425e-06, "loss": 2.2714, "step": 276620 }, { "epoch": 0.96, "learning_rate": 1.7590516083803892e-06, "loss": 2.2618, "step": 276630 }, { "epoch": 0.96, "learning_rate": 1.7573077285267355e-06, "loss": 2.393, "step": 276640 }, { "epoch": 0.96, "learning_rate": 1.7555638486730817e-06, "loss": 2.3936, "step": 276650 }, { "epoch": 0.96, "learning_rate": 1.7538199688194284e-06, "loss": 2.3609, "step": 276660 }, { "epoch": 0.96, "learning_rate": 1.7520760889657747e-06, "loss": 2.2251, "step": 276670 }, { "epoch": 0.96, "learning_rate": 1.750332209112121e-06, "loss": 2.4141, "step": 276680 }, { "epoch": 0.97, "learning_rate": 1.7485883292584672e-06, "loss": 2.3278, "step": 276690 }, { "epoch": 0.97, "learning_rate": 1.746844449404814e-06, "loss": 2.3494, "step": 276700 }, { "epoch": 0.97, "learning_rate": 1.7451005695511602e-06, "loss": 2.3395, "step": 276710 }, { "epoch": 0.97, "learning_rate": 1.7433566896975065e-06, "loss": 2.3495, "step": 276720 }, { "epoch": 0.97, "learning_rate": 1.7416128098438531e-06, "loss": 2.3565, "step": 276730 }, { "epoch": 0.97, "learning_rate": 1.7398689299901994e-06, "loss": 2.2603, "step": 276740 }, { "epoch": 0.97, "learning_rate": 1.7381250501365457e-06, "loss": 2.2585, "step": 276750 }, { "epoch": 0.97, "learning_rate": 1.7363811702828924e-06, "loss": 2.3886, "step": 276760 }, { "epoch": 0.97, "learning_rate": 1.7346372904292386e-06, "loss": 2.4339, "step": 276770 }, { "epoch": 0.97, "learning_rate": 1.732893410575585e-06, "loss": 2.3027, "step": 276780 }, { "epoch": 0.97, "learning_rate": 1.7311495307219314e-06, "loss": 2.3191, "step": 276790 }, { "epoch": 0.97, "learning_rate": 1.7294056508682779e-06, "loss": 2.3628, "step": 276800 }, { "epoch": 0.97, "learning_rate": 1.7276617710146241e-06, "loss": 2.3321, "step": 276810 }, { "epoch": 0.97, "learning_rate": 1.7259178911609706e-06, "loss": 2.3095, "step": 276820 }, { "epoch": 0.97, "learning_rate": 1.7241740113073171e-06, "loss": 2.3266, "step": 276830 }, { "epoch": 0.97, "learning_rate": 1.7224301314536634e-06, "loss": 2.3622, "step": 276840 }, { "epoch": 0.97, "learning_rate": 1.7206862516000096e-06, "loss": 2.2989, "step": 276850 }, { "epoch": 0.97, "learning_rate": 1.7189423717463563e-06, "loss": 2.3263, "step": 276860 }, { "epoch": 0.97, "learning_rate": 1.7171984918927026e-06, "loss": 2.3001, "step": 276870 }, { "epoch": 0.97, "learning_rate": 1.7154546120390489e-06, "loss": 2.3504, "step": 276880 }, { "epoch": 0.97, "learning_rate": 1.7137107321853954e-06, "loss": 2.3081, "step": 276890 }, { "epoch": 0.97, "learning_rate": 1.7119668523317418e-06, "loss": 2.271, "step": 276900 }, { "epoch": 0.97, "learning_rate": 1.7102229724780881e-06, "loss": 2.3143, "step": 276910 }, { "epoch": 0.97, "learning_rate": 1.7084790926244346e-06, "loss": 2.2501, "step": 276920 }, { "epoch": 0.97, "learning_rate": 1.706735212770781e-06, "loss": 2.3304, "step": 276930 }, { "epoch": 0.97, "learning_rate": 1.7049913329171273e-06, "loss": 2.3647, "step": 276940 }, { "epoch": 0.97, "learning_rate": 1.7032474530634738e-06, "loss": 2.4319, "step": 276950 }, { "epoch": 0.97, "learning_rate": 1.7015035732098203e-06, "loss": 2.3793, "step": 276960 }, { "epoch": 0.97, "learning_rate": 1.6997596933561666e-06, "loss": 2.3636, "step": 276970 }, { "epoch": 0.97, "learning_rate": 1.6980158135025128e-06, "loss": 2.3312, "step": 276980 }, { "epoch": 0.97, "learning_rate": 1.6962719336488593e-06, "loss": 2.3593, "step": 276990 }, { "epoch": 0.97, "learning_rate": 1.6945280537952058e-06, "loss": 2.2383, "step": 277000 }, { "epoch": 0.97, "learning_rate": 1.692784173941552e-06, "loss": 2.3458, "step": 277010 }, { "epoch": 0.97, "learning_rate": 1.6910402940878986e-06, "loss": 2.3504, "step": 277020 }, { "epoch": 0.97, "learning_rate": 1.689296414234245e-06, "loss": 2.3521, "step": 277030 }, { "epoch": 0.97, "learning_rate": 1.6875525343805913e-06, "loss": 2.2828, "step": 277040 }, { "epoch": 0.97, "learning_rate": 1.6858086545269378e-06, "loss": 2.2399, "step": 277050 }, { "epoch": 0.97, "learning_rate": 1.6840647746732843e-06, "loss": 2.3979, "step": 277060 }, { "epoch": 0.97, "learning_rate": 1.6823208948196305e-06, "loss": 2.3229, "step": 277070 }, { "epoch": 0.97, "learning_rate": 1.680577014965977e-06, "loss": 2.285, "step": 277080 }, { "epoch": 0.97, "learning_rate": 1.6788331351123235e-06, "loss": 2.319, "step": 277090 }, { "epoch": 0.97, "learning_rate": 1.6770892552586698e-06, "loss": 2.3974, "step": 277100 }, { "epoch": 0.97, "learning_rate": 1.675345375405016e-06, "loss": 2.314, "step": 277110 }, { "epoch": 0.97, "learning_rate": 1.6736014955513625e-06, "loss": 2.4143, "step": 277120 }, { "epoch": 0.97, "learning_rate": 1.671857615697709e-06, "loss": 2.3344, "step": 277130 }, { "epoch": 0.97, "learning_rate": 1.6701137358440553e-06, "loss": 2.3571, "step": 277140 }, { "epoch": 0.97, "learning_rate": 1.6683698559904018e-06, "loss": 2.3296, "step": 277150 }, { "epoch": 0.97, "learning_rate": 1.6666259761367482e-06, "loss": 2.2606, "step": 277160 }, { "epoch": 0.97, "learning_rate": 1.6648820962830945e-06, "loss": 2.4344, "step": 277170 }, { "epoch": 0.97, "learning_rate": 1.663138216429441e-06, "loss": 2.3219, "step": 277180 }, { "epoch": 0.97, "learning_rate": 1.6613943365757875e-06, "loss": 2.3587, "step": 277190 }, { "epoch": 0.97, "learning_rate": 1.6596504567221337e-06, "loss": 2.3343, "step": 277200 }, { "epoch": 0.97, "learning_rate": 1.6579065768684802e-06, "loss": 2.337, "step": 277210 }, { "epoch": 0.97, "learning_rate": 1.6561626970148265e-06, "loss": 2.3272, "step": 277220 }, { "epoch": 0.97, "learning_rate": 1.654418817161173e-06, "loss": 2.3238, "step": 277230 }, { "epoch": 0.97, "learning_rate": 1.6526749373075192e-06, "loss": 2.3029, "step": 277240 }, { "epoch": 0.97, "learning_rate": 1.6509310574538657e-06, "loss": 2.2861, "step": 277250 }, { "epoch": 0.97, "learning_rate": 1.6491871776002122e-06, "loss": 2.3319, "step": 277260 }, { "epoch": 0.97, "learning_rate": 1.6474432977465585e-06, "loss": 2.326, "step": 277270 }, { "epoch": 0.97, "learning_rate": 1.645699417892905e-06, "loss": 2.3139, "step": 277280 }, { "epoch": 0.97, "learning_rate": 1.6439555380392514e-06, "loss": 2.3772, "step": 277290 }, { "epoch": 0.97, "learning_rate": 1.6422116581855977e-06, "loss": 2.2054, "step": 277300 }, { "epoch": 0.97, "learning_rate": 1.6404677783319442e-06, "loss": 2.3364, "step": 277310 }, { "epoch": 0.97, "learning_rate": 1.6387238984782904e-06, "loss": 2.3758, "step": 277320 }, { "epoch": 0.97, "learning_rate": 1.636980018624637e-06, "loss": 2.3141, "step": 277330 }, { "epoch": 0.97, "learning_rate": 1.6352361387709834e-06, "loss": 2.3557, "step": 277340 }, { "epoch": 0.97, "learning_rate": 1.6334922589173297e-06, "loss": 2.316, "step": 277350 }, { "epoch": 0.97, "learning_rate": 1.6317483790636762e-06, "loss": 2.3097, "step": 277360 }, { "epoch": 0.97, "learning_rate": 1.6300044992100224e-06, "loss": 2.355, "step": 277370 }, { "epoch": 0.97, "learning_rate": 1.628260619356369e-06, "loss": 2.2859, "step": 277380 }, { "epoch": 0.97, "learning_rate": 1.6265167395027154e-06, "loss": 2.3626, "step": 277390 }, { "epoch": 0.97, "learning_rate": 1.6247728596490617e-06, "loss": 2.3168, "step": 277400 }, { "epoch": 0.97, "learning_rate": 1.6230289797954081e-06, "loss": 2.4259, "step": 277410 }, { "epoch": 0.97, "learning_rate": 1.6212850999417544e-06, "loss": 2.2657, "step": 277420 }, { "epoch": 0.97, "learning_rate": 1.6195412200881009e-06, "loss": 2.3692, "step": 277430 }, { "epoch": 0.97, "learning_rate": 1.6177973402344474e-06, "loss": 2.287, "step": 277440 }, { "epoch": 0.97, "learning_rate": 1.6160534603807936e-06, "loss": 2.325, "step": 277450 }, { "epoch": 0.97, "learning_rate": 1.6143095805271401e-06, "loss": 2.3548, "step": 277460 }, { "epoch": 0.97, "learning_rate": 1.6125657006734866e-06, "loss": 2.2935, "step": 277470 }, { "epoch": 0.97, "learning_rate": 1.6108218208198329e-06, "loss": 2.3515, "step": 277480 }, { "epoch": 0.97, "learning_rate": 1.6090779409661794e-06, "loss": 2.3388, "step": 277490 }, { "epoch": 0.97, "learning_rate": 1.6073340611125256e-06, "loss": 2.4097, "step": 277500 }, { "epoch": 0.97, "learning_rate": 1.605590181258872e-06, "loss": 2.2745, "step": 277510 }, { "epoch": 0.97, "learning_rate": 1.6038463014052184e-06, "loss": 2.3393, "step": 277520 }, { "epoch": 0.97, "learning_rate": 1.6021024215515649e-06, "loss": 2.3539, "step": 277530 }, { "epoch": 0.97, "learning_rate": 1.6003585416979113e-06, "loss": 2.3548, "step": 277540 }, { "epoch": 0.97, "learning_rate": 1.5986146618442576e-06, "loss": 2.3452, "step": 277550 }, { "epoch": 0.97, "learning_rate": 1.596870781990604e-06, "loss": 2.2808, "step": 277560 }, { "epoch": 0.97, "learning_rate": 1.5951269021369506e-06, "loss": 2.3374, "step": 277570 }, { "epoch": 0.97, "learning_rate": 1.5933830222832968e-06, "loss": 2.3638, "step": 277580 }, { "epoch": 0.97, "learning_rate": 1.5916391424296433e-06, "loss": 2.3934, "step": 277590 }, { "epoch": 0.97, "learning_rate": 1.5898952625759898e-06, "loss": 2.3649, "step": 277600 }, { "epoch": 0.97, "learning_rate": 1.588151382722336e-06, "loss": 2.2947, "step": 277610 }, { "epoch": 0.97, "learning_rate": 1.5864075028686823e-06, "loss": 2.3803, "step": 277620 }, { "epoch": 0.97, "learning_rate": 1.584663623015029e-06, "loss": 2.383, "step": 277630 }, { "epoch": 0.97, "learning_rate": 1.5829197431613753e-06, "loss": 2.3436, "step": 277640 }, { "epoch": 0.97, "learning_rate": 1.5811758633077216e-06, "loss": 2.34, "step": 277650 }, { "epoch": 0.97, "learning_rate": 1.579431983454068e-06, "loss": 2.3076, "step": 277660 }, { "epoch": 0.97, "learning_rate": 1.5776881036004145e-06, "loss": 2.3054, "step": 277670 }, { "epoch": 0.97, "learning_rate": 1.5759442237467608e-06, "loss": 2.2583, "step": 277680 }, { "epoch": 0.97, "learning_rate": 1.5742003438931073e-06, "loss": 2.2651, "step": 277690 }, { "epoch": 0.97, "learning_rate": 1.5724564640394538e-06, "loss": 2.3163, "step": 277700 }, { "epoch": 0.97, "learning_rate": 1.5707125841858e-06, "loss": 2.4028, "step": 277710 }, { "epoch": 0.97, "learning_rate": 1.5689687043321463e-06, "loss": 2.4175, "step": 277720 }, { "epoch": 0.97, "learning_rate": 1.567224824478493e-06, "loss": 2.3436, "step": 277730 }, { "epoch": 0.97, "learning_rate": 1.5654809446248393e-06, "loss": 2.2984, "step": 277740 }, { "epoch": 0.97, "learning_rate": 1.5637370647711855e-06, "loss": 2.3267, "step": 277750 }, { "epoch": 0.97, "learning_rate": 1.561993184917532e-06, "loss": 2.2867, "step": 277760 }, { "epoch": 0.97, "learning_rate": 1.5602493050638785e-06, "loss": 2.3264, "step": 277770 }, { "epoch": 0.97, "learning_rate": 1.558505425210225e-06, "loss": 2.3827, "step": 277780 }, { "epoch": 0.97, "learning_rate": 1.5567615453565712e-06, "loss": 2.3638, "step": 277790 }, { "epoch": 0.97, "learning_rate": 1.5550176655029177e-06, "loss": 2.3849, "step": 277800 }, { "epoch": 0.97, "learning_rate": 1.553273785649264e-06, "loss": 2.3541, "step": 277810 }, { "epoch": 0.97, "learning_rate": 1.5515299057956105e-06, "loss": 2.3494, "step": 277820 }, { "epoch": 0.97, "learning_rate": 1.549786025941957e-06, "loss": 2.3292, "step": 277830 }, { "epoch": 0.97, "learning_rate": 1.5480421460883032e-06, "loss": 2.3899, "step": 277840 }, { "epoch": 0.97, "learning_rate": 1.5462982662346497e-06, "loss": 2.2984, "step": 277850 }, { "epoch": 0.97, "learning_rate": 1.544554386380996e-06, "loss": 2.372, "step": 277860 }, { "epoch": 0.97, "learning_rate": 1.5428105065273425e-06, "loss": 2.3663, "step": 277870 }, { "epoch": 0.97, "learning_rate": 1.541066626673689e-06, "loss": 2.3788, "step": 277880 }, { "epoch": 0.97, "learning_rate": 1.5393227468200352e-06, "loss": 2.3532, "step": 277890 }, { "epoch": 0.97, "learning_rate": 1.5375788669663817e-06, "loss": 2.3135, "step": 277900 }, { "epoch": 0.97, "learning_rate": 1.535834987112728e-06, "loss": 2.3348, "step": 277910 }, { "epoch": 0.97, "learning_rate": 1.5340911072590744e-06, "loss": 2.3544, "step": 277920 }, { "epoch": 0.97, "learning_rate": 1.532347227405421e-06, "loss": 2.324, "step": 277930 }, { "epoch": 0.97, "learning_rate": 1.5306033475517672e-06, "loss": 2.3515, "step": 277940 }, { "epoch": 0.97, "learning_rate": 1.5288594676981137e-06, "loss": 2.4157, "step": 277950 }, { "epoch": 0.97, "learning_rate": 1.52711558784446e-06, "loss": 2.3576, "step": 277960 }, { "epoch": 0.97, "learning_rate": 1.5253717079908064e-06, "loss": 2.3078, "step": 277970 }, { "epoch": 0.97, "learning_rate": 1.523627828137153e-06, "loss": 2.2789, "step": 277980 }, { "epoch": 0.97, "learning_rate": 1.5218839482834992e-06, "loss": 2.3361, "step": 277990 }, { "epoch": 0.97, "learning_rate": 1.5201400684298456e-06, "loss": 2.3902, "step": 278000 }, { "epoch": 0.97, "learning_rate": 1.518396188576192e-06, "loss": 2.3209, "step": 278010 }, { "epoch": 0.97, "learning_rate": 1.5166523087225384e-06, "loss": 2.3122, "step": 278020 }, { "epoch": 0.97, "learning_rate": 1.5149084288688849e-06, "loss": 2.3805, "step": 278030 }, { "epoch": 0.97, "learning_rate": 1.5131645490152312e-06, "loss": 2.3204, "step": 278040 }, { "epoch": 0.97, "learning_rate": 1.5114206691615776e-06, "loss": 2.4093, "step": 278050 }, { "epoch": 0.97, "learning_rate": 1.509676789307924e-06, "loss": 2.3556, "step": 278060 }, { "epoch": 0.97, "learning_rate": 1.5079329094542704e-06, "loss": 2.2265, "step": 278070 }, { "epoch": 0.97, "learning_rate": 1.5061890296006169e-06, "loss": 2.2627, "step": 278080 }, { "epoch": 0.97, "learning_rate": 1.5044451497469631e-06, "loss": 2.3667, "step": 278090 }, { "epoch": 0.97, "learning_rate": 1.5027012698933096e-06, "loss": 2.3332, "step": 278100 }, { "epoch": 0.97, "learning_rate": 1.5009573900396559e-06, "loss": 2.3032, "step": 278110 }, { "epoch": 0.97, "learning_rate": 1.4992135101860024e-06, "loss": 2.2543, "step": 278120 }, { "epoch": 0.97, "learning_rate": 1.4974696303323488e-06, "loss": 2.2899, "step": 278130 }, { "epoch": 0.97, "learning_rate": 1.4957257504786951e-06, "loss": 2.3835, "step": 278140 }, { "epoch": 0.97, "learning_rate": 1.4939818706250416e-06, "loss": 2.304, "step": 278150 }, { "epoch": 0.97, "learning_rate": 1.4922379907713879e-06, "loss": 2.3797, "step": 278160 }, { "epoch": 0.97, "learning_rate": 1.4904941109177343e-06, "loss": 2.3348, "step": 278170 }, { "epoch": 0.97, "learning_rate": 1.4887502310640808e-06, "loss": 2.3014, "step": 278180 }, { "epoch": 0.97, "learning_rate": 1.487006351210427e-06, "loss": 2.2613, "step": 278190 }, { "epoch": 0.97, "learning_rate": 1.4852624713567736e-06, "loss": 2.3769, "step": 278200 }, { "epoch": 0.97, "learning_rate": 1.4835185915031198e-06, "loss": 2.2904, "step": 278210 }, { "epoch": 0.97, "learning_rate": 1.4817747116494663e-06, "loss": 2.3174, "step": 278220 }, { "epoch": 0.97, "learning_rate": 1.4800308317958128e-06, "loss": 2.3162, "step": 278230 }, { "epoch": 0.97, "learning_rate": 1.478286951942159e-06, "loss": 2.4036, "step": 278240 }, { "epoch": 0.97, "learning_rate": 1.4765430720885056e-06, "loss": 2.3364, "step": 278250 }, { "epoch": 0.97, "learning_rate": 1.4747991922348518e-06, "loss": 2.2916, "step": 278260 }, { "epoch": 0.97, "learning_rate": 1.4730553123811983e-06, "loss": 2.343, "step": 278270 }, { "epoch": 0.97, "learning_rate": 1.4713114325275448e-06, "loss": 2.2887, "step": 278280 }, { "epoch": 0.97, "learning_rate": 1.469567552673891e-06, "loss": 2.3626, "step": 278290 }, { "epoch": 0.97, "learning_rate": 1.4678236728202375e-06, "loss": 2.3092, "step": 278300 }, { "epoch": 0.97, "learning_rate": 1.4660797929665838e-06, "loss": 2.352, "step": 278310 }, { "epoch": 0.97, "learning_rate": 1.4643359131129303e-06, "loss": 2.3208, "step": 278320 }, { "epoch": 0.97, "learning_rate": 1.4625920332592768e-06, "loss": 2.354, "step": 278330 }, { "epoch": 0.97, "learning_rate": 1.460848153405623e-06, "loss": 2.2933, "step": 278340 }, { "epoch": 0.97, "learning_rate": 1.4591042735519695e-06, "loss": 2.3144, "step": 278350 }, { "epoch": 0.97, "learning_rate": 1.4573603936983158e-06, "loss": 2.337, "step": 278360 }, { "epoch": 0.97, "learning_rate": 1.4556165138446623e-06, "loss": 2.3463, "step": 278370 }, { "epoch": 0.97, "learning_rate": 1.4538726339910088e-06, "loss": 2.3786, "step": 278380 }, { "epoch": 0.97, "learning_rate": 1.452128754137355e-06, "loss": 2.3333, "step": 278390 }, { "epoch": 0.97, "learning_rate": 1.4503848742837015e-06, "loss": 2.3508, "step": 278400 }, { "epoch": 0.97, "learning_rate": 1.4486409944300478e-06, "loss": 2.3259, "step": 278410 }, { "epoch": 0.97, "learning_rate": 1.4468971145763943e-06, "loss": 2.3298, "step": 278420 }, { "epoch": 0.97, "learning_rate": 1.4451532347227407e-06, "loss": 2.3153, "step": 278430 }, { "epoch": 0.97, "learning_rate": 1.443409354869087e-06, "loss": 2.2877, "step": 278440 }, { "epoch": 0.97, "learning_rate": 1.4416654750154335e-06, "loss": 2.3431, "step": 278450 }, { "epoch": 0.97, "learning_rate": 1.4399215951617798e-06, "loss": 2.2773, "step": 278460 }, { "epoch": 0.97, "learning_rate": 1.4381777153081262e-06, "loss": 2.3317, "step": 278470 }, { "epoch": 0.97, "learning_rate": 1.4364338354544727e-06, "loss": 2.3628, "step": 278480 }, { "epoch": 0.97, "learning_rate": 1.434689955600819e-06, "loss": 2.3132, "step": 278490 }, { "epoch": 0.97, "learning_rate": 1.4329460757471655e-06, "loss": 2.2925, "step": 278500 }, { "epoch": 0.97, "learning_rate": 1.4312021958935117e-06, "loss": 2.3429, "step": 278510 }, { "epoch": 0.97, "learning_rate": 1.4294583160398582e-06, "loss": 2.2532, "step": 278520 }, { "epoch": 0.97, "learning_rate": 1.4277144361862047e-06, "loss": 2.3449, "step": 278530 }, { "epoch": 0.97, "learning_rate": 1.425970556332551e-06, "loss": 2.3521, "step": 278540 }, { "epoch": 0.97, "learning_rate": 1.4242266764788974e-06, "loss": 2.3178, "step": 278550 }, { "epoch": 0.97, "learning_rate": 1.4224827966252437e-06, "loss": 2.3759, "step": 278560 }, { "epoch": 0.97, "learning_rate": 1.4207389167715902e-06, "loss": 2.3996, "step": 278570 }, { "epoch": 0.97, "learning_rate": 1.4189950369179367e-06, "loss": 2.3713, "step": 278580 }, { "epoch": 0.97, "learning_rate": 1.417251157064283e-06, "loss": 2.3159, "step": 278590 }, { "epoch": 0.97, "learning_rate": 1.4155072772106294e-06, "loss": 2.3245, "step": 278600 }, { "epoch": 0.97, "learning_rate": 1.4137633973569757e-06, "loss": 2.3682, "step": 278610 }, { "epoch": 0.97, "learning_rate": 1.4120195175033222e-06, "loss": 2.3625, "step": 278620 }, { "epoch": 0.97, "learning_rate": 1.4102756376496687e-06, "loss": 2.3136, "step": 278630 }, { "epoch": 0.97, "learning_rate": 1.408531757796015e-06, "loss": 2.3661, "step": 278640 }, { "epoch": 0.97, "learning_rate": 1.4067878779423614e-06, "loss": 2.3093, "step": 278650 }, { "epoch": 0.97, "learning_rate": 1.4050439980887077e-06, "loss": 2.3357, "step": 278660 }, { "epoch": 0.97, "learning_rate": 1.4033001182350542e-06, "loss": 2.4361, "step": 278670 }, { "epoch": 0.97, "learning_rate": 1.4015562383814006e-06, "loss": 2.3896, "step": 278680 }, { "epoch": 0.97, "learning_rate": 1.399812358527747e-06, "loss": 2.3109, "step": 278690 }, { "epoch": 0.97, "learning_rate": 1.3980684786740934e-06, "loss": 2.318, "step": 278700 }, { "epoch": 0.97, "learning_rate": 1.3963245988204397e-06, "loss": 2.2617, "step": 278710 }, { "epoch": 0.97, "learning_rate": 1.3945807189667861e-06, "loss": 2.258, "step": 278720 }, { "epoch": 0.97, "learning_rate": 1.3928368391131326e-06, "loss": 2.2691, "step": 278730 }, { "epoch": 0.97, "learning_rate": 1.3910929592594789e-06, "loss": 2.3656, "step": 278740 }, { "epoch": 0.97, "learning_rate": 1.3893490794058254e-06, "loss": 2.3934, "step": 278750 }, { "epoch": 0.97, "learning_rate": 1.3876051995521716e-06, "loss": 2.3395, "step": 278760 }, { "epoch": 0.97, "learning_rate": 1.3858613196985181e-06, "loss": 2.2575, "step": 278770 }, { "epoch": 0.97, "learning_rate": 1.3841174398448646e-06, "loss": 2.3381, "step": 278780 }, { "epoch": 0.97, "learning_rate": 1.3823735599912109e-06, "loss": 2.3656, "step": 278790 }, { "epoch": 0.97, "learning_rate": 1.3806296801375574e-06, "loss": 2.3697, "step": 278800 }, { "epoch": 0.97, "learning_rate": 1.3788858002839036e-06, "loss": 2.3138, "step": 278810 }, { "epoch": 0.97, "learning_rate": 1.3771419204302501e-06, "loss": 2.3266, "step": 278820 }, { "epoch": 0.97, "learning_rate": 1.3753980405765966e-06, "loss": 2.3138, "step": 278830 }, { "epoch": 0.97, "learning_rate": 1.3736541607229429e-06, "loss": 2.3549, "step": 278840 }, { "epoch": 0.97, "learning_rate": 1.3719102808692893e-06, "loss": 2.3384, "step": 278850 }, { "epoch": 0.97, "learning_rate": 1.3701664010156356e-06, "loss": 2.2917, "step": 278860 }, { "epoch": 0.97, "learning_rate": 1.368422521161982e-06, "loss": 2.3026, "step": 278870 }, { "epoch": 0.97, "learning_rate": 1.3666786413083286e-06, "loss": 2.3492, "step": 278880 }, { "epoch": 0.97, "learning_rate": 1.3649347614546748e-06, "loss": 2.2768, "step": 278890 }, { "epoch": 0.97, "learning_rate": 1.3631908816010213e-06, "loss": 2.345, "step": 278900 }, { "epoch": 0.97, "learning_rate": 1.3614470017473676e-06, "loss": 2.3044, "step": 278910 }, { "epoch": 0.97, "learning_rate": 1.359703121893714e-06, "loss": 2.3242, "step": 278920 }, { "epoch": 0.97, "learning_rate": 1.3579592420400606e-06, "loss": 2.3329, "step": 278930 }, { "epoch": 0.97, "learning_rate": 1.3562153621864068e-06, "loss": 2.2569, "step": 278940 }, { "epoch": 0.97, "learning_rate": 1.3544714823327533e-06, "loss": 2.2592, "step": 278950 }, { "epoch": 0.97, "learning_rate": 1.3527276024790996e-06, "loss": 2.3681, "step": 278960 }, { "epoch": 0.97, "learning_rate": 1.350983722625446e-06, "loss": 2.3242, "step": 278970 }, { "epoch": 0.97, "learning_rate": 1.3492398427717925e-06, "loss": 2.3777, "step": 278980 }, { "epoch": 0.97, "learning_rate": 1.3474959629181388e-06, "loss": 2.381, "step": 278990 }, { "epoch": 0.97, "learning_rate": 1.3457520830644853e-06, "loss": 2.3802, "step": 279000 }, { "epoch": 0.97, "learning_rate": 1.3440082032108316e-06, "loss": 2.2971, "step": 279010 }, { "epoch": 0.97, "learning_rate": 1.342264323357178e-06, "loss": 2.3322, "step": 279020 }, { "epoch": 0.97, "learning_rate": 1.3405204435035245e-06, "loss": 2.2185, "step": 279030 }, { "epoch": 0.97, "learning_rate": 1.3387765636498708e-06, "loss": 2.3178, "step": 279040 }, { "epoch": 0.97, "learning_rate": 1.3370326837962173e-06, "loss": 2.3357, "step": 279050 }, { "epoch": 0.97, "learning_rate": 1.3352888039425635e-06, "loss": 2.3796, "step": 279060 }, { "epoch": 0.97, "learning_rate": 1.33354492408891e-06, "loss": 2.3719, "step": 279070 }, { "epoch": 0.97, "learning_rate": 1.3318010442352565e-06, "loss": 2.3669, "step": 279080 }, { "epoch": 0.97, "learning_rate": 1.3300571643816028e-06, "loss": 2.3042, "step": 279090 }, { "epoch": 0.97, "learning_rate": 1.3283132845279492e-06, "loss": 2.2563, "step": 279100 }, { "epoch": 0.97, "learning_rate": 1.3265694046742955e-06, "loss": 2.322, "step": 279110 }, { "epoch": 0.97, "learning_rate": 1.324825524820642e-06, "loss": 2.3694, "step": 279120 }, { "epoch": 0.97, "learning_rate": 1.3230816449669885e-06, "loss": 2.3016, "step": 279130 }, { "epoch": 0.97, "learning_rate": 1.3213377651133347e-06, "loss": 2.3438, "step": 279140 }, { "epoch": 0.97, "learning_rate": 1.3195938852596812e-06, "loss": 2.3434, "step": 279150 }, { "epoch": 0.97, "learning_rate": 1.3178500054060275e-06, "loss": 2.3054, "step": 279160 }, { "epoch": 0.97, "learning_rate": 1.316106125552374e-06, "loss": 2.3734, "step": 279170 }, { "epoch": 0.97, "learning_rate": 1.3143622456987205e-06, "loss": 2.4254, "step": 279180 }, { "epoch": 0.97, "learning_rate": 1.3126183658450667e-06, "loss": 2.3152, "step": 279190 }, { "epoch": 0.97, "learning_rate": 1.3108744859914132e-06, "loss": 2.3591, "step": 279200 }, { "epoch": 0.97, "learning_rate": 1.3091306061377597e-06, "loss": 2.3276, "step": 279210 }, { "epoch": 0.97, "learning_rate": 1.307386726284106e-06, "loss": 2.3104, "step": 279220 }, { "epoch": 0.97, "learning_rate": 1.3056428464304524e-06, "loss": 2.2852, "step": 279230 }, { "epoch": 0.97, "learning_rate": 1.3038989665767987e-06, "loss": 2.3251, "step": 279240 }, { "epoch": 0.97, "learning_rate": 1.3021550867231452e-06, "loss": 2.2883, "step": 279250 }, { "epoch": 0.97, "learning_rate": 1.3004112068694917e-06, "loss": 2.3234, "step": 279260 }, { "epoch": 0.97, "learning_rate": 1.298667327015838e-06, "loss": 2.306, "step": 279270 }, { "epoch": 0.97, "learning_rate": 1.2969234471621844e-06, "loss": 2.3825, "step": 279280 }, { "epoch": 0.97, "learning_rate": 1.2951795673085307e-06, "loss": 2.2784, "step": 279290 }, { "epoch": 0.97, "learning_rate": 1.2934356874548772e-06, "loss": 2.3108, "step": 279300 }, { "epoch": 0.97, "learning_rate": 1.2916918076012237e-06, "loss": 2.3376, "step": 279310 }, { "epoch": 0.97, "learning_rate": 1.28994792774757e-06, "loss": 2.3486, "step": 279320 }, { "epoch": 0.97, "learning_rate": 1.2882040478939164e-06, "loss": 2.3376, "step": 279330 }, { "epoch": 0.97, "learning_rate": 1.2864601680402627e-06, "loss": 2.3637, "step": 279340 }, { "epoch": 0.97, "learning_rate": 1.2847162881866092e-06, "loss": 2.3065, "step": 279350 }, { "epoch": 0.97, "learning_rate": 1.2829724083329556e-06, "loss": 2.3613, "step": 279360 }, { "epoch": 0.97, "learning_rate": 1.281228528479302e-06, "loss": 2.3279, "step": 279370 }, { "epoch": 0.97, "learning_rate": 1.2794846486256484e-06, "loss": 2.3155, "step": 279380 }, { "epoch": 0.97, "learning_rate": 1.2777407687719947e-06, "loss": 2.3052, "step": 279390 }, { "epoch": 0.97, "learning_rate": 1.2759968889183411e-06, "loss": 2.2864, "step": 279400 }, { "epoch": 0.97, "learning_rate": 1.2742530090646876e-06, "loss": 2.299, "step": 279410 }, { "epoch": 0.97, "learning_rate": 1.2725091292110339e-06, "loss": 2.3972, "step": 279420 }, { "epoch": 0.97, "learning_rate": 1.2707652493573804e-06, "loss": 2.3763, "step": 279430 }, { "epoch": 0.97, "learning_rate": 1.2690213695037266e-06, "loss": 2.3201, "step": 279440 }, { "epoch": 0.97, "learning_rate": 1.2672774896500731e-06, "loss": 2.3675, "step": 279450 }, { "epoch": 0.97, "learning_rate": 1.2655336097964196e-06, "loss": 2.3333, "step": 279460 }, { "epoch": 0.97, "learning_rate": 1.2637897299427659e-06, "loss": 2.2821, "step": 279470 }, { "epoch": 0.97, "learning_rate": 1.2620458500891123e-06, "loss": 2.2847, "step": 279480 }, { "epoch": 0.97, "learning_rate": 1.2603019702354586e-06, "loss": 2.2814, "step": 279490 }, { "epoch": 0.97, "learning_rate": 1.258558090381805e-06, "loss": 2.307, "step": 279500 }, { "epoch": 0.97, "learning_rate": 1.2568142105281516e-06, "loss": 2.3682, "step": 279510 }, { "epoch": 0.97, "learning_rate": 1.2550703306744978e-06, "loss": 2.3472, "step": 279520 }, { "epoch": 0.97, "learning_rate": 1.2533264508208443e-06, "loss": 2.3717, "step": 279530 }, { "epoch": 0.97, "learning_rate": 1.2515825709671906e-06, "loss": 2.2552, "step": 279540 }, { "epoch": 0.98, "learning_rate": 1.249838691113537e-06, "loss": 2.3178, "step": 279550 }, { "epoch": 0.98, "learning_rate": 1.2480948112598836e-06, "loss": 2.3326, "step": 279560 }, { "epoch": 0.98, "learning_rate": 1.2463509314062298e-06, "loss": 2.3331, "step": 279570 }, { "epoch": 0.98, "learning_rate": 1.2446070515525763e-06, "loss": 2.3915, "step": 279580 }, { "epoch": 0.98, "learning_rate": 1.2428631716989226e-06, "loss": 2.2427, "step": 279590 }, { "epoch": 0.98, "learning_rate": 1.241119291845269e-06, "loss": 2.3555, "step": 279600 }, { "epoch": 0.98, "learning_rate": 1.2393754119916155e-06, "loss": 2.353, "step": 279610 }, { "epoch": 0.98, "learning_rate": 1.2376315321379618e-06, "loss": 2.3514, "step": 279620 }, { "epoch": 0.98, "learning_rate": 1.2358876522843083e-06, "loss": 2.3847, "step": 279630 }, { "epoch": 0.98, "learning_rate": 1.2341437724306546e-06, "loss": 2.2868, "step": 279640 }, { "epoch": 0.98, "learning_rate": 1.232399892577001e-06, "loss": 2.3753, "step": 279650 }, { "epoch": 0.98, "learning_rate": 1.2306560127233475e-06, "loss": 2.3654, "step": 279660 }, { "epoch": 0.98, "learning_rate": 1.2289121328696938e-06, "loss": 2.3612, "step": 279670 }, { "epoch": 0.98, "learning_rate": 1.2271682530160403e-06, "loss": 2.3094, "step": 279680 }, { "epoch": 0.98, "learning_rate": 1.2254243731623865e-06, "loss": 2.2026, "step": 279690 }, { "epoch": 0.98, "learning_rate": 1.223680493308733e-06, "loss": 2.3017, "step": 279700 }, { "epoch": 0.98, "learning_rate": 1.2219366134550795e-06, "loss": 2.333, "step": 279710 }, { "epoch": 0.98, "learning_rate": 1.2201927336014258e-06, "loss": 2.2436, "step": 279720 }, { "epoch": 0.98, "learning_rate": 1.2184488537477723e-06, "loss": 2.4421, "step": 279730 }, { "epoch": 0.98, "learning_rate": 1.2167049738941185e-06, "loss": 2.2402, "step": 279740 }, { "epoch": 0.98, "learning_rate": 1.214961094040465e-06, "loss": 2.3128, "step": 279750 }, { "epoch": 0.98, "learning_rate": 1.2132172141868115e-06, "loss": 2.3544, "step": 279760 }, { "epoch": 0.98, "learning_rate": 1.2114733343331578e-06, "loss": 2.2452, "step": 279770 }, { "epoch": 0.98, "learning_rate": 1.2097294544795042e-06, "loss": 2.3058, "step": 279780 }, { "epoch": 0.98, "learning_rate": 1.2079855746258505e-06, "loss": 2.3217, "step": 279790 }, { "epoch": 0.98, "learning_rate": 1.206241694772197e-06, "loss": 2.2893, "step": 279800 }, { "epoch": 0.98, "learning_rate": 1.2044978149185435e-06, "loss": 2.3332, "step": 279810 }, { "epoch": 0.98, "learning_rate": 1.2027539350648897e-06, "loss": 2.2755, "step": 279820 }, { "epoch": 0.98, "learning_rate": 1.2010100552112362e-06, "loss": 2.2943, "step": 279830 }, { "epoch": 0.98, "learning_rate": 1.1992661753575825e-06, "loss": 2.3852, "step": 279840 }, { "epoch": 0.98, "learning_rate": 1.197522295503929e-06, "loss": 2.3405, "step": 279850 }, { "epoch": 0.98, "learning_rate": 1.1957784156502755e-06, "loss": 2.4067, "step": 279860 }, { "epoch": 0.98, "learning_rate": 1.1940345357966217e-06, "loss": 2.3257, "step": 279870 }, { "epoch": 0.98, "learning_rate": 1.1922906559429682e-06, "loss": 2.3366, "step": 279880 }, { "epoch": 0.98, "learning_rate": 1.1905467760893145e-06, "loss": 2.3337, "step": 279890 }, { "epoch": 0.98, "learning_rate": 1.188802896235661e-06, "loss": 2.3136, "step": 279900 }, { "epoch": 0.98, "learning_rate": 1.1870590163820074e-06, "loss": 2.3004, "step": 279910 }, { "epoch": 0.98, "learning_rate": 1.1853151365283537e-06, "loss": 2.3569, "step": 279920 }, { "epoch": 0.98, "learning_rate": 1.1835712566747002e-06, "loss": 2.3974, "step": 279930 }, { "epoch": 0.98, "learning_rate": 1.1818273768210465e-06, "loss": 2.3285, "step": 279940 }, { "epoch": 0.98, "learning_rate": 1.180083496967393e-06, "loss": 2.2694, "step": 279950 }, { "epoch": 0.98, "learning_rate": 1.1783396171137394e-06, "loss": 2.3329, "step": 279960 }, { "epoch": 0.98, "learning_rate": 1.1765957372600857e-06, "loss": 2.3159, "step": 279970 }, { "epoch": 0.98, "learning_rate": 1.1748518574064322e-06, "loss": 2.3179, "step": 279980 }, { "epoch": 0.98, "learning_rate": 1.1731079775527784e-06, "loss": 2.3373, "step": 279990 }, { "epoch": 0.98, "learning_rate": 1.171364097699125e-06, "loss": 2.25, "step": 280000 }, { "epoch": 0.98, "learning_rate": 1.1696202178454714e-06, "loss": 2.3636, "step": 280010 }, { "epoch": 0.98, "learning_rate": 1.1678763379918177e-06, "loss": 2.3867, "step": 280020 }, { "epoch": 0.98, "learning_rate": 1.1661324581381641e-06, "loss": 2.2982, "step": 280030 }, { "epoch": 0.98, "learning_rate": 1.1643885782845104e-06, "loss": 2.3727, "step": 280040 }, { "epoch": 0.98, "learning_rate": 1.162644698430857e-06, "loss": 2.2825, "step": 280050 }, { "epoch": 0.98, "learning_rate": 1.1609008185772034e-06, "loss": 2.244, "step": 280060 }, { "epoch": 0.98, "learning_rate": 1.1591569387235496e-06, "loss": 2.3003, "step": 280070 }, { "epoch": 0.98, "learning_rate": 1.1574130588698961e-06, "loss": 2.33, "step": 280080 }, { "epoch": 0.98, "learning_rate": 1.1556691790162424e-06, "loss": 2.3407, "step": 280090 }, { "epoch": 0.98, "learning_rate": 1.1539252991625889e-06, "loss": 2.2636, "step": 280100 }, { "epoch": 0.98, "learning_rate": 1.1521814193089354e-06, "loss": 2.3598, "step": 280110 }, { "epoch": 0.98, "learning_rate": 1.1504375394552816e-06, "loss": 2.3698, "step": 280120 }, { "epoch": 0.98, "learning_rate": 1.1486936596016281e-06, "loss": 2.268, "step": 280130 }, { "epoch": 0.98, "learning_rate": 1.1469497797479744e-06, "loss": 2.2854, "step": 280140 }, { "epoch": 0.98, "learning_rate": 1.1452058998943209e-06, "loss": 2.341, "step": 280150 }, { "epoch": 0.98, "learning_rate": 1.1434620200406673e-06, "loss": 2.2885, "step": 280160 }, { "epoch": 0.98, "learning_rate": 1.1417181401870136e-06, "loss": 2.2885, "step": 280170 }, { "epoch": 0.98, "learning_rate": 1.13997426033336e-06, "loss": 2.374, "step": 280180 }, { "epoch": 0.98, "learning_rate": 1.1382303804797064e-06, "loss": 2.3493, "step": 280190 }, { "epoch": 0.98, "learning_rate": 1.1364865006260528e-06, "loss": 2.2976, "step": 280200 }, { "epoch": 0.98, "learning_rate": 1.1347426207723993e-06, "loss": 2.3391, "step": 280210 }, { "epoch": 0.98, "learning_rate": 1.1329987409187456e-06, "loss": 2.3192, "step": 280220 }, { "epoch": 0.98, "learning_rate": 1.131254861065092e-06, "loss": 2.2497, "step": 280230 }, { "epoch": 0.98, "learning_rate": 1.1295109812114383e-06, "loss": 2.3443, "step": 280240 }, { "epoch": 0.98, "learning_rate": 1.1277671013577848e-06, "loss": 2.3276, "step": 280250 }, { "epoch": 0.98, "learning_rate": 1.1260232215041313e-06, "loss": 2.4156, "step": 280260 }, { "epoch": 0.98, "learning_rate": 1.1242793416504776e-06, "loss": 2.3265, "step": 280270 }, { "epoch": 0.98, "learning_rate": 1.122535461796824e-06, "loss": 2.2524, "step": 280280 }, { "epoch": 0.98, "learning_rate": 1.1207915819431703e-06, "loss": 2.3486, "step": 280290 }, { "epoch": 0.98, "learning_rate": 1.1190477020895168e-06, "loss": 2.3647, "step": 280300 }, { "epoch": 0.98, "learning_rate": 1.1173038222358633e-06, "loss": 2.3989, "step": 280310 }, { "epoch": 0.98, "learning_rate": 1.1155599423822096e-06, "loss": 2.3715, "step": 280320 }, { "epoch": 0.98, "learning_rate": 1.113816062528556e-06, "loss": 2.2271, "step": 280330 }, { "epoch": 0.98, "learning_rate": 1.1120721826749023e-06, "loss": 2.3418, "step": 280340 }, { "epoch": 0.98, "learning_rate": 1.1103283028212488e-06, "loss": 2.3049, "step": 280350 }, { "epoch": 0.98, "learning_rate": 1.1085844229675953e-06, "loss": 2.2826, "step": 280360 }, { "epoch": 0.98, "learning_rate": 1.1068405431139415e-06, "loss": 2.3888, "step": 280370 }, { "epoch": 0.98, "learning_rate": 1.105096663260288e-06, "loss": 2.3753, "step": 280380 }, { "epoch": 0.98, "learning_rate": 1.1033527834066343e-06, "loss": 2.3884, "step": 280390 }, { "epoch": 0.98, "learning_rate": 1.1016089035529808e-06, "loss": 2.3417, "step": 280400 }, { "epoch": 0.98, "learning_rate": 1.0998650236993272e-06, "loss": 2.2516, "step": 280410 }, { "epoch": 0.98, "learning_rate": 1.0981211438456735e-06, "loss": 2.2852, "step": 280420 }, { "epoch": 0.98, "learning_rate": 1.09637726399202e-06, "loss": 2.3511, "step": 280430 }, { "epoch": 0.98, "learning_rate": 1.0946333841383663e-06, "loss": 2.3162, "step": 280440 }, { "epoch": 0.98, "learning_rate": 1.0928895042847127e-06, "loss": 2.3128, "step": 280450 }, { "epoch": 0.98, "learning_rate": 1.0911456244310592e-06, "loss": 2.3081, "step": 280460 }, { "epoch": 0.98, "learning_rate": 1.0894017445774055e-06, "loss": 2.2366, "step": 280470 }, { "epoch": 0.98, "learning_rate": 1.087657864723752e-06, "loss": 2.3583, "step": 280480 }, { "epoch": 0.98, "learning_rate": 1.0859139848700985e-06, "loss": 2.4366, "step": 280490 }, { "epoch": 0.98, "learning_rate": 1.0841701050164447e-06, "loss": 2.3559, "step": 280500 }, { "epoch": 0.98, "learning_rate": 1.0824262251627912e-06, "loss": 2.3926, "step": 280510 }, { "epoch": 0.98, "learning_rate": 1.0806823453091375e-06, "loss": 2.3255, "step": 280520 }, { "epoch": 0.98, "learning_rate": 1.078938465455484e-06, "loss": 2.2952, "step": 280530 }, { "epoch": 0.98, "learning_rate": 1.0771945856018304e-06, "loss": 2.3156, "step": 280540 }, { "epoch": 0.98, "learning_rate": 1.0754507057481767e-06, "loss": 2.3685, "step": 280550 }, { "epoch": 0.98, "learning_rate": 1.0737068258945232e-06, "loss": 2.3392, "step": 280560 }, { "epoch": 0.98, "learning_rate": 1.0719629460408695e-06, "loss": 2.2513, "step": 280570 }, { "epoch": 0.98, "learning_rate": 1.070219066187216e-06, "loss": 2.3906, "step": 280580 }, { "epoch": 0.98, "learning_rate": 1.0684751863335624e-06, "loss": 2.4292, "step": 280590 }, { "epoch": 0.98, "learning_rate": 1.0667313064799087e-06, "loss": 2.3071, "step": 280600 }, { "epoch": 0.98, "learning_rate": 1.0649874266262552e-06, "loss": 2.2823, "step": 280610 }, { "epoch": 0.98, "learning_rate": 1.0632435467726017e-06, "loss": 2.3918, "step": 280620 }, { "epoch": 0.98, "learning_rate": 1.061499666918948e-06, "loss": 2.373, "step": 280630 }, { "epoch": 0.98, "learning_rate": 1.0597557870652944e-06, "loss": 2.2933, "step": 280640 }, { "epoch": 0.98, "learning_rate": 1.0580119072116407e-06, "loss": 2.3902, "step": 280650 }, { "epoch": 0.98, "learning_rate": 1.0562680273579872e-06, "loss": 2.3038, "step": 280660 }, { "epoch": 0.98, "learning_rate": 1.0545241475043336e-06, "loss": 2.3193, "step": 280670 }, { "epoch": 0.98, "learning_rate": 1.05278026765068e-06, "loss": 2.318, "step": 280680 }, { "epoch": 0.98, "learning_rate": 1.0510363877970264e-06, "loss": 2.2825, "step": 280690 }, { "epoch": 0.98, "learning_rate": 1.0492925079433727e-06, "loss": 2.3866, "step": 280700 }, { "epoch": 0.98, "learning_rate": 1.0475486280897191e-06, "loss": 2.3139, "step": 280710 }, { "epoch": 0.98, "learning_rate": 1.0458047482360656e-06, "loss": 2.3015, "step": 280720 }, { "epoch": 0.98, "learning_rate": 1.0440608683824119e-06, "loss": 2.3487, "step": 280730 }, { "epoch": 0.98, "learning_rate": 1.0423169885287584e-06, "loss": 2.3054, "step": 280740 }, { "epoch": 0.98, "learning_rate": 1.0405731086751049e-06, "loss": 2.3619, "step": 280750 }, { "epoch": 0.98, "learning_rate": 1.0388292288214511e-06, "loss": 2.3117, "step": 280760 }, { "epoch": 0.98, "learning_rate": 1.0370853489677976e-06, "loss": 2.2986, "step": 280770 }, { "epoch": 0.98, "learning_rate": 1.0353414691141439e-06, "loss": 2.38, "step": 280780 }, { "epoch": 0.98, "learning_rate": 1.0335975892604904e-06, "loss": 2.3388, "step": 280790 }, { "epoch": 0.98, "learning_rate": 1.0318537094068368e-06, "loss": 2.3113, "step": 280800 }, { "epoch": 0.98, "learning_rate": 1.030109829553183e-06, "loss": 2.3712, "step": 280810 }, { "epoch": 0.98, "learning_rate": 1.0283659496995296e-06, "loss": 2.3473, "step": 280820 }, { "epoch": 0.98, "learning_rate": 1.026622069845876e-06, "loss": 2.2589, "step": 280830 }, { "epoch": 0.98, "learning_rate": 1.0248781899922223e-06, "loss": 2.3086, "step": 280840 }, { "epoch": 0.98, "learning_rate": 1.0231343101385688e-06, "loss": 2.2784, "step": 280850 }, { "epoch": 0.98, "learning_rate": 1.021390430284915e-06, "loss": 2.3585, "step": 280860 }, { "epoch": 0.98, "learning_rate": 1.0196465504312616e-06, "loss": 2.3574, "step": 280870 }, { "epoch": 0.98, "learning_rate": 1.017902670577608e-06, "loss": 2.3566, "step": 280880 }, { "epoch": 0.98, "learning_rate": 1.0161587907239543e-06, "loss": 2.391, "step": 280890 }, { "epoch": 0.98, "learning_rate": 1.0144149108703008e-06, "loss": 2.327, "step": 280900 }, { "epoch": 0.98, "learning_rate": 1.012671031016647e-06, "loss": 2.3959, "step": 280910 }, { "epoch": 0.98, "learning_rate": 1.0109271511629935e-06, "loss": 2.2774, "step": 280920 }, { "epoch": 0.98, "learning_rate": 1.00918327130934e-06, "loss": 2.3272, "step": 280930 }, { "epoch": 0.98, "learning_rate": 1.0074393914556863e-06, "loss": 2.3326, "step": 280940 }, { "epoch": 0.98, "learning_rate": 1.0056955116020328e-06, "loss": 2.35, "step": 280950 }, { "epoch": 0.98, "learning_rate": 1.0039516317483793e-06, "loss": 2.3604, "step": 280960 }, { "epoch": 0.98, "learning_rate": 1.0022077518947255e-06, "loss": 2.3668, "step": 280970 }, { "epoch": 0.98, "learning_rate": 1.000463872041072e-06, "loss": 2.3462, "step": 280980 }, { "epoch": 0.98, "learning_rate": 9.987199921874183e-07, "loss": 2.3687, "step": 280990 }, { "epoch": 0.98, "learning_rate": 9.969761123337648e-07, "loss": 2.2979, "step": 281000 }, { "epoch": 0.98, "learning_rate": 9.952322324801112e-07, "loss": 2.3385, "step": 281010 }, { "epoch": 0.98, "learning_rate": 9.934883526264575e-07, "loss": 2.4258, "step": 281020 }, { "epoch": 0.98, "learning_rate": 9.91744472772804e-07, "loss": 2.3557, "step": 281030 }, { "epoch": 0.98, "learning_rate": 9.900005929191503e-07, "loss": 2.3582, "step": 281040 }, { "epoch": 0.98, "learning_rate": 9.882567130654967e-07, "loss": 2.4087, "step": 281050 }, { "epoch": 0.98, "learning_rate": 9.865128332118432e-07, "loss": 2.3294, "step": 281060 }, { "epoch": 0.98, "learning_rate": 9.847689533581895e-07, "loss": 2.4166, "step": 281070 }, { "epoch": 0.98, "learning_rate": 9.83025073504536e-07, "loss": 2.3247, "step": 281080 }, { "epoch": 0.98, "learning_rate": 9.812811936508825e-07, "loss": 2.4197, "step": 281090 }, { "epoch": 0.98, "learning_rate": 9.795373137972287e-07, "loss": 2.4286, "step": 281100 }, { "epoch": 0.98, "learning_rate": 9.777934339435752e-07, "loss": 2.3266, "step": 281110 }, { "epoch": 0.98, "learning_rate": 9.760495540899215e-07, "loss": 2.2863, "step": 281120 }, { "epoch": 0.98, "learning_rate": 9.74305674236268e-07, "loss": 2.3422, "step": 281130 }, { "epoch": 0.98, "learning_rate": 9.725617943826144e-07, "loss": 2.2647, "step": 281140 }, { "epoch": 0.98, "learning_rate": 9.708179145289607e-07, "loss": 2.3572, "step": 281150 }, { "epoch": 0.98, "learning_rate": 9.690740346753072e-07, "loss": 2.3612, "step": 281160 }, { "epoch": 0.98, "learning_rate": 9.673301548216535e-07, "loss": 2.3459, "step": 281170 }, { "epoch": 0.98, "learning_rate": 9.65586274968e-07, "loss": 2.343, "step": 281180 }, { "epoch": 0.98, "learning_rate": 9.638423951143464e-07, "loss": 2.3679, "step": 281190 }, { "epoch": 0.98, "learning_rate": 9.620985152606927e-07, "loss": 2.3644, "step": 281200 }, { "epoch": 0.98, "learning_rate": 9.603546354070392e-07, "loss": 2.2363, "step": 281210 }, { "epoch": 0.98, "learning_rate": 9.586107555533854e-07, "loss": 2.3714, "step": 281220 }, { "epoch": 0.98, "learning_rate": 9.56866875699732e-07, "loss": 2.3376, "step": 281230 }, { "epoch": 0.98, "learning_rate": 9.551229958460784e-07, "loss": 2.3771, "step": 281240 }, { "epoch": 0.98, "learning_rate": 9.533791159924246e-07, "loss": 2.3976, "step": 281250 }, { "epoch": 0.98, "learning_rate": 9.51635236138771e-07, "loss": 2.3164, "step": 281260 }, { "epoch": 0.98, "learning_rate": 9.498913562851173e-07, "loss": 2.3819, "step": 281270 }, { "epoch": 0.98, "learning_rate": 9.481474764314638e-07, "loss": 2.2821, "step": 281280 }, { "epoch": 0.98, "learning_rate": 9.464035965778103e-07, "loss": 2.3486, "step": 281290 }, { "epoch": 0.98, "learning_rate": 9.446597167241565e-07, "loss": 2.2531, "step": 281300 }, { "epoch": 0.98, "learning_rate": 9.42915836870503e-07, "loss": 2.3854, "step": 281310 }, { "epoch": 0.98, "learning_rate": 9.411719570168493e-07, "loss": 2.2448, "step": 281320 }, { "epoch": 0.98, "learning_rate": 9.394280771631958e-07, "loss": 2.3203, "step": 281330 }, { "epoch": 0.98, "learning_rate": 9.376841973095423e-07, "loss": 2.3181, "step": 281340 }, { "epoch": 0.98, "learning_rate": 9.359403174558885e-07, "loss": 2.3696, "step": 281350 }, { "epoch": 0.98, "learning_rate": 9.34196437602235e-07, "loss": 2.3394, "step": 281360 }, { "epoch": 0.98, "learning_rate": 9.324525577485813e-07, "loss": 2.3591, "step": 281370 }, { "epoch": 0.98, "learning_rate": 9.307086778949278e-07, "loss": 2.2944, "step": 281380 }, { "epoch": 0.98, "learning_rate": 9.289647980412742e-07, "loss": 2.4315, "step": 281390 }, { "epoch": 0.98, "learning_rate": 9.272209181876205e-07, "loss": 2.3634, "step": 281400 }, { "epoch": 0.98, "learning_rate": 9.25477038333967e-07, "loss": 2.3138, "step": 281410 }, { "epoch": 0.98, "learning_rate": 9.237331584803134e-07, "loss": 2.3839, "step": 281420 }, { "epoch": 0.98, "learning_rate": 9.219892786266597e-07, "loss": 2.3177, "step": 281430 }, { "epoch": 0.98, "learning_rate": 9.202453987730062e-07, "loss": 2.3894, "step": 281440 }, { "epoch": 0.98, "learning_rate": 9.185015189193525e-07, "loss": 2.2278, "step": 281450 }, { "epoch": 0.98, "learning_rate": 9.16757639065699e-07, "loss": 2.2884, "step": 281460 }, { "epoch": 0.98, "learning_rate": 9.150137592120453e-07, "loss": 2.3761, "step": 281470 }, { "epoch": 0.98, "learning_rate": 9.132698793583917e-07, "loss": 2.294, "step": 281480 }, { "epoch": 0.98, "learning_rate": 9.115259995047382e-07, "loss": 2.288, "step": 281490 }, { "epoch": 0.98, "learning_rate": 9.097821196510845e-07, "loss": 2.3138, "step": 281500 }, { "epoch": 0.98, "learning_rate": 9.08038239797431e-07, "loss": 2.3369, "step": 281510 }, { "epoch": 0.98, "learning_rate": 9.062943599437773e-07, "loss": 2.3283, "step": 281520 }, { "epoch": 0.98, "learning_rate": 9.045504800901237e-07, "loss": 2.3233, "step": 281530 }, { "epoch": 0.98, "learning_rate": 9.028066002364702e-07, "loss": 2.2671, "step": 281540 }, { "epoch": 0.98, "learning_rate": 9.010627203828166e-07, "loss": 2.3504, "step": 281550 }, { "epoch": 0.98, "learning_rate": 8.993188405291629e-07, "loss": 2.3056, "step": 281560 }, { "epoch": 0.98, "learning_rate": 8.975749606755093e-07, "loss": 2.4085, "step": 281570 }, { "epoch": 0.98, "learning_rate": 8.958310808218557e-07, "loss": 2.3825, "step": 281580 }, { "epoch": 0.98, "learning_rate": 8.940872009682022e-07, "loss": 2.3499, "step": 281590 }, { "epoch": 0.98, "learning_rate": 8.923433211145485e-07, "loss": 2.3309, "step": 281600 }, { "epoch": 0.98, "learning_rate": 8.905994412608949e-07, "loss": 2.2264, "step": 281610 }, { "epoch": 0.98, "learning_rate": 8.888555614072413e-07, "loss": 2.3761, "step": 281620 }, { "epoch": 0.98, "learning_rate": 8.871116815535878e-07, "loss": 2.335, "step": 281630 }, { "epoch": 0.98, "learning_rate": 8.853678016999341e-07, "loss": 2.3898, "step": 281640 }, { "epoch": 0.98, "learning_rate": 8.836239218462805e-07, "loss": 2.3194, "step": 281650 }, { "epoch": 0.98, "learning_rate": 8.818800419926269e-07, "loss": 2.3476, "step": 281660 }, { "epoch": 0.98, "learning_rate": 8.801361621389733e-07, "loss": 2.3572, "step": 281670 }, { "epoch": 0.98, "learning_rate": 8.783922822853198e-07, "loss": 2.3646, "step": 281680 }, { "epoch": 0.98, "learning_rate": 8.766484024316661e-07, "loss": 2.2714, "step": 281690 }, { "epoch": 0.98, "learning_rate": 8.749045225780125e-07, "loss": 2.3454, "step": 281700 }, { "epoch": 0.98, "learning_rate": 8.731606427243589e-07, "loss": 2.3261, "step": 281710 }, { "epoch": 0.98, "learning_rate": 8.714167628707053e-07, "loss": 2.3365, "step": 281720 }, { "epoch": 0.98, "learning_rate": 8.696728830170517e-07, "loss": 2.3636, "step": 281730 }, { "epoch": 0.98, "learning_rate": 8.679290031633981e-07, "loss": 2.373, "step": 281740 }, { "epoch": 0.98, "learning_rate": 8.661851233097445e-07, "loss": 2.3549, "step": 281750 }, { "epoch": 0.98, "learning_rate": 8.64441243456091e-07, "loss": 2.277, "step": 281760 }, { "epoch": 0.98, "learning_rate": 8.626973636024372e-07, "loss": 2.3167, "step": 281770 }, { "epoch": 0.98, "learning_rate": 8.609534837487837e-07, "loss": 2.2656, "step": 281780 }, { "epoch": 0.98, "learning_rate": 8.592096038951301e-07, "loss": 2.2952, "step": 281790 }, { "epoch": 0.98, "learning_rate": 8.574657240414765e-07, "loss": 2.2873, "step": 281800 }, { "epoch": 0.98, "learning_rate": 8.557218441878229e-07, "loss": 2.3304, "step": 281810 }, { "epoch": 0.98, "learning_rate": 8.539779643341692e-07, "loss": 2.3978, "step": 281820 }, { "epoch": 0.98, "learning_rate": 8.522340844805157e-07, "loss": 2.3379, "step": 281830 }, { "epoch": 0.98, "learning_rate": 8.504902046268621e-07, "loss": 2.2752, "step": 281840 }, { "epoch": 0.98, "learning_rate": 8.487463247732084e-07, "loss": 2.3552, "step": 281850 }, { "epoch": 0.98, "learning_rate": 8.470024449195549e-07, "loss": 2.287, "step": 281860 }, { "epoch": 0.98, "learning_rate": 8.452585650659012e-07, "loss": 2.282, "step": 281870 }, { "epoch": 0.98, "learning_rate": 8.435146852122477e-07, "loss": 2.3143, "step": 281880 }, { "epoch": 0.98, "learning_rate": 8.417708053585942e-07, "loss": 2.3158, "step": 281890 }, { "epoch": 0.98, "learning_rate": 8.400269255049404e-07, "loss": 2.2618, "step": 281900 }, { "epoch": 0.98, "learning_rate": 8.382830456512869e-07, "loss": 2.3409, "step": 281910 }, { "epoch": 0.98, "learning_rate": 8.365391657976332e-07, "loss": 2.3767, "step": 281920 }, { "epoch": 0.98, "learning_rate": 8.347952859439797e-07, "loss": 2.2711, "step": 281930 }, { "epoch": 0.98, "learning_rate": 8.330514060903261e-07, "loss": 2.3815, "step": 281940 }, { "epoch": 0.98, "learning_rate": 8.313075262366724e-07, "loss": 2.2724, "step": 281950 }, { "epoch": 0.98, "learning_rate": 8.295636463830189e-07, "loss": 2.3543, "step": 281960 }, { "epoch": 0.98, "learning_rate": 8.278197665293653e-07, "loss": 2.3453, "step": 281970 }, { "epoch": 0.98, "learning_rate": 8.260758866757116e-07, "loss": 2.3363, "step": 281980 }, { "epoch": 0.98, "learning_rate": 8.243320068220581e-07, "loss": 2.3354, "step": 281990 }, { "epoch": 0.98, "learning_rate": 8.225881269684044e-07, "loss": 2.3087, "step": 282000 }, { "epoch": 0.98, "learning_rate": 8.208442471147509e-07, "loss": 2.3674, "step": 282010 }, { "epoch": 0.98, "learning_rate": 8.191003672610974e-07, "loss": 2.344, "step": 282020 }, { "epoch": 0.98, "learning_rate": 8.173564874074436e-07, "loss": 2.3747, "step": 282030 }, { "epoch": 0.98, "learning_rate": 8.156126075537901e-07, "loss": 2.3266, "step": 282040 }, { "epoch": 0.98, "learning_rate": 8.138687277001364e-07, "loss": 2.3022, "step": 282050 }, { "epoch": 0.98, "learning_rate": 8.121248478464829e-07, "loss": 2.3633, "step": 282060 }, { "epoch": 0.98, "learning_rate": 8.103809679928293e-07, "loss": 2.2927, "step": 282070 }, { "epoch": 0.98, "learning_rate": 8.086370881391756e-07, "loss": 2.3445, "step": 282080 }, { "epoch": 0.98, "learning_rate": 8.068932082855221e-07, "loss": 2.2949, "step": 282090 }, { "epoch": 0.98, "learning_rate": 8.051493284318684e-07, "loss": 2.3551, "step": 282100 }, { "epoch": 0.98, "learning_rate": 8.034054485782148e-07, "loss": 2.3136, "step": 282110 }, { "epoch": 0.98, "learning_rate": 8.016615687245613e-07, "loss": 2.382, "step": 282120 }, { "epoch": 0.98, "learning_rate": 7.999176888709076e-07, "loss": 2.3544, "step": 282130 }, { "epoch": 0.98, "learning_rate": 7.981738090172541e-07, "loss": 2.3458, "step": 282140 }, { "epoch": 0.98, "learning_rate": 7.964299291636003e-07, "loss": 2.2563, "step": 282150 }, { "epoch": 0.98, "learning_rate": 7.946860493099468e-07, "loss": 2.3455, "step": 282160 }, { "epoch": 0.98, "learning_rate": 7.929421694562933e-07, "loss": 2.3211, "step": 282170 }, { "epoch": 0.98, "learning_rate": 7.911982896026396e-07, "loss": 2.3328, "step": 282180 }, { "epoch": 0.98, "learning_rate": 7.89454409748986e-07, "loss": 2.4276, "step": 282190 }, { "epoch": 0.98, "learning_rate": 7.877105298953323e-07, "loss": 2.3753, "step": 282200 }, { "epoch": 0.98, "learning_rate": 7.859666500416788e-07, "loss": 2.3778, "step": 282210 }, { "epoch": 0.98, "learning_rate": 7.842227701880253e-07, "loss": 2.2464, "step": 282220 }, { "epoch": 0.98, "learning_rate": 7.824788903343715e-07, "loss": 2.3475, "step": 282230 }, { "epoch": 0.98, "learning_rate": 7.807350104807179e-07, "loss": 2.2435, "step": 282240 }, { "epoch": 0.98, "learning_rate": 7.789911306270644e-07, "loss": 2.2741, "step": 282250 }, { "epoch": 0.98, "learning_rate": 7.772472507734108e-07, "loss": 2.3004, "step": 282260 }, { "epoch": 0.98, "learning_rate": 7.755033709197572e-07, "loss": 2.2979, "step": 282270 }, { "epoch": 0.98, "learning_rate": 7.737594910661035e-07, "loss": 2.2956, "step": 282280 }, { "epoch": 0.98, "learning_rate": 7.720156112124499e-07, "loss": 2.3233, "step": 282290 }, { "epoch": 0.98, "learning_rate": 7.702717313587964e-07, "loss": 2.2008, "step": 282300 }, { "epoch": 0.98, "learning_rate": 7.685278515051428e-07, "loss": 2.3525, "step": 282310 }, { "epoch": 0.98, "learning_rate": 7.667839716514891e-07, "loss": 2.235, "step": 282320 }, { "epoch": 0.98, "learning_rate": 7.650400917978355e-07, "loss": 2.3593, "step": 282330 }, { "epoch": 0.98, "learning_rate": 7.63296211944182e-07, "loss": 2.3963, "step": 282340 }, { "epoch": 0.98, "learning_rate": 7.615523320905284e-07, "loss": 2.3911, "step": 282350 }, { "epoch": 0.98, "learning_rate": 7.598084522368747e-07, "loss": 2.3703, "step": 282360 }, { "epoch": 0.98, "learning_rate": 7.580645723832211e-07, "loss": 2.3119, "step": 282370 }, { "epoch": 0.98, "learning_rate": 7.563206925295675e-07, "loss": 2.3903, "step": 282380 }, { "epoch": 0.98, "learning_rate": 7.54576812675914e-07, "loss": 2.3027, "step": 282390 }, { "epoch": 0.98, "learning_rate": 7.528329328222604e-07, "loss": 2.3275, "step": 282400 }, { "epoch": 0.98, "learning_rate": 7.510890529686067e-07, "loss": 2.3849, "step": 282410 }, { "epoch": 0.99, "learning_rate": 7.493451731149531e-07, "loss": 2.3039, "step": 282420 }, { "epoch": 0.99, "learning_rate": 7.476012932612995e-07, "loss": 2.377, "step": 282430 }, { "epoch": 0.99, "learning_rate": 7.45857413407646e-07, "loss": 2.2787, "step": 282440 }, { "epoch": 0.99, "learning_rate": 7.441135335539923e-07, "loss": 2.3314, "step": 282450 }, { "epoch": 0.99, "learning_rate": 7.423696537003387e-07, "loss": 2.2548, "step": 282460 }, { "epoch": 0.99, "learning_rate": 7.406257738466851e-07, "loss": 2.3269, "step": 282470 }, { "epoch": 0.99, "learning_rate": 7.388818939930315e-07, "loss": 2.3293, "step": 282480 }, { "epoch": 0.99, "learning_rate": 7.371380141393779e-07, "loss": 2.3191, "step": 282490 }, { "epoch": 0.99, "learning_rate": 7.353941342857243e-07, "loss": 2.228, "step": 282500 }, { "epoch": 0.99, "learning_rate": 7.336502544320707e-07, "loss": 2.4329, "step": 282510 }, { "epoch": 0.99, "learning_rate": 7.319063745784171e-07, "loss": 2.3127, "step": 282520 }, { "epoch": 0.99, "learning_rate": 7.301624947247634e-07, "loss": 2.3122, "step": 282530 }, { "epoch": 0.99, "learning_rate": 7.284186148711099e-07, "loss": 2.3745, "step": 282540 }, { "epoch": 0.99, "learning_rate": 7.266747350174563e-07, "loss": 2.3631, "step": 282550 }, { "epoch": 0.99, "learning_rate": 7.249308551638027e-07, "loss": 2.3507, "step": 282560 }, { "epoch": 0.99, "learning_rate": 7.23186975310149e-07, "loss": 2.41, "step": 282570 }, { "epoch": 0.99, "learning_rate": 7.214430954564954e-07, "loss": 2.2302, "step": 282580 }, { "epoch": 0.99, "learning_rate": 7.196992156028419e-07, "loss": 2.3326, "step": 282590 }, { "epoch": 0.99, "learning_rate": 7.179553357491883e-07, "loss": 2.3485, "step": 282600 }, { "epoch": 0.99, "learning_rate": 7.162114558955347e-07, "loss": 2.2698, "step": 282610 }, { "epoch": 0.99, "learning_rate": 7.14467576041881e-07, "loss": 2.3212, "step": 282620 }, { "epoch": 0.99, "learning_rate": 7.127236961882274e-07, "loss": 2.3231, "step": 282630 }, { "epoch": 0.99, "learning_rate": 7.109798163345739e-07, "loss": 2.3417, "step": 282640 }, { "epoch": 0.99, "learning_rate": 7.092359364809203e-07, "loss": 2.3404, "step": 282650 }, { "epoch": 0.99, "learning_rate": 7.074920566272666e-07, "loss": 2.2906, "step": 282660 }, { "epoch": 0.99, "learning_rate": 7.05748176773613e-07, "loss": 2.3511, "step": 282670 }, { "epoch": 0.99, "learning_rate": 7.040042969199594e-07, "loss": 2.2879, "step": 282680 }, { "epoch": 0.99, "learning_rate": 7.022604170663059e-07, "loss": 2.3241, "step": 282690 }, { "epoch": 0.99, "learning_rate": 7.005165372126522e-07, "loss": 2.2852, "step": 282700 }, { "epoch": 0.99, "learning_rate": 6.987726573589986e-07, "loss": 2.4131, "step": 282710 }, { "epoch": 0.99, "learning_rate": 6.97028777505345e-07, "loss": 2.3323, "step": 282720 }, { "epoch": 0.99, "learning_rate": 6.952848976516914e-07, "loss": 2.3137, "step": 282730 }, { "epoch": 0.99, "learning_rate": 6.935410177980378e-07, "loss": 2.249, "step": 282740 }, { "epoch": 0.99, "learning_rate": 6.917971379443842e-07, "loss": 2.2877, "step": 282750 }, { "epoch": 0.99, "learning_rate": 6.900532580907306e-07, "loss": 2.2895, "step": 282760 }, { "epoch": 0.99, "learning_rate": 6.88309378237077e-07, "loss": 2.3724, "step": 282770 }, { "epoch": 0.99, "learning_rate": 6.865654983834233e-07, "loss": 2.3992, "step": 282780 }, { "epoch": 0.99, "learning_rate": 6.848216185297698e-07, "loss": 2.2934, "step": 282790 }, { "epoch": 0.99, "learning_rate": 6.830777386761162e-07, "loss": 2.3613, "step": 282800 }, { "epoch": 0.99, "learning_rate": 6.813338588224626e-07, "loss": 2.3402, "step": 282810 }, { "epoch": 0.99, "learning_rate": 6.79589978968809e-07, "loss": 2.3588, "step": 282820 }, { "epoch": 0.99, "learning_rate": 6.778460991151553e-07, "loss": 2.319, "step": 282830 }, { "epoch": 0.99, "learning_rate": 6.761022192615018e-07, "loss": 2.3636, "step": 282840 }, { "epoch": 0.99, "learning_rate": 6.743583394078482e-07, "loss": 2.3509, "step": 282850 }, { "epoch": 0.99, "learning_rate": 6.726144595541946e-07, "loss": 2.3746, "step": 282860 }, { "epoch": 0.99, "learning_rate": 6.708705797005409e-07, "loss": 2.3772, "step": 282870 }, { "epoch": 0.99, "learning_rate": 6.691266998468873e-07, "loss": 2.3842, "step": 282880 }, { "epoch": 0.99, "learning_rate": 6.673828199932338e-07, "loss": 2.2784, "step": 282890 }, { "epoch": 0.99, "learning_rate": 6.656389401395802e-07, "loss": 2.3813, "step": 282900 }, { "epoch": 0.99, "learning_rate": 6.638950602859265e-07, "loss": 2.2373, "step": 282910 }, { "epoch": 0.99, "learning_rate": 6.621511804322729e-07, "loss": 2.3699, "step": 282920 }, { "epoch": 0.99, "learning_rate": 6.604073005786193e-07, "loss": 2.3536, "step": 282930 }, { "epoch": 0.99, "learning_rate": 6.586634207249658e-07, "loss": 2.2131, "step": 282940 }, { "epoch": 0.99, "learning_rate": 6.569195408713121e-07, "loss": 2.2766, "step": 282950 }, { "epoch": 0.99, "learning_rate": 6.551756610176585e-07, "loss": 2.4027, "step": 282960 }, { "epoch": 0.99, "learning_rate": 6.534317811640049e-07, "loss": 2.343, "step": 282970 }, { "epoch": 0.99, "learning_rate": 6.516879013103513e-07, "loss": 2.3381, "step": 282980 }, { "epoch": 0.99, "learning_rate": 6.499440214566978e-07, "loss": 2.3429, "step": 282990 }, { "epoch": 0.99, "learning_rate": 6.482001416030441e-07, "loss": 2.3695, "step": 283000 }, { "epoch": 0.99, "learning_rate": 6.464562617493905e-07, "loss": 2.3262, "step": 283010 }, { "epoch": 0.99, "learning_rate": 6.447123818957369e-07, "loss": 2.3401, "step": 283020 }, { "epoch": 0.99, "learning_rate": 6.429685020420834e-07, "loss": 2.3313, "step": 283030 }, { "epoch": 0.99, "learning_rate": 6.412246221884297e-07, "loss": 2.2955, "step": 283040 }, { "epoch": 0.99, "learning_rate": 6.394807423347761e-07, "loss": 2.2764, "step": 283050 }, { "epoch": 0.99, "learning_rate": 6.377368624811225e-07, "loss": 2.2873, "step": 283060 }, { "epoch": 0.99, "learning_rate": 6.359929826274689e-07, "loss": 2.3367, "step": 283070 }, { "epoch": 0.99, "learning_rate": 6.342491027738153e-07, "loss": 2.417, "step": 283080 }, { "epoch": 0.99, "learning_rate": 6.325052229201617e-07, "loss": 2.3281, "step": 283090 }, { "epoch": 0.99, "learning_rate": 6.307613430665081e-07, "loss": 2.2836, "step": 283100 }, { "epoch": 0.99, "learning_rate": 6.290174632128545e-07, "loss": 2.2985, "step": 283110 }, { "epoch": 0.99, "learning_rate": 6.272735833592008e-07, "loss": 2.3593, "step": 283120 }, { "epoch": 0.99, "learning_rate": 6.255297035055473e-07, "loss": 2.3097, "step": 283130 }, { "epoch": 0.99, "learning_rate": 6.237858236518937e-07, "loss": 2.3018, "step": 283140 }, { "epoch": 0.99, "learning_rate": 6.220419437982401e-07, "loss": 2.3755, "step": 283150 }, { "epoch": 0.99, "learning_rate": 6.202980639445865e-07, "loss": 2.3526, "step": 283160 }, { "epoch": 0.99, "learning_rate": 6.185541840909328e-07, "loss": 2.3508, "step": 283170 }, { "epoch": 0.99, "learning_rate": 6.168103042372793e-07, "loss": 2.338, "step": 283180 }, { "epoch": 0.99, "learning_rate": 6.150664243836257e-07, "loss": 2.1332, "step": 283190 }, { "epoch": 0.99, "learning_rate": 6.133225445299721e-07, "loss": 2.3001, "step": 283200 }, { "epoch": 0.99, "learning_rate": 6.115786646763184e-07, "loss": 2.3204, "step": 283210 }, { "epoch": 0.99, "learning_rate": 6.098347848226648e-07, "loss": 2.2727, "step": 283220 }, { "epoch": 0.99, "learning_rate": 6.080909049690113e-07, "loss": 2.3279, "step": 283230 }, { "epoch": 0.99, "learning_rate": 6.063470251153577e-07, "loss": 2.3629, "step": 283240 }, { "epoch": 0.99, "learning_rate": 6.04603145261704e-07, "loss": 2.3158, "step": 283250 }, { "epoch": 0.99, "learning_rate": 6.028592654080504e-07, "loss": 2.3372, "step": 283260 }, { "epoch": 0.99, "learning_rate": 6.011153855543968e-07, "loss": 2.2748, "step": 283270 }, { "epoch": 0.99, "learning_rate": 5.993715057007433e-07, "loss": 2.31, "step": 283280 }, { "epoch": 0.99, "learning_rate": 5.976276258470896e-07, "loss": 2.3231, "step": 283290 }, { "epoch": 0.99, "learning_rate": 5.95883745993436e-07, "loss": 2.286, "step": 283300 }, { "epoch": 0.99, "learning_rate": 5.941398661397824e-07, "loss": 2.3155, "step": 283310 }, { "epoch": 0.99, "learning_rate": 5.923959862861289e-07, "loss": 2.3249, "step": 283320 }, { "epoch": 0.99, "learning_rate": 5.906521064324753e-07, "loss": 2.3789, "step": 283330 }, { "epoch": 0.99, "learning_rate": 5.889082265788216e-07, "loss": 2.3361, "step": 283340 }, { "epoch": 0.99, "learning_rate": 5.87164346725168e-07, "loss": 2.3074, "step": 283350 }, { "epoch": 0.99, "learning_rate": 5.854204668715145e-07, "loss": 2.3405, "step": 283360 }, { "epoch": 0.99, "learning_rate": 5.836765870178609e-07, "loss": 2.3741, "step": 283370 }, { "epoch": 0.99, "learning_rate": 5.819327071642072e-07, "loss": 2.3988, "step": 283380 }, { "epoch": 0.99, "learning_rate": 5.801888273105536e-07, "loss": 2.3032, "step": 283390 }, { "epoch": 0.99, "learning_rate": 5.784449474569001e-07, "loss": 2.3074, "step": 283400 }, { "epoch": 0.99, "learning_rate": 5.767010676032465e-07, "loss": 2.4214, "step": 283410 }, { "epoch": 0.99, "learning_rate": 5.749571877495928e-07, "loss": 2.3618, "step": 283420 }, { "epoch": 0.99, "learning_rate": 5.732133078959392e-07, "loss": 2.2689, "step": 283430 }, { "epoch": 0.99, "learning_rate": 5.714694280422856e-07, "loss": 2.3147, "step": 283440 }, { "epoch": 0.99, "learning_rate": 5.697255481886321e-07, "loss": 2.3397, "step": 283450 }, { "epoch": 0.99, "learning_rate": 5.679816683349784e-07, "loss": 2.3017, "step": 283460 }, { "epoch": 0.99, "learning_rate": 5.662377884813248e-07, "loss": 2.3301, "step": 283470 }, { "epoch": 0.99, "learning_rate": 5.644939086276712e-07, "loss": 2.3528, "step": 283480 }, { "epoch": 0.99, "learning_rate": 5.627500287740177e-07, "loss": 2.2974, "step": 283490 }, { "epoch": 0.99, "learning_rate": 5.61006148920364e-07, "loss": 2.325, "step": 283500 }, { "epoch": 0.99, "learning_rate": 5.592622690667104e-07, "loss": 2.2558, "step": 283510 }, { "epoch": 0.99, "learning_rate": 5.575183892130568e-07, "loss": 2.328, "step": 283520 }, { "epoch": 0.99, "learning_rate": 5.557745093594033e-07, "loss": 2.2929, "step": 283530 }, { "epoch": 0.99, "learning_rate": 5.540306295057497e-07, "loss": 2.3235, "step": 283540 }, { "epoch": 0.99, "learning_rate": 5.52286749652096e-07, "loss": 2.3238, "step": 283550 }, { "epoch": 0.99, "learning_rate": 5.505428697984424e-07, "loss": 2.3884, "step": 283560 }, { "epoch": 0.99, "learning_rate": 5.487989899447888e-07, "loss": 2.3215, "step": 283570 }, { "epoch": 0.99, "learning_rate": 5.470551100911353e-07, "loss": 2.2962, "step": 283580 }, { "epoch": 0.99, "learning_rate": 5.453112302374816e-07, "loss": 2.3559, "step": 283590 }, { "epoch": 0.99, "learning_rate": 5.43567350383828e-07, "loss": 2.4084, "step": 283600 }, { "epoch": 0.99, "learning_rate": 5.418234705301744e-07, "loss": 2.3084, "step": 283610 }, { "epoch": 0.99, "learning_rate": 5.400795906765208e-07, "loss": 2.3351, "step": 283620 }, { "epoch": 0.99, "learning_rate": 5.383357108228672e-07, "loss": 2.2856, "step": 283630 }, { "epoch": 0.99, "learning_rate": 5.365918309692136e-07, "loss": 2.289, "step": 283640 }, { "epoch": 0.99, "learning_rate": 5.3484795111556e-07, "loss": 2.2906, "step": 283650 }, { "epoch": 0.99, "learning_rate": 5.331040712619064e-07, "loss": 2.3654, "step": 283660 }, { "epoch": 0.99, "learning_rate": 5.313601914082527e-07, "loss": 2.3686, "step": 283670 }, { "epoch": 0.99, "learning_rate": 5.296163115545992e-07, "loss": 2.2228, "step": 283680 }, { "epoch": 0.99, "learning_rate": 5.278724317009456e-07, "loss": 2.3487, "step": 283690 }, { "epoch": 0.99, "learning_rate": 5.26128551847292e-07, "loss": 2.3708, "step": 283700 }, { "epoch": 0.99, "learning_rate": 5.243846719936384e-07, "loss": 2.337, "step": 283710 }, { "epoch": 0.99, "learning_rate": 5.226407921399848e-07, "loss": 2.3726, "step": 283720 }, { "epoch": 0.99, "learning_rate": 5.208969122863312e-07, "loss": 2.3544, "step": 283730 }, { "epoch": 0.99, "learning_rate": 5.191530324326776e-07, "loss": 2.3003, "step": 283740 }, { "epoch": 0.99, "learning_rate": 5.17409152579024e-07, "loss": 2.3209, "step": 283750 }, { "epoch": 0.99, "learning_rate": 5.156652727253703e-07, "loss": 2.3011, "step": 283760 }, { "epoch": 0.99, "learning_rate": 5.139213928717168e-07, "loss": 2.3031, "step": 283770 }, { "epoch": 0.99, "learning_rate": 5.121775130180632e-07, "loss": 2.3173, "step": 283780 }, { "epoch": 0.99, "learning_rate": 5.104336331644096e-07, "loss": 2.3157, "step": 283790 }, { "epoch": 0.99, "learning_rate": 5.086897533107559e-07, "loss": 2.3441, "step": 283800 }, { "epoch": 0.99, "learning_rate": 5.069458734571023e-07, "loss": 2.307, "step": 283810 }, { "epoch": 0.99, "learning_rate": 5.052019936034488e-07, "loss": 2.3253, "step": 283820 }, { "epoch": 0.99, "learning_rate": 5.034581137497952e-07, "loss": 2.3387, "step": 283830 }, { "epoch": 0.99, "learning_rate": 5.017142338961415e-07, "loss": 2.3904, "step": 283840 }, { "epoch": 0.99, "learning_rate": 4.999703540424879e-07, "loss": 2.3929, "step": 283850 }, { "epoch": 0.99, "learning_rate": 4.982264741888343e-07, "loss": 2.2951, "step": 283860 }, { "epoch": 0.99, "learning_rate": 4.964825943351808e-07, "loss": 2.3627, "step": 283870 }, { "epoch": 0.99, "learning_rate": 4.947387144815272e-07, "loss": 2.253, "step": 283880 }, { "epoch": 0.99, "learning_rate": 4.929948346278735e-07, "loss": 2.2877, "step": 283890 }, { "epoch": 0.99, "learning_rate": 4.912509547742199e-07, "loss": 2.2268, "step": 283900 }, { "epoch": 0.99, "learning_rate": 4.895070749205663e-07, "loss": 2.4325, "step": 283910 }, { "epoch": 0.99, "learning_rate": 4.877631950669128e-07, "loss": 2.422, "step": 283920 }, { "epoch": 0.99, "learning_rate": 4.860193152132591e-07, "loss": 2.349, "step": 283930 }, { "epoch": 0.99, "learning_rate": 4.842754353596055e-07, "loss": 2.2907, "step": 283940 }, { "epoch": 0.99, "learning_rate": 4.825315555059519e-07, "loss": 2.3822, "step": 283950 }, { "epoch": 0.99, "learning_rate": 4.807876756522983e-07, "loss": 2.2989, "step": 283960 }, { "epoch": 0.99, "learning_rate": 4.790437957986447e-07, "loss": 2.3539, "step": 283970 }, { "epoch": 0.99, "learning_rate": 4.772999159449911e-07, "loss": 2.2657, "step": 283980 }, { "epoch": 0.99, "learning_rate": 4.755560360913375e-07, "loss": 2.2122, "step": 283990 }, { "epoch": 0.99, "learning_rate": 4.7381215623768387e-07, "loss": 2.3463, "step": 284000 }, { "epoch": 0.99, "learning_rate": 4.7206827638403024e-07, "loss": 2.2298, "step": 284010 }, { "epoch": 0.99, "learning_rate": 4.703243965303767e-07, "loss": 2.3329, "step": 284020 }, { "epoch": 0.99, "learning_rate": 4.685805166767231e-07, "loss": 2.3806, "step": 284030 }, { "epoch": 0.99, "learning_rate": 4.668366368230695e-07, "loss": 2.3717, "step": 284040 }, { "epoch": 0.99, "learning_rate": 4.6509275696941585e-07, "loss": 2.2847, "step": 284050 }, { "epoch": 0.99, "learning_rate": 4.633488771157622e-07, "loss": 2.3827, "step": 284060 }, { "epoch": 0.99, "learning_rate": 4.616049972621087e-07, "loss": 2.268, "step": 284070 }, { "epoch": 0.99, "learning_rate": 4.598611174084551e-07, "loss": 2.2801, "step": 284080 }, { "epoch": 0.99, "learning_rate": 4.5811723755480146e-07, "loss": 2.3017, "step": 284090 }, { "epoch": 0.99, "learning_rate": 4.5637335770114783e-07, "loss": 2.3361, "step": 284100 }, { "epoch": 0.99, "learning_rate": 4.546294778474942e-07, "loss": 2.2968, "step": 284110 }, { "epoch": 0.99, "learning_rate": 4.528855979938407e-07, "loss": 2.3798, "step": 284120 }, { "epoch": 0.99, "learning_rate": 4.5114171814018706e-07, "loss": 2.348, "step": 284130 }, { "epoch": 0.99, "learning_rate": 4.4939783828653344e-07, "loss": 2.3687, "step": 284140 }, { "epoch": 0.99, "learning_rate": 4.476539584328798e-07, "loss": 2.2605, "step": 284150 }, { "epoch": 0.99, "learning_rate": 4.459100785792262e-07, "loss": 2.4119, "step": 284160 }, { "epoch": 0.99, "learning_rate": 4.4416619872557267e-07, "loss": 2.3176, "step": 284170 }, { "epoch": 0.99, "learning_rate": 4.4242231887191904e-07, "loss": 2.3288, "step": 284180 }, { "epoch": 0.99, "learning_rate": 4.406784390182654e-07, "loss": 2.348, "step": 284190 }, { "epoch": 0.99, "learning_rate": 4.389345591646118e-07, "loss": 2.4315, "step": 284200 }, { "epoch": 0.99, "learning_rate": 4.3719067931095817e-07, "loss": 2.34, "step": 284210 }, { "epoch": 0.99, "learning_rate": 4.3544679945730465e-07, "loss": 2.3445, "step": 284220 }, { "epoch": 0.99, "learning_rate": 4.33702919603651e-07, "loss": 2.3191, "step": 284230 }, { "epoch": 0.99, "learning_rate": 4.319590397499974e-07, "loss": 2.3146, "step": 284240 }, { "epoch": 0.99, "learning_rate": 4.302151598963438e-07, "loss": 2.3148, "step": 284250 }, { "epoch": 0.99, "learning_rate": 4.2847128004269015e-07, "loss": 2.348, "step": 284260 }, { "epoch": 0.99, "learning_rate": 4.2672740018903663e-07, "loss": 2.3119, "step": 284270 }, { "epoch": 0.99, "learning_rate": 4.24983520335383e-07, "loss": 2.2827, "step": 284280 }, { "epoch": 0.99, "learning_rate": 4.232396404817294e-07, "loss": 2.3554, "step": 284290 }, { "epoch": 0.99, "learning_rate": 4.2149576062807576e-07, "loss": 2.3585, "step": 284300 }, { "epoch": 0.99, "learning_rate": 4.1975188077442213e-07, "loss": 2.3217, "step": 284310 }, { "epoch": 0.99, "learning_rate": 4.180080009207686e-07, "loss": 2.3185, "step": 284320 }, { "epoch": 0.99, "learning_rate": 4.16264121067115e-07, "loss": 2.3849, "step": 284330 }, { "epoch": 0.99, "learning_rate": 4.1452024121346136e-07, "loss": 2.3052, "step": 284340 }, { "epoch": 0.99, "learning_rate": 4.1277636135980774e-07, "loss": 2.3906, "step": 284350 }, { "epoch": 0.99, "learning_rate": 4.110324815061541e-07, "loss": 2.3171, "step": 284360 }, { "epoch": 0.99, "learning_rate": 4.092886016525006e-07, "loss": 2.3196, "step": 284370 }, { "epoch": 0.99, "learning_rate": 4.0754472179884697e-07, "loss": 2.3699, "step": 284380 }, { "epoch": 0.99, "learning_rate": 4.0580084194519335e-07, "loss": 2.2105, "step": 284390 }, { "epoch": 0.99, "learning_rate": 4.040569620915397e-07, "loss": 2.2939, "step": 284400 }, { "epoch": 0.99, "learning_rate": 4.023130822378862e-07, "loss": 2.3235, "step": 284410 }, { "epoch": 0.99, "learning_rate": 4.005692023842326e-07, "loss": 2.3059, "step": 284420 }, { "epoch": 0.99, "learning_rate": 3.9882532253057895e-07, "loss": 2.3178, "step": 284430 }, { "epoch": 0.99, "learning_rate": 3.9708144267692533e-07, "loss": 2.3611, "step": 284440 }, { "epoch": 0.99, "learning_rate": 3.953375628232717e-07, "loss": 2.3311, "step": 284450 }, { "epoch": 0.99, "learning_rate": 3.935936829696182e-07, "loss": 2.3098, "step": 284460 }, { "epoch": 0.99, "learning_rate": 3.9184980311596456e-07, "loss": 2.3504, "step": 284470 }, { "epoch": 0.99, "learning_rate": 3.9010592326231093e-07, "loss": 2.2991, "step": 284480 }, { "epoch": 0.99, "learning_rate": 3.883620434086573e-07, "loss": 2.2902, "step": 284490 }, { "epoch": 0.99, "learning_rate": 3.8661816355500374e-07, "loss": 2.3861, "step": 284500 }, { "epoch": 0.99, "learning_rate": 3.848742837013501e-07, "loss": 2.2868, "step": 284510 }, { "epoch": 0.99, "learning_rate": 3.831304038476965e-07, "loss": 2.2547, "step": 284520 }, { "epoch": 0.99, "learning_rate": 3.813865239940429e-07, "loss": 2.3238, "step": 284530 }, { "epoch": 0.99, "learning_rate": 3.796426441403893e-07, "loss": 2.3756, "step": 284540 }, { "epoch": 0.99, "learning_rate": 3.778987642867357e-07, "loss": 2.2762, "step": 284550 }, { "epoch": 0.99, "learning_rate": 3.761548844330821e-07, "loss": 2.3283, "step": 284560 }, { "epoch": 0.99, "learning_rate": 3.7441100457942847e-07, "loss": 2.2955, "step": 284570 }, { "epoch": 0.99, "learning_rate": 3.726671247257749e-07, "loss": 2.331, "step": 284580 }, { "epoch": 0.99, "learning_rate": 3.7092324487212127e-07, "loss": 2.3289, "step": 284590 }, { "epoch": 0.99, "learning_rate": 3.691793650184677e-07, "loss": 2.3808, "step": 284600 }, { "epoch": 0.99, "learning_rate": 3.674354851648141e-07, "loss": 2.3555, "step": 284610 }, { "epoch": 0.99, "learning_rate": 3.656916053111605e-07, "loss": 2.2899, "step": 284620 }, { "epoch": 0.99, "learning_rate": 3.639477254575069e-07, "loss": 2.3274, "step": 284630 }, { "epoch": 0.99, "learning_rate": 3.6220384560385325e-07, "loss": 2.434, "step": 284640 }, { "epoch": 0.99, "learning_rate": 3.604599657501997e-07, "loss": 2.3477, "step": 284650 }, { "epoch": 0.99, "learning_rate": 3.5871608589654606e-07, "loss": 2.4153, "step": 284660 }, { "epoch": 0.99, "learning_rate": 3.569722060428925e-07, "loss": 2.3372, "step": 284670 }, { "epoch": 0.99, "learning_rate": 3.5522832618923886e-07, "loss": 2.3241, "step": 284680 }, { "epoch": 0.99, "learning_rate": 3.534844463355853e-07, "loss": 2.406, "step": 284690 }, { "epoch": 0.99, "learning_rate": 3.5174056648193166e-07, "loss": 2.3453, "step": 284700 }, { "epoch": 0.99, "learning_rate": 3.499966866282781e-07, "loss": 2.3601, "step": 284710 }, { "epoch": 0.99, "learning_rate": 3.4825280677462447e-07, "loss": 2.3208, "step": 284720 }, { "epoch": 0.99, "learning_rate": 3.465089269209709e-07, "loss": 2.2582, "step": 284730 }, { "epoch": 0.99, "learning_rate": 3.4476504706731727e-07, "loss": 2.3784, "step": 284740 }, { "epoch": 0.99, "learning_rate": 3.430211672136637e-07, "loss": 2.2838, "step": 284750 }, { "epoch": 0.99, "learning_rate": 3.412772873600101e-07, "loss": 2.3326, "step": 284760 }, { "epoch": 0.99, "learning_rate": 3.3953340750635645e-07, "loss": 2.2974, "step": 284770 }, { "epoch": 0.99, "learning_rate": 3.377895276527029e-07, "loss": 2.3348, "step": 284780 }, { "epoch": 0.99, "learning_rate": 3.3604564779904925e-07, "loss": 2.3463, "step": 284790 }, { "epoch": 0.99, "learning_rate": 3.343017679453957e-07, "loss": 2.4124, "step": 284800 }, { "epoch": 0.99, "learning_rate": 3.3255788809174206e-07, "loss": 2.403, "step": 284810 }, { "epoch": 0.99, "learning_rate": 3.308140082380885e-07, "loss": 2.4159, "step": 284820 }, { "epoch": 0.99, "learning_rate": 3.2907012838443486e-07, "loss": 2.3469, "step": 284830 }, { "epoch": 0.99, "learning_rate": 3.2732624853078123e-07, "loss": 2.284, "step": 284840 }, { "epoch": 0.99, "learning_rate": 3.2558236867712766e-07, "loss": 2.3186, "step": 284850 }, { "epoch": 0.99, "learning_rate": 3.2383848882347404e-07, "loss": 2.291, "step": 284860 }, { "epoch": 0.99, "learning_rate": 3.2209460896982047e-07, "loss": 2.3699, "step": 284870 }, { "epoch": 0.99, "learning_rate": 3.2035072911616684e-07, "loss": 2.3248, "step": 284880 }, { "epoch": 0.99, "learning_rate": 3.186068492625132e-07, "loss": 2.2956, "step": 284890 }, { "epoch": 0.99, "learning_rate": 3.1686296940885964e-07, "loss": 2.3296, "step": 284900 }, { "epoch": 0.99, "learning_rate": 3.15119089555206e-07, "loss": 2.3574, "step": 284910 }, { "epoch": 0.99, "learning_rate": 3.1337520970155245e-07, "loss": 2.3039, "step": 284920 }, { "epoch": 0.99, "learning_rate": 3.116313298478988e-07, "loss": 2.2836, "step": 284930 }, { "epoch": 0.99, "learning_rate": 3.0988744999424525e-07, "loss": 2.3209, "step": 284940 }, { "epoch": 0.99, "learning_rate": 3.081435701405916e-07, "loss": 2.3656, "step": 284950 }, { "epoch": 0.99, "learning_rate": 3.06399690286938e-07, "loss": 2.2877, "step": 284960 }, { "epoch": 0.99, "learning_rate": 3.0465581043328443e-07, "loss": 2.2892, "step": 284970 }, { "epoch": 0.99, "learning_rate": 3.029119305796308e-07, "loss": 2.3652, "step": 284980 }, { "epoch": 0.99, "learning_rate": 3.0116805072597723e-07, "loss": 2.3241, "step": 284990 }, { "epoch": 0.99, "learning_rate": 2.994241708723236e-07, "loss": 2.4672, "step": 285000 }, { "epoch": 0.99, "learning_rate": 2.9768029101867e-07, "loss": 2.3113, "step": 285010 }, { "epoch": 0.99, "learning_rate": 2.959364111650164e-07, "loss": 2.3279, "step": 285020 }, { "epoch": 0.99, "learning_rate": 2.941925313113628e-07, "loss": 2.3552, "step": 285030 }, { "epoch": 0.99, "learning_rate": 2.924486514577092e-07, "loss": 2.3431, "step": 285040 }, { "epoch": 0.99, "learning_rate": 2.907047716040556e-07, "loss": 2.3441, "step": 285050 }, { "epoch": 0.99, "learning_rate": 2.8896089175040196e-07, "loss": 2.2145, "step": 285060 }, { "epoch": 0.99, "learning_rate": 2.872170118967484e-07, "loss": 2.2873, "step": 285070 }, { "epoch": 0.99, "learning_rate": 2.8547313204309477e-07, "loss": 2.3932, "step": 285080 }, { "epoch": 0.99, "learning_rate": 2.837292521894412e-07, "loss": 2.3567, "step": 285090 }, { "epoch": 0.99, "learning_rate": 2.8198537233578757e-07, "loss": 2.3222, "step": 285100 }, { "epoch": 0.99, "learning_rate": 2.8024149248213395e-07, "loss": 2.3442, "step": 285110 }, { "epoch": 0.99, "learning_rate": 2.7849761262848037e-07, "loss": 2.264, "step": 285120 }, { "epoch": 0.99, "learning_rate": 2.7675373277482675e-07, "loss": 2.3257, "step": 285130 }, { "epoch": 0.99, "learning_rate": 2.750098529211732e-07, "loss": 2.329, "step": 285140 }, { "epoch": 0.99, "learning_rate": 2.7326597306751955e-07, "loss": 2.2825, "step": 285150 }, { "epoch": 0.99, "learning_rate": 2.7152209321386593e-07, "loss": 2.2741, "step": 285160 }, { "epoch": 0.99, "learning_rate": 2.6977821336021236e-07, "loss": 2.254, "step": 285170 }, { "epoch": 0.99, "learning_rate": 2.6803433350655873e-07, "loss": 2.3768, "step": 285180 }, { "epoch": 0.99, "learning_rate": 2.6629045365290516e-07, "loss": 2.3363, "step": 285190 }, { "epoch": 0.99, "learning_rate": 2.6454657379925153e-07, "loss": 2.2796, "step": 285200 }, { "epoch": 0.99, "learning_rate": 2.628026939455979e-07, "loss": 2.3927, "step": 285210 }, { "epoch": 0.99, "learning_rate": 2.6105881409194434e-07, "loss": 2.3441, "step": 285220 }, { "epoch": 0.99, "learning_rate": 2.593149342382907e-07, "loss": 2.3625, "step": 285230 }, { "epoch": 0.99, "learning_rate": 2.5757105438463714e-07, "loss": 2.305, "step": 285240 }, { "epoch": 0.99, "learning_rate": 2.558271745309835e-07, "loss": 2.3121, "step": 285250 }, { "epoch": 0.99, "learning_rate": 2.540832946773299e-07, "loss": 2.4078, "step": 285260 }, { "epoch": 0.99, "learning_rate": 2.523394148236763e-07, "loss": 2.2495, "step": 285270 }, { "epoch": 0.99, "learning_rate": 2.505955349700227e-07, "loss": 2.3396, "step": 285280 }, { "epoch": 1.0, "learning_rate": 2.488516551163691e-07, "loss": 2.3427, "step": 285290 }, { "epoch": 1.0, "learning_rate": 2.471077752627155e-07, "loss": 2.3511, "step": 285300 }, { "epoch": 1.0, "learning_rate": 2.453638954090619e-07, "loss": 2.3952, "step": 285310 }, { "epoch": 1.0, "learning_rate": 2.436200155554083e-07, "loss": 2.2959, "step": 285320 }, { "epoch": 1.0, "learning_rate": 2.418761357017547e-07, "loss": 2.4302, "step": 285330 }, { "epoch": 1.0, "learning_rate": 2.401322558481011e-07, "loss": 2.3446, "step": 285340 }, { "epoch": 1.0, "learning_rate": 2.383883759944475e-07, "loss": 2.3643, "step": 285350 }, { "epoch": 1.0, "learning_rate": 2.366444961407939e-07, "loss": 2.3104, "step": 285360 }, { "epoch": 1.0, "learning_rate": 2.3490061628714028e-07, "loss": 2.3135, "step": 285370 }, { "epoch": 1.0, "learning_rate": 2.3315673643348668e-07, "loss": 2.2758, "step": 285380 }, { "epoch": 1.0, "learning_rate": 2.3141285657983308e-07, "loss": 2.2784, "step": 285390 }, { "epoch": 1.0, "learning_rate": 2.2966897672617949e-07, "loss": 2.2062, "step": 285400 }, { "epoch": 1.0, "learning_rate": 2.279250968725259e-07, "loss": 2.3775, "step": 285410 }, { "epoch": 1.0, "learning_rate": 2.261812170188723e-07, "loss": 2.3219, "step": 285420 }, { "epoch": 1.0, "learning_rate": 2.2443733716521866e-07, "loss": 2.3049, "step": 285430 }, { "epoch": 1.0, "learning_rate": 2.226934573115651e-07, "loss": 2.325, "step": 285440 }, { "epoch": 1.0, "learning_rate": 2.2094957745791147e-07, "loss": 2.3975, "step": 285450 }, { "epoch": 1.0, "learning_rate": 2.192056976042579e-07, "loss": 2.3468, "step": 285460 }, { "epoch": 1.0, "learning_rate": 2.1746181775060427e-07, "loss": 2.3437, "step": 285470 }, { "epoch": 1.0, "learning_rate": 2.1571793789695065e-07, "loss": 2.3263, "step": 285480 }, { "epoch": 1.0, "learning_rate": 2.1397405804329707e-07, "loss": 2.3357, "step": 285490 }, { "epoch": 1.0, "learning_rate": 2.1223017818964345e-07, "loss": 2.2768, "step": 285500 }, { "epoch": 1.0, "learning_rate": 2.1048629833598988e-07, "loss": 2.356, "step": 285510 }, { "epoch": 1.0, "learning_rate": 2.0874241848233625e-07, "loss": 2.337, "step": 285520 }, { "epoch": 1.0, "learning_rate": 2.0699853862868263e-07, "loss": 2.4426, "step": 285530 }, { "epoch": 1.0, "learning_rate": 2.0525465877502906e-07, "loss": 2.3389, "step": 285540 }, { "epoch": 1.0, "learning_rate": 2.0351077892137543e-07, "loss": 2.3869, "step": 285550 }, { "epoch": 1.0, "learning_rate": 2.0176689906772186e-07, "loss": 2.3117, "step": 285560 }, { "epoch": 1.0, "learning_rate": 2.0002301921406823e-07, "loss": 2.2979, "step": 285570 }, { "epoch": 1.0, "learning_rate": 1.982791393604146e-07, "loss": 2.4086, "step": 285580 }, { "epoch": 1.0, "learning_rate": 1.9653525950676104e-07, "loss": 2.3774, "step": 285590 }, { "epoch": 1.0, "learning_rate": 1.9479137965310744e-07, "loss": 2.3697, "step": 285600 }, { "epoch": 1.0, "learning_rate": 1.9304749979945381e-07, "loss": 2.3417, "step": 285610 }, { "epoch": 1.0, "learning_rate": 1.9130361994580022e-07, "loss": 2.301, "step": 285620 }, { "epoch": 1.0, "learning_rate": 1.8955974009214662e-07, "loss": 2.3374, "step": 285630 }, { "epoch": 1.0, "learning_rate": 1.8781586023849302e-07, "loss": 2.229, "step": 285640 }, { "epoch": 1.0, "learning_rate": 1.8607198038483942e-07, "loss": 2.3062, "step": 285650 }, { "epoch": 1.0, "learning_rate": 1.843281005311858e-07, "loss": 2.2968, "step": 285660 }, { "epoch": 1.0, "learning_rate": 1.825842206775322e-07, "loss": 2.3885, "step": 285670 }, { "epoch": 1.0, "learning_rate": 1.808403408238786e-07, "loss": 2.3288, "step": 285680 }, { "epoch": 1.0, "learning_rate": 1.79096460970225e-07, "loss": 2.2978, "step": 285690 }, { "epoch": 1.0, "learning_rate": 1.773525811165714e-07, "loss": 2.3072, "step": 285700 }, { "epoch": 1.0, "learning_rate": 1.7560870126291778e-07, "loss": 2.3291, "step": 285710 }, { "epoch": 1.0, "learning_rate": 1.7386482140926418e-07, "loss": 2.3093, "step": 285720 }, { "epoch": 1.0, "learning_rate": 1.7212094155561058e-07, "loss": 2.2569, "step": 285730 }, { "epoch": 1.0, "learning_rate": 1.7037706170195698e-07, "loss": 2.3185, "step": 285740 }, { "epoch": 1.0, "learning_rate": 1.6863318184830338e-07, "loss": 2.3159, "step": 285750 }, { "epoch": 1.0, "learning_rate": 1.6688930199464979e-07, "loss": 2.3438, "step": 285760 }, { "epoch": 1.0, "learning_rate": 1.6514542214099616e-07, "loss": 2.3355, "step": 285770 }, { "epoch": 1.0, "learning_rate": 1.6340154228734256e-07, "loss": 2.3262, "step": 285780 }, { "epoch": 1.0, "learning_rate": 1.6165766243368896e-07, "loss": 2.35, "step": 285790 }, { "epoch": 1.0, "learning_rate": 1.5991378258003537e-07, "loss": 2.2904, "step": 285800 }, { "epoch": 1.0, "learning_rate": 1.5816990272638177e-07, "loss": 2.2915, "step": 285810 }, { "epoch": 1.0, "learning_rate": 1.5642602287272817e-07, "loss": 2.2974, "step": 285820 }, { "epoch": 1.0, "learning_rate": 1.5468214301907457e-07, "loss": 2.3712, "step": 285830 }, { "epoch": 1.0, "learning_rate": 1.5293826316542097e-07, "loss": 2.3671, "step": 285840 }, { "epoch": 1.0, "learning_rate": 1.5119438331176737e-07, "loss": 2.3057, "step": 285850 }, { "epoch": 1.0, "learning_rate": 1.4945050345811378e-07, "loss": 2.3911, "step": 285860 }, { "epoch": 1.0, "learning_rate": 1.4770662360446015e-07, "loss": 2.3095, "step": 285870 }, { "epoch": 1.0, "learning_rate": 1.4596274375080655e-07, "loss": 2.3733, "step": 285880 }, { "epoch": 1.0, "learning_rate": 1.4421886389715295e-07, "loss": 2.3348, "step": 285890 }, { "epoch": 1.0, "learning_rate": 1.4247498404349936e-07, "loss": 2.2955, "step": 285900 }, { "epoch": 1.0, "learning_rate": 1.4073110418984576e-07, "loss": 2.3678, "step": 285910 }, { "epoch": 1.0, "learning_rate": 1.3898722433619216e-07, "loss": 2.3681, "step": 285920 }, { "epoch": 1.0, "learning_rate": 1.3724334448253853e-07, "loss": 2.2165, "step": 285930 }, { "epoch": 1.0, "learning_rate": 1.3549946462888494e-07, "loss": 2.3807, "step": 285940 }, { "epoch": 1.0, "learning_rate": 1.3375558477523134e-07, "loss": 2.3771, "step": 285950 }, { "epoch": 1.0, "learning_rate": 1.3201170492157774e-07, "loss": 2.3432, "step": 285960 }, { "epoch": 1.0, "learning_rate": 1.3026782506792414e-07, "loss": 2.3381, "step": 285970 }, { "epoch": 1.0, "learning_rate": 1.2852394521427052e-07, "loss": 2.2467, "step": 285980 }, { "epoch": 1.0, "learning_rate": 1.2678006536061692e-07, "loss": 2.3453, "step": 285990 }, { "epoch": 1.0, "learning_rate": 1.2503618550696332e-07, "loss": 2.3587, "step": 286000 }, { "epoch": 1.0, "learning_rate": 1.2329230565330972e-07, "loss": 2.369, "step": 286010 }, { "epoch": 1.0, "learning_rate": 1.2154842579965612e-07, "loss": 2.3626, "step": 286020 }, { "epoch": 1.0, "learning_rate": 1.198045459460025e-07, "loss": 2.4206, "step": 286030 }, { "epoch": 1.0, "learning_rate": 1.180606660923489e-07, "loss": 2.3219, "step": 286040 }, { "epoch": 1.0, "learning_rate": 1.163167862386953e-07, "loss": 2.2636, "step": 286050 }, { "epoch": 1.0, "learning_rate": 1.145729063850417e-07, "loss": 2.3141, "step": 286060 }, { "epoch": 1.0, "learning_rate": 1.128290265313881e-07, "loss": 2.3573, "step": 286070 }, { "epoch": 1.0, "learning_rate": 1.110851466777345e-07, "loss": 2.3249, "step": 286080 }, { "epoch": 1.0, "learning_rate": 1.0934126682408088e-07, "loss": 2.3467, "step": 286090 }, { "epoch": 1.0, "learning_rate": 1.0759738697042728e-07, "loss": 2.2809, "step": 286100 }, { "epoch": 1.0, "learning_rate": 1.0585350711677368e-07, "loss": 2.2963, "step": 286110 }, { "epoch": 1.0, "learning_rate": 1.0410962726312009e-07, "loss": 2.3127, "step": 286120 }, { "epoch": 1.0, "learning_rate": 1.0236574740946649e-07, "loss": 2.4025, "step": 286130 }, { "epoch": 1.0, "learning_rate": 1.0062186755581288e-07, "loss": 2.3728, "step": 286140 }, { "epoch": 1.0, "learning_rate": 9.887798770215928e-08, "loss": 2.3214, "step": 286150 }, { "epoch": 1.0, "learning_rate": 9.713410784850568e-08, "loss": 2.3407, "step": 286160 }, { "epoch": 1.0, "learning_rate": 9.539022799485208e-08, "loss": 2.363, "step": 286170 }, { "epoch": 1.0, "learning_rate": 9.364634814119847e-08, "loss": 2.3875, "step": 286180 }, { "epoch": 1.0, "learning_rate": 9.190246828754487e-08, "loss": 2.3301, "step": 286190 }, { "epoch": 1.0, "learning_rate": 9.015858843389126e-08, "loss": 2.2799, "step": 286200 }, { "epoch": 1.0, "learning_rate": 8.841470858023766e-08, "loss": 2.3344, "step": 286210 }, { "epoch": 1.0, "learning_rate": 8.667082872658406e-08, "loss": 2.3721, "step": 286220 }, { "epoch": 1.0, "learning_rate": 8.492694887293045e-08, "loss": 2.3437, "step": 286230 }, { "epoch": 1.0, "learning_rate": 8.318306901927685e-08, "loss": 2.3615, "step": 286240 }, { "epoch": 1.0, "learning_rate": 8.143918916562325e-08, "loss": 2.2441, "step": 286250 }, { "epoch": 1.0, "learning_rate": 7.969530931196964e-08, "loss": 2.3586, "step": 286260 }, { "epoch": 1.0, "learning_rate": 7.795142945831604e-08, "loss": 2.3446, "step": 286270 }, { "epoch": 1.0, "learning_rate": 7.620754960466243e-08, "loss": 2.3193, "step": 286280 }, { "epoch": 1.0, "learning_rate": 7.446366975100883e-08, "loss": 2.2415, "step": 286290 }, { "epoch": 1.0, "learning_rate": 7.271978989735524e-08, "loss": 2.375, "step": 286300 }, { "epoch": 1.0, "learning_rate": 7.097591004370162e-08, "loss": 2.3062, "step": 286310 }, { "epoch": 1.0, "learning_rate": 6.923203019004803e-08, "loss": 2.3738, "step": 286320 }, { "epoch": 1.0, "learning_rate": 6.748815033639443e-08, "loss": 2.3729, "step": 286330 }, { "epoch": 1.0, "learning_rate": 6.574427048274083e-08, "loss": 2.4112, "step": 286340 }, { "epoch": 1.0, "learning_rate": 6.400039062908722e-08, "loss": 2.286, "step": 286350 }, { "epoch": 1.0, "learning_rate": 6.225651077543362e-08, "loss": 2.3367, "step": 286360 }, { "epoch": 1.0, "learning_rate": 6.051263092178002e-08, "loss": 2.3127, "step": 286370 }, { "epoch": 1.0, "learning_rate": 5.8768751068126415e-08, "loss": 2.2882, "step": 286380 }, { "epoch": 1.0, "learning_rate": 5.702487121447281e-08, "loss": 2.3549, "step": 286390 }, { "epoch": 1.0, "learning_rate": 5.5280991360819205e-08, "loss": 2.3747, "step": 286400 }, { "epoch": 1.0, "learning_rate": 5.3537111507165607e-08, "loss": 2.304, "step": 286410 }, { "epoch": 1.0, "learning_rate": 5.1793231653512e-08, "loss": 2.2996, "step": 286420 }, { "epoch": 1.0, "learning_rate": 5.00493517998584e-08, "loss": 2.3123, "step": 286430 }, { "epoch": 1.0, "learning_rate": 4.83054719462048e-08, "loss": 2.301, "step": 286440 }, { "epoch": 1.0, "learning_rate": 4.656159209255119e-08, "loss": 2.3676, "step": 286450 }, { "epoch": 1.0, "learning_rate": 4.481771223889759e-08, "loss": 2.298, "step": 286460 }, { "epoch": 1.0, "learning_rate": 4.307383238524399e-08, "loss": 2.3243, "step": 286470 }, { "epoch": 1.0, "learning_rate": 4.1329952531590385e-08, "loss": 2.3733, "step": 286480 }, { "epoch": 1.0, "learning_rate": 3.958607267793678e-08, "loss": 2.3593, "step": 286490 }, { "epoch": 1.0, "learning_rate": 3.7842192824283175e-08, "loss": 2.2642, "step": 286500 }, { "epoch": 0.5, "learning_rate": 2.501804915648532e-05, "loss": 2.2268, "step": 286510 }, { "epoch": 0.5, "learning_rate": 2.501717721655849e-05, "loss": 2.2357, "step": 286520 }, { "epoch": 0.5, "learning_rate": 2.5016305276631664e-05, "loss": 2.2253, "step": 286530 }, { "epoch": 0.5, "learning_rate": 2.5015433336704834e-05, "loss": 2.3401, "step": 286540 }, { "epoch": 0.5, "learning_rate": 2.5014561396778008e-05, "loss": 2.3747, "step": 286550 }, { "epoch": 0.5, "learning_rate": 2.501368945685118e-05, "loss": 2.3105, "step": 286560 }, { "epoch": 0.5, "learning_rate": 2.5012817516924352e-05, "loss": 2.2003, "step": 286570 }, { "epoch": 0.5, "learning_rate": 2.5011945576997532e-05, "loss": 2.3854, "step": 286580 }, { "epoch": 0.5, "learning_rate": 2.5011073637070703e-05, "loss": 2.1984, "step": 286590 }, { "epoch": 0.5, "learning_rate": 2.5010201697143877e-05, "loss": 2.355, "step": 286600 }, { "epoch": 0.5, "learning_rate": 2.5009329757217047e-05, "loss": 2.3667, "step": 286610 }, { "epoch": 0.5, "learning_rate": 2.500845781729022e-05, "loss": 2.2959, "step": 286620 }, { "epoch": 0.5, "learning_rate": 2.5007585877363394e-05, "loss": 2.3303, "step": 286630 }, { "epoch": 0.5, "learning_rate": 2.5006713937436565e-05, "loss": 2.4082, "step": 286640 }, { "epoch": 0.5, "learning_rate": 2.500584199750974e-05, "loss": 2.3471, "step": 286650 }, { "epoch": 0.5, "learning_rate": 2.5004970057582916e-05, "loss": 2.3459, "step": 286660 }, { "epoch": 0.5, "learning_rate": 2.500409811765609e-05, "loss": 2.3638, "step": 286670 }, { "epoch": 0.5, "learning_rate": 2.500322617772926e-05, "loss": 2.4141, "step": 286680 }, { "epoch": 0.5, "learning_rate": 2.5002354237802434e-05, "loss": 2.4243, "step": 286690 }, { "epoch": 0.5, "learning_rate": 2.5001482297875607e-05, "loss": 2.3172, "step": 286700 }, { "epoch": 0.5, "learning_rate": 2.5000610357948778e-05, "loss": 2.2777, "step": 286710 }, { "epoch": 0.5, "learning_rate": 2.4999738418021955e-05, "loss": 2.3301, "step": 286720 }, { "epoch": 0.5, "learning_rate": 2.4998866478095125e-05, "loss": 2.4074, "step": 286730 }, { "epoch": 0.5, "learning_rate": 2.49979945381683e-05, "loss": 2.4159, "step": 286740 }, { "epoch": 0.5, "learning_rate": 2.4997122598241473e-05, "loss": 2.3664, "step": 286750 }, { "epoch": 0.5, "learning_rate": 2.4996250658314647e-05, "loss": 2.425, "step": 286760 }, { "epoch": 0.5, "learning_rate": 2.4995378718387817e-05, "loss": 2.3309, "step": 286770 }, { "epoch": 0.5, "learning_rate": 2.499450677846099e-05, "loss": 2.3227, "step": 286780 }, { "epoch": 0.5, "learning_rate": 2.4993634838534165e-05, "loss": 2.3188, "step": 286790 }, { "epoch": 0.5, "learning_rate": 2.499276289860734e-05, "loss": 2.2535, "step": 286800 }, { "epoch": 0.5, "learning_rate": 2.4991890958680512e-05, "loss": 2.4168, "step": 286810 }, { "epoch": 0.5, "learning_rate": 2.4991019018753686e-05, "loss": 2.3898, "step": 286820 }, { "epoch": 0.5, "learning_rate": 2.499014707882686e-05, "loss": 2.174, "step": 286830 }, { "epoch": 0.5, "learning_rate": 2.498927513890003e-05, "loss": 2.2998, "step": 286840 }, { "epoch": 0.5, "learning_rate": 2.4988403198973204e-05, "loss": 2.4884, "step": 286850 }, { "epoch": 0.5, "learning_rate": 2.4987531259046378e-05, "loss": 2.2641, "step": 286860 }, { "epoch": 0.5, "learning_rate": 2.498665931911955e-05, "loss": 2.2546, "step": 286870 }, { "epoch": 0.5, "learning_rate": 2.4985787379192725e-05, "loss": 2.3294, "step": 286880 }, { "epoch": 0.5, "learning_rate": 2.4984915439265896e-05, "loss": 2.2593, "step": 286890 }, { "epoch": 0.5, "learning_rate": 2.4984043499339073e-05, "loss": 2.3751, "step": 286900 }, { "epoch": 0.5, "learning_rate": 2.4983171559412243e-05, "loss": 2.4327, "step": 286910 }, { "epoch": 0.5, "learning_rate": 2.4982299619485417e-05, "loss": 2.4162, "step": 286920 }, { "epoch": 0.5, "learning_rate": 2.498142767955859e-05, "loss": 2.3835, "step": 286930 }, { "epoch": 0.5, "learning_rate": 2.4980555739631764e-05, "loss": 2.3808, "step": 286940 }, { "epoch": 0.5, "learning_rate": 2.4979683799704938e-05, "loss": 2.4371, "step": 286950 }, { "epoch": 0.5, "learning_rate": 2.497881185977811e-05, "loss": 2.3955, "step": 286960 }, { "epoch": 0.5, "learning_rate": 2.4977939919851286e-05, "loss": 2.3837, "step": 286970 }, { "epoch": 0.5, "learning_rate": 2.4977067979924456e-05, "loss": 2.3439, "step": 286980 }, { "epoch": 0.5, "learning_rate": 2.497619603999763e-05, "loss": 2.3856, "step": 286990 }, { "epoch": 0.5, "learning_rate": 2.49753241000708e-05, "loss": 2.3867, "step": 287000 }, { "epoch": 0.5, "learning_rate": 2.4974452160143977e-05, "loss": 2.2328, "step": 287010 }, { "epoch": 0.5, "learning_rate": 2.4973580220217148e-05, "loss": 2.3675, "step": 287020 }, { "epoch": 0.5, "learning_rate": 2.497270828029032e-05, "loss": 2.4436, "step": 287030 }, { "epoch": 0.5, "learning_rate": 2.4971836340363495e-05, "loss": 2.3239, "step": 287040 }, { "epoch": 0.5, "learning_rate": 2.497096440043667e-05, "loss": 2.4047, "step": 287050 }, { "epoch": 0.5, "learning_rate": 2.4970092460509843e-05, "loss": 2.4817, "step": 287060 }, { "epoch": 0.5, "learning_rate": 2.4969220520583013e-05, "loss": 2.3425, "step": 287070 }, { "epoch": 0.5, "learning_rate": 2.496834858065619e-05, "loss": 2.3675, "step": 287080 }, { "epoch": 0.5, "learning_rate": 2.496747664072936e-05, "loss": 2.386, "step": 287090 }, { "epoch": 0.5, "learning_rate": 2.4966604700802535e-05, "loss": 2.3983, "step": 287100 }, { "epoch": 0.5, "learning_rate": 2.496573276087571e-05, "loss": 2.3558, "step": 287110 }, { "epoch": 0.5, "learning_rate": 2.4964860820948882e-05, "loss": 2.2954, "step": 287120 }, { "epoch": 0.5, "learning_rate": 2.4963988881022056e-05, "loss": 2.4245, "step": 287130 }, { "epoch": 0.5, "learning_rate": 2.4963116941095226e-05, "loss": 2.3726, "step": 287140 }, { "epoch": 0.5, "learning_rate": 2.49622450011684e-05, "loss": 2.4018, "step": 287150 }, { "epoch": 0.5, "learning_rate": 2.4961373061241574e-05, "loss": 2.4077, "step": 287160 }, { "epoch": 0.5, "learning_rate": 2.4960501121314748e-05, "loss": 2.3067, "step": 287170 }, { "epoch": 0.5, "learning_rate": 2.4959629181387918e-05, "loss": 2.4695, "step": 287180 }, { "epoch": 0.5, "learning_rate": 2.4958757241461095e-05, "loss": 2.4182, "step": 287190 }, { "epoch": 0.5, "learning_rate": 2.495788530153427e-05, "loss": 2.3528, "step": 287200 }, { "epoch": 0.5, "learning_rate": 2.495701336160744e-05, "loss": 2.1961, "step": 287210 }, { "epoch": 0.5, "learning_rate": 2.4956141421680613e-05, "loss": 2.4111, "step": 287220 }, { "epoch": 0.5, "learning_rate": 2.4955269481753787e-05, "loss": 2.3462, "step": 287230 }, { "epoch": 0.5, "learning_rate": 2.495439754182696e-05, "loss": 2.4084, "step": 287240 }, { "epoch": 0.5, "learning_rate": 2.495352560190013e-05, "loss": 2.3031, "step": 287250 }, { "epoch": 0.5, "learning_rate": 2.4952653661973305e-05, "loss": 2.4129, "step": 287260 }, { "epoch": 0.5, "learning_rate": 2.495178172204648e-05, "loss": 2.3508, "step": 287270 }, { "epoch": 0.5, "learning_rate": 2.4950909782119652e-05, "loss": 2.2933, "step": 287280 }, { "epoch": 0.5, "learning_rate": 2.4950037842192826e-05, "loss": 2.3969, "step": 287290 }, { "epoch": 0.5, "learning_rate": 2.4949165902265996e-05, "loss": 2.3137, "step": 287300 }, { "epoch": 0.5, "learning_rate": 2.4948293962339174e-05, "loss": 2.3964, "step": 287310 }, { "epoch": 0.5, "learning_rate": 2.4947422022412344e-05, "loss": 2.3855, "step": 287320 }, { "epoch": 0.5, "learning_rate": 2.4946550082485518e-05, "loss": 2.3617, "step": 287330 }, { "epoch": 0.5, "learning_rate": 2.494567814255869e-05, "loss": 2.3448, "step": 287340 }, { "epoch": 0.5, "learning_rate": 2.4944806202631865e-05, "loss": 2.4593, "step": 287350 }, { "epoch": 0.5, "learning_rate": 2.494393426270504e-05, "loss": 2.3693, "step": 287360 }, { "epoch": 0.5, "learning_rate": 2.494306232277821e-05, "loss": 2.3633, "step": 287370 }, { "epoch": 0.5, "learning_rate": 2.4942190382851387e-05, "loss": 2.4289, "step": 287380 }, { "epoch": 0.5, "learning_rate": 2.4941318442924557e-05, "loss": 2.4064, "step": 287390 }, { "epoch": 0.5, "learning_rate": 2.494044650299773e-05, "loss": 2.4214, "step": 287400 }, { "epoch": 0.5, "learning_rate": 2.49395745630709e-05, "loss": 2.3502, "step": 287410 }, { "epoch": 0.5, "learning_rate": 2.4938702623144078e-05, "loss": 2.4025, "step": 287420 }, { "epoch": 0.5, "learning_rate": 2.4937830683217252e-05, "loss": 2.3359, "step": 287430 }, { "epoch": 0.5, "learning_rate": 2.4936958743290422e-05, "loss": 2.4125, "step": 287440 }, { "epoch": 0.5, "learning_rate": 2.49360868033636e-05, "loss": 2.3971, "step": 287450 }, { "epoch": 0.5, "learning_rate": 2.493521486343677e-05, "loss": 2.456, "step": 287460 }, { "epoch": 0.5, "learning_rate": 2.4934342923509944e-05, "loss": 2.4363, "step": 287470 }, { "epoch": 0.5, "learning_rate": 2.4933470983583114e-05, "loss": 2.3761, "step": 287480 }, { "epoch": 0.5, "learning_rate": 2.493259904365629e-05, "loss": 2.4089, "step": 287490 }, { "epoch": 0.5, "learning_rate": 2.493172710372946e-05, "loss": 2.3767, "step": 287500 }, { "epoch": 0.5, "learning_rate": 2.4930855163802635e-05, "loss": 2.3656, "step": 287510 }, { "epoch": 0.5, "learning_rate": 2.492998322387581e-05, "loss": 2.4044, "step": 287520 }, { "epoch": 0.5, "learning_rate": 2.4929111283948983e-05, "loss": 2.4082, "step": 287530 }, { "epoch": 0.5, "learning_rate": 2.4928239344022157e-05, "loss": 2.3255, "step": 287540 }, { "epoch": 0.5, "learning_rate": 2.4927367404095327e-05, "loss": 2.404, "step": 287550 }, { "epoch": 0.5, "learning_rate": 2.49264954641685e-05, "loss": 2.4031, "step": 287560 }, { "epoch": 0.5, "learning_rate": 2.4925623524241675e-05, "loss": 2.4274, "step": 287570 }, { "epoch": 0.5, "learning_rate": 2.492475158431485e-05, "loss": 2.1763, "step": 287580 }, { "epoch": 0.5, "learning_rate": 2.4923879644388022e-05, "loss": 2.3126, "step": 287590 }, { "epoch": 0.5, "learning_rate": 2.4923007704461196e-05, "loss": 2.4297, "step": 287600 }, { "epoch": 0.5, "learning_rate": 2.492213576453437e-05, "loss": 2.3406, "step": 287610 }, { "epoch": 0.5, "learning_rate": 2.492126382460754e-05, "loss": 2.412, "step": 287620 }, { "epoch": 0.5, "learning_rate": 2.4920391884680714e-05, "loss": 2.3748, "step": 287630 }, { "epoch": 0.5, "learning_rate": 2.4919519944753888e-05, "loss": 2.1283, "step": 287640 }, { "epoch": 0.5, "learning_rate": 2.491864800482706e-05, "loss": 2.3526, "step": 287650 }, { "epoch": 0.5, "learning_rate": 2.4917776064900232e-05, "loss": 2.4206, "step": 287660 }, { "epoch": 0.5, "learning_rate": 2.4916904124973406e-05, "loss": 2.351, "step": 287670 }, { "epoch": 0.5, "learning_rate": 2.4916032185046583e-05, "loss": 2.3685, "step": 287680 }, { "epoch": 0.5, "learning_rate": 2.4915160245119753e-05, "loss": 2.338, "step": 287690 }, { "epoch": 0.5, "learning_rate": 2.4914288305192927e-05, "loss": 2.2593, "step": 287700 }, { "epoch": 0.5, "learning_rate": 2.4913416365266097e-05, "loss": 2.3347, "step": 287710 }, { "epoch": 0.5, "learning_rate": 2.4912544425339274e-05, "loss": 2.3992, "step": 287720 }, { "epoch": 0.5, "learning_rate": 2.4911672485412445e-05, "loss": 2.4958, "step": 287730 }, { "epoch": 0.5, "learning_rate": 2.491080054548562e-05, "loss": 2.3532, "step": 287740 }, { "epoch": 0.5, "learning_rate": 2.4909928605558792e-05, "loss": 2.3036, "step": 287750 }, { "epoch": 0.5, "learning_rate": 2.4909056665631966e-05, "loss": 2.3262, "step": 287760 }, { "epoch": 0.5, "learning_rate": 2.490818472570514e-05, "loss": 2.3747, "step": 287770 }, { "epoch": 0.5, "learning_rate": 2.490731278577831e-05, "loss": 2.3014, "step": 287780 }, { "epoch": 0.5, "learning_rate": 2.4906440845851487e-05, "loss": 2.4001, "step": 287790 }, { "epoch": 0.5, "learning_rate": 2.4905568905924658e-05, "loss": 2.3995, "step": 287800 }, { "epoch": 0.5, "learning_rate": 2.490469696599783e-05, "loss": 2.3386, "step": 287810 }, { "epoch": 0.5, "learning_rate": 2.4903825026071005e-05, "loss": 2.4022, "step": 287820 }, { "epoch": 0.5, "learning_rate": 2.490295308614418e-05, "loss": 2.3378, "step": 287830 }, { "epoch": 0.5, "learning_rate": 2.4902081146217353e-05, "loss": 2.3522, "step": 287840 }, { "epoch": 0.5, "learning_rate": 2.4901209206290523e-05, "loss": 2.3204, "step": 287850 }, { "epoch": 0.5, "learning_rate": 2.49003372663637e-05, "loss": 2.3191, "step": 287860 }, { "epoch": 0.5, "learning_rate": 2.489946532643687e-05, "loss": 2.2889, "step": 287870 }, { "epoch": 0.5, "learning_rate": 2.4898593386510045e-05, "loss": 2.3418, "step": 287880 }, { "epoch": 0.5, "learning_rate": 2.4897721446583215e-05, "loss": 2.3664, "step": 287890 }, { "epoch": 0.5, "learning_rate": 2.4896849506656392e-05, "loss": 2.2569, "step": 287900 }, { "epoch": 0.5, "learning_rate": 2.4895977566729562e-05, "loss": 2.3267, "step": 287910 }, { "epoch": 0.5, "learning_rate": 2.4895105626802736e-05, "loss": 2.3981, "step": 287920 }, { "epoch": 0.5, "learning_rate": 2.489423368687591e-05, "loss": 2.4334, "step": 287930 }, { "epoch": 0.5, "learning_rate": 2.4893361746949084e-05, "loss": 2.367, "step": 287940 }, { "epoch": 0.5, "learning_rate": 2.4892489807022258e-05, "loss": 2.5344, "step": 287950 }, { "epoch": 0.5, "learning_rate": 2.4891617867095428e-05, "loss": 2.2886, "step": 287960 }, { "epoch": 0.5, "learning_rate": 2.4890745927168602e-05, "loss": 2.3179, "step": 287970 }, { "epoch": 0.5, "learning_rate": 2.4889873987241775e-05, "loss": 2.3962, "step": 287980 }, { "epoch": 0.5, "learning_rate": 2.488900204731495e-05, "loss": 2.4935, "step": 287990 }, { "epoch": 0.5, "learning_rate": 2.4888130107388123e-05, "loss": 2.3311, "step": 288000 }, { "epoch": 0.5, "learning_rate": 2.4887258167461297e-05, "loss": 2.5074, "step": 288010 }, { "epoch": 0.5, "learning_rate": 2.488638622753447e-05, "loss": 2.4023, "step": 288020 }, { "epoch": 0.5, "learning_rate": 2.488551428760764e-05, "loss": 2.3538, "step": 288030 }, { "epoch": 0.5, "learning_rate": 2.4884642347680815e-05, "loss": 2.3427, "step": 288040 }, { "epoch": 0.5, "learning_rate": 2.488377040775399e-05, "loss": 2.3163, "step": 288050 }, { "epoch": 0.5, "learning_rate": 2.4882898467827162e-05, "loss": 2.4777, "step": 288060 }, { "epoch": 0.5, "learning_rate": 2.4882026527900336e-05, "loss": 2.2752, "step": 288070 }, { "epoch": 0.5, "learning_rate": 2.4881154587973506e-05, "loss": 2.3832, "step": 288080 }, { "epoch": 0.5, "learning_rate": 2.4880282648046684e-05, "loss": 2.4503, "step": 288090 }, { "epoch": 0.5, "learning_rate": 2.4879410708119854e-05, "loss": 2.3353, "step": 288100 }, { "epoch": 0.5, "learning_rate": 2.4878538768193028e-05, "loss": 2.2827, "step": 288110 }, { "epoch": 0.5, "learning_rate": 2.48776668282662e-05, "loss": 2.4014, "step": 288120 }, { "epoch": 0.5, "learning_rate": 2.4876794888339375e-05, "loss": 2.365, "step": 288130 }, { "epoch": 0.5, "learning_rate": 2.4875922948412546e-05, "loss": 2.4174, "step": 288140 }, { "epoch": 0.5, "learning_rate": 2.487505100848572e-05, "loss": 2.3416, "step": 288150 }, { "epoch": 0.5, "learning_rate": 2.4874179068558897e-05, "loss": 2.3422, "step": 288160 }, { "epoch": 0.5, "learning_rate": 2.4873307128632067e-05, "loss": 2.2966, "step": 288170 }, { "epoch": 0.5, "learning_rate": 2.487243518870524e-05, "loss": 2.3593, "step": 288180 }, { "epoch": 0.5, "learning_rate": 2.487156324877841e-05, "loss": 2.2661, "step": 288190 }, { "epoch": 0.5, "learning_rate": 2.4870691308851588e-05, "loss": 2.3521, "step": 288200 }, { "epoch": 0.5, "learning_rate": 2.486981936892476e-05, "loss": 2.4595, "step": 288210 }, { "epoch": 0.5, "learning_rate": 2.4868947428997932e-05, "loss": 2.2664, "step": 288220 }, { "epoch": 0.5, "learning_rate": 2.4868075489071106e-05, "loss": 2.3477, "step": 288230 }, { "epoch": 0.5, "learning_rate": 2.486720354914428e-05, "loss": 2.3825, "step": 288240 }, { "epoch": 0.5, "learning_rate": 2.4866331609217454e-05, "loss": 2.398, "step": 288250 }, { "epoch": 0.5, "learning_rate": 2.4865459669290624e-05, "loss": 2.2126, "step": 288260 }, { "epoch": 0.5, "learning_rate": 2.48645877293638e-05, "loss": 2.4237, "step": 288270 }, { "epoch": 0.5, "learning_rate": 2.486371578943697e-05, "loss": 2.3546, "step": 288280 }, { "epoch": 0.5, "learning_rate": 2.4862843849510145e-05, "loss": 2.3357, "step": 288290 }, { "epoch": 0.5, "learning_rate": 2.486197190958332e-05, "loss": 2.3614, "step": 288300 }, { "epoch": 0.5, "learning_rate": 2.4861099969656493e-05, "loss": 2.4106, "step": 288310 }, { "epoch": 0.5, "learning_rate": 2.4860228029729667e-05, "loss": 2.2382, "step": 288320 }, { "epoch": 0.5, "learning_rate": 2.4859356089802837e-05, "loss": 2.3342, "step": 288330 }, { "epoch": 0.5, "learning_rate": 2.485848414987601e-05, "loss": 2.3817, "step": 288340 }, { "epoch": 0.5, "learning_rate": 2.4857612209949185e-05, "loss": 2.392, "step": 288350 }, { "epoch": 0.5, "learning_rate": 2.485674027002236e-05, "loss": 2.3458, "step": 288360 }, { "epoch": 0.5, "learning_rate": 2.485586833009553e-05, "loss": 2.3879, "step": 288370 }, { "epoch": 0.5, "learning_rate": 2.4854996390168706e-05, "loss": 2.3725, "step": 288380 }, { "epoch": 0.5, "learning_rate": 2.4854124450241876e-05, "loss": 2.3492, "step": 288390 }, { "epoch": 0.5, "learning_rate": 2.485325251031505e-05, "loss": 2.3735, "step": 288400 }, { "epoch": 0.5, "learning_rate": 2.4852380570388224e-05, "loss": 2.3926, "step": 288410 }, { "epoch": 0.5, "learning_rate": 2.4851508630461398e-05, "loss": 2.2688, "step": 288420 }, { "epoch": 0.5, "learning_rate": 2.485063669053457e-05, "loss": 2.295, "step": 288430 }, { "epoch": 0.5, "learning_rate": 2.4849764750607742e-05, "loss": 2.2295, "step": 288440 }, { "epoch": 0.5, "learning_rate": 2.4848892810680916e-05, "loss": 2.2932, "step": 288450 }, { "epoch": 0.5, "learning_rate": 2.484802087075409e-05, "loss": 2.3662, "step": 288460 }, { "epoch": 0.5, "learning_rate": 2.4847148930827263e-05, "loss": 2.4126, "step": 288470 }, { "epoch": 0.5, "learning_rate": 2.4846276990900437e-05, "loss": 2.3616, "step": 288480 }, { "epoch": 0.5, "learning_rate": 2.4845405050973607e-05, "loss": 2.4475, "step": 288490 }, { "epoch": 0.5, "learning_rate": 2.4844533111046784e-05, "loss": 2.2703, "step": 288500 }, { "epoch": 0.5, "learning_rate": 2.4843661171119955e-05, "loss": 2.3055, "step": 288510 }, { "epoch": 0.5, "learning_rate": 2.484278923119313e-05, "loss": 2.3432, "step": 288520 }, { "epoch": 0.5, "learning_rate": 2.4841917291266302e-05, "loss": 2.3521, "step": 288530 }, { "epoch": 0.5, "learning_rate": 2.4841045351339476e-05, "loss": 2.4403, "step": 288540 }, { "epoch": 0.5, "learning_rate": 2.484017341141265e-05, "loss": 2.3355, "step": 288550 }, { "epoch": 0.5, "learning_rate": 2.483930147148582e-05, "loss": 2.3621, "step": 288560 }, { "epoch": 0.5, "learning_rate": 2.4838429531558997e-05, "loss": 2.369, "step": 288570 }, { "epoch": 0.5, "learning_rate": 2.4837557591632168e-05, "loss": 2.2664, "step": 288580 }, { "epoch": 0.5, "learning_rate": 2.483668565170534e-05, "loss": 2.3053, "step": 288590 }, { "epoch": 0.5, "learning_rate": 2.4835813711778512e-05, "loss": 2.345, "step": 288600 }, { "epoch": 0.5, "learning_rate": 2.483494177185169e-05, "loss": 2.376, "step": 288610 }, { "epoch": 0.5, "learning_rate": 2.483406983192486e-05, "loss": 2.3433, "step": 288620 }, { "epoch": 0.5, "learning_rate": 2.4833197891998033e-05, "loss": 2.3061, "step": 288630 }, { "epoch": 0.5, "learning_rate": 2.4832325952071207e-05, "loss": 2.3017, "step": 288640 }, { "epoch": 0.5, "learning_rate": 2.483145401214438e-05, "loss": 2.4045, "step": 288650 }, { "epoch": 0.5, "learning_rate": 2.4830582072217555e-05, "loss": 2.4386, "step": 288660 }, { "epoch": 0.5, "learning_rate": 2.4829710132290725e-05, "loss": 2.3269, "step": 288670 }, { "epoch": 0.5, "learning_rate": 2.4828838192363902e-05, "loss": 2.3436, "step": 288680 }, { "epoch": 0.5, "learning_rate": 2.4827966252437072e-05, "loss": 2.3689, "step": 288690 }, { "epoch": 0.5, "learning_rate": 2.4827094312510246e-05, "loss": 2.343, "step": 288700 }, { "epoch": 0.5, "learning_rate": 2.482622237258342e-05, "loss": 2.4351, "step": 288710 }, { "epoch": 0.5, "learning_rate": 2.4825350432656594e-05, "loss": 2.3617, "step": 288720 }, { "epoch": 0.5, "learning_rate": 2.4824478492729768e-05, "loss": 2.3473, "step": 288730 }, { "epoch": 0.5, "learning_rate": 2.4823606552802938e-05, "loss": 2.3194, "step": 288740 }, { "epoch": 0.5, "learning_rate": 2.4822734612876112e-05, "loss": 2.3265, "step": 288750 }, { "epoch": 0.5, "learning_rate": 2.4821862672949286e-05, "loss": 2.3241, "step": 288760 }, { "epoch": 0.5, "learning_rate": 2.482099073302246e-05, "loss": 2.4199, "step": 288770 }, { "epoch": 0.5, "learning_rate": 2.4820118793095633e-05, "loss": 2.2634, "step": 288780 }, { "epoch": 0.5, "learning_rate": 2.4819246853168807e-05, "loss": 2.4318, "step": 288790 }, { "epoch": 0.5, "learning_rate": 2.481837491324198e-05, "loss": 2.3056, "step": 288800 }, { "epoch": 0.5, "learning_rate": 2.481750297331515e-05, "loss": 2.3648, "step": 288810 }, { "epoch": 0.5, "learning_rate": 2.4816631033388325e-05, "loss": 2.4045, "step": 288820 }, { "epoch": 0.5, "learning_rate": 2.48157590934615e-05, "loss": 2.2624, "step": 288830 }, { "epoch": 0.5, "learning_rate": 2.4814887153534672e-05, "loss": 2.355, "step": 288840 }, { "epoch": 0.5, "learning_rate": 2.4814015213607843e-05, "loss": 2.2775, "step": 288850 }, { "epoch": 0.5, "learning_rate": 2.4813143273681016e-05, "loss": 2.375, "step": 288860 }, { "epoch": 0.5, "learning_rate": 2.481227133375419e-05, "loss": 2.3724, "step": 288870 }, { "epoch": 0.5, "learning_rate": 2.4811399393827364e-05, "loss": 2.4173, "step": 288880 }, { "epoch": 0.5, "learning_rate": 2.4810527453900538e-05, "loss": 2.3648, "step": 288890 }, { "epoch": 0.5, "learning_rate": 2.4809655513973708e-05, "loss": 2.1772, "step": 288900 }, { "epoch": 0.5, "learning_rate": 2.4808783574046885e-05, "loss": 2.4278, "step": 288910 }, { "epoch": 0.5, "learning_rate": 2.4807911634120056e-05, "loss": 2.3561, "step": 288920 }, { "epoch": 0.5, "learning_rate": 2.480703969419323e-05, "loss": 2.2298, "step": 288930 }, { "epoch": 0.5, "learning_rate": 2.4806167754266403e-05, "loss": 2.2692, "step": 288940 }, { "epoch": 0.5, "learning_rate": 2.4805295814339577e-05, "loss": 2.3031, "step": 288950 }, { "epoch": 0.5, "learning_rate": 2.480442387441275e-05, "loss": 2.4073, "step": 288960 }, { "epoch": 0.5, "learning_rate": 2.480355193448592e-05, "loss": 2.4386, "step": 288970 }, { "epoch": 0.5, "learning_rate": 2.4802679994559098e-05, "loss": 2.3414, "step": 288980 }, { "epoch": 0.5, "learning_rate": 2.480180805463227e-05, "loss": 2.3003, "step": 288990 }, { "epoch": 0.5, "learning_rate": 2.4800936114705442e-05, "loss": 2.3353, "step": 289000 }, { "epoch": 0.5, "learning_rate": 2.4800064174778613e-05, "loss": 2.3224, "step": 289010 }, { "epoch": 0.5, "learning_rate": 2.479919223485179e-05, "loss": 2.4021, "step": 289020 }, { "epoch": 0.5, "learning_rate": 2.4798320294924964e-05, "loss": 2.4544, "step": 289030 }, { "epoch": 0.5, "learning_rate": 2.4797448354998134e-05, "loss": 2.4166, "step": 289040 }, { "epoch": 0.5, "learning_rate": 2.479657641507131e-05, "loss": 2.2541, "step": 289050 }, { "epoch": 0.5, "learning_rate": 2.479570447514448e-05, "loss": 2.3954, "step": 289060 }, { "epoch": 0.5, "learning_rate": 2.4794832535217655e-05, "loss": 2.348, "step": 289070 }, { "epoch": 0.5, "learning_rate": 2.4793960595290826e-05, "loss": 2.3917, "step": 289080 }, { "epoch": 0.5, "learning_rate": 2.4793088655364003e-05, "loss": 2.2845, "step": 289090 }, { "epoch": 0.5, "learning_rate": 2.4792216715437173e-05, "loss": 2.3718, "step": 289100 }, { "epoch": 0.5, "learning_rate": 2.4791344775510347e-05, "loss": 2.3641, "step": 289110 }, { "epoch": 0.5, "learning_rate": 2.479047283558352e-05, "loss": 2.3161, "step": 289120 }, { "epoch": 0.5, "learning_rate": 2.4789600895656695e-05, "loss": 2.3821, "step": 289130 }, { "epoch": 0.5, "learning_rate": 2.478872895572987e-05, "loss": 2.3472, "step": 289140 }, { "epoch": 0.5, "learning_rate": 2.478785701580304e-05, "loss": 2.2837, "step": 289150 }, { "epoch": 0.5, "learning_rate": 2.4786985075876213e-05, "loss": 2.2695, "step": 289160 }, { "epoch": 0.5, "learning_rate": 2.4786113135949386e-05, "loss": 2.4039, "step": 289170 }, { "epoch": 0.5, "learning_rate": 2.478524119602256e-05, "loss": 2.3869, "step": 289180 }, { "epoch": 0.5, "learning_rate": 2.4784369256095734e-05, "loss": 2.4482, "step": 289190 }, { "epoch": 0.5, "learning_rate": 2.4783497316168908e-05, "loss": 2.3041, "step": 289200 }, { "epoch": 0.5, "learning_rate": 2.478262537624208e-05, "loss": 2.373, "step": 289210 }, { "epoch": 0.5, "learning_rate": 2.4781753436315252e-05, "loss": 2.2963, "step": 289220 }, { "epoch": 0.5, "learning_rate": 2.4780881496388426e-05, "loss": 2.471, "step": 289230 }, { "epoch": 0.5, "learning_rate": 2.47800095564616e-05, "loss": 2.2769, "step": 289240 }, { "epoch": 0.5, "learning_rate": 2.4779137616534773e-05, "loss": 2.3131, "step": 289250 }, { "epoch": 0.5, "learning_rate": 2.4778265676607944e-05, "loss": 2.2801, "step": 289260 }, { "epoch": 0.5, "learning_rate": 2.4777393736681117e-05, "loss": 2.3475, "step": 289270 }, { "epoch": 0.5, "learning_rate": 2.4776521796754294e-05, "loss": 2.3625, "step": 289280 }, { "epoch": 0.5, "learning_rate": 2.4775649856827465e-05, "loss": 2.2698, "step": 289290 }, { "epoch": 0.5, "learning_rate": 2.477477791690064e-05, "loss": 2.4298, "step": 289300 }, { "epoch": 0.5, "learning_rate": 2.477390597697381e-05, "loss": 2.3185, "step": 289310 }, { "epoch": 0.5, "learning_rate": 2.4773034037046986e-05, "loss": 2.3965, "step": 289320 }, { "epoch": 0.5, "learning_rate": 2.4772162097120157e-05, "loss": 2.3904, "step": 289330 }, { "epoch": 0.5, "learning_rate": 2.477129015719333e-05, "loss": 2.4527, "step": 289340 }, { "epoch": 0.5, "learning_rate": 2.4770418217266504e-05, "loss": 2.3859, "step": 289350 }, { "epoch": 0.5, "learning_rate": 2.4769546277339678e-05, "loss": 2.3495, "step": 289360 }, { "epoch": 0.5, "learning_rate": 2.476867433741285e-05, "loss": 2.1536, "step": 289370 }, { "epoch": 0.5, "learning_rate": 2.4767802397486022e-05, "loss": 2.2443, "step": 289380 }, { "epoch": 0.5, "learning_rate": 2.47669304575592e-05, "loss": 2.3802, "step": 289390 }, { "epoch": 0.5, "learning_rate": 2.476605851763237e-05, "loss": 2.4404, "step": 289400 }, { "epoch": 0.5, "learning_rate": 2.4765186577705543e-05, "loss": 2.3591, "step": 289410 }, { "epoch": 0.5, "learning_rate": 2.4764314637778717e-05, "loss": 2.3411, "step": 289420 }, { "epoch": 0.5, "learning_rate": 2.476344269785189e-05, "loss": 2.3765, "step": 289430 }, { "epoch": 0.5, "learning_rate": 2.4762570757925065e-05, "loss": 2.3931, "step": 289440 }, { "epoch": 0.5, "learning_rate": 2.4761698817998235e-05, "loss": 2.3829, "step": 289450 }, { "epoch": 0.5, "learning_rate": 2.4760826878071412e-05, "loss": 2.4214, "step": 289460 }, { "epoch": 0.5, "learning_rate": 2.4759954938144583e-05, "loss": 2.5588, "step": 289470 }, { "epoch": 0.5, "learning_rate": 2.4759082998217756e-05, "loss": 2.1934, "step": 289480 }, { "epoch": 0.5, "learning_rate": 2.4758211058290927e-05, "loss": 2.3098, "step": 289490 }, { "epoch": 0.5, "learning_rate": 2.4757339118364104e-05, "loss": 2.2045, "step": 289500 }, { "epoch": 0.5, "learning_rate": 2.4756467178437278e-05, "loss": 2.3424, "step": 289510 }, { "epoch": 0.5, "learning_rate": 2.4755595238510448e-05, "loss": 2.3851, "step": 289520 }, { "epoch": 0.5, "learning_rate": 2.4754723298583622e-05, "loss": 2.3599, "step": 289530 }, { "epoch": 0.5, "learning_rate": 2.4753851358656796e-05, "loss": 2.2394, "step": 289540 }, { "epoch": 0.5, "learning_rate": 2.475297941872997e-05, "loss": 2.3502, "step": 289550 }, { "epoch": 0.5, "learning_rate": 2.475210747880314e-05, "loss": 2.2637, "step": 289560 }, { "epoch": 0.5, "learning_rate": 2.4751235538876313e-05, "loss": 2.4154, "step": 289570 }, { "epoch": 0.5, "learning_rate": 2.4750363598949487e-05, "loss": 2.402, "step": 289580 }, { "epoch": 0.51, "learning_rate": 2.474949165902266e-05, "loss": 2.194, "step": 289590 }, { "epoch": 0.51, "learning_rate": 2.4748619719095835e-05, "loss": 2.3227, "step": 289600 }, { "epoch": 0.51, "learning_rate": 2.474774777916901e-05, "loss": 2.3868, "step": 289610 }, { "epoch": 0.51, "learning_rate": 2.4746875839242182e-05, "loss": 2.3488, "step": 289620 }, { "epoch": 0.51, "learning_rate": 2.4746003899315353e-05, "loss": 2.4322, "step": 289630 }, { "epoch": 0.51, "learning_rate": 2.4745131959388526e-05, "loss": 2.5103, "step": 289640 }, { "epoch": 0.51, "learning_rate": 2.47442600194617e-05, "loss": 2.2787, "step": 289650 }, { "epoch": 0.51, "learning_rate": 2.4743388079534874e-05, "loss": 2.3334, "step": 289660 }, { "epoch": 0.51, "learning_rate": 2.4742516139608048e-05, "loss": 2.3668, "step": 289670 }, { "epoch": 0.51, "learning_rate": 2.4741644199681218e-05, "loss": 2.2986, "step": 289680 }, { "epoch": 0.51, "learning_rate": 2.4740772259754395e-05, "loss": 2.3473, "step": 289690 }, { "epoch": 0.51, "learning_rate": 2.4739900319827566e-05, "loss": 2.3773, "step": 289700 }, { "epoch": 0.51, "learning_rate": 2.473902837990074e-05, "loss": 2.4054, "step": 289710 }, { "epoch": 0.51, "learning_rate": 2.4738156439973913e-05, "loss": 2.3478, "step": 289720 }, { "epoch": 0.51, "learning_rate": 2.4737284500047087e-05, "loss": 2.3944, "step": 289730 }, { "epoch": 0.51, "learning_rate": 2.4736412560120257e-05, "loss": 2.2815, "step": 289740 }, { "epoch": 0.51, "learning_rate": 2.473554062019343e-05, "loss": 2.4135, "step": 289750 }, { "epoch": 0.51, "learning_rate": 2.4734668680266608e-05, "loss": 2.3447, "step": 289760 }, { "epoch": 0.51, "learning_rate": 2.473379674033978e-05, "loss": 2.3952, "step": 289770 }, { "epoch": 0.51, "learning_rate": 2.4732924800412952e-05, "loss": 2.371, "step": 289780 }, { "epoch": 0.51, "learning_rate": 2.4732052860486123e-05, "loss": 2.383, "step": 289790 }, { "epoch": 0.51, "learning_rate": 2.47311809205593e-05, "loss": 2.3225, "step": 289800 }, { "epoch": 0.51, "learning_rate": 2.473030898063247e-05, "loss": 2.349, "step": 289810 }, { "epoch": 0.51, "learning_rate": 2.4729437040705644e-05, "loss": 2.4892, "step": 289820 }, { "epoch": 0.51, "learning_rate": 2.4728565100778818e-05, "loss": 2.4997, "step": 289830 }, { "epoch": 0.51, "learning_rate": 2.472769316085199e-05, "loss": 2.2927, "step": 289840 }, { "epoch": 0.51, "learning_rate": 2.4726821220925165e-05, "loss": 2.3983, "step": 289850 }, { "epoch": 0.51, "learning_rate": 2.4725949280998336e-05, "loss": 2.2869, "step": 289860 }, { "epoch": 0.51, "learning_rate": 2.4725077341071513e-05, "loss": 2.2917, "step": 289870 }, { "epoch": 0.51, "learning_rate": 2.4724205401144683e-05, "loss": 2.4332, "step": 289880 }, { "epoch": 0.51, "learning_rate": 2.4723333461217857e-05, "loss": 2.3978, "step": 289890 }, { "epoch": 0.51, "learning_rate": 2.472246152129103e-05, "loss": 2.4321, "step": 289900 }, { "epoch": 0.51, "learning_rate": 2.4721589581364205e-05, "loss": 2.5071, "step": 289910 }, { "epoch": 0.51, "learning_rate": 2.472071764143738e-05, "loss": 2.3462, "step": 289920 }, { "epoch": 0.51, "learning_rate": 2.471984570151055e-05, "loss": 2.4456, "step": 289930 }, { "epoch": 0.51, "learning_rate": 2.4718973761583723e-05, "loss": 2.3691, "step": 289940 }, { "epoch": 0.51, "learning_rate": 2.4718101821656896e-05, "loss": 2.437, "step": 289950 }, { "epoch": 0.51, "learning_rate": 2.471722988173007e-05, "loss": 2.3449, "step": 289960 }, { "epoch": 0.51, "learning_rate": 2.471635794180324e-05, "loss": 2.3039, "step": 289970 }, { "epoch": 0.51, "learning_rate": 2.4715486001876418e-05, "loss": 2.4202, "step": 289980 }, { "epoch": 0.51, "learning_rate": 2.4714614061949588e-05, "loss": 2.3993, "step": 289990 }, { "epoch": 0.51, "learning_rate": 2.4713742122022762e-05, "loss": 2.2215, "step": 290000 }, { "epoch": 0.51, "learning_rate": 2.4712870182095936e-05, "loss": 2.5296, "step": 290010 }, { "epoch": 0.51, "learning_rate": 2.471199824216911e-05, "loss": 2.328, "step": 290020 }, { "epoch": 0.51, "learning_rate": 2.4711126302242283e-05, "loss": 2.3154, "step": 290030 }, { "epoch": 0.51, "learning_rate": 2.4710254362315454e-05, "loss": 2.3397, "step": 290040 }, { "epoch": 0.51, "learning_rate": 2.4709382422388627e-05, "loss": 2.3884, "step": 290050 }, { "epoch": 0.51, "learning_rate": 2.47085104824618e-05, "loss": 2.4105, "step": 290060 }, { "epoch": 0.51, "learning_rate": 2.4707638542534975e-05, "loss": 2.3218, "step": 290070 }, { "epoch": 0.51, "learning_rate": 2.470676660260815e-05, "loss": 2.5264, "step": 290080 }, { "epoch": 0.51, "learning_rate": 2.470589466268132e-05, "loss": 2.2383, "step": 290090 }, { "epoch": 0.51, "learning_rate": 2.4705022722754496e-05, "loss": 2.3599, "step": 290100 }, { "epoch": 0.51, "learning_rate": 2.4704150782827667e-05, "loss": 2.4215, "step": 290110 }, { "epoch": 0.51, "learning_rate": 2.470327884290084e-05, "loss": 2.3351, "step": 290120 }, { "epoch": 0.51, "learning_rate": 2.4702406902974014e-05, "loss": 2.3194, "step": 290130 }, { "epoch": 0.51, "learning_rate": 2.4701534963047188e-05, "loss": 2.3975, "step": 290140 }, { "epoch": 0.51, "learning_rate": 2.470066302312036e-05, "loss": 2.3309, "step": 290150 }, { "epoch": 0.51, "learning_rate": 2.4699791083193532e-05, "loss": 2.4137, "step": 290160 }, { "epoch": 0.51, "learning_rate": 2.469891914326671e-05, "loss": 2.3648, "step": 290170 }, { "epoch": 0.51, "learning_rate": 2.469804720333988e-05, "loss": 2.3223, "step": 290180 }, { "epoch": 0.51, "learning_rate": 2.4697175263413053e-05, "loss": 2.2615, "step": 290190 }, { "epoch": 0.51, "learning_rate": 2.4696303323486224e-05, "loss": 2.2955, "step": 290200 }, { "epoch": 0.51, "learning_rate": 2.46954313835594e-05, "loss": 2.285, "step": 290210 }, { "epoch": 0.51, "learning_rate": 2.469455944363257e-05, "loss": 2.2654, "step": 290220 }, { "epoch": 0.51, "learning_rate": 2.4693687503705745e-05, "loss": 2.4573, "step": 290230 }, { "epoch": 0.51, "learning_rate": 2.469281556377892e-05, "loss": 2.26, "step": 290240 }, { "epoch": 0.51, "learning_rate": 2.4691943623852093e-05, "loss": 2.3259, "step": 290250 }, { "epoch": 0.51, "learning_rate": 2.4691071683925266e-05, "loss": 2.2398, "step": 290260 }, { "epoch": 0.51, "learning_rate": 2.4690199743998437e-05, "loss": 2.3792, "step": 290270 }, { "epoch": 0.51, "learning_rate": 2.4689327804071614e-05, "loss": 2.4395, "step": 290280 }, { "epoch": 0.51, "learning_rate": 2.4688455864144784e-05, "loss": 2.2543, "step": 290290 }, { "epoch": 0.51, "learning_rate": 2.4687583924217958e-05, "loss": 2.3868, "step": 290300 }, { "epoch": 0.51, "learning_rate": 2.4686711984291132e-05, "loss": 2.3944, "step": 290310 }, { "epoch": 0.51, "learning_rate": 2.4685840044364306e-05, "loss": 2.4142, "step": 290320 }, { "epoch": 0.51, "learning_rate": 2.468496810443748e-05, "loss": 2.467, "step": 290330 }, { "epoch": 0.51, "learning_rate": 2.468409616451065e-05, "loss": 2.4157, "step": 290340 }, { "epoch": 0.51, "learning_rate": 2.4683224224583823e-05, "loss": 2.2731, "step": 290350 }, { "epoch": 0.51, "learning_rate": 2.4682352284656997e-05, "loss": 2.4202, "step": 290360 }, { "epoch": 0.51, "learning_rate": 2.468148034473017e-05, "loss": 2.3596, "step": 290370 }, { "epoch": 0.51, "learning_rate": 2.4680608404803345e-05, "loss": 2.2681, "step": 290380 }, { "epoch": 0.51, "learning_rate": 2.467973646487652e-05, "loss": 2.3925, "step": 290390 }, { "epoch": 0.51, "learning_rate": 2.4678864524949692e-05, "loss": 2.4209, "step": 290400 }, { "epoch": 0.51, "learning_rate": 2.4677992585022863e-05, "loss": 2.4489, "step": 290410 }, { "epoch": 0.51, "learning_rate": 2.4677120645096036e-05, "loss": 2.2727, "step": 290420 }, { "epoch": 0.51, "learning_rate": 2.467624870516921e-05, "loss": 2.2134, "step": 290430 }, { "epoch": 0.51, "learning_rate": 2.4675376765242384e-05, "loss": 2.2759, "step": 290440 }, { "epoch": 0.51, "learning_rate": 2.4674504825315554e-05, "loss": 2.3137, "step": 290450 }, { "epoch": 0.51, "learning_rate": 2.4673632885388728e-05, "loss": 2.4497, "step": 290460 }, { "epoch": 0.51, "learning_rate": 2.4672760945461902e-05, "loss": 2.3005, "step": 290470 }, { "epoch": 0.51, "learning_rate": 2.4671889005535076e-05, "loss": 2.3795, "step": 290480 }, { "epoch": 0.51, "learning_rate": 2.467101706560825e-05, "loss": 2.3937, "step": 290490 }, { "epoch": 0.51, "learning_rate": 2.467014512568142e-05, "loss": 2.4106, "step": 290500 }, { "epoch": 0.51, "learning_rate": 2.4669273185754597e-05, "loss": 2.4397, "step": 290510 }, { "epoch": 0.51, "learning_rate": 2.4668401245827767e-05, "loss": 2.3451, "step": 290520 }, { "epoch": 0.51, "learning_rate": 2.466752930590094e-05, "loss": 2.3493, "step": 290530 }, { "epoch": 0.51, "learning_rate": 2.4666657365974115e-05, "loss": 2.3672, "step": 290540 }, { "epoch": 0.51, "learning_rate": 2.466578542604729e-05, "loss": 2.2177, "step": 290550 }, { "epoch": 0.51, "learning_rate": 2.4664913486120462e-05, "loss": 2.3938, "step": 290560 }, { "epoch": 0.51, "learning_rate": 2.4664041546193633e-05, "loss": 2.3694, "step": 290570 }, { "epoch": 0.51, "learning_rate": 2.466316960626681e-05, "loss": 2.3685, "step": 290580 }, { "epoch": 0.51, "learning_rate": 2.466229766633998e-05, "loss": 2.3158, "step": 290590 }, { "epoch": 0.51, "learning_rate": 2.4661425726413154e-05, "loss": 2.4338, "step": 290600 }, { "epoch": 0.51, "learning_rate": 2.4660553786486325e-05, "loss": 2.4061, "step": 290610 }, { "epoch": 0.51, "learning_rate": 2.46596818465595e-05, "loss": 2.4087, "step": 290620 }, { "epoch": 0.51, "learning_rate": 2.4658809906632675e-05, "loss": 2.429, "step": 290630 }, { "epoch": 0.51, "learning_rate": 2.4657937966705846e-05, "loss": 2.3303, "step": 290640 }, { "epoch": 0.51, "learning_rate": 2.4657066026779023e-05, "loss": 2.4193, "step": 290650 }, { "epoch": 0.51, "learning_rate": 2.4656194086852193e-05, "loss": 2.3597, "step": 290660 }, { "epoch": 0.51, "learning_rate": 2.4655322146925367e-05, "loss": 2.3759, "step": 290670 }, { "epoch": 0.51, "learning_rate": 2.4654450206998538e-05, "loss": 2.4201, "step": 290680 }, { "epoch": 0.51, "learning_rate": 2.4653578267071715e-05, "loss": 2.3443, "step": 290690 }, { "epoch": 0.51, "learning_rate": 2.4652706327144885e-05, "loss": 2.3261, "step": 290700 }, { "epoch": 0.51, "learning_rate": 2.465183438721806e-05, "loss": 2.3234, "step": 290710 }, { "epoch": 0.51, "learning_rate": 2.4650962447291233e-05, "loss": 2.4269, "step": 290720 }, { "epoch": 0.51, "learning_rate": 2.4650090507364406e-05, "loss": 2.3269, "step": 290730 }, { "epoch": 0.51, "learning_rate": 2.464921856743758e-05, "loss": 2.3469, "step": 290740 }, { "epoch": 0.51, "learning_rate": 2.464834662751075e-05, "loss": 2.2616, "step": 290750 }, { "epoch": 0.51, "learning_rate": 2.4647474687583924e-05, "loss": 2.4772, "step": 290760 }, { "epoch": 0.51, "learning_rate": 2.4646602747657098e-05, "loss": 2.2957, "step": 290770 }, { "epoch": 0.51, "learning_rate": 2.4645730807730272e-05, "loss": 2.4445, "step": 290780 }, { "epoch": 0.51, "learning_rate": 2.4644858867803446e-05, "loss": 2.2416, "step": 290790 }, { "epoch": 0.51, "learning_rate": 2.464398692787662e-05, "loss": 2.3741, "step": 290800 }, { "epoch": 0.51, "learning_rate": 2.4643114987949793e-05, "loss": 2.4135, "step": 290810 }, { "epoch": 0.51, "learning_rate": 2.4642243048022964e-05, "loss": 2.2906, "step": 290820 }, { "epoch": 0.51, "learning_rate": 2.4641371108096137e-05, "loss": 2.4283, "step": 290830 }, { "epoch": 0.51, "learning_rate": 2.464049916816931e-05, "loss": 2.4637, "step": 290840 }, { "epoch": 0.51, "learning_rate": 2.4639627228242485e-05, "loss": 2.2789, "step": 290850 }, { "epoch": 0.51, "learning_rate": 2.463875528831566e-05, "loss": 2.4686, "step": 290860 }, { "epoch": 0.51, "learning_rate": 2.463788334838883e-05, "loss": 2.4092, "step": 290870 }, { "epoch": 0.51, "learning_rate": 2.4637011408462006e-05, "loss": 2.3775, "step": 290880 }, { "epoch": 0.51, "learning_rate": 2.4636139468535177e-05, "loss": 2.1926, "step": 290890 }, { "epoch": 0.51, "learning_rate": 2.463526752860835e-05, "loss": 2.3059, "step": 290900 }, { "epoch": 0.51, "learning_rate": 2.4634395588681524e-05, "loss": 2.406, "step": 290910 }, { "epoch": 0.51, "learning_rate": 2.4633523648754698e-05, "loss": 2.3754, "step": 290920 }, { "epoch": 0.51, "learning_rate": 2.4632651708827868e-05, "loss": 2.3531, "step": 290930 }, { "epoch": 0.51, "learning_rate": 2.4631779768901042e-05, "loss": 2.3518, "step": 290940 }, { "epoch": 0.51, "learning_rate": 2.4630907828974216e-05, "loss": 2.361, "step": 290950 }, { "epoch": 0.51, "learning_rate": 2.463003588904739e-05, "loss": 2.2983, "step": 290960 }, { "epoch": 0.51, "learning_rate": 2.4629163949120563e-05, "loss": 2.2878, "step": 290970 }, { "epoch": 0.51, "learning_rate": 2.4628292009193734e-05, "loss": 2.2756, "step": 290980 }, { "epoch": 0.51, "learning_rate": 2.462742006926691e-05, "loss": 2.3712, "step": 290990 }, { "epoch": 0.51, "learning_rate": 2.462654812934008e-05, "loss": 2.4059, "step": 291000 }, { "epoch": 0.51, "learning_rate": 2.4625676189413255e-05, "loss": 2.3662, "step": 291010 }, { "epoch": 0.51, "learning_rate": 2.462480424948643e-05, "loss": 2.4489, "step": 291020 }, { "epoch": 0.51, "learning_rate": 2.4623932309559603e-05, "loss": 2.3683, "step": 291030 }, { "epoch": 0.51, "learning_rate": 2.4623060369632776e-05, "loss": 2.3423, "step": 291040 }, { "epoch": 0.51, "learning_rate": 2.4622188429705947e-05, "loss": 2.3977, "step": 291050 }, { "epoch": 0.51, "learning_rate": 2.4621316489779124e-05, "loss": 2.3872, "step": 291060 }, { "epoch": 0.51, "learning_rate": 2.4620444549852294e-05, "loss": 2.2665, "step": 291070 }, { "epoch": 0.51, "learning_rate": 2.4619572609925468e-05, "loss": 2.3818, "step": 291080 }, { "epoch": 0.51, "learning_rate": 2.461870066999864e-05, "loss": 2.3291, "step": 291090 }, { "epoch": 0.51, "learning_rate": 2.4617828730071816e-05, "loss": 2.2563, "step": 291100 }, { "epoch": 0.51, "learning_rate": 2.461695679014499e-05, "loss": 2.4648, "step": 291110 }, { "epoch": 0.51, "learning_rate": 2.461608485021816e-05, "loss": 2.3638, "step": 291120 }, { "epoch": 0.51, "learning_rate": 2.4615212910291333e-05, "loss": 2.4421, "step": 291130 }, { "epoch": 0.51, "learning_rate": 2.4614340970364507e-05, "loss": 2.3165, "step": 291140 }, { "epoch": 0.51, "learning_rate": 2.461346903043768e-05, "loss": 2.2855, "step": 291150 }, { "epoch": 0.51, "learning_rate": 2.461259709051085e-05, "loss": 2.4823, "step": 291160 }, { "epoch": 0.51, "learning_rate": 2.4611725150584025e-05, "loss": 2.3494, "step": 291170 }, { "epoch": 0.51, "learning_rate": 2.46108532106572e-05, "loss": 2.3245, "step": 291180 }, { "epoch": 0.51, "learning_rate": 2.4609981270730373e-05, "loss": 2.3648, "step": 291190 }, { "epoch": 0.51, "learning_rate": 2.4609109330803546e-05, "loss": 2.3025, "step": 291200 }, { "epoch": 0.51, "learning_rate": 2.460823739087672e-05, "loss": 2.3609, "step": 291210 }, { "epoch": 0.51, "learning_rate": 2.4607365450949894e-05, "loss": 2.355, "step": 291220 }, { "epoch": 0.51, "learning_rate": 2.4606493511023064e-05, "loss": 2.3562, "step": 291230 }, { "epoch": 0.51, "learning_rate": 2.4605621571096238e-05, "loss": 2.4601, "step": 291240 }, { "epoch": 0.51, "learning_rate": 2.4604749631169412e-05, "loss": 2.2682, "step": 291250 }, { "epoch": 0.51, "learning_rate": 2.4603877691242586e-05, "loss": 2.3156, "step": 291260 }, { "epoch": 0.51, "learning_rate": 2.460300575131576e-05, "loss": 2.3936, "step": 291270 }, { "epoch": 0.51, "learning_rate": 2.460213381138893e-05, "loss": 2.3774, "step": 291280 }, { "epoch": 0.51, "learning_rate": 2.4601261871462107e-05, "loss": 2.2621, "step": 291290 }, { "epoch": 0.51, "learning_rate": 2.4600389931535277e-05, "loss": 2.4418, "step": 291300 }, { "epoch": 0.51, "learning_rate": 2.459951799160845e-05, "loss": 2.4683, "step": 291310 }, { "epoch": 0.51, "learning_rate": 2.4598646051681625e-05, "loss": 2.4363, "step": 291320 }, { "epoch": 0.51, "learning_rate": 2.45977741117548e-05, "loss": 2.367, "step": 291330 }, { "epoch": 0.51, "learning_rate": 2.459690217182797e-05, "loss": 2.3213, "step": 291340 }, { "epoch": 0.51, "learning_rate": 2.4596030231901143e-05, "loss": 2.3019, "step": 291350 }, { "epoch": 0.51, "learning_rate": 2.459515829197432e-05, "loss": 2.5196, "step": 291360 }, { "epoch": 0.51, "learning_rate": 2.459428635204749e-05, "loss": 2.5076, "step": 291370 }, { "epoch": 0.51, "learning_rate": 2.4593414412120664e-05, "loss": 2.359, "step": 291380 }, { "epoch": 0.51, "learning_rate": 2.4592542472193835e-05, "loss": 2.4206, "step": 291390 }, { "epoch": 0.51, "learning_rate": 2.459167053226701e-05, "loss": 2.4193, "step": 291400 }, { "epoch": 0.51, "learning_rate": 2.4590798592340182e-05, "loss": 2.3422, "step": 291410 }, { "epoch": 0.51, "learning_rate": 2.4589926652413356e-05, "loss": 2.3402, "step": 291420 }, { "epoch": 0.51, "learning_rate": 2.458905471248653e-05, "loss": 2.353, "step": 291430 }, { "epoch": 0.51, "learning_rate": 2.4588182772559703e-05, "loss": 2.477, "step": 291440 }, { "epoch": 0.51, "learning_rate": 2.4587310832632877e-05, "loss": 2.4094, "step": 291450 }, { "epoch": 0.51, "learning_rate": 2.4586438892706048e-05, "loss": 2.4597, "step": 291460 }, { "epoch": 0.51, "learning_rate": 2.4585566952779225e-05, "loss": 2.4476, "step": 291470 }, { "epoch": 0.51, "learning_rate": 2.4584695012852395e-05, "loss": 2.4248, "step": 291480 }, { "epoch": 0.51, "learning_rate": 2.458382307292557e-05, "loss": 2.2478, "step": 291490 }, { "epoch": 0.51, "learning_rate": 2.4582951132998743e-05, "loss": 2.3611, "step": 291500 }, { "epoch": 0.51, "learning_rate": 2.4582079193071916e-05, "loss": 2.3716, "step": 291510 }, { "epoch": 0.51, "learning_rate": 2.458120725314509e-05, "loss": 2.3944, "step": 291520 }, { "epoch": 0.51, "learning_rate": 2.458033531321826e-05, "loss": 2.4157, "step": 291530 }, { "epoch": 0.51, "learning_rate": 2.4579463373291434e-05, "loss": 2.3429, "step": 291540 }, { "epoch": 0.51, "learning_rate": 2.4578591433364608e-05, "loss": 2.2594, "step": 291550 }, { "epoch": 0.51, "learning_rate": 2.4577719493437782e-05, "loss": 2.3294, "step": 291560 }, { "epoch": 0.51, "learning_rate": 2.4576847553510952e-05, "loss": 2.4084, "step": 291570 }, { "epoch": 0.51, "learning_rate": 2.457597561358413e-05, "loss": 2.3373, "step": 291580 }, { "epoch": 0.51, "learning_rate": 2.4575103673657303e-05, "loss": 2.4561, "step": 291590 }, { "epoch": 0.51, "learning_rate": 2.4574231733730474e-05, "loss": 2.297, "step": 291600 }, { "epoch": 0.51, "learning_rate": 2.4573359793803647e-05, "loss": 2.3382, "step": 291610 }, { "epoch": 0.51, "learning_rate": 2.457248785387682e-05, "loss": 2.2478, "step": 291620 }, { "epoch": 0.51, "learning_rate": 2.4571615913949995e-05, "loss": 2.4447, "step": 291630 }, { "epoch": 0.51, "learning_rate": 2.4570743974023165e-05, "loss": 2.2985, "step": 291640 }, { "epoch": 0.51, "learning_rate": 2.456987203409634e-05, "loss": 2.3452, "step": 291650 }, { "epoch": 0.51, "learning_rate": 2.4569000094169513e-05, "loss": 2.3543, "step": 291660 }, { "epoch": 0.51, "learning_rate": 2.4568128154242687e-05, "loss": 2.3935, "step": 291670 }, { "epoch": 0.51, "learning_rate": 2.456725621431586e-05, "loss": 2.4599, "step": 291680 }, { "epoch": 0.51, "learning_rate": 2.456638427438903e-05, "loss": 2.3412, "step": 291690 }, { "epoch": 0.51, "learning_rate": 2.4565512334462208e-05, "loss": 2.3389, "step": 291700 }, { "epoch": 0.51, "learning_rate": 2.4564640394535378e-05, "loss": 2.3661, "step": 291710 }, { "epoch": 0.51, "learning_rate": 2.4563768454608552e-05, "loss": 2.2814, "step": 291720 }, { "epoch": 0.51, "learning_rate": 2.4562896514681726e-05, "loss": 2.2423, "step": 291730 }, { "epoch": 0.51, "learning_rate": 2.45620245747549e-05, "loss": 2.3546, "step": 291740 }, { "epoch": 0.51, "learning_rate": 2.4561152634828073e-05, "loss": 2.3158, "step": 291750 }, { "epoch": 0.51, "learning_rate": 2.4560280694901244e-05, "loss": 2.3967, "step": 291760 }, { "epoch": 0.51, "learning_rate": 2.455940875497442e-05, "loss": 2.2346, "step": 291770 }, { "epoch": 0.51, "learning_rate": 2.455853681504759e-05, "loss": 2.3362, "step": 291780 }, { "epoch": 0.51, "learning_rate": 2.4557664875120765e-05, "loss": 2.2338, "step": 291790 }, { "epoch": 0.51, "learning_rate": 2.4556792935193935e-05, "loss": 2.3445, "step": 291800 }, { "epoch": 0.51, "learning_rate": 2.4555920995267113e-05, "loss": 2.3916, "step": 291810 }, { "epoch": 0.51, "learning_rate": 2.4555049055340283e-05, "loss": 2.3692, "step": 291820 }, { "epoch": 0.51, "learning_rate": 2.4554177115413457e-05, "loss": 2.3902, "step": 291830 }, { "epoch": 0.51, "learning_rate": 2.4553305175486634e-05, "loss": 2.3893, "step": 291840 }, { "epoch": 0.51, "learning_rate": 2.4552433235559804e-05, "loss": 2.4269, "step": 291850 }, { "epoch": 0.51, "learning_rate": 2.4551561295632978e-05, "loss": 2.341, "step": 291860 }, { "epoch": 0.51, "learning_rate": 2.455068935570615e-05, "loss": 2.3313, "step": 291870 }, { "epoch": 0.51, "learning_rate": 2.4549817415779326e-05, "loss": 2.297, "step": 291880 }, { "epoch": 0.51, "learning_rate": 2.4548945475852496e-05, "loss": 2.4171, "step": 291890 }, { "epoch": 0.51, "learning_rate": 2.454807353592567e-05, "loss": 2.3132, "step": 291900 }, { "epoch": 0.51, "learning_rate": 2.4547201595998843e-05, "loss": 2.322, "step": 291910 }, { "epoch": 0.51, "learning_rate": 2.4546329656072017e-05, "loss": 2.5412, "step": 291920 }, { "epoch": 0.51, "learning_rate": 2.454545771614519e-05, "loss": 2.3927, "step": 291930 }, { "epoch": 0.51, "learning_rate": 2.454458577621836e-05, "loss": 2.4048, "step": 291940 }, { "epoch": 0.51, "learning_rate": 2.4543713836291535e-05, "loss": 2.4649, "step": 291950 }, { "epoch": 0.51, "learning_rate": 2.454284189636471e-05, "loss": 2.3086, "step": 291960 }, { "epoch": 0.51, "learning_rate": 2.4541969956437883e-05, "loss": 2.3803, "step": 291970 }, { "epoch": 0.51, "learning_rate": 2.4541098016511056e-05, "loss": 2.4346, "step": 291980 }, { "epoch": 0.51, "learning_rate": 2.454022607658423e-05, "loss": 2.4019, "step": 291990 }, { "epoch": 0.51, "learning_rate": 2.4539354136657404e-05, "loss": 2.3897, "step": 292000 }, { "epoch": 0.51, "learning_rate": 2.4538482196730574e-05, "loss": 2.3577, "step": 292010 }, { "epoch": 0.51, "learning_rate": 2.4537610256803748e-05, "loss": 2.4484, "step": 292020 }, { "epoch": 0.51, "learning_rate": 2.4536738316876922e-05, "loss": 2.297, "step": 292030 }, { "epoch": 0.51, "learning_rate": 2.4535866376950096e-05, "loss": 2.3377, "step": 292040 }, { "epoch": 0.51, "learning_rate": 2.4534994437023266e-05, "loss": 2.3127, "step": 292050 }, { "epoch": 0.51, "learning_rate": 2.453412249709644e-05, "loss": 2.3641, "step": 292060 }, { "epoch": 0.51, "learning_rate": 2.4533250557169614e-05, "loss": 2.4897, "step": 292070 }, { "epoch": 0.51, "learning_rate": 2.4532378617242787e-05, "loss": 2.2379, "step": 292080 }, { "epoch": 0.51, "learning_rate": 2.453150667731596e-05, "loss": 2.3314, "step": 292090 }, { "epoch": 0.51, "learning_rate": 2.453063473738913e-05, "loss": 2.3591, "step": 292100 }, { "epoch": 0.51, "learning_rate": 2.452976279746231e-05, "loss": 2.3668, "step": 292110 }, { "epoch": 0.51, "learning_rate": 2.452889085753548e-05, "loss": 2.2555, "step": 292120 }, { "epoch": 0.51, "learning_rate": 2.4528018917608653e-05, "loss": 2.3345, "step": 292130 }, { "epoch": 0.51, "learning_rate": 2.4527146977681827e-05, "loss": 2.3736, "step": 292140 }, { "epoch": 0.51, "learning_rate": 2.4526275037755e-05, "loss": 2.339, "step": 292150 }, { "epoch": 0.51, "learning_rate": 2.4525403097828174e-05, "loss": 2.4087, "step": 292160 }, { "epoch": 0.51, "learning_rate": 2.4524531157901345e-05, "loss": 2.3367, "step": 292170 }, { "epoch": 0.51, "learning_rate": 2.452365921797452e-05, "loss": 2.4806, "step": 292180 }, { "epoch": 0.51, "learning_rate": 2.4522787278047692e-05, "loss": 2.409, "step": 292190 }, { "epoch": 0.51, "learning_rate": 2.4521915338120866e-05, "loss": 2.3904, "step": 292200 }, { "epoch": 0.51, "learning_rate": 2.452104339819404e-05, "loss": 2.3598, "step": 292210 }, { "epoch": 0.51, "learning_rate": 2.4520171458267213e-05, "loss": 2.3739, "step": 292220 }, { "epoch": 0.51, "learning_rate": 2.4519299518340387e-05, "loss": 2.4826, "step": 292230 }, { "epoch": 0.51, "learning_rate": 2.4518427578413558e-05, "loss": 2.4041, "step": 292240 }, { "epoch": 0.51, "learning_rate": 2.4517555638486735e-05, "loss": 2.3391, "step": 292250 }, { "epoch": 0.51, "learning_rate": 2.4516683698559905e-05, "loss": 2.3471, "step": 292260 }, { "epoch": 0.51, "learning_rate": 2.451581175863308e-05, "loss": 2.3205, "step": 292270 }, { "epoch": 0.51, "learning_rate": 2.451493981870625e-05, "loss": 2.3357, "step": 292280 }, { "epoch": 0.51, "learning_rate": 2.4514067878779426e-05, "loss": 2.3474, "step": 292290 }, { "epoch": 0.51, "learning_rate": 2.4513195938852597e-05, "loss": 2.3294, "step": 292300 }, { "epoch": 0.51, "learning_rate": 2.451232399892577e-05, "loss": 2.3465, "step": 292310 }, { "epoch": 0.51, "learning_rate": 2.4511452058998944e-05, "loss": 2.3982, "step": 292320 }, { "epoch": 0.51, "learning_rate": 2.4510580119072118e-05, "loss": 2.4064, "step": 292330 }, { "epoch": 0.51, "learning_rate": 2.4509708179145292e-05, "loss": 2.43, "step": 292340 }, { "epoch": 0.51, "learning_rate": 2.4508836239218462e-05, "loss": 2.4327, "step": 292350 }, { "epoch": 0.51, "learning_rate": 2.4507964299291636e-05, "loss": 2.36, "step": 292360 }, { "epoch": 0.51, "learning_rate": 2.450709235936481e-05, "loss": 2.3841, "step": 292370 }, { "epoch": 0.51, "learning_rate": 2.4506220419437984e-05, "loss": 2.4096, "step": 292380 }, { "epoch": 0.51, "learning_rate": 2.4505348479511157e-05, "loss": 2.3595, "step": 292390 }, { "epoch": 0.51, "learning_rate": 2.450447653958433e-05, "loss": 2.4283, "step": 292400 }, { "epoch": 0.51, "learning_rate": 2.4503604599657505e-05, "loss": 2.3807, "step": 292410 }, { "epoch": 0.51, "learning_rate": 2.4502732659730675e-05, "loss": 2.4203, "step": 292420 }, { "epoch": 0.51, "learning_rate": 2.450186071980385e-05, "loss": 2.4003, "step": 292430 }, { "epoch": 0.51, "learning_rate": 2.4500988779877023e-05, "loss": 2.4556, "step": 292440 }, { "epoch": 0.51, "learning_rate": 2.4500116839950197e-05, "loss": 2.3077, "step": 292450 }, { "epoch": 0.51, "learning_rate": 2.449924490002337e-05, "loss": 2.2988, "step": 292460 }, { "epoch": 0.51, "learning_rate": 2.449837296009654e-05, "loss": 2.3325, "step": 292470 }, { "epoch": 0.51, "learning_rate": 2.4497501020169718e-05, "loss": 2.3681, "step": 292480 }, { "epoch": 0.51, "learning_rate": 2.4496629080242888e-05, "loss": 2.3967, "step": 292490 }, { "epoch": 0.51, "learning_rate": 2.4495757140316062e-05, "loss": 2.3275, "step": 292500 }, { "epoch": 0.51, "learning_rate": 2.4494885200389236e-05, "loss": 2.4833, "step": 292510 }, { "epoch": 0.51, "learning_rate": 2.449401326046241e-05, "loss": 2.2228, "step": 292520 }, { "epoch": 0.51, "learning_rate": 2.449314132053558e-05, "loss": 2.5103, "step": 292530 }, { "epoch": 0.51, "learning_rate": 2.4492269380608754e-05, "loss": 2.3132, "step": 292540 }, { "epoch": 0.51, "learning_rate": 2.4491397440681927e-05, "loss": 2.3898, "step": 292550 }, { "epoch": 0.51, "learning_rate": 2.44905255007551e-05, "loss": 2.3695, "step": 292560 }, { "epoch": 0.51, "learning_rate": 2.4489653560828275e-05, "loss": 2.4344, "step": 292570 }, { "epoch": 0.51, "learning_rate": 2.4488781620901445e-05, "loss": 2.2135, "step": 292580 }, { "epoch": 0.51, "learning_rate": 2.4487909680974623e-05, "loss": 2.3976, "step": 292590 }, { "epoch": 0.51, "learning_rate": 2.4487037741047793e-05, "loss": 2.2533, "step": 292600 }, { "epoch": 0.51, "learning_rate": 2.4486165801120967e-05, "loss": 2.2601, "step": 292610 }, { "epoch": 0.51, "learning_rate": 2.448529386119414e-05, "loss": 2.4375, "step": 292620 }, { "epoch": 0.51, "learning_rate": 2.4484421921267314e-05, "loss": 2.3092, "step": 292630 }, { "epoch": 0.51, "learning_rate": 2.4483549981340488e-05, "loss": 2.2986, "step": 292640 }, { "epoch": 0.51, "learning_rate": 2.448267804141366e-05, "loss": 2.3482, "step": 292650 }, { "epoch": 0.51, "learning_rate": 2.4481806101486836e-05, "loss": 2.3616, "step": 292660 }, { "epoch": 0.51, "learning_rate": 2.4480934161560006e-05, "loss": 2.2953, "step": 292670 }, { "epoch": 0.51, "learning_rate": 2.448006222163318e-05, "loss": 2.4005, "step": 292680 }, { "epoch": 0.51, "learning_rate": 2.447919028170635e-05, "loss": 2.2635, "step": 292690 }, { "epoch": 0.51, "learning_rate": 2.4478318341779527e-05, "loss": 2.317, "step": 292700 }, { "epoch": 0.51, "learning_rate": 2.44774464018527e-05, "loss": 2.3954, "step": 292710 }, { "epoch": 0.51, "learning_rate": 2.447657446192587e-05, "loss": 2.3817, "step": 292720 }, { "epoch": 0.51, "learning_rate": 2.4475702521999045e-05, "loss": 2.4173, "step": 292730 }, { "epoch": 0.51, "learning_rate": 2.447483058207222e-05, "loss": 2.3736, "step": 292740 }, { "epoch": 0.51, "learning_rate": 2.4473958642145393e-05, "loss": 2.4292, "step": 292750 }, { "epoch": 0.51, "learning_rate": 2.4473086702218563e-05, "loss": 2.4628, "step": 292760 }, { "epoch": 0.51, "learning_rate": 2.447221476229174e-05, "loss": 2.35, "step": 292770 }, { "epoch": 0.51, "learning_rate": 2.447134282236491e-05, "loss": 2.178, "step": 292780 }, { "epoch": 0.51, "learning_rate": 2.4470470882438084e-05, "loss": 2.4586, "step": 292790 }, { "epoch": 0.51, "learning_rate": 2.4469598942511258e-05, "loss": 2.3446, "step": 292800 }, { "epoch": 0.51, "learning_rate": 2.4468727002584432e-05, "loss": 2.376, "step": 292810 }, { "epoch": 0.51, "learning_rate": 2.4467855062657606e-05, "loss": 2.2514, "step": 292820 }, { "epoch": 0.51, "learning_rate": 2.4466983122730776e-05, "loss": 2.3567, "step": 292830 }, { "epoch": 0.51, "learning_rate": 2.446611118280395e-05, "loss": 2.2891, "step": 292840 }, { "epoch": 0.51, "learning_rate": 2.4465239242877124e-05, "loss": 2.4358, "step": 292850 }, { "epoch": 0.51, "learning_rate": 2.4464367302950297e-05, "loss": 2.488, "step": 292860 }, { "epoch": 0.51, "learning_rate": 2.446349536302347e-05, "loss": 2.4034, "step": 292870 }, { "epoch": 0.51, "learning_rate": 2.446262342309664e-05, "loss": 2.4693, "step": 292880 }, { "epoch": 0.51, "learning_rate": 2.446175148316982e-05, "loss": 2.4359, "step": 292890 }, { "epoch": 0.51, "learning_rate": 2.446087954324299e-05, "loss": 2.3533, "step": 292900 }, { "epoch": 0.51, "learning_rate": 2.4460007603316163e-05, "loss": 2.5399, "step": 292910 }, { "epoch": 0.51, "learning_rate": 2.4459135663389337e-05, "loss": 2.3827, "step": 292920 }, { "epoch": 0.51, "learning_rate": 2.445826372346251e-05, "loss": 2.3981, "step": 292930 }, { "epoch": 0.51, "learning_rate": 2.4457391783535684e-05, "loss": 2.3174, "step": 292940 }, { "epoch": 0.51, "learning_rate": 2.4456519843608855e-05, "loss": 2.3619, "step": 292950 }, { "epoch": 0.51, "learning_rate": 2.445564790368203e-05, "loss": 2.4439, "step": 292960 }, { "epoch": 0.51, "learning_rate": 2.4454775963755202e-05, "loss": 2.3195, "step": 292970 }, { "epoch": 0.51, "learning_rate": 2.4453904023828376e-05, "loss": 2.391, "step": 292980 }, { "epoch": 0.51, "learning_rate": 2.4453032083901546e-05, "loss": 2.1927, "step": 292990 }, { "epoch": 0.51, "learning_rate": 2.4452160143974723e-05, "loss": 2.4358, "step": 293000 }, { "epoch": 0.51, "learning_rate": 2.4451288204047894e-05, "loss": 2.3245, "step": 293010 }, { "epoch": 0.51, "learning_rate": 2.4450416264121068e-05, "loss": 2.4803, "step": 293020 }, { "epoch": 0.51, "learning_rate": 2.444954432419424e-05, "loss": 2.3618, "step": 293030 }, { "epoch": 0.51, "learning_rate": 2.4448672384267415e-05, "loss": 2.3453, "step": 293040 }, { "epoch": 0.51, "learning_rate": 2.444780044434059e-05, "loss": 2.3555, "step": 293050 }, { "epoch": 0.51, "learning_rate": 2.444692850441376e-05, "loss": 2.3378, "step": 293060 }, { "epoch": 0.51, "learning_rate": 2.4446056564486936e-05, "loss": 2.3807, "step": 293070 }, { "epoch": 0.51, "learning_rate": 2.4445184624560107e-05, "loss": 2.36, "step": 293080 }, { "epoch": 0.51, "learning_rate": 2.444431268463328e-05, "loss": 2.3589, "step": 293090 }, { "epoch": 0.51, "learning_rate": 2.4443440744706454e-05, "loss": 2.3427, "step": 293100 }, { "epoch": 0.51, "learning_rate": 2.4442568804779628e-05, "loss": 2.3045, "step": 293110 }, { "epoch": 0.51, "learning_rate": 2.4441696864852802e-05, "loss": 2.3685, "step": 293120 }, { "epoch": 0.51, "learning_rate": 2.4440824924925972e-05, "loss": 2.3765, "step": 293130 }, { "epoch": 0.51, "learning_rate": 2.4439952984999146e-05, "loss": 2.4848, "step": 293140 }, { "epoch": 0.51, "learning_rate": 2.443908104507232e-05, "loss": 2.3953, "step": 293150 }, { "epoch": 0.51, "learning_rate": 2.4438209105145494e-05, "loss": 2.3476, "step": 293160 }, { "epoch": 0.51, "learning_rate": 2.4437337165218664e-05, "loss": 2.2844, "step": 293170 }, { "epoch": 0.51, "learning_rate": 2.443646522529184e-05, "loss": 2.26, "step": 293180 }, { "epoch": 0.51, "learning_rate": 2.4435593285365015e-05, "loss": 2.4091, "step": 293190 }, { "epoch": 0.51, "learning_rate": 2.4434721345438185e-05, "loss": 2.3181, "step": 293200 }, { "epoch": 0.51, "learning_rate": 2.443384940551136e-05, "loss": 2.3653, "step": 293210 }, { "epoch": 0.51, "learning_rate": 2.4432977465584533e-05, "loss": 2.3879, "step": 293220 }, { "epoch": 0.51, "learning_rate": 2.4432105525657707e-05, "loss": 2.3799, "step": 293230 }, { "epoch": 0.51, "learning_rate": 2.4431233585730877e-05, "loss": 2.2191, "step": 293240 }, { "epoch": 0.51, "learning_rate": 2.443036164580405e-05, "loss": 2.3914, "step": 293250 }, { "epoch": 0.51, "learning_rate": 2.4429489705877224e-05, "loss": 2.2835, "step": 293260 }, { "epoch": 0.51, "learning_rate": 2.4428617765950398e-05, "loss": 2.4139, "step": 293270 }, { "epoch": 0.51, "learning_rate": 2.4427745826023572e-05, "loss": 2.3899, "step": 293280 }, { "epoch": 0.51, "learning_rate": 2.4426873886096742e-05, "loss": 2.4091, "step": 293290 }, { "epoch": 0.51, "learning_rate": 2.442600194616992e-05, "loss": 2.3656, "step": 293300 }, { "epoch": 0.51, "learning_rate": 2.442513000624309e-05, "loss": 2.3877, "step": 293310 }, { "epoch": 0.51, "learning_rate": 2.4424258066316264e-05, "loss": 2.2914, "step": 293320 }, { "epoch": 0.51, "learning_rate": 2.4423386126389437e-05, "loss": 2.3138, "step": 293330 }, { "epoch": 0.51, "learning_rate": 2.442251418646261e-05, "loss": 2.3753, "step": 293340 }, { "epoch": 0.51, "learning_rate": 2.4421642246535785e-05, "loss": 2.4282, "step": 293350 }, { "epoch": 0.51, "learning_rate": 2.4420770306608955e-05, "loss": 2.4263, "step": 293360 }, { "epoch": 0.51, "learning_rate": 2.4419898366682133e-05, "loss": 2.3755, "step": 293370 }, { "epoch": 0.51, "learning_rate": 2.4419026426755303e-05, "loss": 2.4155, "step": 293380 }, { "epoch": 0.51, "learning_rate": 2.4418154486828477e-05, "loss": 2.3003, "step": 293390 }, { "epoch": 0.51, "learning_rate": 2.4417282546901647e-05, "loss": 2.3015, "step": 293400 }, { "epoch": 0.51, "learning_rate": 2.4416410606974824e-05, "loss": 2.2976, "step": 293410 }, { "epoch": 0.51, "learning_rate": 2.4415538667047995e-05, "loss": 2.4048, "step": 293420 }, { "epoch": 0.51, "learning_rate": 2.441466672712117e-05, "loss": 2.204, "step": 293430 }, { "epoch": 0.51, "learning_rate": 2.4413794787194346e-05, "loss": 2.2934, "step": 293440 }, { "epoch": 0.51, "learning_rate": 2.4412922847267516e-05, "loss": 2.4056, "step": 293450 }, { "epoch": 0.51, "learning_rate": 2.441205090734069e-05, "loss": 2.356, "step": 293460 }, { "epoch": 0.51, "learning_rate": 2.441117896741386e-05, "loss": 2.2916, "step": 293470 }, { "epoch": 0.51, "learning_rate": 2.4410307027487037e-05, "loss": 2.39, "step": 293480 }, { "epoch": 0.51, "learning_rate": 2.4409435087560208e-05, "loss": 2.4137, "step": 293490 }, { "epoch": 0.51, "learning_rate": 2.440856314763338e-05, "loss": 2.4188, "step": 293500 }, { "epoch": 0.51, "learning_rate": 2.4407691207706555e-05, "loss": 2.3316, "step": 293510 }, { "epoch": 0.51, "learning_rate": 2.440681926777973e-05, "loss": 2.4288, "step": 293520 }, { "epoch": 0.51, "learning_rate": 2.4405947327852903e-05, "loss": 2.3076, "step": 293530 }, { "epoch": 0.51, "learning_rate": 2.4405075387926073e-05, "loss": 2.3884, "step": 293540 }, { "epoch": 0.51, "learning_rate": 2.4404203447999247e-05, "loss": 2.3742, "step": 293550 }, { "epoch": 0.51, "learning_rate": 2.440333150807242e-05, "loss": 2.3581, "step": 293560 }, { "epoch": 0.51, "learning_rate": 2.4402459568145594e-05, "loss": 2.3868, "step": 293570 }, { "epoch": 0.51, "learning_rate": 2.4401587628218768e-05, "loss": 2.3257, "step": 293580 }, { "epoch": 0.51, "learning_rate": 2.4400715688291942e-05, "loss": 2.3963, "step": 293590 }, { "epoch": 0.51, "learning_rate": 2.4399843748365116e-05, "loss": 2.4203, "step": 293600 }, { "epoch": 0.51, "learning_rate": 2.4398971808438286e-05, "loss": 2.3502, "step": 293610 }, { "epoch": 0.51, "learning_rate": 2.439809986851146e-05, "loss": 2.3056, "step": 293620 }, { "epoch": 0.51, "learning_rate": 2.4397227928584634e-05, "loss": 2.2855, "step": 293630 }, { "epoch": 0.51, "learning_rate": 2.4396355988657807e-05, "loss": 2.2872, "step": 293640 }, { "epoch": 0.51, "learning_rate": 2.4395484048730978e-05, "loss": 2.3805, "step": 293650 }, { "epoch": 0.51, "learning_rate": 2.439461210880415e-05, "loss": 2.2937, "step": 293660 }, { "epoch": 0.51, "learning_rate": 2.439374016887733e-05, "loss": 2.3208, "step": 293670 }, { "epoch": 0.51, "learning_rate": 2.43928682289505e-05, "loss": 2.2662, "step": 293680 }, { "epoch": 0.51, "learning_rate": 2.4391996289023673e-05, "loss": 2.295, "step": 293690 }, { "epoch": 0.51, "learning_rate": 2.4391124349096843e-05, "loss": 2.4106, "step": 293700 }, { "epoch": 0.51, "learning_rate": 2.439025240917002e-05, "loss": 2.3386, "step": 293710 }, { "epoch": 0.51, "learning_rate": 2.438938046924319e-05, "loss": 2.3495, "step": 293720 }, { "epoch": 0.51, "learning_rate": 2.4388508529316365e-05, "loss": 2.3207, "step": 293730 }, { "epoch": 0.51, "learning_rate": 2.438763658938954e-05, "loss": 2.4888, "step": 293740 }, { "epoch": 0.51, "learning_rate": 2.4386764649462712e-05, "loss": 2.3417, "step": 293750 }, { "epoch": 0.51, "learning_rate": 2.4385892709535886e-05, "loss": 2.2301, "step": 293760 }, { "epoch": 0.51, "learning_rate": 2.4385020769609056e-05, "loss": 2.4015, "step": 293770 }, { "epoch": 0.51, "learning_rate": 2.4384148829682233e-05, "loss": 2.4186, "step": 293780 }, { "epoch": 0.51, "learning_rate": 2.4383276889755404e-05, "loss": 2.3458, "step": 293790 }, { "epoch": 0.51, "learning_rate": 2.4382404949828578e-05, "loss": 2.3081, "step": 293800 }, { "epoch": 0.51, "learning_rate": 2.438153300990175e-05, "loss": 2.4744, "step": 293810 }, { "epoch": 0.51, "learning_rate": 2.4380661069974925e-05, "loss": 2.5508, "step": 293820 }, { "epoch": 0.51, "learning_rate": 2.43797891300481e-05, "loss": 2.4502, "step": 293830 }, { "epoch": 0.51, "learning_rate": 2.437891719012127e-05, "loss": 2.3643, "step": 293840 }, { "epoch": 0.51, "learning_rate": 2.4378045250194446e-05, "loss": 2.3866, "step": 293850 }, { "epoch": 0.51, "learning_rate": 2.4377173310267617e-05, "loss": 2.4414, "step": 293860 }, { "epoch": 0.51, "learning_rate": 2.437630137034079e-05, "loss": 2.3815, "step": 293870 }, { "epoch": 0.51, "learning_rate": 2.437542943041396e-05, "loss": 2.4083, "step": 293880 }, { "epoch": 0.51, "learning_rate": 2.4374557490487138e-05, "loss": 2.4427, "step": 293890 }, { "epoch": 0.51, "learning_rate": 2.437368555056031e-05, "loss": 2.3605, "step": 293900 }, { "epoch": 0.51, "learning_rate": 2.4372813610633482e-05, "loss": 2.3417, "step": 293910 }, { "epoch": 0.51, "learning_rate": 2.4371941670706656e-05, "loss": 2.3296, "step": 293920 }, { "epoch": 0.51, "learning_rate": 2.437106973077983e-05, "loss": 2.3687, "step": 293930 }, { "epoch": 0.51, "learning_rate": 2.4370197790853004e-05, "loss": 2.3422, "step": 293940 }, { "epoch": 0.51, "learning_rate": 2.4369325850926174e-05, "loss": 2.3847, "step": 293950 }, { "epoch": 0.51, "learning_rate": 2.4368453910999348e-05, "loss": 2.3577, "step": 293960 }, { "epoch": 0.51, "learning_rate": 2.436758197107252e-05, "loss": 2.3421, "step": 293970 }, { "epoch": 0.51, "learning_rate": 2.4366710031145695e-05, "loss": 2.1912, "step": 293980 }, { "epoch": 0.51, "learning_rate": 2.436583809121887e-05, "loss": 2.3589, "step": 293990 }, { "epoch": 0.51, "learning_rate": 2.4364966151292043e-05, "loss": 2.3521, "step": 294000 }, { "epoch": 0.51, "learning_rate": 2.4364094211365217e-05, "loss": 2.3625, "step": 294010 }, { "epoch": 0.51, "learning_rate": 2.4363222271438387e-05, "loss": 2.3814, "step": 294020 }, { "epoch": 0.51, "learning_rate": 2.436235033151156e-05, "loss": 2.3563, "step": 294030 }, { "epoch": 0.51, "learning_rate": 2.4361478391584734e-05, "loss": 2.4355, "step": 294040 }, { "epoch": 0.51, "learning_rate": 2.4360606451657908e-05, "loss": 2.4159, "step": 294050 }, { "epoch": 0.51, "learning_rate": 2.4359734511731082e-05, "loss": 2.2859, "step": 294060 }, { "epoch": 0.51, "learning_rate": 2.4358862571804252e-05, "loss": 2.3, "step": 294070 }, { "epoch": 0.51, "learning_rate": 2.435799063187743e-05, "loss": 2.3573, "step": 294080 }, { "epoch": 0.51, "learning_rate": 2.43571186919506e-05, "loss": 2.3259, "step": 294090 }, { "epoch": 0.51, "learning_rate": 2.4356246752023774e-05, "loss": 2.3747, "step": 294100 }, { "epoch": 0.51, "learning_rate": 2.4355374812096947e-05, "loss": 2.4093, "step": 294110 }, { "epoch": 0.51, "learning_rate": 2.435450287217012e-05, "loss": 2.257, "step": 294120 }, { "epoch": 0.51, "learning_rate": 2.435363093224329e-05, "loss": 2.3075, "step": 294130 }, { "epoch": 0.51, "learning_rate": 2.4352758992316465e-05, "loss": 2.3553, "step": 294140 }, { "epoch": 0.51, "learning_rate": 2.435188705238964e-05, "loss": 2.2786, "step": 294150 }, { "epoch": 0.51, "learning_rate": 2.4351015112462813e-05, "loss": 2.3413, "step": 294160 }, { "epoch": 0.51, "learning_rate": 2.4350143172535987e-05, "loss": 2.3248, "step": 294170 }, { "epoch": 0.51, "learning_rate": 2.4349271232609157e-05, "loss": 2.3914, "step": 294180 }, { "epoch": 0.51, "learning_rate": 2.4348399292682334e-05, "loss": 2.3462, "step": 294190 }, { "epoch": 0.51, "learning_rate": 2.4347527352755505e-05, "loss": 2.33, "step": 294200 }, { "epoch": 0.51, "learning_rate": 2.434665541282868e-05, "loss": 2.2559, "step": 294210 }, { "epoch": 0.51, "learning_rate": 2.4345783472901852e-05, "loss": 2.3316, "step": 294220 }, { "epoch": 0.51, "learning_rate": 2.4344911532975026e-05, "loss": 2.3944, "step": 294230 }, { "epoch": 0.51, "learning_rate": 2.43440395930482e-05, "loss": 2.3816, "step": 294240 }, { "epoch": 0.51, "learning_rate": 2.434316765312137e-05, "loss": 2.3007, "step": 294250 }, { "epoch": 0.51, "learning_rate": 2.4342295713194547e-05, "loss": 2.3198, "step": 294260 }, { "epoch": 0.51, "learning_rate": 2.4341423773267718e-05, "loss": 2.4708, "step": 294270 }, { "epoch": 0.51, "learning_rate": 2.434055183334089e-05, "loss": 2.4152, "step": 294280 }, { "epoch": 0.51, "learning_rate": 2.4339679893414065e-05, "loss": 2.3169, "step": 294290 }, { "epoch": 0.51, "learning_rate": 2.433880795348724e-05, "loss": 2.3659, "step": 294300 }, { "epoch": 0.51, "learning_rate": 2.4337936013560413e-05, "loss": 2.4175, "step": 294310 }, { "epoch": 0.51, "learning_rate": 2.4337064073633583e-05, "loss": 2.3175, "step": 294320 }, { "epoch": 0.51, "learning_rate": 2.4336192133706757e-05, "loss": 2.3101, "step": 294330 }, { "epoch": 0.51, "learning_rate": 2.433532019377993e-05, "loss": 2.4071, "step": 294340 }, { "epoch": 0.51, "learning_rate": 2.4334448253853104e-05, "loss": 2.3313, "step": 294350 }, { "epoch": 0.51, "learning_rate": 2.4333576313926275e-05, "loss": 2.4011, "step": 294360 }, { "epoch": 0.51, "learning_rate": 2.4332704373999452e-05, "loss": 2.3934, "step": 294370 }, { "epoch": 0.51, "learning_rate": 2.4331832434072622e-05, "loss": 2.3892, "step": 294380 }, { "epoch": 0.51, "learning_rate": 2.4330960494145796e-05, "loss": 2.3352, "step": 294390 }, { "epoch": 0.51, "learning_rate": 2.433008855421897e-05, "loss": 2.345, "step": 294400 }, { "epoch": 0.51, "learning_rate": 2.4329216614292144e-05, "loss": 2.4206, "step": 294410 }, { "epoch": 0.51, "learning_rate": 2.4328344674365317e-05, "loss": 2.3137, "step": 294420 }, { "epoch": 0.51, "learning_rate": 2.4327472734438488e-05, "loss": 2.4247, "step": 294430 }, { "epoch": 0.51, "learning_rate": 2.432660079451166e-05, "loss": 2.4007, "step": 294440 }, { "epoch": 0.51, "learning_rate": 2.4325728854584835e-05, "loss": 2.2474, "step": 294450 }, { "epoch": 0.51, "learning_rate": 2.432485691465801e-05, "loss": 2.4126, "step": 294460 }, { "epoch": 0.51, "learning_rate": 2.4323984974731183e-05, "loss": 2.2271, "step": 294470 }, { "epoch": 0.51, "learning_rate": 2.4323113034804353e-05, "loss": 2.4587, "step": 294480 }, { "epoch": 0.51, "learning_rate": 2.432224109487753e-05, "loss": 2.3741, "step": 294490 }, { "epoch": 0.51, "learning_rate": 2.43213691549507e-05, "loss": 2.3865, "step": 294500 }, { "epoch": 0.51, "learning_rate": 2.4320497215023875e-05, "loss": 2.3469, "step": 294510 }, { "epoch": 0.51, "learning_rate": 2.431962527509705e-05, "loss": 2.4668, "step": 294520 }, { "epoch": 0.51, "learning_rate": 2.4318753335170222e-05, "loss": 2.2556, "step": 294530 }, { "epoch": 0.51, "learning_rate": 2.4317881395243396e-05, "loss": 2.427, "step": 294540 }, { "epoch": 0.51, "learning_rate": 2.4317009455316566e-05, "loss": 2.4085, "step": 294550 }, { "epoch": 0.51, "learning_rate": 2.4316137515389743e-05, "loss": 2.2341, "step": 294560 }, { "epoch": 0.51, "learning_rate": 2.4315265575462914e-05, "loss": 2.2077, "step": 294570 }, { "epoch": 0.51, "learning_rate": 2.4314393635536088e-05, "loss": 2.272, "step": 294580 }, { "epoch": 0.51, "learning_rate": 2.4313521695609258e-05, "loss": 2.4181, "step": 294590 }, { "epoch": 0.51, "learning_rate": 2.4312649755682435e-05, "loss": 2.4314, "step": 294600 }, { "epoch": 0.51, "learning_rate": 2.4311777815755605e-05, "loss": 2.3632, "step": 294610 }, { "epoch": 0.51, "learning_rate": 2.431090587582878e-05, "loss": 2.2815, "step": 294620 }, { "epoch": 0.51, "learning_rate": 2.4310033935901953e-05, "loss": 2.3291, "step": 294630 }, { "epoch": 0.51, "learning_rate": 2.4309161995975127e-05, "loss": 2.3784, "step": 294640 }, { "epoch": 0.51, "learning_rate": 2.43082900560483e-05, "loss": 2.3663, "step": 294650 }, { "epoch": 0.51, "learning_rate": 2.430741811612147e-05, "loss": 2.2887, "step": 294660 }, { "epoch": 0.51, "learning_rate": 2.4306546176194648e-05, "loss": 2.3531, "step": 294670 }, { "epoch": 0.51, "learning_rate": 2.430567423626782e-05, "loss": 2.3348, "step": 294680 }, { "epoch": 0.51, "learning_rate": 2.4304802296340992e-05, "loss": 2.4173, "step": 294690 }, { "epoch": 0.51, "learning_rate": 2.4303930356414166e-05, "loss": 2.3965, "step": 294700 }, { "epoch": 0.51, "learning_rate": 2.430305841648734e-05, "loss": 2.2771, "step": 294710 }, { "epoch": 0.51, "learning_rate": 2.4302186476560514e-05, "loss": 2.2864, "step": 294720 }, { "epoch": 0.51, "learning_rate": 2.4301314536633684e-05, "loss": 2.3188, "step": 294730 }, { "epoch": 0.51, "learning_rate": 2.4300442596706858e-05, "loss": 2.302, "step": 294740 }, { "epoch": 0.51, "learning_rate": 2.429957065678003e-05, "loss": 2.4366, "step": 294750 }, { "epoch": 0.51, "learning_rate": 2.4298698716853205e-05, "loss": 2.379, "step": 294760 }, { "epoch": 0.51, "learning_rate": 2.429782677692638e-05, "loss": 2.3621, "step": 294770 }, { "epoch": 0.51, "learning_rate": 2.4296954836999553e-05, "loss": 2.3967, "step": 294780 }, { "epoch": 0.51, "learning_rate": 2.4296082897072727e-05, "loss": 2.286, "step": 294790 }, { "epoch": 0.51, "learning_rate": 2.4295210957145897e-05, "loss": 2.378, "step": 294800 }, { "epoch": 0.51, "learning_rate": 2.429433901721907e-05, "loss": 2.2571, "step": 294810 }, { "epoch": 0.51, "learning_rate": 2.4293467077292244e-05, "loss": 2.3375, "step": 294820 }, { "epoch": 0.51, "learning_rate": 2.4292595137365418e-05, "loss": 2.4127, "step": 294830 }, { "epoch": 0.51, "learning_rate": 2.429172319743859e-05, "loss": 2.3337, "step": 294840 }, { "epoch": 0.51, "learning_rate": 2.4290851257511762e-05, "loss": 2.4333, "step": 294850 }, { "epoch": 0.51, "learning_rate": 2.4289979317584936e-05, "loss": 2.3955, "step": 294860 }, { "epoch": 0.51, "learning_rate": 2.428910737765811e-05, "loss": 2.3698, "step": 294870 }, { "epoch": 0.51, "learning_rate": 2.4288235437731284e-05, "loss": 2.345, "step": 294880 }, { "epoch": 0.51, "learning_rate": 2.4287363497804454e-05, "loss": 2.494, "step": 294890 }, { "epoch": 0.51, "learning_rate": 2.428649155787763e-05, "loss": 2.2505, "step": 294900 }, { "epoch": 0.51, "learning_rate": 2.42856196179508e-05, "loss": 2.3602, "step": 294910 }, { "epoch": 0.51, "learning_rate": 2.4284747678023975e-05, "loss": 2.2915, "step": 294920 }, { "epoch": 0.51, "learning_rate": 2.428387573809715e-05, "loss": 2.4685, "step": 294930 }, { "epoch": 0.51, "learning_rate": 2.4283003798170323e-05, "loss": 2.4712, "step": 294940 }, { "epoch": 0.51, "learning_rate": 2.4282131858243497e-05, "loss": 2.4043, "step": 294950 }, { "epoch": 0.51, "learning_rate": 2.4281259918316667e-05, "loss": 2.3163, "step": 294960 }, { "epoch": 0.51, "learning_rate": 2.4280387978389844e-05, "loss": 2.3468, "step": 294970 }, { "epoch": 0.51, "learning_rate": 2.4279516038463015e-05, "loss": 2.358, "step": 294980 }, { "epoch": 0.51, "learning_rate": 2.427864409853619e-05, "loss": 2.2489, "step": 294990 }, { "epoch": 0.51, "learning_rate": 2.427777215860936e-05, "loss": 2.5064, "step": 295000 }, { "epoch": 0.51, "learning_rate": 2.4276900218682536e-05, "loss": 2.4526, "step": 295010 }, { "epoch": 0.51, "learning_rate": 2.427602827875571e-05, "loss": 2.2351, "step": 295020 }, { "epoch": 0.51, "learning_rate": 2.427515633882888e-05, "loss": 2.2259, "step": 295030 }, { "epoch": 0.51, "learning_rate": 2.4274284398902057e-05, "loss": 2.4917, "step": 295040 }, { "epoch": 0.51, "learning_rate": 2.4273412458975228e-05, "loss": 2.2773, "step": 295050 }, { "epoch": 0.51, "learning_rate": 2.42725405190484e-05, "loss": 2.3175, "step": 295060 }, { "epoch": 0.51, "learning_rate": 2.4271668579121572e-05, "loss": 2.3784, "step": 295070 }, { "epoch": 0.51, "learning_rate": 2.427079663919475e-05, "loss": 2.273, "step": 295080 }, { "epoch": 0.51, "learning_rate": 2.426992469926792e-05, "loss": 2.4423, "step": 295090 }, { "epoch": 0.51, "learning_rate": 2.4269052759341093e-05, "loss": 2.2985, "step": 295100 }, { "epoch": 0.51, "learning_rate": 2.4268180819414267e-05, "loss": 2.369, "step": 295110 }, { "epoch": 0.51, "learning_rate": 2.426730887948744e-05, "loss": 2.2971, "step": 295120 }, { "epoch": 0.51, "learning_rate": 2.4266436939560614e-05, "loss": 2.3704, "step": 295130 }, { "epoch": 0.51, "learning_rate": 2.4265564999633785e-05, "loss": 2.3631, "step": 295140 }, { "epoch": 0.51, "learning_rate": 2.426469305970696e-05, "loss": 2.4548, "step": 295150 }, { "epoch": 0.51, "learning_rate": 2.4263821119780132e-05, "loss": 2.3596, "step": 295160 }, { "epoch": 0.51, "learning_rate": 2.4262949179853306e-05, "loss": 2.393, "step": 295170 }, { "epoch": 0.51, "learning_rate": 2.426207723992648e-05, "loss": 2.449, "step": 295180 }, { "epoch": 0.51, "learning_rate": 2.4261205299999654e-05, "loss": 2.3407, "step": 295190 }, { "epoch": 0.51, "learning_rate": 2.4260333360072827e-05, "loss": 2.3338, "step": 295200 }, { "epoch": 0.51, "learning_rate": 2.4259461420145998e-05, "loss": 2.2596, "step": 295210 }, { "epoch": 0.51, "learning_rate": 2.425858948021917e-05, "loss": 2.3164, "step": 295220 }, { "epoch": 0.51, "learning_rate": 2.4257717540292345e-05, "loss": 2.1746, "step": 295230 }, { "epoch": 0.51, "learning_rate": 2.425684560036552e-05, "loss": 2.3627, "step": 295240 }, { "epoch": 0.51, "learning_rate": 2.425597366043869e-05, "loss": 2.4099, "step": 295250 }, { "epoch": 0.51, "learning_rate": 2.4255101720511863e-05, "loss": 2.3606, "step": 295260 }, { "epoch": 0.51, "learning_rate": 2.425422978058504e-05, "loss": 2.3796, "step": 295270 }, { "epoch": 0.51, "learning_rate": 2.425335784065821e-05, "loss": 2.43, "step": 295280 }, { "epoch": 0.51, "learning_rate": 2.4252485900731385e-05, "loss": 2.2416, "step": 295290 }, { "epoch": 0.51, "learning_rate": 2.425161396080456e-05, "loss": 2.371, "step": 295300 }, { "epoch": 0.51, "learning_rate": 2.4250742020877732e-05, "loss": 2.3468, "step": 295310 }, { "epoch": 0.52, "learning_rate": 2.4249870080950902e-05, "loss": 2.397, "step": 295320 }, { "epoch": 0.52, "learning_rate": 2.4248998141024076e-05, "loss": 2.3506, "step": 295330 }, { "epoch": 0.52, "learning_rate": 2.424812620109725e-05, "loss": 2.362, "step": 295340 }, { "epoch": 0.52, "learning_rate": 2.4247254261170424e-05, "loss": 2.3848, "step": 295350 }, { "epoch": 0.52, "learning_rate": 2.4246382321243598e-05, "loss": 2.4137, "step": 295360 }, { "epoch": 0.52, "learning_rate": 2.4245510381316768e-05, "loss": 2.4302, "step": 295370 }, { "epoch": 0.52, "learning_rate": 2.4244638441389945e-05, "loss": 2.3109, "step": 295380 }, { "epoch": 0.52, "learning_rate": 2.4243766501463115e-05, "loss": 2.3739, "step": 295390 }, { "epoch": 0.52, "learning_rate": 2.424289456153629e-05, "loss": 2.49, "step": 295400 }, { "epoch": 0.52, "learning_rate": 2.4242022621609463e-05, "loss": 2.3198, "step": 295410 }, { "epoch": 0.52, "learning_rate": 2.4241150681682637e-05, "loss": 2.3873, "step": 295420 }, { "epoch": 0.52, "learning_rate": 2.424027874175581e-05, "loss": 2.348, "step": 295430 }, { "epoch": 0.52, "learning_rate": 2.423940680182898e-05, "loss": 2.407, "step": 295440 }, { "epoch": 0.52, "learning_rate": 2.4238534861902158e-05, "loss": 2.3074, "step": 295450 }, { "epoch": 0.52, "learning_rate": 2.423766292197533e-05, "loss": 2.3515, "step": 295460 }, { "epoch": 0.52, "learning_rate": 2.4236790982048502e-05, "loss": 2.2991, "step": 295470 }, { "epoch": 0.52, "learning_rate": 2.4235919042121673e-05, "loss": 2.3571, "step": 295480 }, { "epoch": 0.52, "learning_rate": 2.423504710219485e-05, "loss": 2.4773, "step": 295490 }, { "epoch": 0.52, "learning_rate": 2.4234175162268024e-05, "loss": 2.319, "step": 295500 }, { "epoch": 0.52, "learning_rate": 2.4233303222341194e-05, "loss": 2.3215, "step": 295510 }, { "epoch": 0.52, "learning_rate": 2.4232431282414368e-05, "loss": 2.3969, "step": 295520 }, { "epoch": 0.52, "learning_rate": 2.423155934248754e-05, "loss": 2.3433, "step": 295530 }, { "epoch": 0.52, "learning_rate": 2.4230687402560715e-05, "loss": 2.3224, "step": 295540 }, { "epoch": 0.52, "learning_rate": 2.4229815462633886e-05, "loss": 2.4313, "step": 295550 }, { "epoch": 0.52, "learning_rate": 2.422894352270706e-05, "loss": 2.3733, "step": 295560 }, { "epoch": 0.52, "learning_rate": 2.4228071582780233e-05, "loss": 2.3426, "step": 295570 }, { "epoch": 0.52, "learning_rate": 2.4227199642853407e-05, "loss": 2.2331, "step": 295580 }, { "epoch": 0.52, "learning_rate": 2.422632770292658e-05, "loss": 2.3389, "step": 295590 }, { "epoch": 0.52, "learning_rate": 2.4225455762999754e-05, "loss": 2.2931, "step": 295600 }, { "epoch": 0.52, "learning_rate": 2.4224583823072928e-05, "loss": 2.319, "step": 295610 }, { "epoch": 0.52, "learning_rate": 2.42237118831461e-05, "loss": 2.412, "step": 295620 }, { "epoch": 0.52, "learning_rate": 2.4222839943219272e-05, "loss": 2.3956, "step": 295630 }, { "epoch": 0.52, "learning_rate": 2.4221968003292446e-05, "loss": 2.3638, "step": 295640 }, { "epoch": 0.52, "learning_rate": 2.422109606336562e-05, "loss": 2.2816, "step": 295650 }, { "epoch": 0.52, "learning_rate": 2.4220224123438794e-05, "loss": 2.2917, "step": 295660 }, { "epoch": 0.52, "learning_rate": 2.4219352183511964e-05, "loss": 2.3163, "step": 295670 }, { "epoch": 0.52, "learning_rate": 2.421848024358514e-05, "loss": 2.4275, "step": 295680 }, { "epoch": 0.52, "learning_rate": 2.421760830365831e-05, "loss": 2.2805, "step": 295690 }, { "epoch": 0.52, "learning_rate": 2.4216736363731485e-05, "loss": 2.2908, "step": 295700 }, { "epoch": 0.52, "learning_rate": 2.421586442380466e-05, "loss": 2.2296, "step": 295710 }, { "epoch": 0.52, "learning_rate": 2.4214992483877833e-05, "loss": 2.4453, "step": 295720 }, { "epoch": 0.52, "learning_rate": 2.4214120543951003e-05, "loss": 2.3145, "step": 295730 }, { "epoch": 0.52, "learning_rate": 2.4213248604024177e-05, "loss": 2.2828, "step": 295740 }, { "epoch": 0.52, "learning_rate": 2.4212376664097354e-05, "loss": 2.4007, "step": 295750 }, { "epoch": 0.52, "learning_rate": 2.4211504724170525e-05, "loss": 2.3331, "step": 295760 }, { "epoch": 0.52, "learning_rate": 2.42106327842437e-05, "loss": 2.291, "step": 295770 }, { "epoch": 0.52, "learning_rate": 2.420976084431687e-05, "loss": 2.4279, "step": 295780 }, { "epoch": 0.52, "learning_rate": 2.4208888904390046e-05, "loss": 2.3839, "step": 295790 }, { "epoch": 0.52, "learning_rate": 2.4208016964463216e-05, "loss": 2.4101, "step": 295800 }, { "epoch": 0.52, "learning_rate": 2.420714502453639e-05, "loss": 2.1885, "step": 295810 }, { "epoch": 0.52, "learning_rate": 2.4206273084609564e-05, "loss": 2.2554, "step": 295820 }, { "epoch": 0.52, "learning_rate": 2.4205401144682738e-05, "loss": 2.3402, "step": 295830 }, { "epoch": 0.52, "learning_rate": 2.420452920475591e-05, "loss": 2.3298, "step": 295840 }, { "epoch": 0.52, "learning_rate": 2.4203657264829082e-05, "loss": 2.3644, "step": 295850 }, { "epoch": 0.52, "learning_rate": 2.420278532490226e-05, "loss": 2.2729, "step": 295860 }, { "epoch": 0.52, "learning_rate": 2.420191338497543e-05, "loss": 2.4198, "step": 295870 }, { "epoch": 0.52, "learning_rate": 2.4201041445048603e-05, "loss": 2.357, "step": 295880 }, { "epoch": 0.52, "learning_rate": 2.4200169505121777e-05, "loss": 2.3334, "step": 295890 }, { "epoch": 0.52, "learning_rate": 2.419929756519495e-05, "loss": 2.42, "step": 295900 }, { "epoch": 0.52, "learning_rate": 2.4198425625268124e-05, "loss": 2.2355, "step": 295910 }, { "epoch": 0.52, "learning_rate": 2.4197553685341295e-05, "loss": 2.4225, "step": 295920 }, { "epoch": 0.52, "learning_rate": 2.419668174541447e-05, "loss": 2.3122, "step": 295930 }, { "epoch": 0.52, "learning_rate": 2.4195809805487642e-05, "loss": 2.3533, "step": 295940 }, { "epoch": 0.52, "learning_rate": 2.4194937865560816e-05, "loss": 2.3941, "step": 295950 }, { "epoch": 0.52, "learning_rate": 2.4194065925633986e-05, "loss": 2.2337, "step": 295960 }, { "epoch": 0.52, "learning_rate": 2.4193193985707164e-05, "loss": 2.4214, "step": 295970 }, { "epoch": 0.52, "learning_rate": 2.4192322045780334e-05, "loss": 2.3645, "step": 295980 }, { "epoch": 0.52, "learning_rate": 2.4191450105853508e-05, "loss": 2.4198, "step": 295990 }, { "epoch": 0.52, "learning_rate": 2.419057816592668e-05, "loss": 2.3333, "step": 296000 }, { "epoch": 0.52, "learning_rate": 2.4189706225999855e-05, "loss": 2.4367, "step": 296010 }, { "epoch": 0.52, "learning_rate": 2.418883428607303e-05, "loss": 2.3389, "step": 296020 }, { "epoch": 0.52, "learning_rate": 2.41879623461462e-05, "loss": 2.3269, "step": 296030 }, { "epoch": 0.52, "learning_rate": 2.4187090406219373e-05, "loss": 2.4022, "step": 296040 }, { "epoch": 0.52, "learning_rate": 2.4186218466292547e-05, "loss": 2.3568, "step": 296050 }, { "epoch": 0.52, "learning_rate": 2.418534652636572e-05, "loss": 2.3563, "step": 296060 }, { "epoch": 0.52, "learning_rate": 2.4184474586438895e-05, "loss": 2.3961, "step": 296070 }, { "epoch": 0.52, "learning_rate": 2.4183602646512065e-05, "loss": 2.3986, "step": 296080 }, { "epoch": 0.52, "learning_rate": 2.4182730706585242e-05, "loss": 2.3511, "step": 296090 }, { "epoch": 0.52, "learning_rate": 2.4181858766658412e-05, "loss": 2.4208, "step": 296100 }, { "epoch": 0.52, "learning_rate": 2.4180986826731586e-05, "loss": 2.2703, "step": 296110 }, { "epoch": 0.52, "learning_rate": 2.418011488680476e-05, "loss": 2.4193, "step": 296120 }, { "epoch": 0.52, "learning_rate": 2.4179242946877934e-05, "loss": 2.3359, "step": 296130 }, { "epoch": 0.52, "learning_rate": 2.4178371006951108e-05, "loss": 2.5308, "step": 296140 }, { "epoch": 0.52, "learning_rate": 2.4177499067024278e-05, "loss": 2.3087, "step": 296150 }, { "epoch": 0.52, "learning_rate": 2.4176627127097455e-05, "loss": 2.4525, "step": 296160 }, { "epoch": 0.52, "learning_rate": 2.4175755187170625e-05, "loss": 2.4367, "step": 296170 }, { "epoch": 0.52, "learning_rate": 2.41748832472438e-05, "loss": 2.349, "step": 296180 }, { "epoch": 0.52, "learning_rate": 2.417401130731697e-05, "loss": 2.425, "step": 296190 }, { "epoch": 0.52, "learning_rate": 2.4173139367390147e-05, "loss": 2.3491, "step": 296200 }, { "epoch": 0.52, "learning_rate": 2.4172267427463317e-05, "loss": 2.3822, "step": 296210 }, { "epoch": 0.52, "learning_rate": 2.417139548753649e-05, "loss": 2.3717, "step": 296220 }, { "epoch": 0.52, "learning_rate": 2.4170523547609668e-05, "loss": 2.3725, "step": 296230 }, { "epoch": 0.52, "learning_rate": 2.416965160768284e-05, "loss": 2.3642, "step": 296240 }, { "epoch": 0.52, "learning_rate": 2.4168779667756012e-05, "loss": 2.2628, "step": 296250 }, { "epoch": 0.52, "learning_rate": 2.4167907727829183e-05, "loss": 2.3441, "step": 296260 }, { "epoch": 0.52, "learning_rate": 2.416703578790236e-05, "loss": 2.2571, "step": 296270 }, { "epoch": 0.52, "learning_rate": 2.416616384797553e-05, "loss": 2.3014, "step": 296280 }, { "epoch": 0.52, "learning_rate": 2.4165291908048704e-05, "loss": 2.3395, "step": 296290 }, { "epoch": 0.52, "learning_rate": 2.4164419968121878e-05, "loss": 2.3155, "step": 296300 }, { "epoch": 0.52, "learning_rate": 2.416354802819505e-05, "loss": 2.3571, "step": 296310 }, { "epoch": 0.52, "learning_rate": 2.4162676088268225e-05, "loss": 2.4261, "step": 296320 }, { "epoch": 0.52, "learning_rate": 2.4161804148341396e-05, "loss": 2.4282, "step": 296330 }, { "epoch": 0.52, "learning_rate": 2.416093220841457e-05, "loss": 2.3945, "step": 296340 }, { "epoch": 0.52, "learning_rate": 2.4160060268487743e-05, "loss": 2.3914, "step": 296350 }, { "epoch": 0.52, "learning_rate": 2.4159188328560917e-05, "loss": 2.3475, "step": 296360 }, { "epoch": 0.52, "learning_rate": 2.415831638863409e-05, "loss": 2.316, "step": 296370 }, { "epoch": 0.52, "learning_rate": 2.4157444448707264e-05, "loss": 2.3342, "step": 296380 }, { "epoch": 0.52, "learning_rate": 2.4156572508780438e-05, "loss": 2.3956, "step": 296390 }, { "epoch": 0.52, "learning_rate": 2.415570056885361e-05, "loss": 2.3305, "step": 296400 }, { "epoch": 0.52, "learning_rate": 2.4154828628926782e-05, "loss": 2.4679, "step": 296410 }, { "epoch": 0.52, "learning_rate": 2.4153956688999956e-05, "loss": 2.4174, "step": 296420 }, { "epoch": 0.52, "learning_rate": 2.415308474907313e-05, "loss": 2.2616, "step": 296430 }, { "epoch": 0.52, "learning_rate": 2.41522128091463e-05, "loss": 2.3505, "step": 296440 }, { "epoch": 0.52, "learning_rate": 2.4151340869219474e-05, "loss": 2.3103, "step": 296450 }, { "epoch": 0.52, "learning_rate": 2.4150468929292648e-05, "loss": 2.3139, "step": 296460 }, { "epoch": 0.52, "learning_rate": 2.414959698936582e-05, "loss": 2.3818, "step": 296470 }, { "epoch": 0.52, "learning_rate": 2.4148725049438995e-05, "loss": 2.3594, "step": 296480 }, { "epoch": 0.52, "learning_rate": 2.4147853109512166e-05, "loss": 2.2473, "step": 296490 }, { "epoch": 0.52, "learning_rate": 2.4146981169585343e-05, "loss": 2.4907, "step": 296500 }, { "epoch": 0.52, "learning_rate": 2.4146109229658513e-05, "loss": 2.41, "step": 296510 }, { "epoch": 0.52, "learning_rate": 2.4145237289731687e-05, "loss": 2.356, "step": 296520 }, { "epoch": 0.52, "learning_rate": 2.414436534980486e-05, "loss": 2.4267, "step": 296530 }, { "epoch": 0.52, "learning_rate": 2.4143493409878035e-05, "loss": 2.4036, "step": 296540 }, { "epoch": 0.52, "learning_rate": 2.414262146995121e-05, "loss": 2.3708, "step": 296550 }, { "epoch": 0.52, "learning_rate": 2.414174953002438e-05, "loss": 2.3971, "step": 296560 }, { "epoch": 0.52, "learning_rate": 2.4140877590097556e-05, "loss": 2.3912, "step": 296570 }, { "epoch": 0.52, "learning_rate": 2.4140005650170726e-05, "loss": 2.4169, "step": 296580 }, { "epoch": 0.52, "learning_rate": 2.41391337102439e-05, "loss": 2.4244, "step": 296590 }, { "epoch": 0.52, "learning_rate": 2.413826177031707e-05, "loss": 2.4777, "step": 296600 }, { "epoch": 0.52, "learning_rate": 2.4137389830390248e-05, "loss": 2.4467, "step": 296610 }, { "epoch": 0.52, "learning_rate": 2.413651789046342e-05, "loss": 2.4072, "step": 296620 }, { "epoch": 0.52, "learning_rate": 2.4135645950536592e-05, "loss": 2.3297, "step": 296630 }, { "epoch": 0.52, "learning_rate": 2.413477401060977e-05, "loss": 2.4823, "step": 296640 }, { "epoch": 0.52, "learning_rate": 2.413390207068294e-05, "loss": 2.284, "step": 296650 }, { "epoch": 0.52, "learning_rate": 2.4133030130756113e-05, "loss": 2.2946, "step": 296660 }, { "epoch": 0.52, "learning_rate": 2.4132158190829283e-05, "loss": 2.3518, "step": 296670 }, { "epoch": 0.52, "learning_rate": 2.413128625090246e-05, "loss": 2.2944, "step": 296680 }, { "epoch": 0.52, "learning_rate": 2.413041431097563e-05, "loss": 2.4773, "step": 296690 }, { "epoch": 0.52, "learning_rate": 2.4129542371048805e-05, "loss": 2.3016, "step": 296700 }, { "epoch": 0.52, "learning_rate": 2.412867043112198e-05, "loss": 2.3098, "step": 296710 }, { "epoch": 0.52, "learning_rate": 2.4127798491195152e-05, "loss": 2.4037, "step": 296720 }, { "epoch": 0.52, "learning_rate": 2.4126926551268326e-05, "loss": 2.3645, "step": 296730 }, { "epoch": 0.52, "learning_rate": 2.4126054611341496e-05, "loss": 2.2945, "step": 296740 }, { "epoch": 0.52, "learning_rate": 2.412518267141467e-05, "loss": 2.3816, "step": 296750 }, { "epoch": 0.52, "learning_rate": 2.4124310731487844e-05, "loss": 2.4236, "step": 296760 }, { "epoch": 0.52, "learning_rate": 2.4123438791561018e-05, "loss": 2.2445, "step": 296770 }, { "epoch": 0.52, "learning_rate": 2.412256685163419e-05, "loss": 2.3876, "step": 296780 }, { "epoch": 0.52, "learning_rate": 2.4121694911707365e-05, "loss": 2.3426, "step": 296790 }, { "epoch": 0.52, "learning_rate": 2.412082297178054e-05, "loss": 2.2915, "step": 296800 }, { "epoch": 0.52, "learning_rate": 2.411995103185371e-05, "loss": 2.3787, "step": 296810 }, { "epoch": 0.52, "learning_rate": 2.4119079091926883e-05, "loss": 2.3806, "step": 296820 }, { "epoch": 0.52, "learning_rate": 2.4118207152000057e-05, "loss": 2.3306, "step": 296830 }, { "epoch": 0.52, "learning_rate": 2.411733521207323e-05, "loss": 2.4501, "step": 296840 }, { "epoch": 0.52, "learning_rate": 2.4116463272146405e-05, "loss": 2.3546, "step": 296850 }, { "epoch": 0.52, "learning_rate": 2.4115591332219575e-05, "loss": 2.4276, "step": 296860 }, { "epoch": 0.52, "learning_rate": 2.4114719392292752e-05, "loss": 2.3071, "step": 296870 }, { "epoch": 0.52, "learning_rate": 2.4113847452365922e-05, "loss": 2.1949, "step": 296880 }, { "epoch": 0.52, "learning_rate": 2.4112975512439096e-05, "loss": 2.35, "step": 296890 }, { "epoch": 0.52, "learning_rate": 2.411210357251227e-05, "loss": 2.4089, "step": 296900 }, { "epoch": 0.52, "learning_rate": 2.4111231632585444e-05, "loss": 2.3727, "step": 296910 }, { "epoch": 0.52, "learning_rate": 2.4110359692658614e-05, "loss": 2.3974, "step": 296920 }, { "epoch": 0.52, "learning_rate": 2.4109487752731788e-05, "loss": 2.3477, "step": 296930 }, { "epoch": 0.52, "learning_rate": 2.4108615812804962e-05, "loss": 2.4351, "step": 296940 }, { "epoch": 0.52, "learning_rate": 2.4107743872878135e-05, "loss": 2.4083, "step": 296950 }, { "epoch": 0.52, "learning_rate": 2.410687193295131e-05, "loss": 2.4757, "step": 296960 }, { "epoch": 0.52, "learning_rate": 2.410599999302448e-05, "loss": 2.3786, "step": 296970 }, { "epoch": 0.52, "learning_rate": 2.4105128053097657e-05, "loss": 2.3901, "step": 296980 }, { "epoch": 0.52, "learning_rate": 2.4104256113170827e-05, "loss": 2.3225, "step": 296990 }, { "epoch": 0.52, "learning_rate": 2.4103384173244e-05, "loss": 2.3622, "step": 297000 }, { "epoch": 0.52, "learning_rate": 2.4102512233317175e-05, "loss": 2.2861, "step": 297010 }, { "epoch": 0.52, "learning_rate": 2.410164029339035e-05, "loss": 2.3462, "step": 297020 }, { "epoch": 0.52, "learning_rate": 2.4100768353463522e-05, "loss": 2.3164, "step": 297030 }, { "epoch": 0.52, "learning_rate": 2.4099896413536693e-05, "loss": 2.5175, "step": 297040 }, { "epoch": 0.52, "learning_rate": 2.409902447360987e-05, "loss": 2.4223, "step": 297050 }, { "epoch": 0.52, "learning_rate": 2.409815253368304e-05, "loss": 2.3797, "step": 297060 }, { "epoch": 0.52, "learning_rate": 2.4097280593756214e-05, "loss": 2.2892, "step": 297070 }, { "epoch": 0.52, "learning_rate": 2.4096408653829384e-05, "loss": 2.2963, "step": 297080 }, { "epoch": 0.52, "learning_rate": 2.409553671390256e-05, "loss": 2.4475, "step": 297090 }, { "epoch": 0.52, "learning_rate": 2.4094664773975735e-05, "loss": 2.3132, "step": 297100 }, { "epoch": 0.52, "learning_rate": 2.4093792834048906e-05, "loss": 2.3714, "step": 297110 }, { "epoch": 0.52, "learning_rate": 2.409292089412208e-05, "loss": 2.3071, "step": 297120 }, { "epoch": 0.52, "learning_rate": 2.4092048954195253e-05, "loss": 2.3781, "step": 297130 }, { "epoch": 0.52, "learning_rate": 2.4091177014268427e-05, "loss": 2.2608, "step": 297140 }, { "epoch": 0.52, "learning_rate": 2.4090305074341597e-05, "loss": 2.337, "step": 297150 }, { "epoch": 0.52, "learning_rate": 2.4089433134414774e-05, "loss": 2.3308, "step": 297160 }, { "epoch": 0.52, "learning_rate": 2.4088561194487945e-05, "loss": 2.396, "step": 297170 }, { "epoch": 0.52, "learning_rate": 2.408768925456112e-05, "loss": 2.2818, "step": 297180 }, { "epoch": 0.52, "learning_rate": 2.4086817314634292e-05, "loss": 2.3783, "step": 297190 }, { "epoch": 0.52, "learning_rate": 2.4085945374707466e-05, "loss": 2.4016, "step": 297200 }, { "epoch": 0.52, "learning_rate": 2.408507343478064e-05, "loss": 2.3643, "step": 297210 }, { "epoch": 0.52, "learning_rate": 2.408420149485381e-05, "loss": 2.3205, "step": 297220 }, { "epoch": 0.52, "learning_rate": 2.4083329554926984e-05, "loss": 2.3577, "step": 297230 }, { "epoch": 0.52, "learning_rate": 2.4082457615000158e-05, "loss": 2.3293, "step": 297240 }, { "epoch": 0.52, "learning_rate": 2.408158567507333e-05, "loss": 2.4477, "step": 297250 }, { "epoch": 0.52, "learning_rate": 2.4080713735146505e-05, "loss": 2.3044, "step": 297260 }, { "epoch": 0.52, "learning_rate": 2.4079841795219676e-05, "loss": 2.2366, "step": 297270 }, { "epoch": 0.52, "learning_rate": 2.4078969855292853e-05, "loss": 2.349, "step": 297280 }, { "epoch": 0.52, "learning_rate": 2.4078097915366023e-05, "loss": 2.1976, "step": 297290 }, { "epoch": 0.52, "learning_rate": 2.4077225975439197e-05, "loss": 2.3507, "step": 297300 }, { "epoch": 0.52, "learning_rate": 2.407635403551237e-05, "loss": 2.4036, "step": 297310 }, { "epoch": 0.52, "learning_rate": 2.4075482095585545e-05, "loss": 2.406, "step": 297320 }, { "epoch": 0.52, "learning_rate": 2.4074610155658715e-05, "loss": 2.3773, "step": 297330 }, { "epoch": 0.52, "learning_rate": 2.407373821573189e-05, "loss": 2.3741, "step": 297340 }, { "epoch": 0.52, "learning_rate": 2.4072866275805066e-05, "loss": 2.3162, "step": 297350 }, { "epoch": 0.52, "learning_rate": 2.4071994335878236e-05, "loss": 2.3258, "step": 297360 }, { "epoch": 0.52, "learning_rate": 2.407112239595141e-05, "loss": 2.3956, "step": 297370 }, { "epoch": 0.52, "learning_rate": 2.407025045602458e-05, "loss": 2.3212, "step": 297380 }, { "epoch": 0.52, "learning_rate": 2.4069378516097758e-05, "loss": 2.393, "step": 297390 }, { "epoch": 0.52, "learning_rate": 2.4068506576170928e-05, "loss": 2.3889, "step": 297400 }, { "epoch": 0.52, "learning_rate": 2.4067634636244102e-05, "loss": 2.3058, "step": 297410 }, { "epoch": 0.52, "learning_rate": 2.4066762696317276e-05, "loss": 2.4461, "step": 297420 }, { "epoch": 0.52, "learning_rate": 2.406589075639045e-05, "loss": 2.3612, "step": 297430 }, { "epoch": 0.52, "learning_rate": 2.4065018816463623e-05, "loss": 2.3045, "step": 297440 }, { "epoch": 0.52, "learning_rate": 2.4064146876536793e-05, "loss": 2.3221, "step": 297450 }, { "epoch": 0.52, "learning_rate": 2.406327493660997e-05, "loss": 2.3353, "step": 297460 }, { "epoch": 0.52, "learning_rate": 2.406240299668314e-05, "loss": 2.3953, "step": 297470 }, { "epoch": 0.52, "learning_rate": 2.4061531056756315e-05, "loss": 2.4031, "step": 297480 }, { "epoch": 0.52, "learning_rate": 2.406065911682949e-05, "loss": 2.4412, "step": 297490 }, { "epoch": 0.52, "learning_rate": 2.4059787176902662e-05, "loss": 2.3916, "step": 297500 }, { "epoch": 0.52, "learning_rate": 2.4058915236975836e-05, "loss": 2.279, "step": 297510 }, { "epoch": 0.52, "learning_rate": 2.4058043297049006e-05, "loss": 2.4273, "step": 297520 }, { "epoch": 0.52, "learning_rate": 2.405717135712218e-05, "loss": 2.2596, "step": 297530 }, { "epoch": 0.52, "learning_rate": 2.4056299417195354e-05, "loss": 2.3529, "step": 297540 }, { "epoch": 0.52, "learning_rate": 2.4055427477268528e-05, "loss": 2.4115, "step": 297550 }, { "epoch": 0.52, "learning_rate": 2.4054555537341698e-05, "loss": 2.4824, "step": 297560 }, { "epoch": 0.52, "learning_rate": 2.4053683597414875e-05, "loss": 2.3328, "step": 297570 }, { "epoch": 0.52, "learning_rate": 2.405281165748805e-05, "loss": 2.4304, "step": 297580 }, { "epoch": 0.52, "learning_rate": 2.405193971756122e-05, "loss": 2.4048, "step": 297590 }, { "epoch": 0.52, "learning_rate": 2.4051067777634393e-05, "loss": 2.3564, "step": 297600 }, { "epoch": 0.52, "learning_rate": 2.4050195837707567e-05, "loss": 2.234, "step": 297610 }, { "epoch": 0.52, "learning_rate": 2.404932389778074e-05, "loss": 2.4742, "step": 297620 }, { "epoch": 0.52, "learning_rate": 2.404845195785391e-05, "loss": 2.333, "step": 297630 }, { "epoch": 0.52, "learning_rate": 2.4047580017927085e-05, "loss": 2.3936, "step": 297640 }, { "epoch": 0.52, "learning_rate": 2.404670807800026e-05, "loss": 2.3351, "step": 297650 }, { "epoch": 0.52, "learning_rate": 2.4045836138073433e-05, "loss": 2.296, "step": 297660 }, { "epoch": 0.52, "learning_rate": 2.4044964198146606e-05, "loss": 2.3051, "step": 297670 }, { "epoch": 0.52, "learning_rate": 2.4044092258219777e-05, "loss": 2.3947, "step": 297680 }, { "epoch": 0.52, "learning_rate": 2.4043220318292954e-05, "loss": 2.3098, "step": 297690 }, { "epoch": 0.52, "learning_rate": 2.4042348378366124e-05, "loss": 2.3213, "step": 297700 }, { "epoch": 0.52, "learning_rate": 2.4041476438439298e-05, "loss": 2.3768, "step": 297710 }, { "epoch": 0.52, "learning_rate": 2.4040604498512472e-05, "loss": 2.2669, "step": 297720 }, { "epoch": 0.52, "learning_rate": 2.4039732558585646e-05, "loss": 2.4884, "step": 297730 }, { "epoch": 0.52, "learning_rate": 2.403886061865882e-05, "loss": 2.4029, "step": 297740 }, { "epoch": 0.52, "learning_rate": 2.403798867873199e-05, "loss": 2.4367, "step": 297750 }, { "epoch": 0.52, "learning_rate": 2.4037116738805167e-05, "loss": 2.3747, "step": 297760 }, { "epoch": 0.52, "learning_rate": 2.4036244798878337e-05, "loss": 2.3959, "step": 297770 }, { "epoch": 0.52, "learning_rate": 2.403537285895151e-05, "loss": 2.443, "step": 297780 }, { "epoch": 0.52, "learning_rate": 2.403450091902468e-05, "loss": 2.3733, "step": 297790 }, { "epoch": 0.52, "learning_rate": 2.403362897909786e-05, "loss": 2.3583, "step": 297800 }, { "epoch": 0.52, "learning_rate": 2.403275703917103e-05, "loss": 2.3565, "step": 297810 }, { "epoch": 0.52, "learning_rate": 2.4031885099244203e-05, "loss": 2.4303, "step": 297820 }, { "epoch": 0.52, "learning_rate": 2.403101315931738e-05, "loss": 2.3575, "step": 297830 }, { "epoch": 0.52, "learning_rate": 2.403014121939055e-05, "loss": 2.2844, "step": 297840 }, { "epoch": 0.52, "learning_rate": 2.4029269279463724e-05, "loss": 2.413, "step": 297850 }, { "epoch": 0.52, "learning_rate": 2.4028397339536894e-05, "loss": 2.2738, "step": 297860 }, { "epoch": 0.52, "learning_rate": 2.402752539961007e-05, "loss": 2.2955, "step": 297870 }, { "epoch": 0.52, "learning_rate": 2.4026653459683242e-05, "loss": 2.2689, "step": 297880 }, { "epoch": 0.52, "learning_rate": 2.4025781519756416e-05, "loss": 2.2689, "step": 297890 }, { "epoch": 0.52, "learning_rate": 2.402490957982959e-05, "loss": 2.3153, "step": 297900 }, { "epoch": 0.52, "learning_rate": 2.4024037639902763e-05, "loss": 2.386, "step": 297910 }, { "epoch": 0.52, "learning_rate": 2.4023165699975937e-05, "loss": 2.3515, "step": 297920 }, { "epoch": 0.52, "learning_rate": 2.4022293760049107e-05, "loss": 2.3811, "step": 297930 }, { "epoch": 0.52, "learning_rate": 2.402142182012228e-05, "loss": 2.4554, "step": 297940 }, { "epoch": 0.52, "learning_rate": 2.4020549880195455e-05, "loss": 2.3814, "step": 297950 }, { "epoch": 0.52, "learning_rate": 2.401967794026863e-05, "loss": 2.3235, "step": 297960 }, { "epoch": 0.52, "learning_rate": 2.4018806000341802e-05, "loss": 2.3916, "step": 297970 }, { "epoch": 0.52, "learning_rate": 2.4017934060414976e-05, "loss": 2.3604, "step": 297980 }, { "epoch": 0.52, "learning_rate": 2.401706212048815e-05, "loss": 2.3884, "step": 297990 }, { "epoch": 0.52, "learning_rate": 2.401619018056132e-05, "loss": 2.3166, "step": 298000 }, { "epoch": 0.52, "learning_rate": 2.4015318240634494e-05, "loss": 2.3882, "step": 298010 }, { "epoch": 0.52, "learning_rate": 2.4014446300707668e-05, "loss": 2.1687, "step": 298020 }, { "epoch": 0.52, "learning_rate": 2.401357436078084e-05, "loss": 2.3266, "step": 298030 }, { "epoch": 0.52, "learning_rate": 2.4012702420854012e-05, "loss": 2.4029, "step": 298040 }, { "epoch": 0.52, "learning_rate": 2.4011830480927186e-05, "loss": 2.4651, "step": 298050 }, { "epoch": 0.52, "learning_rate": 2.401095854100036e-05, "loss": 2.3789, "step": 298060 }, { "epoch": 0.52, "learning_rate": 2.4010086601073533e-05, "loss": 2.1877, "step": 298070 }, { "epoch": 0.52, "learning_rate": 2.4009214661146707e-05, "loss": 2.2465, "step": 298080 }, { "epoch": 0.52, "learning_rate": 2.400834272121988e-05, "loss": 2.389, "step": 298090 }, { "epoch": 0.52, "learning_rate": 2.4007470781293055e-05, "loss": 2.2933, "step": 298100 }, { "epoch": 0.52, "learning_rate": 2.4006598841366225e-05, "loss": 2.3182, "step": 298110 }, { "epoch": 0.52, "learning_rate": 2.40057269014394e-05, "loss": 2.3552, "step": 298120 }, { "epoch": 0.52, "learning_rate": 2.4004854961512573e-05, "loss": 2.3301, "step": 298130 }, { "epoch": 0.52, "learning_rate": 2.4003983021585746e-05, "loss": 2.2901, "step": 298140 }, { "epoch": 0.52, "learning_rate": 2.400311108165892e-05, "loss": 2.3478, "step": 298150 }, { "epoch": 0.52, "learning_rate": 2.400223914173209e-05, "loss": 2.2687, "step": 298160 }, { "epoch": 0.52, "learning_rate": 2.4001367201805268e-05, "loss": 2.3241, "step": 298170 }, { "epoch": 0.52, "learning_rate": 2.4000495261878438e-05, "loss": 2.4653, "step": 298180 }, { "epoch": 0.52, "learning_rate": 2.3999623321951612e-05, "loss": 2.462, "step": 298190 }, { "epoch": 0.52, "learning_rate": 2.3998751382024786e-05, "loss": 2.3549, "step": 298200 }, { "epoch": 0.52, "learning_rate": 2.399787944209796e-05, "loss": 2.3325, "step": 298210 }, { "epoch": 0.52, "learning_rate": 2.3997007502171133e-05, "loss": 2.3489, "step": 298220 }, { "epoch": 0.52, "learning_rate": 2.3996135562244304e-05, "loss": 2.4747, "step": 298230 }, { "epoch": 0.52, "learning_rate": 2.399526362231748e-05, "loss": 2.3861, "step": 298240 }, { "epoch": 0.52, "learning_rate": 2.399439168239065e-05, "loss": 2.3714, "step": 298250 }, { "epoch": 0.52, "learning_rate": 2.3993519742463825e-05, "loss": 2.3373, "step": 298260 }, { "epoch": 0.52, "learning_rate": 2.3992647802536995e-05, "loss": 2.2479, "step": 298270 }, { "epoch": 0.52, "learning_rate": 2.3991775862610172e-05, "loss": 2.359, "step": 298280 }, { "epoch": 0.52, "learning_rate": 2.3990903922683343e-05, "loss": 2.3528, "step": 298290 }, { "epoch": 0.52, "learning_rate": 2.3990031982756517e-05, "loss": 2.2611, "step": 298300 }, { "epoch": 0.52, "learning_rate": 2.398916004282969e-05, "loss": 2.3599, "step": 298310 }, { "epoch": 0.52, "learning_rate": 2.3988288102902864e-05, "loss": 2.4444, "step": 298320 }, { "epoch": 0.52, "learning_rate": 2.3987416162976038e-05, "loss": 2.3371, "step": 298330 }, { "epoch": 0.52, "learning_rate": 2.3986544223049208e-05, "loss": 2.2852, "step": 298340 }, { "epoch": 0.52, "learning_rate": 2.3985672283122382e-05, "loss": 2.3866, "step": 298350 }, { "epoch": 0.52, "learning_rate": 2.3984800343195556e-05, "loss": 2.332, "step": 298360 }, { "epoch": 0.52, "learning_rate": 2.398392840326873e-05, "loss": 2.2616, "step": 298370 }, { "epoch": 0.52, "learning_rate": 2.3983056463341903e-05, "loss": 2.3193, "step": 298380 }, { "epoch": 0.52, "learning_rate": 2.3982184523415077e-05, "loss": 2.3397, "step": 298390 }, { "epoch": 0.52, "learning_rate": 2.398131258348825e-05, "loss": 2.4031, "step": 298400 }, { "epoch": 0.52, "learning_rate": 2.398044064356142e-05, "loss": 2.4654, "step": 298410 }, { "epoch": 0.52, "learning_rate": 2.3979568703634595e-05, "loss": 2.4139, "step": 298420 }, { "epoch": 0.52, "learning_rate": 2.397869676370777e-05, "loss": 2.4389, "step": 298430 }, { "epoch": 0.52, "learning_rate": 2.3977824823780943e-05, "loss": 2.3445, "step": 298440 }, { "epoch": 0.52, "learning_rate": 2.3976952883854116e-05, "loss": 2.4012, "step": 298450 }, { "epoch": 0.52, "learning_rate": 2.3976080943927287e-05, "loss": 2.392, "step": 298460 }, { "epoch": 0.52, "learning_rate": 2.3975209004000464e-05, "loss": 2.2844, "step": 298470 }, { "epoch": 0.52, "learning_rate": 2.3974337064073634e-05, "loss": 2.3327, "step": 298480 }, { "epoch": 0.52, "learning_rate": 2.3973465124146808e-05, "loss": 2.3495, "step": 298490 }, { "epoch": 0.52, "learning_rate": 2.3972593184219982e-05, "loss": 2.3056, "step": 298500 }, { "epoch": 0.52, "learning_rate": 2.3971721244293156e-05, "loss": 2.3538, "step": 298510 }, { "epoch": 0.52, "learning_rate": 2.3970849304366326e-05, "loss": 2.4222, "step": 298520 }, { "epoch": 0.52, "learning_rate": 2.39699773644395e-05, "loss": 2.3434, "step": 298530 }, { "epoch": 0.52, "learning_rate": 2.3969105424512673e-05, "loss": 2.1794, "step": 298540 }, { "epoch": 0.52, "learning_rate": 2.3968233484585847e-05, "loss": 2.3099, "step": 298550 }, { "epoch": 0.52, "learning_rate": 2.396736154465902e-05, "loss": 2.3143, "step": 298560 }, { "epoch": 0.52, "learning_rate": 2.396648960473219e-05, "loss": 2.4291, "step": 298570 }, { "epoch": 0.52, "learning_rate": 2.396561766480537e-05, "loss": 2.4371, "step": 298580 }, { "epoch": 0.52, "learning_rate": 2.396474572487854e-05, "loss": 2.3971, "step": 298590 }, { "epoch": 0.52, "learning_rate": 2.3963873784951713e-05, "loss": 2.4434, "step": 298600 }, { "epoch": 0.52, "learning_rate": 2.3963001845024886e-05, "loss": 2.3345, "step": 298610 }, { "epoch": 0.52, "learning_rate": 2.396212990509806e-05, "loss": 2.3578, "step": 298620 }, { "epoch": 0.52, "learning_rate": 2.3961257965171234e-05, "loss": 2.4378, "step": 298630 }, { "epoch": 0.52, "learning_rate": 2.3960386025244404e-05, "loss": 2.2763, "step": 298640 }, { "epoch": 0.52, "learning_rate": 2.395951408531758e-05, "loss": 2.3253, "step": 298650 }, { "epoch": 0.52, "learning_rate": 2.3958642145390752e-05, "loss": 2.3756, "step": 298660 }, { "epoch": 0.52, "learning_rate": 2.3957770205463926e-05, "loss": 2.3341, "step": 298670 }, { "epoch": 0.52, "learning_rate": 2.3956898265537096e-05, "loss": 2.3576, "step": 298680 }, { "epoch": 0.52, "learning_rate": 2.3956026325610273e-05, "loss": 2.3172, "step": 298690 }, { "epoch": 0.52, "learning_rate": 2.3955154385683447e-05, "loss": 2.4036, "step": 298700 }, { "epoch": 0.52, "learning_rate": 2.3954282445756617e-05, "loss": 2.4294, "step": 298710 }, { "epoch": 0.52, "learning_rate": 2.395341050582979e-05, "loss": 2.2991, "step": 298720 }, { "epoch": 0.52, "learning_rate": 2.3952538565902965e-05, "loss": 2.2898, "step": 298730 }, { "epoch": 0.52, "learning_rate": 2.395166662597614e-05, "loss": 2.3908, "step": 298740 }, { "epoch": 0.52, "learning_rate": 2.395079468604931e-05, "loss": 2.3507, "step": 298750 }, { "epoch": 0.52, "learning_rate": 2.3949922746122486e-05, "loss": 2.3435, "step": 298760 }, { "epoch": 0.52, "learning_rate": 2.3949050806195657e-05, "loss": 2.3595, "step": 298770 }, { "epoch": 0.52, "learning_rate": 2.394817886626883e-05, "loss": 2.3252, "step": 298780 }, { "epoch": 0.52, "learning_rate": 2.3947306926342004e-05, "loss": 2.3864, "step": 298790 }, { "epoch": 0.52, "learning_rate": 2.3946434986415178e-05, "loss": 2.4623, "step": 298800 }, { "epoch": 0.52, "learning_rate": 2.394556304648835e-05, "loss": 2.3665, "step": 298810 }, { "epoch": 0.52, "learning_rate": 2.3944691106561522e-05, "loss": 2.4105, "step": 298820 }, { "epoch": 0.52, "learning_rate": 2.3943819166634696e-05, "loss": 2.4514, "step": 298830 }, { "epoch": 0.52, "learning_rate": 2.394294722670787e-05, "loss": 2.3404, "step": 298840 }, { "epoch": 0.52, "learning_rate": 2.3942075286781043e-05, "loss": 2.3495, "step": 298850 }, { "epoch": 0.52, "learning_rate": 2.3941203346854217e-05, "loss": 2.2663, "step": 298860 }, { "epoch": 0.52, "learning_rate": 2.3940331406927388e-05, "loss": 2.2043, "step": 298870 }, { "epoch": 0.52, "learning_rate": 2.3939459467000565e-05, "loss": 2.3801, "step": 298880 }, { "epoch": 0.52, "learning_rate": 2.3938587527073735e-05, "loss": 2.3454, "step": 298890 }, { "epoch": 0.52, "learning_rate": 2.393771558714691e-05, "loss": 2.3439, "step": 298900 }, { "epoch": 0.52, "learning_rate": 2.3936843647220083e-05, "loss": 2.4104, "step": 298910 }, { "epoch": 0.52, "learning_rate": 2.3935971707293256e-05, "loss": 2.4333, "step": 298920 }, { "epoch": 0.52, "learning_rate": 2.393509976736643e-05, "loss": 2.4035, "step": 298930 }, { "epoch": 0.52, "learning_rate": 2.39342278274396e-05, "loss": 2.4567, "step": 298940 }, { "epoch": 0.52, "learning_rate": 2.3933355887512778e-05, "loss": 2.3274, "step": 298950 }, { "epoch": 0.52, "learning_rate": 2.3932483947585948e-05, "loss": 2.2209, "step": 298960 }, { "epoch": 0.52, "learning_rate": 2.3931612007659122e-05, "loss": 2.3782, "step": 298970 }, { "epoch": 0.52, "learning_rate": 2.3930740067732292e-05, "loss": 2.4172, "step": 298980 }, { "epoch": 0.52, "learning_rate": 2.392986812780547e-05, "loss": 2.3175, "step": 298990 }, { "epoch": 0.52, "learning_rate": 2.392899618787864e-05, "loss": 2.3399, "step": 299000 }, { "epoch": 0.52, "learning_rate": 2.3928124247951814e-05, "loss": 2.3811, "step": 299010 }, { "epoch": 0.52, "learning_rate": 2.3927252308024987e-05, "loss": 2.3431, "step": 299020 }, { "epoch": 0.52, "learning_rate": 2.392638036809816e-05, "loss": 2.305, "step": 299030 }, { "epoch": 0.52, "learning_rate": 2.3925508428171335e-05, "loss": 2.3377, "step": 299040 }, { "epoch": 0.52, "learning_rate": 2.3924636488244505e-05, "loss": 2.2855, "step": 299050 }, { "epoch": 0.52, "learning_rate": 2.3923764548317682e-05, "loss": 2.3402, "step": 299060 }, { "epoch": 0.52, "learning_rate": 2.3922892608390853e-05, "loss": 2.2562, "step": 299070 }, { "epoch": 0.52, "learning_rate": 2.3922020668464027e-05, "loss": 2.26, "step": 299080 }, { "epoch": 0.52, "learning_rate": 2.39211487285372e-05, "loss": 2.3393, "step": 299090 }, { "epoch": 0.52, "learning_rate": 2.3920276788610374e-05, "loss": 2.2985, "step": 299100 }, { "epoch": 0.52, "learning_rate": 2.3919404848683548e-05, "loss": 2.3349, "step": 299110 }, { "epoch": 0.52, "learning_rate": 2.3918532908756718e-05, "loss": 2.3364, "step": 299120 }, { "epoch": 0.52, "learning_rate": 2.3917660968829892e-05, "loss": 2.4134, "step": 299130 }, { "epoch": 0.52, "learning_rate": 2.3916789028903066e-05, "loss": 2.4021, "step": 299140 }, { "epoch": 0.52, "learning_rate": 2.391591708897624e-05, "loss": 2.2097, "step": 299150 }, { "epoch": 0.52, "learning_rate": 2.391504514904941e-05, "loss": 2.439, "step": 299160 }, { "epoch": 0.52, "learning_rate": 2.3914173209122587e-05, "loss": 2.3635, "step": 299170 }, { "epoch": 0.52, "learning_rate": 2.391330126919576e-05, "loss": 2.4014, "step": 299180 }, { "epoch": 0.52, "learning_rate": 2.391242932926893e-05, "loss": 2.3333, "step": 299190 }, { "epoch": 0.52, "learning_rate": 2.3911557389342105e-05, "loss": 2.3149, "step": 299200 }, { "epoch": 0.52, "learning_rate": 2.391068544941528e-05, "loss": 2.3255, "step": 299210 }, { "epoch": 0.52, "learning_rate": 2.3909813509488453e-05, "loss": 2.2944, "step": 299220 }, { "epoch": 0.52, "learning_rate": 2.3908941569561623e-05, "loss": 2.347, "step": 299230 }, { "epoch": 0.52, "learning_rate": 2.3908069629634797e-05, "loss": 2.379, "step": 299240 }, { "epoch": 0.52, "learning_rate": 2.390719768970797e-05, "loss": 2.3578, "step": 299250 }, { "epoch": 0.52, "learning_rate": 2.3906325749781144e-05, "loss": 2.2682, "step": 299260 }, { "epoch": 0.52, "learning_rate": 2.3905453809854318e-05, "loss": 2.4337, "step": 299270 }, { "epoch": 0.52, "learning_rate": 2.390458186992749e-05, "loss": 2.3057, "step": 299280 }, { "epoch": 0.52, "learning_rate": 2.3903709930000666e-05, "loss": 2.3779, "step": 299290 }, { "epoch": 0.52, "learning_rate": 2.3902837990073836e-05, "loss": 2.3126, "step": 299300 }, { "epoch": 0.52, "learning_rate": 2.390196605014701e-05, "loss": 2.2984, "step": 299310 }, { "epoch": 0.52, "learning_rate": 2.3901094110220183e-05, "loss": 2.4538, "step": 299320 }, { "epoch": 0.52, "learning_rate": 2.3900222170293357e-05, "loss": 2.2232, "step": 299330 }, { "epoch": 0.52, "learning_rate": 2.389935023036653e-05, "loss": 2.218, "step": 299340 }, { "epoch": 0.52, "learning_rate": 2.38984782904397e-05, "loss": 2.3992, "step": 299350 }, { "epoch": 0.52, "learning_rate": 2.389760635051288e-05, "loss": 2.2998, "step": 299360 }, { "epoch": 0.52, "learning_rate": 2.389673441058605e-05, "loss": 2.3024, "step": 299370 }, { "epoch": 0.52, "learning_rate": 2.3895862470659223e-05, "loss": 2.3207, "step": 299380 }, { "epoch": 0.52, "learning_rate": 2.3894990530732393e-05, "loss": 2.3587, "step": 299390 }, { "epoch": 0.52, "learning_rate": 2.389411859080557e-05, "loss": 2.4273, "step": 299400 }, { "epoch": 0.52, "learning_rate": 2.389324665087874e-05, "loss": 2.3814, "step": 299410 }, { "epoch": 0.52, "learning_rate": 2.3892374710951914e-05, "loss": 2.3292, "step": 299420 }, { "epoch": 0.52, "learning_rate": 2.389150277102509e-05, "loss": 2.3233, "step": 299430 }, { "epoch": 0.52, "learning_rate": 2.3890630831098262e-05, "loss": 2.3734, "step": 299440 }, { "epoch": 0.52, "learning_rate": 2.3889758891171436e-05, "loss": 2.3548, "step": 299450 }, { "epoch": 0.52, "learning_rate": 2.3888886951244606e-05, "loss": 2.4766, "step": 299460 }, { "epoch": 0.52, "learning_rate": 2.3888015011317783e-05, "loss": 2.2948, "step": 299470 }, { "epoch": 0.52, "learning_rate": 2.3887143071390954e-05, "loss": 2.3389, "step": 299480 }, { "epoch": 0.52, "learning_rate": 2.3886271131464127e-05, "loss": 2.289, "step": 299490 }, { "epoch": 0.52, "learning_rate": 2.38853991915373e-05, "loss": 2.3675, "step": 299500 }, { "epoch": 0.52, "learning_rate": 2.3884527251610475e-05, "loss": 2.3451, "step": 299510 }, { "epoch": 0.52, "learning_rate": 2.388365531168365e-05, "loss": 2.3353, "step": 299520 }, { "epoch": 0.52, "learning_rate": 2.388278337175682e-05, "loss": 2.3957, "step": 299530 }, { "epoch": 0.52, "learning_rate": 2.3881911431829993e-05, "loss": 2.28, "step": 299540 }, { "epoch": 0.52, "learning_rate": 2.3881039491903167e-05, "loss": 2.2324, "step": 299550 }, { "epoch": 0.52, "learning_rate": 2.388016755197634e-05, "loss": 2.3397, "step": 299560 }, { "epoch": 0.52, "learning_rate": 2.3879295612049514e-05, "loss": 2.3797, "step": 299570 }, { "epoch": 0.52, "learning_rate": 2.3878423672122688e-05, "loss": 2.318, "step": 299580 }, { "epoch": 0.52, "learning_rate": 2.387755173219586e-05, "loss": 2.4466, "step": 299590 }, { "epoch": 0.52, "learning_rate": 2.3876679792269032e-05, "loss": 2.4188, "step": 299600 }, { "epoch": 0.52, "learning_rate": 2.3875807852342206e-05, "loss": 2.4025, "step": 299610 }, { "epoch": 0.52, "learning_rate": 2.387493591241538e-05, "loss": 2.4276, "step": 299620 }, { "epoch": 0.52, "learning_rate": 2.3874063972488553e-05, "loss": 2.1958, "step": 299630 }, { "epoch": 0.52, "learning_rate": 2.3873192032561724e-05, "loss": 2.1722, "step": 299640 }, { "epoch": 0.52, "learning_rate": 2.3872320092634898e-05, "loss": 2.5097, "step": 299650 }, { "epoch": 0.52, "learning_rate": 2.3871448152708075e-05, "loss": 2.3201, "step": 299660 }, { "epoch": 0.52, "learning_rate": 2.3870576212781245e-05, "loss": 2.3811, "step": 299670 }, { "epoch": 0.52, "learning_rate": 2.386970427285442e-05, "loss": 2.3658, "step": 299680 }, { "epoch": 0.52, "learning_rate": 2.3868832332927593e-05, "loss": 2.2777, "step": 299690 }, { "epoch": 0.52, "learning_rate": 2.3867960393000766e-05, "loss": 2.3977, "step": 299700 }, { "epoch": 0.52, "learning_rate": 2.3867088453073937e-05, "loss": 2.4308, "step": 299710 }, { "epoch": 0.52, "learning_rate": 2.386621651314711e-05, "loss": 2.2278, "step": 299720 }, { "epoch": 0.52, "learning_rate": 2.3865344573220284e-05, "loss": 2.3338, "step": 299730 }, { "epoch": 0.52, "learning_rate": 2.3864472633293458e-05, "loss": 2.3737, "step": 299740 }, { "epoch": 0.52, "learning_rate": 2.3863600693366632e-05, "loss": 2.2853, "step": 299750 }, { "epoch": 0.52, "learning_rate": 2.3862728753439802e-05, "loss": 2.3684, "step": 299760 }, { "epoch": 0.52, "learning_rate": 2.386185681351298e-05, "loss": 2.4128, "step": 299770 }, { "epoch": 0.52, "learning_rate": 2.386098487358615e-05, "loss": 2.3138, "step": 299780 }, { "epoch": 0.52, "learning_rate": 2.3860112933659324e-05, "loss": 2.3332, "step": 299790 }, { "epoch": 0.52, "learning_rate": 2.3859240993732497e-05, "loss": 2.3616, "step": 299800 }, { "epoch": 0.52, "learning_rate": 2.385836905380567e-05, "loss": 2.1653, "step": 299810 }, { "epoch": 0.52, "learning_rate": 2.3857497113878845e-05, "loss": 2.371, "step": 299820 }, { "epoch": 0.52, "learning_rate": 2.3856625173952015e-05, "loss": 2.4103, "step": 299830 }, { "epoch": 0.52, "learning_rate": 2.3855753234025192e-05, "loss": 2.2514, "step": 299840 }, { "epoch": 0.52, "learning_rate": 2.3854881294098363e-05, "loss": 2.4345, "step": 299850 }, { "epoch": 0.52, "learning_rate": 2.3854009354171537e-05, "loss": 2.3466, "step": 299860 }, { "epoch": 0.52, "learning_rate": 2.3853137414244707e-05, "loss": 2.3819, "step": 299870 }, { "epoch": 0.52, "learning_rate": 2.3852265474317884e-05, "loss": 2.391, "step": 299880 }, { "epoch": 0.52, "learning_rate": 2.3851393534391054e-05, "loss": 2.4149, "step": 299890 }, { "epoch": 0.52, "learning_rate": 2.3850521594464228e-05, "loss": 2.2777, "step": 299900 }, { "epoch": 0.52, "learning_rate": 2.3849649654537402e-05, "loss": 2.3819, "step": 299910 }, { "epoch": 0.52, "learning_rate": 2.3848777714610576e-05, "loss": 2.3471, "step": 299920 }, { "epoch": 0.52, "learning_rate": 2.384790577468375e-05, "loss": 2.3025, "step": 299930 }, { "epoch": 0.52, "learning_rate": 2.384703383475692e-05, "loss": 2.3968, "step": 299940 }, { "epoch": 0.52, "learning_rate": 2.3846161894830094e-05, "loss": 2.3988, "step": 299950 }, { "epoch": 0.52, "learning_rate": 2.3845289954903267e-05, "loss": 2.3272, "step": 299960 }, { "epoch": 0.52, "learning_rate": 2.384441801497644e-05, "loss": 2.3496, "step": 299970 }, { "epoch": 0.52, "learning_rate": 2.3843546075049615e-05, "loss": 2.4131, "step": 299980 }, { "epoch": 0.52, "learning_rate": 2.384267413512279e-05, "loss": 2.4005, "step": 299990 }, { "epoch": 0.52, "learning_rate": 2.3841802195195963e-05, "loss": 2.3317, "step": 300000 }, { "epoch": 0.52, "learning_rate": 2.3840930255269133e-05, "loss": 2.4029, "step": 300010 }, { "epoch": 0.52, "learning_rate": 2.3840058315342307e-05, "loss": 2.3246, "step": 300020 }, { "epoch": 0.52, "learning_rate": 2.383918637541548e-05, "loss": 2.3127, "step": 300030 }, { "epoch": 0.52, "learning_rate": 2.3838314435488654e-05, "loss": 2.4224, "step": 300040 }, { "epoch": 0.52, "learning_rate": 2.3837442495561828e-05, "loss": 2.3674, "step": 300050 }, { "epoch": 0.52, "learning_rate": 2.3836570555635e-05, "loss": 2.3342, "step": 300060 }, { "epoch": 0.52, "learning_rate": 2.3835698615708176e-05, "loss": 2.4147, "step": 300070 }, { "epoch": 0.52, "learning_rate": 2.3834826675781346e-05, "loss": 2.329, "step": 300080 }, { "epoch": 0.52, "learning_rate": 2.383395473585452e-05, "loss": 2.3219, "step": 300090 }, { "epoch": 0.52, "learning_rate": 2.3833082795927693e-05, "loss": 2.3097, "step": 300100 }, { "epoch": 0.52, "learning_rate": 2.3832210856000867e-05, "loss": 2.4489, "step": 300110 }, { "epoch": 0.52, "learning_rate": 2.3831338916074038e-05, "loss": 2.3109, "step": 300120 }, { "epoch": 0.52, "learning_rate": 2.383046697614721e-05, "loss": 2.3898, "step": 300130 }, { "epoch": 0.52, "learning_rate": 2.3829595036220385e-05, "loss": 2.4545, "step": 300140 }, { "epoch": 0.52, "learning_rate": 2.382872309629356e-05, "loss": 2.3681, "step": 300150 }, { "epoch": 0.52, "learning_rate": 2.3827851156366733e-05, "loss": 2.374, "step": 300160 }, { "epoch": 0.52, "learning_rate": 2.3826979216439903e-05, "loss": 2.3299, "step": 300170 }, { "epoch": 0.52, "learning_rate": 2.382610727651308e-05, "loss": 2.3384, "step": 300180 }, { "epoch": 0.52, "learning_rate": 2.382523533658625e-05, "loss": 2.3792, "step": 300190 }, { "epoch": 0.52, "learning_rate": 2.3824363396659424e-05, "loss": 2.2949, "step": 300200 }, { "epoch": 0.52, "learning_rate": 2.3823491456732598e-05, "loss": 2.4736, "step": 300210 }, { "epoch": 0.52, "learning_rate": 2.3822619516805772e-05, "loss": 2.418, "step": 300220 }, { "epoch": 0.52, "learning_rate": 2.3821747576878946e-05, "loss": 2.4105, "step": 300230 }, { "epoch": 0.52, "learning_rate": 2.3820875636952116e-05, "loss": 2.4319, "step": 300240 }, { "epoch": 0.52, "learning_rate": 2.3820003697025293e-05, "loss": 2.3482, "step": 300250 }, { "epoch": 0.52, "learning_rate": 2.3819131757098464e-05, "loss": 2.375, "step": 300260 }, { "epoch": 0.52, "learning_rate": 2.3818259817171637e-05, "loss": 2.3268, "step": 300270 }, { "epoch": 0.52, "learning_rate": 2.381738787724481e-05, "loss": 2.3331, "step": 300280 }, { "epoch": 0.52, "learning_rate": 2.3816515937317985e-05, "loss": 2.3496, "step": 300290 }, { "epoch": 0.52, "learning_rate": 2.381564399739116e-05, "loss": 2.3152, "step": 300300 }, { "epoch": 0.52, "learning_rate": 2.381477205746433e-05, "loss": 2.2133, "step": 300310 }, { "epoch": 0.52, "learning_rate": 2.3813900117537503e-05, "loss": 2.4334, "step": 300320 }, { "epoch": 0.52, "learning_rate": 2.3813028177610677e-05, "loss": 2.3448, "step": 300330 }, { "epoch": 0.52, "learning_rate": 2.381215623768385e-05, "loss": 2.2927, "step": 300340 }, { "epoch": 0.52, "learning_rate": 2.381128429775702e-05, "loss": 2.3051, "step": 300350 }, { "epoch": 0.52, "learning_rate": 2.3810412357830198e-05, "loss": 2.2859, "step": 300360 }, { "epoch": 0.52, "learning_rate": 2.3809540417903368e-05, "loss": 2.4602, "step": 300370 }, { "epoch": 0.52, "learning_rate": 2.3808668477976542e-05, "loss": 2.295, "step": 300380 }, { "epoch": 0.52, "learning_rate": 2.3807796538049716e-05, "loss": 2.2436, "step": 300390 }, { "epoch": 0.52, "learning_rate": 2.380692459812289e-05, "loss": 2.3343, "step": 300400 }, { "epoch": 0.52, "learning_rate": 2.3806052658196063e-05, "loss": 2.3187, "step": 300410 }, { "epoch": 0.52, "learning_rate": 2.3805180718269234e-05, "loss": 2.4621, "step": 300420 }, { "epoch": 0.52, "learning_rate": 2.3804308778342408e-05, "loss": 2.3796, "step": 300430 }, { "epoch": 0.52, "learning_rate": 2.380343683841558e-05, "loss": 2.3807, "step": 300440 }, { "epoch": 0.52, "learning_rate": 2.3802564898488755e-05, "loss": 2.389, "step": 300450 }, { "epoch": 0.52, "learning_rate": 2.380169295856193e-05, "loss": 2.5112, "step": 300460 }, { "epoch": 0.52, "learning_rate": 2.38008210186351e-05, "loss": 2.3963, "step": 300470 }, { "epoch": 0.52, "learning_rate": 2.3799949078708276e-05, "loss": 2.3261, "step": 300480 }, { "epoch": 0.52, "learning_rate": 2.3799077138781447e-05, "loss": 2.348, "step": 300490 }, { "epoch": 0.52, "learning_rate": 2.379820519885462e-05, "loss": 2.3094, "step": 300500 }, { "epoch": 0.52, "learning_rate": 2.3797333258927794e-05, "loss": 2.3275, "step": 300510 }, { "epoch": 0.52, "learning_rate": 2.3796461319000968e-05, "loss": 2.364, "step": 300520 }, { "epoch": 0.52, "learning_rate": 2.3795589379074142e-05, "loss": 2.4253, "step": 300530 }, { "epoch": 0.52, "learning_rate": 2.3794717439147312e-05, "loss": 2.387, "step": 300540 }, { "epoch": 0.52, "learning_rate": 2.379384549922049e-05, "loss": 2.227, "step": 300550 }, { "epoch": 0.52, "learning_rate": 2.379297355929366e-05, "loss": 2.4034, "step": 300560 }, { "epoch": 0.52, "learning_rate": 2.3792101619366834e-05, "loss": 2.3373, "step": 300570 }, { "epoch": 0.52, "learning_rate": 2.3791229679440004e-05, "loss": 2.2771, "step": 300580 }, { "epoch": 0.52, "learning_rate": 2.379035773951318e-05, "loss": 2.4098, "step": 300590 }, { "epoch": 0.52, "learning_rate": 2.378948579958635e-05, "loss": 2.4892, "step": 300600 }, { "epoch": 0.52, "learning_rate": 2.3788613859659525e-05, "loss": 2.4271, "step": 300610 }, { "epoch": 0.52, "learning_rate": 2.37877419197327e-05, "loss": 2.3235, "step": 300620 }, { "epoch": 0.52, "learning_rate": 2.3786869979805873e-05, "loss": 2.3709, "step": 300630 }, { "epoch": 0.52, "learning_rate": 2.3785998039879047e-05, "loss": 2.3633, "step": 300640 }, { "epoch": 0.52, "learning_rate": 2.3785126099952217e-05, "loss": 2.4392, "step": 300650 }, { "epoch": 0.52, "learning_rate": 2.3784254160025394e-05, "loss": 2.3696, "step": 300660 }, { "epoch": 0.52, "learning_rate": 2.3783382220098564e-05, "loss": 2.4024, "step": 300670 }, { "epoch": 0.52, "learning_rate": 2.3782510280171738e-05, "loss": 2.3702, "step": 300680 }, { "epoch": 0.52, "learning_rate": 2.3781638340244912e-05, "loss": 2.312, "step": 300690 }, { "epoch": 0.52, "learning_rate": 2.3780766400318086e-05, "loss": 2.3198, "step": 300700 }, { "epoch": 0.52, "learning_rate": 2.377989446039126e-05, "loss": 2.3439, "step": 300710 }, { "epoch": 0.52, "learning_rate": 2.377902252046443e-05, "loss": 2.3563, "step": 300720 }, { "epoch": 0.52, "learning_rate": 2.3778150580537604e-05, "loss": 2.4317, "step": 300730 }, { "epoch": 0.52, "learning_rate": 2.3777278640610777e-05, "loss": 2.3422, "step": 300740 }, { "epoch": 0.52, "learning_rate": 2.377640670068395e-05, "loss": 2.3629, "step": 300750 }, { "epoch": 0.52, "learning_rate": 2.377553476075712e-05, "loss": 2.3273, "step": 300760 }, { "epoch": 0.52, "learning_rate": 2.37746628208303e-05, "loss": 2.3552, "step": 300770 }, { "epoch": 0.52, "learning_rate": 2.3773790880903473e-05, "loss": 2.3987, "step": 300780 }, { "epoch": 0.52, "learning_rate": 2.3772918940976643e-05, "loss": 2.4073, "step": 300790 }, { "epoch": 0.52, "learning_rate": 2.3772047001049817e-05, "loss": 2.408, "step": 300800 }, { "epoch": 0.52, "learning_rate": 2.377117506112299e-05, "loss": 2.3465, "step": 300810 }, { "epoch": 0.52, "learning_rate": 2.3770303121196164e-05, "loss": 2.3802, "step": 300820 }, { "epoch": 0.52, "learning_rate": 2.3769431181269335e-05, "loss": 2.4369, "step": 300830 }, { "epoch": 0.52, "learning_rate": 2.376855924134251e-05, "loss": 2.2449, "step": 300840 }, { "epoch": 0.52, "learning_rate": 2.3767687301415682e-05, "loss": 2.2549, "step": 300850 }, { "epoch": 0.52, "learning_rate": 2.3766815361488856e-05, "loss": 2.4913, "step": 300860 }, { "epoch": 0.52, "learning_rate": 2.376594342156203e-05, "loss": 2.2707, "step": 300870 }, { "epoch": 0.52, "learning_rate": 2.37650714816352e-05, "loss": 2.3875, "step": 300880 }, { "epoch": 0.52, "learning_rate": 2.3764199541708377e-05, "loss": 2.392, "step": 300890 }, { "epoch": 0.52, "learning_rate": 2.3763327601781548e-05, "loss": 2.3677, "step": 300900 }, { "epoch": 0.52, "learning_rate": 2.376245566185472e-05, "loss": 2.3618, "step": 300910 }, { "epoch": 0.52, "learning_rate": 2.3761583721927895e-05, "loss": 2.2893, "step": 300920 }, { "epoch": 0.52, "learning_rate": 2.376071178200107e-05, "loss": 2.3625, "step": 300930 }, { "epoch": 0.52, "learning_rate": 2.3759839842074243e-05, "loss": 2.422, "step": 300940 }, { "epoch": 0.52, "learning_rate": 2.3758967902147413e-05, "loss": 2.4033, "step": 300950 }, { "epoch": 0.52, "learning_rate": 2.375809596222059e-05, "loss": 2.399, "step": 300960 }, { "epoch": 0.52, "learning_rate": 2.375722402229376e-05, "loss": 2.4757, "step": 300970 }, { "epoch": 0.52, "learning_rate": 2.3756352082366934e-05, "loss": 2.4271, "step": 300980 }, { "epoch": 0.52, "learning_rate": 2.3755480142440105e-05, "loss": 2.3474, "step": 300990 }, { "epoch": 0.52, "learning_rate": 2.3754608202513282e-05, "loss": 2.3037, "step": 301000 }, { "epoch": 0.52, "learning_rate": 2.3753736262586456e-05, "loss": 2.3524, "step": 301010 }, { "epoch": 0.52, "learning_rate": 2.3752864322659626e-05, "loss": 2.4028, "step": 301020 }, { "epoch": 0.52, "learning_rate": 2.3751992382732803e-05, "loss": 2.3644, "step": 301030 }, { "epoch": 0.52, "learning_rate": 2.3751120442805974e-05, "loss": 2.4088, "step": 301040 }, { "epoch": 0.52, "learning_rate": 2.3750248502879147e-05, "loss": 2.2296, "step": 301050 }, { "epoch": 0.53, "learning_rate": 2.3749376562952318e-05, "loss": 2.4, "step": 301060 }, { "epoch": 0.53, "learning_rate": 2.3748504623025495e-05, "loss": 2.3954, "step": 301070 }, { "epoch": 0.53, "learning_rate": 2.3747632683098665e-05, "loss": 2.3123, "step": 301080 }, { "epoch": 0.53, "learning_rate": 2.374676074317184e-05, "loss": 2.3621, "step": 301090 }, { "epoch": 0.53, "learning_rate": 2.3745888803245013e-05, "loss": 2.4489, "step": 301100 }, { "epoch": 0.53, "learning_rate": 2.3745016863318187e-05, "loss": 2.3608, "step": 301110 }, { "epoch": 0.53, "learning_rate": 2.374414492339136e-05, "loss": 2.3221, "step": 301120 }, { "epoch": 0.53, "learning_rate": 2.374327298346453e-05, "loss": 2.3651, "step": 301130 }, { "epoch": 0.53, "learning_rate": 2.3742401043537705e-05, "loss": 2.3502, "step": 301140 }, { "epoch": 0.53, "learning_rate": 2.3741529103610878e-05, "loss": 2.4234, "step": 301150 }, { "epoch": 0.53, "learning_rate": 2.3740657163684052e-05, "loss": 2.3072, "step": 301160 }, { "epoch": 0.53, "learning_rate": 2.3739785223757226e-05, "loss": 2.3473, "step": 301170 }, { "epoch": 0.53, "learning_rate": 2.37389132838304e-05, "loss": 2.4013, "step": 301180 }, { "epoch": 0.53, "learning_rate": 2.3738041343903573e-05, "loss": 2.3067, "step": 301190 }, { "epoch": 0.53, "learning_rate": 2.3737169403976744e-05, "loss": 2.3212, "step": 301200 }, { "epoch": 0.53, "learning_rate": 2.3736297464049918e-05, "loss": 2.3003, "step": 301210 }, { "epoch": 0.53, "learning_rate": 2.373542552412309e-05, "loss": 2.4968, "step": 301220 }, { "epoch": 0.53, "learning_rate": 2.3734553584196265e-05, "loss": 2.2603, "step": 301230 }, { "epoch": 0.53, "learning_rate": 2.3733681644269435e-05, "loss": 2.3421, "step": 301240 }, { "epoch": 0.53, "learning_rate": 2.373280970434261e-05, "loss": 2.3586, "step": 301250 }, { "epoch": 0.53, "learning_rate": 2.3731937764415786e-05, "loss": 2.3779, "step": 301260 }, { "epoch": 0.53, "learning_rate": 2.3731065824488957e-05, "loss": 2.4461, "step": 301270 }, { "epoch": 0.53, "learning_rate": 2.373019388456213e-05, "loss": 2.3797, "step": 301280 }, { "epoch": 0.53, "learning_rate": 2.3729321944635304e-05, "loss": 2.3383, "step": 301290 }, { "epoch": 0.53, "learning_rate": 2.3728450004708478e-05, "loss": 2.3466, "step": 301300 }, { "epoch": 0.53, "learning_rate": 2.372757806478165e-05, "loss": 2.3369, "step": 301310 }, { "epoch": 0.53, "learning_rate": 2.3726706124854822e-05, "loss": 2.3702, "step": 301320 }, { "epoch": 0.53, "learning_rate": 2.3725834184927996e-05, "loss": 2.3259, "step": 301330 }, { "epoch": 0.53, "learning_rate": 2.372496224500117e-05, "loss": 2.3491, "step": 301340 }, { "epoch": 0.53, "learning_rate": 2.3724090305074344e-05, "loss": 2.3301, "step": 301350 }, { "epoch": 0.53, "learning_rate": 2.3723218365147514e-05, "loss": 2.4424, "step": 301360 }, { "epoch": 0.53, "learning_rate": 2.372234642522069e-05, "loss": 2.4061, "step": 301370 }, { "epoch": 0.53, "learning_rate": 2.372147448529386e-05, "loss": 2.2959, "step": 301380 }, { "epoch": 0.53, "learning_rate": 2.3720602545367035e-05, "loss": 2.3743, "step": 301390 }, { "epoch": 0.53, "learning_rate": 2.371973060544021e-05, "loss": 2.4235, "step": 301400 }, { "epoch": 0.53, "learning_rate": 2.3718858665513383e-05, "loss": 2.3331, "step": 301410 }, { "epoch": 0.53, "learning_rate": 2.3717986725586557e-05, "loss": 2.3316, "step": 301420 }, { "epoch": 0.53, "learning_rate": 2.3717114785659727e-05, "loss": 2.2949, "step": 301430 }, { "epoch": 0.53, "learning_rate": 2.3716242845732904e-05, "loss": 2.3935, "step": 301440 }, { "epoch": 0.53, "learning_rate": 2.3715370905806074e-05, "loss": 2.3381, "step": 301450 }, { "epoch": 0.53, "learning_rate": 2.3714498965879248e-05, "loss": 2.3822, "step": 301460 }, { "epoch": 0.53, "learning_rate": 2.371362702595242e-05, "loss": 2.3171, "step": 301470 }, { "epoch": 0.53, "learning_rate": 2.3712755086025596e-05, "loss": 2.4164, "step": 301480 }, { "epoch": 0.53, "learning_rate": 2.3711883146098766e-05, "loss": 2.4096, "step": 301490 }, { "epoch": 0.53, "learning_rate": 2.371101120617194e-05, "loss": 2.2938, "step": 301500 }, { "epoch": 0.53, "learning_rate": 2.3710139266245114e-05, "loss": 2.2931, "step": 301510 }, { "epoch": 0.53, "learning_rate": 2.3709267326318287e-05, "loss": 2.4137, "step": 301520 }, { "epoch": 0.53, "learning_rate": 2.370839538639146e-05, "loss": 2.3809, "step": 301530 }, { "epoch": 0.53, "learning_rate": 2.370752344646463e-05, "loss": 2.3434, "step": 301540 }, { "epoch": 0.53, "learning_rate": 2.370665150653781e-05, "loss": 2.4694, "step": 301550 }, { "epoch": 0.53, "learning_rate": 2.370577956661098e-05, "loss": 2.2417, "step": 301560 }, { "epoch": 0.53, "learning_rate": 2.3704907626684153e-05, "loss": 2.4017, "step": 301570 }, { "epoch": 0.53, "learning_rate": 2.3704035686757327e-05, "loss": 2.3627, "step": 301580 }, { "epoch": 0.53, "learning_rate": 2.37031637468305e-05, "loss": 2.2268, "step": 301590 }, { "epoch": 0.53, "learning_rate": 2.3702291806903674e-05, "loss": 2.3505, "step": 301600 }, { "epoch": 0.53, "learning_rate": 2.3701419866976845e-05, "loss": 2.2819, "step": 301610 }, { "epoch": 0.53, "learning_rate": 2.370054792705002e-05, "loss": 2.3852, "step": 301620 }, { "epoch": 0.53, "learning_rate": 2.3699675987123192e-05, "loss": 2.3472, "step": 301630 }, { "epoch": 0.53, "learning_rate": 2.3698804047196366e-05, "loss": 2.3174, "step": 301640 }, { "epoch": 0.53, "learning_rate": 2.369793210726954e-05, "loss": 2.3611, "step": 301650 }, { "epoch": 0.53, "learning_rate": 2.369706016734271e-05, "loss": 2.3693, "step": 301660 }, { "epoch": 0.53, "learning_rate": 2.3696188227415887e-05, "loss": 2.3317, "step": 301670 }, { "epoch": 0.53, "learning_rate": 2.3695316287489058e-05, "loss": 2.4929, "step": 301680 }, { "epoch": 0.53, "learning_rate": 2.369444434756223e-05, "loss": 2.4628, "step": 301690 }, { "epoch": 0.53, "learning_rate": 2.3693572407635405e-05, "loss": 2.3623, "step": 301700 }, { "epoch": 0.53, "learning_rate": 2.369270046770858e-05, "loss": 2.2643, "step": 301710 }, { "epoch": 0.53, "learning_rate": 2.369182852778175e-05, "loss": 2.2373, "step": 301720 }, { "epoch": 0.53, "learning_rate": 2.3690956587854923e-05, "loss": 2.3141, "step": 301730 }, { "epoch": 0.53, "learning_rate": 2.36900846479281e-05, "loss": 2.339, "step": 301740 }, { "epoch": 0.53, "learning_rate": 2.368921270800127e-05, "loss": 2.3962, "step": 301750 }, { "epoch": 0.53, "learning_rate": 2.3688340768074444e-05, "loss": 2.2081, "step": 301760 }, { "epoch": 0.53, "learning_rate": 2.3687468828147615e-05, "loss": 2.3665, "step": 301770 }, { "epoch": 0.53, "learning_rate": 2.3686596888220792e-05, "loss": 2.2939, "step": 301780 }, { "epoch": 0.53, "learning_rate": 2.3685724948293962e-05, "loss": 2.4688, "step": 301790 }, { "epoch": 0.53, "learning_rate": 2.3684853008367136e-05, "loss": 2.3763, "step": 301800 }, { "epoch": 0.53, "learning_rate": 2.368398106844031e-05, "loss": 2.3867, "step": 301810 }, { "epoch": 0.53, "learning_rate": 2.3683109128513484e-05, "loss": 2.3927, "step": 301820 }, { "epoch": 0.53, "learning_rate": 2.3682237188586657e-05, "loss": 2.2659, "step": 301830 }, { "epoch": 0.53, "learning_rate": 2.3681365248659828e-05, "loss": 2.3199, "step": 301840 }, { "epoch": 0.53, "learning_rate": 2.3680493308733005e-05, "loss": 2.2609, "step": 301850 }, { "epoch": 0.53, "learning_rate": 2.3679621368806175e-05, "loss": 2.4466, "step": 301860 }, { "epoch": 0.53, "learning_rate": 2.367874942887935e-05, "loss": 2.2935, "step": 301870 }, { "epoch": 0.53, "learning_rate": 2.3677877488952523e-05, "loss": 2.3574, "step": 301880 }, { "epoch": 0.53, "learning_rate": 2.3677005549025697e-05, "loss": 2.4092, "step": 301890 }, { "epoch": 0.53, "learning_rate": 2.367613360909887e-05, "loss": 2.4272, "step": 301900 }, { "epoch": 0.53, "learning_rate": 2.367526166917204e-05, "loss": 2.2743, "step": 301910 }, { "epoch": 0.53, "learning_rate": 2.3674389729245215e-05, "loss": 2.3377, "step": 301920 }, { "epoch": 0.53, "learning_rate": 2.367351778931839e-05, "loss": 2.3911, "step": 301930 }, { "epoch": 0.53, "learning_rate": 2.3672645849391562e-05, "loss": 2.3702, "step": 301940 }, { "epoch": 0.53, "learning_rate": 2.3671773909464732e-05, "loss": 2.4448, "step": 301950 }, { "epoch": 0.53, "learning_rate": 2.367090196953791e-05, "loss": 2.3374, "step": 301960 }, { "epoch": 0.53, "learning_rate": 2.367003002961108e-05, "loss": 2.3366, "step": 301970 }, { "epoch": 0.53, "learning_rate": 2.3669158089684254e-05, "loss": 2.2965, "step": 301980 }, { "epoch": 0.53, "learning_rate": 2.3668286149757428e-05, "loss": 2.3242, "step": 301990 }, { "epoch": 0.53, "learning_rate": 2.36674142098306e-05, "loss": 2.3807, "step": 302000 }, { "epoch": 0.53, "learning_rate": 2.3666542269903775e-05, "loss": 2.2452, "step": 302010 }, { "epoch": 0.53, "learning_rate": 2.3665670329976945e-05, "loss": 2.3459, "step": 302020 }, { "epoch": 0.53, "learning_rate": 2.366479839005012e-05, "loss": 2.4356, "step": 302030 }, { "epoch": 0.53, "learning_rate": 2.3663926450123293e-05, "loss": 2.4115, "step": 302040 }, { "epoch": 0.53, "learning_rate": 2.3663054510196467e-05, "loss": 2.3268, "step": 302050 }, { "epoch": 0.53, "learning_rate": 2.366218257026964e-05, "loss": 2.3882, "step": 302060 }, { "epoch": 0.53, "learning_rate": 2.366131063034281e-05, "loss": 2.3759, "step": 302070 }, { "epoch": 0.53, "learning_rate": 2.3660438690415988e-05, "loss": 2.4027, "step": 302080 }, { "epoch": 0.53, "learning_rate": 2.365956675048916e-05, "loss": 2.392, "step": 302090 }, { "epoch": 0.53, "learning_rate": 2.3658694810562332e-05, "loss": 2.2918, "step": 302100 }, { "epoch": 0.53, "learning_rate": 2.3657822870635506e-05, "loss": 2.334, "step": 302110 }, { "epoch": 0.53, "learning_rate": 2.365695093070868e-05, "loss": 2.3081, "step": 302120 }, { "epoch": 0.53, "learning_rate": 2.3656078990781854e-05, "loss": 2.3328, "step": 302130 }, { "epoch": 0.53, "learning_rate": 2.3655207050855024e-05, "loss": 2.3392, "step": 302140 }, { "epoch": 0.53, "learning_rate": 2.36543351109282e-05, "loss": 2.2693, "step": 302150 }, { "epoch": 0.53, "learning_rate": 2.365346317100137e-05, "loss": 2.4263, "step": 302160 }, { "epoch": 0.53, "learning_rate": 2.3652591231074545e-05, "loss": 2.3253, "step": 302170 }, { "epoch": 0.53, "learning_rate": 2.3651719291147716e-05, "loss": 2.3192, "step": 302180 }, { "epoch": 0.53, "learning_rate": 2.3650847351220893e-05, "loss": 2.323, "step": 302190 }, { "epoch": 0.53, "learning_rate": 2.3649975411294063e-05, "loss": 2.4138, "step": 302200 }, { "epoch": 0.53, "learning_rate": 2.3649103471367237e-05, "loss": 2.4864, "step": 302210 }, { "epoch": 0.53, "learning_rate": 2.364823153144041e-05, "loss": 2.4626, "step": 302220 }, { "epoch": 0.53, "learning_rate": 2.3647359591513584e-05, "loss": 2.3358, "step": 302230 }, { "epoch": 0.53, "learning_rate": 2.3646487651586758e-05, "loss": 2.3601, "step": 302240 }, { "epoch": 0.53, "learning_rate": 2.364561571165993e-05, "loss": 2.3502, "step": 302250 }, { "epoch": 0.53, "learning_rate": 2.3644743771733106e-05, "loss": 2.3826, "step": 302260 }, { "epoch": 0.53, "learning_rate": 2.3643871831806276e-05, "loss": 2.32, "step": 302270 }, { "epoch": 0.53, "learning_rate": 2.364299989187945e-05, "loss": 2.3522, "step": 302280 }, { "epoch": 0.53, "learning_rate": 2.3642127951952624e-05, "loss": 2.3688, "step": 302290 }, { "epoch": 0.53, "learning_rate": 2.3641256012025797e-05, "loss": 2.4282, "step": 302300 }, { "epoch": 0.53, "learning_rate": 2.364038407209897e-05, "loss": 2.3648, "step": 302310 }, { "epoch": 0.53, "learning_rate": 2.363951213217214e-05, "loss": 2.3078, "step": 302320 }, { "epoch": 0.53, "learning_rate": 2.3638640192245315e-05, "loss": 2.3681, "step": 302330 }, { "epoch": 0.53, "learning_rate": 2.363776825231849e-05, "loss": 2.3421, "step": 302340 }, { "epoch": 0.53, "learning_rate": 2.3636896312391663e-05, "loss": 2.3005, "step": 302350 }, { "epoch": 0.53, "learning_rate": 2.3636024372464837e-05, "loss": 2.3122, "step": 302360 }, { "epoch": 0.53, "learning_rate": 2.363515243253801e-05, "loss": 2.4796, "step": 302370 }, { "epoch": 0.53, "learning_rate": 2.3634280492611184e-05, "loss": 2.3926, "step": 302380 }, { "epoch": 0.53, "learning_rate": 2.3633408552684355e-05, "loss": 2.3787, "step": 302390 }, { "epoch": 0.53, "learning_rate": 2.363253661275753e-05, "loss": 2.3531, "step": 302400 }, { "epoch": 0.53, "learning_rate": 2.3631664672830702e-05, "loss": 2.2262, "step": 302410 }, { "epoch": 0.53, "learning_rate": 2.3630792732903876e-05, "loss": 2.2417, "step": 302420 }, { "epoch": 0.53, "learning_rate": 2.3629920792977046e-05, "loss": 2.3424, "step": 302430 }, { "epoch": 0.53, "learning_rate": 2.362904885305022e-05, "loss": 2.3652, "step": 302440 }, { "epoch": 0.53, "learning_rate": 2.3628176913123394e-05, "loss": 2.3944, "step": 302450 }, { "epoch": 0.53, "learning_rate": 2.3627304973196568e-05, "loss": 2.4333, "step": 302460 }, { "epoch": 0.53, "learning_rate": 2.362643303326974e-05, "loss": 2.2318, "step": 302470 }, { "epoch": 0.53, "learning_rate": 2.3625561093342915e-05, "loss": 2.3402, "step": 302480 }, { "epoch": 0.53, "learning_rate": 2.362468915341609e-05, "loss": 2.3971, "step": 302490 }, { "epoch": 0.53, "learning_rate": 2.362381721348926e-05, "loss": 2.4744, "step": 302500 }, { "epoch": 0.53, "learning_rate": 2.3622945273562433e-05, "loss": 2.4682, "step": 302510 }, { "epoch": 0.53, "learning_rate": 2.3622073333635607e-05, "loss": 2.4122, "step": 302520 }, { "epoch": 0.53, "learning_rate": 2.362120139370878e-05, "loss": 2.2915, "step": 302530 }, { "epoch": 0.53, "learning_rate": 2.3620329453781954e-05, "loss": 2.3859, "step": 302540 }, { "epoch": 0.53, "learning_rate": 2.3619457513855125e-05, "loss": 2.4158, "step": 302550 }, { "epoch": 0.53, "learning_rate": 2.3618585573928302e-05, "loss": 2.366, "step": 302560 }, { "epoch": 0.53, "learning_rate": 2.3617713634001472e-05, "loss": 2.4249, "step": 302570 }, { "epoch": 0.53, "learning_rate": 2.3616841694074646e-05, "loss": 2.3413, "step": 302580 }, { "epoch": 0.53, "learning_rate": 2.3615969754147816e-05, "loss": 2.4553, "step": 302590 }, { "epoch": 0.53, "learning_rate": 2.3615097814220994e-05, "loss": 2.4527, "step": 302600 }, { "epoch": 0.53, "learning_rate": 2.3614225874294167e-05, "loss": 2.4346, "step": 302610 }, { "epoch": 0.53, "learning_rate": 2.3613353934367338e-05, "loss": 2.3573, "step": 302620 }, { "epoch": 0.53, "learning_rate": 2.3612481994440515e-05, "loss": 2.3721, "step": 302630 }, { "epoch": 0.53, "learning_rate": 2.3611610054513685e-05, "loss": 2.2834, "step": 302640 }, { "epoch": 0.53, "learning_rate": 2.361073811458686e-05, "loss": 2.3909, "step": 302650 }, { "epoch": 0.53, "learning_rate": 2.360986617466003e-05, "loss": 2.3229, "step": 302660 }, { "epoch": 0.53, "learning_rate": 2.3608994234733207e-05, "loss": 2.238, "step": 302670 }, { "epoch": 0.53, "learning_rate": 2.3608122294806377e-05, "loss": 2.271, "step": 302680 }, { "epoch": 0.53, "learning_rate": 2.360725035487955e-05, "loss": 2.3317, "step": 302690 }, { "epoch": 0.53, "learning_rate": 2.3606378414952725e-05, "loss": 2.3896, "step": 302700 }, { "epoch": 0.53, "learning_rate": 2.36055064750259e-05, "loss": 2.3822, "step": 302710 }, { "epoch": 0.53, "learning_rate": 2.3604634535099072e-05, "loss": 2.2804, "step": 302720 }, { "epoch": 0.53, "learning_rate": 2.3603762595172242e-05, "loss": 2.2609, "step": 302730 }, { "epoch": 0.53, "learning_rate": 2.3602890655245416e-05, "loss": 2.4344, "step": 302740 }, { "epoch": 0.53, "learning_rate": 2.360201871531859e-05, "loss": 2.2908, "step": 302750 }, { "epoch": 0.53, "learning_rate": 2.3601146775391764e-05, "loss": 2.3295, "step": 302760 }, { "epoch": 0.53, "learning_rate": 2.3600274835464938e-05, "loss": 2.3276, "step": 302770 }, { "epoch": 0.53, "learning_rate": 2.359940289553811e-05, "loss": 2.3563, "step": 302780 }, { "epoch": 0.53, "learning_rate": 2.3598530955611285e-05, "loss": 2.3687, "step": 302790 }, { "epoch": 0.53, "learning_rate": 2.3597659015684455e-05, "loss": 2.3655, "step": 302800 }, { "epoch": 0.53, "learning_rate": 2.359678707575763e-05, "loss": 2.3339, "step": 302810 }, { "epoch": 0.53, "learning_rate": 2.3595915135830803e-05, "loss": 2.2707, "step": 302820 }, { "epoch": 0.53, "learning_rate": 2.3595043195903977e-05, "loss": 2.3334, "step": 302830 }, { "epoch": 0.53, "learning_rate": 2.3594171255977147e-05, "loss": 2.3031, "step": 302840 }, { "epoch": 0.53, "learning_rate": 2.359329931605032e-05, "loss": 2.3998, "step": 302850 }, { "epoch": 0.53, "learning_rate": 2.3592427376123498e-05, "loss": 2.3254, "step": 302860 }, { "epoch": 0.53, "learning_rate": 2.359155543619667e-05, "loss": 2.3816, "step": 302870 }, { "epoch": 0.53, "learning_rate": 2.3590683496269842e-05, "loss": 2.4089, "step": 302880 }, { "epoch": 0.53, "learning_rate": 2.3589811556343016e-05, "loss": 2.3967, "step": 302890 }, { "epoch": 0.53, "learning_rate": 2.358893961641619e-05, "loss": 2.4391, "step": 302900 }, { "epoch": 0.53, "learning_rate": 2.358806767648936e-05, "loss": 2.422, "step": 302910 }, { "epoch": 0.53, "learning_rate": 2.3587195736562534e-05, "loss": 2.4401, "step": 302920 }, { "epoch": 0.53, "learning_rate": 2.3586323796635708e-05, "loss": 2.3831, "step": 302930 }, { "epoch": 0.53, "learning_rate": 2.358545185670888e-05, "loss": 2.4387, "step": 302940 }, { "epoch": 0.53, "learning_rate": 2.3584579916782055e-05, "loss": 2.3418, "step": 302950 }, { "epoch": 0.53, "learning_rate": 2.3583707976855226e-05, "loss": 2.256, "step": 302960 }, { "epoch": 0.53, "learning_rate": 2.3582836036928403e-05, "loss": 2.4634, "step": 302970 }, { "epoch": 0.53, "learning_rate": 2.3581964097001573e-05, "loss": 2.2971, "step": 302980 }, { "epoch": 0.53, "learning_rate": 2.3581092157074747e-05, "loss": 2.3762, "step": 302990 }, { "epoch": 0.53, "learning_rate": 2.358022021714792e-05, "loss": 2.3146, "step": 303000 }, { "epoch": 0.53, "learning_rate": 2.3579348277221094e-05, "loss": 2.3465, "step": 303010 }, { "epoch": 0.53, "learning_rate": 2.3578476337294268e-05, "loss": 2.3544, "step": 303020 }, { "epoch": 0.53, "learning_rate": 2.357760439736744e-05, "loss": 2.2447, "step": 303030 }, { "epoch": 0.53, "learning_rate": 2.3576732457440616e-05, "loss": 2.3749, "step": 303040 }, { "epoch": 0.53, "learning_rate": 2.3575860517513786e-05, "loss": 2.2887, "step": 303050 }, { "epoch": 0.53, "learning_rate": 2.357498857758696e-05, "loss": 2.2695, "step": 303060 }, { "epoch": 0.53, "learning_rate": 2.357411663766013e-05, "loss": 2.3104, "step": 303070 }, { "epoch": 0.53, "learning_rate": 2.3573244697733307e-05, "loss": 2.3493, "step": 303080 }, { "epoch": 0.53, "learning_rate": 2.357237275780648e-05, "loss": 2.4712, "step": 303090 }, { "epoch": 0.53, "learning_rate": 2.357150081787965e-05, "loss": 2.3411, "step": 303100 }, { "epoch": 0.53, "learning_rate": 2.3570628877952825e-05, "loss": 2.3155, "step": 303110 }, { "epoch": 0.53, "learning_rate": 2.3569756938026e-05, "loss": 2.4119, "step": 303120 }, { "epoch": 0.53, "learning_rate": 2.3568884998099173e-05, "loss": 2.4102, "step": 303130 }, { "epoch": 0.53, "learning_rate": 2.3568013058172343e-05, "loss": 2.3576, "step": 303140 }, { "epoch": 0.53, "learning_rate": 2.356714111824552e-05, "loss": 2.4071, "step": 303150 }, { "epoch": 0.53, "learning_rate": 2.356626917831869e-05, "loss": 2.4162, "step": 303160 }, { "epoch": 0.53, "learning_rate": 2.3565397238391865e-05, "loss": 2.2413, "step": 303170 }, { "epoch": 0.53, "learning_rate": 2.356452529846504e-05, "loss": 2.363, "step": 303180 }, { "epoch": 0.53, "learning_rate": 2.3563653358538212e-05, "loss": 2.2569, "step": 303190 }, { "epoch": 0.53, "learning_rate": 2.3562781418611386e-05, "loss": 2.3314, "step": 303200 }, { "epoch": 0.53, "learning_rate": 2.3561909478684556e-05, "loss": 2.3624, "step": 303210 }, { "epoch": 0.53, "learning_rate": 2.356103753875773e-05, "loss": 2.3272, "step": 303220 }, { "epoch": 0.53, "learning_rate": 2.3560165598830904e-05, "loss": 2.3366, "step": 303230 }, { "epoch": 0.53, "learning_rate": 2.3559293658904078e-05, "loss": 2.3012, "step": 303240 }, { "epoch": 0.53, "learning_rate": 2.355842171897725e-05, "loss": 2.3195, "step": 303250 }, { "epoch": 0.53, "learning_rate": 2.3557549779050422e-05, "loss": 2.3298, "step": 303260 }, { "epoch": 0.53, "learning_rate": 2.35566778391236e-05, "loss": 2.3087, "step": 303270 }, { "epoch": 0.53, "learning_rate": 2.355580589919677e-05, "loss": 2.3167, "step": 303280 }, { "epoch": 0.53, "learning_rate": 2.3554933959269943e-05, "loss": 2.2715, "step": 303290 }, { "epoch": 0.53, "learning_rate": 2.3554062019343117e-05, "loss": 2.291, "step": 303300 }, { "epoch": 0.53, "learning_rate": 2.355319007941629e-05, "loss": 2.4339, "step": 303310 }, { "epoch": 0.53, "learning_rate": 2.355231813948946e-05, "loss": 2.426, "step": 303320 }, { "epoch": 0.53, "learning_rate": 2.3551446199562635e-05, "loss": 2.3288, "step": 303330 }, { "epoch": 0.53, "learning_rate": 2.3550574259635812e-05, "loss": 2.304, "step": 303340 }, { "epoch": 0.53, "learning_rate": 2.3549702319708982e-05, "loss": 2.2892, "step": 303350 }, { "epoch": 0.53, "learning_rate": 2.3548830379782156e-05, "loss": 2.3325, "step": 303360 }, { "epoch": 0.53, "learning_rate": 2.3547958439855326e-05, "loss": 2.3765, "step": 303370 }, { "epoch": 0.53, "learning_rate": 2.3547086499928504e-05, "loss": 2.366, "step": 303380 }, { "epoch": 0.53, "learning_rate": 2.3546214560001674e-05, "loss": 2.3492, "step": 303390 }, { "epoch": 0.53, "learning_rate": 2.3545342620074848e-05, "loss": 2.354, "step": 303400 }, { "epoch": 0.53, "learning_rate": 2.354447068014802e-05, "loss": 2.3466, "step": 303410 }, { "epoch": 0.53, "learning_rate": 2.3543598740221195e-05, "loss": 2.4431, "step": 303420 }, { "epoch": 0.53, "learning_rate": 2.354272680029437e-05, "loss": 2.3349, "step": 303430 }, { "epoch": 0.53, "learning_rate": 2.354185486036754e-05, "loss": 2.2902, "step": 303440 }, { "epoch": 0.53, "learning_rate": 2.3540982920440717e-05, "loss": 2.31, "step": 303450 }, { "epoch": 0.53, "learning_rate": 2.3540110980513887e-05, "loss": 2.267, "step": 303460 }, { "epoch": 0.53, "learning_rate": 2.353923904058706e-05, "loss": 2.4542, "step": 303470 }, { "epoch": 0.53, "learning_rate": 2.3538367100660235e-05, "loss": 2.2184, "step": 303480 }, { "epoch": 0.53, "learning_rate": 2.353749516073341e-05, "loss": 2.2979, "step": 303490 }, { "epoch": 0.53, "learning_rate": 2.3536623220806582e-05, "loss": 2.4383, "step": 303500 }, { "epoch": 0.53, "learning_rate": 2.3535751280879752e-05, "loss": 2.3656, "step": 303510 }, { "epoch": 0.53, "learning_rate": 2.3534879340952926e-05, "loss": 2.4111, "step": 303520 }, { "epoch": 0.53, "learning_rate": 2.35340074010261e-05, "loss": 2.2684, "step": 303530 }, { "epoch": 0.53, "learning_rate": 2.3533135461099274e-05, "loss": 2.279, "step": 303540 }, { "epoch": 0.53, "learning_rate": 2.3532263521172444e-05, "loss": 2.3443, "step": 303550 }, { "epoch": 0.53, "learning_rate": 2.353139158124562e-05, "loss": 2.385, "step": 303560 }, { "epoch": 0.53, "learning_rate": 2.3530519641318792e-05, "loss": 2.4572, "step": 303570 }, { "epoch": 0.53, "learning_rate": 2.3529647701391965e-05, "loss": 2.3667, "step": 303580 }, { "epoch": 0.53, "learning_rate": 2.352877576146514e-05, "loss": 2.2884, "step": 303590 }, { "epoch": 0.53, "learning_rate": 2.3527903821538313e-05, "loss": 2.413, "step": 303600 }, { "epoch": 0.53, "learning_rate": 2.3527031881611487e-05, "loss": 2.3865, "step": 303610 }, { "epoch": 0.53, "learning_rate": 2.3526159941684657e-05, "loss": 2.4123, "step": 303620 }, { "epoch": 0.53, "learning_rate": 2.352528800175783e-05, "loss": 2.4341, "step": 303630 }, { "epoch": 0.53, "learning_rate": 2.3524416061831005e-05, "loss": 2.2489, "step": 303640 }, { "epoch": 0.53, "learning_rate": 2.352354412190418e-05, "loss": 2.3324, "step": 303650 }, { "epoch": 0.53, "learning_rate": 2.3522672181977352e-05, "loss": 2.4473, "step": 303660 }, { "epoch": 0.53, "learning_rate": 2.3521800242050523e-05, "loss": 2.3907, "step": 303670 }, { "epoch": 0.53, "learning_rate": 2.35209283021237e-05, "loss": 2.3835, "step": 303680 }, { "epoch": 0.53, "learning_rate": 2.352005636219687e-05, "loss": 2.3881, "step": 303690 }, { "epoch": 0.53, "learning_rate": 2.3519184422270044e-05, "loss": 2.3996, "step": 303700 }, { "epoch": 0.53, "learning_rate": 2.3518312482343218e-05, "loss": 2.3181, "step": 303710 }, { "epoch": 0.53, "learning_rate": 2.351744054241639e-05, "loss": 2.4368, "step": 303720 }, { "epoch": 0.53, "learning_rate": 2.3516568602489565e-05, "loss": 2.3566, "step": 303730 }, { "epoch": 0.53, "learning_rate": 2.3515696662562736e-05, "loss": 2.3347, "step": 303740 }, { "epoch": 0.53, "learning_rate": 2.3514824722635913e-05, "loss": 2.368, "step": 303750 }, { "epoch": 0.53, "learning_rate": 2.3513952782709083e-05, "loss": 2.3518, "step": 303760 }, { "epoch": 0.53, "learning_rate": 2.3513080842782257e-05, "loss": 2.2735, "step": 303770 }, { "epoch": 0.53, "learning_rate": 2.3512208902855427e-05, "loss": 2.3975, "step": 303780 }, { "epoch": 0.53, "learning_rate": 2.3511336962928604e-05, "loss": 2.3155, "step": 303790 }, { "epoch": 0.53, "learning_rate": 2.3510465023001775e-05, "loss": 2.3138, "step": 303800 }, { "epoch": 0.53, "learning_rate": 2.350959308307495e-05, "loss": 2.42, "step": 303810 }, { "epoch": 0.53, "learning_rate": 2.3508721143148126e-05, "loss": 2.4714, "step": 303820 }, { "epoch": 0.53, "learning_rate": 2.3507849203221296e-05, "loss": 2.3024, "step": 303830 }, { "epoch": 0.53, "learning_rate": 2.350697726329447e-05, "loss": 2.4194, "step": 303840 }, { "epoch": 0.53, "learning_rate": 2.350610532336764e-05, "loss": 2.4333, "step": 303850 }, { "epoch": 0.53, "learning_rate": 2.3505233383440817e-05, "loss": 2.4367, "step": 303860 }, { "epoch": 0.53, "learning_rate": 2.3504361443513988e-05, "loss": 2.4282, "step": 303870 }, { "epoch": 0.53, "learning_rate": 2.350348950358716e-05, "loss": 2.396, "step": 303880 }, { "epoch": 0.53, "learning_rate": 2.3502617563660335e-05, "loss": 2.2664, "step": 303890 }, { "epoch": 0.53, "learning_rate": 2.350174562373351e-05, "loss": 2.3142, "step": 303900 }, { "epoch": 0.53, "learning_rate": 2.3500873683806683e-05, "loss": 2.3224, "step": 303910 }, { "epoch": 0.53, "learning_rate": 2.3500001743879853e-05, "loss": 2.3727, "step": 303920 }, { "epoch": 0.53, "learning_rate": 2.3499129803953027e-05, "loss": 2.3613, "step": 303930 }, { "epoch": 0.53, "learning_rate": 2.34982578640262e-05, "loss": 2.3297, "step": 303940 }, { "epoch": 0.53, "learning_rate": 2.3497385924099375e-05, "loss": 2.4179, "step": 303950 }, { "epoch": 0.53, "learning_rate": 2.349651398417255e-05, "loss": 2.4246, "step": 303960 }, { "epoch": 0.53, "learning_rate": 2.3495642044245722e-05, "loss": 2.2693, "step": 303970 }, { "epoch": 0.53, "learning_rate": 2.3494770104318896e-05, "loss": 2.2915, "step": 303980 }, { "epoch": 0.53, "learning_rate": 2.3493898164392066e-05, "loss": 2.281, "step": 303990 }, { "epoch": 0.53, "learning_rate": 2.349302622446524e-05, "loss": 2.3728, "step": 304000 }, { "epoch": 0.53, "learning_rate": 2.3492154284538414e-05, "loss": 2.4526, "step": 304010 }, { "epoch": 0.53, "learning_rate": 2.3491282344611588e-05, "loss": 2.4209, "step": 304020 }, { "epoch": 0.53, "learning_rate": 2.3490410404684758e-05, "loss": 2.3715, "step": 304030 }, { "epoch": 0.53, "learning_rate": 2.3489538464757932e-05, "loss": 2.3712, "step": 304040 }, { "epoch": 0.53, "learning_rate": 2.3488666524831106e-05, "loss": 2.3466, "step": 304050 }, { "epoch": 0.53, "learning_rate": 2.348779458490428e-05, "loss": 2.3539, "step": 304060 }, { "epoch": 0.53, "learning_rate": 2.3486922644977453e-05, "loss": 2.3372, "step": 304070 }, { "epoch": 0.53, "learning_rate": 2.3486050705050627e-05, "loss": 2.3369, "step": 304080 }, { "epoch": 0.53, "learning_rate": 2.34851787651238e-05, "loss": 2.2873, "step": 304090 }, { "epoch": 0.53, "learning_rate": 2.348430682519697e-05, "loss": 2.4244, "step": 304100 }, { "epoch": 0.53, "learning_rate": 2.3483434885270145e-05, "loss": 2.4921, "step": 304110 }, { "epoch": 0.53, "learning_rate": 2.348256294534332e-05, "loss": 2.3877, "step": 304120 }, { "epoch": 0.53, "learning_rate": 2.3481691005416492e-05, "loss": 2.3785, "step": 304130 }, { "epoch": 0.53, "learning_rate": 2.3480819065489666e-05, "loss": 2.3163, "step": 304140 }, { "epoch": 0.53, "learning_rate": 2.3479947125562836e-05, "loss": 2.2604, "step": 304150 }, { "epoch": 0.53, "learning_rate": 2.3479075185636014e-05, "loss": 2.3488, "step": 304160 }, { "epoch": 0.53, "learning_rate": 2.3478203245709184e-05, "loss": 2.4512, "step": 304170 }, { "epoch": 0.53, "learning_rate": 2.3477331305782358e-05, "loss": 2.3333, "step": 304180 }, { "epoch": 0.53, "learning_rate": 2.3476459365855528e-05, "loss": 2.4232, "step": 304190 }, { "epoch": 0.53, "learning_rate": 2.3475587425928705e-05, "loss": 2.3311, "step": 304200 }, { "epoch": 0.53, "learning_rate": 2.347471548600188e-05, "loss": 2.3077, "step": 304210 }, { "epoch": 0.53, "learning_rate": 2.347384354607505e-05, "loss": 2.3061, "step": 304220 }, { "epoch": 0.53, "learning_rate": 2.3472971606148227e-05, "loss": 2.4134, "step": 304230 }, { "epoch": 0.53, "learning_rate": 2.3472099666221397e-05, "loss": 2.25, "step": 304240 }, { "epoch": 0.53, "learning_rate": 2.347122772629457e-05, "loss": 2.3004, "step": 304250 }, { "epoch": 0.53, "learning_rate": 2.347035578636774e-05, "loss": 2.4141, "step": 304260 }, { "epoch": 0.53, "learning_rate": 2.346948384644092e-05, "loss": 2.33, "step": 304270 }, { "epoch": 0.53, "learning_rate": 2.346861190651409e-05, "loss": 2.4411, "step": 304280 }, { "epoch": 0.53, "learning_rate": 2.3467739966587262e-05, "loss": 2.3422, "step": 304290 }, { "epoch": 0.53, "learning_rate": 2.3466868026660436e-05, "loss": 2.2222, "step": 304300 }, { "epoch": 0.53, "learning_rate": 2.346599608673361e-05, "loss": 2.4453, "step": 304310 }, { "epoch": 0.53, "learning_rate": 2.3465124146806784e-05, "loss": 2.4185, "step": 304320 }, { "epoch": 0.53, "learning_rate": 2.3464252206879954e-05, "loss": 2.3602, "step": 304330 }, { "epoch": 0.53, "learning_rate": 2.3463380266953128e-05, "loss": 2.3201, "step": 304340 }, { "epoch": 0.53, "learning_rate": 2.3462508327026302e-05, "loss": 2.2294, "step": 304350 }, { "epoch": 0.53, "learning_rate": 2.3461636387099475e-05, "loss": 2.2797, "step": 304360 }, { "epoch": 0.53, "learning_rate": 2.346076444717265e-05, "loss": 2.2957, "step": 304370 }, { "epoch": 0.53, "learning_rate": 2.3459892507245823e-05, "loss": 2.416, "step": 304380 }, { "epoch": 0.53, "learning_rate": 2.3459020567318997e-05, "loss": 2.4102, "step": 304390 }, { "epoch": 0.53, "learning_rate": 2.3458148627392167e-05, "loss": 2.3246, "step": 304400 }, { "epoch": 0.53, "learning_rate": 2.345727668746534e-05, "loss": 2.3112, "step": 304410 }, { "epoch": 0.53, "learning_rate": 2.3456404747538515e-05, "loss": 2.2904, "step": 304420 }, { "epoch": 0.53, "learning_rate": 2.345553280761169e-05, "loss": 2.3722, "step": 304430 }, { "epoch": 0.53, "learning_rate": 2.3454660867684862e-05, "loss": 2.4106, "step": 304440 }, { "epoch": 0.53, "learning_rate": 2.3453788927758033e-05, "loss": 2.2869, "step": 304450 }, { "epoch": 0.53, "learning_rate": 2.345291698783121e-05, "loss": 2.3706, "step": 304460 }, { "epoch": 0.53, "learning_rate": 2.345204504790438e-05, "loss": 2.4087, "step": 304470 }, { "epoch": 0.53, "learning_rate": 2.3451173107977554e-05, "loss": 2.4137, "step": 304480 }, { "epoch": 0.53, "learning_rate": 2.3450301168050728e-05, "loss": 2.4359, "step": 304490 }, { "epoch": 0.53, "learning_rate": 2.34494292281239e-05, "loss": 2.3714, "step": 304500 }, { "epoch": 0.53, "learning_rate": 2.3448557288197072e-05, "loss": 2.3223, "step": 304510 }, { "epoch": 0.53, "learning_rate": 2.3447685348270246e-05, "loss": 2.4282, "step": 304520 }, { "epoch": 0.53, "learning_rate": 2.344681340834342e-05, "loss": 2.3701, "step": 304530 }, { "epoch": 0.53, "learning_rate": 2.3445941468416593e-05, "loss": 2.418, "step": 304540 }, { "epoch": 0.53, "learning_rate": 2.3445069528489767e-05, "loss": 2.2299, "step": 304550 }, { "epoch": 0.53, "learning_rate": 2.3444197588562937e-05, "loss": 2.4502, "step": 304560 }, { "epoch": 0.53, "learning_rate": 2.3443325648636114e-05, "loss": 2.4466, "step": 304570 }, { "epoch": 0.53, "learning_rate": 2.3442453708709285e-05, "loss": 2.3124, "step": 304580 }, { "epoch": 0.53, "learning_rate": 2.344158176878246e-05, "loss": 2.2952, "step": 304590 }, { "epoch": 0.53, "learning_rate": 2.3440709828855632e-05, "loss": 2.3238, "step": 304600 }, { "epoch": 0.53, "learning_rate": 2.3439837888928806e-05, "loss": 2.3543, "step": 304610 }, { "epoch": 0.53, "learning_rate": 2.343896594900198e-05, "loss": 2.3704, "step": 304620 }, { "epoch": 0.53, "learning_rate": 2.343809400907515e-05, "loss": 2.2783, "step": 304630 }, { "epoch": 0.53, "learning_rate": 2.3437222069148327e-05, "loss": 2.4493, "step": 304640 }, { "epoch": 0.53, "learning_rate": 2.3436350129221498e-05, "loss": 2.3167, "step": 304650 }, { "epoch": 0.53, "learning_rate": 2.343547818929467e-05, "loss": 2.3981, "step": 304660 }, { "epoch": 0.53, "learning_rate": 2.3434606249367842e-05, "loss": 2.3315, "step": 304670 }, { "epoch": 0.53, "learning_rate": 2.343373430944102e-05, "loss": 2.3974, "step": 304680 }, { "epoch": 0.53, "learning_rate": 2.3432862369514193e-05, "loss": 2.2042, "step": 304690 }, { "epoch": 0.53, "learning_rate": 2.3431990429587363e-05, "loss": 2.3749, "step": 304700 }, { "epoch": 0.53, "learning_rate": 2.3431118489660537e-05, "loss": 2.3399, "step": 304710 }, { "epoch": 0.53, "learning_rate": 2.343024654973371e-05, "loss": 2.2334, "step": 304720 }, { "epoch": 0.53, "learning_rate": 2.3429374609806885e-05, "loss": 2.3193, "step": 304730 }, { "epoch": 0.53, "learning_rate": 2.3428502669880055e-05, "loss": 2.3672, "step": 304740 }, { "epoch": 0.53, "learning_rate": 2.3427630729953232e-05, "loss": 2.4695, "step": 304750 }, { "epoch": 0.53, "learning_rate": 2.3426758790026403e-05, "loss": 2.3405, "step": 304760 }, { "epoch": 0.53, "learning_rate": 2.3425886850099576e-05, "loss": 2.4381, "step": 304770 }, { "epoch": 0.53, "learning_rate": 2.342501491017275e-05, "loss": 2.3443, "step": 304780 }, { "epoch": 0.53, "learning_rate": 2.3424142970245924e-05, "loss": 2.3277, "step": 304790 }, { "epoch": 0.53, "learning_rate": 2.3423271030319098e-05, "loss": 2.34, "step": 304800 }, { "epoch": 0.53, "learning_rate": 2.3422399090392268e-05, "loss": 2.3158, "step": 304810 }, { "epoch": 0.53, "learning_rate": 2.3421527150465442e-05, "loss": 2.4118, "step": 304820 }, { "epoch": 0.53, "learning_rate": 2.3420655210538616e-05, "loss": 2.2972, "step": 304830 }, { "epoch": 0.53, "learning_rate": 2.341978327061179e-05, "loss": 2.2959, "step": 304840 }, { "epoch": 0.53, "learning_rate": 2.3418911330684963e-05, "loss": 2.3083, "step": 304850 }, { "epoch": 0.53, "learning_rate": 2.3418039390758133e-05, "loss": 2.3564, "step": 304860 }, { "epoch": 0.53, "learning_rate": 2.341716745083131e-05, "loss": 2.3326, "step": 304870 }, { "epoch": 0.53, "learning_rate": 2.341629551090448e-05, "loss": 2.316, "step": 304880 }, { "epoch": 0.53, "learning_rate": 2.3415423570977655e-05, "loss": 2.4068, "step": 304890 }, { "epoch": 0.53, "learning_rate": 2.341455163105083e-05, "loss": 2.4943, "step": 304900 }, { "epoch": 0.53, "learning_rate": 2.3413679691124002e-05, "loss": 2.4787, "step": 304910 }, { "epoch": 0.53, "learning_rate": 2.3412807751197173e-05, "loss": 2.3997, "step": 304920 }, { "epoch": 0.53, "learning_rate": 2.3411935811270346e-05, "loss": 2.275, "step": 304930 }, { "epoch": 0.53, "learning_rate": 2.3411063871343524e-05, "loss": 2.3588, "step": 304940 }, { "epoch": 0.53, "learning_rate": 2.3410191931416694e-05, "loss": 2.4374, "step": 304950 }, { "epoch": 0.53, "learning_rate": 2.3409319991489868e-05, "loss": 2.4661, "step": 304960 }, { "epoch": 0.53, "learning_rate": 2.3408448051563038e-05, "loss": 2.3314, "step": 304970 }, { "epoch": 0.53, "learning_rate": 2.3407576111636215e-05, "loss": 2.3891, "step": 304980 }, { "epoch": 0.53, "learning_rate": 2.3406704171709386e-05, "loss": 2.2607, "step": 304990 }, { "epoch": 0.53, "learning_rate": 2.340583223178256e-05, "loss": 2.2758, "step": 305000 }, { "epoch": 0.53, "learning_rate": 2.3404960291855733e-05, "loss": 2.3161, "step": 305010 }, { "epoch": 0.53, "learning_rate": 2.3404088351928907e-05, "loss": 2.3247, "step": 305020 }, { "epoch": 0.53, "learning_rate": 2.340321641200208e-05, "loss": 2.341, "step": 305030 }, { "epoch": 0.53, "learning_rate": 2.340234447207525e-05, "loss": 2.3846, "step": 305040 }, { "epoch": 0.53, "learning_rate": 2.340147253214843e-05, "loss": 2.3279, "step": 305050 }, { "epoch": 0.53, "learning_rate": 2.34006005922216e-05, "loss": 2.3448, "step": 305060 }, { "epoch": 0.53, "learning_rate": 2.3399728652294772e-05, "loss": 2.4171, "step": 305070 }, { "epoch": 0.53, "learning_rate": 2.3398856712367946e-05, "loss": 2.4226, "step": 305080 }, { "epoch": 0.53, "learning_rate": 2.339798477244112e-05, "loss": 2.3297, "step": 305090 }, { "epoch": 0.53, "learning_rate": 2.3397112832514294e-05, "loss": 2.3843, "step": 305100 }, { "epoch": 0.53, "learning_rate": 2.3396240892587464e-05, "loss": 2.3692, "step": 305110 }, { "epoch": 0.53, "learning_rate": 2.3395368952660638e-05, "loss": 2.4109, "step": 305120 }, { "epoch": 0.53, "learning_rate": 2.3394497012733812e-05, "loss": 2.3301, "step": 305130 }, { "epoch": 0.53, "learning_rate": 2.3393625072806985e-05, "loss": 2.3903, "step": 305140 }, { "epoch": 0.53, "learning_rate": 2.3392753132880156e-05, "loss": 2.3727, "step": 305150 }, { "epoch": 0.53, "learning_rate": 2.3391881192953333e-05, "loss": 2.3635, "step": 305160 }, { "epoch": 0.53, "learning_rate": 2.3391009253026507e-05, "loss": 2.3476, "step": 305170 }, { "epoch": 0.53, "learning_rate": 2.3390137313099677e-05, "loss": 2.3918, "step": 305180 }, { "epoch": 0.53, "learning_rate": 2.338926537317285e-05, "loss": 2.4644, "step": 305190 }, { "epoch": 0.53, "learning_rate": 2.3388393433246025e-05, "loss": 2.4575, "step": 305200 }, { "epoch": 0.53, "learning_rate": 2.33875214933192e-05, "loss": 2.3031, "step": 305210 }, { "epoch": 0.53, "learning_rate": 2.338664955339237e-05, "loss": 2.3484, "step": 305220 }, { "epoch": 0.53, "learning_rate": 2.3385777613465543e-05, "loss": 2.2995, "step": 305230 }, { "epoch": 0.53, "learning_rate": 2.3384905673538716e-05, "loss": 2.3932, "step": 305240 }, { "epoch": 0.53, "learning_rate": 2.338403373361189e-05, "loss": 2.3615, "step": 305250 }, { "epoch": 0.53, "learning_rate": 2.3383161793685064e-05, "loss": 2.3141, "step": 305260 }, { "epoch": 0.53, "learning_rate": 2.3382289853758234e-05, "loss": 2.3311, "step": 305270 }, { "epoch": 0.53, "learning_rate": 2.338141791383141e-05, "loss": 2.3248, "step": 305280 }, { "epoch": 0.53, "learning_rate": 2.3380545973904582e-05, "loss": 2.3792, "step": 305290 }, { "epoch": 0.53, "learning_rate": 2.3379674033977756e-05, "loss": 2.3672, "step": 305300 }, { "epoch": 0.53, "learning_rate": 2.337880209405093e-05, "loss": 2.3641, "step": 305310 }, { "epoch": 0.53, "learning_rate": 2.3377930154124103e-05, "loss": 2.3058, "step": 305320 }, { "epoch": 0.53, "learning_rate": 2.3377058214197277e-05, "loss": 2.411, "step": 305330 }, { "epoch": 0.53, "learning_rate": 2.3376186274270447e-05, "loss": 2.3911, "step": 305340 }, { "epoch": 0.53, "learning_rate": 2.3375314334343624e-05, "loss": 2.4017, "step": 305350 }, { "epoch": 0.53, "learning_rate": 2.3374442394416795e-05, "loss": 2.4498, "step": 305360 }, { "epoch": 0.53, "learning_rate": 2.337357045448997e-05, "loss": 2.3868, "step": 305370 }, { "epoch": 0.53, "learning_rate": 2.337269851456314e-05, "loss": 2.3473, "step": 305380 }, { "epoch": 0.53, "learning_rate": 2.3371826574636316e-05, "loss": 2.4411, "step": 305390 }, { "epoch": 0.53, "learning_rate": 2.3370954634709487e-05, "loss": 2.248, "step": 305400 }, { "epoch": 0.53, "learning_rate": 2.337008269478266e-05, "loss": 2.3263, "step": 305410 }, { "epoch": 0.53, "learning_rate": 2.3369210754855837e-05, "loss": 2.4265, "step": 305420 }, { "epoch": 0.53, "learning_rate": 2.3368338814929008e-05, "loss": 2.3764, "step": 305430 }, { "epoch": 0.53, "learning_rate": 2.336746687500218e-05, "loss": 2.4405, "step": 305440 }, { "epoch": 0.53, "learning_rate": 2.3366594935075352e-05, "loss": 2.2798, "step": 305450 }, { "epoch": 0.53, "learning_rate": 2.336572299514853e-05, "loss": 2.4021, "step": 305460 }, { "epoch": 0.53, "learning_rate": 2.33648510552217e-05, "loss": 2.4359, "step": 305470 }, { "epoch": 0.53, "learning_rate": 2.3363979115294873e-05, "loss": 2.3238, "step": 305480 }, { "epoch": 0.53, "learning_rate": 2.3363107175368047e-05, "loss": 2.3903, "step": 305490 }, { "epoch": 0.53, "learning_rate": 2.336223523544122e-05, "loss": 2.4176, "step": 305500 }, { "epoch": 0.53, "learning_rate": 2.3361363295514395e-05, "loss": 2.3879, "step": 305510 }, { "epoch": 0.53, "learning_rate": 2.3360491355587565e-05, "loss": 2.4457, "step": 305520 }, { "epoch": 0.53, "learning_rate": 2.335961941566074e-05, "loss": 2.3431, "step": 305530 }, { "epoch": 0.53, "learning_rate": 2.3358747475733913e-05, "loss": 2.3429, "step": 305540 }, { "epoch": 0.53, "learning_rate": 2.3357875535807086e-05, "loss": 2.322, "step": 305550 }, { "epoch": 0.53, "learning_rate": 2.335700359588026e-05, "loss": 2.3396, "step": 305560 }, { "epoch": 0.53, "learning_rate": 2.3356131655953434e-05, "loss": 2.4937, "step": 305570 }, { "epoch": 0.53, "learning_rate": 2.3355259716026608e-05, "loss": 2.4149, "step": 305580 }, { "epoch": 0.53, "learning_rate": 2.3354387776099778e-05, "loss": 2.2799, "step": 305590 }, { "epoch": 0.53, "learning_rate": 2.3353515836172952e-05, "loss": 2.3651, "step": 305600 }, { "epoch": 0.53, "learning_rate": 2.3352643896246126e-05, "loss": 2.3432, "step": 305610 }, { "epoch": 0.53, "learning_rate": 2.33517719563193e-05, "loss": 2.3558, "step": 305620 }, { "epoch": 0.53, "learning_rate": 2.335090001639247e-05, "loss": 2.372, "step": 305630 }, { "epoch": 0.53, "learning_rate": 2.3350028076465643e-05, "loss": 2.3735, "step": 305640 }, { "epoch": 0.53, "learning_rate": 2.3349156136538817e-05, "loss": 2.343, "step": 305650 }, { "epoch": 0.53, "learning_rate": 2.334828419661199e-05, "loss": 2.4173, "step": 305660 }, { "epoch": 0.53, "learning_rate": 2.3347412256685165e-05, "loss": 2.3012, "step": 305670 }, { "epoch": 0.53, "learning_rate": 2.334654031675834e-05, "loss": 2.3567, "step": 305680 }, { "epoch": 0.53, "learning_rate": 2.3345668376831512e-05, "loss": 2.3439, "step": 305690 }, { "epoch": 0.53, "learning_rate": 2.3344796436904683e-05, "loss": 2.3233, "step": 305700 }, { "epoch": 0.53, "learning_rate": 2.3343924496977856e-05, "loss": 2.4134, "step": 305710 }, { "epoch": 0.53, "learning_rate": 2.334305255705103e-05, "loss": 2.4283, "step": 305720 }, { "epoch": 0.53, "learning_rate": 2.3342180617124204e-05, "loss": 2.3451, "step": 305730 }, { "epoch": 0.53, "learning_rate": 2.3341308677197378e-05, "loss": 2.3161, "step": 305740 }, { "epoch": 0.53, "learning_rate": 2.3340436737270548e-05, "loss": 2.3403, "step": 305750 }, { "epoch": 0.53, "learning_rate": 2.3339564797343725e-05, "loss": 2.3672, "step": 305760 }, { "epoch": 0.53, "learning_rate": 2.3338692857416896e-05, "loss": 2.3477, "step": 305770 }, { "epoch": 0.53, "learning_rate": 2.333782091749007e-05, "loss": 2.3022, "step": 305780 }, { "epoch": 0.53, "learning_rate": 2.3336948977563243e-05, "loss": 2.3811, "step": 305790 }, { "epoch": 0.53, "learning_rate": 2.3336077037636417e-05, "loss": 2.3271, "step": 305800 }, { "epoch": 0.53, "learning_rate": 2.333520509770959e-05, "loss": 2.4178, "step": 305810 }, { "epoch": 0.53, "learning_rate": 2.333433315778276e-05, "loss": 2.2556, "step": 305820 }, { "epoch": 0.53, "learning_rate": 2.333346121785594e-05, "loss": 2.4738, "step": 305830 }, { "epoch": 0.53, "learning_rate": 2.333258927792911e-05, "loss": 2.2746, "step": 305840 }, { "epoch": 0.53, "learning_rate": 2.3331717338002282e-05, "loss": 2.3853, "step": 305850 }, { "epoch": 0.53, "learning_rate": 2.3330845398075453e-05, "loss": 2.3498, "step": 305860 }, { "epoch": 0.53, "learning_rate": 2.332997345814863e-05, "loss": 2.2895, "step": 305870 }, { "epoch": 0.53, "learning_rate": 2.33291015182218e-05, "loss": 2.3446, "step": 305880 }, { "epoch": 0.53, "learning_rate": 2.3328229578294974e-05, "loss": 2.3856, "step": 305890 }, { "epoch": 0.53, "learning_rate": 2.3327357638368148e-05, "loss": 2.2688, "step": 305900 }, { "epoch": 0.53, "learning_rate": 2.3326485698441322e-05, "loss": 2.3463, "step": 305910 }, { "epoch": 0.53, "learning_rate": 2.3325613758514495e-05, "loss": 2.3384, "step": 305920 }, { "epoch": 0.53, "learning_rate": 2.3324741818587666e-05, "loss": 2.36, "step": 305930 }, { "epoch": 0.53, "learning_rate": 2.3323869878660843e-05, "loss": 2.375, "step": 305940 }, { "epoch": 0.53, "learning_rate": 2.3322997938734013e-05, "loss": 2.4221, "step": 305950 }, { "epoch": 0.53, "learning_rate": 2.3322125998807187e-05, "loss": 2.3571, "step": 305960 }, { "epoch": 0.53, "learning_rate": 2.332125405888036e-05, "loss": 2.5195, "step": 305970 }, { "epoch": 0.53, "learning_rate": 2.3320382118953535e-05, "loss": 2.3496, "step": 305980 }, { "epoch": 0.53, "learning_rate": 2.331951017902671e-05, "loss": 2.3701, "step": 305990 }, { "epoch": 0.53, "learning_rate": 2.331863823909988e-05, "loss": 2.4755, "step": 306000 }, { "epoch": 0.53, "learning_rate": 2.3317766299173053e-05, "loss": 2.26, "step": 306010 }, { "epoch": 0.53, "learning_rate": 2.3316894359246226e-05, "loss": 2.2112, "step": 306020 }, { "epoch": 0.53, "learning_rate": 2.33160224193194e-05, "loss": 2.46, "step": 306030 }, { "epoch": 0.53, "learning_rate": 2.3315150479392574e-05, "loss": 2.3883, "step": 306040 }, { "epoch": 0.53, "learning_rate": 2.3314278539465744e-05, "loss": 2.4129, "step": 306050 }, { "epoch": 0.53, "learning_rate": 2.331340659953892e-05, "loss": 2.3555, "step": 306060 }, { "epoch": 0.53, "learning_rate": 2.3312534659612092e-05, "loss": 2.3615, "step": 306070 }, { "epoch": 0.53, "learning_rate": 2.3311662719685266e-05, "loss": 2.3861, "step": 306080 }, { "epoch": 0.53, "learning_rate": 2.331079077975844e-05, "loss": 2.3499, "step": 306090 }, { "epoch": 0.53, "learning_rate": 2.3309918839831613e-05, "loss": 2.1665, "step": 306100 }, { "epoch": 0.53, "learning_rate": 2.3309046899904784e-05, "loss": 2.2171, "step": 306110 }, { "epoch": 0.53, "learning_rate": 2.3308174959977957e-05, "loss": 2.3761, "step": 306120 }, { "epoch": 0.53, "learning_rate": 2.330730302005113e-05, "loss": 2.331, "step": 306130 }, { "epoch": 0.53, "learning_rate": 2.3306431080124305e-05, "loss": 2.3322, "step": 306140 }, { "epoch": 0.53, "learning_rate": 2.330555914019748e-05, "loss": 2.258, "step": 306150 }, { "epoch": 0.53, "learning_rate": 2.330468720027065e-05, "loss": 2.407, "step": 306160 }, { "epoch": 0.53, "learning_rate": 2.3303815260343826e-05, "loss": 2.4332, "step": 306170 }, { "epoch": 0.53, "learning_rate": 2.3302943320416997e-05, "loss": 2.2975, "step": 306180 }, { "epoch": 0.53, "learning_rate": 2.330207138049017e-05, "loss": 2.3918, "step": 306190 }, { "epoch": 0.53, "learning_rate": 2.3301199440563344e-05, "loss": 2.4251, "step": 306200 }, { "epoch": 0.53, "learning_rate": 2.3300327500636518e-05, "loss": 2.4443, "step": 306210 }, { "epoch": 0.53, "learning_rate": 2.329945556070969e-05, "loss": 2.4317, "step": 306220 }, { "epoch": 0.53, "learning_rate": 2.3298583620782862e-05, "loss": 2.2808, "step": 306230 }, { "epoch": 0.53, "learning_rate": 2.329771168085604e-05, "loss": 2.3702, "step": 306240 }, { "epoch": 0.53, "learning_rate": 2.329683974092921e-05, "loss": 2.29, "step": 306250 }, { "epoch": 0.53, "learning_rate": 2.3295967801002383e-05, "loss": 2.4293, "step": 306260 }, { "epoch": 0.53, "learning_rate": 2.3295095861075554e-05, "loss": 2.3276, "step": 306270 }, { "epoch": 0.53, "learning_rate": 2.329422392114873e-05, "loss": 2.3816, "step": 306280 }, { "epoch": 0.53, "learning_rate": 2.3293351981221905e-05, "loss": 2.3872, "step": 306290 }, { "epoch": 0.53, "learning_rate": 2.3292480041295075e-05, "loss": 2.3305, "step": 306300 }, { "epoch": 0.53, "learning_rate": 2.329160810136825e-05, "loss": 2.2872, "step": 306310 }, { "epoch": 0.53, "learning_rate": 2.3290736161441423e-05, "loss": 2.3478, "step": 306320 }, { "epoch": 0.53, "learning_rate": 2.3289864221514596e-05, "loss": 2.3494, "step": 306330 }, { "epoch": 0.53, "learning_rate": 2.3288992281587767e-05, "loss": 2.4218, "step": 306340 }, { "epoch": 0.53, "learning_rate": 2.3288120341660944e-05, "loss": 2.2799, "step": 306350 }, { "epoch": 0.53, "learning_rate": 2.3287248401734114e-05, "loss": 2.273, "step": 306360 }, { "epoch": 0.53, "learning_rate": 2.3286376461807288e-05, "loss": 2.3505, "step": 306370 }, { "epoch": 0.53, "learning_rate": 2.3285504521880462e-05, "loss": 2.2345, "step": 306380 }, { "epoch": 0.53, "learning_rate": 2.3284632581953636e-05, "loss": 2.3725, "step": 306390 }, { "epoch": 0.53, "learning_rate": 2.328376064202681e-05, "loss": 2.3643, "step": 306400 }, { "epoch": 0.53, "learning_rate": 2.328288870209998e-05, "loss": 2.3694, "step": 306410 }, { "epoch": 0.53, "learning_rate": 2.3282016762173153e-05, "loss": 2.3029, "step": 306420 }, { "epoch": 0.53, "learning_rate": 2.3281144822246327e-05, "loss": 2.2385, "step": 306430 }, { "epoch": 0.53, "learning_rate": 2.32802728823195e-05, "loss": 2.2859, "step": 306440 }, { "epoch": 0.53, "learning_rate": 2.3279400942392675e-05, "loss": 2.5034, "step": 306450 }, { "epoch": 0.53, "learning_rate": 2.3278529002465845e-05, "loss": 2.3145, "step": 306460 }, { "epoch": 0.53, "learning_rate": 2.3277657062539022e-05, "loss": 2.3731, "step": 306470 }, { "epoch": 0.53, "learning_rate": 2.3276785122612193e-05, "loss": 2.3945, "step": 306480 }, { "epoch": 0.53, "learning_rate": 2.3275913182685366e-05, "loss": 2.3619, "step": 306490 }, { "epoch": 0.53, "learning_rate": 2.327504124275854e-05, "loss": 2.3074, "step": 306500 }, { "epoch": 0.53, "learning_rate": 2.3274169302831714e-05, "loss": 2.1831, "step": 306510 }, { "epoch": 0.53, "learning_rate": 2.3273297362904888e-05, "loss": 2.3069, "step": 306520 }, { "epoch": 0.53, "learning_rate": 2.3272425422978058e-05, "loss": 2.3738, "step": 306530 }, { "epoch": 0.53, "learning_rate": 2.3271553483051235e-05, "loss": 2.3375, "step": 306540 }, { "epoch": 0.53, "learning_rate": 2.3270681543124406e-05, "loss": 2.3517, "step": 306550 }, { "epoch": 0.53, "learning_rate": 2.326980960319758e-05, "loss": 2.4286, "step": 306560 }, { "epoch": 0.53, "learning_rate": 2.326893766327075e-05, "loss": 2.3282, "step": 306570 }, { "epoch": 0.53, "learning_rate": 2.3268065723343927e-05, "loss": 2.3311, "step": 306580 }, { "epoch": 0.53, "learning_rate": 2.3267193783417097e-05, "loss": 2.438, "step": 306590 }, { "epoch": 0.53, "learning_rate": 2.326632184349027e-05, "loss": 2.3116, "step": 306600 }, { "epoch": 0.53, "learning_rate": 2.3265449903563445e-05, "loss": 2.4249, "step": 306610 }, { "epoch": 0.53, "learning_rate": 2.326457796363662e-05, "loss": 2.4275, "step": 306620 }, { "epoch": 0.53, "learning_rate": 2.3263706023709793e-05, "loss": 2.218, "step": 306630 }, { "epoch": 0.53, "learning_rate": 2.3262834083782963e-05, "loss": 2.2857, "step": 306640 }, { "epoch": 0.53, "learning_rate": 2.326196214385614e-05, "loss": 2.4008, "step": 306650 }, { "epoch": 0.53, "learning_rate": 2.326109020392931e-05, "loss": 2.2992, "step": 306660 }, { "epoch": 0.53, "learning_rate": 2.3260218264002484e-05, "loss": 2.3449, "step": 306670 }, { "epoch": 0.53, "learning_rate": 2.3259346324075658e-05, "loss": 2.3616, "step": 306680 }, { "epoch": 0.53, "learning_rate": 2.3258474384148832e-05, "loss": 2.4528, "step": 306690 }, { "epoch": 0.53, "learning_rate": 2.3257602444222006e-05, "loss": 2.2744, "step": 306700 }, { "epoch": 0.53, "learning_rate": 2.3256730504295176e-05, "loss": 2.2738, "step": 306710 }, { "epoch": 0.53, "learning_rate": 2.325585856436835e-05, "loss": 2.4185, "step": 306720 }, { "epoch": 0.53, "learning_rate": 2.3254986624441523e-05, "loss": 2.3239, "step": 306730 }, { "epoch": 0.53, "learning_rate": 2.3254114684514697e-05, "loss": 2.3597, "step": 306740 }, { "epoch": 0.53, "learning_rate": 2.3253242744587868e-05, "loss": 2.274, "step": 306750 }, { "epoch": 0.53, "learning_rate": 2.3252370804661045e-05, "loss": 2.2678, "step": 306760 }, { "epoch": 0.53, "learning_rate": 2.325149886473422e-05, "loss": 2.3149, "step": 306770 }, { "epoch": 0.53, "learning_rate": 2.325062692480739e-05, "loss": 2.4488, "step": 306780 }, { "epoch": 0.54, "learning_rate": 2.3249754984880563e-05, "loss": 2.3422, "step": 306790 }, { "epoch": 0.54, "learning_rate": 2.3248883044953736e-05, "loss": 2.3123, "step": 306800 }, { "epoch": 0.54, "learning_rate": 2.324801110502691e-05, "loss": 2.3184, "step": 306810 }, { "epoch": 0.54, "learning_rate": 2.324713916510008e-05, "loss": 2.3598, "step": 306820 }, { "epoch": 0.54, "learning_rate": 2.3246267225173254e-05, "loss": 2.4109, "step": 306830 }, { "epoch": 0.54, "learning_rate": 2.3245395285246428e-05, "loss": 2.4432, "step": 306840 }, { "epoch": 0.54, "learning_rate": 2.3244523345319602e-05, "loss": 2.3933, "step": 306850 }, { "epoch": 0.54, "learning_rate": 2.3243651405392776e-05, "loss": 2.3849, "step": 306860 }, { "epoch": 0.54, "learning_rate": 2.324277946546595e-05, "loss": 2.4041, "step": 306870 }, { "epoch": 0.54, "learning_rate": 2.3241907525539123e-05, "loss": 2.3716, "step": 306880 }, { "epoch": 0.54, "learning_rate": 2.3241035585612294e-05, "loss": 2.4537, "step": 306890 }, { "epoch": 0.54, "learning_rate": 2.3240163645685467e-05, "loss": 2.4438, "step": 306900 }, { "epoch": 0.54, "learning_rate": 2.323929170575864e-05, "loss": 2.3649, "step": 306910 }, { "epoch": 0.54, "learning_rate": 2.3238419765831815e-05, "loss": 2.4837, "step": 306920 }, { "epoch": 0.54, "learning_rate": 2.323754782590499e-05, "loss": 2.3461, "step": 306930 }, { "epoch": 0.54, "learning_rate": 2.323667588597816e-05, "loss": 2.3432, "step": 306940 }, { "epoch": 0.54, "learning_rate": 2.3235803946051336e-05, "loss": 2.4608, "step": 306950 }, { "epoch": 0.54, "learning_rate": 2.3234932006124507e-05, "loss": 2.4227, "step": 306960 }, { "epoch": 0.54, "learning_rate": 2.323406006619768e-05, "loss": 2.3343, "step": 306970 }, { "epoch": 0.54, "learning_rate": 2.323318812627085e-05, "loss": 2.3588, "step": 306980 }, { "epoch": 0.54, "learning_rate": 2.3232316186344028e-05, "loss": 2.3629, "step": 306990 }, { "epoch": 0.54, "learning_rate": 2.3231444246417198e-05, "loss": 2.3383, "step": 307000 }, { "epoch": 0.54, "learning_rate": 2.3230572306490372e-05, "loss": 2.3093, "step": 307010 }, { "epoch": 0.54, "learning_rate": 2.322970036656355e-05, "loss": 2.3129, "step": 307020 }, { "epoch": 0.54, "learning_rate": 2.322882842663672e-05, "loss": 2.2721, "step": 307030 }, { "epoch": 0.54, "learning_rate": 2.3227956486709893e-05, "loss": 2.3325, "step": 307040 }, { "epoch": 0.54, "learning_rate": 2.3227084546783064e-05, "loss": 2.2743, "step": 307050 }, { "epoch": 0.54, "learning_rate": 2.322621260685624e-05, "loss": 2.4088, "step": 307060 }, { "epoch": 0.54, "learning_rate": 2.322534066692941e-05, "loss": 2.3009, "step": 307070 }, { "epoch": 0.54, "learning_rate": 2.3224468727002585e-05, "loss": 2.2164, "step": 307080 }, { "epoch": 0.54, "learning_rate": 2.322359678707576e-05, "loss": 2.2777, "step": 307090 }, { "epoch": 0.54, "learning_rate": 2.3222724847148933e-05, "loss": 2.3933, "step": 307100 }, { "epoch": 0.54, "learning_rate": 2.3221852907222106e-05, "loss": 2.2683, "step": 307110 }, { "epoch": 0.54, "learning_rate": 2.3220980967295277e-05, "loss": 2.2663, "step": 307120 }, { "epoch": 0.54, "learning_rate": 2.322010902736845e-05, "loss": 2.3453, "step": 307130 }, { "epoch": 0.54, "learning_rate": 2.3219237087441624e-05, "loss": 2.3012, "step": 307140 }, { "epoch": 0.54, "learning_rate": 2.3218365147514798e-05, "loss": 2.2845, "step": 307150 }, { "epoch": 0.54, "learning_rate": 2.3217493207587972e-05, "loss": 2.4087, "step": 307160 }, { "epoch": 0.54, "learning_rate": 2.3216621267661146e-05, "loss": 2.3373, "step": 307170 }, { "epoch": 0.54, "learning_rate": 2.321574932773432e-05, "loss": 2.4432, "step": 307180 }, { "epoch": 0.54, "learning_rate": 2.321487738780749e-05, "loss": 2.4192, "step": 307190 }, { "epoch": 0.54, "learning_rate": 2.3214005447880664e-05, "loss": 2.3801, "step": 307200 }, { "epoch": 0.54, "learning_rate": 2.3213133507953837e-05, "loss": 2.3561, "step": 307210 }, { "epoch": 0.54, "learning_rate": 2.321226156802701e-05, "loss": 2.3334, "step": 307220 }, { "epoch": 0.54, "learning_rate": 2.321138962810018e-05, "loss": 2.2995, "step": 307230 }, { "epoch": 0.54, "learning_rate": 2.3210517688173355e-05, "loss": 2.2386, "step": 307240 }, { "epoch": 0.54, "learning_rate": 2.3209645748246532e-05, "loss": 2.2522, "step": 307250 }, { "epoch": 0.54, "learning_rate": 2.3208773808319703e-05, "loss": 2.2986, "step": 307260 }, { "epoch": 0.54, "learning_rate": 2.3207901868392877e-05, "loss": 2.4082, "step": 307270 }, { "epoch": 0.54, "learning_rate": 2.320702992846605e-05, "loss": 2.2183, "step": 307280 }, { "epoch": 0.54, "learning_rate": 2.3206157988539224e-05, "loss": 2.4093, "step": 307290 }, { "epoch": 0.54, "learning_rate": 2.3205286048612394e-05, "loss": 2.2705, "step": 307300 }, { "epoch": 0.54, "learning_rate": 2.3204414108685568e-05, "loss": 2.4365, "step": 307310 }, { "epoch": 0.54, "learning_rate": 2.3203542168758742e-05, "loss": 2.303, "step": 307320 }, { "epoch": 0.54, "learning_rate": 2.3202670228831916e-05, "loss": 2.3416, "step": 307330 }, { "epoch": 0.54, "learning_rate": 2.320179828890509e-05, "loss": 2.3932, "step": 307340 }, { "epoch": 0.54, "learning_rate": 2.320092634897826e-05, "loss": 2.2163, "step": 307350 }, { "epoch": 0.54, "learning_rate": 2.3200054409051437e-05, "loss": 2.4351, "step": 307360 }, { "epoch": 0.54, "learning_rate": 2.3199182469124607e-05, "loss": 2.4136, "step": 307370 }, { "epoch": 0.54, "learning_rate": 2.319831052919778e-05, "loss": 2.3591, "step": 307380 }, { "epoch": 0.54, "learning_rate": 2.3197438589270955e-05, "loss": 2.3674, "step": 307390 }, { "epoch": 0.54, "learning_rate": 2.319656664934413e-05, "loss": 2.349, "step": 307400 }, { "epoch": 0.54, "learning_rate": 2.3195694709417303e-05, "loss": 2.4122, "step": 307410 }, { "epoch": 0.54, "learning_rate": 2.3194822769490473e-05, "loss": 2.2862, "step": 307420 }, { "epoch": 0.54, "learning_rate": 2.319395082956365e-05, "loss": 2.3248, "step": 307430 }, { "epoch": 0.54, "learning_rate": 2.319307888963682e-05, "loss": 2.3845, "step": 307440 }, { "epoch": 0.54, "learning_rate": 2.3192206949709994e-05, "loss": 2.4467, "step": 307450 }, { "epoch": 0.54, "learning_rate": 2.3191335009783165e-05, "loss": 2.3945, "step": 307460 }, { "epoch": 0.54, "learning_rate": 2.3190463069856342e-05, "loss": 2.3087, "step": 307470 }, { "epoch": 0.54, "learning_rate": 2.3189591129929512e-05, "loss": 2.3568, "step": 307480 }, { "epoch": 0.54, "learning_rate": 2.3188719190002686e-05, "loss": 2.3391, "step": 307490 }, { "epoch": 0.54, "learning_rate": 2.318784725007586e-05, "loss": 2.3964, "step": 307500 }, { "epoch": 0.54, "learning_rate": 2.3186975310149033e-05, "loss": 2.3436, "step": 307510 }, { "epoch": 0.54, "learning_rate": 2.3186103370222207e-05, "loss": 2.3028, "step": 307520 }, { "epoch": 0.54, "learning_rate": 2.3185231430295378e-05, "loss": 2.4295, "step": 307530 }, { "epoch": 0.54, "learning_rate": 2.3184359490368555e-05, "loss": 2.365, "step": 307540 }, { "epoch": 0.54, "learning_rate": 2.3183487550441725e-05, "loss": 2.3828, "step": 307550 }, { "epoch": 0.54, "learning_rate": 2.31826156105149e-05, "loss": 2.389, "step": 307560 }, { "epoch": 0.54, "learning_rate": 2.3181743670588073e-05, "loss": 2.3816, "step": 307570 }, { "epoch": 0.54, "learning_rate": 2.3180871730661246e-05, "loss": 2.3344, "step": 307580 }, { "epoch": 0.54, "learning_rate": 2.317999979073442e-05, "loss": 2.3323, "step": 307590 }, { "epoch": 0.54, "learning_rate": 2.317912785080759e-05, "loss": 2.2775, "step": 307600 }, { "epoch": 0.54, "learning_rate": 2.3178255910880764e-05, "loss": 2.3133, "step": 307610 }, { "epoch": 0.54, "learning_rate": 2.3177383970953938e-05, "loss": 2.2677, "step": 307620 }, { "epoch": 0.54, "learning_rate": 2.3176512031027112e-05, "loss": 2.4139, "step": 307630 }, { "epoch": 0.54, "learning_rate": 2.3175640091100286e-05, "loss": 2.4077, "step": 307640 }, { "epoch": 0.54, "learning_rate": 2.3174768151173456e-05, "loss": 2.3651, "step": 307650 }, { "epoch": 0.54, "learning_rate": 2.3173896211246633e-05, "loss": 2.3525, "step": 307660 }, { "epoch": 0.54, "learning_rate": 2.3173024271319804e-05, "loss": 2.2801, "step": 307670 }, { "epoch": 0.54, "learning_rate": 2.3172152331392977e-05, "loss": 2.2808, "step": 307680 }, { "epoch": 0.54, "learning_rate": 2.317128039146615e-05, "loss": 2.3117, "step": 307690 }, { "epoch": 0.54, "learning_rate": 2.3170408451539325e-05, "loss": 2.3952, "step": 307700 }, { "epoch": 0.54, "learning_rate": 2.3169536511612495e-05, "loss": 2.335, "step": 307710 }, { "epoch": 0.54, "learning_rate": 2.316866457168567e-05, "loss": 2.5446, "step": 307720 }, { "epoch": 0.54, "learning_rate": 2.3167792631758846e-05, "loss": 2.3703, "step": 307730 }, { "epoch": 0.54, "learning_rate": 2.3166920691832017e-05, "loss": 2.3234, "step": 307740 }, { "epoch": 0.54, "learning_rate": 2.316604875190519e-05, "loss": 2.3474, "step": 307750 }, { "epoch": 0.54, "learning_rate": 2.316517681197836e-05, "loss": 2.3584, "step": 307760 }, { "epoch": 0.54, "learning_rate": 2.3164304872051538e-05, "loss": 2.3688, "step": 307770 }, { "epoch": 0.54, "learning_rate": 2.3163432932124708e-05, "loss": 2.304, "step": 307780 }, { "epoch": 0.54, "learning_rate": 2.3162560992197882e-05, "loss": 2.3271, "step": 307790 }, { "epoch": 0.54, "learning_rate": 2.3161689052271056e-05, "loss": 2.3117, "step": 307800 }, { "epoch": 0.54, "learning_rate": 2.316081711234423e-05, "loss": 2.3056, "step": 307810 }, { "epoch": 0.54, "learning_rate": 2.3159945172417403e-05, "loss": 2.4345, "step": 307820 }, { "epoch": 0.54, "learning_rate": 2.3159073232490574e-05, "loss": 2.3774, "step": 307830 }, { "epoch": 0.54, "learning_rate": 2.315820129256375e-05, "loss": 2.3886, "step": 307840 }, { "epoch": 0.54, "learning_rate": 2.315732935263692e-05, "loss": 2.3168, "step": 307850 }, { "epoch": 0.54, "learning_rate": 2.3156457412710095e-05, "loss": 2.4064, "step": 307860 }, { "epoch": 0.54, "learning_rate": 2.315558547278327e-05, "loss": 2.4216, "step": 307870 }, { "epoch": 0.54, "learning_rate": 2.3154713532856443e-05, "loss": 2.3461, "step": 307880 }, { "epoch": 0.54, "learning_rate": 2.3153841592929616e-05, "loss": 2.3366, "step": 307890 }, { "epoch": 0.54, "learning_rate": 2.3152969653002787e-05, "loss": 2.3301, "step": 307900 }, { "epoch": 0.54, "learning_rate": 2.315209771307596e-05, "loss": 2.2644, "step": 307910 }, { "epoch": 0.54, "learning_rate": 2.3151225773149134e-05, "loss": 2.3029, "step": 307920 }, { "epoch": 0.54, "learning_rate": 2.3150353833222308e-05, "loss": 2.3099, "step": 307930 }, { "epoch": 0.54, "learning_rate": 2.314948189329548e-05, "loss": 2.2722, "step": 307940 }, { "epoch": 0.54, "learning_rate": 2.3148609953368656e-05, "loss": 2.4429, "step": 307950 }, { "epoch": 0.54, "learning_rate": 2.3147738013441826e-05, "loss": 2.2755, "step": 307960 }, { "epoch": 0.54, "learning_rate": 2.3146866073515e-05, "loss": 2.4211, "step": 307970 }, { "epoch": 0.54, "learning_rate": 2.3145994133588174e-05, "loss": 2.4952, "step": 307980 }, { "epoch": 0.54, "learning_rate": 2.3145122193661347e-05, "loss": 2.2692, "step": 307990 }, { "epoch": 0.54, "learning_rate": 2.314425025373452e-05, "loss": 2.328, "step": 308000 }, { "epoch": 0.54, "learning_rate": 2.314337831380769e-05, "loss": 2.3214, "step": 308010 }, { "epoch": 0.54, "learning_rate": 2.3142506373880865e-05, "loss": 2.2848, "step": 308020 }, { "epoch": 0.54, "learning_rate": 2.314163443395404e-05, "loss": 2.3698, "step": 308030 }, { "epoch": 0.54, "learning_rate": 2.3140762494027213e-05, "loss": 2.4306, "step": 308040 }, { "epoch": 0.54, "learning_rate": 2.3139890554100387e-05, "loss": 2.3984, "step": 308050 }, { "epoch": 0.54, "learning_rate": 2.3139018614173557e-05, "loss": 2.2873, "step": 308060 }, { "epoch": 0.54, "learning_rate": 2.3138146674246734e-05, "loss": 2.3187, "step": 308070 }, { "epoch": 0.54, "learning_rate": 2.3137274734319904e-05, "loss": 2.4468, "step": 308080 }, { "epoch": 0.54, "learning_rate": 2.3136402794393078e-05, "loss": 2.2986, "step": 308090 }, { "epoch": 0.54, "learning_rate": 2.3135530854466252e-05, "loss": 2.3454, "step": 308100 }, { "epoch": 0.54, "learning_rate": 2.3134658914539426e-05, "loss": 2.2789, "step": 308110 }, { "epoch": 0.54, "learning_rate": 2.31337869746126e-05, "loss": 2.2691, "step": 308120 }, { "epoch": 0.54, "learning_rate": 2.313291503468577e-05, "loss": 2.3339, "step": 308130 }, { "epoch": 0.54, "learning_rate": 2.3132043094758947e-05, "loss": 2.362, "step": 308140 }, { "epoch": 0.54, "learning_rate": 2.3131171154832117e-05, "loss": 2.4109, "step": 308150 }, { "epoch": 0.54, "learning_rate": 2.313029921490529e-05, "loss": 2.4519, "step": 308160 }, { "epoch": 0.54, "learning_rate": 2.312942727497846e-05, "loss": 2.3204, "step": 308170 }, { "epoch": 0.54, "learning_rate": 2.312855533505164e-05, "loss": 2.4331, "step": 308180 }, { "epoch": 0.54, "learning_rate": 2.312768339512481e-05, "loss": 2.3897, "step": 308190 }, { "epoch": 0.54, "learning_rate": 2.3126811455197983e-05, "loss": 2.3581, "step": 308200 }, { "epoch": 0.54, "learning_rate": 2.3125939515271157e-05, "loss": 2.4071, "step": 308210 }, { "epoch": 0.54, "learning_rate": 2.312506757534433e-05, "loss": 2.5047, "step": 308220 }, { "epoch": 0.54, "learning_rate": 2.3124195635417504e-05, "loss": 2.3848, "step": 308230 }, { "epoch": 0.54, "learning_rate": 2.3123323695490675e-05, "loss": 2.4267, "step": 308240 }, { "epoch": 0.54, "learning_rate": 2.3122451755563852e-05, "loss": 2.3446, "step": 308250 }, { "epoch": 0.54, "learning_rate": 2.3121579815637022e-05, "loss": 2.2854, "step": 308260 }, { "epoch": 0.54, "learning_rate": 2.3120707875710196e-05, "loss": 2.368, "step": 308270 }, { "epoch": 0.54, "learning_rate": 2.311983593578337e-05, "loss": 2.3558, "step": 308280 }, { "epoch": 0.54, "learning_rate": 2.3118963995856543e-05, "loss": 2.4043, "step": 308290 }, { "epoch": 0.54, "learning_rate": 2.3118092055929717e-05, "loss": 2.3805, "step": 308300 }, { "epoch": 0.54, "learning_rate": 2.3117220116002888e-05, "loss": 2.2663, "step": 308310 }, { "epoch": 0.54, "learning_rate": 2.311634817607606e-05, "loss": 2.3266, "step": 308320 }, { "epoch": 0.54, "learning_rate": 2.3115476236149235e-05, "loss": 2.2826, "step": 308330 }, { "epoch": 0.54, "learning_rate": 2.311460429622241e-05, "loss": 2.34, "step": 308340 }, { "epoch": 0.54, "learning_rate": 2.3113732356295583e-05, "loss": 2.2159, "step": 308350 }, { "epoch": 0.54, "learning_rate": 2.3112860416368756e-05, "loss": 2.2704, "step": 308360 }, { "epoch": 0.54, "learning_rate": 2.311198847644193e-05, "loss": 2.3178, "step": 308370 }, { "epoch": 0.54, "learning_rate": 2.31111165365151e-05, "loss": 2.28, "step": 308380 }, { "epoch": 0.54, "learning_rate": 2.3110244596588274e-05, "loss": 2.4512, "step": 308390 }, { "epoch": 0.54, "learning_rate": 2.3109372656661448e-05, "loss": 2.4277, "step": 308400 }, { "epoch": 0.54, "learning_rate": 2.3108500716734622e-05, "loss": 2.4223, "step": 308410 }, { "epoch": 0.54, "learning_rate": 2.3107628776807792e-05, "loss": 2.4024, "step": 308420 }, { "epoch": 0.54, "learning_rate": 2.3106756836880966e-05, "loss": 2.3133, "step": 308430 }, { "epoch": 0.54, "learning_rate": 2.310588489695414e-05, "loss": 2.4321, "step": 308440 }, { "epoch": 0.54, "learning_rate": 2.3105012957027314e-05, "loss": 2.3256, "step": 308450 }, { "epoch": 0.54, "learning_rate": 2.3104141017100487e-05, "loss": 2.3274, "step": 308460 }, { "epoch": 0.54, "learning_rate": 2.310326907717366e-05, "loss": 2.399, "step": 308470 }, { "epoch": 0.54, "learning_rate": 2.3102397137246835e-05, "loss": 2.2953, "step": 308480 }, { "epoch": 0.54, "learning_rate": 2.3101525197320005e-05, "loss": 2.4566, "step": 308490 }, { "epoch": 0.54, "learning_rate": 2.310065325739318e-05, "loss": 2.2903, "step": 308500 }, { "epoch": 0.54, "learning_rate": 2.3099781317466353e-05, "loss": 2.4233, "step": 308510 }, { "epoch": 0.54, "learning_rate": 2.3098909377539527e-05, "loss": 2.3966, "step": 308520 }, { "epoch": 0.54, "learning_rate": 2.30980374376127e-05, "loss": 2.3474, "step": 308530 }, { "epoch": 0.54, "learning_rate": 2.309716549768587e-05, "loss": 2.2508, "step": 308540 }, { "epoch": 0.54, "learning_rate": 2.3096293557759048e-05, "loss": 2.3078, "step": 308550 }, { "epoch": 0.54, "learning_rate": 2.3095421617832218e-05, "loss": 2.4158, "step": 308560 }, { "epoch": 0.54, "learning_rate": 2.3094549677905392e-05, "loss": 2.3783, "step": 308570 }, { "epoch": 0.54, "learning_rate": 2.3093677737978562e-05, "loss": 2.4238, "step": 308580 }, { "epoch": 0.54, "learning_rate": 2.309280579805174e-05, "loss": 2.3675, "step": 308590 }, { "epoch": 0.54, "learning_rate": 2.3091933858124913e-05, "loss": 2.3529, "step": 308600 }, { "epoch": 0.54, "learning_rate": 2.3091061918198084e-05, "loss": 2.4153, "step": 308610 }, { "epoch": 0.54, "learning_rate": 2.309018997827126e-05, "loss": 2.1741, "step": 308620 }, { "epoch": 0.54, "learning_rate": 2.308931803834443e-05, "loss": 2.345, "step": 308630 }, { "epoch": 0.54, "learning_rate": 2.3088446098417605e-05, "loss": 2.2745, "step": 308640 }, { "epoch": 0.54, "learning_rate": 2.3087574158490775e-05, "loss": 2.2047, "step": 308650 }, { "epoch": 0.54, "learning_rate": 2.3086702218563953e-05, "loss": 2.4047, "step": 308660 }, { "epoch": 0.54, "learning_rate": 2.3085830278637123e-05, "loss": 2.4789, "step": 308670 }, { "epoch": 0.54, "learning_rate": 2.3084958338710297e-05, "loss": 2.3106, "step": 308680 }, { "epoch": 0.54, "learning_rate": 2.308408639878347e-05, "loss": 2.32, "step": 308690 }, { "epoch": 0.54, "learning_rate": 2.3083214458856644e-05, "loss": 2.3605, "step": 308700 }, { "epoch": 0.54, "learning_rate": 2.3082342518929818e-05, "loss": 2.3522, "step": 308710 }, { "epoch": 0.54, "learning_rate": 2.308147057900299e-05, "loss": 2.333, "step": 308720 }, { "epoch": 0.54, "learning_rate": 2.3080598639076162e-05, "loss": 2.3514, "step": 308730 }, { "epoch": 0.54, "learning_rate": 2.3079726699149336e-05, "loss": 2.3047, "step": 308740 }, { "epoch": 0.54, "learning_rate": 2.307885475922251e-05, "loss": 2.4302, "step": 308750 }, { "epoch": 0.54, "learning_rate": 2.3077982819295684e-05, "loss": 2.4445, "step": 308760 }, { "epoch": 0.54, "learning_rate": 2.3077110879368857e-05, "loss": 2.2356, "step": 308770 }, { "epoch": 0.54, "learning_rate": 2.307623893944203e-05, "loss": 2.3144, "step": 308780 }, { "epoch": 0.54, "learning_rate": 2.30753669995152e-05, "loss": 2.327, "step": 308790 }, { "epoch": 0.54, "learning_rate": 2.3074495059588375e-05, "loss": 2.3684, "step": 308800 }, { "epoch": 0.54, "learning_rate": 2.307362311966155e-05, "loss": 2.3763, "step": 308810 }, { "epoch": 0.54, "learning_rate": 2.3072751179734723e-05, "loss": 2.4955, "step": 308820 }, { "epoch": 0.54, "learning_rate": 2.3071879239807893e-05, "loss": 2.217, "step": 308830 }, { "epoch": 0.54, "learning_rate": 2.3071007299881067e-05, "loss": 2.3307, "step": 308840 }, { "epoch": 0.54, "learning_rate": 2.3070135359954244e-05, "loss": 2.3995, "step": 308850 }, { "epoch": 0.54, "learning_rate": 2.3069263420027414e-05, "loss": 2.3188, "step": 308860 }, { "epoch": 0.54, "learning_rate": 2.3068391480100588e-05, "loss": 2.4257, "step": 308870 }, { "epoch": 0.54, "learning_rate": 2.3067519540173762e-05, "loss": 2.358, "step": 308880 }, { "epoch": 0.54, "learning_rate": 2.3066647600246936e-05, "loss": 2.3219, "step": 308890 }, { "epoch": 0.54, "learning_rate": 2.3065775660320106e-05, "loss": 2.3955, "step": 308900 }, { "epoch": 0.54, "learning_rate": 2.306490372039328e-05, "loss": 2.3413, "step": 308910 }, { "epoch": 0.54, "learning_rate": 2.3064031780466454e-05, "loss": 2.2109, "step": 308920 }, { "epoch": 0.54, "learning_rate": 2.3063159840539627e-05, "loss": 2.4715, "step": 308930 }, { "epoch": 0.54, "learning_rate": 2.30622879006128e-05, "loss": 2.4194, "step": 308940 }, { "epoch": 0.54, "learning_rate": 2.306141596068597e-05, "loss": 2.4249, "step": 308950 }, { "epoch": 0.54, "learning_rate": 2.306054402075915e-05, "loss": 2.3834, "step": 308960 }, { "epoch": 0.54, "learning_rate": 2.305967208083232e-05, "loss": 2.3294, "step": 308970 }, { "epoch": 0.54, "learning_rate": 2.3058800140905493e-05, "loss": 2.3259, "step": 308980 }, { "epoch": 0.54, "learning_rate": 2.3057928200978667e-05, "loss": 2.3885, "step": 308990 }, { "epoch": 0.54, "learning_rate": 2.305705626105184e-05, "loss": 2.3564, "step": 309000 }, { "epoch": 0.54, "learning_rate": 2.3056184321125014e-05, "loss": 2.4174, "step": 309010 }, { "epoch": 0.54, "learning_rate": 2.3055312381198185e-05, "loss": 2.3482, "step": 309020 }, { "epoch": 0.54, "learning_rate": 2.3054440441271362e-05, "loss": 2.3369, "step": 309030 }, { "epoch": 0.54, "learning_rate": 2.3053568501344532e-05, "loss": 2.2842, "step": 309040 }, { "epoch": 0.54, "learning_rate": 2.3052696561417706e-05, "loss": 2.3913, "step": 309050 }, { "epoch": 0.54, "learning_rate": 2.3051824621490876e-05, "loss": 2.3162, "step": 309060 }, { "epoch": 0.54, "learning_rate": 2.3050952681564053e-05, "loss": 2.4402, "step": 309070 }, { "epoch": 0.54, "learning_rate": 2.3050080741637227e-05, "loss": 2.3623, "step": 309080 }, { "epoch": 0.54, "learning_rate": 2.3049208801710398e-05, "loss": 2.3617, "step": 309090 }, { "epoch": 0.54, "learning_rate": 2.304833686178357e-05, "loss": 2.2225, "step": 309100 }, { "epoch": 0.54, "learning_rate": 2.3047464921856745e-05, "loss": 2.4258, "step": 309110 }, { "epoch": 0.54, "learning_rate": 2.304659298192992e-05, "loss": 2.2446, "step": 309120 }, { "epoch": 0.54, "learning_rate": 2.304572104200309e-05, "loss": 2.418, "step": 309130 }, { "epoch": 0.54, "learning_rate": 2.3044849102076266e-05, "loss": 2.282, "step": 309140 }, { "epoch": 0.54, "learning_rate": 2.3043977162149437e-05, "loss": 2.3853, "step": 309150 }, { "epoch": 0.54, "learning_rate": 2.304310522222261e-05, "loss": 2.3168, "step": 309160 }, { "epoch": 0.54, "learning_rate": 2.3042233282295784e-05, "loss": 2.3995, "step": 309170 }, { "epoch": 0.54, "learning_rate": 2.3041361342368958e-05, "loss": 2.2738, "step": 309180 }, { "epoch": 0.54, "learning_rate": 2.3040489402442132e-05, "loss": 2.318, "step": 309190 }, { "epoch": 0.54, "learning_rate": 2.3039617462515302e-05, "loss": 2.2969, "step": 309200 }, { "epoch": 0.54, "learning_rate": 2.3038745522588476e-05, "loss": 2.2593, "step": 309210 }, { "epoch": 0.54, "learning_rate": 2.303787358266165e-05, "loss": 2.3654, "step": 309220 }, { "epoch": 0.54, "learning_rate": 2.3037001642734824e-05, "loss": 2.3673, "step": 309230 }, { "epoch": 0.54, "learning_rate": 2.3036129702807997e-05, "loss": 2.3284, "step": 309240 }, { "epoch": 0.54, "learning_rate": 2.3035257762881168e-05, "loss": 2.3593, "step": 309250 }, { "epoch": 0.54, "learning_rate": 2.3034385822954345e-05, "loss": 2.3454, "step": 309260 }, { "epoch": 0.54, "learning_rate": 2.3033513883027515e-05, "loss": 2.3303, "step": 309270 }, { "epoch": 0.54, "learning_rate": 2.303264194310069e-05, "loss": 2.3101, "step": 309280 }, { "epoch": 0.54, "learning_rate": 2.3031770003173863e-05, "loss": 2.3515, "step": 309290 }, { "epoch": 0.54, "learning_rate": 2.3030898063247037e-05, "loss": 2.4038, "step": 309300 }, { "epoch": 0.54, "learning_rate": 2.3030026123320207e-05, "loss": 2.2953, "step": 309310 }, { "epoch": 0.54, "learning_rate": 2.302915418339338e-05, "loss": 2.3679, "step": 309320 }, { "epoch": 0.54, "learning_rate": 2.3028282243466558e-05, "loss": 2.3405, "step": 309330 }, { "epoch": 0.54, "learning_rate": 2.3027410303539728e-05, "loss": 2.395, "step": 309340 }, { "epoch": 0.54, "learning_rate": 2.3026538363612902e-05, "loss": 2.3237, "step": 309350 }, { "epoch": 0.54, "learning_rate": 2.3025666423686072e-05, "loss": 2.3769, "step": 309360 }, { "epoch": 0.54, "learning_rate": 2.302479448375925e-05, "loss": 2.3819, "step": 309370 }, { "epoch": 0.54, "learning_rate": 2.302392254383242e-05, "loss": 2.2777, "step": 309380 }, { "epoch": 0.54, "learning_rate": 2.3023050603905594e-05, "loss": 2.3574, "step": 309390 }, { "epoch": 0.54, "learning_rate": 2.3022178663978768e-05, "loss": 2.2716, "step": 309400 }, { "epoch": 0.54, "learning_rate": 2.302130672405194e-05, "loss": 2.3514, "step": 309410 }, { "epoch": 0.54, "learning_rate": 2.3020434784125115e-05, "loss": 2.2668, "step": 309420 }, { "epoch": 0.54, "learning_rate": 2.3019562844198285e-05, "loss": 2.3517, "step": 309430 }, { "epoch": 0.54, "learning_rate": 2.3018690904271463e-05, "loss": 2.2889, "step": 309440 }, { "epoch": 0.54, "learning_rate": 2.3017818964344633e-05, "loss": 2.3778, "step": 309450 }, { "epoch": 0.54, "learning_rate": 2.3016947024417807e-05, "loss": 2.269, "step": 309460 }, { "epoch": 0.54, "learning_rate": 2.301607508449098e-05, "loss": 2.3228, "step": 309470 }, { "epoch": 0.54, "learning_rate": 2.3015203144564154e-05, "loss": 2.3774, "step": 309480 }, { "epoch": 0.54, "learning_rate": 2.3014331204637328e-05, "loss": 2.4254, "step": 309490 }, { "epoch": 0.54, "learning_rate": 2.30134592647105e-05, "loss": 2.2631, "step": 309500 }, { "epoch": 0.54, "learning_rate": 2.3012587324783672e-05, "loss": 2.4287, "step": 309510 }, { "epoch": 0.54, "learning_rate": 2.3011715384856846e-05, "loss": 2.3152, "step": 309520 }, { "epoch": 0.54, "learning_rate": 2.301084344493002e-05, "loss": 2.344, "step": 309530 }, { "epoch": 0.54, "learning_rate": 2.300997150500319e-05, "loss": 2.2597, "step": 309540 }, { "epoch": 0.54, "learning_rate": 2.3009099565076367e-05, "loss": 2.2466, "step": 309550 }, { "epoch": 0.54, "learning_rate": 2.3008227625149538e-05, "loss": 2.3985, "step": 309560 }, { "epoch": 0.54, "learning_rate": 2.300735568522271e-05, "loss": 2.3702, "step": 309570 }, { "epoch": 0.54, "learning_rate": 2.3006483745295885e-05, "loss": 2.3853, "step": 309580 }, { "epoch": 0.54, "learning_rate": 2.300561180536906e-05, "loss": 2.3261, "step": 309590 }, { "epoch": 0.54, "learning_rate": 2.3004739865442233e-05, "loss": 2.4662, "step": 309600 }, { "epoch": 0.54, "learning_rate": 2.3003867925515403e-05, "loss": 2.2797, "step": 309610 }, { "epoch": 0.54, "learning_rate": 2.3002995985588577e-05, "loss": 2.4746, "step": 309620 }, { "epoch": 0.54, "learning_rate": 2.300212404566175e-05, "loss": 2.2587, "step": 309630 }, { "epoch": 0.54, "learning_rate": 2.3001252105734924e-05, "loss": 2.4215, "step": 309640 }, { "epoch": 0.54, "learning_rate": 2.3000380165808098e-05, "loss": 2.363, "step": 309650 }, { "epoch": 0.54, "learning_rate": 2.299950822588127e-05, "loss": 2.3489, "step": 309660 }, { "epoch": 0.54, "learning_rate": 2.2998636285954446e-05, "loss": 2.4456, "step": 309670 }, { "epoch": 0.54, "learning_rate": 2.2997764346027616e-05, "loss": 2.3488, "step": 309680 }, { "epoch": 0.54, "learning_rate": 2.299689240610079e-05, "loss": 2.454, "step": 309690 }, { "epoch": 0.54, "learning_rate": 2.2996020466173964e-05, "loss": 2.4099, "step": 309700 }, { "epoch": 0.54, "learning_rate": 2.2995148526247137e-05, "loss": 2.5074, "step": 309710 }, { "epoch": 0.54, "learning_rate": 2.299427658632031e-05, "loss": 2.3912, "step": 309720 }, { "epoch": 0.54, "learning_rate": 2.299340464639348e-05, "loss": 2.385, "step": 309730 }, { "epoch": 0.54, "learning_rate": 2.299253270646666e-05, "loss": 2.3678, "step": 309740 }, { "epoch": 0.54, "learning_rate": 2.299166076653983e-05, "loss": 2.4252, "step": 309750 }, { "epoch": 0.54, "learning_rate": 2.2990788826613003e-05, "loss": 2.2554, "step": 309760 }, { "epoch": 0.54, "learning_rate": 2.2989916886686173e-05, "loss": 2.3676, "step": 309770 }, { "epoch": 0.54, "learning_rate": 2.298904494675935e-05, "loss": 2.324, "step": 309780 }, { "epoch": 0.54, "learning_rate": 2.298817300683252e-05, "loss": 2.2739, "step": 309790 }, { "epoch": 0.54, "learning_rate": 2.2987301066905695e-05, "loss": 2.3458, "step": 309800 }, { "epoch": 0.54, "learning_rate": 2.2986429126978872e-05, "loss": 2.4042, "step": 309810 }, { "epoch": 0.54, "learning_rate": 2.2985557187052042e-05, "loss": 2.3376, "step": 309820 }, { "epoch": 0.54, "learning_rate": 2.2984685247125216e-05, "loss": 2.3121, "step": 309830 }, { "epoch": 0.54, "learning_rate": 2.2983813307198386e-05, "loss": 2.438, "step": 309840 }, { "epoch": 0.54, "learning_rate": 2.2982941367271563e-05, "loss": 2.3564, "step": 309850 }, { "epoch": 0.54, "learning_rate": 2.2982069427344734e-05, "loss": 2.4303, "step": 309860 }, { "epoch": 0.54, "learning_rate": 2.2981197487417908e-05, "loss": 2.3761, "step": 309870 }, { "epoch": 0.54, "learning_rate": 2.298032554749108e-05, "loss": 2.365, "step": 309880 }, { "epoch": 0.54, "learning_rate": 2.2979453607564255e-05, "loss": 2.2526, "step": 309890 }, { "epoch": 0.54, "learning_rate": 2.297858166763743e-05, "loss": 2.327, "step": 309900 }, { "epoch": 0.54, "learning_rate": 2.29777097277106e-05, "loss": 2.3498, "step": 309910 }, { "epoch": 0.54, "learning_rate": 2.2976837787783773e-05, "loss": 2.3462, "step": 309920 }, { "epoch": 0.54, "learning_rate": 2.2975965847856947e-05, "loss": 2.3909, "step": 309930 }, { "epoch": 0.54, "learning_rate": 2.297509390793012e-05, "loss": 2.3666, "step": 309940 }, { "epoch": 0.54, "learning_rate": 2.2974221968003294e-05, "loss": 2.4615, "step": 309950 }, { "epoch": 0.54, "learning_rate": 2.2973350028076468e-05, "loss": 2.3342, "step": 309960 }, { "epoch": 0.54, "learning_rate": 2.2972478088149642e-05, "loss": 2.4468, "step": 309970 }, { "epoch": 0.54, "learning_rate": 2.2971606148222812e-05, "loss": 2.3805, "step": 309980 }, { "epoch": 0.54, "learning_rate": 2.2970734208295986e-05, "loss": 2.3317, "step": 309990 }, { "epoch": 0.54, "learning_rate": 2.296986226836916e-05, "loss": 2.3041, "step": 310000 }, { "epoch": 0.54, "learning_rate": 2.2968990328442334e-05, "loss": 2.2814, "step": 310010 }, { "epoch": 0.54, "learning_rate": 2.2968118388515504e-05, "loss": 2.3631, "step": 310020 }, { "epoch": 0.54, "learning_rate": 2.2967246448588678e-05, "loss": 2.3224, "step": 310030 }, { "epoch": 0.54, "learning_rate": 2.296637450866185e-05, "loss": 2.4179, "step": 310040 }, { "epoch": 0.54, "learning_rate": 2.2965502568735025e-05, "loss": 2.2716, "step": 310050 }, { "epoch": 0.54, "learning_rate": 2.29646306288082e-05, "loss": 2.2581, "step": 310060 }, { "epoch": 0.54, "learning_rate": 2.2963758688881373e-05, "loss": 2.3106, "step": 310070 }, { "epoch": 0.54, "learning_rate": 2.2962886748954547e-05, "loss": 2.4251, "step": 310080 }, { "epoch": 0.54, "learning_rate": 2.2962014809027717e-05, "loss": 2.308, "step": 310090 }, { "epoch": 0.54, "learning_rate": 2.296114286910089e-05, "loss": 2.389, "step": 310100 }, { "epoch": 0.54, "learning_rate": 2.2960270929174065e-05, "loss": 2.2577, "step": 310110 }, { "epoch": 0.54, "learning_rate": 2.2959398989247238e-05, "loss": 2.3306, "step": 310120 }, { "epoch": 0.54, "learning_rate": 2.2958527049320412e-05, "loss": 2.3226, "step": 310130 }, { "epoch": 0.54, "learning_rate": 2.2957655109393582e-05, "loss": 2.355, "step": 310140 }, { "epoch": 0.54, "learning_rate": 2.295678316946676e-05, "loss": 2.5563, "step": 310150 }, { "epoch": 0.54, "learning_rate": 2.295591122953993e-05, "loss": 2.3578, "step": 310160 }, { "epoch": 0.54, "learning_rate": 2.2955039289613104e-05, "loss": 2.4279, "step": 310170 }, { "epoch": 0.54, "learning_rate": 2.2954167349686274e-05, "loss": 2.269, "step": 310180 }, { "epoch": 0.54, "learning_rate": 2.295329540975945e-05, "loss": 2.3533, "step": 310190 }, { "epoch": 0.54, "learning_rate": 2.2952423469832625e-05, "loss": 2.2829, "step": 310200 }, { "epoch": 0.54, "learning_rate": 2.2951551529905795e-05, "loss": 2.2822, "step": 310210 }, { "epoch": 0.54, "learning_rate": 2.2950679589978973e-05, "loss": 2.3241, "step": 310220 }, { "epoch": 0.54, "learning_rate": 2.2949807650052143e-05, "loss": 2.2963, "step": 310230 }, { "epoch": 0.54, "learning_rate": 2.2948935710125317e-05, "loss": 2.3264, "step": 310240 }, { "epoch": 0.54, "learning_rate": 2.2948063770198487e-05, "loss": 2.3063, "step": 310250 }, { "epoch": 0.54, "learning_rate": 2.2947191830271664e-05, "loss": 2.299, "step": 310260 }, { "epoch": 0.54, "learning_rate": 2.2946319890344835e-05, "loss": 2.3937, "step": 310270 }, { "epoch": 0.54, "learning_rate": 2.294544795041801e-05, "loss": 2.4553, "step": 310280 }, { "epoch": 0.54, "learning_rate": 2.2944576010491182e-05, "loss": 2.391, "step": 310290 }, { "epoch": 0.54, "learning_rate": 2.2943704070564356e-05, "loss": 2.3434, "step": 310300 }, { "epoch": 0.54, "learning_rate": 2.294283213063753e-05, "loss": 2.296, "step": 310310 }, { "epoch": 0.54, "learning_rate": 2.29419601907107e-05, "loss": 2.3769, "step": 310320 }, { "epoch": 0.54, "learning_rate": 2.2941088250783877e-05, "loss": 2.3734, "step": 310330 }, { "epoch": 0.54, "learning_rate": 2.2940216310857048e-05, "loss": 2.4788, "step": 310340 }, { "epoch": 0.54, "learning_rate": 2.293934437093022e-05, "loss": 2.3037, "step": 310350 }, { "epoch": 0.54, "learning_rate": 2.2938472431003395e-05, "loss": 2.3024, "step": 310360 }, { "epoch": 0.54, "learning_rate": 2.293760049107657e-05, "loss": 2.3725, "step": 310370 }, { "epoch": 0.54, "learning_rate": 2.2936728551149743e-05, "loss": 2.4222, "step": 310380 }, { "epoch": 0.54, "learning_rate": 2.2935856611222913e-05, "loss": 2.4066, "step": 310390 }, { "epoch": 0.54, "learning_rate": 2.2934984671296087e-05, "loss": 2.2567, "step": 310400 }, { "epoch": 0.54, "learning_rate": 2.293411273136926e-05, "loss": 2.3455, "step": 310410 }, { "epoch": 0.54, "learning_rate": 2.2933240791442434e-05, "loss": 2.3122, "step": 310420 }, { "epoch": 0.54, "learning_rate": 2.2932368851515608e-05, "loss": 2.4473, "step": 310430 }, { "epoch": 0.54, "learning_rate": 2.293149691158878e-05, "loss": 2.3213, "step": 310440 }, { "epoch": 0.54, "learning_rate": 2.2930624971661956e-05, "loss": 2.4715, "step": 310450 }, { "epoch": 0.54, "learning_rate": 2.2929753031735126e-05, "loss": 2.3872, "step": 310460 }, { "epoch": 0.54, "learning_rate": 2.29288810918083e-05, "loss": 2.3489, "step": 310470 }, { "epoch": 0.54, "learning_rate": 2.2928009151881474e-05, "loss": 2.3108, "step": 310480 }, { "epoch": 0.54, "learning_rate": 2.2927137211954647e-05, "loss": 2.4139, "step": 310490 }, { "epoch": 0.54, "learning_rate": 2.2926265272027818e-05, "loss": 2.3336, "step": 310500 }, { "epoch": 0.54, "learning_rate": 2.292539333210099e-05, "loss": 2.3945, "step": 310510 }, { "epoch": 0.54, "learning_rate": 2.2924521392174165e-05, "loss": 2.4009, "step": 310520 }, { "epoch": 0.54, "learning_rate": 2.292364945224734e-05, "loss": 2.3049, "step": 310530 }, { "epoch": 0.54, "learning_rate": 2.2922777512320513e-05, "loss": 2.3334, "step": 310540 }, { "epoch": 0.54, "learning_rate": 2.2921905572393683e-05, "loss": 2.3231, "step": 310550 }, { "epoch": 0.54, "learning_rate": 2.292103363246686e-05, "loss": 2.3574, "step": 310560 }, { "epoch": 0.54, "learning_rate": 2.292016169254003e-05, "loss": 2.3374, "step": 310570 }, { "epoch": 0.54, "learning_rate": 2.2919289752613205e-05, "loss": 2.315, "step": 310580 }, { "epoch": 0.54, "learning_rate": 2.291841781268638e-05, "loss": 2.3086, "step": 310590 }, { "epoch": 0.54, "learning_rate": 2.2917545872759552e-05, "loss": 2.2405, "step": 310600 }, { "epoch": 0.54, "learning_rate": 2.2916673932832726e-05, "loss": 2.3102, "step": 310610 }, { "epoch": 0.54, "learning_rate": 2.2915801992905896e-05, "loss": 2.3825, "step": 310620 }, { "epoch": 0.54, "learning_rate": 2.2914930052979073e-05, "loss": 2.2727, "step": 310630 }, { "epoch": 0.54, "learning_rate": 2.2914058113052244e-05, "loss": 2.2433, "step": 310640 }, { "epoch": 0.54, "learning_rate": 2.2913186173125418e-05, "loss": 2.3138, "step": 310650 }, { "epoch": 0.54, "learning_rate": 2.2912314233198588e-05, "loss": 2.363, "step": 310660 }, { "epoch": 0.54, "learning_rate": 2.2911442293271765e-05, "loss": 2.303, "step": 310670 }, { "epoch": 0.54, "learning_rate": 2.291057035334494e-05, "loss": 2.2752, "step": 310680 }, { "epoch": 0.54, "learning_rate": 2.290969841341811e-05, "loss": 2.3406, "step": 310690 }, { "epoch": 0.54, "learning_rate": 2.2908826473491283e-05, "loss": 2.2835, "step": 310700 }, { "epoch": 0.54, "learning_rate": 2.2907954533564457e-05, "loss": 2.2091, "step": 310710 }, { "epoch": 0.54, "learning_rate": 2.290708259363763e-05, "loss": 2.3464, "step": 310720 }, { "epoch": 0.54, "learning_rate": 2.29062106537108e-05, "loss": 2.4372, "step": 310730 }, { "epoch": 0.54, "learning_rate": 2.2905338713783978e-05, "loss": 2.3064, "step": 310740 }, { "epoch": 0.54, "learning_rate": 2.290446677385715e-05, "loss": 2.3329, "step": 310750 }, { "epoch": 0.54, "learning_rate": 2.2903594833930322e-05, "loss": 2.3609, "step": 310760 }, { "epoch": 0.54, "learning_rate": 2.2902722894003496e-05, "loss": 2.3469, "step": 310770 }, { "epoch": 0.54, "learning_rate": 2.290185095407667e-05, "loss": 2.4503, "step": 310780 }, { "epoch": 0.54, "learning_rate": 2.2900979014149844e-05, "loss": 2.3143, "step": 310790 }, { "epoch": 0.54, "learning_rate": 2.2900107074223014e-05, "loss": 2.3876, "step": 310800 }, { "epoch": 0.54, "learning_rate": 2.2899235134296188e-05, "loss": 2.2584, "step": 310810 }, { "epoch": 0.54, "learning_rate": 2.289836319436936e-05, "loss": 2.3295, "step": 310820 }, { "epoch": 0.54, "learning_rate": 2.2897491254442535e-05, "loss": 2.4838, "step": 310830 }, { "epoch": 0.54, "learning_rate": 2.289661931451571e-05, "loss": 2.3394, "step": 310840 }, { "epoch": 0.54, "learning_rate": 2.289574737458888e-05, "loss": 2.2702, "step": 310850 }, { "epoch": 0.54, "learning_rate": 2.2894875434662057e-05, "loss": 2.3025, "step": 310860 }, { "epoch": 0.54, "learning_rate": 2.2894003494735227e-05, "loss": 2.3129, "step": 310870 }, { "epoch": 0.54, "learning_rate": 2.28931315548084e-05, "loss": 2.3993, "step": 310880 }, { "epoch": 0.54, "learning_rate": 2.2892259614881575e-05, "loss": 2.3537, "step": 310890 }, { "epoch": 0.54, "learning_rate": 2.289138767495475e-05, "loss": 2.2166, "step": 310900 }, { "epoch": 0.54, "learning_rate": 2.289051573502792e-05, "loss": 2.3975, "step": 310910 }, { "epoch": 0.54, "learning_rate": 2.2889643795101092e-05, "loss": 2.3784, "step": 310920 }, { "epoch": 0.54, "learning_rate": 2.288877185517427e-05, "loss": 2.3723, "step": 310930 }, { "epoch": 0.54, "learning_rate": 2.288789991524744e-05, "loss": 2.2979, "step": 310940 }, { "epoch": 0.54, "learning_rate": 2.2887027975320614e-05, "loss": 2.2904, "step": 310950 }, { "epoch": 0.54, "learning_rate": 2.2886156035393784e-05, "loss": 2.3426, "step": 310960 }, { "epoch": 0.54, "learning_rate": 2.288528409546696e-05, "loss": 2.2511, "step": 310970 }, { "epoch": 0.54, "learning_rate": 2.288441215554013e-05, "loss": 2.3457, "step": 310980 }, { "epoch": 0.54, "learning_rate": 2.2883540215613305e-05, "loss": 2.2078, "step": 310990 }, { "epoch": 0.54, "learning_rate": 2.288266827568648e-05, "loss": 2.2612, "step": 311000 }, { "epoch": 0.54, "learning_rate": 2.2881796335759653e-05, "loss": 2.5342, "step": 311010 }, { "epoch": 0.54, "learning_rate": 2.2880924395832827e-05, "loss": 2.4467, "step": 311020 }, { "epoch": 0.54, "learning_rate": 2.2880052455905997e-05, "loss": 2.3114, "step": 311030 }, { "epoch": 0.54, "learning_rate": 2.2879180515979174e-05, "loss": 2.2962, "step": 311040 }, { "epoch": 0.54, "learning_rate": 2.2878308576052345e-05, "loss": 2.4604, "step": 311050 }, { "epoch": 0.54, "learning_rate": 2.287743663612552e-05, "loss": 2.4393, "step": 311060 }, { "epoch": 0.54, "learning_rate": 2.2876564696198692e-05, "loss": 2.3673, "step": 311070 }, { "epoch": 0.54, "learning_rate": 2.2875692756271866e-05, "loss": 2.3692, "step": 311080 }, { "epoch": 0.54, "learning_rate": 2.287482081634504e-05, "loss": 2.3674, "step": 311090 }, { "epoch": 0.54, "learning_rate": 2.287394887641821e-05, "loss": 2.3624, "step": 311100 }, { "epoch": 0.54, "learning_rate": 2.2873076936491384e-05, "loss": 2.4216, "step": 311110 }, { "epoch": 0.54, "learning_rate": 2.2872204996564558e-05, "loss": 2.2208, "step": 311120 }, { "epoch": 0.54, "learning_rate": 2.287133305663773e-05, "loss": 2.3237, "step": 311130 }, { "epoch": 0.54, "learning_rate": 2.2870461116710902e-05, "loss": 2.223, "step": 311140 }, { "epoch": 0.54, "learning_rate": 2.286958917678408e-05, "loss": 2.3978, "step": 311150 }, { "epoch": 0.54, "learning_rate": 2.2868717236857253e-05, "loss": 2.378, "step": 311160 }, { "epoch": 0.54, "learning_rate": 2.2867845296930423e-05, "loss": 2.2223, "step": 311170 }, { "epoch": 0.54, "learning_rate": 2.2866973357003597e-05, "loss": 2.4554, "step": 311180 }, { "epoch": 0.54, "learning_rate": 2.286610141707677e-05, "loss": 2.4338, "step": 311190 }, { "epoch": 0.54, "learning_rate": 2.2865229477149944e-05, "loss": 2.3135, "step": 311200 }, { "epoch": 0.54, "learning_rate": 2.2864357537223115e-05, "loss": 2.4422, "step": 311210 }, { "epoch": 0.54, "learning_rate": 2.286348559729629e-05, "loss": 2.2733, "step": 311220 }, { "epoch": 0.54, "learning_rate": 2.2862613657369462e-05, "loss": 2.3215, "step": 311230 }, { "epoch": 0.54, "learning_rate": 2.2861741717442636e-05, "loss": 2.3758, "step": 311240 }, { "epoch": 0.54, "learning_rate": 2.286086977751581e-05, "loss": 2.3548, "step": 311250 }, { "epoch": 0.54, "learning_rate": 2.2859997837588984e-05, "loss": 2.3167, "step": 311260 }, { "epoch": 0.54, "learning_rate": 2.2859125897662157e-05, "loss": 2.315, "step": 311270 }, { "epoch": 0.54, "learning_rate": 2.2858253957735328e-05, "loss": 2.3294, "step": 311280 }, { "epoch": 0.54, "learning_rate": 2.28573820178085e-05, "loss": 2.3582, "step": 311290 }, { "epoch": 0.54, "learning_rate": 2.2856510077881675e-05, "loss": 2.4034, "step": 311300 }, { "epoch": 0.54, "learning_rate": 2.285563813795485e-05, "loss": 2.3458, "step": 311310 }, { "epoch": 0.54, "learning_rate": 2.2854766198028023e-05, "loss": 2.2888, "step": 311320 }, { "epoch": 0.54, "learning_rate": 2.2853894258101193e-05, "loss": 2.4166, "step": 311330 }, { "epoch": 0.54, "learning_rate": 2.285302231817437e-05, "loss": 2.3493, "step": 311340 }, { "epoch": 0.54, "learning_rate": 2.285215037824754e-05, "loss": 2.34, "step": 311350 }, { "epoch": 0.54, "learning_rate": 2.2851278438320715e-05, "loss": 2.3402, "step": 311360 }, { "epoch": 0.54, "learning_rate": 2.2850406498393885e-05, "loss": 2.3165, "step": 311370 }, { "epoch": 0.54, "learning_rate": 2.2849534558467062e-05, "loss": 2.3194, "step": 311380 }, { "epoch": 0.54, "learning_rate": 2.2848662618540233e-05, "loss": 2.407, "step": 311390 }, { "epoch": 0.54, "learning_rate": 2.2847790678613406e-05, "loss": 2.3345, "step": 311400 }, { "epoch": 0.54, "learning_rate": 2.2846918738686583e-05, "loss": 2.3859, "step": 311410 }, { "epoch": 0.54, "learning_rate": 2.2846046798759754e-05, "loss": 2.3354, "step": 311420 }, { "epoch": 0.54, "learning_rate": 2.2845174858832928e-05, "loss": 2.339, "step": 311430 }, { "epoch": 0.54, "learning_rate": 2.2844302918906098e-05, "loss": 2.2823, "step": 311440 }, { "epoch": 0.54, "learning_rate": 2.2843430978979275e-05, "loss": 2.456, "step": 311450 }, { "epoch": 0.54, "learning_rate": 2.2842559039052446e-05, "loss": 2.4084, "step": 311460 }, { "epoch": 0.54, "learning_rate": 2.284168709912562e-05, "loss": 2.2694, "step": 311470 }, { "epoch": 0.54, "learning_rate": 2.2840815159198793e-05, "loss": 2.3406, "step": 311480 }, { "epoch": 0.54, "learning_rate": 2.2839943219271967e-05, "loss": 2.3504, "step": 311490 }, { "epoch": 0.54, "learning_rate": 2.283907127934514e-05, "loss": 2.3869, "step": 311500 }, { "epoch": 0.54, "learning_rate": 2.283819933941831e-05, "loss": 2.4069, "step": 311510 }, { "epoch": 0.54, "learning_rate": 2.2837327399491485e-05, "loss": 2.3829, "step": 311520 }, { "epoch": 0.54, "learning_rate": 2.283645545956466e-05, "loss": 2.3315, "step": 311530 }, { "epoch": 0.54, "learning_rate": 2.2835583519637832e-05, "loss": 2.4456, "step": 311540 }, { "epoch": 0.54, "learning_rate": 2.2834711579711006e-05, "loss": 2.4359, "step": 311550 }, { "epoch": 0.54, "learning_rate": 2.283383963978418e-05, "loss": 2.3643, "step": 311560 }, { "epoch": 0.54, "learning_rate": 2.2832967699857354e-05, "loss": 2.3874, "step": 311570 }, { "epoch": 0.54, "learning_rate": 2.2832095759930524e-05, "loss": 2.2989, "step": 311580 }, { "epoch": 0.54, "learning_rate": 2.2831223820003698e-05, "loss": 2.4085, "step": 311590 }, { "epoch": 0.54, "learning_rate": 2.283035188007687e-05, "loss": 2.3794, "step": 311600 }, { "epoch": 0.54, "learning_rate": 2.2829479940150045e-05, "loss": 2.3747, "step": 311610 }, { "epoch": 0.54, "learning_rate": 2.2828608000223216e-05, "loss": 2.3575, "step": 311620 }, { "epoch": 0.54, "learning_rate": 2.282773606029639e-05, "loss": 2.3367, "step": 311630 }, { "epoch": 0.54, "learning_rate": 2.2826864120369563e-05, "loss": 2.352, "step": 311640 }, { "epoch": 0.54, "learning_rate": 2.2825992180442737e-05, "loss": 2.1931, "step": 311650 }, { "epoch": 0.54, "learning_rate": 2.282512024051591e-05, "loss": 2.4093, "step": 311660 }, { "epoch": 0.54, "learning_rate": 2.2824248300589085e-05, "loss": 2.3494, "step": 311670 }, { "epoch": 0.54, "learning_rate": 2.282337636066226e-05, "loss": 2.3825, "step": 311680 }, { "epoch": 0.54, "learning_rate": 2.282250442073543e-05, "loss": 2.316, "step": 311690 }, { "epoch": 0.54, "learning_rate": 2.2821632480808602e-05, "loss": 2.2928, "step": 311700 }, { "epoch": 0.54, "learning_rate": 2.2820760540881776e-05, "loss": 2.2633, "step": 311710 }, { "epoch": 0.54, "learning_rate": 2.281988860095495e-05, "loss": 2.2747, "step": 311720 }, { "epoch": 0.54, "learning_rate": 2.2819016661028124e-05, "loss": 2.4111, "step": 311730 }, { "epoch": 0.54, "learning_rate": 2.2818144721101294e-05, "loss": 2.3823, "step": 311740 }, { "epoch": 0.54, "learning_rate": 2.281727278117447e-05, "loss": 2.4038, "step": 311750 }, { "epoch": 0.54, "learning_rate": 2.2816400841247642e-05, "loss": 2.4854, "step": 311760 }, { "epoch": 0.54, "learning_rate": 2.2815528901320815e-05, "loss": 2.4312, "step": 311770 }, { "epoch": 0.54, "learning_rate": 2.281465696139399e-05, "loss": 2.2804, "step": 311780 }, { "epoch": 0.54, "learning_rate": 2.2813785021467163e-05, "loss": 2.1642, "step": 311790 }, { "epoch": 0.54, "learning_rate": 2.2812913081540337e-05, "loss": 2.3574, "step": 311800 }, { "epoch": 0.54, "learning_rate": 2.2812041141613507e-05, "loss": 2.3768, "step": 311810 }, { "epoch": 0.54, "learning_rate": 2.2811169201686684e-05, "loss": 2.3778, "step": 311820 }, { "epoch": 0.54, "learning_rate": 2.2810297261759855e-05, "loss": 2.4256, "step": 311830 }, { "epoch": 0.54, "learning_rate": 2.280942532183303e-05, "loss": 2.2905, "step": 311840 }, { "epoch": 0.54, "learning_rate": 2.28085533819062e-05, "loss": 2.3247, "step": 311850 }, { "epoch": 0.54, "learning_rate": 2.2807681441979376e-05, "loss": 2.403, "step": 311860 }, { "epoch": 0.54, "learning_rate": 2.2806809502052546e-05, "loss": 2.5187, "step": 311870 }, { "epoch": 0.54, "learning_rate": 2.280593756212572e-05, "loss": 2.3471, "step": 311880 }, { "epoch": 0.54, "learning_rate": 2.2805065622198894e-05, "loss": 2.3513, "step": 311890 }, { "epoch": 0.54, "learning_rate": 2.2804193682272068e-05, "loss": 2.3286, "step": 311900 }, { "epoch": 0.54, "learning_rate": 2.280332174234524e-05, "loss": 2.4756, "step": 311910 }, { "epoch": 0.54, "learning_rate": 2.2802449802418412e-05, "loss": 2.4419, "step": 311920 }, { "epoch": 0.54, "learning_rate": 2.280157786249159e-05, "loss": 2.2999, "step": 311930 }, { "epoch": 0.54, "learning_rate": 2.280070592256476e-05, "loss": 2.426, "step": 311940 }, { "epoch": 0.54, "learning_rate": 2.2799833982637933e-05, "loss": 2.3991, "step": 311950 }, { "epoch": 0.54, "learning_rate": 2.2798962042711107e-05, "loss": 2.3641, "step": 311960 }, { "epoch": 0.54, "learning_rate": 2.279809010278428e-05, "loss": 2.5196, "step": 311970 }, { "epoch": 0.54, "learning_rate": 2.2797218162857454e-05, "loss": 2.4018, "step": 311980 }, { "epoch": 0.54, "learning_rate": 2.2796346222930625e-05, "loss": 2.3126, "step": 311990 }, { "epoch": 0.54, "learning_rate": 2.27954742830038e-05, "loss": 2.2379, "step": 312000 }, { "epoch": 0.54, "learning_rate": 2.2794602343076972e-05, "loss": 2.4212, "step": 312010 }, { "epoch": 0.54, "learning_rate": 2.2793730403150146e-05, "loss": 2.4378, "step": 312020 }, { "epoch": 0.54, "learning_rate": 2.279285846322332e-05, "loss": 2.3503, "step": 312030 }, { "epoch": 0.54, "learning_rate": 2.279198652329649e-05, "loss": 2.4409, "step": 312040 }, { "epoch": 0.54, "learning_rate": 2.2791114583369667e-05, "loss": 2.3203, "step": 312050 }, { "epoch": 0.54, "learning_rate": 2.2790242643442838e-05, "loss": 2.1087, "step": 312060 }, { "epoch": 0.54, "learning_rate": 2.278937070351601e-05, "loss": 2.4556, "step": 312070 }, { "epoch": 0.54, "learning_rate": 2.2788498763589185e-05, "loss": 2.3684, "step": 312080 }, { "epoch": 0.54, "learning_rate": 2.278762682366236e-05, "loss": 2.4722, "step": 312090 }, { "epoch": 0.54, "learning_rate": 2.278675488373553e-05, "loss": 2.4132, "step": 312100 }, { "epoch": 0.54, "learning_rate": 2.2785882943808703e-05, "loss": 2.3748, "step": 312110 }, { "epoch": 0.54, "learning_rate": 2.2785011003881877e-05, "loss": 2.3852, "step": 312120 }, { "epoch": 0.54, "learning_rate": 2.278413906395505e-05, "loss": 2.4077, "step": 312130 }, { "epoch": 0.54, "learning_rate": 2.2783267124028225e-05, "loss": 2.2971, "step": 312140 }, { "epoch": 0.54, "learning_rate": 2.2782395184101395e-05, "loss": 2.2619, "step": 312150 }, { "epoch": 0.54, "learning_rate": 2.2781523244174572e-05, "loss": 2.3761, "step": 312160 }, { "epoch": 0.54, "learning_rate": 2.2780651304247743e-05, "loss": 2.329, "step": 312170 }, { "epoch": 0.54, "learning_rate": 2.2779779364320916e-05, "loss": 2.3629, "step": 312180 }, { "epoch": 0.54, "learning_rate": 2.277890742439409e-05, "loss": 2.2936, "step": 312190 }, { "epoch": 0.54, "learning_rate": 2.2778035484467264e-05, "loss": 2.4545, "step": 312200 }, { "epoch": 0.54, "learning_rate": 2.2777163544540438e-05, "loss": 2.3475, "step": 312210 }, { "epoch": 0.54, "learning_rate": 2.2776291604613608e-05, "loss": 2.3966, "step": 312220 }, { "epoch": 0.54, "learning_rate": 2.2775419664686785e-05, "loss": 2.4019, "step": 312230 }, { "epoch": 0.54, "learning_rate": 2.2774547724759956e-05, "loss": 2.3677, "step": 312240 }, { "epoch": 0.54, "learning_rate": 2.277367578483313e-05, "loss": 2.3732, "step": 312250 }, { "epoch": 0.54, "learning_rate": 2.27728038449063e-05, "loss": 2.3273, "step": 312260 }, { "epoch": 0.54, "learning_rate": 2.2771931904979477e-05, "loss": 2.3502, "step": 312270 }, { "epoch": 0.54, "learning_rate": 2.277105996505265e-05, "loss": 2.3706, "step": 312280 }, { "epoch": 0.54, "learning_rate": 2.277018802512582e-05, "loss": 2.3331, "step": 312290 }, { "epoch": 0.54, "learning_rate": 2.2769316085198995e-05, "loss": 2.2576, "step": 312300 }, { "epoch": 0.54, "learning_rate": 2.276844414527217e-05, "loss": 2.4447, "step": 312310 }, { "epoch": 0.54, "learning_rate": 2.2767572205345342e-05, "loss": 2.2985, "step": 312320 }, { "epoch": 0.54, "learning_rate": 2.2766700265418513e-05, "loss": 2.4391, "step": 312330 }, { "epoch": 0.54, "learning_rate": 2.276582832549169e-05, "loss": 2.317, "step": 312340 }, { "epoch": 0.54, "learning_rate": 2.276495638556486e-05, "loss": 2.3054, "step": 312350 }, { "epoch": 0.54, "learning_rate": 2.2764084445638034e-05, "loss": 2.2477, "step": 312360 }, { "epoch": 0.54, "learning_rate": 2.2763212505711208e-05, "loss": 2.2919, "step": 312370 }, { "epoch": 0.54, "learning_rate": 2.276234056578438e-05, "loss": 2.3586, "step": 312380 }, { "epoch": 0.54, "learning_rate": 2.2761468625857555e-05, "loss": 2.2678, "step": 312390 }, { "epoch": 0.54, "learning_rate": 2.2760596685930726e-05, "loss": 2.3322, "step": 312400 }, { "epoch": 0.54, "learning_rate": 2.27597247460039e-05, "loss": 2.2897, "step": 312410 }, { "epoch": 0.54, "learning_rate": 2.2758852806077073e-05, "loss": 2.4009, "step": 312420 }, { "epoch": 0.54, "learning_rate": 2.2757980866150247e-05, "loss": 2.4331, "step": 312430 }, { "epoch": 0.54, "learning_rate": 2.275710892622342e-05, "loss": 2.413, "step": 312440 }, { "epoch": 0.54, "learning_rate": 2.275623698629659e-05, "loss": 2.337, "step": 312450 }, { "epoch": 0.54, "learning_rate": 2.275536504636977e-05, "loss": 2.3292, "step": 312460 }, { "epoch": 0.54, "learning_rate": 2.275449310644294e-05, "loss": 2.3816, "step": 312470 }, { "epoch": 0.54, "learning_rate": 2.2753621166516112e-05, "loss": 2.3316, "step": 312480 }, { "epoch": 0.54, "learning_rate": 2.2752749226589286e-05, "loss": 2.2966, "step": 312490 }, { "epoch": 0.54, "learning_rate": 2.275187728666246e-05, "loss": 2.3637, "step": 312500 }, { "epoch": 0.54, "learning_rate": 2.2751005346735634e-05, "loss": 2.2694, "step": 312510 }, { "epoch": 0.54, "learning_rate": 2.2750133406808804e-05, "loss": 2.3574, "step": 312520 }, { "epoch": 0.55, "learning_rate": 2.274926146688198e-05, "loss": 2.3186, "step": 312530 }, { "epoch": 0.55, "learning_rate": 2.2748389526955152e-05, "loss": 2.478, "step": 312540 }, { "epoch": 0.55, "learning_rate": 2.2747517587028325e-05, "loss": 2.3734, "step": 312550 }, { "epoch": 0.55, "learning_rate": 2.2746645647101496e-05, "loss": 2.3221, "step": 312560 }, { "epoch": 0.55, "learning_rate": 2.2745773707174673e-05, "loss": 2.163, "step": 312570 }, { "epoch": 0.55, "learning_rate": 2.2744901767247843e-05, "loss": 2.3498, "step": 312580 }, { "epoch": 0.55, "learning_rate": 2.2744029827321017e-05, "loss": 2.2903, "step": 312590 }, { "epoch": 0.55, "learning_rate": 2.274315788739419e-05, "loss": 2.3541, "step": 312600 }, { "epoch": 0.55, "learning_rate": 2.2742285947467365e-05, "loss": 2.3343, "step": 312610 }, { "epoch": 0.55, "learning_rate": 2.274141400754054e-05, "loss": 2.3407, "step": 312620 }, { "epoch": 0.55, "learning_rate": 2.274054206761371e-05, "loss": 2.3601, "step": 312630 }, { "epoch": 0.55, "learning_rate": 2.2739670127686886e-05, "loss": 2.3501, "step": 312640 }, { "epoch": 0.55, "learning_rate": 2.2738798187760056e-05, "loss": 2.3029, "step": 312650 }, { "epoch": 0.55, "learning_rate": 2.273792624783323e-05, "loss": 2.2851, "step": 312660 }, { "epoch": 0.55, "learning_rate": 2.2737054307906404e-05, "loss": 2.3443, "step": 312670 }, { "epoch": 0.55, "learning_rate": 2.2736182367979578e-05, "loss": 2.3788, "step": 312680 }, { "epoch": 0.55, "learning_rate": 2.273531042805275e-05, "loss": 2.3382, "step": 312690 }, { "epoch": 0.55, "learning_rate": 2.2734438488125922e-05, "loss": 2.1886, "step": 312700 }, { "epoch": 0.55, "learning_rate": 2.2733566548199096e-05, "loss": 2.4349, "step": 312710 }, { "epoch": 0.55, "learning_rate": 2.273269460827227e-05, "loss": 2.2532, "step": 312720 }, { "epoch": 0.55, "learning_rate": 2.2731822668345443e-05, "loss": 2.4559, "step": 312730 }, { "epoch": 0.55, "learning_rate": 2.2730950728418614e-05, "loss": 2.2886, "step": 312740 }, { "epoch": 0.55, "learning_rate": 2.273007878849179e-05, "loss": 2.3527, "step": 312750 }, { "epoch": 0.55, "learning_rate": 2.2729206848564964e-05, "loss": 2.3507, "step": 312760 }, { "epoch": 0.55, "learning_rate": 2.2728334908638135e-05, "loss": 2.4272, "step": 312770 }, { "epoch": 0.55, "learning_rate": 2.272746296871131e-05, "loss": 2.272, "step": 312780 }, { "epoch": 0.55, "learning_rate": 2.2726591028784482e-05, "loss": 2.3665, "step": 312790 }, { "epoch": 0.55, "learning_rate": 2.2725719088857656e-05, "loss": 2.4617, "step": 312800 }, { "epoch": 0.55, "learning_rate": 2.2724847148930827e-05, "loss": 2.3528, "step": 312810 }, { "epoch": 0.55, "learning_rate": 2.2723975209004e-05, "loss": 2.341, "step": 312820 }, { "epoch": 0.55, "learning_rate": 2.2723103269077174e-05, "loss": 2.2878, "step": 312830 }, { "epoch": 0.55, "learning_rate": 2.2722231329150348e-05, "loss": 2.3126, "step": 312840 }, { "epoch": 0.55, "learning_rate": 2.272135938922352e-05, "loss": 2.3771, "step": 312850 }, { "epoch": 0.55, "learning_rate": 2.2720487449296695e-05, "loss": 2.3319, "step": 312860 }, { "epoch": 0.55, "learning_rate": 2.271961550936987e-05, "loss": 2.3409, "step": 312870 }, { "epoch": 0.55, "learning_rate": 2.271874356944304e-05, "loss": 2.406, "step": 312880 }, { "epoch": 0.55, "learning_rate": 2.2717871629516213e-05, "loss": 2.3438, "step": 312890 }, { "epoch": 0.55, "learning_rate": 2.2716999689589387e-05, "loss": 2.3431, "step": 312900 }, { "epoch": 0.55, "learning_rate": 2.271612774966256e-05, "loss": 2.2782, "step": 312910 }, { "epoch": 0.55, "learning_rate": 2.2715255809735735e-05, "loss": 2.3685, "step": 312920 }, { "epoch": 0.55, "learning_rate": 2.2714383869808905e-05, "loss": 2.2011, "step": 312930 }, { "epoch": 0.55, "learning_rate": 2.2713511929882082e-05, "loss": 2.3653, "step": 312940 }, { "epoch": 0.55, "learning_rate": 2.2712639989955253e-05, "loss": 2.3782, "step": 312950 }, { "epoch": 0.55, "learning_rate": 2.2711768050028426e-05, "loss": 2.4416, "step": 312960 }, { "epoch": 0.55, "learning_rate": 2.2710896110101597e-05, "loss": 2.2939, "step": 312970 }, { "epoch": 0.55, "learning_rate": 2.2710024170174774e-05, "loss": 2.3199, "step": 312980 }, { "epoch": 0.55, "learning_rate": 2.2709152230247944e-05, "loss": 2.3631, "step": 312990 }, { "epoch": 0.55, "learning_rate": 2.2708280290321118e-05, "loss": 2.2987, "step": 313000 }, { "epoch": 0.55, "learning_rate": 2.2707408350394295e-05, "loss": 2.2784, "step": 313010 }, { "epoch": 0.55, "learning_rate": 2.2706536410467466e-05, "loss": 2.261, "step": 313020 }, { "epoch": 0.55, "learning_rate": 2.270566447054064e-05, "loss": 2.4226, "step": 313030 }, { "epoch": 0.55, "learning_rate": 2.270479253061381e-05, "loss": 2.3244, "step": 313040 }, { "epoch": 0.55, "learning_rate": 2.2703920590686987e-05, "loss": 2.4178, "step": 313050 }, { "epoch": 0.55, "learning_rate": 2.2703048650760157e-05, "loss": 2.4645, "step": 313060 }, { "epoch": 0.55, "learning_rate": 2.270217671083333e-05, "loss": 2.2625, "step": 313070 }, { "epoch": 0.55, "learning_rate": 2.2701304770906505e-05, "loss": 2.4505, "step": 313080 }, { "epoch": 0.55, "learning_rate": 2.270043283097968e-05, "loss": 2.3709, "step": 313090 }, { "epoch": 0.55, "learning_rate": 2.2699560891052852e-05, "loss": 2.2381, "step": 313100 }, { "epoch": 0.55, "learning_rate": 2.2698688951126023e-05, "loss": 2.2715, "step": 313110 }, { "epoch": 0.55, "learning_rate": 2.2697817011199196e-05, "loss": 2.4123, "step": 313120 }, { "epoch": 0.55, "learning_rate": 2.269694507127237e-05, "loss": 2.3427, "step": 313130 }, { "epoch": 0.55, "learning_rate": 2.2696073131345544e-05, "loss": 2.3766, "step": 313140 }, { "epoch": 0.55, "learning_rate": 2.2695201191418718e-05, "loss": 2.4202, "step": 313150 }, { "epoch": 0.55, "learning_rate": 2.269432925149189e-05, "loss": 2.3421, "step": 313160 }, { "epoch": 0.55, "learning_rate": 2.2693457311565065e-05, "loss": 2.2658, "step": 313170 }, { "epoch": 0.55, "learning_rate": 2.2692585371638236e-05, "loss": 2.2803, "step": 313180 }, { "epoch": 0.55, "learning_rate": 2.269171343171141e-05, "loss": 2.3596, "step": 313190 }, { "epoch": 0.55, "learning_rate": 2.2690841491784583e-05, "loss": 2.2732, "step": 313200 }, { "epoch": 0.55, "learning_rate": 2.2689969551857757e-05, "loss": 2.4464, "step": 313210 }, { "epoch": 0.55, "learning_rate": 2.2689097611930927e-05, "loss": 2.2793, "step": 313220 }, { "epoch": 0.55, "learning_rate": 2.26882256720041e-05, "loss": 2.3806, "step": 313230 }, { "epoch": 0.55, "learning_rate": 2.268735373207728e-05, "loss": 2.3416, "step": 313240 }, { "epoch": 0.55, "learning_rate": 2.268648179215045e-05, "loss": 2.2204, "step": 313250 }, { "epoch": 0.55, "learning_rate": 2.2685609852223622e-05, "loss": 2.2895, "step": 313260 }, { "epoch": 0.55, "learning_rate": 2.2684737912296796e-05, "loss": 2.355, "step": 313270 }, { "epoch": 0.55, "learning_rate": 2.268386597236997e-05, "loss": 2.3114, "step": 313280 }, { "epoch": 0.55, "learning_rate": 2.268299403244314e-05, "loss": 2.3657, "step": 313290 }, { "epoch": 0.55, "learning_rate": 2.2682122092516314e-05, "loss": 2.3091, "step": 313300 }, { "epoch": 0.55, "learning_rate": 2.2681250152589488e-05, "loss": 2.2557, "step": 313310 }, { "epoch": 0.55, "learning_rate": 2.2680378212662662e-05, "loss": 2.2397, "step": 313320 }, { "epoch": 0.55, "learning_rate": 2.2679506272735835e-05, "loss": 2.411, "step": 313330 }, { "epoch": 0.55, "learning_rate": 2.2678634332809006e-05, "loss": 2.3132, "step": 313340 }, { "epoch": 0.55, "learning_rate": 2.2677762392882183e-05, "loss": 2.2849, "step": 313350 }, { "epoch": 0.55, "learning_rate": 2.2676890452955353e-05, "loss": 2.4112, "step": 313360 }, { "epoch": 0.55, "learning_rate": 2.2676018513028527e-05, "loss": 2.3391, "step": 313370 }, { "epoch": 0.55, "learning_rate": 2.26751465731017e-05, "loss": 2.3641, "step": 313380 }, { "epoch": 0.55, "learning_rate": 2.2674274633174875e-05, "loss": 2.249, "step": 313390 }, { "epoch": 0.55, "learning_rate": 2.267340269324805e-05, "loss": 2.3987, "step": 313400 }, { "epoch": 0.55, "learning_rate": 2.267253075332122e-05, "loss": 2.3994, "step": 313410 }, { "epoch": 0.55, "learning_rate": 2.2671658813394396e-05, "loss": 2.345, "step": 313420 }, { "epoch": 0.55, "learning_rate": 2.2670786873467566e-05, "loss": 2.3088, "step": 313430 }, { "epoch": 0.55, "learning_rate": 2.266991493354074e-05, "loss": 2.3802, "step": 313440 }, { "epoch": 0.55, "learning_rate": 2.266904299361391e-05, "loss": 2.2994, "step": 313450 }, { "epoch": 0.55, "learning_rate": 2.2668171053687088e-05, "loss": 2.3061, "step": 313460 }, { "epoch": 0.55, "learning_rate": 2.2667299113760258e-05, "loss": 2.2162, "step": 313470 }, { "epoch": 0.55, "learning_rate": 2.2666427173833432e-05, "loss": 2.2614, "step": 313480 }, { "epoch": 0.55, "learning_rate": 2.2665555233906606e-05, "loss": 2.2692, "step": 313490 }, { "epoch": 0.55, "learning_rate": 2.266468329397978e-05, "loss": 2.3938, "step": 313500 }, { "epoch": 0.55, "learning_rate": 2.2663811354052953e-05, "loss": 2.3281, "step": 313510 }, { "epoch": 0.55, "learning_rate": 2.2662939414126124e-05, "loss": 2.4015, "step": 313520 }, { "epoch": 0.55, "learning_rate": 2.26620674741993e-05, "loss": 2.3454, "step": 313530 }, { "epoch": 0.55, "learning_rate": 2.266119553427247e-05, "loss": 2.3108, "step": 313540 }, { "epoch": 0.55, "learning_rate": 2.2660323594345645e-05, "loss": 2.3644, "step": 313550 }, { "epoch": 0.55, "learning_rate": 2.265945165441882e-05, "loss": 2.3248, "step": 313560 }, { "epoch": 0.55, "learning_rate": 2.2658579714491992e-05, "loss": 2.3353, "step": 313570 }, { "epoch": 0.55, "learning_rate": 2.2657707774565166e-05, "loss": 2.37, "step": 313580 }, { "epoch": 0.55, "learning_rate": 2.2656835834638337e-05, "loss": 2.3323, "step": 313590 }, { "epoch": 0.55, "learning_rate": 2.265596389471151e-05, "loss": 2.2631, "step": 313600 }, { "epoch": 0.55, "learning_rate": 2.2655091954784684e-05, "loss": 2.3017, "step": 313610 }, { "epoch": 0.55, "learning_rate": 2.2654220014857858e-05, "loss": 2.4063, "step": 313620 }, { "epoch": 0.55, "learning_rate": 2.265334807493103e-05, "loss": 2.4248, "step": 313630 }, { "epoch": 0.55, "learning_rate": 2.2652476135004202e-05, "loss": 2.3714, "step": 313640 }, { "epoch": 0.55, "learning_rate": 2.265160419507738e-05, "loss": 2.2849, "step": 313650 }, { "epoch": 0.55, "learning_rate": 2.265073225515055e-05, "loss": 2.3087, "step": 313660 }, { "epoch": 0.55, "learning_rate": 2.2649860315223723e-05, "loss": 2.2466, "step": 313670 }, { "epoch": 0.55, "learning_rate": 2.2648988375296897e-05, "loss": 2.3443, "step": 313680 }, { "epoch": 0.55, "learning_rate": 2.264811643537007e-05, "loss": 2.3187, "step": 313690 }, { "epoch": 0.55, "learning_rate": 2.264724449544324e-05, "loss": 2.2674, "step": 313700 }, { "epoch": 0.55, "learning_rate": 2.2646372555516415e-05, "loss": 2.3645, "step": 313710 }, { "epoch": 0.55, "learning_rate": 2.264550061558959e-05, "loss": 2.4453, "step": 313720 }, { "epoch": 0.55, "learning_rate": 2.2644628675662763e-05, "loss": 2.395, "step": 313730 }, { "epoch": 0.55, "learning_rate": 2.2643756735735936e-05, "loss": 2.3383, "step": 313740 }, { "epoch": 0.55, "learning_rate": 2.2642884795809107e-05, "loss": 2.3368, "step": 313750 }, { "epoch": 0.55, "learning_rate": 2.2642012855882284e-05, "loss": 2.3749, "step": 313760 }, { "epoch": 0.55, "learning_rate": 2.2641140915955454e-05, "loss": 2.3872, "step": 313770 }, { "epoch": 0.55, "learning_rate": 2.2640268976028628e-05, "loss": 2.3082, "step": 313780 }, { "epoch": 0.55, "learning_rate": 2.2639397036101802e-05, "loss": 2.3839, "step": 313790 }, { "epoch": 0.55, "learning_rate": 2.2638525096174976e-05, "loss": 2.3106, "step": 313800 }, { "epoch": 0.55, "learning_rate": 2.263765315624815e-05, "loss": 2.3832, "step": 313810 }, { "epoch": 0.55, "learning_rate": 2.263678121632132e-05, "loss": 2.3185, "step": 313820 }, { "epoch": 0.55, "learning_rate": 2.2635909276394497e-05, "loss": 2.4072, "step": 313830 }, { "epoch": 0.55, "learning_rate": 2.2635037336467667e-05, "loss": 2.3385, "step": 313840 }, { "epoch": 0.55, "learning_rate": 2.263416539654084e-05, "loss": 2.3103, "step": 313850 }, { "epoch": 0.55, "learning_rate": 2.2633293456614015e-05, "loss": 2.3481, "step": 313860 }, { "epoch": 0.55, "learning_rate": 2.263242151668719e-05, "loss": 2.271, "step": 313870 }, { "epoch": 0.55, "learning_rate": 2.2631549576760362e-05, "loss": 2.2799, "step": 313880 }, { "epoch": 0.55, "learning_rate": 2.2630677636833533e-05, "loss": 2.3268, "step": 313890 }, { "epoch": 0.55, "learning_rate": 2.2629805696906706e-05, "loss": 2.2587, "step": 313900 }, { "epoch": 0.55, "learning_rate": 2.262893375697988e-05, "loss": 2.3239, "step": 313910 }, { "epoch": 0.55, "learning_rate": 2.2628061817053054e-05, "loss": 2.3281, "step": 313920 }, { "epoch": 0.55, "learning_rate": 2.2627189877126224e-05, "loss": 2.2842, "step": 313930 }, { "epoch": 0.55, "learning_rate": 2.26263179371994e-05, "loss": 2.3319, "step": 313940 }, { "epoch": 0.55, "learning_rate": 2.2625445997272572e-05, "loss": 2.3536, "step": 313950 }, { "epoch": 0.55, "learning_rate": 2.2624574057345746e-05, "loss": 2.3085, "step": 313960 }, { "epoch": 0.55, "learning_rate": 2.262370211741892e-05, "loss": 2.3999, "step": 313970 }, { "epoch": 0.55, "learning_rate": 2.2622830177492093e-05, "loss": 2.2754, "step": 313980 }, { "epoch": 0.55, "learning_rate": 2.2621958237565267e-05, "loss": 2.3974, "step": 313990 }, { "epoch": 0.55, "learning_rate": 2.2621086297638437e-05, "loss": 2.5112, "step": 314000 }, { "epoch": 0.55, "learning_rate": 2.262021435771161e-05, "loss": 2.3276, "step": 314010 }, { "epoch": 0.55, "learning_rate": 2.2619342417784785e-05, "loss": 2.2369, "step": 314020 }, { "epoch": 0.55, "learning_rate": 2.261847047785796e-05, "loss": 2.3815, "step": 314030 }, { "epoch": 0.55, "learning_rate": 2.2617598537931132e-05, "loss": 2.393, "step": 314040 }, { "epoch": 0.55, "learning_rate": 2.2616726598004303e-05, "loss": 2.3445, "step": 314050 }, { "epoch": 0.55, "learning_rate": 2.261585465807748e-05, "loss": 2.1963, "step": 314060 }, { "epoch": 0.55, "learning_rate": 2.261498271815065e-05, "loss": 2.3228, "step": 314070 }, { "epoch": 0.55, "learning_rate": 2.2614110778223824e-05, "loss": 2.35, "step": 314080 }, { "epoch": 0.55, "learning_rate": 2.2613238838296998e-05, "loss": 2.2615, "step": 314090 }, { "epoch": 0.55, "learning_rate": 2.2612366898370172e-05, "loss": 2.214, "step": 314100 }, { "epoch": 0.55, "learning_rate": 2.2611494958443345e-05, "loss": 2.243, "step": 314110 }, { "epoch": 0.55, "learning_rate": 2.2610623018516516e-05, "loss": 2.3548, "step": 314120 }, { "epoch": 0.55, "learning_rate": 2.2609751078589693e-05, "loss": 2.3954, "step": 314130 }, { "epoch": 0.55, "learning_rate": 2.2608879138662863e-05, "loss": 2.3713, "step": 314140 }, { "epoch": 0.55, "learning_rate": 2.2608007198736037e-05, "loss": 2.4168, "step": 314150 }, { "epoch": 0.55, "learning_rate": 2.2607135258809208e-05, "loss": 2.3869, "step": 314160 }, { "epoch": 0.55, "learning_rate": 2.2606263318882385e-05, "loss": 2.4367, "step": 314170 }, { "epoch": 0.55, "learning_rate": 2.2605391378955555e-05, "loss": 2.4441, "step": 314180 }, { "epoch": 0.55, "learning_rate": 2.260451943902873e-05, "loss": 2.3694, "step": 314190 }, { "epoch": 0.55, "learning_rate": 2.2603647499101903e-05, "loss": 2.4625, "step": 314200 }, { "epoch": 0.55, "learning_rate": 2.2602775559175076e-05, "loss": 2.3353, "step": 314210 }, { "epoch": 0.55, "learning_rate": 2.260190361924825e-05, "loss": 2.2786, "step": 314220 }, { "epoch": 0.55, "learning_rate": 2.260103167932142e-05, "loss": 2.3325, "step": 314230 }, { "epoch": 0.55, "learning_rate": 2.2600159739394598e-05, "loss": 2.2998, "step": 314240 }, { "epoch": 0.55, "learning_rate": 2.2599287799467768e-05, "loss": 2.3386, "step": 314250 }, { "epoch": 0.55, "learning_rate": 2.2598415859540942e-05, "loss": 2.5385, "step": 314260 }, { "epoch": 0.55, "learning_rate": 2.2597543919614116e-05, "loss": 2.3196, "step": 314270 }, { "epoch": 0.55, "learning_rate": 2.259667197968729e-05, "loss": 2.421, "step": 314280 }, { "epoch": 0.55, "learning_rate": 2.2595800039760463e-05, "loss": 2.3855, "step": 314290 }, { "epoch": 0.55, "learning_rate": 2.2594928099833634e-05, "loss": 2.3472, "step": 314300 }, { "epoch": 0.55, "learning_rate": 2.2594056159906807e-05, "loss": 2.4088, "step": 314310 }, { "epoch": 0.55, "learning_rate": 2.259318421997998e-05, "loss": 2.3285, "step": 314320 }, { "epoch": 0.55, "learning_rate": 2.2592312280053155e-05, "loss": 2.2972, "step": 314330 }, { "epoch": 0.55, "learning_rate": 2.2591440340126325e-05, "loss": 2.3606, "step": 314340 }, { "epoch": 0.55, "learning_rate": 2.2590568400199502e-05, "loss": 2.365, "step": 314350 }, { "epoch": 0.55, "learning_rate": 2.2589696460272676e-05, "loss": 2.4118, "step": 314360 }, { "epoch": 0.55, "learning_rate": 2.2588824520345847e-05, "loss": 2.3582, "step": 314370 }, { "epoch": 0.55, "learning_rate": 2.258795258041902e-05, "loss": 2.3403, "step": 314380 }, { "epoch": 0.55, "learning_rate": 2.2587080640492194e-05, "loss": 2.379, "step": 314390 }, { "epoch": 0.55, "learning_rate": 2.2586208700565368e-05, "loss": 2.4509, "step": 314400 }, { "epoch": 0.55, "learning_rate": 2.2585336760638538e-05, "loss": 2.416, "step": 314410 }, { "epoch": 0.55, "learning_rate": 2.2584464820711712e-05, "loss": 2.3756, "step": 314420 }, { "epoch": 0.55, "learning_rate": 2.2583592880784886e-05, "loss": 2.2454, "step": 314430 }, { "epoch": 0.55, "learning_rate": 2.258272094085806e-05, "loss": 2.3783, "step": 314440 }, { "epoch": 0.55, "learning_rate": 2.2581849000931233e-05, "loss": 2.3342, "step": 314450 }, { "epoch": 0.55, "learning_rate": 2.2580977061004407e-05, "loss": 2.2772, "step": 314460 }, { "epoch": 0.55, "learning_rate": 2.258010512107758e-05, "loss": 2.2931, "step": 314470 }, { "epoch": 0.55, "learning_rate": 2.257923318115075e-05, "loss": 2.3205, "step": 314480 }, { "epoch": 0.55, "learning_rate": 2.2578361241223925e-05, "loss": 2.2994, "step": 314490 }, { "epoch": 0.55, "learning_rate": 2.25774893012971e-05, "loss": 2.308, "step": 314500 }, { "epoch": 0.55, "learning_rate": 2.2576617361370273e-05, "loss": 2.3886, "step": 314510 }, { "epoch": 0.55, "learning_rate": 2.2575745421443446e-05, "loss": 2.4213, "step": 314520 }, { "epoch": 0.55, "learning_rate": 2.2574873481516617e-05, "loss": 2.3738, "step": 314530 }, { "epoch": 0.55, "learning_rate": 2.2574001541589794e-05, "loss": 2.2116, "step": 314540 }, { "epoch": 0.55, "learning_rate": 2.2573129601662964e-05, "loss": 2.3064, "step": 314550 }, { "epoch": 0.55, "learning_rate": 2.2572257661736138e-05, "loss": 2.2651, "step": 314560 }, { "epoch": 0.55, "learning_rate": 2.257138572180931e-05, "loss": 2.2532, "step": 314570 }, { "epoch": 0.55, "learning_rate": 2.2570513781882486e-05, "loss": 2.3519, "step": 314580 }, { "epoch": 0.55, "learning_rate": 2.256964184195566e-05, "loss": 2.3007, "step": 314590 }, { "epoch": 0.55, "learning_rate": 2.256876990202883e-05, "loss": 2.2636, "step": 314600 }, { "epoch": 0.55, "learning_rate": 2.2567897962102007e-05, "loss": 2.2958, "step": 314610 }, { "epoch": 0.55, "learning_rate": 2.2567026022175177e-05, "loss": 2.2277, "step": 314620 }, { "epoch": 0.55, "learning_rate": 2.256615408224835e-05, "loss": 2.1732, "step": 314630 }, { "epoch": 0.55, "learning_rate": 2.256528214232152e-05, "loss": 2.3052, "step": 314640 }, { "epoch": 0.55, "learning_rate": 2.25644102023947e-05, "loss": 2.3197, "step": 314650 }, { "epoch": 0.55, "learning_rate": 2.256353826246787e-05, "loss": 2.3446, "step": 314660 }, { "epoch": 0.55, "learning_rate": 2.2562666322541043e-05, "loss": 2.3254, "step": 314670 }, { "epoch": 0.55, "learning_rate": 2.2561794382614216e-05, "loss": 2.2456, "step": 314680 }, { "epoch": 0.55, "learning_rate": 2.256092244268739e-05, "loss": 2.3048, "step": 314690 }, { "epoch": 0.55, "learning_rate": 2.2560050502760564e-05, "loss": 2.3745, "step": 314700 }, { "epoch": 0.55, "learning_rate": 2.2559178562833734e-05, "loss": 2.4663, "step": 314710 }, { "epoch": 0.55, "learning_rate": 2.255830662290691e-05, "loss": 2.2627, "step": 314720 }, { "epoch": 0.55, "learning_rate": 2.2557434682980082e-05, "loss": 2.3445, "step": 314730 }, { "epoch": 0.55, "learning_rate": 2.2556562743053256e-05, "loss": 2.4614, "step": 314740 }, { "epoch": 0.55, "learning_rate": 2.255569080312643e-05, "loss": 2.2756, "step": 314750 }, { "epoch": 0.55, "learning_rate": 2.2554818863199603e-05, "loss": 2.3104, "step": 314760 }, { "epoch": 0.55, "learning_rate": 2.2553946923272777e-05, "loss": 2.2777, "step": 314770 }, { "epoch": 0.55, "learning_rate": 2.2553074983345947e-05, "loss": 2.4317, "step": 314780 }, { "epoch": 0.55, "learning_rate": 2.255220304341912e-05, "loss": 2.3829, "step": 314790 }, { "epoch": 0.55, "learning_rate": 2.2551331103492295e-05, "loss": 2.3904, "step": 314800 }, { "epoch": 0.55, "learning_rate": 2.255045916356547e-05, "loss": 2.3142, "step": 314810 }, { "epoch": 0.55, "learning_rate": 2.254958722363864e-05, "loss": 2.4042, "step": 314820 }, { "epoch": 0.55, "learning_rate": 2.2548715283711813e-05, "loss": 2.4525, "step": 314830 }, { "epoch": 0.55, "learning_rate": 2.254784334378499e-05, "loss": 2.4338, "step": 314840 }, { "epoch": 0.55, "learning_rate": 2.254697140385816e-05, "loss": 2.2556, "step": 314850 }, { "epoch": 0.55, "learning_rate": 2.2546099463931334e-05, "loss": 2.2683, "step": 314860 }, { "epoch": 0.55, "learning_rate": 2.2545227524004508e-05, "loss": 2.3915, "step": 314870 }, { "epoch": 0.55, "learning_rate": 2.2544355584077682e-05, "loss": 2.297, "step": 314880 }, { "epoch": 0.55, "learning_rate": 2.2543483644150852e-05, "loss": 2.3105, "step": 314890 }, { "epoch": 0.55, "learning_rate": 2.2542611704224026e-05, "loss": 2.3908, "step": 314900 }, { "epoch": 0.55, "learning_rate": 2.25417397642972e-05, "loss": 2.2315, "step": 314910 }, { "epoch": 0.55, "learning_rate": 2.2540867824370373e-05, "loss": 2.3294, "step": 314920 }, { "epoch": 0.55, "learning_rate": 2.2539995884443547e-05, "loss": 2.3482, "step": 314930 }, { "epoch": 0.55, "learning_rate": 2.2539123944516718e-05, "loss": 2.2837, "step": 314940 }, { "epoch": 0.55, "learning_rate": 2.2538252004589895e-05, "loss": 2.3622, "step": 314950 }, { "epoch": 0.55, "learning_rate": 2.2537380064663065e-05, "loss": 2.275, "step": 314960 }, { "epoch": 0.55, "learning_rate": 2.253650812473624e-05, "loss": 2.3741, "step": 314970 }, { "epoch": 0.55, "learning_rate": 2.2535636184809413e-05, "loss": 2.3674, "step": 314980 }, { "epoch": 0.55, "learning_rate": 2.2534764244882586e-05, "loss": 2.2629, "step": 314990 }, { "epoch": 0.55, "learning_rate": 2.253389230495576e-05, "loss": 2.3975, "step": 315000 }, { "epoch": 0.55, "learning_rate": 2.253302036502893e-05, "loss": 2.2698, "step": 315010 }, { "epoch": 0.55, "learning_rate": 2.2532148425102108e-05, "loss": 2.3825, "step": 315020 }, { "epoch": 0.55, "learning_rate": 2.2531276485175278e-05, "loss": 2.3417, "step": 315030 }, { "epoch": 0.55, "learning_rate": 2.2530404545248452e-05, "loss": 2.3138, "step": 315040 }, { "epoch": 0.55, "learning_rate": 2.2529532605321622e-05, "loss": 2.3617, "step": 315050 }, { "epoch": 0.55, "learning_rate": 2.25286606653948e-05, "loss": 2.3398, "step": 315060 }, { "epoch": 0.55, "learning_rate": 2.252778872546797e-05, "loss": 2.4565, "step": 315070 }, { "epoch": 0.55, "learning_rate": 2.2526916785541144e-05, "loss": 2.3286, "step": 315080 }, { "epoch": 0.55, "learning_rate": 2.2526044845614317e-05, "loss": 2.3242, "step": 315090 }, { "epoch": 0.55, "learning_rate": 2.252517290568749e-05, "loss": 2.4442, "step": 315100 }, { "epoch": 0.55, "learning_rate": 2.2524300965760665e-05, "loss": 2.2114, "step": 315110 }, { "epoch": 0.55, "learning_rate": 2.2523429025833835e-05, "loss": 2.3648, "step": 315120 }, { "epoch": 0.55, "learning_rate": 2.2522557085907012e-05, "loss": 2.3342, "step": 315130 }, { "epoch": 0.55, "learning_rate": 2.2521685145980183e-05, "loss": 2.3016, "step": 315140 }, { "epoch": 0.55, "learning_rate": 2.2520813206053357e-05, "loss": 2.2343, "step": 315150 }, { "epoch": 0.55, "learning_rate": 2.251994126612653e-05, "loss": 2.2731, "step": 315160 }, { "epoch": 0.55, "learning_rate": 2.2519069326199704e-05, "loss": 2.4034, "step": 315170 }, { "epoch": 0.55, "learning_rate": 2.2518197386272878e-05, "loss": 2.3739, "step": 315180 }, { "epoch": 0.55, "learning_rate": 2.2517325446346048e-05, "loss": 2.4199, "step": 315190 }, { "epoch": 0.55, "learning_rate": 2.2516453506419222e-05, "loss": 2.3775, "step": 315200 }, { "epoch": 0.55, "learning_rate": 2.2515581566492396e-05, "loss": 2.3192, "step": 315210 }, { "epoch": 0.55, "learning_rate": 2.251470962656557e-05, "loss": 2.3017, "step": 315220 }, { "epoch": 0.55, "learning_rate": 2.2513837686638743e-05, "loss": 2.236, "step": 315230 }, { "epoch": 0.55, "learning_rate": 2.2512965746711914e-05, "loss": 2.4782, "step": 315240 }, { "epoch": 0.55, "learning_rate": 2.251209380678509e-05, "loss": 2.3625, "step": 315250 }, { "epoch": 0.55, "learning_rate": 2.251122186685826e-05, "loss": 2.4281, "step": 315260 }, { "epoch": 0.55, "learning_rate": 2.2510349926931435e-05, "loss": 2.316, "step": 315270 }, { "epoch": 0.55, "learning_rate": 2.250947798700461e-05, "loss": 2.3206, "step": 315280 }, { "epoch": 0.55, "learning_rate": 2.2508606047077783e-05, "loss": 2.387, "step": 315290 }, { "epoch": 0.55, "learning_rate": 2.2507734107150953e-05, "loss": 2.4897, "step": 315300 }, { "epoch": 0.55, "learning_rate": 2.2506862167224127e-05, "loss": 2.3392, "step": 315310 }, { "epoch": 0.55, "learning_rate": 2.2505990227297304e-05, "loss": 2.3188, "step": 315320 }, { "epoch": 0.55, "learning_rate": 2.2505118287370474e-05, "loss": 2.4036, "step": 315330 }, { "epoch": 0.55, "learning_rate": 2.2504246347443648e-05, "loss": 2.4711, "step": 315340 }, { "epoch": 0.55, "learning_rate": 2.250337440751682e-05, "loss": 2.2878, "step": 315350 }, { "epoch": 0.55, "learning_rate": 2.2502502467589996e-05, "loss": 2.2966, "step": 315360 }, { "epoch": 0.55, "learning_rate": 2.2501630527663166e-05, "loss": 2.4066, "step": 315370 }, { "epoch": 0.55, "learning_rate": 2.250075858773634e-05, "loss": 2.3954, "step": 315380 }, { "epoch": 0.55, "learning_rate": 2.2499886647809513e-05, "loss": 2.2828, "step": 315390 }, { "epoch": 0.55, "learning_rate": 2.2499014707882687e-05, "loss": 2.4273, "step": 315400 }, { "epoch": 0.55, "learning_rate": 2.249814276795586e-05, "loss": 2.2866, "step": 315410 }, { "epoch": 0.55, "learning_rate": 2.249727082802903e-05, "loss": 2.3235, "step": 315420 }, { "epoch": 0.55, "learning_rate": 2.249639888810221e-05, "loss": 2.3165, "step": 315430 }, { "epoch": 0.55, "learning_rate": 2.249552694817538e-05, "loss": 2.2472, "step": 315440 }, { "epoch": 0.55, "learning_rate": 2.2494655008248553e-05, "loss": 2.3904, "step": 315450 }, { "epoch": 0.55, "learning_rate": 2.2493783068321727e-05, "loss": 2.3681, "step": 315460 }, { "epoch": 0.55, "learning_rate": 2.24929111283949e-05, "loss": 2.3595, "step": 315470 }, { "epoch": 0.55, "learning_rate": 2.2492039188468074e-05, "loss": 2.5414, "step": 315480 }, { "epoch": 0.55, "learning_rate": 2.2491167248541244e-05, "loss": 2.3578, "step": 315490 }, { "epoch": 0.55, "learning_rate": 2.2490295308614418e-05, "loss": 2.2454, "step": 315500 }, { "epoch": 0.55, "learning_rate": 2.2489423368687592e-05, "loss": 2.4158, "step": 315510 }, { "epoch": 0.55, "learning_rate": 2.2488551428760766e-05, "loss": 2.3346, "step": 315520 }, { "epoch": 0.55, "learning_rate": 2.2487679488833936e-05, "loss": 2.2748, "step": 315530 }, { "epoch": 0.55, "learning_rate": 2.2486807548907113e-05, "loss": 2.3915, "step": 315540 }, { "epoch": 0.55, "learning_rate": 2.2485935608980284e-05, "loss": 2.3661, "step": 315550 }, { "epoch": 0.55, "learning_rate": 2.2485063669053457e-05, "loss": 2.3755, "step": 315560 }, { "epoch": 0.55, "learning_rate": 2.248419172912663e-05, "loss": 2.4164, "step": 315570 }, { "epoch": 0.55, "learning_rate": 2.2483319789199805e-05, "loss": 2.3458, "step": 315580 }, { "epoch": 0.55, "learning_rate": 2.248244784927298e-05, "loss": 2.3671, "step": 315590 }, { "epoch": 0.55, "learning_rate": 2.248157590934615e-05, "loss": 2.2906, "step": 315600 }, { "epoch": 0.55, "learning_rate": 2.2480703969419323e-05, "loss": 2.4242, "step": 315610 }, { "epoch": 0.55, "learning_rate": 2.2479832029492497e-05, "loss": 2.2925, "step": 315620 }, { "epoch": 0.55, "learning_rate": 2.247896008956567e-05, "loss": 2.3351, "step": 315630 }, { "epoch": 0.55, "learning_rate": 2.2478088149638844e-05, "loss": 2.3541, "step": 315640 }, { "epoch": 0.55, "learning_rate": 2.2477216209712018e-05, "loss": 2.3871, "step": 315650 }, { "epoch": 0.55, "learning_rate": 2.2476344269785192e-05, "loss": 2.3101, "step": 315660 }, { "epoch": 0.55, "learning_rate": 2.2475472329858362e-05, "loss": 2.3238, "step": 315670 }, { "epoch": 0.55, "learning_rate": 2.2474600389931536e-05, "loss": 2.4171, "step": 315680 }, { "epoch": 0.55, "learning_rate": 2.247372845000471e-05, "loss": 2.4277, "step": 315690 }, { "epoch": 0.55, "learning_rate": 2.2472856510077883e-05, "loss": 2.335, "step": 315700 }, { "epoch": 0.55, "learning_rate": 2.2471984570151057e-05, "loss": 2.4658, "step": 315710 }, { "epoch": 0.55, "learning_rate": 2.2471112630224228e-05, "loss": 2.2941, "step": 315720 }, { "epoch": 0.55, "learning_rate": 2.2470240690297405e-05, "loss": 2.1949, "step": 315730 }, { "epoch": 0.55, "learning_rate": 2.2469368750370575e-05, "loss": 2.3746, "step": 315740 }, { "epoch": 0.55, "learning_rate": 2.246849681044375e-05, "loss": 2.334, "step": 315750 }, { "epoch": 0.55, "learning_rate": 2.246762487051692e-05, "loss": 2.3317, "step": 315760 }, { "epoch": 0.55, "learning_rate": 2.2466752930590096e-05, "loss": 2.3229, "step": 315770 }, { "epoch": 0.55, "learning_rate": 2.2465880990663267e-05, "loss": 2.3577, "step": 315780 }, { "epoch": 0.55, "learning_rate": 2.246500905073644e-05, "loss": 2.2118, "step": 315790 }, { "epoch": 0.55, "learning_rate": 2.2464137110809614e-05, "loss": 2.3778, "step": 315800 }, { "epoch": 0.55, "learning_rate": 2.2463265170882788e-05, "loss": 2.3583, "step": 315810 }, { "epoch": 0.55, "learning_rate": 2.2462393230955962e-05, "loss": 2.4006, "step": 315820 }, { "epoch": 0.55, "learning_rate": 2.2461521291029132e-05, "loss": 2.229, "step": 315830 }, { "epoch": 0.55, "learning_rate": 2.246064935110231e-05, "loss": 2.3129, "step": 315840 }, { "epoch": 0.55, "learning_rate": 2.245977741117548e-05, "loss": 2.3162, "step": 315850 }, { "epoch": 0.55, "learning_rate": 2.2458905471248654e-05, "loss": 2.4268, "step": 315860 }, { "epoch": 0.55, "learning_rate": 2.2458033531321827e-05, "loss": 2.4057, "step": 315870 }, { "epoch": 0.55, "learning_rate": 2.2457161591395e-05, "loss": 2.4097, "step": 315880 }, { "epoch": 0.55, "learning_rate": 2.2456289651468175e-05, "loss": 2.2551, "step": 315890 }, { "epoch": 0.55, "learning_rate": 2.2455417711541345e-05, "loss": 2.2189, "step": 315900 }, { "epoch": 0.55, "learning_rate": 2.245454577161452e-05, "loss": 2.3259, "step": 315910 }, { "epoch": 0.55, "learning_rate": 2.2453673831687693e-05, "loss": 2.3713, "step": 315920 }, { "epoch": 0.55, "learning_rate": 2.2452801891760867e-05, "loss": 2.3185, "step": 315930 }, { "epoch": 0.55, "learning_rate": 2.245192995183404e-05, "loss": 2.3719, "step": 315940 }, { "epoch": 0.55, "learning_rate": 2.2451058011907214e-05, "loss": 2.3073, "step": 315950 }, { "epoch": 0.55, "learning_rate": 2.2450186071980388e-05, "loss": 2.3973, "step": 315960 }, { "epoch": 0.55, "learning_rate": 2.2449314132053558e-05, "loss": 2.351, "step": 315970 }, { "epoch": 0.55, "learning_rate": 2.2448442192126732e-05, "loss": 2.2967, "step": 315980 }, { "epoch": 0.55, "learning_rate": 2.2447570252199906e-05, "loss": 2.4183, "step": 315990 }, { "epoch": 0.55, "learning_rate": 2.244669831227308e-05, "loss": 2.3556, "step": 316000 }, { "epoch": 0.55, "learning_rate": 2.244582637234625e-05, "loss": 2.4114, "step": 316010 }, { "epoch": 0.55, "learning_rate": 2.2444954432419424e-05, "loss": 2.3707, "step": 316020 }, { "epoch": 0.55, "learning_rate": 2.2444082492492598e-05, "loss": 2.4114, "step": 316030 }, { "epoch": 0.55, "learning_rate": 2.244321055256577e-05, "loss": 2.3351, "step": 316040 }, { "epoch": 0.55, "learning_rate": 2.2442338612638945e-05, "loss": 2.3768, "step": 316050 }, { "epoch": 0.55, "learning_rate": 2.244146667271212e-05, "loss": 2.3214, "step": 316060 }, { "epoch": 0.55, "learning_rate": 2.2440594732785293e-05, "loss": 2.3731, "step": 316070 }, { "epoch": 0.55, "learning_rate": 2.2439722792858463e-05, "loss": 2.3255, "step": 316080 }, { "epoch": 0.55, "learning_rate": 2.2438850852931637e-05, "loss": 2.1945, "step": 316090 }, { "epoch": 0.55, "learning_rate": 2.243797891300481e-05, "loss": 2.3499, "step": 316100 }, { "epoch": 0.55, "learning_rate": 2.2437106973077984e-05, "loss": 2.4306, "step": 316110 }, { "epoch": 0.55, "learning_rate": 2.2436235033151158e-05, "loss": 2.313, "step": 316120 }, { "epoch": 0.55, "learning_rate": 2.243536309322433e-05, "loss": 2.3024, "step": 316130 }, { "epoch": 0.55, "learning_rate": 2.2434491153297506e-05, "loss": 2.2512, "step": 316140 }, { "epoch": 0.55, "learning_rate": 2.2433619213370676e-05, "loss": 2.2975, "step": 316150 }, { "epoch": 0.55, "learning_rate": 2.243274727344385e-05, "loss": 2.4051, "step": 316160 }, { "epoch": 0.55, "learning_rate": 2.243187533351702e-05, "loss": 2.2873, "step": 316170 }, { "epoch": 0.55, "learning_rate": 2.2431003393590197e-05, "loss": 2.3373, "step": 316180 }, { "epoch": 0.55, "learning_rate": 2.243013145366337e-05, "loss": 2.4293, "step": 316190 }, { "epoch": 0.55, "learning_rate": 2.242925951373654e-05, "loss": 2.2309, "step": 316200 }, { "epoch": 0.55, "learning_rate": 2.242838757380972e-05, "loss": 2.3317, "step": 316210 }, { "epoch": 0.55, "learning_rate": 2.242751563388289e-05, "loss": 2.3321, "step": 316220 }, { "epoch": 0.55, "learning_rate": 2.2426643693956063e-05, "loss": 2.2578, "step": 316230 }, { "epoch": 0.55, "learning_rate": 2.2425771754029233e-05, "loss": 2.3338, "step": 316240 }, { "epoch": 0.55, "learning_rate": 2.242489981410241e-05, "loss": 2.3166, "step": 316250 }, { "epoch": 0.55, "learning_rate": 2.242402787417558e-05, "loss": 2.315, "step": 316260 }, { "epoch": 0.55, "learning_rate": 2.2423155934248754e-05, "loss": 2.3888, "step": 316270 }, { "epoch": 0.55, "learning_rate": 2.2422283994321928e-05, "loss": 2.2763, "step": 316280 }, { "epoch": 0.55, "learning_rate": 2.2421412054395102e-05, "loss": 2.2771, "step": 316290 }, { "epoch": 0.55, "learning_rate": 2.2420540114468276e-05, "loss": 2.4192, "step": 316300 }, { "epoch": 0.55, "learning_rate": 2.2419668174541446e-05, "loss": 2.2538, "step": 316310 }, { "epoch": 0.55, "learning_rate": 2.2418796234614623e-05, "loss": 2.4536, "step": 316320 }, { "epoch": 0.55, "learning_rate": 2.2417924294687794e-05, "loss": 2.4095, "step": 316330 }, { "epoch": 0.55, "learning_rate": 2.2417052354760967e-05, "loss": 2.3087, "step": 316340 }, { "epoch": 0.55, "learning_rate": 2.241618041483414e-05, "loss": 2.3699, "step": 316350 }, { "epoch": 0.55, "learning_rate": 2.2415308474907315e-05, "loss": 2.3741, "step": 316360 }, { "epoch": 0.55, "learning_rate": 2.241443653498049e-05, "loss": 2.2926, "step": 316370 }, { "epoch": 0.55, "learning_rate": 2.241356459505366e-05, "loss": 2.2625, "step": 316380 }, { "epoch": 0.55, "learning_rate": 2.2412692655126833e-05, "loss": 2.3531, "step": 316390 }, { "epoch": 0.55, "learning_rate": 2.2411820715200007e-05, "loss": 2.2487, "step": 316400 }, { "epoch": 0.55, "learning_rate": 2.241094877527318e-05, "loss": 2.3119, "step": 316410 }, { "epoch": 0.55, "learning_rate": 2.241007683534635e-05, "loss": 2.4335, "step": 316420 }, { "epoch": 0.55, "learning_rate": 2.2409204895419525e-05, "loss": 2.4732, "step": 316430 }, { "epoch": 0.55, "learning_rate": 2.2408332955492702e-05, "loss": 2.3711, "step": 316440 }, { "epoch": 0.55, "learning_rate": 2.2407461015565872e-05, "loss": 2.2668, "step": 316450 }, { "epoch": 0.55, "learning_rate": 2.2406589075639046e-05, "loss": 2.436, "step": 316460 }, { "epoch": 0.55, "learning_rate": 2.240571713571222e-05, "loss": 2.3165, "step": 316470 }, { "epoch": 0.55, "learning_rate": 2.2404845195785393e-05, "loss": 2.2792, "step": 316480 }, { "epoch": 0.55, "learning_rate": 2.2403973255858564e-05, "loss": 2.3029, "step": 316490 }, { "epoch": 0.55, "learning_rate": 2.2403101315931738e-05, "loss": 2.2729, "step": 316500 }, { "epoch": 0.55, "learning_rate": 2.240222937600491e-05, "loss": 2.5285, "step": 316510 }, { "epoch": 0.55, "learning_rate": 2.2401357436078085e-05, "loss": 2.1958, "step": 316520 }, { "epoch": 0.55, "learning_rate": 2.240048549615126e-05, "loss": 2.2366, "step": 316530 }, { "epoch": 0.55, "learning_rate": 2.239961355622443e-05, "loss": 2.3736, "step": 316540 }, { "epoch": 0.55, "learning_rate": 2.2398741616297606e-05, "loss": 2.3696, "step": 316550 }, { "epoch": 0.55, "learning_rate": 2.2397869676370777e-05, "loss": 2.392, "step": 316560 }, { "epoch": 0.55, "learning_rate": 2.239699773644395e-05, "loss": 2.3777, "step": 316570 }, { "epoch": 0.55, "learning_rate": 2.2396125796517124e-05, "loss": 2.353, "step": 316580 }, { "epoch": 0.55, "learning_rate": 2.2395253856590298e-05, "loss": 2.3273, "step": 316590 }, { "epoch": 0.55, "learning_rate": 2.2394381916663472e-05, "loss": 2.3538, "step": 316600 }, { "epoch": 0.55, "learning_rate": 2.2393509976736642e-05, "loss": 2.4374, "step": 316610 }, { "epoch": 0.55, "learning_rate": 2.239263803680982e-05, "loss": 2.3854, "step": 316620 }, { "epoch": 0.55, "learning_rate": 2.239176609688299e-05, "loss": 2.279, "step": 316630 }, { "epoch": 0.55, "learning_rate": 2.2390894156956164e-05, "loss": 2.421, "step": 316640 }, { "epoch": 0.55, "learning_rate": 2.2390022217029334e-05, "loss": 2.2885, "step": 316650 }, { "epoch": 0.55, "learning_rate": 2.238915027710251e-05, "loss": 2.2418, "step": 316660 }, { "epoch": 0.55, "learning_rate": 2.2388278337175685e-05, "loss": 2.2976, "step": 316670 }, { "epoch": 0.55, "learning_rate": 2.2387406397248855e-05, "loss": 2.248, "step": 316680 }, { "epoch": 0.55, "learning_rate": 2.238653445732203e-05, "loss": 2.3827, "step": 316690 }, { "epoch": 0.55, "learning_rate": 2.2385662517395203e-05, "loss": 2.2894, "step": 316700 }, { "epoch": 0.55, "learning_rate": 2.2384790577468377e-05, "loss": 2.3521, "step": 316710 }, { "epoch": 0.55, "learning_rate": 2.2383918637541547e-05, "loss": 2.3344, "step": 316720 }, { "epoch": 0.55, "learning_rate": 2.2383046697614724e-05, "loss": 2.3829, "step": 316730 }, { "epoch": 0.55, "learning_rate": 2.2382174757687895e-05, "loss": 2.3827, "step": 316740 }, { "epoch": 0.55, "learning_rate": 2.2381302817761068e-05, "loss": 2.2964, "step": 316750 }, { "epoch": 0.55, "learning_rate": 2.2380430877834242e-05, "loss": 2.3578, "step": 316760 }, { "epoch": 0.55, "learning_rate": 2.2379558937907416e-05, "loss": 2.3977, "step": 316770 }, { "epoch": 0.55, "learning_rate": 2.237868699798059e-05, "loss": 2.3898, "step": 316780 }, { "epoch": 0.55, "learning_rate": 2.237781505805376e-05, "loss": 2.3822, "step": 316790 }, { "epoch": 0.55, "learning_rate": 2.2376943118126934e-05, "loss": 2.4772, "step": 316800 }, { "epoch": 0.55, "learning_rate": 2.2376071178200108e-05, "loss": 2.304, "step": 316810 }, { "epoch": 0.55, "learning_rate": 2.237519923827328e-05, "loss": 2.3747, "step": 316820 }, { "epoch": 0.55, "learning_rate": 2.2374327298346455e-05, "loss": 2.2857, "step": 316830 }, { "epoch": 0.55, "learning_rate": 2.2373455358419625e-05, "loss": 2.4124, "step": 316840 }, { "epoch": 0.55, "learning_rate": 2.2372583418492803e-05, "loss": 2.3655, "step": 316850 }, { "epoch": 0.55, "learning_rate": 2.2371711478565973e-05, "loss": 2.3696, "step": 316860 }, { "epoch": 0.55, "learning_rate": 2.2370839538639147e-05, "loss": 2.3258, "step": 316870 }, { "epoch": 0.55, "learning_rate": 2.236996759871232e-05, "loss": 2.3341, "step": 316880 }, { "epoch": 0.55, "learning_rate": 2.2369095658785494e-05, "loss": 2.3565, "step": 316890 }, { "epoch": 0.55, "learning_rate": 2.2368223718858665e-05, "loss": 2.445, "step": 316900 }, { "epoch": 0.55, "learning_rate": 2.236735177893184e-05, "loss": 2.2848, "step": 316910 }, { "epoch": 0.55, "learning_rate": 2.2366479839005016e-05, "loss": 2.3512, "step": 316920 }, { "epoch": 0.55, "learning_rate": 2.2365607899078186e-05, "loss": 2.3245, "step": 316930 }, { "epoch": 0.55, "learning_rate": 2.236473595915136e-05, "loss": 2.3897, "step": 316940 }, { "epoch": 0.55, "learning_rate": 2.236386401922453e-05, "loss": 2.315, "step": 316950 }, { "epoch": 0.55, "learning_rate": 2.2362992079297707e-05, "loss": 2.3069, "step": 316960 }, { "epoch": 0.55, "learning_rate": 2.2362120139370878e-05, "loss": 2.3227, "step": 316970 }, { "epoch": 0.55, "learning_rate": 2.236124819944405e-05, "loss": 2.2381, "step": 316980 }, { "epoch": 0.55, "learning_rate": 2.2360376259517225e-05, "loss": 2.4051, "step": 316990 }, { "epoch": 0.55, "learning_rate": 2.23595043195904e-05, "loss": 2.318, "step": 317000 }, { "epoch": 0.55, "learning_rate": 2.2358632379663573e-05, "loss": 2.4065, "step": 317010 }, { "epoch": 0.55, "learning_rate": 2.2357760439736743e-05, "loss": 2.226, "step": 317020 }, { "epoch": 0.55, "learning_rate": 2.235688849980992e-05, "loss": 2.4522, "step": 317030 }, { "epoch": 0.55, "learning_rate": 2.235601655988309e-05, "loss": 2.222, "step": 317040 }, { "epoch": 0.55, "learning_rate": 2.2355144619956264e-05, "loss": 2.3055, "step": 317050 }, { "epoch": 0.55, "learning_rate": 2.2354272680029438e-05, "loss": 2.3006, "step": 317060 }, { "epoch": 0.55, "learning_rate": 2.2353400740102612e-05, "loss": 2.4156, "step": 317070 }, { "epoch": 0.55, "learning_rate": 2.2352528800175786e-05, "loss": 2.4632, "step": 317080 }, { "epoch": 0.55, "learning_rate": 2.2351656860248956e-05, "loss": 2.3122, "step": 317090 }, { "epoch": 0.55, "learning_rate": 2.235078492032213e-05, "loss": 2.3262, "step": 317100 }, { "epoch": 0.55, "learning_rate": 2.2349912980395304e-05, "loss": 2.243, "step": 317110 }, { "epoch": 0.55, "learning_rate": 2.2349041040468477e-05, "loss": 2.4362, "step": 317120 }, { "epoch": 0.55, "learning_rate": 2.2348169100541648e-05, "loss": 2.4393, "step": 317130 }, { "epoch": 0.55, "learning_rate": 2.2347297160614825e-05, "loss": 2.3543, "step": 317140 }, { "epoch": 0.55, "learning_rate": 2.2346425220687995e-05, "loss": 2.4195, "step": 317150 }, { "epoch": 0.55, "learning_rate": 2.234555328076117e-05, "loss": 2.4779, "step": 317160 }, { "epoch": 0.55, "learning_rate": 2.2344681340834343e-05, "loss": 2.4014, "step": 317170 }, { "epoch": 0.55, "learning_rate": 2.2343809400907517e-05, "loss": 2.2794, "step": 317180 }, { "epoch": 0.55, "learning_rate": 2.234293746098069e-05, "loss": 2.3022, "step": 317190 }, { "epoch": 0.55, "learning_rate": 2.234206552105386e-05, "loss": 2.4602, "step": 317200 }, { "epoch": 0.55, "learning_rate": 2.2341193581127035e-05, "loss": 2.3237, "step": 317210 }, { "epoch": 0.55, "learning_rate": 2.234032164120021e-05, "loss": 2.3632, "step": 317220 }, { "epoch": 0.55, "learning_rate": 2.2339449701273382e-05, "loss": 2.2982, "step": 317230 }, { "epoch": 0.55, "learning_rate": 2.2338577761346556e-05, "loss": 2.4608, "step": 317240 }, { "epoch": 0.55, "learning_rate": 2.233770582141973e-05, "loss": 2.3005, "step": 317250 }, { "epoch": 0.55, "learning_rate": 2.2336833881492903e-05, "loss": 2.4035, "step": 317260 }, { "epoch": 0.55, "learning_rate": 2.2335961941566074e-05, "loss": 2.4147, "step": 317270 }, { "epoch": 0.55, "learning_rate": 2.2335090001639248e-05, "loss": 2.3008, "step": 317280 }, { "epoch": 0.55, "learning_rate": 2.233421806171242e-05, "loss": 2.3135, "step": 317290 }, { "epoch": 0.55, "learning_rate": 2.2333346121785595e-05, "loss": 2.3453, "step": 317300 }, { "epoch": 0.55, "learning_rate": 2.233247418185877e-05, "loss": 2.2678, "step": 317310 }, { "epoch": 0.55, "learning_rate": 2.233160224193194e-05, "loss": 2.342, "step": 317320 }, { "epoch": 0.55, "learning_rate": 2.2330730302005116e-05, "loss": 2.3047, "step": 317330 }, { "epoch": 0.55, "learning_rate": 2.2329858362078287e-05, "loss": 2.3495, "step": 317340 }, { "epoch": 0.55, "learning_rate": 2.232898642215146e-05, "loss": 2.3897, "step": 317350 }, { "epoch": 0.55, "learning_rate": 2.232811448222463e-05, "loss": 2.4212, "step": 317360 }, { "epoch": 0.55, "learning_rate": 2.2327242542297808e-05, "loss": 2.339, "step": 317370 }, { "epoch": 0.55, "learning_rate": 2.232637060237098e-05, "loss": 2.4031, "step": 317380 }, { "epoch": 0.55, "learning_rate": 2.2325498662444152e-05, "loss": 2.275, "step": 317390 }, { "epoch": 0.55, "learning_rate": 2.232462672251733e-05, "loss": 2.3781, "step": 317400 }, { "epoch": 0.55, "learning_rate": 2.23237547825905e-05, "loss": 2.4906, "step": 317410 }, { "epoch": 0.55, "learning_rate": 2.2322882842663674e-05, "loss": 2.3438, "step": 317420 }, { "epoch": 0.55, "learning_rate": 2.2322010902736844e-05, "loss": 2.4436, "step": 317430 }, { "epoch": 0.55, "learning_rate": 2.232113896281002e-05, "loss": 2.3118, "step": 317440 }, { "epoch": 0.55, "learning_rate": 2.232026702288319e-05, "loss": 2.332, "step": 317450 }, { "epoch": 0.55, "learning_rate": 2.2319395082956365e-05, "loss": 2.3431, "step": 317460 }, { "epoch": 0.55, "learning_rate": 2.231852314302954e-05, "loss": 2.25, "step": 317470 }, { "epoch": 0.55, "learning_rate": 2.2317651203102713e-05, "loss": 2.3209, "step": 317480 }, { "epoch": 0.55, "learning_rate": 2.2316779263175887e-05, "loss": 2.4146, "step": 317490 }, { "epoch": 0.55, "learning_rate": 2.2315907323249057e-05, "loss": 2.4348, "step": 317500 }, { "epoch": 0.55, "learning_rate": 2.231503538332223e-05, "loss": 2.3966, "step": 317510 }, { "epoch": 0.55, "learning_rate": 2.2314163443395405e-05, "loss": 2.383, "step": 317520 }, { "epoch": 0.55, "learning_rate": 2.2313291503468578e-05, "loss": 2.3926, "step": 317530 }, { "epoch": 0.55, "learning_rate": 2.2312419563541752e-05, "loss": 2.4092, "step": 317540 }, { "epoch": 0.55, "learning_rate": 2.2311547623614926e-05, "loss": 2.3134, "step": 317550 }, { "epoch": 0.55, "learning_rate": 2.23106756836881e-05, "loss": 2.3145, "step": 317560 }, { "epoch": 0.55, "learning_rate": 2.230980374376127e-05, "loss": 2.2945, "step": 317570 }, { "epoch": 0.55, "learning_rate": 2.2308931803834444e-05, "loss": 2.2865, "step": 317580 }, { "epoch": 0.55, "learning_rate": 2.2308059863907618e-05, "loss": 2.4237, "step": 317590 }, { "epoch": 0.55, "learning_rate": 2.230718792398079e-05, "loss": 2.367, "step": 317600 }, { "epoch": 0.55, "learning_rate": 2.230631598405396e-05, "loss": 2.3435, "step": 317610 }, { "epoch": 0.55, "learning_rate": 2.2305444044127135e-05, "loss": 2.3461, "step": 317620 }, { "epoch": 0.55, "learning_rate": 2.230457210420031e-05, "loss": 2.3391, "step": 317630 }, { "epoch": 0.55, "learning_rate": 2.2303700164273483e-05, "loss": 2.2758, "step": 317640 }, { "epoch": 0.55, "learning_rate": 2.2302828224346657e-05, "loss": 2.2627, "step": 317650 }, { "epoch": 0.55, "learning_rate": 2.230195628441983e-05, "loss": 2.3366, "step": 317660 }, { "epoch": 0.55, "learning_rate": 2.2301084344493004e-05, "loss": 2.3684, "step": 317670 }, { "epoch": 0.55, "learning_rate": 2.2300212404566175e-05, "loss": 2.3594, "step": 317680 }, { "epoch": 0.55, "learning_rate": 2.229934046463935e-05, "loss": 2.3101, "step": 317690 }, { "epoch": 0.55, "learning_rate": 2.2298468524712522e-05, "loss": 2.264, "step": 317700 }, { "epoch": 0.55, "learning_rate": 2.2297596584785696e-05, "loss": 2.4543, "step": 317710 }, { "epoch": 0.55, "learning_rate": 2.229672464485887e-05, "loss": 2.3688, "step": 317720 }, { "epoch": 0.55, "learning_rate": 2.229585270493204e-05, "loss": 2.3772, "step": 317730 }, { "epoch": 0.55, "learning_rate": 2.2294980765005217e-05, "loss": 2.3572, "step": 317740 }, { "epoch": 0.55, "learning_rate": 2.2294108825078388e-05, "loss": 2.3625, "step": 317750 }, { "epoch": 0.55, "learning_rate": 2.229323688515156e-05, "loss": 2.3541, "step": 317760 }, { "epoch": 0.55, "learning_rate": 2.2292364945224732e-05, "loss": 2.4044, "step": 317770 }, { "epoch": 0.55, "learning_rate": 2.229149300529791e-05, "loss": 2.3638, "step": 317780 }, { "epoch": 0.55, "learning_rate": 2.2290621065371083e-05, "loss": 2.2829, "step": 317790 }, { "epoch": 0.55, "learning_rate": 2.2289749125444253e-05, "loss": 2.3276, "step": 317800 }, { "epoch": 0.55, "learning_rate": 2.228887718551743e-05, "loss": 2.47, "step": 317810 }, { "epoch": 0.55, "learning_rate": 2.22880052455906e-05, "loss": 2.3498, "step": 317820 }, { "epoch": 0.55, "learning_rate": 2.2287133305663774e-05, "loss": 2.4007, "step": 317830 }, { "epoch": 0.55, "learning_rate": 2.2286261365736945e-05, "loss": 2.4448, "step": 317840 }, { "epoch": 0.55, "learning_rate": 2.2285389425810122e-05, "loss": 2.4125, "step": 317850 }, { "epoch": 0.55, "learning_rate": 2.2284517485883292e-05, "loss": 2.2947, "step": 317860 }, { "epoch": 0.55, "learning_rate": 2.2283645545956466e-05, "loss": 2.4116, "step": 317870 }, { "epoch": 0.55, "learning_rate": 2.228277360602964e-05, "loss": 2.271, "step": 317880 }, { "epoch": 0.55, "learning_rate": 2.2281901666102814e-05, "loss": 2.5024, "step": 317890 }, { "epoch": 0.55, "learning_rate": 2.2281029726175987e-05, "loss": 2.3491, "step": 317900 }, { "epoch": 0.55, "learning_rate": 2.2280157786249158e-05, "loss": 2.2889, "step": 317910 }, { "epoch": 0.55, "learning_rate": 2.2279285846322335e-05, "loss": 2.3039, "step": 317920 }, { "epoch": 0.55, "learning_rate": 2.2278413906395505e-05, "loss": 2.3299, "step": 317930 }, { "epoch": 0.55, "learning_rate": 2.227754196646868e-05, "loss": 2.3497, "step": 317940 }, { "epoch": 0.55, "learning_rate": 2.2276670026541853e-05, "loss": 2.2414, "step": 317950 }, { "epoch": 0.55, "learning_rate": 2.2275798086615027e-05, "loss": 2.4232, "step": 317960 }, { "epoch": 0.55, "learning_rate": 2.22749261466882e-05, "loss": 2.2758, "step": 317970 }, { "epoch": 0.55, "learning_rate": 2.227405420676137e-05, "loss": 2.3025, "step": 317980 }, { "epoch": 0.55, "learning_rate": 2.2273182266834545e-05, "loss": 2.3589, "step": 317990 }, { "epoch": 0.55, "learning_rate": 2.227231032690772e-05, "loss": 2.3658, "step": 318000 }, { "epoch": 0.55, "learning_rate": 2.2271438386980892e-05, "loss": 2.2908, "step": 318010 }, { "epoch": 0.55, "learning_rate": 2.2270566447054066e-05, "loss": 2.4927, "step": 318020 }, { "epoch": 0.55, "learning_rate": 2.2269694507127236e-05, "loss": 2.2872, "step": 318030 }, { "epoch": 0.55, "learning_rate": 2.2268822567200413e-05, "loss": 2.4357, "step": 318040 }, { "epoch": 0.55, "learning_rate": 2.2267950627273584e-05, "loss": 2.3412, "step": 318050 }, { "epoch": 0.55, "learning_rate": 2.2267078687346758e-05, "loss": 2.3953, "step": 318060 }, { "epoch": 0.55, "learning_rate": 2.226620674741993e-05, "loss": 2.3645, "step": 318070 }, { "epoch": 0.55, "learning_rate": 2.2265334807493105e-05, "loss": 2.2403, "step": 318080 }, { "epoch": 0.55, "learning_rate": 2.2264462867566276e-05, "loss": 2.4452, "step": 318090 }, { "epoch": 0.55, "learning_rate": 2.226359092763945e-05, "loss": 2.3932, "step": 318100 }, { "epoch": 0.55, "learning_rate": 2.2262718987712623e-05, "loss": 2.2817, "step": 318110 }, { "epoch": 0.55, "learning_rate": 2.2261847047785797e-05, "loss": 2.3627, "step": 318120 }, { "epoch": 0.55, "learning_rate": 2.226097510785897e-05, "loss": 2.3385, "step": 318130 }, { "epoch": 0.55, "learning_rate": 2.226010316793214e-05, "loss": 2.4189, "step": 318140 }, { "epoch": 0.55, "learning_rate": 2.2259231228005318e-05, "loss": 2.3179, "step": 318150 }, { "epoch": 0.55, "learning_rate": 2.225835928807849e-05, "loss": 2.4425, "step": 318160 }, { "epoch": 0.55, "learning_rate": 2.2257487348151662e-05, "loss": 2.2816, "step": 318170 }, { "epoch": 0.55, "learning_rate": 2.2256615408224836e-05, "loss": 2.3009, "step": 318180 }, { "epoch": 0.55, "learning_rate": 2.225574346829801e-05, "loss": 2.2788, "step": 318190 }, { "epoch": 0.55, "learning_rate": 2.2254871528371184e-05, "loss": 2.3717, "step": 318200 }, { "epoch": 0.55, "learning_rate": 2.2253999588444354e-05, "loss": 2.3794, "step": 318210 }, { "epoch": 0.55, "learning_rate": 2.225312764851753e-05, "loss": 2.2488, "step": 318220 }, { "epoch": 0.55, "learning_rate": 2.22522557085907e-05, "loss": 2.4705, "step": 318230 }, { "epoch": 0.55, "learning_rate": 2.2251383768663875e-05, "loss": 2.3851, "step": 318240 }, { "epoch": 0.55, "learning_rate": 2.2250511828737046e-05, "loss": 2.361, "step": 318250 }, { "epoch": 0.56, "learning_rate": 2.2249639888810223e-05, "loss": 2.3715, "step": 318260 }, { "epoch": 0.56, "learning_rate": 2.2248767948883397e-05, "loss": 2.4219, "step": 318270 }, { "epoch": 0.56, "learning_rate": 2.2247896008956567e-05, "loss": 2.3745, "step": 318280 }, { "epoch": 0.56, "learning_rate": 2.224702406902974e-05, "loss": 2.3387, "step": 318290 }, { "epoch": 0.56, "learning_rate": 2.2246152129102915e-05, "loss": 2.3058, "step": 318300 }, { "epoch": 0.56, "learning_rate": 2.2245280189176088e-05, "loss": 2.3259, "step": 318310 }, { "epoch": 0.56, "learning_rate": 2.224440824924926e-05, "loss": 2.5157, "step": 318320 }, { "epoch": 0.56, "learning_rate": 2.2243536309322436e-05, "loss": 2.3647, "step": 318330 }, { "epoch": 0.56, "learning_rate": 2.2242664369395606e-05, "loss": 2.4175, "step": 318340 }, { "epoch": 0.56, "learning_rate": 2.224179242946878e-05, "loss": 2.4496, "step": 318350 }, { "epoch": 0.56, "learning_rate": 2.2240920489541954e-05, "loss": 2.2956, "step": 318360 }, { "epoch": 0.56, "learning_rate": 2.2240048549615128e-05, "loss": 2.0526, "step": 318370 }, { "epoch": 0.56, "learning_rate": 2.22391766096883e-05, "loss": 2.2604, "step": 318380 }, { "epoch": 0.56, "learning_rate": 2.223830466976147e-05, "loss": 2.5169, "step": 318390 }, { "epoch": 0.56, "learning_rate": 2.2237432729834645e-05, "loss": 2.4378, "step": 318400 }, { "epoch": 0.56, "learning_rate": 2.223656078990782e-05, "loss": 2.3389, "step": 318410 }, { "epoch": 0.56, "learning_rate": 2.2235688849980993e-05, "loss": 2.3136, "step": 318420 }, { "epoch": 0.56, "learning_rate": 2.2234816910054167e-05, "loss": 2.2648, "step": 318430 }, { "epoch": 0.56, "learning_rate": 2.2233944970127337e-05, "loss": 2.3973, "step": 318440 }, { "epoch": 0.56, "learning_rate": 2.2233073030200514e-05, "loss": 2.4024, "step": 318450 }, { "epoch": 0.56, "learning_rate": 2.2232201090273685e-05, "loss": 2.285, "step": 318460 }, { "epoch": 0.56, "learning_rate": 2.223132915034686e-05, "loss": 2.3217, "step": 318470 }, { "epoch": 0.56, "learning_rate": 2.2230457210420032e-05, "loss": 2.2505, "step": 318480 }, { "epoch": 0.56, "learning_rate": 2.2229585270493206e-05, "loss": 2.2464, "step": 318490 }, { "epoch": 0.56, "learning_rate": 2.2228713330566376e-05, "loss": 2.299, "step": 318500 }, { "epoch": 0.56, "learning_rate": 2.222784139063955e-05, "loss": 2.2984, "step": 318510 }, { "epoch": 0.56, "learning_rate": 2.2226969450712727e-05, "loss": 2.2907, "step": 318520 }, { "epoch": 0.56, "learning_rate": 2.2226097510785898e-05, "loss": 2.352, "step": 318530 }, { "epoch": 0.56, "learning_rate": 2.222522557085907e-05, "loss": 2.3077, "step": 318540 }, { "epoch": 0.56, "learning_rate": 2.2224353630932242e-05, "loss": 2.2108, "step": 318550 }, { "epoch": 0.56, "learning_rate": 2.222348169100542e-05, "loss": 2.4585, "step": 318560 }, { "epoch": 0.56, "learning_rate": 2.222260975107859e-05, "loss": 2.3616, "step": 318570 }, { "epoch": 0.56, "learning_rate": 2.2221737811151763e-05, "loss": 2.2455, "step": 318580 }, { "epoch": 0.56, "learning_rate": 2.2220865871224937e-05, "loss": 2.3442, "step": 318590 }, { "epoch": 0.56, "learning_rate": 2.221999393129811e-05, "loss": 2.2599, "step": 318600 }, { "epoch": 0.56, "learning_rate": 2.2219121991371284e-05, "loss": 2.2938, "step": 318610 }, { "epoch": 0.56, "learning_rate": 2.2218250051444455e-05, "loss": 2.3715, "step": 318620 }, { "epoch": 0.56, "learning_rate": 2.2217378111517632e-05, "loss": 2.3437, "step": 318630 }, { "epoch": 0.56, "learning_rate": 2.2216506171590802e-05, "loss": 2.3842, "step": 318640 }, { "epoch": 0.56, "learning_rate": 2.2215634231663976e-05, "loss": 2.379, "step": 318650 }, { "epoch": 0.56, "learning_rate": 2.221476229173715e-05, "loss": 2.2819, "step": 318660 }, { "epoch": 0.56, "learning_rate": 2.2213890351810324e-05, "loss": 2.3621, "step": 318670 }, { "epoch": 0.56, "learning_rate": 2.2213018411883497e-05, "loss": 2.315, "step": 318680 }, { "epoch": 0.56, "learning_rate": 2.2212146471956668e-05, "loss": 2.3439, "step": 318690 }, { "epoch": 0.56, "learning_rate": 2.221127453202984e-05, "loss": 2.2827, "step": 318700 }, { "epoch": 0.56, "learning_rate": 2.2210402592103015e-05, "loss": 2.2616, "step": 318710 }, { "epoch": 0.56, "learning_rate": 2.220953065217619e-05, "loss": 2.3027, "step": 318720 }, { "epoch": 0.56, "learning_rate": 2.220865871224936e-05, "loss": 2.375, "step": 318730 }, { "epoch": 0.56, "learning_rate": 2.2207786772322537e-05, "loss": 2.3976, "step": 318740 }, { "epoch": 0.56, "learning_rate": 2.220691483239571e-05, "loss": 2.4027, "step": 318750 }, { "epoch": 0.56, "learning_rate": 2.220604289246888e-05, "loss": 2.3075, "step": 318760 }, { "epoch": 0.56, "learning_rate": 2.2205170952542055e-05, "loss": 2.2555, "step": 318770 }, { "epoch": 0.56, "learning_rate": 2.220429901261523e-05, "loss": 2.3177, "step": 318780 }, { "epoch": 0.56, "learning_rate": 2.2203427072688402e-05, "loss": 2.3243, "step": 318790 }, { "epoch": 0.56, "learning_rate": 2.2202555132761573e-05, "loss": 2.38, "step": 318800 }, { "epoch": 0.56, "learning_rate": 2.2201683192834746e-05, "loss": 2.2974, "step": 318810 }, { "epoch": 0.56, "learning_rate": 2.220081125290792e-05, "loss": 2.4204, "step": 318820 }, { "epoch": 0.56, "learning_rate": 2.2199939312981094e-05, "loss": 2.392, "step": 318830 }, { "epoch": 0.56, "learning_rate": 2.2199067373054268e-05, "loss": 2.3368, "step": 318840 }, { "epoch": 0.56, "learning_rate": 2.219819543312744e-05, "loss": 2.2559, "step": 318850 }, { "epoch": 0.56, "learning_rate": 2.2197323493200615e-05, "loss": 2.3951, "step": 318860 }, { "epoch": 0.56, "learning_rate": 2.2196451553273786e-05, "loss": 2.3555, "step": 318870 }, { "epoch": 0.56, "learning_rate": 2.219557961334696e-05, "loss": 2.1453, "step": 318880 }, { "epoch": 0.56, "learning_rate": 2.2194707673420133e-05, "loss": 2.5277, "step": 318890 }, { "epoch": 0.56, "learning_rate": 2.2193835733493307e-05, "loss": 2.4172, "step": 318900 }, { "epoch": 0.56, "learning_rate": 2.219296379356648e-05, "loss": 2.3423, "step": 318910 }, { "epoch": 0.56, "learning_rate": 2.219209185363965e-05, "loss": 2.3497, "step": 318920 }, { "epoch": 0.56, "learning_rate": 2.2191219913712828e-05, "loss": 2.3678, "step": 318930 }, { "epoch": 0.56, "learning_rate": 2.2190347973786e-05, "loss": 2.4562, "step": 318940 }, { "epoch": 0.56, "learning_rate": 2.2189476033859172e-05, "loss": 2.2795, "step": 318950 }, { "epoch": 0.56, "learning_rate": 2.2188604093932343e-05, "loss": 2.2934, "step": 318960 }, { "epoch": 0.56, "learning_rate": 2.218773215400552e-05, "loss": 2.453, "step": 318970 }, { "epoch": 0.56, "learning_rate": 2.218686021407869e-05, "loss": 2.271, "step": 318980 }, { "epoch": 0.56, "learning_rate": 2.2185988274151864e-05, "loss": 2.4483, "step": 318990 }, { "epoch": 0.56, "learning_rate": 2.218511633422504e-05, "loss": 2.4944, "step": 319000 }, { "epoch": 0.56, "learning_rate": 2.218424439429821e-05, "loss": 2.444, "step": 319010 }, { "epoch": 0.56, "learning_rate": 2.2183372454371385e-05, "loss": 2.1628, "step": 319020 }, { "epoch": 0.56, "learning_rate": 2.2182500514444556e-05, "loss": 2.2621, "step": 319030 }, { "epoch": 0.56, "learning_rate": 2.2181628574517733e-05, "loss": 2.3111, "step": 319040 }, { "epoch": 0.56, "learning_rate": 2.2180756634590903e-05, "loss": 2.3862, "step": 319050 }, { "epoch": 0.56, "learning_rate": 2.2179884694664077e-05, "loss": 2.2786, "step": 319060 }, { "epoch": 0.56, "learning_rate": 2.217901275473725e-05, "loss": 2.3302, "step": 319070 }, { "epoch": 0.56, "learning_rate": 2.2178140814810425e-05, "loss": 2.3805, "step": 319080 }, { "epoch": 0.56, "learning_rate": 2.2177268874883598e-05, "loss": 2.3411, "step": 319090 }, { "epoch": 0.56, "learning_rate": 2.217639693495677e-05, "loss": 2.3764, "step": 319100 }, { "epoch": 0.56, "learning_rate": 2.2175524995029946e-05, "loss": 2.3173, "step": 319110 }, { "epoch": 0.56, "learning_rate": 2.2174653055103116e-05, "loss": 2.397, "step": 319120 }, { "epoch": 0.56, "learning_rate": 2.217378111517629e-05, "loss": 2.3568, "step": 319130 }, { "epoch": 0.56, "learning_rate": 2.2172909175249464e-05, "loss": 2.2698, "step": 319140 }, { "epoch": 0.56, "learning_rate": 2.2172037235322638e-05, "loss": 2.3397, "step": 319150 }, { "epoch": 0.56, "learning_rate": 2.217116529539581e-05, "loss": 2.3942, "step": 319160 }, { "epoch": 0.56, "learning_rate": 2.217029335546898e-05, "loss": 2.3686, "step": 319170 }, { "epoch": 0.56, "learning_rate": 2.2169421415542155e-05, "loss": 2.4237, "step": 319180 }, { "epoch": 0.56, "learning_rate": 2.216854947561533e-05, "loss": 2.2946, "step": 319190 }, { "epoch": 0.56, "learning_rate": 2.2167677535688503e-05, "loss": 2.31, "step": 319200 }, { "epoch": 0.56, "learning_rate": 2.2166805595761673e-05, "loss": 2.4126, "step": 319210 }, { "epoch": 0.56, "learning_rate": 2.2165933655834847e-05, "loss": 2.3182, "step": 319220 }, { "epoch": 0.56, "learning_rate": 2.216506171590802e-05, "loss": 2.2225, "step": 319230 }, { "epoch": 0.56, "learning_rate": 2.2164189775981195e-05, "loss": 2.2407, "step": 319240 }, { "epoch": 0.56, "learning_rate": 2.216331783605437e-05, "loss": 2.3732, "step": 319250 }, { "epoch": 0.56, "learning_rate": 2.2162445896127542e-05, "loss": 2.2974, "step": 319260 }, { "epoch": 0.56, "learning_rate": 2.2161573956200716e-05, "loss": 2.3994, "step": 319270 }, { "epoch": 0.56, "learning_rate": 2.2160702016273886e-05, "loss": 2.3777, "step": 319280 }, { "epoch": 0.56, "learning_rate": 2.215983007634706e-05, "loss": 2.3297, "step": 319290 }, { "epoch": 0.56, "learning_rate": 2.2158958136420234e-05, "loss": 2.3682, "step": 319300 }, { "epoch": 0.56, "learning_rate": 2.2158086196493408e-05, "loss": 2.3626, "step": 319310 }, { "epoch": 0.56, "learning_rate": 2.215721425656658e-05, "loss": 2.3103, "step": 319320 }, { "epoch": 0.56, "learning_rate": 2.2156342316639752e-05, "loss": 2.3536, "step": 319330 }, { "epoch": 0.56, "learning_rate": 2.215547037671293e-05, "loss": 2.4437, "step": 319340 }, { "epoch": 0.56, "learning_rate": 2.21545984367861e-05, "loss": 2.3866, "step": 319350 }, { "epoch": 0.56, "learning_rate": 2.2153726496859273e-05, "loss": 2.293, "step": 319360 }, { "epoch": 0.56, "learning_rate": 2.2152854556932447e-05, "loss": 2.4152, "step": 319370 }, { "epoch": 0.56, "learning_rate": 2.215198261700562e-05, "loss": 2.4288, "step": 319380 }, { "epoch": 0.56, "learning_rate": 2.2151110677078794e-05, "loss": 2.3295, "step": 319390 }, { "epoch": 0.56, "learning_rate": 2.2150238737151965e-05, "loss": 2.2817, "step": 319400 }, { "epoch": 0.56, "learning_rate": 2.2149366797225142e-05, "loss": 2.2554, "step": 319410 }, { "epoch": 0.56, "learning_rate": 2.2148494857298312e-05, "loss": 2.3334, "step": 319420 }, { "epoch": 0.56, "learning_rate": 2.2147622917371486e-05, "loss": 2.2772, "step": 319430 }, { "epoch": 0.56, "learning_rate": 2.2146750977444657e-05, "loss": 2.459, "step": 319440 }, { "epoch": 0.56, "learning_rate": 2.2145879037517834e-05, "loss": 2.4288, "step": 319450 }, { "epoch": 0.56, "learning_rate": 2.2145007097591004e-05, "loss": 2.3656, "step": 319460 }, { "epoch": 0.56, "learning_rate": 2.2144135157664178e-05, "loss": 2.4663, "step": 319470 }, { "epoch": 0.56, "learning_rate": 2.214326321773735e-05, "loss": 2.3576, "step": 319480 }, { "epoch": 0.56, "learning_rate": 2.2142391277810525e-05, "loss": 2.4527, "step": 319490 }, { "epoch": 0.56, "learning_rate": 2.21415193378837e-05, "loss": 2.3553, "step": 319500 }, { "epoch": 0.56, "learning_rate": 2.214064739795687e-05, "loss": 2.2272, "step": 319510 }, { "epoch": 0.56, "learning_rate": 2.2139775458030047e-05, "loss": 2.2641, "step": 319520 }, { "epoch": 0.56, "learning_rate": 2.2138903518103217e-05, "loss": 2.3054, "step": 319530 }, { "epoch": 0.56, "learning_rate": 2.213803157817639e-05, "loss": 2.2674, "step": 319540 }, { "epoch": 0.56, "learning_rate": 2.2137159638249565e-05, "loss": 2.3325, "step": 319550 }, { "epoch": 0.56, "learning_rate": 2.213628769832274e-05, "loss": 2.4179, "step": 319560 }, { "epoch": 0.56, "learning_rate": 2.2135415758395912e-05, "loss": 2.3024, "step": 319570 }, { "epoch": 0.56, "learning_rate": 2.2134543818469083e-05, "loss": 2.3414, "step": 319580 }, { "epoch": 0.56, "learning_rate": 2.2133671878542256e-05, "loss": 2.4059, "step": 319590 }, { "epoch": 0.56, "learning_rate": 2.213279993861543e-05, "loss": 2.2603, "step": 319600 }, { "epoch": 0.56, "learning_rate": 2.2131927998688604e-05, "loss": 2.3344, "step": 319610 }, { "epoch": 0.56, "learning_rate": 2.2131056058761778e-05, "loss": 2.3425, "step": 319620 }, { "epoch": 0.56, "learning_rate": 2.2130184118834948e-05, "loss": 2.2519, "step": 319630 }, { "epoch": 0.56, "learning_rate": 2.2129312178908125e-05, "loss": 2.3494, "step": 319640 }, { "epoch": 0.56, "learning_rate": 2.2128440238981296e-05, "loss": 2.3569, "step": 319650 }, { "epoch": 0.56, "learning_rate": 2.212756829905447e-05, "loss": 2.3109, "step": 319660 }, { "epoch": 0.56, "learning_rate": 2.2126696359127643e-05, "loss": 2.2998, "step": 319670 }, { "epoch": 0.56, "learning_rate": 2.2125824419200817e-05, "loss": 2.3789, "step": 319680 }, { "epoch": 0.56, "learning_rate": 2.2124952479273987e-05, "loss": 2.3062, "step": 319690 }, { "epoch": 0.56, "learning_rate": 2.212408053934716e-05, "loss": 2.35, "step": 319700 }, { "epoch": 0.56, "learning_rate": 2.2123208599420335e-05, "loss": 2.396, "step": 319710 }, { "epoch": 0.56, "learning_rate": 2.212233665949351e-05, "loss": 2.3283, "step": 319720 }, { "epoch": 0.56, "learning_rate": 2.2121464719566682e-05, "loss": 2.1968, "step": 319730 }, { "epoch": 0.56, "learning_rate": 2.2120592779639853e-05, "loss": 2.4499, "step": 319740 }, { "epoch": 0.56, "learning_rate": 2.211972083971303e-05, "loss": 2.2959, "step": 319750 }, { "epoch": 0.56, "learning_rate": 2.21188488997862e-05, "loss": 2.3699, "step": 319760 }, { "epoch": 0.56, "learning_rate": 2.2117976959859374e-05, "loss": 2.2533, "step": 319770 }, { "epoch": 0.56, "learning_rate": 2.2117105019932548e-05, "loss": 2.4147, "step": 319780 }, { "epoch": 0.56, "learning_rate": 2.211623308000572e-05, "loss": 2.2611, "step": 319790 }, { "epoch": 0.56, "learning_rate": 2.2115361140078895e-05, "loss": 2.395, "step": 319800 }, { "epoch": 0.56, "learning_rate": 2.2114489200152066e-05, "loss": 2.3674, "step": 319810 }, { "epoch": 0.56, "learning_rate": 2.2113617260225243e-05, "loss": 2.3685, "step": 319820 }, { "epoch": 0.56, "learning_rate": 2.2112745320298413e-05, "loss": 2.2834, "step": 319830 }, { "epoch": 0.56, "learning_rate": 2.2111873380371587e-05, "loss": 2.2971, "step": 319840 }, { "epoch": 0.56, "learning_rate": 2.2111001440444757e-05, "loss": 2.2923, "step": 319850 }, { "epoch": 0.56, "learning_rate": 2.2110129500517935e-05, "loss": 2.3142, "step": 319860 }, { "epoch": 0.56, "learning_rate": 2.210925756059111e-05, "loss": 2.3104, "step": 319870 }, { "epoch": 0.56, "learning_rate": 2.210838562066428e-05, "loss": 2.2476, "step": 319880 }, { "epoch": 0.56, "learning_rate": 2.2107513680737452e-05, "loss": 2.3517, "step": 319890 }, { "epoch": 0.56, "learning_rate": 2.2106641740810626e-05, "loss": 2.2838, "step": 319900 }, { "epoch": 0.56, "learning_rate": 2.21057698008838e-05, "loss": 2.3802, "step": 319910 }, { "epoch": 0.56, "learning_rate": 2.210489786095697e-05, "loss": 2.1858, "step": 319920 }, { "epoch": 0.56, "learning_rate": 2.2104025921030148e-05, "loss": 2.4369, "step": 319930 }, { "epoch": 0.56, "learning_rate": 2.2103153981103318e-05, "loss": 2.3436, "step": 319940 }, { "epoch": 0.56, "learning_rate": 2.210228204117649e-05, "loss": 2.2701, "step": 319950 }, { "epoch": 0.56, "learning_rate": 2.2101410101249665e-05, "loss": 2.3148, "step": 319960 }, { "epoch": 0.56, "learning_rate": 2.210053816132284e-05, "loss": 2.3518, "step": 319970 }, { "epoch": 0.56, "learning_rate": 2.2099666221396013e-05, "loss": 2.4018, "step": 319980 }, { "epoch": 0.56, "learning_rate": 2.2098794281469183e-05, "loss": 2.4242, "step": 319990 }, { "epoch": 0.56, "learning_rate": 2.2097922341542357e-05, "loss": 2.2703, "step": 320000 }, { "epoch": 0.56, "learning_rate": 2.209705040161553e-05, "loss": 2.4134, "step": 320010 }, { "epoch": 0.56, "learning_rate": 2.2096178461688705e-05, "loss": 2.3049, "step": 320020 }, { "epoch": 0.56, "learning_rate": 2.209530652176188e-05, "loss": 2.4368, "step": 320030 }, { "epoch": 0.56, "learning_rate": 2.2094434581835052e-05, "loss": 2.4247, "step": 320040 }, { "epoch": 0.56, "learning_rate": 2.2093562641908226e-05, "loss": 2.3378, "step": 320050 }, { "epoch": 0.56, "learning_rate": 2.2092690701981396e-05, "loss": 2.4327, "step": 320060 }, { "epoch": 0.56, "learning_rate": 2.209181876205457e-05, "loss": 2.3488, "step": 320070 }, { "epoch": 0.56, "learning_rate": 2.2090946822127744e-05, "loss": 2.3722, "step": 320080 }, { "epoch": 0.56, "learning_rate": 2.2090074882200918e-05, "loss": 2.42, "step": 320090 }, { "epoch": 0.56, "learning_rate": 2.208920294227409e-05, "loss": 2.4425, "step": 320100 }, { "epoch": 0.56, "learning_rate": 2.2088331002347262e-05, "loss": 2.3405, "step": 320110 }, { "epoch": 0.56, "learning_rate": 2.208745906242044e-05, "loss": 2.2951, "step": 320120 }, { "epoch": 0.56, "learning_rate": 2.208658712249361e-05, "loss": 2.3491, "step": 320130 }, { "epoch": 0.56, "learning_rate": 2.2085715182566783e-05, "loss": 2.3311, "step": 320140 }, { "epoch": 0.56, "learning_rate": 2.2084843242639954e-05, "loss": 2.3843, "step": 320150 }, { "epoch": 0.56, "learning_rate": 2.208397130271313e-05, "loss": 2.3171, "step": 320160 }, { "epoch": 0.56, "learning_rate": 2.20830993627863e-05, "loss": 2.4045, "step": 320170 }, { "epoch": 0.56, "learning_rate": 2.2082227422859475e-05, "loss": 2.3014, "step": 320180 }, { "epoch": 0.56, "learning_rate": 2.208135548293265e-05, "loss": 2.3695, "step": 320190 }, { "epoch": 0.56, "learning_rate": 2.2080483543005822e-05, "loss": 2.4005, "step": 320200 }, { "epoch": 0.56, "learning_rate": 2.2079611603078996e-05, "loss": 2.346, "step": 320210 }, { "epoch": 0.56, "learning_rate": 2.2078739663152167e-05, "loss": 2.2974, "step": 320220 }, { "epoch": 0.56, "learning_rate": 2.2077867723225344e-05, "loss": 2.4039, "step": 320230 }, { "epoch": 0.56, "learning_rate": 2.2076995783298514e-05, "loss": 2.2934, "step": 320240 }, { "epoch": 0.56, "learning_rate": 2.2076123843371688e-05, "loss": 2.4454, "step": 320250 }, { "epoch": 0.56, "learning_rate": 2.207525190344486e-05, "loss": 2.3525, "step": 320260 }, { "epoch": 0.56, "learning_rate": 2.2074379963518035e-05, "loss": 2.3681, "step": 320270 }, { "epoch": 0.56, "learning_rate": 2.207350802359121e-05, "loss": 2.1837, "step": 320280 }, { "epoch": 0.56, "learning_rate": 2.207263608366438e-05, "loss": 2.4031, "step": 320290 }, { "epoch": 0.56, "learning_rate": 2.2071764143737553e-05, "loss": 2.3638, "step": 320300 }, { "epoch": 0.56, "learning_rate": 2.2070892203810727e-05, "loss": 2.4025, "step": 320310 }, { "epoch": 0.56, "learning_rate": 2.20700202638839e-05, "loss": 2.339, "step": 320320 }, { "epoch": 0.56, "learning_rate": 2.206914832395707e-05, "loss": 2.2562, "step": 320330 }, { "epoch": 0.56, "learning_rate": 2.206827638403025e-05, "loss": 2.3263, "step": 320340 }, { "epoch": 0.56, "learning_rate": 2.2067404444103422e-05, "loss": 2.3932, "step": 320350 }, { "epoch": 0.56, "learning_rate": 2.2066532504176593e-05, "loss": 2.2916, "step": 320360 }, { "epoch": 0.56, "learning_rate": 2.2065660564249766e-05, "loss": 2.3762, "step": 320370 }, { "epoch": 0.56, "learning_rate": 2.206478862432294e-05, "loss": 2.4156, "step": 320380 }, { "epoch": 0.56, "learning_rate": 2.2063916684396114e-05, "loss": 2.4563, "step": 320390 }, { "epoch": 0.56, "learning_rate": 2.2063044744469284e-05, "loss": 2.4347, "step": 320400 }, { "epoch": 0.56, "learning_rate": 2.2062172804542458e-05, "loss": 2.2606, "step": 320410 }, { "epoch": 0.56, "learning_rate": 2.2061300864615632e-05, "loss": 2.4164, "step": 320420 }, { "epoch": 0.56, "learning_rate": 2.2060428924688806e-05, "loss": 2.3688, "step": 320430 }, { "epoch": 0.56, "learning_rate": 2.205955698476198e-05, "loss": 2.3822, "step": 320440 }, { "epoch": 0.56, "learning_rate": 2.2058685044835153e-05, "loss": 2.3703, "step": 320450 }, { "epoch": 0.56, "learning_rate": 2.2057813104908327e-05, "loss": 2.2898, "step": 320460 }, { "epoch": 0.56, "learning_rate": 2.2056941164981497e-05, "loss": 2.34, "step": 320470 }, { "epoch": 0.56, "learning_rate": 2.205606922505467e-05, "loss": 2.3431, "step": 320480 }, { "epoch": 0.56, "learning_rate": 2.2055197285127845e-05, "loss": 2.3906, "step": 320490 }, { "epoch": 0.56, "learning_rate": 2.205432534520102e-05, "loss": 2.3471, "step": 320500 }, { "epoch": 0.56, "learning_rate": 2.2053453405274192e-05, "loss": 2.3204, "step": 320510 }, { "epoch": 0.56, "learning_rate": 2.2052581465347363e-05, "loss": 2.2533, "step": 320520 }, { "epoch": 0.56, "learning_rate": 2.205170952542054e-05, "loss": 2.371, "step": 320530 }, { "epoch": 0.56, "learning_rate": 2.205083758549371e-05, "loss": 2.3705, "step": 320540 }, { "epoch": 0.56, "learning_rate": 2.2049965645566884e-05, "loss": 2.3491, "step": 320550 }, { "epoch": 0.56, "learning_rate": 2.2049093705640054e-05, "loss": 2.4094, "step": 320560 }, { "epoch": 0.56, "learning_rate": 2.204822176571323e-05, "loss": 2.3025, "step": 320570 }, { "epoch": 0.56, "learning_rate": 2.2047349825786405e-05, "loss": 2.3921, "step": 320580 }, { "epoch": 0.56, "learning_rate": 2.2046477885859576e-05, "loss": 2.3958, "step": 320590 }, { "epoch": 0.56, "learning_rate": 2.2045605945932753e-05, "loss": 2.388, "step": 320600 }, { "epoch": 0.56, "learning_rate": 2.2044734006005923e-05, "loss": 2.4296, "step": 320610 }, { "epoch": 0.56, "learning_rate": 2.2043862066079097e-05, "loss": 2.3531, "step": 320620 }, { "epoch": 0.56, "learning_rate": 2.2042990126152267e-05, "loss": 2.2403, "step": 320630 }, { "epoch": 0.56, "learning_rate": 2.2042118186225445e-05, "loss": 2.3062, "step": 320640 }, { "epoch": 0.56, "learning_rate": 2.2041246246298615e-05, "loss": 2.3036, "step": 320650 }, { "epoch": 0.56, "learning_rate": 2.204037430637179e-05, "loss": 2.3714, "step": 320660 }, { "epoch": 0.56, "learning_rate": 2.2039502366444962e-05, "loss": 2.3733, "step": 320670 }, { "epoch": 0.56, "learning_rate": 2.2038630426518136e-05, "loss": 2.3704, "step": 320680 }, { "epoch": 0.56, "learning_rate": 2.203775848659131e-05, "loss": 2.3046, "step": 320690 }, { "epoch": 0.56, "learning_rate": 2.203688654666448e-05, "loss": 2.3939, "step": 320700 }, { "epoch": 0.56, "learning_rate": 2.2036014606737658e-05, "loss": 2.3909, "step": 320710 }, { "epoch": 0.56, "learning_rate": 2.2035142666810828e-05, "loss": 2.2506, "step": 320720 }, { "epoch": 0.56, "learning_rate": 2.2034270726884002e-05, "loss": 2.2521, "step": 320730 }, { "epoch": 0.56, "learning_rate": 2.2033398786957175e-05, "loss": 2.2658, "step": 320740 }, { "epoch": 0.56, "learning_rate": 2.203252684703035e-05, "loss": 2.3013, "step": 320750 }, { "epoch": 0.56, "learning_rate": 2.2031654907103523e-05, "loss": 2.2841, "step": 320760 }, { "epoch": 0.56, "learning_rate": 2.2030782967176693e-05, "loss": 2.4694, "step": 320770 }, { "epoch": 0.56, "learning_rate": 2.2029911027249867e-05, "loss": 2.3424, "step": 320780 }, { "epoch": 0.56, "learning_rate": 2.202903908732304e-05, "loss": 2.3298, "step": 320790 }, { "epoch": 0.56, "learning_rate": 2.2028167147396215e-05, "loss": 2.396, "step": 320800 }, { "epoch": 0.56, "learning_rate": 2.2027295207469385e-05, "loss": 2.2581, "step": 320810 }, { "epoch": 0.56, "learning_rate": 2.202642326754256e-05, "loss": 2.4091, "step": 320820 }, { "epoch": 0.56, "learning_rate": 2.2025551327615736e-05, "loss": 2.4688, "step": 320830 }, { "epoch": 0.56, "learning_rate": 2.2024679387688906e-05, "loss": 2.3997, "step": 320840 }, { "epoch": 0.56, "learning_rate": 2.202380744776208e-05, "loss": 2.4519, "step": 320850 }, { "epoch": 0.56, "learning_rate": 2.2022935507835254e-05, "loss": 2.2835, "step": 320860 }, { "epoch": 0.56, "learning_rate": 2.2022063567908428e-05, "loss": 2.1772, "step": 320870 }, { "epoch": 0.56, "learning_rate": 2.2021191627981598e-05, "loss": 2.2179, "step": 320880 }, { "epoch": 0.56, "learning_rate": 2.2020319688054772e-05, "loss": 2.4057, "step": 320890 }, { "epoch": 0.56, "learning_rate": 2.2019447748127946e-05, "loss": 2.3236, "step": 320900 }, { "epoch": 0.56, "learning_rate": 2.201857580820112e-05, "loss": 2.4212, "step": 320910 }, { "epoch": 0.56, "learning_rate": 2.2017703868274293e-05, "loss": 2.3344, "step": 320920 }, { "epoch": 0.56, "learning_rate": 2.2016831928347464e-05, "loss": 2.3234, "step": 320930 }, { "epoch": 0.56, "learning_rate": 2.201595998842064e-05, "loss": 2.2781, "step": 320940 }, { "epoch": 0.56, "learning_rate": 2.201508804849381e-05, "loss": 2.3984, "step": 320950 }, { "epoch": 0.56, "learning_rate": 2.2014216108566985e-05, "loss": 2.3, "step": 320960 }, { "epoch": 0.56, "learning_rate": 2.201334416864016e-05, "loss": 2.3913, "step": 320970 }, { "epoch": 0.56, "learning_rate": 2.2012472228713332e-05, "loss": 2.3993, "step": 320980 }, { "epoch": 0.56, "learning_rate": 2.2011600288786506e-05, "loss": 2.3457, "step": 320990 }, { "epoch": 0.56, "learning_rate": 2.2010728348859677e-05, "loss": 2.3367, "step": 321000 }, { "epoch": 0.56, "learning_rate": 2.2009856408932854e-05, "loss": 2.4385, "step": 321010 }, { "epoch": 0.56, "learning_rate": 2.2008984469006024e-05, "loss": 2.3268, "step": 321020 }, { "epoch": 0.56, "learning_rate": 2.2008112529079198e-05, "loss": 2.3983, "step": 321030 }, { "epoch": 0.56, "learning_rate": 2.2007240589152368e-05, "loss": 2.3782, "step": 321040 }, { "epoch": 0.56, "learning_rate": 2.2006368649225545e-05, "loss": 2.4717, "step": 321050 }, { "epoch": 0.56, "learning_rate": 2.2005496709298716e-05, "loss": 2.3095, "step": 321060 }, { "epoch": 0.56, "learning_rate": 2.200462476937189e-05, "loss": 2.5284, "step": 321070 }, { "epoch": 0.56, "learning_rate": 2.2003752829445063e-05, "loss": 2.3307, "step": 321080 }, { "epoch": 0.56, "learning_rate": 2.2002880889518237e-05, "loss": 2.4189, "step": 321090 }, { "epoch": 0.56, "learning_rate": 2.200200894959141e-05, "loss": 2.3579, "step": 321100 }, { "epoch": 0.56, "learning_rate": 2.200113700966458e-05, "loss": 2.4058, "step": 321110 }, { "epoch": 0.56, "learning_rate": 2.200026506973776e-05, "loss": 2.3628, "step": 321120 }, { "epoch": 0.56, "learning_rate": 2.199939312981093e-05, "loss": 2.2277, "step": 321130 }, { "epoch": 0.56, "learning_rate": 2.1998521189884103e-05, "loss": 2.3224, "step": 321140 }, { "epoch": 0.56, "learning_rate": 2.1997649249957276e-05, "loss": 2.2955, "step": 321150 }, { "epoch": 0.56, "learning_rate": 2.199677731003045e-05, "loss": 2.3742, "step": 321160 }, { "epoch": 0.56, "learning_rate": 2.1995905370103624e-05, "loss": 2.297, "step": 321170 }, { "epoch": 0.56, "learning_rate": 2.1995033430176794e-05, "loss": 2.329, "step": 321180 }, { "epoch": 0.56, "learning_rate": 2.1994161490249968e-05, "loss": 2.4243, "step": 321190 }, { "epoch": 0.56, "learning_rate": 2.1993289550323142e-05, "loss": 2.3112, "step": 321200 }, { "epoch": 0.56, "learning_rate": 2.1992417610396316e-05, "loss": 2.3329, "step": 321210 }, { "epoch": 0.56, "learning_rate": 2.199154567046949e-05, "loss": 2.3333, "step": 321220 }, { "epoch": 0.56, "learning_rate": 2.199067373054266e-05, "loss": 2.3016, "step": 321230 }, { "epoch": 0.56, "learning_rate": 2.1989801790615837e-05, "loss": 2.3122, "step": 321240 }, { "epoch": 0.56, "learning_rate": 2.1988929850689007e-05, "loss": 2.3463, "step": 321250 }, { "epoch": 0.56, "learning_rate": 2.198805791076218e-05, "loss": 2.3238, "step": 321260 }, { "epoch": 0.56, "learning_rate": 2.1987185970835355e-05, "loss": 2.335, "step": 321270 }, { "epoch": 0.56, "learning_rate": 2.198631403090853e-05, "loss": 2.3036, "step": 321280 }, { "epoch": 0.56, "learning_rate": 2.19854420909817e-05, "loss": 2.387, "step": 321290 }, { "epoch": 0.56, "learning_rate": 2.1984570151054873e-05, "loss": 2.229, "step": 321300 }, { "epoch": 0.56, "learning_rate": 2.198369821112805e-05, "loss": 2.4781, "step": 321310 }, { "epoch": 0.56, "learning_rate": 2.198282627120122e-05, "loss": 2.3133, "step": 321320 }, { "epoch": 0.56, "learning_rate": 2.1981954331274394e-05, "loss": 2.3673, "step": 321330 }, { "epoch": 0.56, "learning_rate": 2.1981082391347564e-05, "loss": 2.3563, "step": 321340 }, { "epoch": 0.56, "learning_rate": 2.198021045142074e-05, "loss": 2.3589, "step": 321350 }, { "epoch": 0.56, "learning_rate": 2.1979338511493912e-05, "loss": 2.4577, "step": 321360 }, { "epoch": 0.56, "learning_rate": 2.1978466571567086e-05, "loss": 2.2753, "step": 321370 }, { "epoch": 0.56, "learning_rate": 2.197759463164026e-05, "loss": 2.3411, "step": 321380 }, { "epoch": 0.56, "learning_rate": 2.1976722691713433e-05, "loss": 2.416, "step": 321390 }, { "epoch": 0.56, "learning_rate": 2.1975850751786607e-05, "loss": 2.3922, "step": 321400 }, { "epoch": 0.56, "learning_rate": 2.1974978811859777e-05, "loss": 2.3704, "step": 321410 }, { "epoch": 0.56, "learning_rate": 2.1974106871932955e-05, "loss": 2.3217, "step": 321420 }, { "epoch": 0.56, "learning_rate": 2.1973234932006125e-05, "loss": 2.3295, "step": 321430 }, { "epoch": 0.56, "learning_rate": 2.19723629920793e-05, "loss": 2.3397, "step": 321440 }, { "epoch": 0.56, "learning_rate": 2.1971491052152472e-05, "loss": 2.3364, "step": 321450 }, { "epoch": 0.56, "learning_rate": 2.1970619112225646e-05, "loss": 2.4735, "step": 321460 }, { "epoch": 0.56, "learning_rate": 2.196974717229882e-05, "loss": 2.3586, "step": 321470 }, { "epoch": 0.56, "learning_rate": 2.196887523237199e-05, "loss": 2.3539, "step": 321480 }, { "epoch": 0.56, "learning_rate": 2.1968003292445164e-05, "loss": 2.3672, "step": 321490 }, { "epoch": 0.56, "learning_rate": 2.1967131352518338e-05, "loss": 2.3498, "step": 321500 }, { "epoch": 0.56, "learning_rate": 2.1966259412591512e-05, "loss": 2.4743, "step": 321510 }, { "epoch": 0.56, "learning_rate": 2.1965387472664682e-05, "loss": 2.4237, "step": 321520 }, { "epoch": 0.56, "learning_rate": 2.196451553273786e-05, "loss": 2.3326, "step": 321530 }, { "epoch": 0.56, "learning_rate": 2.196364359281103e-05, "loss": 2.3207, "step": 321540 }, { "epoch": 0.56, "learning_rate": 2.1962771652884203e-05, "loss": 2.3964, "step": 321550 }, { "epoch": 0.56, "learning_rate": 2.1961899712957377e-05, "loss": 2.3343, "step": 321560 }, { "epoch": 0.56, "learning_rate": 2.196102777303055e-05, "loss": 2.4224, "step": 321570 }, { "epoch": 0.56, "learning_rate": 2.1960155833103725e-05, "loss": 2.3177, "step": 321580 }, { "epoch": 0.56, "learning_rate": 2.1959283893176895e-05, "loss": 2.3824, "step": 321590 }, { "epoch": 0.56, "learning_rate": 2.195841195325007e-05, "loss": 2.2812, "step": 321600 }, { "epoch": 0.56, "learning_rate": 2.1957540013323243e-05, "loss": 2.3757, "step": 321610 }, { "epoch": 0.56, "learning_rate": 2.1956668073396416e-05, "loss": 2.3415, "step": 321620 }, { "epoch": 0.56, "learning_rate": 2.195579613346959e-05, "loss": 2.3328, "step": 321630 }, { "epoch": 0.56, "learning_rate": 2.1954924193542764e-05, "loss": 2.391, "step": 321640 }, { "epoch": 0.56, "learning_rate": 2.1954052253615938e-05, "loss": 2.3737, "step": 321650 }, { "epoch": 0.56, "learning_rate": 2.1953180313689108e-05, "loss": 2.3325, "step": 321660 }, { "epoch": 0.56, "learning_rate": 2.1952308373762282e-05, "loss": 2.2921, "step": 321670 }, { "epoch": 0.56, "learning_rate": 2.1951436433835456e-05, "loss": 2.4212, "step": 321680 }, { "epoch": 0.56, "learning_rate": 2.195056449390863e-05, "loss": 2.3571, "step": 321690 }, { "epoch": 0.56, "learning_rate": 2.1949692553981803e-05, "loss": 2.4673, "step": 321700 }, { "epoch": 0.56, "learning_rate": 2.1948820614054974e-05, "loss": 2.3288, "step": 321710 }, { "epoch": 0.56, "learning_rate": 2.194794867412815e-05, "loss": 2.3305, "step": 321720 }, { "epoch": 0.56, "learning_rate": 2.194707673420132e-05, "loss": 2.3305, "step": 321730 }, { "epoch": 0.56, "learning_rate": 2.1946204794274495e-05, "loss": 2.3209, "step": 321740 }, { "epoch": 0.56, "learning_rate": 2.1945332854347665e-05, "loss": 2.3571, "step": 321750 }, { "epoch": 0.56, "learning_rate": 2.1944460914420842e-05, "loss": 2.3101, "step": 321760 }, { "epoch": 0.56, "learning_rate": 2.1943588974494013e-05, "loss": 2.3539, "step": 321770 }, { "epoch": 0.56, "learning_rate": 2.1942717034567187e-05, "loss": 2.3772, "step": 321780 }, { "epoch": 0.56, "learning_rate": 2.194184509464036e-05, "loss": 2.3614, "step": 321790 }, { "epoch": 0.56, "learning_rate": 2.1940973154713534e-05, "loss": 2.3634, "step": 321800 }, { "epoch": 0.56, "learning_rate": 2.1940101214786708e-05, "loss": 2.3255, "step": 321810 }, { "epoch": 0.56, "learning_rate": 2.1939229274859878e-05, "loss": 2.4184, "step": 321820 }, { "epoch": 0.56, "learning_rate": 2.1938357334933055e-05, "loss": 2.2732, "step": 321830 }, { "epoch": 0.56, "learning_rate": 2.1937485395006226e-05, "loss": 2.3667, "step": 321840 }, { "epoch": 0.56, "learning_rate": 2.19366134550794e-05, "loss": 2.3936, "step": 321850 }, { "epoch": 0.56, "learning_rate": 2.1935741515152573e-05, "loss": 2.4113, "step": 321860 }, { "epoch": 0.56, "learning_rate": 2.1934869575225747e-05, "loss": 2.3706, "step": 321870 }, { "epoch": 0.56, "learning_rate": 2.193399763529892e-05, "loss": 2.4589, "step": 321880 }, { "epoch": 0.56, "learning_rate": 2.193312569537209e-05, "loss": 2.3172, "step": 321890 }, { "epoch": 0.56, "learning_rate": 2.193225375544527e-05, "loss": 2.4241, "step": 321900 }, { "epoch": 0.56, "learning_rate": 2.193138181551844e-05, "loss": 2.2768, "step": 321910 }, { "epoch": 0.56, "learning_rate": 2.1930509875591613e-05, "loss": 2.3429, "step": 321920 }, { "epoch": 0.56, "learning_rate": 2.1929637935664786e-05, "loss": 2.3827, "step": 321930 }, { "epoch": 0.56, "learning_rate": 2.192876599573796e-05, "loss": 2.3515, "step": 321940 }, { "epoch": 0.56, "learning_rate": 2.1927894055811134e-05, "loss": 2.3933, "step": 321950 }, { "epoch": 0.56, "learning_rate": 2.1927022115884304e-05, "loss": 2.2903, "step": 321960 }, { "epoch": 0.56, "learning_rate": 2.1926150175957478e-05, "loss": 2.3672, "step": 321970 }, { "epoch": 0.56, "learning_rate": 2.1925278236030652e-05, "loss": 2.269, "step": 321980 }, { "epoch": 0.56, "learning_rate": 2.1924406296103826e-05, "loss": 2.2986, "step": 321990 }, { "epoch": 0.56, "learning_rate": 2.1923534356176996e-05, "loss": 2.3769, "step": 322000 }, { "epoch": 0.56, "learning_rate": 2.192266241625017e-05, "loss": 2.2913, "step": 322010 }, { "epoch": 0.56, "learning_rate": 2.1921790476323343e-05, "loss": 2.2951, "step": 322020 }, { "epoch": 0.56, "learning_rate": 2.1920918536396517e-05, "loss": 2.3669, "step": 322030 }, { "epoch": 0.56, "learning_rate": 2.192004659646969e-05, "loss": 2.3538, "step": 322040 }, { "epoch": 0.56, "learning_rate": 2.1919174656542865e-05, "loss": 2.3063, "step": 322050 }, { "epoch": 0.56, "learning_rate": 2.191830271661604e-05, "loss": 2.2845, "step": 322060 }, { "epoch": 0.56, "learning_rate": 2.191743077668921e-05, "loss": 2.3595, "step": 322070 }, { "epoch": 0.56, "learning_rate": 2.1916558836762383e-05, "loss": 2.3284, "step": 322080 }, { "epoch": 0.56, "learning_rate": 2.1915686896835556e-05, "loss": 2.2519, "step": 322090 }, { "epoch": 0.56, "learning_rate": 2.191481495690873e-05, "loss": 2.322, "step": 322100 }, { "epoch": 0.56, "learning_rate": 2.1913943016981904e-05, "loss": 2.3569, "step": 322110 }, { "epoch": 0.56, "learning_rate": 2.1913071077055074e-05, "loss": 2.3706, "step": 322120 }, { "epoch": 0.56, "learning_rate": 2.191219913712825e-05, "loss": 2.3477, "step": 322130 }, { "epoch": 0.56, "learning_rate": 2.1911327197201422e-05, "loss": 2.4115, "step": 322140 }, { "epoch": 0.56, "learning_rate": 2.1910455257274596e-05, "loss": 2.2481, "step": 322150 }, { "epoch": 0.56, "learning_rate": 2.1909583317347766e-05, "loss": 2.3055, "step": 322160 }, { "epoch": 0.56, "learning_rate": 2.1908711377420943e-05, "loss": 2.287, "step": 322170 }, { "epoch": 0.56, "learning_rate": 2.1907839437494117e-05, "loss": 2.2745, "step": 322180 }, { "epoch": 0.56, "learning_rate": 2.1906967497567287e-05, "loss": 2.3452, "step": 322190 }, { "epoch": 0.56, "learning_rate": 2.1906095557640465e-05, "loss": 2.3714, "step": 322200 }, { "epoch": 0.56, "learning_rate": 2.1905223617713635e-05, "loss": 2.2452, "step": 322210 }, { "epoch": 0.56, "learning_rate": 2.190435167778681e-05, "loss": 2.3371, "step": 322220 }, { "epoch": 0.56, "learning_rate": 2.190347973785998e-05, "loss": 2.3569, "step": 322230 }, { "epoch": 0.56, "learning_rate": 2.1902607797933156e-05, "loss": 2.3744, "step": 322240 }, { "epoch": 0.56, "learning_rate": 2.1901735858006327e-05, "loss": 2.2793, "step": 322250 }, { "epoch": 0.56, "learning_rate": 2.19008639180795e-05, "loss": 2.4216, "step": 322260 }, { "epoch": 0.56, "learning_rate": 2.1899991978152674e-05, "loss": 2.4271, "step": 322270 }, { "epoch": 0.56, "learning_rate": 2.1899120038225848e-05, "loss": 2.3549, "step": 322280 }, { "epoch": 0.56, "learning_rate": 2.1898248098299022e-05, "loss": 2.356, "step": 322290 }, { "epoch": 0.56, "learning_rate": 2.1897376158372192e-05, "loss": 2.1577, "step": 322300 }, { "epoch": 0.56, "learning_rate": 2.189650421844537e-05, "loss": 2.3889, "step": 322310 }, { "epoch": 0.56, "learning_rate": 2.189563227851854e-05, "loss": 2.2827, "step": 322320 }, { "epoch": 0.56, "learning_rate": 2.1894760338591713e-05, "loss": 2.382, "step": 322330 }, { "epoch": 0.56, "learning_rate": 2.1893888398664887e-05, "loss": 2.3108, "step": 322340 }, { "epoch": 0.56, "learning_rate": 2.189301645873806e-05, "loss": 2.248, "step": 322350 }, { "epoch": 0.56, "learning_rate": 2.1892144518811235e-05, "loss": 2.3016, "step": 322360 }, { "epoch": 0.56, "learning_rate": 2.1891272578884405e-05, "loss": 2.3592, "step": 322370 }, { "epoch": 0.56, "learning_rate": 2.189040063895758e-05, "loss": 2.2996, "step": 322380 }, { "epoch": 0.56, "learning_rate": 2.1889528699030753e-05, "loss": 2.3736, "step": 322390 }, { "epoch": 0.56, "learning_rate": 2.1888656759103926e-05, "loss": 2.2197, "step": 322400 }, { "epoch": 0.56, "learning_rate": 2.1887784819177097e-05, "loss": 2.3045, "step": 322410 }, { "epoch": 0.56, "learning_rate": 2.188691287925027e-05, "loss": 2.2362, "step": 322420 }, { "epoch": 0.56, "learning_rate": 2.1886040939323448e-05, "loss": 2.3843, "step": 322430 }, { "epoch": 0.56, "learning_rate": 2.1885168999396618e-05, "loss": 2.3769, "step": 322440 }, { "epoch": 0.56, "learning_rate": 2.1884297059469792e-05, "loss": 2.379, "step": 322450 }, { "epoch": 0.56, "learning_rate": 2.1883425119542966e-05, "loss": 2.344, "step": 322460 }, { "epoch": 0.56, "learning_rate": 2.188255317961614e-05, "loss": 2.3288, "step": 322470 }, { "epoch": 0.56, "learning_rate": 2.188168123968931e-05, "loss": 2.475, "step": 322480 }, { "epoch": 0.56, "learning_rate": 2.1880809299762484e-05, "loss": 2.3883, "step": 322490 }, { "epoch": 0.56, "learning_rate": 2.1879937359835657e-05, "loss": 2.3131, "step": 322500 }, { "epoch": 0.56, "learning_rate": 2.187906541990883e-05, "loss": 2.3429, "step": 322510 }, { "epoch": 0.56, "learning_rate": 2.1878193479982005e-05, "loss": 2.4013, "step": 322520 }, { "epoch": 0.56, "learning_rate": 2.1877321540055175e-05, "loss": 2.3209, "step": 322530 }, { "epoch": 0.56, "learning_rate": 2.1876449600128352e-05, "loss": 2.474, "step": 322540 }, { "epoch": 0.56, "learning_rate": 2.1875577660201523e-05, "loss": 2.2728, "step": 322550 }, { "epoch": 0.56, "learning_rate": 2.1874705720274697e-05, "loss": 2.3764, "step": 322560 }, { "epoch": 0.56, "learning_rate": 2.187383378034787e-05, "loss": 2.3059, "step": 322570 }, { "epoch": 0.56, "learning_rate": 2.1872961840421044e-05, "loss": 2.4285, "step": 322580 }, { "epoch": 0.56, "learning_rate": 2.1872089900494218e-05, "loss": 2.3922, "step": 322590 }, { "epoch": 0.56, "learning_rate": 2.1871217960567388e-05, "loss": 2.3152, "step": 322600 }, { "epoch": 0.56, "learning_rate": 2.1870346020640565e-05, "loss": 2.2915, "step": 322610 }, { "epoch": 0.56, "learning_rate": 2.1869474080713736e-05, "loss": 2.3079, "step": 322620 }, { "epoch": 0.56, "learning_rate": 2.186860214078691e-05, "loss": 2.4096, "step": 322630 }, { "epoch": 0.56, "learning_rate": 2.186773020086008e-05, "loss": 2.3548, "step": 322640 }, { "epoch": 0.56, "learning_rate": 2.1866858260933257e-05, "loss": 2.2814, "step": 322650 }, { "epoch": 0.56, "learning_rate": 2.186598632100643e-05, "loss": 2.2786, "step": 322660 }, { "epoch": 0.56, "learning_rate": 2.18651143810796e-05, "loss": 2.3271, "step": 322670 }, { "epoch": 0.56, "learning_rate": 2.1864242441152775e-05, "loss": 2.2722, "step": 322680 }, { "epoch": 0.56, "learning_rate": 2.186337050122595e-05, "loss": 2.4052, "step": 322690 }, { "epoch": 0.56, "learning_rate": 2.1862498561299123e-05, "loss": 2.4173, "step": 322700 }, { "epoch": 0.56, "learning_rate": 2.1861626621372293e-05, "loss": 2.4556, "step": 322710 }, { "epoch": 0.56, "learning_rate": 2.186075468144547e-05, "loss": 2.3867, "step": 322720 }, { "epoch": 0.56, "learning_rate": 2.185988274151864e-05, "loss": 2.3887, "step": 322730 }, { "epoch": 0.56, "learning_rate": 2.1859010801591814e-05, "loss": 2.4299, "step": 322740 }, { "epoch": 0.56, "learning_rate": 2.1858138861664988e-05, "loss": 2.2603, "step": 322750 }, { "epoch": 0.56, "learning_rate": 2.1857266921738162e-05, "loss": 2.2981, "step": 322760 }, { "epoch": 0.56, "learning_rate": 2.1856394981811336e-05, "loss": 2.5019, "step": 322770 }, { "epoch": 0.56, "learning_rate": 2.1855523041884506e-05, "loss": 2.3744, "step": 322780 }, { "epoch": 0.56, "learning_rate": 2.185465110195768e-05, "loss": 2.3171, "step": 322790 }, { "epoch": 0.56, "learning_rate": 2.1853779162030853e-05, "loss": 2.268, "step": 322800 }, { "epoch": 0.56, "learning_rate": 2.1852907222104027e-05, "loss": 2.4127, "step": 322810 }, { "epoch": 0.56, "learning_rate": 2.18520352821772e-05, "loss": 2.3494, "step": 322820 }, { "epoch": 0.56, "learning_rate": 2.185116334225037e-05, "loss": 2.3664, "step": 322830 }, { "epoch": 0.56, "learning_rate": 2.185029140232355e-05, "loss": 2.3906, "step": 322840 }, { "epoch": 0.56, "learning_rate": 2.184941946239672e-05, "loss": 2.4184, "step": 322850 }, { "epoch": 0.56, "learning_rate": 2.1848547522469893e-05, "loss": 2.3993, "step": 322860 }, { "epoch": 0.56, "learning_rate": 2.1847675582543066e-05, "loss": 2.3118, "step": 322870 }, { "epoch": 0.56, "learning_rate": 2.184680364261624e-05, "loss": 2.3401, "step": 322880 }, { "epoch": 0.56, "learning_rate": 2.184593170268941e-05, "loss": 2.4143, "step": 322890 }, { "epoch": 0.56, "learning_rate": 2.1845059762762584e-05, "loss": 2.3244, "step": 322900 }, { "epoch": 0.56, "learning_rate": 2.184418782283576e-05, "loss": 2.2556, "step": 322910 }, { "epoch": 0.56, "learning_rate": 2.1843315882908932e-05, "loss": 2.4289, "step": 322920 }, { "epoch": 0.56, "learning_rate": 2.1842443942982106e-05, "loss": 2.3631, "step": 322930 }, { "epoch": 0.56, "learning_rate": 2.1841572003055276e-05, "loss": 2.3868, "step": 322940 }, { "epoch": 0.56, "learning_rate": 2.1840700063128453e-05, "loss": 2.2177, "step": 322950 }, { "epoch": 0.56, "learning_rate": 2.1839828123201624e-05, "loss": 2.4083, "step": 322960 }, { "epoch": 0.56, "learning_rate": 2.1838956183274797e-05, "loss": 2.3973, "step": 322970 }, { "epoch": 0.56, "learning_rate": 2.183808424334797e-05, "loss": 2.3968, "step": 322980 }, { "epoch": 0.56, "learning_rate": 2.1837212303421145e-05, "loss": 2.3966, "step": 322990 }, { "epoch": 0.56, "learning_rate": 2.183634036349432e-05, "loss": 2.1521, "step": 323000 }, { "epoch": 0.56, "learning_rate": 2.183546842356749e-05, "loss": 2.293, "step": 323010 }, { "epoch": 0.56, "learning_rate": 2.1834596483640666e-05, "loss": 2.365, "step": 323020 }, { "epoch": 0.56, "learning_rate": 2.1833724543713837e-05, "loss": 2.3218, "step": 323030 }, { "epoch": 0.56, "learning_rate": 2.183285260378701e-05, "loss": 2.3536, "step": 323040 }, { "epoch": 0.56, "learning_rate": 2.1831980663860184e-05, "loss": 2.3527, "step": 323050 }, { "epoch": 0.56, "learning_rate": 2.1831108723933358e-05, "loss": 2.3366, "step": 323060 }, { "epoch": 0.56, "learning_rate": 2.1830236784006532e-05, "loss": 2.3599, "step": 323070 }, { "epoch": 0.56, "learning_rate": 2.1829364844079702e-05, "loss": 2.3121, "step": 323080 }, { "epoch": 0.56, "learning_rate": 2.1828492904152876e-05, "loss": 2.3471, "step": 323090 }, { "epoch": 0.56, "learning_rate": 2.182762096422605e-05, "loss": 2.302, "step": 323100 }, { "epoch": 0.56, "learning_rate": 2.1826749024299223e-05, "loss": 2.3995, "step": 323110 }, { "epoch": 0.56, "learning_rate": 2.1825877084372394e-05, "loss": 2.3042, "step": 323120 }, { "epoch": 0.56, "learning_rate": 2.182500514444557e-05, "loss": 2.4492, "step": 323130 }, { "epoch": 0.56, "learning_rate": 2.182413320451874e-05, "loss": 2.3296, "step": 323140 }, { "epoch": 0.56, "learning_rate": 2.1823261264591915e-05, "loss": 2.3594, "step": 323150 }, { "epoch": 0.56, "learning_rate": 2.182238932466509e-05, "loss": 2.3172, "step": 323160 }, { "epoch": 0.56, "learning_rate": 2.1821517384738263e-05, "loss": 2.3962, "step": 323170 }, { "epoch": 0.56, "learning_rate": 2.1820645444811436e-05, "loss": 2.3268, "step": 323180 }, { "epoch": 0.56, "learning_rate": 2.1819773504884607e-05, "loss": 2.3174, "step": 323190 }, { "epoch": 0.56, "learning_rate": 2.181890156495778e-05, "loss": 2.2225, "step": 323200 }, { "epoch": 0.56, "learning_rate": 2.1818029625030954e-05, "loss": 2.3102, "step": 323210 }, { "epoch": 0.56, "learning_rate": 2.1817157685104128e-05, "loss": 2.3743, "step": 323220 }, { "epoch": 0.56, "learning_rate": 2.1816285745177302e-05, "loss": 2.3855, "step": 323230 }, { "epoch": 0.56, "learning_rate": 2.1815413805250476e-05, "loss": 2.32, "step": 323240 }, { "epoch": 0.56, "learning_rate": 2.181454186532365e-05, "loss": 2.3448, "step": 323250 }, { "epoch": 0.56, "learning_rate": 2.181366992539682e-05, "loss": 2.3667, "step": 323260 }, { "epoch": 0.56, "learning_rate": 2.1812797985469994e-05, "loss": 2.3675, "step": 323270 }, { "epoch": 0.56, "learning_rate": 2.1811926045543167e-05, "loss": 2.331, "step": 323280 }, { "epoch": 0.56, "learning_rate": 2.181105410561634e-05, "loss": 2.3712, "step": 323290 }, { "epoch": 0.56, "learning_rate": 2.1810182165689515e-05, "loss": 2.3333, "step": 323300 }, { "epoch": 0.56, "learning_rate": 2.1809310225762685e-05, "loss": 2.2524, "step": 323310 }, { "epoch": 0.56, "learning_rate": 2.1808438285835862e-05, "loss": 2.3064, "step": 323320 }, { "epoch": 0.56, "learning_rate": 2.1807566345909033e-05, "loss": 2.3077, "step": 323330 }, { "epoch": 0.56, "learning_rate": 2.1806694405982207e-05, "loss": 2.3643, "step": 323340 }, { "epoch": 0.56, "learning_rate": 2.1805822466055377e-05, "loss": 2.4481, "step": 323350 }, { "epoch": 0.56, "learning_rate": 2.1804950526128554e-05, "loss": 2.3148, "step": 323360 }, { "epoch": 0.56, "learning_rate": 2.1804078586201724e-05, "loss": 2.2958, "step": 323370 }, { "epoch": 0.56, "learning_rate": 2.1803206646274898e-05, "loss": 2.4328, "step": 323380 }, { "epoch": 0.56, "learning_rate": 2.1802334706348075e-05, "loss": 2.3577, "step": 323390 }, { "epoch": 0.56, "learning_rate": 2.1801462766421246e-05, "loss": 2.3483, "step": 323400 }, { "epoch": 0.56, "learning_rate": 2.180059082649442e-05, "loss": 2.2729, "step": 323410 }, { "epoch": 0.56, "learning_rate": 2.179971888656759e-05, "loss": 2.2716, "step": 323420 }, { "epoch": 0.56, "learning_rate": 2.1798846946640767e-05, "loss": 2.278, "step": 323430 }, { "epoch": 0.56, "learning_rate": 2.1797975006713937e-05, "loss": 2.4747, "step": 323440 }, { "epoch": 0.56, "learning_rate": 2.179710306678711e-05, "loss": 2.3499, "step": 323450 }, { "epoch": 0.56, "learning_rate": 2.1796231126860285e-05, "loss": 2.3181, "step": 323460 }, { "epoch": 0.56, "learning_rate": 2.179535918693346e-05, "loss": 2.3954, "step": 323470 }, { "epoch": 0.56, "learning_rate": 2.1794487247006633e-05, "loss": 2.2611, "step": 323480 }, { "epoch": 0.56, "learning_rate": 2.1793615307079803e-05, "loss": 2.3054, "step": 323490 }, { "epoch": 0.56, "learning_rate": 2.179274336715298e-05, "loss": 2.299, "step": 323500 }, { "epoch": 0.56, "learning_rate": 2.179187142722615e-05, "loss": 2.3663, "step": 323510 }, { "epoch": 0.56, "learning_rate": 2.1790999487299324e-05, "loss": 2.2273, "step": 323520 }, { "epoch": 0.56, "learning_rate": 2.1790127547372498e-05, "loss": 2.3146, "step": 323530 }, { "epoch": 0.56, "learning_rate": 2.1789255607445672e-05, "loss": 2.2908, "step": 323540 }, { "epoch": 0.56, "learning_rate": 2.1788383667518846e-05, "loss": 2.3464, "step": 323550 }, { "epoch": 0.56, "learning_rate": 2.1787511727592016e-05, "loss": 2.3571, "step": 323560 }, { "epoch": 0.56, "learning_rate": 2.178663978766519e-05, "loss": 2.3218, "step": 323570 }, { "epoch": 0.56, "learning_rate": 2.1785767847738363e-05, "loss": 2.4122, "step": 323580 }, { "epoch": 0.56, "learning_rate": 2.1784895907811537e-05, "loss": 2.4264, "step": 323590 }, { "epoch": 0.56, "learning_rate": 2.1784023967884708e-05, "loss": 2.2904, "step": 323600 }, { "epoch": 0.56, "learning_rate": 2.178315202795788e-05, "loss": 2.3645, "step": 323610 }, { "epoch": 0.56, "learning_rate": 2.1782280088031055e-05, "loss": 2.3752, "step": 323620 }, { "epoch": 0.56, "learning_rate": 2.178140814810423e-05, "loss": 2.3916, "step": 323630 }, { "epoch": 0.56, "learning_rate": 2.1780536208177403e-05, "loss": 2.2, "step": 323640 }, { "epoch": 0.56, "learning_rate": 2.1779664268250576e-05, "loss": 2.2393, "step": 323650 }, { "epoch": 0.56, "learning_rate": 2.177879232832375e-05, "loss": 2.3722, "step": 323660 }, { "epoch": 0.56, "learning_rate": 2.177792038839692e-05, "loss": 2.2746, "step": 323670 }, { "epoch": 0.56, "learning_rate": 2.1777048448470094e-05, "loss": 2.3891, "step": 323680 }, { "epoch": 0.56, "learning_rate": 2.1776176508543268e-05, "loss": 2.3025, "step": 323690 }, { "epoch": 0.56, "learning_rate": 2.1775304568616442e-05, "loss": 2.3342, "step": 323700 }, { "epoch": 0.56, "learning_rate": 2.1774432628689616e-05, "loss": 2.3353, "step": 323710 }, { "epoch": 0.56, "learning_rate": 2.1773560688762786e-05, "loss": 2.3393, "step": 323720 }, { "epoch": 0.56, "learning_rate": 2.1772688748835963e-05, "loss": 2.2925, "step": 323730 }, { "epoch": 0.56, "learning_rate": 2.1771816808909134e-05, "loss": 2.2444, "step": 323740 }, { "epoch": 0.56, "learning_rate": 2.1770944868982307e-05, "loss": 2.5031, "step": 323750 }, { "epoch": 0.56, "learning_rate": 2.1770072929055478e-05, "loss": 2.3171, "step": 323760 }, { "epoch": 0.56, "learning_rate": 2.1769200989128655e-05, "loss": 2.3432, "step": 323770 }, { "epoch": 0.56, "learning_rate": 2.176832904920183e-05, "loss": 2.2618, "step": 323780 }, { "epoch": 0.56, "learning_rate": 2.1767457109275e-05, "loss": 2.3705, "step": 323790 }, { "epoch": 0.56, "learning_rate": 2.1766585169348176e-05, "loss": 2.2998, "step": 323800 }, { "epoch": 0.56, "learning_rate": 2.1765713229421347e-05, "loss": 2.4165, "step": 323810 }, { "epoch": 0.56, "learning_rate": 2.176484128949452e-05, "loss": 2.3463, "step": 323820 }, { "epoch": 0.56, "learning_rate": 2.176396934956769e-05, "loss": 2.4572, "step": 323830 }, { "epoch": 0.56, "learning_rate": 2.1763097409640868e-05, "loss": 2.1615, "step": 323840 }, { "epoch": 0.56, "learning_rate": 2.176222546971404e-05, "loss": 2.2716, "step": 323850 }, { "epoch": 0.56, "learning_rate": 2.1761353529787212e-05, "loss": 2.3645, "step": 323860 }, { "epoch": 0.56, "learning_rate": 2.1760481589860386e-05, "loss": 2.4038, "step": 323870 }, { "epoch": 0.56, "learning_rate": 2.175960964993356e-05, "loss": 2.2059, "step": 323880 }, { "epoch": 0.56, "learning_rate": 2.1758737710006733e-05, "loss": 2.3659, "step": 323890 }, { "epoch": 0.56, "learning_rate": 2.1757865770079904e-05, "loss": 2.3279, "step": 323900 }, { "epoch": 0.56, "learning_rate": 2.175699383015308e-05, "loss": 2.328, "step": 323910 }, { "epoch": 0.56, "learning_rate": 2.175612189022625e-05, "loss": 2.3479, "step": 323920 }, { "epoch": 0.56, "learning_rate": 2.1755249950299425e-05, "loss": 2.3345, "step": 323930 }, { "epoch": 0.56, "learning_rate": 2.17543780103726e-05, "loss": 2.3089, "step": 323940 }, { "epoch": 0.56, "learning_rate": 2.1753506070445773e-05, "loss": 2.3647, "step": 323950 }, { "epoch": 0.56, "learning_rate": 2.1752634130518946e-05, "loss": 2.3164, "step": 323960 }, { "epoch": 0.56, "learning_rate": 2.1751762190592117e-05, "loss": 2.3977, "step": 323970 }, { "epoch": 0.56, "learning_rate": 2.175089025066529e-05, "loss": 2.2806, "step": 323980 }, { "epoch": 0.56, "learning_rate": 2.1750018310738464e-05, "loss": 2.3459, "step": 323990 }, { "epoch": 0.57, "learning_rate": 2.1749146370811638e-05, "loss": 2.3291, "step": 324000 }, { "epoch": 0.57, "learning_rate": 2.1748274430884812e-05, "loss": 2.2928, "step": 324010 }, { "epoch": 0.57, "learning_rate": 2.1747402490957982e-05, "loss": 2.3442, "step": 324020 }, { "epoch": 0.57, "learning_rate": 2.174653055103116e-05, "loss": 2.3405, "step": 324030 }, { "epoch": 0.57, "learning_rate": 2.174565861110433e-05, "loss": 2.4095, "step": 324040 }, { "epoch": 0.57, "learning_rate": 2.1744786671177504e-05, "loss": 2.3156, "step": 324050 }, { "epoch": 0.57, "learning_rate": 2.1743914731250677e-05, "loss": 2.3552, "step": 324060 }, { "epoch": 0.57, "learning_rate": 2.174304279132385e-05, "loss": 2.3214, "step": 324070 }, { "epoch": 0.57, "learning_rate": 2.174217085139702e-05, "loss": 2.3239, "step": 324080 }, { "epoch": 0.57, "learning_rate": 2.1741298911470195e-05, "loss": 2.2569, "step": 324090 }, { "epoch": 0.57, "learning_rate": 2.174042697154337e-05, "loss": 2.3726, "step": 324100 }, { "epoch": 0.57, "learning_rate": 2.1739555031616543e-05, "loss": 2.2854, "step": 324110 }, { "epoch": 0.57, "learning_rate": 2.1738683091689717e-05, "loss": 2.2577, "step": 324120 }, { "epoch": 0.57, "learning_rate": 2.1737811151762887e-05, "loss": 2.3584, "step": 324130 }, { "epoch": 0.57, "learning_rate": 2.1736939211836064e-05, "loss": 2.4694, "step": 324140 }, { "epoch": 0.57, "learning_rate": 2.1736067271909234e-05, "loss": 2.2618, "step": 324150 }, { "epoch": 0.57, "learning_rate": 2.1735195331982408e-05, "loss": 2.2758, "step": 324160 }, { "epoch": 0.57, "learning_rate": 2.1734323392055582e-05, "loss": 2.2685, "step": 324170 }, { "epoch": 0.57, "learning_rate": 2.1733451452128756e-05, "loss": 2.3522, "step": 324180 }, { "epoch": 0.57, "learning_rate": 2.173257951220193e-05, "loss": 2.3359, "step": 324190 }, { "epoch": 0.57, "learning_rate": 2.17317075722751e-05, "loss": 2.4001, "step": 324200 }, { "epoch": 0.57, "learning_rate": 2.1730835632348277e-05, "loss": 2.3169, "step": 324210 }, { "epoch": 0.57, "learning_rate": 2.1729963692421447e-05, "loss": 2.3137, "step": 324220 }, { "epoch": 0.57, "learning_rate": 2.172909175249462e-05, "loss": 2.3458, "step": 324230 }, { "epoch": 0.57, "learning_rate": 2.172821981256779e-05, "loss": 2.4613, "step": 324240 }, { "epoch": 0.57, "learning_rate": 2.172734787264097e-05, "loss": 2.3482, "step": 324250 }, { "epoch": 0.57, "learning_rate": 2.1726475932714143e-05, "loss": 2.4159, "step": 324260 }, { "epoch": 0.57, "learning_rate": 2.1725603992787313e-05, "loss": 2.4192, "step": 324270 }, { "epoch": 0.57, "learning_rate": 2.1724732052860487e-05, "loss": 2.2986, "step": 324280 }, { "epoch": 0.57, "learning_rate": 2.172386011293366e-05, "loss": 2.406, "step": 324290 }, { "epoch": 0.57, "learning_rate": 2.1722988173006834e-05, "loss": 2.3291, "step": 324300 }, { "epoch": 0.57, "learning_rate": 2.1722116233080005e-05, "loss": 2.2723, "step": 324310 }, { "epoch": 0.57, "learning_rate": 2.1721244293153182e-05, "loss": 2.3499, "step": 324320 }, { "epoch": 0.57, "learning_rate": 2.1720372353226352e-05, "loss": 2.3657, "step": 324330 }, { "epoch": 0.57, "learning_rate": 2.1719500413299526e-05, "loss": 2.21, "step": 324340 }, { "epoch": 0.57, "learning_rate": 2.17186284733727e-05, "loss": 2.2857, "step": 324350 }, { "epoch": 0.57, "learning_rate": 2.1717756533445874e-05, "loss": 2.312, "step": 324360 }, { "epoch": 0.57, "learning_rate": 2.1716884593519047e-05, "loss": 2.3438, "step": 324370 }, { "epoch": 0.57, "learning_rate": 2.1716012653592218e-05, "loss": 2.3486, "step": 324380 }, { "epoch": 0.57, "learning_rate": 2.171514071366539e-05, "loss": 2.2784, "step": 324390 }, { "epoch": 0.57, "learning_rate": 2.1714268773738565e-05, "loss": 2.3863, "step": 324400 }, { "epoch": 0.57, "learning_rate": 2.171339683381174e-05, "loss": 2.4562, "step": 324410 }, { "epoch": 0.57, "learning_rate": 2.1712524893884913e-05, "loss": 2.42, "step": 324420 }, { "epoch": 0.57, "learning_rate": 2.1711652953958087e-05, "loss": 2.2824, "step": 324430 }, { "epoch": 0.57, "learning_rate": 2.171078101403126e-05, "loss": 2.3439, "step": 324440 }, { "epoch": 0.57, "learning_rate": 2.170990907410443e-05, "loss": 2.3629, "step": 324450 }, { "epoch": 0.57, "learning_rate": 2.1709037134177604e-05, "loss": 2.4285, "step": 324460 }, { "epoch": 0.57, "learning_rate": 2.1708165194250778e-05, "loss": 2.3181, "step": 324470 }, { "epoch": 0.57, "learning_rate": 2.1707293254323952e-05, "loss": 2.3222, "step": 324480 }, { "epoch": 0.57, "learning_rate": 2.1706421314397122e-05, "loss": 2.3361, "step": 324490 }, { "epoch": 0.57, "learning_rate": 2.1705549374470296e-05, "loss": 2.4158, "step": 324500 }, { "epoch": 0.57, "learning_rate": 2.1704677434543473e-05, "loss": 2.3583, "step": 324510 }, { "epoch": 0.57, "learning_rate": 2.1703805494616644e-05, "loss": 2.3139, "step": 324520 }, { "epoch": 0.57, "learning_rate": 2.1702933554689817e-05, "loss": 2.3242, "step": 324530 }, { "epoch": 0.57, "learning_rate": 2.1702061614762988e-05, "loss": 2.3238, "step": 324540 }, { "epoch": 0.57, "learning_rate": 2.1701189674836165e-05, "loss": 2.3436, "step": 324550 }, { "epoch": 0.57, "learning_rate": 2.1700317734909335e-05, "loss": 2.3601, "step": 324560 }, { "epoch": 0.57, "learning_rate": 2.169944579498251e-05, "loss": 2.3334, "step": 324570 }, { "epoch": 0.57, "learning_rate": 2.1698573855055683e-05, "loss": 2.3025, "step": 324580 }, { "epoch": 0.57, "learning_rate": 2.1697701915128857e-05, "loss": 2.3521, "step": 324590 }, { "epoch": 0.57, "learning_rate": 2.169682997520203e-05, "loss": 2.3927, "step": 324600 }, { "epoch": 0.57, "learning_rate": 2.16959580352752e-05, "loss": 2.1775, "step": 324610 }, { "epoch": 0.57, "learning_rate": 2.1695086095348378e-05, "loss": 2.4065, "step": 324620 }, { "epoch": 0.57, "learning_rate": 2.169421415542155e-05, "loss": 2.4272, "step": 324630 }, { "epoch": 0.57, "learning_rate": 2.1693342215494722e-05, "loss": 2.4426, "step": 324640 }, { "epoch": 0.57, "learning_rate": 2.1692470275567896e-05, "loss": 2.3795, "step": 324650 }, { "epoch": 0.57, "learning_rate": 2.169159833564107e-05, "loss": 2.535, "step": 324660 }, { "epoch": 0.57, "learning_rate": 2.1690726395714243e-05, "loss": 2.3735, "step": 324670 }, { "epoch": 0.57, "learning_rate": 2.1689854455787414e-05, "loss": 2.3002, "step": 324680 }, { "epoch": 0.57, "learning_rate": 2.1688982515860588e-05, "loss": 2.3278, "step": 324690 }, { "epoch": 0.57, "learning_rate": 2.168811057593376e-05, "loss": 2.3897, "step": 324700 }, { "epoch": 0.57, "learning_rate": 2.1687238636006935e-05, "loss": 2.3375, "step": 324710 }, { "epoch": 0.57, "learning_rate": 2.1686366696080106e-05, "loss": 2.4145, "step": 324720 }, { "epoch": 0.57, "learning_rate": 2.1685494756153283e-05, "loss": 2.2415, "step": 324730 }, { "epoch": 0.57, "learning_rate": 2.1684622816226456e-05, "loss": 2.1979, "step": 324740 }, { "epoch": 0.57, "learning_rate": 2.1683750876299627e-05, "loss": 2.3504, "step": 324750 }, { "epoch": 0.57, "learning_rate": 2.16828789363728e-05, "loss": 2.5496, "step": 324760 }, { "epoch": 0.57, "learning_rate": 2.1682006996445974e-05, "loss": 2.277, "step": 324770 }, { "epoch": 0.57, "learning_rate": 2.1681135056519148e-05, "loss": 2.251, "step": 324780 }, { "epoch": 0.57, "learning_rate": 2.168026311659232e-05, "loss": 2.3996, "step": 324790 }, { "epoch": 0.57, "learning_rate": 2.1679391176665492e-05, "loss": 2.4412, "step": 324800 }, { "epoch": 0.57, "learning_rate": 2.1678519236738666e-05, "loss": 2.3214, "step": 324810 }, { "epoch": 0.57, "learning_rate": 2.167764729681184e-05, "loss": 2.234, "step": 324820 }, { "epoch": 0.57, "learning_rate": 2.1676775356885014e-05, "loss": 2.3437, "step": 324830 }, { "epoch": 0.57, "learning_rate": 2.1675903416958187e-05, "loss": 2.3327, "step": 324840 }, { "epoch": 0.57, "learning_rate": 2.167503147703136e-05, "loss": 2.303, "step": 324850 }, { "epoch": 0.57, "learning_rate": 2.167415953710453e-05, "loss": 2.3563, "step": 324860 }, { "epoch": 0.57, "learning_rate": 2.1673287597177705e-05, "loss": 2.3669, "step": 324870 }, { "epoch": 0.57, "learning_rate": 2.167241565725088e-05, "loss": 2.2141, "step": 324880 }, { "epoch": 0.57, "learning_rate": 2.1671543717324053e-05, "loss": 2.3145, "step": 324890 }, { "epoch": 0.57, "learning_rate": 2.1670671777397227e-05, "loss": 2.3361, "step": 324900 }, { "epoch": 0.57, "learning_rate": 2.1669799837470397e-05, "loss": 2.348, "step": 324910 }, { "epoch": 0.57, "learning_rate": 2.1668927897543574e-05, "loss": 2.3332, "step": 324920 }, { "epoch": 0.57, "learning_rate": 2.1668055957616745e-05, "loss": 2.3945, "step": 324930 }, { "epoch": 0.57, "learning_rate": 2.1667184017689918e-05, "loss": 2.3782, "step": 324940 }, { "epoch": 0.57, "learning_rate": 2.166631207776309e-05, "loss": 2.3308, "step": 324950 }, { "epoch": 0.57, "learning_rate": 2.1665440137836266e-05, "loss": 2.3711, "step": 324960 }, { "epoch": 0.57, "learning_rate": 2.1664568197909436e-05, "loss": 2.367, "step": 324970 }, { "epoch": 0.57, "learning_rate": 2.166369625798261e-05, "loss": 2.3798, "step": 324980 }, { "epoch": 0.57, "learning_rate": 2.1662824318055787e-05, "loss": 2.3459, "step": 324990 }, { "epoch": 0.57, "learning_rate": 2.1661952378128958e-05, "loss": 2.3554, "step": 325000 }, { "epoch": 0.57, "learning_rate": 2.166108043820213e-05, "loss": 2.398, "step": 325010 }, { "epoch": 0.57, "learning_rate": 2.16602084982753e-05, "loss": 2.2237, "step": 325020 }, { "epoch": 0.57, "learning_rate": 2.165933655834848e-05, "loss": 2.3121, "step": 325030 }, { "epoch": 0.57, "learning_rate": 2.165846461842165e-05, "loss": 2.3307, "step": 325040 }, { "epoch": 0.57, "learning_rate": 2.1657592678494823e-05, "loss": 2.3645, "step": 325050 }, { "epoch": 0.57, "learning_rate": 2.1656720738567997e-05, "loss": 2.3873, "step": 325060 }, { "epoch": 0.57, "learning_rate": 2.165584879864117e-05, "loss": 2.3477, "step": 325070 }, { "epoch": 0.57, "learning_rate": 2.1654976858714344e-05, "loss": 2.2482, "step": 325080 }, { "epoch": 0.57, "learning_rate": 2.1654104918787515e-05, "loss": 2.427, "step": 325090 }, { "epoch": 0.57, "learning_rate": 2.1653232978860692e-05, "loss": 2.3261, "step": 325100 }, { "epoch": 0.57, "learning_rate": 2.1652361038933862e-05, "loss": 2.2743, "step": 325110 }, { "epoch": 0.57, "learning_rate": 2.1651489099007036e-05, "loss": 2.3925, "step": 325120 }, { "epoch": 0.57, "learning_rate": 2.165061715908021e-05, "loss": 2.3315, "step": 325130 }, { "epoch": 0.57, "learning_rate": 2.1649745219153384e-05, "loss": 2.2498, "step": 325140 }, { "epoch": 0.57, "learning_rate": 2.1648873279226557e-05, "loss": 2.3311, "step": 325150 }, { "epoch": 0.57, "learning_rate": 2.1648001339299728e-05, "loss": 2.3887, "step": 325160 }, { "epoch": 0.57, "learning_rate": 2.16471293993729e-05, "loss": 2.3769, "step": 325170 }, { "epoch": 0.57, "learning_rate": 2.1646257459446075e-05, "loss": 2.4127, "step": 325180 }, { "epoch": 0.57, "learning_rate": 2.164538551951925e-05, "loss": 2.4282, "step": 325190 }, { "epoch": 0.57, "learning_rate": 2.164451357959242e-05, "loss": 2.2962, "step": 325200 }, { "epoch": 0.57, "learning_rate": 2.1643641639665593e-05, "loss": 2.3028, "step": 325210 }, { "epoch": 0.57, "learning_rate": 2.1642769699738767e-05, "loss": 2.3608, "step": 325220 }, { "epoch": 0.57, "learning_rate": 2.164189775981194e-05, "loss": 2.2981, "step": 325230 }, { "epoch": 0.57, "learning_rate": 2.1641025819885114e-05, "loss": 2.3271, "step": 325240 }, { "epoch": 0.57, "learning_rate": 2.1640153879958288e-05, "loss": 2.4282, "step": 325250 }, { "epoch": 0.57, "learning_rate": 2.1639281940031462e-05, "loss": 2.3707, "step": 325260 }, { "epoch": 0.57, "learning_rate": 2.1638410000104632e-05, "loss": 2.3439, "step": 325270 }, { "epoch": 0.57, "learning_rate": 2.1637538060177806e-05, "loss": 2.2964, "step": 325280 }, { "epoch": 0.57, "learning_rate": 2.163666612025098e-05, "loss": 2.2897, "step": 325290 }, { "epoch": 0.57, "learning_rate": 2.1635794180324154e-05, "loss": 2.2683, "step": 325300 }, { "epoch": 0.57, "learning_rate": 2.1634922240397327e-05, "loss": 2.4125, "step": 325310 }, { "epoch": 0.57, "learning_rate": 2.1634050300470498e-05, "loss": 2.4071, "step": 325320 }, { "epoch": 0.57, "learning_rate": 2.1633178360543675e-05, "loss": 2.3953, "step": 325330 }, { "epoch": 0.57, "learning_rate": 2.1632306420616845e-05, "loss": 2.3523, "step": 325340 }, { "epoch": 0.57, "learning_rate": 2.163143448069002e-05, "loss": 2.3922, "step": 325350 }, { "epoch": 0.57, "learning_rate": 2.1630562540763193e-05, "loss": 2.2905, "step": 325360 }, { "epoch": 0.57, "learning_rate": 2.1629690600836367e-05, "loss": 2.3148, "step": 325370 }, { "epoch": 0.57, "learning_rate": 2.162881866090954e-05, "loss": 2.3729, "step": 325380 }, { "epoch": 0.57, "learning_rate": 2.162794672098271e-05, "loss": 2.379, "step": 325390 }, { "epoch": 0.57, "learning_rate": 2.1627074781055888e-05, "loss": 2.3793, "step": 325400 }, { "epoch": 0.57, "learning_rate": 2.162620284112906e-05, "loss": 2.3651, "step": 325410 }, { "epoch": 0.57, "learning_rate": 2.1625330901202232e-05, "loss": 2.2779, "step": 325420 }, { "epoch": 0.57, "learning_rate": 2.1624458961275403e-05, "loss": 2.2842, "step": 325430 }, { "epoch": 0.57, "learning_rate": 2.162358702134858e-05, "loss": 2.3994, "step": 325440 }, { "epoch": 0.57, "learning_rate": 2.162271508142175e-05, "loss": 2.3735, "step": 325450 }, { "epoch": 0.57, "learning_rate": 2.1621843141494924e-05, "loss": 2.2903, "step": 325460 }, { "epoch": 0.57, "learning_rate": 2.1620971201568098e-05, "loss": 2.3159, "step": 325470 }, { "epoch": 0.57, "learning_rate": 2.162009926164127e-05, "loss": 2.1918, "step": 325480 }, { "epoch": 0.57, "learning_rate": 2.1619227321714445e-05, "loss": 2.4497, "step": 325490 }, { "epoch": 0.57, "learning_rate": 2.1618355381787616e-05, "loss": 2.3086, "step": 325500 }, { "epoch": 0.57, "learning_rate": 2.1617483441860793e-05, "loss": 2.4627, "step": 325510 }, { "epoch": 0.57, "learning_rate": 2.1616611501933963e-05, "loss": 2.3617, "step": 325520 }, { "epoch": 0.57, "learning_rate": 2.1615739562007137e-05, "loss": 2.3771, "step": 325530 }, { "epoch": 0.57, "learning_rate": 2.161486762208031e-05, "loss": 2.4072, "step": 325540 }, { "epoch": 0.57, "learning_rate": 2.1613995682153484e-05, "loss": 2.3025, "step": 325550 }, { "epoch": 0.57, "learning_rate": 2.1613123742226658e-05, "loss": 2.3435, "step": 325560 }, { "epoch": 0.57, "learning_rate": 2.161225180229983e-05, "loss": 2.4122, "step": 325570 }, { "epoch": 0.57, "learning_rate": 2.1611379862373002e-05, "loss": 2.2751, "step": 325580 }, { "epoch": 0.57, "learning_rate": 2.1610507922446176e-05, "loss": 2.342, "step": 325590 }, { "epoch": 0.57, "learning_rate": 2.160963598251935e-05, "loss": 2.3612, "step": 325600 }, { "epoch": 0.57, "learning_rate": 2.1608764042592524e-05, "loss": 2.3398, "step": 325610 }, { "epoch": 0.57, "learning_rate": 2.1607892102665694e-05, "loss": 2.3732, "step": 325620 }, { "epoch": 0.57, "learning_rate": 2.160702016273887e-05, "loss": 2.3597, "step": 325630 }, { "epoch": 0.57, "learning_rate": 2.160614822281204e-05, "loss": 2.366, "step": 325640 }, { "epoch": 0.57, "learning_rate": 2.1605276282885215e-05, "loss": 2.4004, "step": 325650 }, { "epoch": 0.57, "learning_rate": 2.160440434295839e-05, "loss": 2.4164, "step": 325660 }, { "epoch": 0.57, "learning_rate": 2.1603532403031563e-05, "loss": 2.388, "step": 325670 }, { "epoch": 0.57, "learning_rate": 2.1602660463104733e-05, "loss": 2.3688, "step": 325680 }, { "epoch": 0.57, "learning_rate": 2.1601788523177907e-05, "loss": 2.2449, "step": 325690 }, { "epoch": 0.57, "learning_rate": 2.160091658325108e-05, "loss": 2.3607, "step": 325700 }, { "epoch": 0.57, "learning_rate": 2.1600044643324255e-05, "loss": 2.2932, "step": 325710 }, { "epoch": 0.57, "learning_rate": 2.1599172703397428e-05, "loss": 2.3354, "step": 325720 }, { "epoch": 0.57, "learning_rate": 2.15983007634706e-05, "loss": 2.3635, "step": 325730 }, { "epoch": 0.57, "learning_rate": 2.1597428823543776e-05, "loss": 2.3701, "step": 325740 }, { "epoch": 0.57, "learning_rate": 2.1596556883616946e-05, "loss": 2.2344, "step": 325750 }, { "epoch": 0.57, "learning_rate": 2.159568494369012e-05, "loss": 2.2932, "step": 325760 }, { "epoch": 0.57, "learning_rate": 2.1594813003763294e-05, "loss": 2.2381, "step": 325770 }, { "epoch": 0.57, "learning_rate": 2.1593941063836468e-05, "loss": 2.3297, "step": 325780 }, { "epoch": 0.57, "learning_rate": 2.159306912390964e-05, "loss": 2.3016, "step": 325790 }, { "epoch": 0.57, "learning_rate": 2.159219718398281e-05, "loss": 2.3524, "step": 325800 }, { "epoch": 0.57, "learning_rate": 2.159132524405599e-05, "loss": 2.3665, "step": 325810 }, { "epoch": 0.57, "learning_rate": 2.159045330412916e-05, "loss": 2.4357, "step": 325820 }, { "epoch": 0.57, "learning_rate": 2.1589581364202333e-05, "loss": 2.3144, "step": 325830 }, { "epoch": 0.57, "learning_rate": 2.1588709424275503e-05, "loss": 2.3468, "step": 325840 }, { "epoch": 0.57, "learning_rate": 2.158783748434868e-05, "loss": 2.408, "step": 325850 }, { "epoch": 0.57, "learning_rate": 2.1586965544421854e-05, "loss": 2.3734, "step": 325860 }, { "epoch": 0.57, "learning_rate": 2.1586093604495025e-05, "loss": 2.4074, "step": 325870 }, { "epoch": 0.57, "learning_rate": 2.15852216645682e-05, "loss": 2.477, "step": 325880 }, { "epoch": 0.57, "learning_rate": 2.1584349724641372e-05, "loss": 2.432, "step": 325890 }, { "epoch": 0.57, "learning_rate": 2.1583477784714546e-05, "loss": 2.4178, "step": 325900 }, { "epoch": 0.57, "learning_rate": 2.1582605844787716e-05, "loss": 2.2547, "step": 325910 }, { "epoch": 0.57, "learning_rate": 2.1581733904860894e-05, "loss": 2.3103, "step": 325920 }, { "epoch": 0.57, "learning_rate": 2.1580861964934064e-05, "loss": 2.28, "step": 325930 }, { "epoch": 0.57, "learning_rate": 2.1579990025007238e-05, "loss": 2.2938, "step": 325940 }, { "epoch": 0.57, "learning_rate": 2.157911808508041e-05, "loss": 2.3712, "step": 325950 }, { "epoch": 0.57, "learning_rate": 2.1578246145153585e-05, "loss": 2.3598, "step": 325960 }, { "epoch": 0.57, "learning_rate": 2.157737420522676e-05, "loss": 2.3564, "step": 325970 }, { "epoch": 0.57, "learning_rate": 2.157650226529993e-05, "loss": 2.3423, "step": 325980 }, { "epoch": 0.57, "learning_rate": 2.1575630325373103e-05, "loss": 2.4945, "step": 325990 }, { "epoch": 0.57, "learning_rate": 2.1574758385446277e-05, "loss": 2.3916, "step": 326000 }, { "epoch": 0.57, "learning_rate": 2.157388644551945e-05, "loss": 2.3127, "step": 326010 }, { "epoch": 0.57, "learning_rate": 2.1573014505592624e-05, "loss": 2.3185, "step": 326020 }, { "epoch": 0.57, "learning_rate": 2.1572142565665798e-05, "loss": 2.3427, "step": 326030 }, { "epoch": 0.57, "learning_rate": 2.1571270625738972e-05, "loss": 2.2453, "step": 326040 }, { "epoch": 0.57, "learning_rate": 2.1570398685812142e-05, "loss": 2.2426, "step": 326050 }, { "epoch": 0.57, "learning_rate": 2.1569526745885316e-05, "loss": 2.4844, "step": 326060 }, { "epoch": 0.57, "learning_rate": 2.156865480595849e-05, "loss": 2.2634, "step": 326070 }, { "epoch": 0.57, "learning_rate": 2.1567782866031664e-05, "loss": 2.4328, "step": 326080 }, { "epoch": 0.57, "learning_rate": 2.1566910926104837e-05, "loss": 2.1761, "step": 326090 }, { "epoch": 0.57, "learning_rate": 2.1566038986178008e-05, "loss": 2.2846, "step": 326100 }, { "epoch": 0.57, "learning_rate": 2.1565167046251185e-05, "loss": 2.3706, "step": 326110 }, { "epoch": 0.57, "learning_rate": 2.1564295106324355e-05, "loss": 2.3939, "step": 326120 }, { "epoch": 0.57, "learning_rate": 2.156342316639753e-05, "loss": 2.3386, "step": 326130 }, { "epoch": 0.57, "learning_rate": 2.15625512264707e-05, "loss": 2.2984, "step": 326140 }, { "epoch": 0.57, "learning_rate": 2.1561679286543877e-05, "loss": 2.1456, "step": 326150 }, { "epoch": 0.57, "learning_rate": 2.1560807346617047e-05, "loss": 2.3765, "step": 326160 }, { "epoch": 0.57, "learning_rate": 2.155993540669022e-05, "loss": 2.3181, "step": 326170 }, { "epoch": 0.57, "learning_rate": 2.1559063466763395e-05, "loss": 2.3263, "step": 326180 }, { "epoch": 0.57, "learning_rate": 2.155819152683657e-05, "loss": 2.4416, "step": 326190 }, { "epoch": 0.57, "learning_rate": 2.1557319586909742e-05, "loss": 2.4508, "step": 326200 }, { "epoch": 0.57, "learning_rate": 2.1556447646982913e-05, "loss": 2.3513, "step": 326210 }, { "epoch": 0.57, "learning_rate": 2.155557570705609e-05, "loss": 2.3694, "step": 326220 }, { "epoch": 0.57, "learning_rate": 2.155470376712926e-05, "loss": 2.3011, "step": 326230 }, { "epoch": 0.57, "learning_rate": 2.1553831827202434e-05, "loss": 2.3944, "step": 326240 }, { "epoch": 0.57, "learning_rate": 2.1552959887275608e-05, "loss": 2.4008, "step": 326250 }, { "epoch": 0.57, "learning_rate": 2.155208794734878e-05, "loss": 2.3661, "step": 326260 }, { "epoch": 0.57, "learning_rate": 2.1551216007421955e-05, "loss": 2.3675, "step": 326270 }, { "epoch": 0.57, "learning_rate": 2.1550344067495126e-05, "loss": 2.4674, "step": 326280 }, { "epoch": 0.57, "learning_rate": 2.1549472127568303e-05, "loss": 2.2509, "step": 326290 }, { "epoch": 0.57, "learning_rate": 2.1548600187641473e-05, "loss": 2.3652, "step": 326300 }, { "epoch": 0.57, "learning_rate": 2.1547728247714647e-05, "loss": 2.3591, "step": 326310 }, { "epoch": 0.57, "learning_rate": 2.1546856307787817e-05, "loss": 2.3428, "step": 326320 }, { "epoch": 0.57, "learning_rate": 2.1545984367860994e-05, "loss": 2.3165, "step": 326330 }, { "epoch": 0.57, "learning_rate": 2.1545112427934168e-05, "loss": 2.4802, "step": 326340 }, { "epoch": 0.57, "learning_rate": 2.154424048800734e-05, "loss": 2.3266, "step": 326350 }, { "epoch": 0.57, "learning_rate": 2.1543368548080512e-05, "loss": 2.2585, "step": 326360 }, { "epoch": 0.57, "learning_rate": 2.1542496608153686e-05, "loss": 2.3584, "step": 326370 }, { "epoch": 0.57, "learning_rate": 2.154162466822686e-05, "loss": 2.3771, "step": 326380 }, { "epoch": 0.57, "learning_rate": 2.154075272830003e-05, "loss": 2.2731, "step": 326390 }, { "epoch": 0.57, "learning_rate": 2.1539880788373204e-05, "loss": 2.3346, "step": 326400 }, { "epoch": 0.57, "learning_rate": 2.1539008848446378e-05, "loss": 2.3257, "step": 326410 }, { "epoch": 0.57, "learning_rate": 2.153813690851955e-05, "loss": 2.3472, "step": 326420 }, { "epoch": 0.57, "learning_rate": 2.1537264968592725e-05, "loss": 2.2904, "step": 326430 }, { "epoch": 0.57, "learning_rate": 2.15363930286659e-05, "loss": 2.383, "step": 326440 }, { "epoch": 0.57, "learning_rate": 2.1535521088739073e-05, "loss": 2.2793, "step": 326450 }, { "epoch": 0.57, "learning_rate": 2.1534649148812243e-05, "loss": 2.3121, "step": 326460 }, { "epoch": 0.57, "learning_rate": 2.1533777208885417e-05, "loss": 2.2681, "step": 326470 }, { "epoch": 0.57, "learning_rate": 2.153290526895859e-05, "loss": 2.3793, "step": 326480 }, { "epoch": 0.57, "learning_rate": 2.1532033329031765e-05, "loss": 2.4144, "step": 326490 }, { "epoch": 0.57, "learning_rate": 2.1531161389104938e-05, "loss": 2.2392, "step": 326500 }, { "epoch": 0.57, "learning_rate": 2.153028944917811e-05, "loss": 2.3213, "step": 326510 }, { "epoch": 0.57, "learning_rate": 2.1529417509251286e-05, "loss": 2.3064, "step": 326520 }, { "epoch": 0.57, "learning_rate": 2.1528545569324456e-05, "loss": 2.3038, "step": 326530 }, { "epoch": 0.57, "learning_rate": 2.152767362939763e-05, "loss": 2.3707, "step": 326540 }, { "epoch": 0.57, "learning_rate": 2.15268016894708e-05, "loss": 2.325, "step": 326550 }, { "epoch": 0.57, "learning_rate": 2.1525929749543978e-05, "loss": 2.4135, "step": 326560 }, { "epoch": 0.57, "learning_rate": 2.1525057809617148e-05, "loss": 2.3384, "step": 326570 }, { "epoch": 0.57, "learning_rate": 2.152418586969032e-05, "loss": 2.4399, "step": 326580 }, { "epoch": 0.57, "learning_rate": 2.15233139297635e-05, "loss": 2.3208, "step": 326590 }, { "epoch": 0.57, "learning_rate": 2.152244198983667e-05, "loss": 2.3495, "step": 326600 }, { "epoch": 0.57, "learning_rate": 2.1521570049909843e-05, "loss": 2.3076, "step": 326610 }, { "epoch": 0.57, "learning_rate": 2.1520698109983013e-05, "loss": 2.3659, "step": 326620 }, { "epoch": 0.57, "learning_rate": 2.151982617005619e-05, "loss": 2.3612, "step": 326630 }, { "epoch": 0.57, "learning_rate": 2.151895423012936e-05, "loss": 2.3795, "step": 326640 }, { "epoch": 0.57, "learning_rate": 2.1518082290202535e-05, "loss": 2.4171, "step": 326650 }, { "epoch": 0.57, "learning_rate": 2.151721035027571e-05, "loss": 2.3143, "step": 326660 }, { "epoch": 0.57, "learning_rate": 2.1516338410348882e-05, "loss": 2.4504, "step": 326670 }, { "epoch": 0.57, "learning_rate": 2.1515466470422056e-05, "loss": 2.3162, "step": 326680 }, { "epoch": 0.57, "learning_rate": 2.1514594530495226e-05, "loss": 2.2518, "step": 326690 }, { "epoch": 0.57, "learning_rate": 2.1513722590568404e-05, "loss": 2.2392, "step": 326700 }, { "epoch": 0.57, "learning_rate": 2.1512850650641574e-05, "loss": 2.3268, "step": 326710 }, { "epoch": 0.57, "learning_rate": 2.1511978710714748e-05, "loss": 2.4256, "step": 326720 }, { "epoch": 0.57, "learning_rate": 2.151110677078792e-05, "loss": 2.2929, "step": 326730 }, { "epoch": 0.57, "learning_rate": 2.1510234830861095e-05, "loss": 2.3042, "step": 326740 }, { "epoch": 0.57, "learning_rate": 2.150936289093427e-05, "loss": 2.3999, "step": 326750 }, { "epoch": 0.57, "learning_rate": 2.150849095100744e-05, "loss": 2.3663, "step": 326760 }, { "epoch": 0.57, "learning_rate": 2.1507619011080613e-05, "loss": 2.3489, "step": 326770 }, { "epoch": 0.57, "learning_rate": 2.1506747071153787e-05, "loss": 2.3435, "step": 326780 }, { "epoch": 0.57, "learning_rate": 2.150587513122696e-05, "loss": 2.3479, "step": 326790 }, { "epoch": 0.57, "learning_rate": 2.150500319130013e-05, "loss": 2.3475, "step": 326800 }, { "epoch": 0.57, "learning_rate": 2.1504131251373305e-05, "loss": 2.3838, "step": 326810 }, { "epoch": 0.57, "learning_rate": 2.1503259311446482e-05, "loss": 2.4594, "step": 326820 }, { "epoch": 0.57, "learning_rate": 2.1502387371519652e-05, "loss": 2.3684, "step": 326830 }, { "epoch": 0.57, "learning_rate": 2.1501515431592826e-05, "loss": 2.306, "step": 326840 }, { "epoch": 0.57, "learning_rate": 2.1500643491666e-05, "loss": 2.3087, "step": 326850 }, { "epoch": 0.57, "learning_rate": 2.1499771551739174e-05, "loss": 2.3907, "step": 326860 }, { "epoch": 0.57, "learning_rate": 2.1498899611812344e-05, "loss": 2.2955, "step": 326870 }, { "epoch": 0.57, "learning_rate": 2.1498027671885518e-05, "loss": 2.2617, "step": 326880 }, { "epoch": 0.57, "learning_rate": 2.149715573195869e-05, "loss": 2.3548, "step": 326890 }, { "epoch": 0.57, "learning_rate": 2.1496283792031865e-05, "loss": 2.3454, "step": 326900 }, { "epoch": 0.57, "learning_rate": 2.149541185210504e-05, "loss": 2.3429, "step": 326910 }, { "epoch": 0.57, "learning_rate": 2.149453991217821e-05, "loss": 2.2985, "step": 326920 }, { "epoch": 0.57, "learning_rate": 2.1493667972251387e-05, "loss": 2.2237, "step": 326930 }, { "epoch": 0.57, "learning_rate": 2.1492796032324557e-05, "loss": 2.327, "step": 326940 }, { "epoch": 0.57, "learning_rate": 2.149192409239773e-05, "loss": 2.3252, "step": 326950 }, { "epoch": 0.57, "learning_rate": 2.1491052152470905e-05, "loss": 2.2553, "step": 326960 }, { "epoch": 0.57, "learning_rate": 2.149018021254408e-05, "loss": 2.4013, "step": 326970 }, { "epoch": 0.57, "learning_rate": 2.1489308272617252e-05, "loss": 2.3083, "step": 326980 }, { "epoch": 0.57, "learning_rate": 2.1488436332690423e-05, "loss": 2.3641, "step": 326990 }, { "epoch": 0.57, "learning_rate": 2.14875643927636e-05, "loss": 2.3702, "step": 327000 }, { "epoch": 0.57, "learning_rate": 2.148669245283677e-05, "loss": 2.3475, "step": 327010 }, { "epoch": 0.57, "learning_rate": 2.1485820512909944e-05, "loss": 2.3408, "step": 327020 }, { "epoch": 0.57, "learning_rate": 2.1484948572983114e-05, "loss": 2.3768, "step": 327030 }, { "epoch": 0.57, "learning_rate": 2.148407663305629e-05, "loss": 2.4606, "step": 327040 }, { "epoch": 0.57, "learning_rate": 2.1483204693129462e-05, "loss": 2.463, "step": 327050 }, { "epoch": 0.57, "learning_rate": 2.1482332753202636e-05, "loss": 2.3149, "step": 327060 }, { "epoch": 0.57, "learning_rate": 2.148146081327581e-05, "loss": 2.3492, "step": 327070 }, { "epoch": 0.57, "learning_rate": 2.1480588873348983e-05, "loss": 2.474, "step": 327080 }, { "epoch": 0.57, "learning_rate": 2.1479716933422157e-05, "loss": 2.3645, "step": 327090 }, { "epoch": 0.57, "learning_rate": 2.1478844993495327e-05, "loss": 2.3679, "step": 327100 }, { "epoch": 0.57, "learning_rate": 2.1477973053568504e-05, "loss": 2.3641, "step": 327110 }, { "epoch": 0.57, "learning_rate": 2.1477101113641675e-05, "loss": 2.3958, "step": 327120 }, { "epoch": 0.57, "learning_rate": 2.147622917371485e-05, "loss": 2.453, "step": 327130 }, { "epoch": 0.57, "learning_rate": 2.1475357233788022e-05, "loss": 2.3317, "step": 327140 }, { "epoch": 0.57, "learning_rate": 2.1474485293861196e-05, "loss": 2.2838, "step": 327150 }, { "epoch": 0.57, "learning_rate": 2.147361335393437e-05, "loss": 2.4008, "step": 327160 }, { "epoch": 0.57, "learning_rate": 2.147274141400754e-05, "loss": 2.2806, "step": 327170 }, { "epoch": 0.57, "learning_rate": 2.1471869474080714e-05, "loss": 2.3475, "step": 327180 }, { "epoch": 0.57, "learning_rate": 2.1470997534153888e-05, "loss": 2.3151, "step": 327190 }, { "epoch": 0.57, "learning_rate": 2.147012559422706e-05, "loss": 2.3756, "step": 327200 }, { "epoch": 0.57, "learning_rate": 2.1469253654300235e-05, "loss": 2.4463, "step": 327210 }, { "epoch": 0.57, "learning_rate": 2.1468381714373406e-05, "loss": 2.272, "step": 327220 }, { "epoch": 0.57, "learning_rate": 2.1467509774446583e-05, "loss": 2.4778, "step": 327230 }, { "epoch": 0.57, "learning_rate": 2.1466637834519753e-05, "loss": 2.3386, "step": 327240 }, { "epoch": 0.57, "learning_rate": 2.1465765894592927e-05, "loss": 2.3076, "step": 327250 }, { "epoch": 0.57, "learning_rate": 2.14648939546661e-05, "loss": 2.2943, "step": 327260 }, { "epoch": 0.57, "learning_rate": 2.1464022014739275e-05, "loss": 2.2784, "step": 327270 }, { "epoch": 0.57, "learning_rate": 2.1463150074812445e-05, "loss": 2.2831, "step": 327280 }, { "epoch": 0.57, "learning_rate": 2.146227813488562e-05, "loss": 2.454, "step": 327290 }, { "epoch": 0.57, "learning_rate": 2.1461406194958792e-05, "loss": 2.2842, "step": 327300 }, { "epoch": 0.57, "learning_rate": 2.1460534255031966e-05, "loss": 2.3019, "step": 327310 }, { "epoch": 0.57, "learning_rate": 2.145966231510514e-05, "loss": 2.3023, "step": 327320 }, { "epoch": 0.57, "learning_rate": 2.145879037517831e-05, "loss": 2.3825, "step": 327330 }, { "epoch": 0.57, "learning_rate": 2.1457918435251488e-05, "loss": 2.3717, "step": 327340 }, { "epoch": 0.57, "learning_rate": 2.1457046495324658e-05, "loss": 2.3264, "step": 327350 }, { "epoch": 0.57, "learning_rate": 2.145617455539783e-05, "loss": 2.3209, "step": 327360 }, { "epoch": 0.57, "learning_rate": 2.1455302615471005e-05, "loss": 2.3175, "step": 327370 }, { "epoch": 0.57, "learning_rate": 2.145443067554418e-05, "loss": 2.271, "step": 327380 }, { "epoch": 0.57, "learning_rate": 2.1453558735617353e-05, "loss": 2.3185, "step": 327390 }, { "epoch": 0.57, "learning_rate": 2.1452686795690523e-05, "loss": 2.4233, "step": 327400 }, { "epoch": 0.57, "learning_rate": 2.14518148557637e-05, "loss": 2.2855, "step": 327410 }, { "epoch": 0.57, "learning_rate": 2.145094291583687e-05, "loss": 2.2325, "step": 327420 }, { "epoch": 0.57, "learning_rate": 2.1450070975910045e-05, "loss": 2.4644, "step": 327430 }, { "epoch": 0.57, "learning_rate": 2.144919903598322e-05, "loss": 2.3165, "step": 327440 }, { "epoch": 0.57, "learning_rate": 2.1448327096056392e-05, "loss": 2.3589, "step": 327450 }, { "epoch": 0.57, "learning_rate": 2.1447455156129566e-05, "loss": 2.3508, "step": 327460 }, { "epoch": 0.57, "learning_rate": 2.1446583216202736e-05, "loss": 2.2455, "step": 327470 }, { "epoch": 0.57, "learning_rate": 2.144571127627591e-05, "loss": 2.3703, "step": 327480 }, { "epoch": 0.57, "learning_rate": 2.1444839336349084e-05, "loss": 2.3294, "step": 327490 }, { "epoch": 0.57, "learning_rate": 2.1443967396422258e-05, "loss": 2.4329, "step": 327500 }, { "epoch": 0.57, "learning_rate": 2.1443095456495428e-05, "loss": 2.2805, "step": 327510 }, { "epoch": 0.57, "learning_rate": 2.1442223516568605e-05, "loss": 2.32, "step": 327520 }, { "epoch": 0.57, "learning_rate": 2.1441351576641776e-05, "loss": 2.4105, "step": 327530 }, { "epoch": 0.57, "learning_rate": 2.144047963671495e-05, "loss": 2.2387, "step": 327540 }, { "epoch": 0.57, "learning_rate": 2.1439607696788123e-05, "loss": 2.3219, "step": 327550 }, { "epoch": 0.57, "learning_rate": 2.1438735756861297e-05, "loss": 2.1798, "step": 327560 }, { "epoch": 0.57, "learning_rate": 2.143786381693447e-05, "loss": 2.2723, "step": 327570 }, { "epoch": 0.57, "learning_rate": 2.143699187700764e-05, "loss": 2.4521, "step": 327580 }, { "epoch": 0.57, "learning_rate": 2.1436119937080815e-05, "loss": 2.3545, "step": 327590 }, { "epoch": 0.57, "learning_rate": 2.143524799715399e-05, "loss": 2.3818, "step": 327600 }, { "epoch": 0.57, "learning_rate": 2.1434376057227162e-05, "loss": 2.2901, "step": 327610 }, { "epoch": 0.57, "learning_rate": 2.1433504117300336e-05, "loss": 2.305, "step": 327620 }, { "epoch": 0.57, "learning_rate": 2.143263217737351e-05, "loss": 2.4237, "step": 327630 }, { "epoch": 0.57, "learning_rate": 2.1431760237446684e-05, "loss": 2.5445, "step": 327640 }, { "epoch": 0.57, "learning_rate": 2.1430888297519854e-05, "loss": 2.35, "step": 327650 }, { "epoch": 0.57, "learning_rate": 2.1430016357593028e-05, "loss": 2.4051, "step": 327660 }, { "epoch": 0.57, "learning_rate": 2.14291444176662e-05, "loss": 2.3122, "step": 327670 }, { "epoch": 0.57, "learning_rate": 2.1428272477739375e-05, "loss": 2.35, "step": 327680 }, { "epoch": 0.57, "learning_rate": 2.142740053781255e-05, "loss": 2.4346, "step": 327690 }, { "epoch": 0.57, "learning_rate": 2.142652859788572e-05, "loss": 2.3262, "step": 327700 }, { "epoch": 0.57, "learning_rate": 2.1425656657958897e-05, "loss": 2.3752, "step": 327710 }, { "epoch": 0.57, "learning_rate": 2.1424784718032067e-05, "loss": 2.4151, "step": 327720 }, { "epoch": 0.57, "learning_rate": 2.142391277810524e-05, "loss": 2.2872, "step": 327730 }, { "epoch": 0.57, "learning_rate": 2.142304083817841e-05, "loss": 2.3854, "step": 327740 }, { "epoch": 0.57, "learning_rate": 2.142216889825159e-05, "loss": 2.3676, "step": 327750 }, { "epoch": 0.57, "learning_rate": 2.142129695832476e-05, "loss": 2.3139, "step": 327760 }, { "epoch": 0.57, "learning_rate": 2.1420425018397933e-05, "loss": 2.3384, "step": 327770 }, { "epoch": 0.57, "learning_rate": 2.1419553078471106e-05, "loss": 2.3929, "step": 327780 }, { "epoch": 0.57, "learning_rate": 2.141868113854428e-05, "loss": 2.3269, "step": 327790 }, { "epoch": 0.57, "learning_rate": 2.1417809198617454e-05, "loss": 2.4078, "step": 327800 }, { "epoch": 0.57, "learning_rate": 2.1416937258690624e-05, "loss": 2.3863, "step": 327810 }, { "epoch": 0.57, "learning_rate": 2.14160653187638e-05, "loss": 2.4324, "step": 327820 }, { "epoch": 0.57, "learning_rate": 2.1415193378836972e-05, "loss": 2.4023, "step": 327830 }, { "epoch": 0.57, "learning_rate": 2.1414321438910146e-05, "loss": 2.2086, "step": 327840 }, { "epoch": 0.57, "learning_rate": 2.141344949898332e-05, "loss": 2.3583, "step": 327850 }, { "epoch": 0.57, "learning_rate": 2.1412577559056493e-05, "loss": 2.3224, "step": 327860 }, { "epoch": 0.57, "learning_rate": 2.1411705619129667e-05, "loss": 2.3866, "step": 327870 }, { "epoch": 0.57, "learning_rate": 2.1410833679202837e-05, "loss": 2.3909, "step": 327880 }, { "epoch": 0.57, "learning_rate": 2.1409961739276014e-05, "loss": 2.3816, "step": 327890 }, { "epoch": 0.57, "learning_rate": 2.1409089799349185e-05, "loss": 2.2544, "step": 327900 }, { "epoch": 0.57, "learning_rate": 2.140821785942236e-05, "loss": 2.4825, "step": 327910 }, { "epoch": 0.57, "learning_rate": 2.140734591949553e-05, "loss": 2.3419, "step": 327920 }, { "epoch": 0.57, "learning_rate": 2.1406473979568706e-05, "loss": 2.3872, "step": 327930 }, { "epoch": 0.57, "learning_rate": 2.140560203964188e-05, "loss": 2.3063, "step": 327940 }, { "epoch": 0.57, "learning_rate": 2.140473009971505e-05, "loss": 2.3405, "step": 327950 }, { "epoch": 0.57, "learning_rate": 2.1403858159788224e-05, "loss": 2.3659, "step": 327960 }, { "epoch": 0.57, "learning_rate": 2.1402986219861398e-05, "loss": 2.3508, "step": 327970 }, { "epoch": 0.57, "learning_rate": 2.140211427993457e-05, "loss": 2.3269, "step": 327980 }, { "epoch": 0.57, "learning_rate": 2.1401242340007742e-05, "loss": 2.3684, "step": 327990 }, { "epoch": 0.57, "learning_rate": 2.1400370400080916e-05, "loss": 2.3539, "step": 328000 }, { "epoch": 0.57, "learning_rate": 2.139949846015409e-05, "loss": 2.2274, "step": 328010 }, { "epoch": 0.57, "learning_rate": 2.1398626520227263e-05, "loss": 2.2791, "step": 328020 }, { "epoch": 0.57, "learning_rate": 2.1397754580300437e-05, "loss": 2.3037, "step": 328030 }, { "epoch": 0.57, "learning_rate": 2.139688264037361e-05, "loss": 2.3632, "step": 328040 }, { "epoch": 0.57, "learning_rate": 2.1396010700446785e-05, "loss": 2.3904, "step": 328050 }, { "epoch": 0.57, "learning_rate": 2.1395138760519955e-05, "loss": 2.3803, "step": 328060 }, { "epoch": 0.57, "learning_rate": 2.139426682059313e-05, "loss": 2.3881, "step": 328070 }, { "epoch": 0.57, "learning_rate": 2.1393394880666302e-05, "loss": 2.254, "step": 328080 }, { "epoch": 0.57, "learning_rate": 2.1392522940739476e-05, "loss": 2.2945, "step": 328090 }, { "epoch": 0.57, "learning_rate": 2.139165100081265e-05, "loss": 2.3379, "step": 328100 }, { "epoch": 0.57, "learning_rate": 2.139077906088582e-05, "loss": 2.366, "step": 328110 }, { "epoch": 0.57, "learning_rate": 2.1389907120958998e-05, "loss": 2.3762, "step": 328120 }, { "epoch": 0.57, "learning_rate": 2.1389035181032168e-05, "loss": 2.2291, "step": 328130 }, { "epoch": 0.57, "learning_rate": 2.138816324110534e-05, "loss": 2.3523, "step": 328140 }, { "epoch": 0.57, "learning_rate": 2.1387291301178512e-05, "loss": 2.081, "step": 328150 }, { "epoch": 0.57, "learning_rate": 2.138641936125169e-05, "loss": 2.3711, "step": 328160 }, { "epoch": 0.57, "learning_rate": 2.1385547421324863e-05, "loss": 2.3999, "step": 328170 }, { "epoch": 0.57, "learning_rate": 2.1384675481398033e-05, "loss": 2.2494, "step": 328180 }, { "epoch": 0.57, "learning_rate": 2.138380354147121e-05, "loss": 2.4211, "step": 328190 }, { "epoch": 0.57, "learning_rate": 2.138293160154438e-05, "loss": 2.3655, "step": 328200 }, { "epoch": 0.57, "learning_rate": 2.1382059661617555e-05, "loss": 2.2782, "step": 328210 }, { "epoch": 0.57, "learning_rate": 2.1381187721690725e-05, "loss": 2.3465, "step": 328220 }, { "epoch": 0.57, "learning_rate": 2.1380315781763902e-05, "loss": 2.3429, "step": 328230 }, { "epoch": 0.57, "learning_rate": 2.1379443841837073e-05, "loss": 2.295, "step": 328240 }, { "epoch": 0.57, "learning_rate": 2.1378571901910246e-05, "loss": 2.3057, "step": 328250 }, { "epoch": 0.57, "learning_rate": 2.137769996198342e-05, "loss": 2.2015, "step": 328260 }, { "epoch": 0.57, "learning_rate": 2.1376828022056594e-05, "loss": 2.2464, "step": 328270 }, { "epoch": 0.57, "learning_rate": 2.1375956082129768e-05, "loss": 2.3169, "step": 328280 }, { "epoch": 0.57, "learning_rate": 2.1375084142202938e-05, "loss": 2.4221, "step": 328290 }, { "epoch": 0.57, "learning_rate": 2.1374212202276115e-05, "loss": 2.4354, "step": 328300 }, { "epoch": 0.57, "learning_rate": 2.1373340262349286e-05, "loss": 2.2398, "step": 328310 }, { "epoch": 0.57, "learning_rate": 2.137246832242246e-05, "loss": 2.4312, "step": 328320 }, { "epoch": 0.57, "learning_rate": 2.1371596382495633e-05, "loss": 2.2961, "step": 328330 }, { "epoch": 0.57, "learning_rate": 2.1370724442568807e-05, "loss": 2.2918, "step": 328340 }, { "epoch": 0.57, "learning_rate": 2.136985250264198e-05, "loss": 2.4436, "step": 328350 }, { "epoch": 0.57, "learning_rate": 2.136898056271515e-05, "loss": 2.4402, "step": 328360 }, { "epoch": 0.57, "learning_rate": 2.1368108622788325e-05, "loss": 2.3225, "step": 328370 }, { "epoch": 0.57, "learning_rate": 2.13672366828615e-05, "loss": 2.2788, "step": 328380 }, { "epoch": 0.57, "learning_rate": 2.1366364742934672e-05, "loss": 2.3212, "step": 328390 }, { "epoch": 0.57, "learning_rate": 2.1365492803007843e-05, "loss": 2.3857, "step": 328400 }, { "epoch": 0.57, "learning_rate": 2.1364620863081017e-05, "loss": 2.3924, "step": 328410 }, { "epoch": 0.57, "learning_rate": 2.1363748923154194e-05, "loss": 2.3875, "step": 328420 }, { "epoch": 0.57, "learning_rate": 2.1362876983227364e-05, "loss": 2.3231, "step": 328430 }, { "epoch": 0.57, "learning_rate": 2.1362005043300538e-05, "loss": 2.27, "step": 328440 }, { "epoch": 0.57, "learning_rate": 2.136113310337371e-05, "loss": 2.3472, "step": 328450 }, { "epoch": 0.57, "learning_rate": 2.1360261163446885e-05, "loss": 2.3403, "step": 328460 }, { "epoch": 0.57, "learning_rate": 2.1359389223520056e-05, "loss": 2.4451, "step": 328470 }, { "epoch": 0.57, "learning_rate": 2.135851728359323e-05, "loss": 2.232, "step": 328480 }, { "epoch": 0.57, "learning_rate": 2.1357645343666403e-05, "loss": 2.2502, "step": 328490 }, { "epoch": 0.57, "learning_rate": 2.1356773403739577e-05, "loss": 2.3266, "step": 328500 }, { "epoch": 0.57, "learning_rate": 2.135590146381275e-05, "loss": 2.3468, "step": 328510 }, { "epoch": 0.57, "learning_rate": 2.135502952388592e-05, "loss": 2.1999, "step": 328520 }, { "epoch": 0.57, "learning_rate": 2.13541575839591e-05, "loss": 2.3668, "step": 328530 }, { "epoch": 0.57, "learning_rate": 2.135328564403227e-05, "loss": 2.1818, "step": 328540 }, { "epoch": 0.57, "learning_rate": 2.1352413704105443e-05, "loss": 2.3175, "step": 328550 }, { "epoch": 0.57, "learning_rate": 2.1351541764178616e-05, "loss": 2.2502, "step": 328560 }, { "epoch": 0.57, "learning_rate": 2.135066982425179e-05, "loss": 2.3764, "step": 328570 }, { "epoch": 0.57, "learning_rate": 2.1349797884324964e-05, "loss": 2.2589, "step": 328580 }, { "epoch": 0.57, "learning_rate": 2.1348925944398134e-05, "loss": 2.3606, "step": 328590 }, { "epoch": 0.57, "learning_rate": 2.134805400447131e-05, "loss": 2.2838, "step": 328600 }, { "epoch": 0.57, "learning_rate": 2.1347182064544482e-05, "loss": 2.3272, "step": 328610 }, { "epoch": 0.57, "learning_rate": 2.1346310124617656e-05, "loss": 2.2869, "step": 328620 }, { "epoch": 0.57, "learning_rate": 2.1345438184690826e-05, "loss": 2.2257, "step": 328630 }, { "epoch": 0.57, "learning_rate": 2.1344566244764003e-05, "loss": 2.4818, "step": 328640 }, { "epoch": 0.57, "learning_rate": 2.1343694304837173e-05, "loss": 2.4055, "step": 328650 }, { "epoch": 0.57, "learning_rate": 2.1342822364910347e-05, "loss": 2.4423, "step": 328660 }, { "epoch": 0.57, "learning_rate": 2.134195042498352e-05, "loss": 2.3457, "step": 328670 }, { "epoch": 0.57, "learning_rate": 2.1341078485056695e-05, "loss": 2.3978, "step": 328680 }, { "epoch": 0.57, "learning_rate": 2.134020654512987e-05, "loss": 2.3706, "step": 328690 }, { "epoch": 0.57, "learning_rate": 2.133933460520304e-05, "loss": 2.4158, "step": 328700 }, { "epoch": 0.57, "learning_rate": 2.1338462665276216e-05, "loss": 2.3133, "step": 328710 }, { "epoch": 0.57, "learning_rate": 2.1337590725349386e-05, "loss": 2.1928, "step": 328720 }, { "epoch": 0.57, "learning_rate": 2.133671878542256e-05, "loss": 2.3976, "step": 328730 }, { "epoch": 0.57, "learning_rate": 2.1335846845495734e-05, "loss": 2.345, "step": 328740 }, { "epoch": 0.57, "learning_rate": 2.1334974905568908e-05, "loss": 2.315, "step": 328750 }, { "epoch": 0.57, "learning_rate": 2.133410296564208e-05, "loss": 2.3643, "step": 328760 }, { "epoch": 0.57, "learning_rate": 2.1333231025715252e-05, "loss": 2.3634, "step": 328770 }, { "epoch": 0.57, "learning_rate": 2.1332359085788426e-05, "loss": 2.3367, "step": 328780 }, { "epoch": 0.57, "learning_rate": 2.13314871458616e-05, "loss": 2.3519, "step": 328790 }, { "epoch": 0.57, "learning_rate": 2.1330615205934773e-05, "loss": 2.3727, "step": 328800 }, { "epoch": 0.57, "learning_rate": 2.1329743266007947e-05, "loss": 2.3349, "step": 328810 }, { "epoch": 0.57, "learning_rate": 2.132887132608112e-05, "loss": 2.3909, "step": 328820 }, { "epoch": 0.57, "learning_rate": 2.1327999386154295e-05, "loss": 2.3312, "step": 328830 }, { "epoch": 0.57, "learning_rate": 2.1327127446227465e-05, "loss": 2.4762, "step": 328840 }, { "epoch": 0.57, "learning_rate": 2.132625550630064e-05, "loss": 2.3606, "step": 328850 }, { "epoch": 0.57, "learning_rate": 2.1325383566373812e-05, "loss": 2.4225, "step": 328860 }, { "epoch": 0.57, "learning_rate": 2.1324511626446986e-05, "loss": 2.4058, "step": 328870 }, { "epoch": 0.57, "learning_rate": 2.1323639686520157e-05, "loss": 2.3966, "step": 328880 }, { "epoch": 0.57, "learning_rate": 2.132276774659333e-05, "loss": 2.4173, "step": 328890 }, { "epoch": 0.57, "learning_rate": 2.1321895806666508e-05, "loss": 2.349, "step": 328900 }, { "epoch": 0.57, "learning_rate": 2.1321023866739678e-05, "loss": 2.4596, "step": 328910 }, { "epoch": 0.57, "learning_rate": 2.132015192681285e-05, "loss": 2.3013, "step": 328920 }, { "epoch": 0.57, "learning_rate": 2.1319279986886022e-05, "loss": 2.3932, "step": 328930 }, { "epoch": 0.57, "learning_rate": 2.13184080469592e-05, "loss": 2.2759, "step": 328940 }, { "epoch": 0.57, "learning_rate": 2.131753610703237e-05, "loss": 2.3308, "step": 328950 }, { "epoch": 0.57, "learning_rate": 2.1316664167105543e-05, "loss": 2.4877, "step": 328960 }, { "epoch": 0.57, "learning_rate": 2.1315792227178717e-05, "loss": 2.3771, "step": 328970 }, { "epoch": 0.57, "learning_rate": 2.131492028725189e-05, "loss": 2.2641, "step": 328980 }, { "epoch": 0.57, "learning_rate": 2.1314048347325065e-05, "loss": 2.3867, "step": 328990 }, { "epoch": 0.57, "learning_rate": 2.1313176407398235e-05, "loss": 2.3376, "step": 329000 }, { "epoch": 0.57, "learning_rate": 2.1312304467471412e-05, "loss": 2.4304, "step": 329010 }, { "epoch": 0.57, "learning_rate": 2.1311432527544583e-05, "loss": 2.378, "step": 329020 }, { "epoch": 0.57, "learning_rate": 2.1310560587617756e-05, "loss": 2.325, "step": 329030 }, { "epoch": 0.57, "learning_rate": 2.130968864769093e-05, "loss": 2.3993, "step": 329040 }, { "epoch": 0.57, "learning_rate": 2.1308816707764104e-05, "loss": 2.3161, "step": 329050 }, { "epoch": 0.57, "learning_rate": 2.1307944767837278e-05, "loss": 2.3042, "step": 329060 }, { "epoch": 0.57, "learning_rate": 2.1307072827910448e-05, "loss": 2.3846, "step": 329070 }, { "epoch": 0.57, "learning_rate": 2.1306200887983622e-05, "loss": 2.3439, "step": 329080 }, { "epoch": 0.57, "learning_rate": 2.1305328948056796e-05, "loss": 2.3712, "step": 329090 }, { "epoch": 0.57, "learning_rate": 2.130445700812997e-05, "loss": 2.1971, "step": 329100 }, { "epoch": 0.57, "learning_rate": 2.130358506820314e-05, "loss": 2.4055, "step": 329110 }, { "epoch": 0.57, "learning_rate": 2.1302713128276317e-05, "loss": 2.3831, "step": 329120 }, { "epoch": 0.57, "learning_rate": 2.1301841188349487e-05, "loss": 2.3508, "step": 329130 }, { "epoch": 0.57, "learning_rate": 2.130096924842266e-05, "loss": 2.3286, "step": 329140 }, { "epoch": 0.57, "learning_rate": 2.1300097308495835e-05, "loss": 2.4273, "step": 329150 }, { "epoch": 0.57, "learning_rate": 2.129922536856901e-05, "loss": 2.3222, "step": 329160 }, { "epoch": 0.57, "learning_rate": 2.1298353428642182e-05, "loss": 2.3167, "step": 329170 }, { "epoch": 0.57, "learning_rate": 2.1297481488715353e-05, "loss": 2.3656, "step": 329180 }, { "epoch": 0.57, "learning_rate": 2.1296609548788527e-05, "loss": 2.38, "step": 329190 }, { "epoch": 0.57, "learning_rate": 2.12957376088617e-05, "loss": 2.3599, "step": 329200 }, { "epoch": 0.57, "learning_rate": 2.1294865668934874e-05, "loss": 2.4016, "step": 329210 }, { "epoch": 0.57, "learning_rate": 2.1293993729008048e-05, "loss": 2.2686, "step": 329220 }, { "epoch": 0.57, "learning_rate": 2.129312178908122e-05, "loss": 2.4104, "step": 329230 }, { "epoch": 0.57, "learning_rate": 2.1292249849154395e-05, "loss": 2.3262, "step": 329240 }, { "epoch": 0.57, "learning_rate": 2.1291377909227566e-05, "loss": 2.3009, "step": 329250 }, { "epoch": 0.57, "learning_rate": 2.129050596930074e-05, "loss": 2.2622, "step": 329260 }, { "epoch": 0.57, "learning_rate": 2.1289634029373913e-05, "loss": 2.3216, "step": 329270 }, { "epoch": 0.57, "learning_rate": 2.1288762089447087e-05, "loss": 2.3128, "step": 329280 }, { "epoch": 0.57, "learning_rate": 2.128789014952026e-05, "loss": 2.3718, "step": 329290 }, { "epoch": 0.57, "learning_rate": 2.128701820959343e-05, "loss": 2.3608, "step": 329300 }, { "epoch": 0.57, "learning_rate": 2.128614626966661e-05, "loss": 2.2428, "step": 329310 }, { "epoch": 0.57, "learning_rate": 2.128527432973978e-05, "loss": 2.3497, "step": 329320 }, { "epoch": 0.57, "learning_rate": 2.1284402389812953e-05, "loss": 2.298, "step": 329330 }, { "epoch": 0.57, "learning_rate": 2.1283530449886123e-05, "loss": 2.4022, "step": 329340 }, { "epoch": 0.57, "learning_rate": 2.12826585099593e-05, "loss": 2.2927, "step": 329350 }, { "epoch": 0.57, "learning_rate": 2.128178657003247e-05, "loss": 2.2517, "step": 329360 }, { "epoch": 0.57, "learning_rate": 2.1280914630105644e-05, "loss": 2.356, "step": 329370 }, { "epoch": 0.57, "learning_rate": 2.1280042690178818e-05, "loss": 2.3369, "step": 329380 }, { "epoch": 0.57, "learning_rate": 2.1279170750251992e-05, "loss": 2.2344, "step": 329390 }, { "epoch": 0.57, "learning_rate": 2.1278298810325166e-05, "loss": 2.2487, "step": 329400 }, { "epoch": 0.57, "learning_rate": 2.1277426870398336e-05, "loss": 2.3097, "step": 329410 }, { "epoch": 0.57, "learning_rate": 2.1276554930471513e-05, "loss": 2.3492, "step": 329420 }, { "epoch": 0.57, "learning_rate": 2.1275682990544683e-05, "loss": 2.3838, "step": 329430 }, { "epoch": 0.57, "learning_rate": 2.1274811050617857e-05, "loss": 2.3083, "step": 329440 }, { "epoch": 0.57, "learning_rate": 2.127393911069103e-05, "loss": 2.2925, "step": 329450 }, { "epoch": 0.57, "learning_rate": 2.1273067170764205e-05, "loss": 2.3671, "step": 329460 }, { "epoch": 0.57, "learning_rate": 2.127219523083738e-05, "loss": 2.3193, "step": 329470 }, { "epoch": 0.57, "learning_rate": 2.127132329091055e-05, "loss": 2.3383, "step": 329480 }, { "epoch": 0.57, "learning_rate": 2.1270451350983726e-05, "loss": 2.2417, "step": 329490 }, { "epoch": 0.57, "learning_rate": 2.1269579411056896e-05, "loss": 2.255, "step": 329500 }, { "epoch": 0.57, "learning_rate": 2.126870747113007e-05, "loss": 2.2875, "step": 329510 }, { "epoch": 0.57, "learning_rate": 2.1267835531203244e-05, "loss": 2.4277, "step": 329520 }, { "epoch": 0.57, "learning_rate": 2.1266963591276418e-05, "loss": 2.4092, "step": 329530 }, { "epoch": 0.57, "learning_rate": 2.126609165134959e-05, "loss": 2.2331, "step": 329540 }, { "epoch": 0.57, "learning_rate": 2.1265219711422762e-05, "loss": 2.3071, "step": 329550 }, { "epoch": 0.57, "learning_rate": 2.1264347771495936e-05, "loss": 2.3641, "step": 329560 }, { "epoch": 0.57, "learning_rate": 2.126347583156911e-05, "loss": 2.3398, "step": 329570 }, { "epoch": 0.57, "learning_rate": 2.1262603891642283e-05, "loss": 2.297, "step": 329580 }, { "epoch": 0.57, "learning_rate": 2.1261731951715454e-05, "loss": 2.4432, "step": 329590 }, { "epoch": 0.57, "learning_rate": 2.1260860011788627e-05, "loss": 2.3338, "step": 329600 }, { "epoch": 0.57, "learning_rate": 2.12599880718618e-05, "loss": 2.4203, "step": 329610 }, { "epoch": 0.57, "learning_rate": 2.1259116131934975e-05, "loss": 2.3264, "step": 329620 }, { "epoch": 0.57, "learning_rate": 2.125824419200815e-05, "loss": 2.3684, "step": 329630 }, { "epoch": 0.57, "learning_rate": 2.1257372252081322e-05, "loss": 2.3326, "step": 329640 }, { "epoch": 0.57, "learning_rate": 2.1256500312154496e-05, "loss": 2.3373, "step": 329650 }, { "epoch": 0.57, "learning_rate": 2.1255628372227667e-05, "loss": 2.441, "step": 329660 }, { "epoch": 0.57, "learning_rate": 2.125475643230084e-05, "loss": 2.2139, "step": 329670 }, { "epoch": 0.57, "learning_rate": 2.1253884492374014e-05, "loss": 2.2938, "step": 329680 }, { "epoch": 0.57, "learning_rate": 2.1253012552447188e-05, "loss": 2.2921, "step": 329690 }, { "epoch": 0.57, "learning_rate": 2.1252140612520362e-05, "loss": 2.4018, "step": 329700 }, { "epoch": 0.57, "learning_rate": 2.1251268672593532e-05, "loss": 2.2944, "step": 329710 }, { "epoch": 0.57, "learning_rate": 2.125039673266671e-05, "loss": 2.3032, "step": 329720 }, { "epoch": 0.58, "learning_rate": 2.124952479273988e-05, "loss": 2.2442, "step": 329730 }, { "epoch": 0.58, "learning_rate": 2.1248652852813053e-05, "loss": 2.3446, "step": 329740 }, { "epoch": 0.58, "learning_rate": 2.1247780912886227e-05, "loss": 2.2293, "step": 329750 }, { "epoch": 0.58, "learning_rate": 2.12469089729594e-05, "loss": 2.3335, "step": 329760 }, { "epoch": 0.58, "learning_rate": 2.1246037033032575e-05, "loss": 2.273, "step": 329770 }, { "epoch": 0.58, "learning_rate": 2.1245165093105745e-05, "loss": 2.3094, "step": 329780 }, { "epoch": 0.58, "learning_rate": 2.1244293153178922e-05, "loss": 2.3919, "step": 329790 }, { "epoch": 0.58, "learning_rate": 2.1243421213252093e-05, "loss": 2.3365, "step": 329800 }, { "epoch": 0.58, "learning_rate": 2.1242549273325266e-05, "loss": 2.3275, "step": 329810 }, { "epoch": 0.58, "learning_rate": 2.1241677333398437e-05, "loss": 2.3214, "step": 329820 }, { "epoch": 0.58, "learning_rate": 2.1240805393471614e-05, "loss": 2.3668, "step": 329830 }, { "epoch": 0.58, "learning_rate": 2.1239933453544784e-05, "loss": 2.3831, "step": 329840 }, { "epoch": 0.58, "learning_rate": 2.1239061513617958e-05, "loss": 2.2958, "step": 329850 }, { "epoch": 0.58, "learning_rate": 2.1238189573691132e-05, "loss": 2.2502, "step": 329860 }, { "epoch": 0.58, "learning_rate": 2.1237317633764306e-05, "loss": 2.2139, "step": 329870 }, { "epoch": 0.58, "learning_rate": 2.123644569383748e-05, "loss": 2.2611, "step": 329880 }, { "epoch": 0.58, "learning_rate": 2.123557375391065e-05, "loss": 2.4451, "step": 329890 }, { "epoch": 0.58, "learning_rate": 2.1234701813983827e-05, "loss": 2.3835, "step": 329900 }, { "epoch": 0.58, "learning_rate": 2.1233829874056997e-05, "loss": 2.3874, "step": 329910 }, { "epoch": 0.58, "learning_rate": 2.123295793413017e-05, "loss": 2.3782, "step": 329920 }, { "epoch": 0.58, "learning_rate": 2.1232085994203345e-05, "loss": 2.2801, "step": 329930 }, { "epoch": 0.58, "learning_rate": 2.123121405427652e-05, "loss": 2.2719, "step": 329940 }, { "epoch": 0.58, "learning_rate": 2.1230342114349692e-05, "loss": 2.2854, "step": 329950 }, { "epoch": 0.58, "learning_rate": 2.1229470174422863e-05, "loss": 2.3691, "step": 329960 }, { "epoch": 0.58, "learning_rate": 2.1228598234496037e-05, "loss": 2.2255, "step": 329970 }, { "epoch": 0.58, "learning_rate": 2.122772629456921e-05, "loss": 2.3106, "step": 329980 }, { "epoch": 0.58, "learning_rate": 2.1226854354642384e-05, "loss": 2.2297, "step": 329990 }, { "epoch": 0.58, "learning_rate": 2.1225982414715554e-05, "loss": 2.3703, "step": 330000 }, { "epoch": 0.58, "learning_rate": 2.1225110474788728e-05, "loss": 2.338, "step": 330010 }, { "epoch": 0.58, "learning_rate": 2.1224238534861905e-05, "loss": 2.3234, "step": 330020 }, { "epoch": 0.58, "learning_rate": 2.1223366594935076e-05, "loss": 2.4078, "step": 330030 }, { "epoch": 0.58, "learning_rate": 2.122249465500825e-05, "loss": 2.3127, "step": 330040 }, { "epoch": 0.58, "learning_rate": 2.1221622715081423e-05, "loss": 2.2959, "step": 330050 }, { "epoch": 0.58, "learning_rate": 2.1220750775154597e-05, "loss": 2.3038, "step": 330060 }, { "epoch": 0.58, "learning_rate": 2.1219878835227767e-05, "loss": 2.2859, "step": 330070 }, { "epoch": 0.58, "learning_rate": 2.121900689530094e-05, "loss": 2.4298, "step": 330080 }, { "epoch": 0.58, "learning_rate": 2.1218134955374115e-05, "loss": 2.3114, "step": 330090 }, { "epoch": 0.58, "learning_rate": 2.121726301544729e-05, "loss": 2.4369, "step": 330100 }, { "epoch": 0.58, "learning_rate": 2.1216391075520463e-05, "loss": 2.3844, "step": 330110 }, { "epoch": 0.58, "learning_rate": 2.1215519135593633e-05, "loss": 2.2079, "step": 330120 }, { "epoch": 0.58, "learning_rate": 2.121464719566681e-05, "loss": 2.3452, "step": 330130 }, { "epoch": 0.58, "learning_rate": 2.121377525573998e-05, "loss": 2.3779, "step": 330140 }, { "epoch": 0.58, "learning_rate": 2.1212903315813154e-05, "loss": 2.3438, "step": 330150 }, { "epoch": 0.58, "learning_rate": 2.1212031375886328e-05, "loss": 2.345, "step": 330160 }, { "epoch": 0.58, "learning_rate": 2.1211159435959502e-05, "loss": 2.4659, "step": 330170 }, { "epoch": 0.58, "learning_rate": 2.1210287496032676e-05, "loss": 2.3256, "step": 330180 }, { "epoch": 0.58, "learning_rate": 2.1209415556105846e-05, "loss": 2.3762, "step": 330190 }, { "epoch": 0.58, "learning_rate": 2.1208543616179023e-05, "loss": 2.2225, "step": 330200 }, { "epoch": 0.58, "learning_rate": 2.1207671676252193e-05, "loss": 2.4192, "step": 330210 }, { "epoch": 0.58, "learning_rate": 2.1206799736325367e-05, "loss": 2.2714, "step": 330220 }, { "epoch": 0.58, "learning_rate": 2.1205927796398538e-05, "loss": 2.1806, "step": 330230 }, { "epoch": 0.58, "learning_rate": 2.1205055856471715e-05, "loss": 2.4105, "step": 330240 }, { "epoch": 0.58, "learning_rate": 2.120418391654489e-05, "loss": 2.4349, "step": 330250 }, { "epoch": 0.58, "learning_rate": 2.120331197661806e-05, "loss": 2.2821, "step": 330260 }, { "epoch": 0.58, "learning_rate": 2.1202440036691233e-05, "loss": 2.3755, "step": 330270 }, { "epoch": 0.58, "learning_rate": 2.1201568096764406e-05, "loss": 2.268, "step": 330280 }, { "epoch": 0.58, "learning_rate": 2.120069615683758e-05, "loss": 2.4506, "step": 330290 }, { "epoch": 0.58, "learning_rate": 2.119982421691075e-05, "loss": 2.3692, "step": 330300 }, { "epoch": 0.58, "learning_rate": 2.1198952276983928e-05, "loss": 2.3737, "step": 330310 }, { "epoch": 0.58, "learning_rate": 2.1198080337057098e-05, "loss": 2.3647, "step": 330320 }, { "epoch": 0.58, "learning_rate": 2.1197208397130272e-05, "loss": 2.3994, "step": 330330 }, { "epoch": 0.58, "learning_rate": 2.1196336457203446e-05, "loss": 2.4788, "step": 330340 }, { "epoch": 0.58, "learning_rate": 2.119546451727662e-05, "loss": 2.3283, "step": 330350 }, { "epoch": 0.58, "learning_rate": 2.1194592577349793e-05, "loss": 2.4376, "step": 330360 }, { "epoch": 0.58, "learning_rate": 2.1193720637422964e-05, "loss": 2.2191, "step": 330370 }, { "epoch": 0.58, "learning_rate": 2.1192848697496137e-05, "loss": 2.4535, "step": 330380 }, { "epoch": 0.58, "learning_rate": 2.119197675756931e-05, "loss": 2.4245, "step": 330390 }, { "epoch": 0.58, "learning_rate": 2.1191104817642485e-05, "loss": 2.1765, "step": 330400 }, { "epoch": 0.58, "learning_rate": 2.119023287771566e-05, "loss": 2.3386, "step": 330410 }, { "epoch": 0.58, "learning_rate": 2.1189360937788832e-05, "loss": 2.3799, "step": 330420 }, { "epoch": 0.58, "learning_rate": 2.1188488997862006e-05, "loss": 2.3849, "step": 330430 }, { "epoch": 0.58, "learning_rate": 2.1187617057935177e-05, "loss": 2.3692, "step": 330440 }, { "epoch": 0.58, "learning_rate": 2.118674511800835e-05, "loss": 2.3738, "step": 330450 }, { "epoch": 0.58, "learning_rate": 2.1185873178081524e-05, "loss": 2.3412, "step": 330460 }, { "epoch": 0.58, "learning_rate": 2.1185001238154698e-05, "loss": 2.3559, "step": 330470 }, { "epoch": 0.58, "learning_rate": 2.118412929822787e-05, "loss": 2.3487, "step": 330480 }, { "epoch": 0.58, "learning_rate": 2.1183257358301042e-05, "loss": 2.4105, "step": 330490 }, { "epoch": 0.58, "learning_rate": 2.118238541837422e-05, "loss": 2.2681, "step": 330500 }, { "epoch": 0.58, "learning_rate": 2.118151347844739e-05, "loss": 2.4421, "step": 330510 }, { "epoch": 0.58, "learning_rate": 2.1180641538520563e-05, "loss": 2.2799, "step": 330520 }, { "epoch": 0.58, "learning_rate": 2.1179769598593734e-05, "loss": 2.3308, "step": 330530 }, { "epoch": 0.58, "learning_rate": 2.117889765866691e-05, "loss": 2.2923, "step": 330540 }, { "epoch": 0.58, "learning_rate": 2.117802571874008e-05, "loss": 2.3017, "step": 330550 }, { "epoch": 0.58, "learning_rate": 2.1177153778813255e-05, "loss": 2.3151, "step": 330560 }, { "epoch": 0.58, "learning_rate": 2.117628183888643e-05, "loss": 2.2553, "step": 330570 }, { "epoch": 0.58, "learning_rate": 2.1175409898959603e-05, "loss": 2.33, "step": 330580 }, { "epoch": 0.58, "learning_rate": 2.1174537959032776e-05, "loss": 2.3635, "step": 330590 }, { "epoch": 0.58, "learning_rate": 2.1173666019105947e-05, "loss": 2.3473, "step": 330600 }, { "epoch": 0.58, "learning_rate": 2.1172794079179124e-05, "loss": 2.2836, "step": 330610 }, { "epoch": 0.58, "learning_rate": 2.1171922139252294e-05, "loss": 2.3135, "step": 330620 }, { "epoch": 0.58, "learning_rate": 2.1171050199325468e-05, "loss": 2.3021, "step": 330630 }, { "epoch": 0.58, "learning_rate": 2.1170178259398642e-05, "loss": 2.2311, "step": 330640 }, { "epoch": 0.58, "learning_rate": 2.1169306319471816e-05, "loss": 2.2157, "step": 330650 }, { "epoch": 0.58, "learning_rate": 2.116843437954499e-05, "loss": 2.3393, "step": 330660 }, { "epoch": 0.58, "learning_rate": 2.116756243961816e-05, "loss": 2.3514, "step": 330670 }, { "epoch": 0.58, "learning_rate": 2.1166690499691337e-05, "loss": 2.301, "step": 330680 }, { "epoch": 0.58, "learning_rate": 2.1165818559764507e-05, "loss": 2.3681, "step": 330690 }, { "epoch": 0.58, "learning_rate": 2.116494661983768e-05, "loss": 2.3856, "step": 330700 }, { "epoch": 0.58, "learning_rate": 2.116407467991085e-05, "loss": 2.3727, "step": 330710 }, { "epoch": 0.58, "learning_rate": 2.116320273998403e-05, "loss": 2.3496, "step": 330720 }, { "epoch": 0.58, "learning_rate": 2.11623308000572e-05, "loss": 2.2649, "step": 330730 }, { "epoch": 0.58, "learning_rate": 2.1161458860130373e-05, "loss": 2.2897, "step": 330740 }, { "epoch": 0.58, "learning_rate": 2.1160586920203547e-05, "loss": 2.2983, "step": 330750 }, { "epoch": 0.58, "learning_rate": 2.115971498027672e-05, "loss": 2.2989, "step": 330760 }, { "epoch": 0.58, "learning_rate": 2.1158843040349894e-05, "loss": 2.3604, "step": 330770 }, { "epoch": 0.58, "learning_rate": 2.1157971100423064e-05, "loss": 2.3172, "step": 330780 }, { "epoch": 0.58, "learning_rate": 2.1157099160496238e-05, "loss": 2.2811, "step": 330790 }, { "epoch": 0.58, "learning_rate": 2.1156227220569412e-05, "loss": 2.3564, "step": 330800 }, { "epoch": 0.58, "learning_rate": 2.1155355280642586e-05, "loss": 2.254, "step": 330810 }, { "epoch": 0.58, "learning_rate": 2.115448334071576e-05, "loss": 2.3179, "step": 330820 }, { "epoch": 0.58, "learning_rate": 2.1153611400788933e-05, "loss": 2.2982, "step": 330830 }, { "epoch": 0.58, "learning_rate": 2.1152739460862107e-05, "loss": 2.3741, "step": 330840 }, { "epoch": 0.58, "learning_rate": 2.1151867520935277e-05, "loss": 2.3414, "step": 330850 }, { "epoch": 0.58, "learning_rate": 2.115099558100845e-05, "loss": 2.3453, "step": 330860 }, { "epoch": 0.58, "learning_rate": 2.1150123641081625e-05, "loss": 2.2692, "step": 330870 }, { "epoch": 0.58, "learning_rate": 2.11492517011548e-05, "loss": 2.2181, "step": 330880 }, { "epoch": 0.58, "learning_rate": 2.1148379761227973e-05, "loss": 2.2586, "step": 330890 }, { "epoch": 0.58, "learning_rate": 2.1147507821301143e-05, "loss": 2.2053, "step": 330900 }, { "epoch": 0.58, "learning_rate": 2.114663588137432e-05, "loss": 2.3327, "step": 330910 }, { "epoch": 0.58, "learning_rate": 2.114576394144749e-05, "loss": 2.3602, "step": 330920 }, { "epoch": 0.58, "learning_rate": 2.1144892001520664e-05, "loss": 2.382, "step": 330930 }, { "epoch": 0.58, "learning_rate": 2.1144020061593835e-05, "loss": 2.3213, "step": 330940 }, { "epoch": 0.58, "learning_rate": 2.1143148121667012e-05, "loss": 2.2978, "step": 330950 }, { "epoch": 0.58, "learning_rate": 2.1142276181740182e-05, "loss": 2.3414, "step": 330960 }, { "epoch": 0.58, "learning_rate": 2.1141404241813356e-05, "loss": 2.2844, "step": 330970 }, { "epoch": 0.58, "learning_rate": 2.1140532301886533e-05, "loss": 2.455, "step": 330980 }, { "epoch": 0.58, "learning_rate": 2.1139660361959703e-05, "loss": 2.3152, "step": 330990 }, { "epoch": 0.58, "learning_rate": 2.1138788422032877e-05, "loss": 2.3032, "step": 331000 }, { "epoch": 0.58, "learning_rate": 2.1137916482106048e-05, "loss": 2.3552, "step": 331010 }, { "epoch": 0.58, "learning_rate": 2.1137044542179225e-05, "loss": 2.4063, "step": 331020 }, { "epoch": 0.58, "learning_rate": 2.1136172602252395e-05, "loss": 2.3659, "step": 331030 }, { "epoch": 0.58, "learning_rate": 2.113530066232557e-05, "loss": 2.227, "step": 331040 }, { "epoch": 0.58, "learning_rate": 2.1134428722398743e-05, "loss": 2.302, "step": 331050 }, { "epoch": 0.58, "learning_rate": 2.1133556782471916e-05, "loss": 2.3517, "step": 331060 }, { "epoch": 0.58, "learning_rate": 2.113268484254509e-05, "loss": 2.3203, "step": 331070 }, { "epoch": 0.58, "learning_rate": 2.113181290261826e-05, "loss": 2.3711, "step": 331080 }, { "epoch": 0.58, "learning_rate": 2.1130940962691438e-05, "loss": 2.2157, "step": 331090 }, { "epoch": 0.58, "learning_rate": 2.1130069022764608e-05, "loss": 2.2404, "step": 331100 }, { "epoch": 0.58, "learning_rate": 2.1129197082837782e-05, "loss": 2.3604, "step": 331110 }, { "epoch": 0.58, "learning_rate": 2.1128325142910956e-05, "loss": 2.3019, "step": 331120 }, { "epoch": 0.58, "learning_rate": 2.112745320298413e-05, "loss": 2.3707, "step": 331130 }, { "epoch": 0.58, "learning_rate": 2.1126581263057303e-05, "loss": 2.3981, "step": 331140 }, { "epoch": 0.58, "learning_rate": 2.1125709323130474e-05, "loss": 2.3076, "step": 331150 }, { "epoch": 0.58, "learning_rate": 2.1124837383203647e-05, "loss": 2.3339, "step": 331160 }, { "epoch": 0.58, "learning_rate": 2.112396544327682e-05, "loss": 2.3551, "step": 331170 }, { "epoch": 0.58, "learning_rate": 2.1123093503349995e-05, "loss": 2.3067, "step": 331180 }, { "epoch": 0.58, "learning_rate": 2.1122221563423165e-05, "loss": 2.3079, "step": 331190 }, { "epoch": 0.58, "learning_rate": 2.112134962349634e-05, "loss": 2.3334, "step": 331200 }, { "epoch": 0.58, "learning_rate": 2.1120477683569513e-05, "loss": 2.4573, "step": 331210 }, { "epoch": 0.58, "learning_rate": 2.1119605743642687e-05, "loss": 2.29, "step": 331220 }, { "epoch": 0.58, "learning_rate": 2.111873380371586e-05, "loss": 2.2826, "step": 331230 }, { "epoch": 0.58, "learning_rate": 2.1117861863789034e-05, "loss": 2.3899, "step": 331240 }, { "epoch": 0.58, "learning_rate": 2.1116989923862208e-05, "loss": 2.3194, "step": 331250 }, { "epoch": 0.58, "learning_rate": 2.111611798393538e-05, "loss": 2.3761, "step": 331260 }, { "epoch": 0.58, "learning_rate": 2.1115246044008552e-05, "loss": 2.3072, "step": 331270 }, { "epoch": 0.58, "learning_rate": 2.1114374104081726e-05, "loss": 2.404, "step": 331280 }, { "epoch": 0.58, "learning_rate": 2.11135021641549e-05, "loss": 2.3082, "step": 331290 }, { "epoch": 0.58, "learning_rate": 2.1112630224228073e-05, "loss": 2.4075, "step": 331300 }, { "epoch": 0.58, "learning_rate": 2.1111758284301244e-05, "loss": 2.284, "step": 331310 }, { "epoch": 0.58, "learning_rate": 2.111088634437442e-05, "loss": 2.4308, "step": 331320 }, { "epoch": 0.58, "learning_rate": 2.111001440444759e-05, "loss": 2.3421, "step": 331330 }, { "epoch": 0.58, "learning_rate": 2.1109142464520765e-05, "loss": 2.2159, "step": 331340 }, { "epoch": 0.58, "learning_rate": 2.110827052459394e-05, "loss": 2.2826, "step": 331350 }, { "epoch": 0.58, "learning_rate": 2.1107398584667113e-05, "loss": 2.4458, "step": 331360 }, { "epoch": 0.58, "learning_rate": 2.1106526644740286e-05, "loss": 2.261, "step": 331370 }, { "epoch": 0.58, "learning_rate": 2.1105654704813457e-05, "loss": 2.2384, "step": 331380 }, { "epoch": 0.58, "learning_rate": 2.1104782764886634e-05, "loss": 2.4135, "step": 331390 }, { "epoch": 0.58, "learning_rate": 2.1103910824959804e-05, "loss": 2.3057, "step": 331400 }, { "epoch": 0.58, "learning_rate": 2.1103038885032978e-05, "loss": 2.2864, "step": 331410 }, { "epoch": 0.58, "learning_rate": 2.110216694510615e-05, "loss": 2.2138, "step": 331420 }, { "epoch": 0.58, "learning_rate": 2.1101295005179326e-05, "loss": 2.4212, "step": 331430 }, { "epoch": 0.58, "learning_rate": 2.1100423065252496e-05, "loss": 2.3146, "step": 331440 }, { "epoch": 0.58, "learning_rate": 2.109955112532567e-05, "loss": 2.3094, "step": 331450 }, { "epoch": 0.58, "learning_rate": 2.1098679185398844e-05, "loss": 2.3242, "step": 331460 }, { "epoch": 0.58, "learning_rate": 2.1097807245472017e-05, "loss": 2.4165, "step": 331470 }, { "epoch": 0.58, "learning_rate": 2.109693530554519e-05, "loss": 2.2859, "step": 331480 }, { "epoch": 0.58, "learning_rate": 2.109606336561836e-05, "loss": 2.2615, "step": 331490 }, { "epoch": 0.58, "learning_rate": 2.109519142569154e-05, "loss": 2.4834, "step": 331500 }, { "epoch": 0.58, "learning_rate": 2.109431948576471e-05, "loss": 2.3469, "step": 331510 }, { "epoch": 0.58, "learning_rate": 2.1093447545837883e-05, "loss": 2.2846, "step": 331520 }, { "epoch": 0.58, "learning_rate": 2.1092575605911057e-05, "loss": 2.3392, "step": 331530 }, { "epoch": 0.58, "learning_rate": 2.109170366598423e-05, "loss": 2.2899, "step": 331540 }, { "epoch": 0.58, "learning_rate": 2.1090831726057404e-05, "loss": 2.2635, "step": 331550 }, { "epoch": 0.58, "learning_rate": 2.1089959786130574e-05, "loss": 2.2825, "step": 331560 }, { "epoch": 0.58, "learning_rate": 2.1089087846203748e-05, "loss": 2.4102, "step": 331570 }, { "epoch": 0.58, "learning_rate": 2.1088215906276922e-05, "loss": 2.3355, "step": 331580 }, { "epoch": 0.58, "learning_rate": 2.1087343966350096e-05, "loss": 2.426, "step": 331590 }, { "epoch": 0.58, "learning_rate": 2.108647202642327e-05, "loss": 2.3151, "step": 331600 }, { "epoch": 0.58, "learning_rate": 2.108560008649644e-05, "loss": 2.3628, "step": 331610 }, { "epoch": 0.58, "learning_rate": 2.1084728146569617e-05, "loss": 2.374, "step": 331620 }, { "epoch": 0.58, "learning_rate": 2.1083856206642787e-05, "loss": 2.3608, "step": 331630 }, { "epoch": 0.58, "learning_rate": 2.108298426671596e-05, "loss": 2.2921, "step": 331640 }, { "epoch": 0.58, "learning_rate": 2.1082112326789135e-05, "loss": 2.333, "step": 331650 }, { "epoch": 0.58, "learning_rate": 2.108124038686231e-05, "loss": 2.3861, "step": 331660 }, { "epoch": 0.58, "learning_rate": 2.108036844693548e-05, "loss": 2.2493, "step": 331670 }, { "epoch": 0.58, "learning_rate": 2.1079496507008653e-05, "loss": 2.3895, "step": 331680 }, { "epoch": 0.58, "learning_rate": 2.1078624567081827e-05, "loss": 2.4576, "step": 331690 }, { "epoch": 0.58, "learning_rate": 2.1077752627155e-05, "loss": 2.2758, "step": 331700 }, { "epoch": 0.58, "learning_rate": 2.1076880687228174e-05, "loss": 2.2788, "step": 331710 }, { "epoch": 0.58, "learning_rate": 2.1076008747301345e-05, "loss": 2.2826, "step": 331720 }, { "epoch": 0.58, "learning_rate": 2.1075136807374522e-05, "loss": 2.2985, "step": 331730 }, { "epoch": 0.58, "learning_rate": 2.1074264867447692e-05, "loss": 2.271, "step": 331740 }, { "epoch": 0.58, "learning_rate": 2.1073392927520866e-05, "loss": 2.2985, "step": 331750 }, { "epoch": 0.58, "learning_rate": 2.107252098759404e-05, "loss": 2.2391, "step": 331760 }, { "epoch": 0.58, "learning_rate": 2.1071649047667213e-05, "loss": 2.3479, "step": 331770 }, { "epoch": 0.58, "learning_rate": 2.1070777107740387e-05, "loss": 2.2975, "step": 331780 }, { "epoch": 0.58, "learning_rate": 2.1069905167813558e-05, "loss": 2.2835, "step": 331790 }, { "epoch": 0.58, "learning_rate": 2.1069033227886735e-05, "loss": 2.3767, "step": 331800 }, { "epoch": 0.58, "learning_rate": 2.1068161287959905e-05, "loss": 2.4244, "step": 331810 }, { "epoch": 0.58, "learning_rate": 2.106728934803308e-05, "loss": 2.3304, "step": 331820 }, { "epoch": 0.58, "learning_rate": 2.106641740810625e-05, "loss": 2.2724, "step": 331830 }, { "epoch": 0.58, "learning_rate": 2.1065545468179426e-05, "loss": 2.3446, "step": 331840 }, { "epoch": 0.58, "learning_rate": 2.10646735282526e-05, "loss": 2.2556, "step": 331850 }, { "epoch": 0.58, "learning_rate": 2.106380158832577e-05, "loss": 2.371, "step": 331860 }, { "epoch": 0.58, "learning_rate": 2.1062929648398944e-05, "loss": 2.2427, "step": 331870 }, { "epoch": 0.58, "learning_rate": 2.1062057708472118e-05, "loss": 2.2679, "step": 331880 }, { "epoch": 0.58, "learning_rate": 2.1061185768545292e-05, "loss": 2.3364, "step": 331890 }, { "epoch": 0.58, "learning_rate": 2.1060313828618462e-05, "loss": 2.2652, "step": 331900 }, { "epoch": 0.58, "learning_rate": 2.105944188869164e-05, "loss": 2.3388, "step": 331910 }, { "epoch": 0.58, "learning_rate": 2.105856994876481e-05, "loss": 2.437, "step": 331920 }, { "epoch": 0.58, "learning_rate": 2.1057698008837984e-05, "loss": 2.3925, "step": 331930 }, { "epoch": 0.58, "learning_rate": 2.1056826068911157e-05, "loss": 2.2451, "step": 331940 }, { "epoch": 0.58, "learning_rate": 2.105595412898433e-05, "loss": 2.4141, "step": 331950 }, { "epoch": 0.58, "learning_rate": 2.1055082189057505e-05, "loss": 2.4586, "step": 331960 }, { "epoch": 0.58, "learning_rate": 2.1054210249130675e-05, "loss": 2.4166, "step": 331970 }, { "epoch": 0.58, "learning_rate": 2.105333830920385e-05, "loss": 2.285, "step": 331980 }, { "epoch": 0.58, "learning_rate": 2.1052466369277023e-05, "loss": 2.4062, "step": 331990 }, { "epoch": 0.58, "learning_rate": 2.1051594429350197e-05, "loss": 2.3515, "step": 332000 }, { "epoch": 0.58, "learning_rate": 2.105072248942337e-05, "loss": 2.3034, "step": 332010 }, { "epoch": 0.58, "learning_rate": 2.1049850549496544e-05, "loss": 2.3782, "step": 332020 }, { "epoch": 0.58, "learning_rate": 2.1048978609569718e-05, "loss": 2.3573, "step": 332030 }, { "epoch": 0.58, "learning_rate": 2.104810666964289e-05, "loss": 2.2841, "step": 332040 }, { "epoch": 0.58, "learning_rate": 2.1047234729716062e-05, "loss": 2.3776, "step": 332050 }, { "epoch": 0.58, "learning_rate": 2.1046362789789236e-05, "loss": 2.3405, "step": 332060 }, { "epoch": 0.58, "learning_rate": 2.104549084986241e-05, "loss": 2.1603, "step": 332070 }, { "epoch": 0.58, "learning_rate": 2.104461890993558e-05, "loss": 2.2864, "step": 332080 }, { "epoch": 0.58, "learning_rate": 2.1043746970008754e-05, "loss": 2.3613, "step": 332090 }, { "epoch": 0.58, "learning_rate": 2.104287503008193e-05, "loss": 2.2777, "step": 332100 }, { "epoch": 0.58, "learning_rate": 2.10420030901551e-05, "loss": 2.3224, "step": 332110 }, { "epoch": 0.58, "learning_rate": 2.1041131150228275e-05, "loss": 2.3017, "step": 332120 }, { "epoch": 0.58, "learning_rate": 2.1040259210301445e-05, "loss": 2.4039, "step": 332130 }, { "epoch": 0.58, "learning_rate": 2.1039387270374623e-05, "loss": 2.4262, "step": 332140 }, { "epoch": 0.58, "learning_rate": 2.1038515330447793e-05, "loss": 2.3055, "step": 332150 }, { "epoch": 0.58, "learning_rate": 2.1037643390520967e-05, "loss": 2.2311, "step": 332160 }, { "epoch": 0.58, "learning_rate": 2.103677145059414e-05, "loss": 2.3658, "step": 332170 }, { "epoch": 0.58, "learning_rate": 2.1035899510667314e-05, "loss": 2.3691, "step": 332180 }, { "epoch": 0.58, "learning_rate": 2.1035027570740488e-05, "loss": 2.3646, "step": 332190 }, { "epoch": 0.58, "learning_rate": 2.103415563081366e-05, "loss": 2.395, "step": 332200 }, { "epoch": 0.58, "learning_rate": 2.1033283690886836e-05, "loss": 2.4215, "step": 332210 }, { "epoch": 0.58, "learning_rate": 2.1032411750960006e-05, "loss": 2.3719, "step": 332220 }, { "epoch": 0.58, "learning_rate": 2.103153981103318e-05, "loss": 2.3922, "step": 332230 }, { "epoch": 0.58, "learning_rate": 2.1030667871106354e-05, "loss": 2.315, "step": 332240 }, { "epoch": 0.58, "learning_rate": 2.1029795931179527e-05, "loss": 2.3156, "step": 332250 }, { "epoch": 0.58, "learning_rate": 2.10289239912527e-05, "loss": 2.3289, "step": 332260 }, { "epoch": 0.58, "learning_rate": 2.102805205132587e-05, "loss": 2.3193, "step": 332270 }, { "epoch": 0.58, "learning_rate": 2.102718011139905e-05, "loss": 2.3812, "step": 332280 }, { "epoch": 0.58, "learning_rate": 2.102630817147222e-05, "loss": 2.2654, "step": 332290 }, { "epoch": 0.58, "learning_rate": 2.1025436231545393e-05, "loss": 2.3175, "step": 332300 }, { "epoch": 0.58, "learning_rate": 2.1024564291618563e-05, "loss": 2.4188, "step": 332310 }, { "epoch": 0.58, "learning_rate": 2.102369235169174e-05, "loss": 2.3565, "step": 332320 }, { "epoch": 0.58, "learning_rate": 2.1022820411764914e-05, "loss": 2.3777, "step": 332330 }, { "epoch": 0.58, "learning_rate": 2.1021948471838084e-05, "loss": 2.2389, "step": 332340 }, { "epoch": 0.58, "learning_rate": 2.1021076531911258e-05, "loss": 2.3938, "step": 332350 }, { "epoch": 0.58, "learning_rate": 2.1020204591984432e-05, "loss": 2.3265, "step": 332360 }, { "epoch": 0.58, "learning_rate": 2.1019332652057606e-05, "loss": 2.3629, "step": 332370 }, { "epoch": 0.58, "learning_rate": 2.1018460712130776e-05, "loss": 2.3906, "step": 332380 }, { "epoch": 0.58, "learning_rate": 2.101758877220395e-05, "loss": 2.4485, "step": 332390 }, { "epoch": 0.58, "learning_rate": 2.1016716832277124e-05, "loss": 2.2912, "step": 332400 }, { "epoch": 0.58, "learning_rate": 2.1015844892350297e-05, "loss": 2.2923, "step": 332410 }, { "epoch": 0.58, "learning_rate": 2.101497295242347e-05, "loss": 2.4041, "step": 332420 }, { "epoch": 0.58, "learning_rate": 2.1014101012496645e-05, "loss": 2.3409, "step": 332430 }, { "epoch": 0.58, "learning_rate": 2.101322907256982e-05, "loss": 2.249, "step": 332440 }, { "epoch": 0.58, "learning_rate": 2.101235713264299e-05, "loss": 2.3955, "step": 332450 }, { "epoch": 0.58, "learning_rate": 2.1011485192716163e-05, "loss": 2.2388, "step": 332460 }, { "epoch": 0.58, "learning_rate": 2.1010613252789337e-05, "loss": 2.3177, "step": 332470 }, { "epoch": 0.58, "learning_rate": 2.100974131286251e-05, "loss": 2.3138, "step": 332480 }, { "epoch": 0.58, "learning_rate": 2.1008869372935684e-05, "loss": 2.3136, "step": 332490 }, { "epoch": 0.58, "learning_rate": 2.1007997433008855e-05, "loss": 2.3532, "step": 332500 }, { "epoch": 0.58, "learning_rate": 2.1007125493082032e-05, "loss": 2.3281, "step": 332510 }, { "epoch": 0.58, "learning_rate": 2.1006253553155202e-05, "loss": 2.347, "step": 332520 }, { "epoch": 0.58, "learning_rate": 2.1005381613228376e-05, "loss": 2.251, "step": 332530 }, { "epoch": 0.58, "learning_rate": 2.1004509673301546e-05, "loss": 2.4278, "step": 332540 }, { "epoch": 0.58, "learning_rate": 2.1003637733374723e-05, "loss": 2.2274, "step": 332550 }, { "epoch": 0.58, "learning_rate": 2.1002765793447894e-05, "loss": 2.309, "step": 332560 }, { "epoch": 0.58, "learning_rate": 2.1001893853521068e-05, "loss": 2.3586, "step": 332570 }, { "epoch": 0.58, "learning_rate": 2.1001021913594245e-05, "loss": 2.2519, "step": 332580 }, { "epoch": 0.58, "learning_rate": 2.1000149973667415e-05, "loss": 2.31, "step": 332590 }, { "epoch": 0.58, "learning_rate": 2.099927803374059e-05, "loss": 2.3282, "step": 332600 }, { "epoch": 0.58, "learning_rate": 2.099840609381376e-05, "loss": 2.3775, "step": 332610 }, { "epoch": 0.58, "learning_rate": 2.0997534153886936e-05, "loss": 2.3458, "step": 332620 }, { "epoch": 0.58, "learning_rate": 2.0996662213960107e-05, "loss": 2.4899, "step": 332630 }, { "epoch": 0.58, "learning_rate": 2.099579027403328e-05, "loss": 2.3935, "step": 332640 }, { "epoch": 0.58, "learning_rate": 2.0994918334106454e-05, "loss": 2.338, "step": 332650 }, { "epoch": 0.58, "learning_rate": 2.0994046394179628e-05, "loss": 2.2941, "step": 332660 }, { "epoch": 0.58, "learning_rate": 2.0993174454252802e-05, "loss": 2.2671, "step": 332670 }, { "epoch": 0.58, "learning_rate": 2.0992302514325972e-05, "loss": 2.3903, "step": 332680 }, { "epoch": 0.58, "learning_rate": 2.099143057439915e-05, "loss": 2.2412, "step": 332690 }, { "epoch": 0.58, "learning_rate": 2.099055863447232e-05, "loss": 2.3846, "step": 332700 }, { "epoch": 0.58, "learning_rate": 2.0989686694545494e-05, "loss": 2.3578, "step": 332710 }, { "epoch": 0.58, "learning_rate": 2.0988814754618667e-05, "loss": 2.3972, "step": 332720 }, { "epoch": 0.58, "learning_rate": 2.098794281469184e-05, "loss": 2.2864, "step": 332730 }, { "epoch": 0.58, "learning_rate": 2.0987070874765015e-05, "loss": 2.3322, "step": 332740 }, { "epoch": 0.58, "learning_rate": 2.0986198934838185e-05, "loss": 2.3444, "step": 332750 }, { "epoch": 0.58, "learning_rate": 2.098532699491136e-05, "loss": 2.2796, "step": 332760 }, { "epoch": 0.58, "learning_rate": 2.0984455054984533e-05, "loss": 2.3497, "step": 332770 }, { "epoch": 0.58, "learning_rate": 2.0983583115057707e-05, "loss": 2.3297, "step": 332780 }, { "epoch": 0.58, "learning_rate": 2.0982711175130877e-05, "loss": 2.3763, "step": 332790 }, { "epoch": 0.58, "learning_rate": 2.098183923520405e-05, "loss": 2.3271, "step": 332800 }, { "epoch": 0.58, "learning_rate": 2.0980967295277225e-05, "loss": 2.2655, "step": 332810 }, { "epoch": 0.58, "learning_rate": 2.09800953553504e-05, "loss": 2.2209, "step": 332820 }, { "epoch": 0.58, "learning_rate": 2.0979223415423572e-05, "loss": 2.362, "step": 332830 }, { "epoch": 0.58, "learning_rate": 2.0978351475496746e-05, "loss": 2.253, "step": 332840 }, { "epoch": 0.58, "learning_rate": 2.097747953556992e-05, "loss": 2.3625, "step": 332850 }, { "epoch": 0.58, "learning_rate": 2.097660759564309e-05, "loss": 2.2809, "step": 332860 }, { "epoch": 0.58, "learning_rate": 2.0975735655716264e-05, "loss": 2.3391, "step": 332870 }, { "epoch": 0.58, "learning_rate": 2.0974863715789438e-05, "loss": 2.3176, "step": 332880 }, { "epoch": 0.58, "learning_rate": 2.097399177586261e-05, "loss": 2.304, "step": 332890 }, { "epoch": 0.58, "learning_rate": 2.0973119835935785e-05, "loss": 2.3482, "step": 332900 }, { "epoch": 0.58, "learning_rate": 2.0972247896008955e-05, "loss": 2.3385, "step": 332910 }, { "epoch": 0.58, "learning_rate": 2.0971375956082133e-05, "loss": 2.4194, "step": 332920 }, { "epoch": 0.58, "learning_rate": 2.0970504016155303e-05, "loss": 2.2658, "step": 332930 }, { "epoch": 0.58, "learning_rate": 2.0969632076228477e-05, "loss": 2.3248, "step": 332940 }, { "epoch": 0.58, "learning_rate": 2.096876013630165e-05, "loss": 2.4774, "step": 332950 }, { "epoch": 0.58, "learning_rate": 2.0967888196374824e-05, "loss": 2.3209, "step": 332960 }, { "epoch": 0.58, "learning_rate": 2.0967016256447998e-05, "loss": 2.3741, "step": 332970 }, { "epoch": 0.58, "learning_rate": 2.096614431652117e-05, "loss": 2.3559, "step": 332980 }, { "epoch": 0.58, "learning_rate": 2.0965272376594346e-05, "loss": 2.3577, "step": 332990 }, { "epoch": 0.58, "learning_rate": 2.0964400436667516e-05, "loss": 2.4038, "step": 333000 }, { "epoch": 0.58, "learning_rate": 2.096352849674069e-05, "loss": 2.4093, "step": 333010 }, { "epoch": 0.58, "learning_rate": 2.096265655681386e-05, "loss": 2.3801, "step": 333020 }, { "epoch": 0.58, "learning_rate": 2.0961784616887037e-05, "loss": 2.4384, "step": 333030 }, { "epoch": 0.58, "learning_rate": 2.0960912676960208e-05, "loss": 2.1224, "step": 333040 }, { "epoch": 0.58, "learning_rate": 2.096004073703338e-05, "loss": 2.3105, "step": 333050 }, { "epoch": 0.58, "learning_rate": 2.0959168797106555e-05, "loss": 2.3545, "step": 333060 }, { "epoch": 0.58, "learning_rate": 2.095829685717973e-05, "loss": 2.2249, "step": 333070 }, { "epoch": 0.58, "learning_rate": 2.0957424917252903e-05, "loss": 2.3651, "step": 333080 }, { "epoch": 0.58, "learning_rate": 2.0956552977326073e-05, "loss": 2.2603, "step": 333090 }, { "epoch": 0.58, "learning_rate": 2.095568103739925e-05, "loss": 2.2548, "step": 333100 }, { "epoch": 0.58, "learning_rate": 2.095480909747242e-05, "loss": 2.3563, "step": 333110 }, { "epoch": 0.58, "learning_rate": 2.0953937157545594e-05, "loss": 2.2813, "step": 333120 }, { "epoch": 0.58, "learning_rate": 2.0953065217618768e-05, "loss": 2.2987, "step": 333130 }, { "epoch": 0.58, "learning_rate": 2.0952193277691942e-05, "loss": 2.3156, "step": 333140 }, { "epoch": 0.58, "learning_rate": 2.0951321337765116e-05, "loss": 2.2948, "step": 333150 }, { "epoch": 0.58, "learning_rate": 2.0950449397838286e-05, "loss": 2.3406, "step": 333160 }, { "epoch": 0.58, "learning_rate": 2.094957745791146e-05, "loss": 2.379, "step": 333170 }, { "epoch": 0.58, "learning_rate": 2.0948705517984634e-05, "loss": 2.3093, "step": 333180 }, { "epoch": 0.58, "learning_rate": 2.0947833578057807e-05, "loss": 2.302, "step": 333190 }, { "epoch": 0.58, "learning_rate": 2.094696163813098e-05, "loss": 2.3785, "step": 333200 }, { "epoch": 0.58, "learning_rate": 2.0946089698204155e-05, "loss": 2.3221, "step": 333210 }, { "epoch": 0.58, "learning_rate": 2.094521775827733e-05, "loss": 2.2867, "step": 333220 }, { "epoch": 0.58, "learning_rate": 2.09443458183505e-05, "loss": 2.3409, "step": 333230 }, { "epoch": 0.58, "learning_rate": 2.0943473878423673e-05, "loss": 2.3665, "step": 333240 }, { "epoch": 0.58, "learning_rate": 2.0942601938496847e-05, "loss": 2.3541, "step": 333250 }, { "epoch": 0.58, "learning_rate": 2.094172999857002e-05, "loss": 2.3214, "step": 333260 }, { "epoch": 0.58, "learning_rate": 2.094085805864319e-05, "loss": 2.2546, "step": 333270 }, { "epoch": 0.58, "learning_rate": 2.0939986118716365e-05, "loss": 2.3087, "step": 333280 }, { "epoch": 0.58, "learning_rate": 2.093911417878954e-05, "loss": 2.2347, "step": 333290 }, { "epoch": 0.58, "learning_rate": 2.0938242238862712e-05, "loss": 2.3037, "step": 333300 }, { "epoch": 0.58, "learning_rate": 2.0937370298935886e-05, "loss": 2.2373, "step": 333310 }, { "epoch": 0.58, "learning_rate": 2.0936498359009056e-05, "loss": 2.3279, "step": 333320 }, { "epoch": 0.58, "learning_rate": 2.0935626419082234e-05, "loss": 2.4537, "step": 333330 }, { "epoch": 0.58, "learning_rate": 2.0934754479155404e-05, "loss": 2.4537, "step": 333340 }, { "epoch": 0.58, "learning_rate": 2.0933882539228578e-05, "loss": 2.3025, "step": 333350 }, { "epoch": 0.58, "learning_rate": 2.093301059930175e-05, "loss": 2.3957, "step": 333360 }, { "epoch": 0.58, "learning_rate": 2.0932138659374925e-05, "loss": 2.3143, "step": 333370 }, { "epoch": 0.58, "learning_rate": 2.09312667194481e-05, "loss": 2.3033, "step": 333380 }, { "epoch": 0.58, "learning_rate": 2.093039477952127e-05, "loss": 2.3338, "step": 333390 }, { "epoch": 0.58, "learning_rate": 2.0929522839594447e-05, "loss": 2.4436, "step": 333400 }, { "epoch": 0.58, "learning_rate": 2.0928650899667617e-05, "loss": 2.3172, "step": 333410 }, { "epoch": 0.58, "learning_rate": 2.092777895974079e-05, "loss": 2.3115, "step": 333420 }, { "epoch": 0.58, "learning_rate": 2.0926907019813964e-05, "loss": 2.3784, "step": 333430 }, { "epoch": 0.58, "learning_rate": 2.0926035079887138e-05, "loss": 2.2896, "step": 333440 }, { "epoch": 0.58, "learning_rate": 2.0925163139960312e-05, "loss": 2.3138, "step": 333450 }, { "epoch": 0.58, "learning_rate": 2.0924291200033482e-05, "loss": 2.3278, "step": 333460 }, { "epoch": 0.58, "learning_rate": 2.0923419260106656e-05, "loss": 2.2977, "step": 333470 }, { "epoch": 0.58, "learning_rate": 2.092254732017983e-05, "loss": 2.3084, "step": 333480 }, { "epoch": 0.58, "learning_rate": 2.0921675380253004e-05, "loss": 2.3614, "step": 333490 }, { "epoch": 0.58, "learning_rate": 2.0920803440326174e-05, "loss": 2.2933, "step": 333500 }, { "epoch": 0.58, "learning_rate": 2.091993150039935e-05, "loss": 2.3163, "step": 333510 }, { "epoch": 0.58, "learning_rate": 2.091905956047252e-05, "loss": 2.3961, "step": 333520 }, { "epoch": 0.58, "learning_rate": 2.0918187620545695e-05, "loss": 2.3437, "step": 333530 }, { "epoch": 0.58, "learning_rate": 2.091731568061887e-05, "loss": 2.2885, "step": 333540 }, { "epoch": 0.58, "learning_rate": 2.0916443740692043e-05, "loss": 2.303, "step": 333550 }, { "epoch": 0.58, "learning_rate": 2.0915571800765217e-05, "loss": 2.3501, "step": 333560 }, { "epoch": 0.58, "learning_rate": 2.0914699860838387e-05, "loss": 2.3509, "step": 333570 }, { "epoch": 0.58, "learning_rate": 2.091382792091156e-05, "loss": 2.3157, "step": 333580 }, { "epoch": 0.58, "learning_rate": 2.0912955980984735e-05, "loss": 2.2078, "step": 333590 }, { "epoch": 0.58, "learning_rate": 2.091208404105791e-05, "loss": 2.3417, "step": 333600 }, { "epoch": 0.58, "learning_rate": 2.0911212101131082e-05, "loss": 2.3321, "step": 333610 }, { "epoch": 0.58, "learning_rate": 2.0910340161204256e-05, "loss": 2.4379, "step": 333620 }, { "epoch": 0.58, "learning_rate": 2.090946822127743e-05, "loss": 2.4691, "step": 333630 }, { "epoch": 0.58, "learning_rate": 2.09085962813506e-05, "loss": 2.2801, "step": 333640 }, { "epoch": 0.58, "learning_rate": 2.0907724341423774e-05, "loss": 2.1598, "step": 333650 }, { "epoch": 0.58, "learning_rate": 2.0906852401496948e-05, "loss": 2.3032, "step": 333660 }, { "epoch": 0.58, "learning_rate": 2.090598046157012e-05, "loss": 2.2803, "step": 333670 }, { "epoch": 0.58, "learning_rate": 2.0905108521643295e-05, "loss": 2.4337, "step": 333680 }, { "epoch": 0.58, "learning_rate": 2.0904236581716466e-05, "loss": 2.3405, "step": 333690 }, { "epoch": 0.58, "learning_rate": 2.0903364641789643e-05, "loss": 2.296, "step": 333700 }, { "epoch": 0.58, "learning_rate": 2.0902492701862813e-05, "loss": 2.3279, "step": 333710 }, { "epoch": 0.58, "learning_rate": 2.0901620761935987e-05, "loss": 2.3639, "step": 333720 }, { "epoch": 0.58, "learning_rate": 2.0900748822009157e-05, "loss": 2.2857, "step": 333730 }, { "epoch": 0.58, "learning_rate": 2.0899876882082334e-05, "loss": 2.2393, "step": 333740 }, { "epoch": 0.58, "learning_rate": 2.0899004942155505e-05, "loss": 2.3367, "step": 333750 }, { "epoch": 0.58, "learning_rate": 2.089813300222868e-05, "loss": 2.2362, "step": 333760 }, { "epoch": 0.58, "learning_rate": 2.0897261062301852e-05, "loss": 2.2315, "step": 333770 }, { "epoch": 0.58, "learning_rate": 2.0896389122375026e-05, "loss": 2.208, "step": 333780 }, { "epoch": 0.58, "learning_rate": 2.08955171824482e-05, "loss": 2.3756, "step": 333790 }, { "epoch": 0.58, "learning_rate": 2.089464524252137e-05, "loss": 2.2584, "step": 333800 }, { "epoch": 0.58, "learning_rate": 2.0893773302594547e-05, "loss": 2.347, "step": 333810 }, { "epoch": 0.58, "learning_rate": 2.0892901362667718e-05, "loss": 2.3091, "step": 333820 }, { "epoch": 0.58, "learning_rate": 2.089202942274089e-05, "loss": 2.214, "step": 333830 }, { "epoch": 0.58, "learning_rate": 2.0891157482814065e-05, "loss": 2.3701, "step": 333840 }, { "epoch": 0.58, "learning_rate": 2.089028554288724e-05, "loss": 2.3266, "step": 333850 }, { "epoch": 0.58, "learning_rate": 2.0889413602960413e-05, "loss": 2.3315, "step": 333860 }, { "epoch": 0.58, "learning_rate": 2.0888541663033583e-05, "loss": 2.311, "step": 333870 }, { "epoch": 0.58, "learning_rate": 2.088766972310676e-05, "loss": 2.3568, "step": 333880 }, { "epoch": 0.58, "learning_rate": 2.088679778317993e-05, "loss": 2.3191, "step": 333890 }, { "epoch": 0.58, "learning_rate": 2.0885925843253105e-05, "loss": 2.3148, "step": 333900 }, { "epoch": 0.58, "learning_rate": 2.0885053903326275e-05, "loss": 2.3337, "step": 333910 }, { "epoch": 0.58, "learning_rate": 2.0884181963399452e-05, "loss": 2.3942, "step": 333920 }, { "epoch": 0.58, "learning_rate": 2.0883310023472626e-05, "loss": 2.3463, "step": 333930 }, { "epoch": 0.58, "learning_rate": 2.0882438083545796e-05, "loss": 2.2327, "step": 333940 }, { "epoch": 0.58, "learning_rate": 2.088156614361897e-05, "loss": 2.3772, "step": 333950 }, { "epoch": 0.58, "learning_rate": 2.0880694203692144e-05, "loss": 2.306, "step": 333960 }, { "epoch": 0.58, "learning_rate": 2.0879822263765318e-05, "loss": 2.3154, "step": 333970 }, { "epoch": 0.58, "learning_rate": 2.0878950323838488e-05, "loss": 2.293, "step": 333980 }, { "epoch": 0.58, "learning_rate": 2.087807838391166e-05, "loss": 2.3141, "step": 333990 }, { "epoch": 0.58, "learning_rate": 2.0877206443984835e-05, "loss": 2.3507, "step": 334000 }, { "epoch": 0.58, "learning_rate": 2.087633450405801e-05, "loss": 2.2521, "step": 334010 }, { "epoch": 0.58, "learning_rate": 2.0875462564131183e-05, "loss": 2.4041, "step": 334020 }, { "epoch": 0.58, "learning_rate": 2.0874590624204357e-05, "loss": 2.2315, "step": 334030 }, { "epoch": 0.58, "learning_rate": 2.087371868427753e-05, "loss": 2.4264, "step": 334040 }, { "epoch": 0.58, "learning_rate": 2.08728467443507e-05, "loss": 2.2739, "step": 334050 }, { "epoch": 0.58, "learning_rate": 2.0871974804423875e-05, "loss": 2.2439, "step": 334060 }, { "epoch": 0.58, "learning_rate": 2.087110286449705e-05, "loss": 2.4256, "step": 334070 }, { "epoch": 0.58, "learning_rate": 2.0870230924570222e-05, "loss": 2.4389, "step": 334080 }, { "epoch": 0.58, "learning_rate": 2.0869358984643396e-05, "loss": 2.3198, "step": 334090 }, { "epoch": 0.58, "learning_rate": 2.0868487044716566e-05, "loss": 2.3355, "step": 334100 }, { "epoch": 0.58, "learning_rate": 2.0867615104789744e-05, "loss": 2.4243, "step": 334110 }, { "epoch": 0.58, "learning_rate": 2.0866743164862914e-05, "loss": 2.3594, "step": 334120 }, { "epoch": 0.58, "learning_rate": 2.0865871224936088e-05, "loss": 2.2278, "step": 334130 }, { "epoch": 0.58, "learning_rate": 2.086499928500926e-05, "loss": 2.2839, "step": 334140 }, { "epoch": 0.58, "learning_rate": 2.0864127345082435e-05, "loss": 2.379, "step": 334150 }, { "epoch": 0.58, "learning_rate": 2.086325540515561e-05, "loss": 2.4181, "step": 334160 }, { "epoch": 0.58, "learning_rate": 2.086238346522878e-05, "loss": 2.3612, "step": 334170 }, { "epoch": 0.58, "learning_rate": 2.0861511525301957e-05, "loss": 2.2494, "step": 334180 }, { "epoch": 0.58, "learning_rate": 2.0860639585375127e-05, "loss": 2.3163, "step": 334190 }, { "epoch": 0.58, "learning_rate": 2.08597676454483e-05, "loss": 2.3904, "step": 334200 }, { "epoch": 0.58, "learning_rate": 2.085889570552147e-05, "loss": 2.2972, "step": 334210 }, { "epoch": 0.58, "learning_rate": 2.0858023765594648e-05, "loss": 2.412, "step": 334220 }, { "epoch": 0.58, "learning_rate": 2.085715182566782e-05, "loss": 2.4625, "step": 334230 }, { "epoch": 0.58, "learning_rate": 2.0856279885740992e-05, "loss": 2.3629, "step": 334240 }, { "epoch": 0.58, "learning_rate": 2.0855407945814166e-05, "loss": 2.3118, "step": 334250 }, { "epoch": 0.58, "learning_rate": 2.085453600588734e-05, "loss": 2.2731, "step": 334260 }, { "epoch": 0.58, "learning_rate": 2.0853664065960514e-05, "loss": 2.299, "step": 334270 }, { "epoch": 0.58, "learning_rate": 2.0852792126033684e-05, "loss": 2.351, "step": 334280 }, { "epoch": 0.58, "learning_rate": 2.085192018610686e-05, "loss": 2.3262, "step": 334290 }, { "epoch": 0.58, "learning_rate": 2.085104824618003e-05, "loss": 2.32, "step": 334300 }, { "epoch": 0.58, "learning_rate": 2.0850176306253205e-05, "loss": 2.1992, "step": 334310 }, { "epoch": 0.58, "learning_rate": 2.084930436632638e-05, "loss": 2.337, "step": 334320 }, { "epoch": 0.58, "learning_rate": 2.0848432426399553e-05, "loss": 2.2603, "step": 334330 }, { "epoch": 0.58, "learning_rate": 2.0847560486472727e-05, "loss": 2.3826, "step": 334340 }, { "epoch": 0.58, "learning_rate": 2.0846688546545897e-05, "loss": 2.2297, "step": 334350 }, { "epoch": 0.58, "learning_rate": 2.084581660661907e-05, "loss": 2.2893, "step": 334360 }, { "epoch": 0.58, "learning_rate": 2.0844944666692245e-05, "loss": 2.4059, "step": 334370 }, { "epoch": 0.58, "learning_rate": 2.084407272676542e-05, "loss": 2.2102, "step": 334380 }, { "epoch": 0.58, "learning_rate": 2.084320078683859e-05, "loss": 2.2999, "step": 334390 }, { "epoch": 0.58, "learning_rate": 2.0842328846911763e-05, "loss": 2.1898, "step": 334400 }, { "epoch": 0.58, "learning_rate": 2.084145690698494e-05, "loss": 2.2384, "step": 334410 }, { "epoch": 0.58, "learning_rate": 2.084058496705811e-05, "loss": 2.3271, "step": 334420 }, { "epoch": 0.58, "learning_rate": 2.0839713027131284e-05, "loss": 2.279, "step": 334430 }, { "epoch": 0.58, "learning_rate": 2.0838841087204458e-05, "loss": 2.2065, "step": 334440 }, { "epoch": 0.58, "learning_rate": 2.083796914727763e-05, "loss": 2.4428, "step": 334450 }, { "epoch": 0.58, "learning_rate": 2.0837097207350802e-05, "loss": 2.3192, "step": 334460 }, { "epoch": 0.58, "learning_rate": 2.0836225267423976e-05, "loss": 2.3101, "step": 334470 }, { "epoch": 0.58, "learning_rate": 2.083535332749715e-05, "loss": 2.3376, "step": 334480 }, { "epoch": 0.58, "learning_rate": 2.0834481387570323e-05, "loss": 2.3738, "step": 334490 }, { "epoch": 0.58, "learning_rate": 2.0833609447643497e-05, "loss": 2.3364, "step": 334500 }, { "epoch": 0.58, "learning_rate": 2.0832737507716667e-05, "loss": 2.4187, "step": 334510 }, { "epoch": 0.58, "learning_rate": 2.0831865567789844e-05, "loss": 2.3209, "step": 334520 }, { "epoch": 0.58, "learning_rate": 2.0830993627863015e-05, "loss": 2.4048, "step": 334530 }, { "epoch": 0.58, "learning_rate": 2.083012168793619e-05, "loss": 2.3419, "step": 334540 }, { "epoch": 0.58, "learning_rate": 2.0829249748009362e-05, "loss": 2.3729, "step": 334550 }, { "epoch": 0.58, "learning_rate": 2.0828377808082536e-05, "loss": 2.3592, "step": 334560 }, { "epoch": 0.58, "learning_rate": 2.082750586815571e-05, "loss": 2.2149, "step": 334570 }, { "epoch": 0.58, "learning_rate": 2.082663392822888e-05, "loss": 2.4603, "step": 334580 }, { "epoch": 0.58, "learning_rate": 2.0825761988302057e-05, "loss": 2.3539, "step": 334590 }, { "epoch": 0.58, "learning_rate": 2.0824890048375228e-05, "loss": 2.2936, "step": 334600 }, { "epoch": 0.58, "learning_rate": 2.08240181084484e-05, "loss": 2.3485, "step": 334610 }, { "epoch": 0.58, "learning_rate": 2.0823146168521572e-05, "loss": 2.3267, "step": 334620 }, { "epoch": 0.58, "learning_rate": 2.082227422859475e-05, "loss": 2.3017, "step": 334630 }, { "epoch": 0.58, "learning_rate": 2.082140228866792e-05, "loss": 2.4247, "step": 334640 }, { "epoch": 0.58, "learning_rate": 2.0820530348741093e-05, "loss": 2.2992, "step": 334650 }, { "epoch": 0.58, "learning_rate": 2.0819658408814267e-05, "loss": 2.351, "step": 334660 }, { "epoch": 0.58, "learning_rate": 2.081878646888744e-05, "loss": 2.3601, "step": 334670 }, { "epoch": 0.58, "learning_rate": 2.0817914528960615e-05, "loss": 2.3474, "step": 334680 }, { "epoch": 0.58, "learning_rate": 2.0817042589033785e-05, "loss": 2.371, "step": 334690 }, { "epoch": 0.58, "learning_rate": 2.0816170649106962e-05, "loss": 2.3246, "step": 334700 }, { "epoch": 0.58, "learning_rate": 2.0815298709180132e-05, "loss": 2.3957, "step": 334710 }, { "epoch": 0.58, "learning_rate": 2.0814426769253306e-05, "loss": 2.2845, "step": 334720 }, { "epoch": 0.58, "learning_rate": 2.081355482932648e-05, "loss": 2.2759, "step": 334730 }, { "epoch": 0.58, "learning_rate": 2.0812682889399654e-05, "loss": 2.303, "step": 334740 }, { "epoch": 0.58, "learning_rate": 2.0811810949472828e-05, "loss": 2.2845, "step": 334750 }, { "epoch": 0.58, "learning_rate": 2.0810939009545998e-05, "loss": 2.4192, "step": 334760 }, { "epoch": 0.58, "learning_rate": 2.081006706961917e-05, "loss": 2.3347, "step": 334770 }, { "epoch": 0.58, "learning_rate": 2.0809195129692345e-05, "loss": 2.3345, "step": 334780 }, { "epoch": 0.58, "learning_rate": 2.080832318976552e-05, "loss": 2.2909, "step": 334790 }, { "epoch": 0.58, "learning_rate": 2.0807451249838693e-05, "loss": 2.3448, "step": 334800 }, { "epoch": 0.58, "learning_rate": 2.0806579309911867e-05, "loss": 2.3763, "step": 334810 }, { "epoch": 0.58, "learning_rate": 2.080570736998504e-05, "loss": 2.2592, "step": 334820 }, { "epoch": 0.58, "learning_rate": 2.080483543005821e-05, "loss": 2.3448, "step": 334830 }, { "epoch": 0.58, "learning_rate": 2.0803963490131385e-05, "loss": 2.1708, "step": 334840 }, { "epoch": 0.58, "learning_rate": 2.080309155020456e-05, "loss": 2.2902, "step": 334850 }, { "epoch": 0.58, "learning_rate": 2.0802219610277732e-05, "loss": 2.3207, "step": 334860 }, { "epoch": 0.58, "learning_rate": 2.0801347670350903e-05, "loss": 2.3918, "step": 334870 }, { "epoch": 0.58, "learning_rate": 2.0800475730424076e-05, "loss": 2.3468, "step": 334880 }, { "epoch": 0.58, "learning_rate": 2.0799603790497254e-05, "loss": 2.2199, "step": 334890 }, { "epoch": 0.58, "learning_rate": 2.0798731850570424e-05, "loss": 2.3629, "step": 334900 }, { "epoch": 0.58, "learning_rate": 2.0797859910643598e-05, "loss": 2.2944, "step": 334910 }, { "epoch": 0.58, "learning_rate": 2.0796987970716768e-05, "loss": 2.2509, "step": 334920 }, { "epoch": 0.58, "learning_rate": 2.0796116030789945e-05, "loss": 2.3374, "step": 334930 }, { "epoch": 0.58, "learning_rate": 2.0795244090863116e-05, "loss": 2.3429, "step": 334940 }, { "epoch": 0.58, "learning_rate": 2.079437215093629e-05, "loss": 2.4328, "step": 334950 }, { "epoch": 0.58, "learning_rate": 2.0793500211009463e-05, "loss": 2.3492, "step": 334960 }, { "epoch": 0.58, "learning_rate": 2.0792628271082637e-05, "loss": 2.3207, "step": 334970 }, { "epoch": 0.58, "learning_rate": 2.079175633115581e-05, "loss": 2.3817, "step": 334980 }, { "epoch": 0.58, "learning_rate": 2.079088439122898e-05, "loss": 2.3086, "step": 334990 }, { "epoch": 0.58, "learning_rate": 2.0790012451302158e-05, "loss": 2.3872, "step": 335000 }, { "epoch": 0.58, "learning_rate": 2.078914051137533e-05, "loss": 2.2607, "step": 335010 }, { "epoch": 0.58, "learning_rate": 2.0788268571448502e-05, "loss": 2.4312, "step": 335020 }, { "epoch": 0.58, "learning_rate": 2.0787396631521676e-05, "loss": 2.2673, "step": 335030 }, { "epoch": 0.58, "learning_rate": 2.078652469159485e-05, "loss": 2.3064, "step": 335040 }, { "epoch": 0.58, "learning_rate": 2.0785652751668024e-05, "loss": 2.4369, "step": 335050 }, { "epoch": 0.58, "learning_rate": 2.0784780811741194e-05, "loss": 2.4757, "step": 335060 }, { "epoch": 0.58, "learning_rate": 2.078390887181437e-05, "loss": 2.3024, "step": 335070 }, { "epoch": 0.58, "learning_rate": 2.078303693188754e-05, "loss": 2.3128, "step": 335080 }, { "epoch": 0.58, "learning_rate": 2.0782164991960715e-05, "loss": 2.3463, "step": 335090 }, { "epoch": 0.58, "learning_rate": 2.0781293052033886e-05, "loss": 2.3516, "step": 335100 }, { "epoch": 0.58, "learning_rate": 2.0780421112107063e-05, "loss": 2.3399, "step": 335110 }, { "epoch": 0.58, "learning_rate": 2.0779549172180233e-05, "loss": 2.319, "step": 335120 }, { "epoch": 0.58, "learning_rate": 2.0778677232253407e-05, "loss": 2.3536, "step": 335130 }, { "epoch": 0.58, "learning_rate": 2.077780529232658e-05, "loss": 2.3927, "step": 335140 }, { "epoch": 0.58, "learning_rate": 2.0776933352399755e-05, "loss": 2.3876, "step": 335150 }, { "epoch": 0.58, "learning_rate": 2.077606141247293e-05, "loss": 2.3012, "step": 335160 }, { "epoch": 0.58, "learning_rate": 2.07751894725461e-05, "loss": 2.2235, "step": 335170 }, { "epoch": 0.58, "learning_rate": 2.0774317532619273e-05, "loss": 2.3498, "step": 335180 }, { "epoch": 0.58, "learning_rate": 2.0773445592692446e-05, "loss": 2.2996, "step": 335190 }, { "epoch": 0.58, "learning_rate": 2.077257365276562e-05, "loss": 2.4026, "step": 335200 }, { "epoch": 0.58, "learning_rate": 2.0771701712838794e-05, "loss": 2.3166, "step": 335210 }, { "epoch": 0.58, "learning_rate": 2.0770829772911968e-05, "loss": 2.301, "step": 335220 }, { "epoch": 0.58, "learning_rate": 2.076995783298514e-05, "loss": 2.3005, "step": 335230 }, { "epoch": 0.58, "learning_rate": 2.0769085893058312e-05, "loss": 2.4258, "step": 335240 }, { "epoch": 0.58, "learning_rate": 2.0768213953131486e-05, "loss": 2.2285, "step": 335250 }, { "epoch": 0.58, "learning_rate": 2.076734201320466e-05, "loss": 2.3316, "step": 335260 }, { "epoch": 0.58, "learning_rate": 2.0766470073277833e-05, "loss": 2.3859, "step": 335270 }, { "epoch": 0.58, "learning_rate": 2.0765598133351007e-05, "loss": 2.4325, "step": 335280 }, { "epoch": 0.58, "learning_rate": 2.0764726193424177e-05, "loss": 2.3072, "step": 335290 }, { "epoch": 0.58, "learning_rate": 2.0763854253497354e-05, "loss": 2.2772, "step": 335300 }, { "epoch": 0.58, "learning_rate": 2.0762982313570525e-05, "loss": 2.343, "step": 335310 }, { "epoch": 0.58, "learning_rate": 2.07621103736437e-05, "loss": 2.4244, "step": 335320 }, { "epoch": 0.58, "learning_rate": 2.076123843371687e-05, "loss": 2.3023, "step": 335330 }, { "epoch": 0.58, "learning_rate": 2.0760366493790046e-05, "loss": 2.2626, "step": 335340 }, { "epoch": 0.58, "learning_rate": 2.0759494553863216e-05, "loss": 2.3619, "step": 335350 }, { "epoch": 0.58, "learning_rate": 2.075862261393639e-05, "loss": 2.3963, "step": 335360 }, { "epoch": 0.58, "learning_rate": 2.0757750674009564e-05, "loss": 2.366, "step": 335370 }, { "epoch": 0.58, "learning_rate": 2.0756878734082738e-05, "loss": 2.3343, "step": 335380 }, { "epoch": 0.58, "learning_rate": 2.075600679415591e-05, "loss": 2.4781, "step": 335390 }, { "epoch": 0.58, "learning_rate": 2.0755134854229082e-05, "loss": 2.3679, "step": 335400 }, { "epoch": 0.58, "learning_rate": 2.075426291430226e-05, "loss": 2.3357, "step": 335410 }, { "epoch": 0.58, "learning_rate": 2.075339097437543e-05, "loss": 2.2023, "step": 335420 }, { "epoch": 0.58, "learning_rate": 2.0752519034448603e-05, "loss": 2.4257, "step": 335430 }, { "epoch": 0.58, "learning_rate": 2.0751647094521777e-05, "loss": 2.2535, "step": 335440 }, { "epoch": 0.58, "learning_rate": 2.075077515459495e-05, "loss": 2.374, "step": 335450 }, { "epoch": 0.59, "learning_rate": 2.0749903214668125e-05, "loss": 2.3577, "step": 335460 }, { "epoch": 0.59, "learning_rate": 2.0749031274741295e-05, "loss": 2.3867, "step": 335470 }, { "epoch": 0.59, "learning_rate": 2.0748159334814472e-05, "loss": 2.348, "step": 335480 }, { "epoch": 0.59, "learning_rate": 2.0747287394887642e-05, "loss": 2.4506, "step": 335490 }, { "epoch": 0.59, "learning_rate": 2.0746415454960816e-05, "loss": 2.2948, "step": 335500 }, { "epoch": 0.59, "learning_rate": 2.074554351503399e-05, "loss": 2.3799, "step": 335510 }, { "epoch": 0.59, "learning_rate": 2.0744671575107164e-05, "loss": 2.4495, "step": 335520 }, { "epoch": 0.59, "learning_rate": 2.0743799635180338e-05, "loss": 2.2764, "step": 335530 }, { "epoch": 0.59, "learning_rate": 2.0742927695253508e-05, "loss": 2.3828, "step": 335540 }, { "epoch": 0.59, "learning_rate": 2.074205575532668e-05, "loss": 2.3029, "step": 335550 }, { "epoch": 0.59, "learning_rate": 2.0741183815399855e-05, "loss": 2.4462, "step": 335560 }, { "epoch": 0.59, "learning_rate": 2.074031187547303e-05, "loss": 2.3669, "step": 335570 }, { "epoch": 0.59, "learning_rate": 2.07394399355462e-05, "loss": 2.3032, "step": 335580 }, { "epoch": 0.59, "learning_rate": 2.0738567995619373e-05, "loss": 2.2916, "step": 335590 }, { "epoch": 0.59, "learning_rate": 2.0737696055692547e-05, "loss": 2.4487, "step": 335600 }, { "epoch": 0.59, "learning_rate": 2.073682411576572e-05, "loss": 2.2746, "step": 335610 }, { "epoch": 0.59, "learning_rate": 2.0735952175838895e-05, "loss": 2.4127, "step": 335620 }, { "epoch": 0.59, "learning_rate": 2.073508023591207e-05, "loss": 2.2715, "step": 335630 }, { "epoch": 0.59, "learning_rate": 2.0734208295985242e-05, "loss": 2.2083, "step": 335640 }, { "epoch": 0.59, "learning_rate": 2.0733336356058413e-05, "loss": 2.3645, "step": 335650 }, { "epoch": 0.59, "learning_rate": 2.0732464416131586e-05, "loss": 2.5133, "step": 335660 }, { "epoch": 0.59, "learning_rate": 2.073159247620476e-05, "loss": 2.4126, "step": 335670 }, { "epoch": 0.59, "learning_rate": 2.0730720536277934e-05, "loss": 2.343, "step": 335680 }, { "epoch": 0.59, "learning_rate": 2.0729848596351108e-05, "loss": 2.3379, "step": 335690 }, { "epoch": 0.59, "learning_rate": 2.0728976656424278e-05, "loss": 2.384, "step": 335700 }, { "epoch": 0.59, "learning_rate": 2.0728104716497455e-05, "loss": 2.4826, "step": 335710 }, { "epoch": 0.59, "learning_rate": 2.0727232776570626e-05, "loss": 2.2203, "step": 335720 }, { "epoch": 0.59, "learning_rate": 2.07263608366438e-05, "loss": 2.4299, "step": 335730 }, { "epoch": 0.59, "learning_rate": 2.0725488896716973e-05, "loss": 2.3813, "step": 335740 }, { "epoch": 0.59, "learning_rate": 2.0724616956790147e-05, "loss": 2.2575, "step": 335750 }, { "epoch": 0.59, "learning_rate": 2.072374501686332e-05, "loss": 2.3208, "step": 335760 }, { "epoch": 0.59, "learning_rate": 2.072287307693649e-05, "loss": 2.4052, "step": 335770 }, { "epoch": 0.59, "learning_rate": 2.0722001137009668e-05, "loss": 2.3823, "step": 335780 }, { "epoch": 0.59, "learning_rate": 2.072112919708284e-05, "loss": 2.3302, "step": 335790 }, { "epoch": 0.59, "learning_rate": 2.0720257257156012e-05, "loss": 2.3747, "step": 335800 }, { "epoch": 0.59, "learning_rate": 2.0719385317229183e-05, "loss": 2.1454, "step": 335810 }, { "epoch": 0.59, "learning_rate": 2.071851337730236e-05, "loss": 2.2089, "step": 335820 }, { "epoch": 0.59, "learning_rate": 2.071764143737553e-05, "loss": 2.3209, "step": 335830 }, { "epoch": 0.59, "learning_rate": 2.0716769497448704e-05, "loss": 2.312, "step": 335840 }, { "epoch": 0.59, "learning_rate": 2.0715897557521878e-05, "loss": 2.2569, "step": 335850 }, { "epoch": 0.59, "learning_rate": 2.071502561759505e-05, "loss": 2.2446, "step": 335860 }, { "epoch": 0.59, "learning_rate": 2.0714153677668225e-05, "loss": 2.4188, "step": 335870 }, { "epoch": 0.59, "learning_rate": 2.0713281737741396e-05, "loss": 2.274, "step": 335880 }, { "epoch": 0.59, "learning_rate": 2.0712409797814573e-05, "loss": 2.3587, "step": 335890 }, { "epoch": 0.59, "learning_rate": 2.0711537857887743e-05, "loss": 2.4021, "step": 335900 }, { "epoch": 0.59, "learning_rate": 2.0710665917960917e-05, "loss": 2.3406, "step": 335910 }, { "epoch": 0.59, "learning_rate": 2.070979397803409e-05, "loss": 2.328, "step": 335920 }, { "epoch": 0.59, "learning_rate": 2.0708922038107265e-05, "loss": 2.3039, "step": 335930 }, { "epoch": 0.59, "learning_rate": 2.070805009818044e-05, "loss": 2.3327, "step": 335940 }, { "epoch": 0.59, "learning_rate": 2.070717815825361e-05, "loss": 2.2726, "step": 335950 }, { "epoch": 0.59, "learning_rate": 2.0706306218326783e-05, "loss": 2.2221, "step": 335960 }, { "epoch": 0.59, "learning_rate": 2.0705434278399956e-05, "loss": 2.3098, "step": 335970 }, { "epoch": 0.59, "learning_rate": 2.070456233847313e-05, "loss": 2.3903, "step": 335980 }, { "epoch": 0.59, "learning_rate": 2.07036903985463e-05, "loss": 2.2562, "step": 335990 }, { "epoch": 0.59, "learning_rate": 2.0702818458619478e-05, "loss": 2.285, "step": 336000 }, { "epoch": 0.59, "learning_rate": 2.070194651869265e-05, "loss": 2.3275, "step": 336010 }, { "epoch": 0.59, "learning_rate": 2.0701074578765822e-05, "loss": 2.3549, "step": 336020 }, { "epoch": 0.59, "learning_rate": 2.0700202638838996e-05, "loss": 2.33, "step": 336030 }, { "epoch": 0.59, "learning_rate": 2.069933069891217e-05, "loss": 2.2892, "step": 336040 }, { "epoch": 0.59, "learning_rate": 2.0698458758985343e-05, "loss": 2.3973, "step": 336050 }, { "epoch": 0.59, "learning_rate": 2.0697586819058513e-05, "loss": 2.3359, "step": 336060 }, { "epoch": 0.59, "learning_rate": 2.0696714879131687e-05, "loss": 2.3729, "step": 336070 }, { "epoch": 0.59, "learning_rate": 2.069584293920486e-05, "loss": 2.3096, "step": 336080 }, { "epoch": 0.59, "learning_rate": 2.0694970999278035e-05, "loss": 2.2917, "step": 336090 }, { "epoch": 0.59, "learning_rate": 2.069409905935121e-05, "loss": 2.3664, "step": 336100 }, { "epoch": 0.59, "learning_rate": 2.069322711942438e-05, "loss": 2.3047, "step": 336110 }, { "epoch": 0.59, "learning_rate": 2.0692355179497556e-05, "loss": 2.2458, "step": 336120 }, { "epoch": 0.59, "learning_rate": 2.0691483239570726e-05, "loss": 2.246, "step": 336130 }, { "epoch": 0.59, "learning_rate": 2.06906112996439e-05, "loss": 2.2462, "step": 336140 }, { "epoch": 0.59, "learning_rate": 2.0689739359717074e-05, "loss": 2.2707, "step": 336150 }, { "epoch": 0.59, "learning_rate": 2.0688867419790248e-05, "loss": 2.3644, "step": 336160 }, { "epoch": 0.59, "learning_rate": 2.068799547986342e-05, "loss": 2.3219, "step": 336170 }, { "epoch": 0.59, "learning_rate": 2.0687123539936592e-05, "loss": 2.2721, "step": 336180 }, { "epoch": 0.59, "learning_rate": 2.068625160000977e-05, "loss": 2.478, "step": 336190 }, { "epoch": 0.59, "learning_rate": 2.068537966008294e-05, "loss": 2.3561, "step": 336200 }, { "epoch": 0.59, "learning_rate": 2.0684507720156113e-05, "loss": 2.3587, "step": 336210 }, { "epoch": 0.59, "learning_rate": 2.0683635780229284e-05, "loss": 2.3655, "step": 336220 }, { "epoch": 0.59, "learning_rate": 2.068276384030246e-05, "loss": 2.3361, "step": 336230 }, { "epoch": 0.59, "learning_rate": 2.0681891900375635e-05, "loss": 2.3005, "step": 336240 }, { "epoch": 0.59, "learning_rate": 2.0681019960448805e-05, "loss": 2.392, "step": 336250 }, { "epoch": 0.59, "learning_rate": 2.068014802052198e-05, "loss": 2.3332, "step": 336260 }, { "epoch": 0.59, "learning_rate": 2.0679276080595152e-05, "loss": 2.3854, "step": 336270 }, { "epoch": 0.59, "learning_rate": 2.0678404140668326e-05, "loss": 2.3912, "step": 336280 }, { "epoch": 0.59, "learning_rate": 2.0677532200741497e-05, "loss": 2.3918, "step": 336290 }, { "epoch": 0.59, "learning_rate": 2.0676660260814674e-05, "loss": 2.3691, "step": 336300 }, { "epoch": 0.59, "learning_rate": 2.0675788320887844e-05, "loss": 2.3311, "step": 336310 }, { "epoch": 0.59, "learning_rate": 2.0674916380961018e-05, "loss": 2.2325, "step": 336320 }, { "epoch": 0.59, "learning_rate": 2.067404444103419e-05, "loss": 2.4171, "step": 336330 }, { "epoch": 0.59, "learning_rate": 2.0673172501107365e-05, "loss": 2.2711, "step": 336340 }, { "epoch": 0.59, "learning_rate": 2.067230056118054e-05, "loss": 2.2987, "step": 336350 }, { "epoch": 0.59, "learning_rate": 2.067142862125371e-05, "loss": 2.3483, "step": 336360 }, { "epoch": 0.59, "learning_rate": 2.0670556681326883e-05, "loss": 2.2702, "step": 336370 }, { "epoch": 0.59, "learning_rate": 2.0669684741400057e-05, "loss": 2.3487, "step": 336380 }, { "epoch": 0.59, "learning_rate": 2.066881280147323e-05, "loss": 2.3668, "step": 336390 }, { "epoch": 0.59, "learning_rate": 2.0667940861546405e-05, "loss": 2.3, "step": 336400 }, { "epoch": 0.59, "learning_rate": 2.066706892161958e-05, "loss": 2.3559, "step": 336410 }, { "epoch": 0.59, "learning_rate": 2.0666196981692752e-05, "loss": 2.2485, "step": 336420 }, { "epoch": 0.59, "learning_rate": 2.0665325041765923e-05, "loss": 2.3504, "step": 336430 }, { "epoch": 0.59, "learning_rate": 2.0664453101839096e-05, "loss": 2.2661, "step": 336440 }, { "epoch": 0.59, "learning_rate": 2.066358116191227e-05, "loss": 2.2942, "step": 336450 }, { "epoch": 0.59, "learning_rate": 2.0662709221985444e-05, "loss": 2.3675, "step": 336460 }, { "epoch": 0.59, "learning_rate": 2.0661837282058614e-05, "loss": 2.3895, "step": 336470 }, { "epoch": 0.59, "learning_rate": 2.0660965342131788e-05, "loss": 2.2963, "step": 336480 }, { "epoch": 0.59, "learning_rate": 2.0660093402204965e-05, "loss": 2.2954, "step": 336490 }, { "epoch": 0.59, "learning_rate": 2.0659221462278136e-05, "loss": 2.3414, "step": 336500 }, { "epoch": 0.59, "learning_rate": 2.065834952235131e-05, "loss": 2.3208, "step": 336510 }, { "epoch": 0.59, "learning_rate": 2.065747758242448e-05, "loss": 2.3371, "step": 336520 }, { "epoch": 0.59, "learning_rate": 2.0656605642497657e-05, "loss": 2.2729, "step": 336530 }, { "epoch": 0.59, "learning_rate": 2.0655733702570827e-05, "loss": 2.3574, "step": 336540 }, { "epoch": 0.59, "learning_rate": 2.0654861762644e-05, "loss": 2.3453, "step": 336550 }, { "epoch": 0.59, "learning_rate": 2.0653989822717175e-05, "loss": 2.3284, "step": 336560 }, { "epoch": 0.59, "learning_rate": 2.065311788279035e-05, "loss": 2.2426, "step": 336570 }, { "epoch": 0.59, "learning_rate": 2.0652245942863522e-05, "loss": 2.288, "step": 336580 }, { "epoch": 0.59, "learning_rate": 2.0651374002936693e-05, "loss": 2.3182, "step": 336590 }, { "epoch": 0.59, "learning_rate": 2.065050206300987e-05, "loss": 2.3341, "step": 336600 }, { "epoch": 0.59, "learning_rate": 2.064963012308304e-05, "loss": 2.2939, "step": 336610 }, { "epoch": 0.59, "learning_rate": 2.0648758183156214e-05, "loss": 2.2639, "step": 336620 }, { "epoch": 0.59, "learning_rate": 2.0647886243229388e-05, "loss": 2.3278, "step": 336630 }, { "epoch": 0.59, "learning_rate": 2.064701430330256e-05, "loss": 2.2063, "step": 336640 }, { "epoch": 0.59, "learning_rate": 2.0646142363375735e-05, "loss": 2.312, "step": 336650 }, { "epoch": 0.59, "learning_rate": 2.0645270423448906e-05, "loss": 2.3383, "step": 336660 }, { "epoch": 0.59, "learning_rate": 2.0644398483522083e-05, "loss": 2.3101, "step": 336670 }, { "epoch": 0.59, "learning_rate": 2.0643526543595253e-05, "loss": 2.3627, "step": 336680 }, { "epoch": 0.59, "learning_rate": 2.0642654603668427e-05, "loss": 2.3509, "step": 336690 }, { "epoch": 0.59, "learning_rate": 2.0641782663741597e-05, "loss": 2.338, "step": 336700 }, { "epoch": 0.59, "learning_rate": 2.0640910723814775e-05, "loss": 2.2813, "step": 336710 }, { "epoch": 0.59, "learning_rate": 2.0640038783887945e-05, "loss": 2.2847, "step": 336720 }, { "epoch": 0.59, "learning_rate": 2.063916684396112e-05, "loss": 2.384, "step": 336730 }, { "epoch": 0.59, "learning_rate": 2.0638294904034293e-05, "loss": 2.3851, "step": 336740 }, { "epoch": 0.59, "learning_rate": 2.0637422964107466e-05, "loss": 2.3719, "step": 336750 }, { "epoch": 0.59, "learning_rate": 2.063655102418064e-05, "loss": 2.4496, "step": 336760 }, { "epoch": 0.59, "learning_rate": 2.063567908425381e-05, "loss": 2.3137, "step": 336770 }, { "epoch": 0.59, "learning_rate": 2.0634807144326984e-05, "loss": 2.2099, "step": 336780 }, { "epoch": 0.59, "learning_rate": 2.0633935204400158e-05, "loss": 2.4212, "step": 336790 }, { "epoch": 0.59, "learning_rate": 2.0633063264473332e-05, "loss": 2.3354, "step": 336800 }, { "epoch": 0.59, "learning_rate": 2.0632191324546506e-05, "loss": 2.3506, "step": 336810 }, { "epoch": 0.59, "learning_rate": 2.063131938461968e-05, "loss": 2.475, "step": 336820 }, { "epoch": 0.59, "learning_rate": 2.0630447444692853e-05, "loss": 2.3702, "step": 336830 }, { "epoch": 0.59, "learning_rate": 2.0629575504766023e-05, "loss": 2.3434, "step": 336840 }, { "epoch": 0.59, "learning_rate": 2.0628703564839197e-05, "loss": 2.4181, "step": 336850 }, { "epoch": 0.59, "learning_rate": 2.062783162491237e-05, "loss": 2.2173, "step": 336860 }, { "epoch": 0.59, "learning_rate": 2.0626959684985545e-05, "loss": 2.2848, "step": 336870 }, { "epoch": 0.59, "learning_rate": 2.062608774505872e-05, "loss": 2.2973, "step": 336880 }, { "epoch": 0.59, "learning_rate": 2.062521580513189e-05, "loss": 2.398, "step": 336890 }, { "epoch": 0.59, "learning_rate": 2.0624343865205066e-05, "loss": 2.2426, "step": 336900 }, { "epoch": 0.59, "learning_rate": 2.0623471925278236e-05, "loss": 2.4089, "step": 336910 }, { "epoch": 0.59, "learning_rate": 2.062259998535141e-05, "loss": 2.3535, "step": 336920 }, { "epoch": 0.59, "learning_rate": 2.062172804542458e-05, "loss": 2.3016, "step": 336930 }, { "epoch": 0.59, "learning_rate": 2.0620856105497758e-05, "loss": 2.3801, "step": 336940 }, { "epoch": 0.59, "learning_rate": 2.0619984165570928e-05, "loss": 2.3618, "step": 336950 }, { "epoch": 0.59, "learning_rate": 2.0619112225644102e-05, "loss": 2.4325, "step": 336960 }, { "epoch": 0.59, "learning_rate": 2.061824028571728e-05, "loss": 2.3608, "step": 336970 }, { "epoch": 0.59, "learning_rate": 2.061736834579045e-05, "loss": 2.3454, "step": 336980 }, { "epoch": 0.59, "learning_rate": 2.0616496405863623e-05, "loss": 2.5388, "step": 336990 }, { "epoch": 0.59, "learning_rate": 2.0615624465936794e-05, "loss": 2.2774, "step": 337000 }, { "epoch": 0.59, "learning_rate": 2.061475252600997e-05, "loss": 2.3326, "step": 337010 }, { "epoch": 0.59, "learning_rate": 2.061388058608314e-05, "loss": 2.2196, "step": 337020 }, { "epoch": 0.59, "learning_rate": 2.0613008646156315e-05, "loss": 2.2216, "step": 337030 }, { "epoch": 0.59, "learning_rate": 2.061213670622949e-05, "loss": 2.4363, "step": 337040 }, { "epoch": 0.59, "learning_rate": 2.0611264766302662e-05, "loss": 2.3805, "step": 337050 }, { "epoch": 0.59, "learning_rate": 2.0610392826375836e-05, "loss": 2.1664, "step": 337060 }, { "epoch": 0.59, "learning_rate": 2.0609520886449007e-05, "loss": 2.3097, "step": 337070 }, { "epoch": 0.59, "learning_rate": 2.0608648946522184e-05, "loss": 2.3323, "step": 337080 }, { "epoch": 0.59, "learning_rate": 2.0607777006595354e-05, "loss": 2.2812, "step": 337090 }, { "epoch": 0.59, "learning_rate": 2.0606905066668528e-05, "loss": 2.3378, "step": 337100 }, { "epoch": 0.59, "learning_rate": 2.06060331267417e-05, "loss": 2.3914, "step": 337110 }, { "epoch": 0.59, "learning_rate": 2.0605161186814875e-05, "loss": 2.2508, "step": 337120 }, { "epoch": 0.59, "learning_rate": 2.060428924688805e-05, "loss": 2.4147, "step": 337130 }, { "epoch": 0.59, "learning_rate": 2.060341730696122e-05, "loss": 2.1675, "step": 337140 }, { "epoch": 0.59, "learning_rate": 2.0602545367034393e-05, "loss": 2.2828, "step": 337150 }, { "epoch": 0.59, "learning_rate": 2.0601673427107567e-05, "loss": 2.3492, "step": 337160 }, { "epoch": 0.59, "learning_rate": 2.060080148718074e-05, "loss": 2.3558, "step": 337170 }, { "epoch": 0.59, "learning_rate": 2.059992954725391e-05, "loss": 2.3009, "step": 337180 }, { "epoch": 0.59, "learning_rate": 2.0599057607327085e-05, "loss": 2.2031, "step": 337190 }, { "epoch": 0.59, "learning_rate": 2.059818566740026e-05, "loss": 2.2927, "step": 337200 }, { "epoch": 0.59, "learning_rate": 2.0597313727473433e-05, "loss": 2.3941, "step": 337210 }, { "epoch": 0.59, "learning_rate": 2.0596441787546606e-05, "loss": 2.3459, "step": 337220 }, { "epoch": 0.59, "learning_rate": 2.059556984761978e-05, "loss": 2.2863, "step": 337230 }, { "epoch": 0.59, "learning_rate": 2.0594697907692954e-05, "loss": 2.3058, "step": 337240 }, { "epoch": 0.59, "learning_rate": 2.0593825967766124e-05, "loss": 2.3676, "step": 337250 }, { "epoch": 0.59, "learning_rate": 2.0592954027839298e-05, "loss": 2.3301, "step": 337260 }, { "epoch": 0.59, "learning_rate": 2.0592082087912472e-05, "loss": 2.2507, "step": 337270 }, { "epoch": 0.59, "learning_rate": 2.0591210147985646e-05, "loss": 2.3575, "step": 337280 }, { "epoch": 0.59, "learning_rate": 2.059033820805882e-05, "loss": 2.2905, "step": 337290 }, { "epoch": 0.59, "learning_rate": 2.058946626813199e-05, "loss": 2.3005, "step": 337300 }, { "epoch": 0.59, "learning_rate": 2.0588594328205167e-05, "loss": 2.3497, "step": 337310 }, { "epoch": 0.59, "learning_rate": 2.0587722388278337e-05, "loss": 2.4457, "step": 337320 }, { "epoch": 0.59, "learning_rate": 2.058685044835151e-05, "loss": 2.2952, "step": 337330 }, { "epoch": 0.59, "learning_rate": 2.0585978508424685e-05, "loss": 2.4518, "step": 337340 }, { "epoch": 0.59, "learning_rate": 2.058510656849786e-05, "loss": 2.3612, "step": 337350 }, { "epoch": 0.59, "learning_rate": 2.0584234628571032e-05, "loss": 2.3498, "step": 337360 }, { "epoch": 0.59, "learning_rate": 2.0583362688644203e-05, "loss": 2.2937, "step": 337370 }, { "epoch": 0.59, "learning_rate": 2.058249074871738e-05, "loss": 2.3464, "step": 337380 }, { "epoch": 0.59, "learning_rate": 2.058161880879055e-05, "loss": 2.3577, "step": 337390 }, { "epoch": 0.59, "learning_rate": 2.0580746868863724e-05, "loss": 2.4046, "step": 337400 }, { "epoch": 0.59, "learning_rate": 2.0579874928936894e-05, "loss": 2.4094, "step": 337410 }, { "epoch": 0.59, "learning_rate": 2.057900298901007e-05, "loss": 2.1753, "step": 337420 }, { "epoch": 0.59, "learning_rate": 2.0578131049083242e-05, "loss": 2.3331, "step": 337430 }, { "epoch": 0.59, "learning_rate": 2.0577259109156416e-05, "loss": 2.3079, "step": 337440 }, { "epoch": 0.59, "learning_rate": 2.057638716922959e-05, "loss": 2.3377, "step": 337450 }, { "epoch": 0.59, "learning_rate": 2.0575515229302763e-05, "loss": 2.3931, "step": 337460 }, { "epoch": 0.59, "learning_rate": 2.0574643289375937e-05, "loss": 2.2818, "step": 337470 }, { "epoch": 0.59, "learning_rate": 2.0573771349449107e-05, "loss": 2.2985, "step": 337480 }, { "epoch": 0.59, "learning_rate": 2.0572899409522285e-05, "loss": 2.2765, "step": 337490 }, { "epoch": 0.59, "learning_rate": 2.0572027469595455e-05, "loss": 2.2953, "step": 337500 }, { "epoch": 0.59, "learning_rate": 2.057115552966863e-05, "loss": 2.2476, "step": 337510 }, { "epoch": 0.59, "learning_rate": 2.0570283589741803e-05, "loss": 2.4119, "step": 337520 }, { "epoch": 0.59, "learning_rate": 2.0569411649814976e-05, "loss": 2.2611, "step": 337530 }, { "epoch": 0.59, "learning_rate": 2.056853970988815e-05, "loss": 2.4205, "step": 337540 }, { "epoch": 0.59, "learning_rate": 2.056766776996132e-05, "loss": 2.3137, "step": 337550 }, { "epoch": 0.59, "learning_rate": 2.0566795830034494e-05, "loss": 2.4246, "step": 337560 }, { "epoch": 0.59, "learning_rate": 2.0565923890107668e-05, "loss": 2.3443, "step": 337570 }, { "epoch": 0.59, "learning_rate": 2.0565051950180842e-05, "loss": 2.2561, "step": 337580 }, { "epoch": 0.59, "learning_rate": 2.0564180010254016e-05, "loss": 2.4313, "step": 337590 }, { "epoch": 0.59, "learning_rate": 2.056330807032719e-05, "loss": 2.4016, "step": 337600 }, { "epoch": 0.59, "learning_rate": 2.0562436130400363e-05, "loss": 2.3139, "step": 337610 }, { "epoch": 0.59, "learning_rate": 2.0561564190473533e-05, "loss": 2.1904, "step": 337620 }, { "epoch": 0.59, "learning_rate": 2.0560692250546707e-05, "loss": 2.3532, "step": 337630 }, { "epoch": 0.59, "learning_rate": 2.055982031061988e-05, "loss": 2.3578, "step": 337640 }, { "epoch": 0.59, "learning_rate": 2.0558948370693055e-05, "loss": 2.3194, "step": 337650 }, { "epoch": 0.59, "learning_rate": 2.0558076430766225e-05, "loss": 2.3152, "step": 337660 }, { "epoch": 0.59, "learning_rate": 2.05572044908394e-05, "loss": 2.4305, "step": 337670 }, { "epoch": 0.59, "learning_rate": 2.0556332550912573e-05, "loss": 2.4211, "step": 337680 }, { "epoch": 0.59, "learning_rate": 2.0555460610985746e-05, "loss": 2.3238, "step": 337690 }, { "epoch": 0.59, "learning_rate": 2.055458867105892e-05, "loss": 2.3169, "step": 337700 }, { "epoch": 0.59, "learning_rate": 2.055371673113209e-05, "loss": 2.3608, "step": 337710 }, { "epoch": 0.59, "learning_rate": 2.0552844791205268e-05, "loss": 2.4697, "step": 337720 }, { "epoch": 0.59, "learning_rate": 2.0551972851278438e-05, "loss": 2.217, "step": 337730 }, { "epoch": 0.59, "learning_rate": 2.0551100911351612e-05, "loss": 2.2556, "step": 337740 }, { "epoch": 0.59, "learning_rate": 2.0550228971424786e-05, "loss": 2.4138, "step": 337750 }, { "epoch": 0.59, "learning_rate": 2.054935703149796e-05, "loss": 2.3777, "step": 337760 }, { "epoch": 0.59, "learning_rate": 2.0548485091571133e-05, "loss": 2.4012, "step": 337770 }, { "epoch": 0.59, "learning_rate": 2.0547613151644304e-05, "loss": 2.3352, "step": 337780 }, { "epoch": 0.59, "learning_rate": 2.054674121171748e-05, "loss": 2.4596, "step": 337790 }, { "epoch": 0.59, "learning_rate": 2.054586927179065e-05, "loss": 2.4, "step": 337800 }, { "epoch": 0.59, "learning_rate": 2.0544997331863825e-05, "loss": 2.2689, "step": 337810 }, { "epoch": 0.59, "learning_rate": 2.0544125391936995e-05, "loss": 2.3449, "step": 337820 }, { "epoch": 0.59, "learning_rate": 2.0543253452010172e-05, "loss": 2.3583, "step": 337830 }, { "epoch": 0.59, "learning_rate": 2.0542381512083346e-05, "loss": 2.2992, "step": 337840 }, { "epoch": 0.59, "learning_rate": 2.0541509572156517e-05, "loss": 2.3472, "step": 337850 }, { "epoch": 0.59, "learning_rate": 2.054063763222969e-05, "loss": 2.395, "step": 337860 }, { "epoch": 0.59, "learning_rate": 2.0539765692302864e-05, "loss": 2.4164, "step": 337870 }, { "epoch": 0.59, "learning_rate": 2.0538893752376038e-05, "loss": 2.2504, "step": 337880 }, { "epoch": 0.59, "learning_rate": 2.053802181244921e-05, "loss": 2.2435, "step": 337890 }, { "epoch": 0.59, "learning_rate": 2.0537149872522385e-05, "loss": 2.4411, "step": 337900 }, { "epoch": 0.59, "learning_rate": 2.0536277932595556e-05, "loss": 2.4384, "step": 337910 }, { "epoch": 0.59, "learning_rate": 2.053540599266873e-05, "loss": 2.3965, "step": 337920 }, { "epoch": 0.59, "learning_rate": 2.0534534052741903e-05, "loss": 2.3504, "step": 337930 }, { "epoch": 0.59, "learning_rate": 2.0533662112815077e-05, "loss": 2.2414, "step": 337940 }, { "epoch": 0.59, "learning_rate": 2.053279017288825e-05, "loss": 2.3138, "step": 337950 }, { "epoch": 0.59, "learning_rate": 2.053191823296142e-05, "loss": 2.4171, "step": 337960 }, { "epoch": 0.59, "learning_rate": 2.0531046293034595e-05, "loss": 2.2983, "step": 337970 }, { "epoch": 0.59, "learning_rate": 2.053017435310777e-05, "loss": 2.2992, "step": 337980 }, { "epoch": 0.59, "learning_rate": 2.0529302413180943e-05, "loss": 2.35, "step": 337990 }, { "epoch": 0.59, "learning_rate": 2.0528430473254116e-05, "loss": 2.2002, "step": 338000 }, { "epoch": 0.59, "learning_rate": 2.052755853332729e-05, "loss": 2.3626, "step": 338010 }, { "epoch": 0.59, "learning_rate": 2.0526686593400464e-05, "loss": 2.2958, "step": 338020 }, { "epoch": 0.59, "learning_rate": 2.0525814653473634e-05, "loss": 2.4495, "step": 338030 }, { "epoch": 0.59, "learning_rate": 2.0524942713546808e-05, "loss": 2.3654, "step": 338040 }, { "epoch": 0.59, "learning_rate": 2.0524070773619982e-05, "loss": 2.3641, "step": 338050 }, { "epoch": 0.59, "learning_rate": 2.0523198833693156e-05, "loss": 2.2557, "step": 338060 }, { "epoch": 0.59, "learning_rate": 2.0522326893766326e-05, "loss": 2.3026, "step": 338070 }, { "epoch": 0.59, "learning_rate": 2.05214549538395e-05, "loss": 2.4836, "step": 338080 }, { "epoch": 0.59, "learning_rate": 2.0520583013912677e-05, "loss": 2.3843, "step": 338090 }, { "epoch": 0.59, "learning_rate": 2.0519711073985847e-05, "loss": 2.3269, "step": 338100 }, { "epoch": 0.59, "learning_rate": 2.051883913405902e-05, "loss": 2.2906, "step": 338110 }, { "epoch": 0.59, "learning_rate": 2.051796719413219e-05, "loss": 2.1633, "step": 338120 }, { "epoch": 0.59, "learning_rate": 2.051709525420537e-05, "loss": 2.3889, "step": 338130 }, { "epoch": 0.59, "learning_rate": 2.051622331427854e-05, "loss": 2.3214, "step": 338140 }, { "epoch": 0.59, "learning_rate": 2.0515351374351713e-05, "loss": 2.3289, "step": 338150 }, { "epoch": 0.59, "learning_rate": 2.0514479434424887e-05, "loss": 2.3302, "step": 338160 }, { "epoch": 0.59, "learning_rate": 2.051360749449806e-05, "loss": 2.3735, "step": 338170 }, { "epoch": 0.59, "learning_rate": 2.0512735554571234e-05, "loss": 2.2317, "step": 338180 }, { "epoch": 0.59, "learning_rate": 2.0511863614644404e-05, "loss": 2.4349, "step": 338190 }, { "epoch": 0.59, "learning_rate": 2.051099167471758e-05, "loss": 2.3051, "step": 338200 }, { "epoch": 0.59, "learning_rate": 2.0510119734790752e-05, "loss": 2.323, "step": 338210 }, { "epoch": 0.59, "learning_rate": 2.0509247794863926e-05, "loss": 2.3556, "step": 338220 }, { "epoch": 0.59, "learning_rate": 2.05083758549371e-05, "loss": 2.2918, "step": 338230 }, { "epoch": 0.59, "learning_rate": 2.0507503915010273e-05, "loss": 2.2994, "step": 338240 }, { "epoch": 0.59, "learning_rate": 2.0506631975083447e-05, "loss": 2.3722, "step": 338250 }, { "epoch": 0.59, "learning_rate": 2.0505760035156617e-05, "loss": 2.2436, "step": 338260 }, { "epoch": 0.59, "learning_rate": 2.0504888095229795e-05, "loss": 2.2651, "step": 338270 }, { "epoch": 0.59, "learning_rate": 2.0504016155302965e-05, "loss": 2.4471, "step": 338280 }, { "epoch": 0.59, "learning_rate": 2.050314421537614e-05, "loss": 2.3166, "step": 338290 }, { "epoch": 0.59, "learning_rate": 2.050227227544931e-05, "loss": 2.3708, "step": 338300 }, { "epoch": 0.59, "learning_rate": 2.0501400335522486e-05, "loss": 2.3614, "step": 338310 }, { "epoch": 0.59, "learning_rate": 2.050052839559566e-05, "loss": 2.287, "step": 338320 }, { "epoch": 0.59, "learning_rate": 2.049965645566883e-05, "loss": 2.2947, "step": 338330 }, { "epoch": 0.59, "learning_rate": 2.0498784515742004e-05, "loss": 2.3284, "step": 338340 }, { "epoch": 0.59, "learning_rate": 2.0497912575815178e-05, "loss": 2.3281, "step": 338350 }, { "epoch": 0.59, "learning_rate": 2.0497040635888352e-05, "loss": 2.3298, "step": 338360 }, { "epoch": 0.59, "learning_rate": 2.0496168695961522e-05, "loss": 2.3346, "step": 338370 }, { "epoch": 0.59, "learning_rate": 2.0495296756034696e-05, "loss": 2.3433, "step": 338380 }, { "epoch": 0.59, "learning_rate": 2.049442481610787e-05, "loss": 2.3973, "step": 338390 }, { "epoch": 0.59, "learning_rate": 2.0493552876181043e-05, "loss": 2.4238, "step": 338400 }, { "epoch": 0.59, "learning_rate": 2.0492680936254217e-05, "loss": 2.4015, "step": 338410 }, { "epoch": 0.59, "learning_rate": 2.049180899632739e-05, "loss": 2.2166, "step": 338420 }, { "epoch": 0.59, "learning_rate": 2.0490937056400565e-05, "loss": 2.3735, "step": 338430 }, { "epoch": 0.59, "learning_rate": 2.0490065116473735e-05, "loss": 2.3294, "step": 338440 }, { "epoch": 0.59, "learning_rate": 2.048919317654691e-05, "loss": 2.4274, "step": 338450 }, { "epoch": 0.59, "learning_rate": 2.0488321236620083e-05, "loss": 2.3142, "step": 338460 }, { "epoch": 0.59, "learning_rate": 2.0487449296693256e-05, "loss": 2.3487, "step": 338470 }, { "epoch": 0.59, "learning_rate": 2.048657735676643e-05, "loss": 2.4014, "step": 338480 }, { "epoch": 0.59, "learning_rate": 2.04857054168396e-05, "loss": 2.2979, "step": 338490 }, { "epoch": 0.59, "learning_rate": 2.0484833476912778e-05, "loss": 2.2724, "step": 338500 }, { "epoch": 0.59, "learning_rate": 2.0483961536985948e-05, "loss": 2.4308, "step": 338510 }, { "epoch": 0.59, "learning_rate": 2.0483089597059122e-05, "loss": 2.2926, "step": 338520 }, { "epoch": 0.59, "learning_rate": 2.0482217657132296e-05, "loss": 2.2096, "step": 338530 }, { "epoch": 0.59, "learning_rate": 2.048134571720547e-05, "loss": 2.2815, "step": 338540 }, { "epoch": 0.59, "learning_rate": 2.048047377727864e-05, "loss": 2.2617, "step": 338550 }, { "epoch": 0.59, "learning_rate": 2.0479601837351814e-05, "loss": 2.3567, "step": 338560 }, { "epoch": 0.59, "learning_rate": 2.047872989742499e-05, "loss": 2.3002, "step": 338570 }, { "epoch": 0.59, "learning_rate": 2.047785795749816e-05, "loss": 2.1965, "step": 338580 }, { "epoch": 0.59, "learning_rate": 2.0476986017571335e-05, "loss": 2.4156, "step": 338590 }, { "epoch": 0.59, "learning_rate": 2.0476114077644505e-05, "loss": 2.3433, "step": 338600 }, { "epoch": 0.59, "learning_rate": 2.0475242137717682e-05, "loss": 2.2955, "step": 338610 }, { "epoch": 0.59, "learning_rate": 2.0474370197790853e-05, "loss": 2.3147, "step": 338620 }, { "epoch": 0.59, "learning_rate": 2.0473498257864027e-05, "loss": 2.3357, "step": 338630 }, { "epoch": 0.59, "learning_rate": 2.04726263179372e-05, "loss": 2.3461, "step": 338640 }, { "epoch": 0.59, "learning_rate": 2.0471754378010374e-05, "loss": 2.4198, "step": 338650 }, { "epoch": 0.59, "learning_rate": 2.0470882438083548e-05, "loss": 2.3024, "step": 338660 }, { "epoch": 0.59, "learning_rate": 2.047001049815672e-05, "loss": 2.3236, "step": 338670 }, { "epoch": 0.59, "learning_rate": 2.0469138558229895e-05, "loss": 2.3758, "step": 338680 }, { "epoch": 0.59, "learning_rate": 2.0468266618303066e-05, "loss": 2.2963, "step": 338690 }, { "epoch": 0.59, "learning_rate": 2.046739467837624e-05, "loss": 2.4858, "step": 338700 }, { "epoch": 0.59, "learning_rate": 2.0466522738449413e-05, "loss": 2.3701, "step": 338710 }, { "epoch": 0.59, "learning_rate": 2.0465650798522587e-05, "loss": 2.3371, "step": 338720 }, { "epoch": 0.59, "learning_rate": 2.046477885859576e-05, "loss": 2.4031, "step": 338730 }, { "epoch": 0.59, "learning_rate": 2.046390691866893e-05, "loss": 2.2036, "step": 338740 }, { "epoch": 0.59, "learning_rate": 2.0463034978742105e-05, "loss": 2.3745, "step": 338750 }, { "epoch": 0.59, "learning_rate": 2.046216303881528e-05, "loss": 2.3086, "step": 338760 }, { "epoch": 0.59, "learning_rate": 2.0461291098888453e-05, "loss": 2.3761, "step": 338770 }, { "epoch": 0.59, "learning_rate": 2.0460419158961623e-05, "loss": 2.3703, "step": 338780 }, { "epoch": 0.59, "learning_rate": 2.0459547219034797e-05, "loss": 2.3941, "step": 338790 }, { "epoch": 0.59, "learning_rate": 2.045867527910797e-05, "loss": 2.3806, "step": 338800 }, { "epoch": 0.59, "learning_rate": 2.0457803339181144e-05, "loss": 2.3734, "step": 338810 }, { "epoch": 0.59, "learning_rate": 2.0456931399254318e-05, "loss": 2.4272, "step": 338820 }, { "epoch": 0.59, "learning_rate": 2.0456059459327492e-05, "loss": 2.3833, "step": 338830 }, { "epoch": 0.59, "learning_rate": 2.0455187519400666e-05, "loss": 2.2965, "step": 338840 }, { "epoch": 0.59, "learning_rate": 2.0454315579473836e-05, "loss": 2.2901, "step": 338850 }, { "epoch": 0.59, "learning_rate": 2.045344363954701e-05, "loss": 2.3508, "step": 338860 }, { "epoch": 0.59, "learning_rate": 2.0452571699620184e-05, "loss": 2.2939, "step": 338870 }, { "epoch": 0.59, "learning_rate": 2.0451699759693357e-05, "loss": 2.2642, "step": 338880 }, { "epoch": 0.59, "learning_rate": 2.045082781976653e-05, "loss": 2.415, "step": 338890 }, { "epoch": 0.59, "learning_rate": 2.04499558798397e-05, "loss": 2.4415, "step": 338900 }, { "epoch": 0.59, "learning_rate": 2.044908393991288e-05, "loss": 2.3275, "step": 338910 }, { "epoch": 0.59, "learning_rate": 2.044821199998605e-05, "loss": 2.44, "step": 338920 }, { "epoch": 0.59, "learning_rate": 2.0447340060059223e-05, "loss": 2.2695, "step": 338930 }, { "epoch": 0.59, "learning_rate": 2.0446468120132397e-05, "loss": 2.31, "step": 338940 }, { "epoch": 0.59, "learning_rate": 2.044559618020557e-05, "loss": 2.2762, "step": 338950 }, { "epoch": 0.59, "learning_rate": 2.0444724240278744e-05, "loss": 2.2724, "step": 338960 }, { "epoch": 0.59, "learning_rate": 2.0443852300351914e-05, "loss": 2.213, "step": 338970 }, { "epoch": 0.59, "learning_rate": 2.044298036042509e-05, "loss": 2.3357, "step": 338980 }, { "epoch": 0.59, "learning_rate": 2.0442108420498262e-05, "loss": 2.3008, "step": 338990 }, { "epoch": 0.59, "learning_rate": 2.0441236480571436e-05, "loss": 2.3261, "step": 339000 }, { "epoch": 0.59, "learning_rate": 2.0440364540644606e-05, "loss": 2.3434, "step": 339010 }, { "epoch": 0.59, "learning_rate": 2.0439492600717783e-05, "loss": 2.3712, "step": 339020 }, { "epoch": 0.59, "learning_rate": 2.0438620660790954e-05, "loss": 2.3729, "step": 339030 }, { "epoch": 0.59, "learning_rate": 2.0437748720864127e-05, "loss": 2.256, "step": 339040 }, { "epoch": 0.59, "learning_rate": 2.04368767809373e-05, "loss": 2.3348, "step": 339050 }, { "epoch": 0.59, "learning_rate": 2.0436004841010475e-05, "loss": 2.2632, "step": 339060 }, { "epoch": 0.59, "learning_rate": 2.043513290108365e-05, "loss": 2.3108, "step": 339070 }, { "epoch": 0.59, "learning_rate": 2.043426096115682e-05, "loss": 2.3164, "step": 339080 }, { "epoch": 0.59, "learning_rate": 2.0433389021229996e-05, "loss": 2.2914, "step": 339090 }, { "epoch": 0.59, "learning_rate": 2.0432517081303167e-05, "loss": 2.3507, "step": 339100 }, { "epoch": 0.59, "learning_rate": 2.043164514137634e-05, "loss": 2.3544, "step": 339110 }, { "epoch": 0.59, "learning_rate": 2.0430773201449514e-05, "loss": 2.4576, "step": 339120 }, { "epoch": 0.59, "learning_rate": 2.0429901261522688e-05, "loss": 2.4279, "step": 339130 }, { "epoch": 0.59, "learning_rate": 2.0429029321595862e-05, "loss": 2.3724, "step": 339140 }, { "epoch": 0.59, "learning_rate": 2.0428157381669032e-05, "loss": 2.2057, "step": 339150 }, { "epoch": 0.59, "learning_rate": 2.0427285441742206e-05, "loss": 2.3318, "step": 339160 }, { "epoch": 0.59, "learning_rate": 2.042641350181538e-05, "loss": 2.2895, "step": 339170 }, { "epoch": 0.59, "learning_rate": 2.0425541561888553e-05, "loss": 2.2591, "step": 339180 }, { "epoch": 0.59, "learning_rate": 2.0424669621961727e-05, "loss": 2.2749, "step": 339190 }, { "epoch": 0.59, "learning_rate": 2.04237976820349e-05, "loss": 2.2973, "step": 339200 }, { "epoch": 0.59, "learning_rate": 2.0422925742108075e-05, "loss": 2.3241, "step": 339210 }, { "epoch": 0.59, "learning_rate": 2.0422053802181245e-05, "loss": 2.3587, "step": 339220 }, { "epoch": 0.59, "learning_rate": 2.042118186225442e-05, "loss": 2.2497, "step": 339230 }, { "epoch": 0.59, "learning_rate": 2.0420309922327593e-05, "loss": 2.4041, "step": 339240 }, { "epoch": 0.59, "learning_rate": 2.0419437982400766e-05, "loss": 2.3722, "step": 339250 }, { "epoch": 0.59, "learning_rate": 2.0418566042473937e-05, "loss": 2.3612, "step": 339260 }, { "epoch": 0.59, "learning_rate": 2.041769410254711e-05, "loss": 2.3076, "step": 339270 }, { "epoch": 0.59, "learning_rate": 2.0416822162620284e-05, "loss": 2.3588, "step": 339280 }, { "epoch": 0.59, "learning_rate": 2.0415950222693458e-05, "loss": 2.2479, "step": 339290 }, { "epoch": 0.59, "learning_rate": 2.0415078282766632e-05, "loss": 2.3164, "step": 339300 }, { "epoch": 0.59, "learning_rate": 2.0414206342839802e-05, "loss": 2.2951, "step": 339310 }, { "epoch": 0.59, "learning_rate": 2.041333440291298e-05, "loss": 2.3763, "step": 339320 }, { "epoch": 0.59, "learning_rate": 2.041246246298615e-05, "loss": 2.234, "step": 339330 }, { "epoch": 0.59, "learning_rate": 2.0411590523059324e-05, "loss": 2.4055, "step": 339340 }, { "epoch": 0.59, "learning_rate": 2.0410718583132497e-05, "loss": 2.3094, "step": 339350 }, { "epoch": 0.59, "learning_rate": 2.040984664320567e-05, "loss": 2.2468, "step": 339360 }, { "epoch": 0.59, "learning_rate": 2.0408974703278845e-05, "loss": 2.3615, "step": 339370 }, { "epoch": 0.59, "learning_rate": 2.0408102763352015e-05, "loss": 2.2735, "step": 339380 }, { "epoch": 0.59, "learning_rate": 2.0407230823425192e-05, "loss": 2.2967, "step": 339390 }, { "epoch": 0.59, "learning_rate": 2.0406358883498363e-05, "loss": 2.3387, "step": 339400 }, { "epoch": 0.59, "learning_rate": 2.0405486943571537e-05, "loss": 2.3157, "step": 339410 }, { "epoch": 0.59, "learning_rate": 2.0404615003644707e-05, "loss": 2.3679, "step": 339420 }, { "epoch": 0.59, "learning_rate": 2.0403743063717884e-05, "loss": 2.2553, "step": 339430 }, { "epoch": 0.59, "learning_rate": 2.0402871123791058e-05, "loss": 2.4064, "step": 339440 }, { "epoch": 0.59, "learning_rate": 2.040199918386423e-05, "loss": 2.2975, "step": 339450 }, { "epoch": 0.59, "learning_rate": 2.0401127243937405e-05, "loss": 2.1787, "step": 339460 }, { "epoch": 0.59, "learning_rate": 2.0400255304010576e-05, "loss": 2.3414, "step": 339470 }, { "epoch": 0.59, "learning_rate": 2.039938336408375e-05, "loss": 2.3802, "step": 339480 }, { "epoch": 0.59, "learning_rate": 2.039851142415692e-05, "loss": 2.3936, "step": 339490 }, { "epoch": 0.59, "learning_rate": 2.0397639484230097e-05, "loss": 2.3279, "step": 339500 }, { "epoch": 0.59, "learning_rate": 2.0396767544303268e-05, "loss": 2.3667, "step": 339510 }, { "epoch": 0.59, "learning_rate": 2.039589560437644e-05, "loss": 2.3414, "step": 339520 }, { "epoch": 0.59, "learning_rate": 2.0395023664449615e-05, "loss": 2.2646, "step": 339530 }, { "epoch": 0.59, "learning_rate": 2.039415172452279e-05, "loss": 2.3582, "step": 339540 }, { "epoch": 0.59, "learning_rate": 2.0393279784595963e-05, "loss": 2.2752, "step": 339550 }, { "epoch": 0.59, "learning_rate": 2.0392407844669133e-05, "loss": 2.2626, "step": 339560 }, { "epoch": 0.59, "learning_rate": 2.0391535904742307e-05, "loss": 2.391, "step": 339570 }, { "epoch": 0.59, "learning_rate": 2.039066396481548e-05, "loss": 2.3213, "step": 339580 }, { "epoch": 0.59, "learning_rate": 2.0389792024888654e-05, "loss": 2.3387, "step": 339590 }, { "epoch": 0.59, "learning_rate": 2.0388920084961828e-05, "loss": 2.3302, "step": 339600 }, { "epoch": 0.59, "learning_rate": 2.0388048145035002e-05, "loss": 2.3337, "step": 339610 }, { "epoch": 0.59, "learning_rate": 2.0387176205108176e-05, "loss": 2.2835, "step": 339620 }, { "epoch": 0.59, "learning_rate": 2.0386304265181346e-05, "loss": 2.1967, "step": 339630 }, { "epoch": 0.59, "learning_rate": 2.038543232525452e-05, "loss": 2.2777, "step": 339640 }, { "epoch": 0.59, "learning_rate": 2.0384560385327694e-05, "loss": 2.2413, "step": 339650 }, { "epoch": 0.59, "learning_rate": 2.0383688445400867e-05, "loss": 2.3268, "step": 339660 }, { "epoch": 0.59, "learning_rate": 2.038281650547404e-05, "loss": 2.3581, "step": 339670 }, { "epoch": 0.59, "learning_rate": 2.038194456554721e-05, "loss": 2.2764, "step": 339680 }, { "epoch": 0.59, "learning_rate": 2.038107262562039e-05, "loss": 2.2702, "step": 339690 }, { "epoch": 0.59, "learning_rate": 2.038020068569356e-05, "loss": 2.4018, "step": 339700 }, { "epoch": 0.59, "learning_rate": 2.0379328745766733e-05, "loss": 2.5041, "step": 339710 }, { "epoch": 0.59, "learning_rate": 2.0378456805839903e-05, "loss": 2.3337, "step": 339720 }, { "epoch": 0.59, "learning_rate": 2.037758486591308e-05, "loss": 2.352, "step": 339730 }, { "epoch": 0.59, "learning_rate": 2.037671292598625e-05, "loss": 2.3072, "step": 339740 }, { "epoch": 0.59, "learning_rate": 2.0375840986059424e-05, "loss": 2.3939, "step": 339750 }, { "epoch": 0.59, "learning_rate": 2.0374969046132598e-05, "loss": 2.437, "step": 339760 }, { "epoch": 0.59, "learning_rate": 2.0374097106205772e-05, "loss": 2.1852, "step": 339770 }, { "epoch": 0.59, "learning_rate": 2.0373225166278946e-05, "loss": 2.332, "step": 339780 }, { "epoch": 0.59, "learning_rate": 2.0372353226352116e-05, "loss": 2.4255, "step": 339790 }, { "epoch": 0.59, "learning_rate": 2.0371481286425293e-05, "loss": 2.2389, "step": 339800 }, { "epoch": 0.59, "learning_rate": 2.0370609346498464e-05, "loss": 2.3441, "step": 339810 }, { "epoch": 0.59, "learning_rate": 2.0369737406571637e-05, "loss": 2.3938, "step": 339820 }, { "epoch": 0.59, "learning_rate": 2.036886546664481e-05, "loss": 2.2237, "step": 339830 }, { "epoch": 0.59, "learning_rate": 2.0367993526717985e-05, "loss": 2.4547, "step": 339840 }, { "epoch": 0.59, "learning_rate": 2.036712158679116e-05, "loss": 2.2844, "step": 339850 }, { "epoch": 0.59, "learning_rate": 2.036624964686433e-05, "loss": 2.3893, "step": 339860 }, { "epoch": 0.59, "learning_rate": 2.0365377706937506e-05, "loss": 2.3341, "step": 339870 }, { "epoch": 0.59, "learning_rate": 2.0364505767010677e-05, "loss": 2.2876, "step": 339880 }, { "epoch": 0.59, "learning_rate": 2.036363382708385e-05, "loss": 2.4237, "step": 339890 }, { "epoch": 0.59, "learning_rate": 2.036276188715702e-05, "loss": 2.3294, "step": 339900 }, { "epoch": 0.59, "learning_rate": 2.0361889947230198e-05, "loss": 2.3996, "step": 339910 }, { "epoch": 0.59, "learning_rate": 2.0361018007303372e-05, "loss": 2.3233, "step": 339920 }, { "epoch": 0.59, "learning_rate": 2.0360146067376542e-05, "loss": 2.3802, "step": 339930 }, { "epoch": 0.59, "learning_rate": 2.0359274127449716e-05, "loss": 2.3315, "step": 339940 }, { "epoch": 0.59, "learning_rate": 2.035840218752289e-05, "loss": 2.4106, "step": 339950 }, { "epoch": 0.59, "learning_rate": 2.0357530247596063e-05, "loss": 2.3374, "step": 339960 }, { "epoch": 0.59, "learning_rate": 2.0356658307669234e-05, "loss": 2.3202, "step": 339970 }, { "epoch": 0.59, "learning_rate": 2.0355786367742408e-05, "loss": 2.3638, "step": 339980 }, { "epoch": 0.59, "learning_rate": 2.035491442781558e-05, "loss": 2.33, "step": 339990 }, { "epoch": 0.59, "learning_rate": 2.0354042487888755e-05, "loss": 2.226, "step": 340000 }, { "epoch": 0.59, "learning_rate": 2.035317054796193e-05, "loss": 2.2696, "step": 340010 }, { "epoch": 0.59, "learning_rate": 2.0352298608035103e-05, "loss": 2.3564, "step": 340020 }, { "epoch": 0.59, "learning_rate": 2.0351426668108276e-05, "loss": 2.3542, "step": 340030 }, { "epoch": 0.59, "learning_rate": 2.0350554728181447e-05, "loss": 2.312, "step": 340040 }, { "epoch": 0.59, "learning_rate": 2.034968278825462e-05, "loss": 2.4018, "step": 340050 }, { "epoch": 0.59, "learning_rate": 2.0348810848327794e-05, "loss": 2.3373, "step": 340060 }, { "epoch": 0.59, "learning_rate": 2.0347938908400968e-05, "loss": 2.3603, "step": 340070 }, { "epoch": 0.59, "learning_rate": 2.0347066968474142e-05, "loss": 2.3865, "step": 340080 }, { "epoch": 0.59, "learning_rate": 2.0346195028547312e-05, "loss": 2.3306, "step": 340090 }, { "epoch": 0.59, "learning_rate": 2.034532308862049e-05, "loss": 2.3649, "step": 340100 }, { "epoch": 0.59, "learning_rate": 2.034445114869366e-05, "loss": 2.3298, "step": 340110 }, { "epoch": 0.59, "learning_rate": 2.0343579208766834e-05, "loss": 2.3441, "step": 340120 }, { "epoch": 0.59, "learning_rate": 2.0342707268840007e-05, "loss": 2.3679, "step": 340130 }, { "epoch": 0.59, "learning_rate": 2.034183532891318e-05, "loss": 2.3158, "step": 340140 }, { "epoch": 0.59, "learning_rate": 2.034096338898635e-05, "loss": 2.3952, "step": 340150 }, { "epoch": 0.59, "learning_rate": 2.0340091449059525e-05, "loss": 2.3664, "step": 340160 }, { "epoch": 0.59, "learning_rate": 2.0339219509132702e-05, "loss": 2.3641, "step": 340170 }, { "epoch": 0.59, "learning_rate": 2.0338347569205873e-05, "loss": 2.4024, "step": 340180 }, { "epoch": 0.59, "learning_rate": 2.0337475629279047e-05, "loss": 2.2719, "step": 340190 }, { "epoch": 0.59, "learning_rate": 2.0336603689352217e-05, "loss": 2.3343, "step": 340200 }, { "epoch": 0.59, "learning_rate": 2.0335731749425394e-05, "loss": 2.2099, "step": 340210 }, { "epoch": 0.59, "learning_rate": 2.0334859809498565e-05, "loss": 2.3492, "step": 340220 }, { "epoch": 0.59, "learning_rate": 2.033398786957174e-05, "loss": 2.346, "step": 340230 }, { "epoch": 0.59, "learning_rate": 2.0333115929644912e-05, "loss": 2.4019, "step": 340240 }, { "epoch": 0.59, "learning_rate": 2.0332243989718086e-05, "loss": 2.3093, "step": 340250 }, { "epoch": 0.59, "learning_rate": 2.033137204979126e-05, "loss": 2.3151, "step": 340260 }, { "epoch": 0.59, "learning_rate": 2.033050010986443e-05, "loss": 2.4479, "step": 340270 }, { "epoch": 0.59, "learning_rate": 2.0329628169937607e-05, "loss": 2.3687, "step": 340280 }, { "epoch": 0.59, "learning_rate": 2.0328756230010778e-05, "loss": 2.3479, "step": 340290 }, { "epoch": 0.59, "learning_rate": 2.032788429008395e-05, "loss": 2.3746, "step": 340300 }, { "epoch": 0.59, "learning_rate": 2.0327012350157125e-05, "loss": 2.3154, "step": 340310 }, { "epoch": 0.59, "learning_rate": 2.03261404102303e-05, "loss": 2.4012, "step": 340320 }, { "epoch": 0.59, "learning_rate": 2.0325268470303473e-05, "loss": 2.3542, "step": 340330 }, { "epoch": 0.59, "learning_rate": 2.0324396530376643e-05, "loss": 2.2898, "step": 340340 }, { "epoch": 0.59, "learning_rate": 2.0323524590449817e-05, "loss": 2.3583, "step": 340350 }, { "epoch": 0.59, "learning_rate": 2.032265265052299e-05, "loss": 2.4033, "step": 340360 }, { "epoch": 0.59, "learning_rate": 2.0321780710596164e-05, "loss": 2.4297, "step": 340370 }, { "epoch": 0.59, "learning_rate": 2.0320908770669335e-05, "loss": 2.2352, "step": 340380 }, { "epoch": 0.59, "learning_rate": 2.0320036830742512e-05, "loss": 2.381, "step": 340390 }, { "epoch": 0.59, "learning_rate": 2.0319164890815686e-05, "loss": 2.3732, "step": 340400 }, { "epoch": 0.59, "learning_rate": 2.0318292950888856e-05, "loss": 2.3483, "step": 340410 }, { "epoch": 0.59, "learning_rate": 2.031742101096203e-05, "loss": 2.3245, "step": 340420 }, { "epoch": 0.59, "learning_rate": 2.0316549071035204e-05, "loss": 2.4802, "step": 340430 }, { "epoch": 0.59, "learning_rate": 2.0315677131108377e-05, "loss": 2.3697, "step": 340440 }, { "epoch": 0.59, "learning_rate": 2.0314805191181548e-05, "loss": 2.2758, "step": 340450 }, { "epoch": 0.59, "learning_rate": 2.031393325125472e-05, "loss": 2.3291, "step": 340460 }, { "epoch": 0.59, "learning_rate": 2.0313061311327895e-05, "loss": 2.2362, "step": 340470 }, { "epoch": 0.59, "learning_rate": 2.031218937140107e-05, "loss": 2.39, "step": 340480 }, { "epoch": 0.59, "learning_rate": 2.0311317431474243e-05, "loss": 2.2683, "step": 340490 }, { "epoch": 0.59, "learning_rate": 2.0310445491547413e-05, "loss": 2.3664, "step": 340500 }, { "epoch": 0.59, "learning_rate": 2.030957355162059e-05, "loss": 2.3911, "step": 340510 }, { "epoch": 0.59, "learning_rate": 2.030870161169376e-05, "loss": 2.2157, "step": 340520 }, { "epoch": 0.59, "learning_rate": 2.0307829671766934e-05, "loss": 2.4022, "step": 340530 }, { "epoch": 0.59, "learning_rate": 2.0306957731840108e-05, "loss": 2.2833, "step": 340540 }, { "epoch": 0.59, "learning_rate": 2.0306085791913282e-05, "loss": 2.3323, "step": 340550 }, { "epoch": 0.59, "learning_rate": 2.0305213851986456e-05, "loss": 2.2676, "step": 340560 }, { "epoch": 0.59, "learning_rate": 2.0304341912059626e-05, "loss": 2.3743, "step": 340570 }, { "epoch": 0.59, "learning_rate": 2.0303469972132803e-05, "loss": 2.3049, "step": 340580 }, { "epoch": 0.59, "learning_rate": 2.0302598032205974e-05, "loss": 2.3102, "step": 340590 }, { "epoch": 0.59, "learning_rate": 2.0301726092279147e-05, "loss": 2.4176, "step": 340600 }, { "epoch": 0.59, "learning_rate": 2.0300854152352318e-05, "loss": 2.4024, "step": 340610 }, { "epoch": 0.59, "learning_rate": 2.0299982212425495e-05, "loss": 2.4224, "step": 340620 }, { "epoch": 0.59, "learning_rate": 2.0299110272498665e-05, "loss": 2.46, "step": 340630 }, { "epoch": 0.59, "learning_rate": 2.029823833257184e-05, "loss": 2.3574, "step": 340640 }, { "epoch": 0.59, "learning_rate": 2.0297366392645013e-05, "loss": 2.1638, "step": 340650 }, { "epoch": 0.59, "learning_rate": 2.0296494452718187e-05, "loss": 2.1449, "step": 340660 }, { "epoch": 0.59, "learning_rate": 2.029562251279136e-05, "loss": 2.3072, "step": 340670 }, { "epoch": 0.59, "learning_rate": 2.029475057286453e-05, "loss": 2.2714, "step": 340680 }, { "epoch": 0.59, "learning_rate": 2.0293878632937708e-05, "loss": 2.3977, "step": 340690 }, { "epoch": 0.59, "learning_rate": 2.029300669301088e-05, "loss": 2.2088, "step": 340700 }, { "epoch": 0.59, "learning_rate": 2.0292134753084052e-05, "loss": 2.376, "step": 340710 }, { "epoch": 0.59, "learning_rate": 2.0291262813157226e-05, "loss": 2.2381, "step": 340720 }, { "epoch": 0.59, "learning_rate": 2.02903908732304e-05, "loss": 2.329, "step": 340730 }, { "epoch": 0.59, "learning_rate": 2.0289518933303573e-05, "loss": 2.3243, "step": 340740 }, { "epoch": 0.59, "learning_rate": 2.0288646993376744e-05, "loss": 2.3403, "step": 340750 }, { "epoch": 0.59, "learning_rate": 2.0287775053449918e-05, "loss": 2.409, "step": 340760 }, { "epoch": 0.59, "learning_rate": 2.028690311352309e-05, "loss": 2.3717, "step": 340770 }, { "epoch": 0.59, "learning_rate": 2.0286031173596265e-05, "loss": 2.4473, "step": 340780 }, { "epoch": 0.59, "learning_rate": 2.028515923366944e-05, "loss": 2.281, "step": 340790 }, { "epoch": 0.59, "learning_rate": 2.0284287293742613e-05, "loss": 2.3212, "step": 340800 }, { "epoch": 0.59, "learning_rate": 2.0283415353815786e-05, "loss": 2.3251, "step": 340810 }, { "epoch": 0.59, "learning_rate": 2.0282543413888957e-05, "loss": 2.2641, "step": 340820 }, { "epoch": 0.59, "learning_rate": 2.028167147396213e-05, "loss": 2.3501, "step": 340830 }, { "epoch": 0.59, "learning_rate": 2.0280799534035304e-05, "loss": 2.3269, "step": 340840 }, { "epoch": 0.59, "learning_rate": 2.0279927594108478e-05, "loss": 2.2934, "step": 340850 }, { "epoch": 0.59, "learning_rate": 2.027905565418165e-05, "loss": 2.3227, "step": 340860 }, { "epoch": 0.59, "learning_rate": 2.0278183714254822e-05, "loss": 2.2563, "step": 340870 }, { "epoch": 0.59, "learning_rate": 2.0277311774327996e-05, "loss": 2.4297, "step": 340880 }, { "epoch": 0.59, "learning_rate": 2.027643983440117e-05, "loss": 2.3938, "step": 340890 }, { "epoch": 0.59, "learning_rate": 2.0275567894474344e-05, "loss": 2.3356, "step": 340900 }, { "epoch": 0.59, "learning_rate": 2.0274695954547514e-05, "loss": 2.2166, "step": 340910 }, { "epoch": 0.59, "learning_rate": 2.027382401462069e-05, "loss": 2.3034, "step": 340920 }, { "epoch": 0.59, "learning_rate": 2.027295207469386e-05, "loss": 2.4524, "step": 340930 }, { "epoch": 0.59, "learning_rate": 2.0272080134767035e-05, "loss": 2.1824, "step": 340940 }, { "epoch": 0.59, "learning_rate": 2.027120819484021e-05, "loss": 2.3341, "step": 340950 }, { "epoch": 0.59, "learning_rate": 2.0270336254913383e-05, "loss": 2.3364, "step": 340960 }, { "epoch": 0.59, "learning_rate": 2.0269464314986557e-05, "loss": 2.3534, "step": 340970 }, { "epoch": 0.59, "learning_rate": 2.0268592375059727e-05, "loss": 2.2773, "step": 340980 }, { "epoch": 0.59, "learning_rate": 2.0267720435132904e-05, "loss": 2.3409, "step": 340990 }, { "epoch": 0.59, "learning_rate": 2.0266848495206075e-05, "loss": 2.4168, "step": 341000 }, { "epoch": 0.59, "learning_rate": 2.026597655527925e-05, "loss": 2.2662, "step": 341010 }, { "epoch": 0.59, "learning_rate": 2.0265104615352422e-05, "loss": 2.2911, "step": 341020 }, { "epoch": 0.59, "learning_rate": 2.0264232675425596e-05, "loss": 2.3844, "step": 341030 }, { "epoch": 0.59, "learning_rate": 2.026336073549877e-05, "loss": 2.3672, "step": 341040 }, { "epoch": 0.59, "learning_rate": 2.026248879557194e-05, "loss": 2.2314, "step": 341050 }, { "epoch": 0.59, "learning_rate": 2.0261616855645117e-05, "loss": 2.2959, "step": 341060 }, { "epoch": 0.59, "learning_rate": 2.0260744915718288e-05, "loss": 2.4241, "step": 341070 }, { "epoch": 0.59, "learning_rate": 2.025987297579146e-05, "loss": 2.2399, "step": 341080 }, { "epoch": 0.59, "learning_rate": 2.0259001035864632e-05, "loss": 2.2942, "step": 341090 }, { "epoch": 0.59, "learning_rate": 2.025812909593781e-05, "loss": 2.354, "step": 341100 }, { "epoch": 0.59, "learning_rate": 2.025725715601098e-05, "loss": 2.362, "step": 341110 }, { "epoch": 0.59, "learning_rate": 2.0256385216084153e-05, "loss": 2.4763, "step": 341120 }, { "epoch": 0.59, "learning_rate": 2.0255513276157327e-05, "loss": 2.3644, "step": 341130 }, { "epoch": 0.59, "learning_rate": 2.02546413362305e-05, "loss": 2.3196, "step": 341140 }, { "epoch": 0.59, "learning_rate": 2.0253769396303674e-05, "loss": 2.2732, "step": 341150 }, { "epoch": 0.59, "learning_rate": 2.0252897456376845e-05, "loss": 2.4085, "step": 341160 }, { "epoch": 0.59, "learning_rate": 2.025202551645002e-05, "loss": 2.3187, "step": 341170 }, { "epoch": 0.59, "learning_rate": 2.0251153576523192e-05, "loss": 2.4741, "step": 341180 }, { "epoch": 0.59, "learning_rate": 2.0250281636596366e-05, "loss": 2.3462, "step": 341190 }, { "epoch": 0.6, "learning_rate": 2.024940969666954e-05, "loss": 2.3962, "step": 341200 }, { "epoch": 0.6, "learning_rate": 2.0248537756742714e-05, "loss": 2.2428, "step": 341210 }, { "epoch": 0.6, "learning_rate": 2.0247665816815887e-05, "loss": 2.3064, "step": 341220 }, { "epoch": 0.6, "learning_rate": 2.0246793876889058e-05, "loss": 2.3295, "step": 341230 }, { "epoch": 0.6, "learning_rate": 2.024592193696223e-05, "loss": 2.3817, "step": 341240 }, { "epoch": 0.6, "learning_rate": 2.0245049997035405e-05, "loss": 2.2351, "step": 341250 }, { "epoch": 0.6, "learning_rate": 2.024417805710858e-05, "loss": 2.4373, "step": 341260 }, { "epoch": 0.6, "learning_rate": 2.0243306117181753e-05, "loss": 2.419, "step": 341270 }, { "epoch": 0.6, "learning_rate": 2.0242434177254923e-05, "loss": 2.3316, "step": 341280 }, { "epoch": 0.6, "learning_rate": 2.02415622373281e-05, "loss": 2.3897, "step": 341290 }, { "epoch": 0.6, "learning_rate": 2.024069029740127e-05, "loss": 2.2845, "step": 341300 }, { "epoch": 0.6, "learning_rate": 2.0239818357474444e-05, "loss": 2.2769, "step": 341310 }, { "epoch": 0.6, "learning_rate": 2.0238946417547615e-05, "loss": 2.2532, "step": 341320 }, { "epoch": 0.6, "learning_rate": 2.0238074477620792e-05, "loss": 2.3457, "step": 341330 }, { "epoch": 0.6, "learning_rate": 2.0237202537693962e-05, "loss": 2.3121, "step": 341340 }, { "epoch": 0.6, "learning_rate": 2.0236330597767136e-05, "loss": 2.3389, "step": 341350 }, { "epoch": 0.6, "learning_rate": 2.023545865784031e-05, "loss": 2.2323, "step": 341360 }, { "epoch": 0.6, "learning_rate": 2.0234586717913484e-05, "loss": 2.4013, "step": 341370 }, { "epoch": 0.6, "learning_rate": 2.0233714777986657e-05, "loss": 2.362, "step": 341380 }, { "epoch": 0.6, "learning_rate": 2.0232842838059828e-05, "loss": 2.4031, "step": 341390 }, { "epoch": 0.6, "learning_rate": 2.0231970898133005e-05, "loss": 2.4226, "step": 341400 }, { "epoch": 0.6, "learning_rate": 2.0231098958206175e-05, "loss": 2.4111, "step": 341410 }, { "epoch": 0.6, "learning_rate": 2.023022701827935e-05, "loss": 2.3214, "step": 341420 }, { "epoch": 0.6, "learning_rate": 2.0229355078352523e-05, "loss": 2.3117, "step": 341430 }, { "epoch": 0.6, "learning_rate": 2.0228483138425697e-05, "loss": 2.3681, "step": 341440 }, { "epoch": 0.6, "learning_rate": 2.022761119849887e-05, "loss": 2.3072, "step": 341450 }, { "epoch": 0.6, "learning_rate": 2.022673925857204e-05, "loss": 2.3864, "step": 341460 }, { "epoch": 0.6, "learning_rate": 2.0225867318645218e-05, "loss": 2.4446, "step": 341470 }, { "epoch": 0.6, "learning_rate": 2.022499537871839e-05, "loss": 2.3723, "step": 341480 }, { "epoch": 0.6, "learning_rate": 2.0224123438791562e-05, "loss": 2.2936, "step": 341490 }, { "epoch": 0.6, "learning_rate": 2.0223251498864733e-05, "loss": 2.367, "step": 341500 }, { "epoch": 0.6, "learning_rate": 2.022237955893791e-05, "loss": 2.4904, "step": 341510 }, { "epoch": 0.6, "learning_rate": 2.0221507619011083e-05, "loss": 2.4098, "step": 341520 }, { "epoch": 0.6, "learning_rate": 2.0220635679084254e-05, "loss": 2.2596, "step": 341530 }, { "epoch": 0.6, "learning_rate": 2.0219763739157428e-05, "loss": 2.3812, "step": 341540 }, { "epoch": 0.6, "learning_rate": 2.02188917992306e-05, "loss": 2.2104, "step": 341550 }, { "epoch": 0.6, "learning_rate": 2.0218019859303775e-05, "loss": 2.4331, "step": 341560 }, { "epoch": 0.6, "learning_rate": 2.0217147919376946e-05, "loss": 2.2506, "step": 341570 }, { "epoch": 0.6, "learning_rate": 2.021627597945012e-05, "loss": 2.1874, "step": 341580 }, { "epoch": 0.6, "learning_rate": 2.0215404039523293e-05, "loss": 2.4036, "step": 341590 }, { "epoch": 0.6, "learning_rate": 2.0214532099596467e-05, "loss": 2.3196, "step": 341600 }, { "epoch": 0.6, "learning_rate": 2.021366015966964e-05, "loss": 2.3365, "step": 341610 }, { "epoch": 0.6, "learning_rate": 2.0212788219742814e-05, "loss": 2.2703, "step": 341620 }, { "epoch": 0.6, "learning_rate": 2.0211916279815988e-05, "loss": 2.3809, "step": 341630 }, { "epoch": 0.6, "learning_rate": 2.021104433988916e-05, "loss": 2.2975, "step": 341640 }, { "epoch": 0.6, "learning_rate": 2.0210172399962332e-05, "loss": 2.339, "step": 341650 }, { "epoch": 0.6, "learning_rate": 2.0209300460035506e-05, "loss": 2.2633, "step": 341660 }, { "epoch": 0.6, "learning_rate": 2.020842852010868e-05, "loss": 2.4616, "step": 341670 }, { "epoch": 0.6, "learning_rate": 2.0207556580181854e-05, "loss": 2.3123, "step": 341680 }, { "epoch": 0.6, "learning_rate": 2.0206684640255024e-05, "loss": 2.2788, "step": 341690 }, { "epoch": 0.6, "learning_rate": 2.02058127003282e-05, "loss": 2.3903, "step": 341700 }, { "epoch": 0.6, "learning_rate": 2.020494076040137e-05, "loss": 2.2938, "step": 341710 }, { "epoch": 0.6, "learning_rate": 2.0204068820474545e-05, "loss": 2.3046, "step": 341720 }, { "epoch": 0.6, "learning_rate": 2.020319688054772e-05, "loss": 2.4048, "step": 341730 }, { "epoch": 0.6, "learning_rate": 2.0202324940620893e-05, "loss": 2.2989, "step": 341740 }, { "epoch": 0.6, "learning_rate": 2.0201453000694067e-05, "loss": 2.3019, "step": 341750 }, { "epoch": 0.6, "learning_rate": 2.0200581060767237e-05, "loss": 2.4324, "step": 341760 }, { "epoch": 0.6, "learning_rate": 2.0199709120840414e-05, "loss": 2.331, "step": 341770 }, { "epoch": 0.6, "learning_rate": 2.0198837180913585e-05, "loss": 2.364, "step": 341780 }, { "epoch": 0.6, "learning_rate": 2.019796524098676e-05, "loss": 2.2464, "step": 341790 }, { "epoch": 0.6, "learning_rate": 2.019709330105993e-05, "loss": 2.453, "step": 341800 }, { "epoch": 0.6, "learning_rate": 2.0196221361133106e-05, "loss": 2.15, "step": 341810 }, { "epoch": 0.6, "learning_rate": 2.0195349421206276e-05, "loss": 2.4129, "step": 341820 }, { "epoch": 0.6, "learning_rate": 2.019447748127945e-05, "loss": 2.4066, "step": 341830 }, { "epoch": 0.6, "learning_rate": 2.0193605541352624e-05, "loss": 2.3199, "step": 341840 }, { "epoch": 0.6, "learning_rate": 2.0192733601425798e-05, "loss": 2.3768, "step": 341850 }, { "epoch": 0.6, "learning_rate": 2.019186166149897e-05, "loss": 2.4509, "step": 341860 }, { "epoch": 0.6, "learning_rate": 2.0190989721572142e-05, "loss": 2.3836, "step": 341870 }, { "epoch": 0.6, "learning_rate": 2.019011778164532e-05, "loss": 2.3596, "step": 341880 }, { "epoch": 0.6, "learning_rate": 2.018924584171849e-05, "loss": 2.4171, "step": 341890 }, { "epoch": 0.6, "learning_rate": 2.0188373901791663e-05, "loss": 2.3508, "step": 341900 }, { "epoch": 0.6, "learning_rate": 2.0187501961864837e-05, "loss": 2.363, "step": 341910 }, { "epoch": 0.6, "learning_rate": 2.018663002193801e-05, "loss": 2.3006, "step": 341920 }, { "epoch": 0.6, "learning_rate": 2.0185758082011184e-05, "loss": 2.2818, "step": 341930 }, { "epoch": 0.6, "learning_rate": 2.0184886142084355e-05, "loss": 2.3261, "step": 341940 }, { "epoch": 0.6, "learning_rate": 2.018401420215753e-05, "loss": 2.2891, "step": 341950 }, { "epoch": 0.6, "learning_rate": 2.0183142262230702e-05, "loss": 2.2543, "step": 341960 }, { "epoch": 0.6, "learning_rate": 2.0182270322303876e-05, "loss": 2.3567, "step": 341970 }, { "epoch": 0.6, "learning_rate": 2.0181398382377046e-05, "loss": 2.3505, "step": 341980 }, { "epoch": 0.6, "learning_rate": 2.0180526442450224e-05, "loss": 2.4119, "step": 341990 }, { "epoch": 0.6, "learning_rate": 2.0179654502523397e-05, "loss": 2.285, "step": 342000 }, { "epoch": 0.6, "learning_rate": 2.0178782562596568e-05, "loss": 2.4141, "step": 342010 }, { "epoch": 0.6, "learning_rate": 2.017791062266974e-05, "loss": 2.4262, "step": 342020 }, { "epoch": 0.6, "learning_rate": 2.0177038682742915e-05, "loss": 2.2708, "step": 342030 }, { "epoch": 0.6, "learning_rate": 2.017616674281609e-05, "loss": 2.2642, "step": 342040 }, { "epoch": 0.6, "learning_rate": 2.017529480288926e-05, "loss": 2.3878, "step": 342050 }, { "epoch": 0.6, "learning_rate": 2.0174422862962433e-05, "loss": 2.3642, "step": 342060 }, { "epoch": 0.6, "learning_rate": 2.0173550923035607e-05, "loss": 2.4486, "step": 342070 }, { "epoch": 0.6, "learning_rate": 2.017267898310878e-05, "loss": 2.3096, "step": 342080 }, { "epoch": 0.6, "learning_rate": 2.0171807043181954e-05, "loss": 2.3251, "step": 342090 }, { "epoch": 0.6, "learning_rate": 2.0170935103255125e-05, "loss": 2.2763, "step": 342100 }, { "epoch": 0.6, "learning_rate": 2.0170063163328302e-05, "loss": 2.3938, "step": 342110 }, { "epoch": 0.6, "learning_rate": 2.0169191223401472e-05, "loss": 2.3371, "step": 342120 }, { "epoch": 0.6, "learning_rate": 2.0168319283474646e-05, "loss": 2.2956, "step": 342130 }, { "epoch": 0.6, "learning_rate": 2.016744734354782e-05, "loss": 2.3498, "step": 342140 }, { "epoch": 0.6, "learning_rate": 2.0166575403620994e-05, "loss": 2.2867, "step": 342150 }, { "epoch": 0.6, "learning_rate": 2.0165703463694168e-05, "loss": 2.4461, "step": 342160 }, { "epoch": 0.6, "learning_rate": 2.0164831523767338e-05, "loss": 2.3365, "step": 342170 }, { "epoch": 0.6, "learning_rate": 2.0163959583840515e-05, "loss": 2.1946, "step": 342180 }, { "epoch": 0.6, "learning_rate": 2.0163087643913685e-05, "loss": 2.274, "step": 342190 }, { "epoch": 0.6, "learning_rate": 2.016221570398686e-05, "loss": 2.3539, "step": 342200 }, { "epoch": 0.6, "learning_rate": 2.016134376406003e-05, "loss": 2.2947, "step": 342210 }, { "epoch": 0.6, "learning_rate": 2.0160471824133207e-05, "loss": 2.3915, "step": 342220 }, { "epoch": 0.6, "learning_rate": 2.0159599884206377e-05, "loss": 2.3783, "step": 342230 }, { "epoch": 0.6, "learning_rate": 2.015872794427955e-05, "loss": 2.3846, "step": 342240 }, { "epoch": 0.6, "learning_rate": 2.0157856004352725e-05, "loss": 2.2895, "step": 342250 }, { "epoch": 0.6, "learning_rate": 2.01569840644259e-05, "loss": 2.4236, "step": 342260 }, { "epoch": 0.6, "learning_rate": 2.0156112124499072e-05, "loss": 2.2792, "step": 342270 }, { "epoch": 0.6, "learning_rate": 2.0155240184572243e-05, "loss": 2.3271, "step": 342280 }, { "epoch": 0.6, "learning_rate": 2.015436824464542e-05, "loss": 2.3608, "step": 342290 }, { "epoch": 0.6, "learning_rate": 2.015349630471859e-05, "loss": 2.2926, "step": 342300 }, { "epoch": 0.6, "learning_rate": 2.0152624364791764e-05, "loss": 2.2997, "step": 342310 }, { "epoch": 0.6, "learning_rate": 2.0151752424864938e-05, "loss": 2.3187, "step": 342320 }, { "epoch": 0.6, "learning_rate": 2.015088048493811e-05, "loss": 2.3137, "step": 342330 }, { "epoch": 0.6, "learning_rate": 2.0150008545011285e-05, "loss": 2.3463, "step": 342340 }, { "epoch": 0.6, "learning_rate": 2.0149136605084456e-05, "loss": 2.2562, "step": 342350 }, { "epoch": 0.6, "learning_rate": 2.014826466515763e-05, "loss": 2.3086, "step": 342360 }, { "epoch": 0.6, "learning_rate": 2.0147392725230803e-05, "loss": 2.3224, "step": 342370 }, { "epoch": 0.6, "learning_rate": 2.0146520785303977e-05, "loss": 2.4098, "step": 342380 }, { "epoch": 0.6, "learning_rate": 2.014564884537715e-05, "loss": 2.2975, "step": 342390 }, { "epoch": 0.6, "learning_rate": 2.0144776905450324e-05, "loss": 2.2376, "step": 342400 }, { "epoch": 0.6, "learning_rate": 2.0143904965523498e-05, "loss": 2.3993, "step": 342410 }, { "epoch": 0.6, "learning_rate": 2.014303302559667e-05, "loss": 2.3279, "step": 342420 }, { "epoch": 0.6, "learning_rate": 2.0142161085669842e-05, "loss": 2.3601, "step": 342430 }, { "epoch": 0.6, "learning_rate": 2.0141289145743016e-05, "loss": 2.2915, "step": 342440 }, { "epoch": 0.6, "learning_rate": 2.014041720581619e-05, "loss": 2.3503, "step": 342450 }, { "epoch": 0.6, "learning_rate": 2.013954526588936e-05, "loss": 2.2395, "step": 342460 }, { "epoch": 0.6, "learning_rate": 2.0138673325962534e-05, "loss": 2.3125, "step": 342470 }, { "epoch": 0.6, "learning_rate": 2.013780138603571e-05, "loss": 2.353, "step": 342480 }, { "epoch": 0.6, "learning_rate": 2.013692944610888e-05, "loss": 2.3042, "step": 342490 }, { "epoch": 0.6, "learning_rate": 2.0136057506182055e-05, "loss": 2.294, "step": 342500 }, { "epoch": 0.6, "learning_rate": 2.0135185566255226e-05, "loss": 2.3391, "step": 342510 }, { "epoch": 0.6, "learning_rate": 2.0134313626328403e-05, "loss": 2.3149, "step": 342520 }, { "epoch": 0.6, "learning_rate": 2.0133441686401573e-05, "loss": 2.3181, "step": 342530 }, { "epoch": 0.6, "learning_rate": 2.0132569746474747e-05, "loss": 2.2821, "step": 342540 }, { "epoch": 0.6, "learning_rate": 2.013169780654792e-05, "loss": 2.4205, "step": 342550 }, { "epoch": 0.6, "learning_rate": 2.0130825866621095e-05, "loss": 2.3553, "step": 342560 }, { "epoch": 0.6, "learning_rate": 2.012995392669427e-05, "loss": 2.1639, "step": 342570 }, { "epoch": 0.6, "learning_rate": 2.012908198676744e-05, "loss": 2.2975, "step": 342580 }, { "epoch": 0.6, "learning_rate": 2.0128210046840616e-05, "loss": 2.3976, "step": 342590 }, { "epoch": 0.6, "learning_rate": 2.0127338106913786e-05, "loss": 2.3746, "step": 342600 }, { "epoch": 0.6, "learning_rate": 2.012646616698696e-05, "loss": 2.4175, "step": 342610 }, { "epoch": 0.6, "learning_rate": 2.0125594227060134e-05, "loss": 2.2743, "step": 342620 }, { "epoch": 0.6, "learning_rate": 2.0124722287133308e-05, "loss": 2.3048, "step": 342630 }, { "epoch": 0.6, "learning_rate": 2.012385034720648e-05, "loss": 2.3266, "step": 342640 }, { "epoch": 0.6, "learning_rate": 2.0122978407279652e-05, "loss": 2.3572, "step": 342650 }, { "epoch": 0.6, "learning_rate": 2.012210646735283e-05, "loss": 2.4742, "step": 342660 }, { "epoch": 0.6, "learning_rate": 2.0121234527426e-05, "loss": 2.2968, "step": 342670 }, { "epoch": 0.6, "learning_rate": 2.0120362587499173e-05, "loss": 2.2431, "step": 342680 }, { "epoch": 0.6, "learning_rate": 2.0119490647572343e-05, "loss": 2.4659, "step": 342690 }, { "epoch": 0.6, "learning_rate": 2.011861870764552e-05, "loss": 2.4039, "step": 342700 }, { "epoch": 0.6, "learning_rate": 2.011774676771869e-05, "loss": 2.2555, "step": 342710 }, { "epoch": 0.6, "learning_rate": 2.0116874827791865e-05, "loss": 2.4472, "step": 342720 }, { "epoch": 0.6, "learning_rate": 2.011600288786504e-05, "loss": 2.373, "step": 342730 }, { "epoch": 0.6, "learning_rate": 2.0115130947938212e-05, "loss": 2.3874, "step": 342740 }, { "epoch": 0.6, "learning_rate": 2.0114259008011386e-05, "loss": 2.1955, "step": 342750 }, { "epoch": 0.6, "learning_rate": 2.0113387068084556e-05, "loss": 2.2682, "step": 342760 }, { "epoch": 0.6, "learning_rate": 2.011251512815773e-05, "loss": 2.3188, "step": 342770 }, { "epoch": 0.6, "learning_rate": 2.0111643188230904e-05, "loss": 2.4105, "step": 342780 }, { "epoch": 0.6, "learning_rate": 2.0110771248304078e-05, "loss": 2.2887, "step": 342790 }, { "epoch": 0.6, "learning_rate": 2.010989930837725e-05, "loss": 2.2043, "step": 342800 }, { "epoch": 0.6, "learning_rate": 2.0109027368450425e-05, "loss": 2.354, "step": 342810 }, { "epoch": 0.6, "learning_rate": 2.01081554285236e-05, "loss": 2.4025, "step": 342820 }, { "epoch": 0.6, "learning_rate": 2.010728348859677e-05, "loss": 2.3237, "step": 342830 }, { "epoch": 0.6, "learning_rate": 2.0106411548669943e-05, "loss": 2.2479, "step": 342840 }, { "epoch": 0.6, "learning_rate": 2.0105539608743117e-05, "loss": 2.2897, "step": 342850 }, { "epoch": 0.6, "learning_rate": 2.010466766881629e-05, "loss": 2.4056, "step": 342860 }, { "epoch": 0.6, "learning_rate": 2.0103795728889465e-05, "loss": 2.3878, "step": 342870 }, { "epoch": 0.6, "learning_rate": 2.0102923788962635e-05, "loss": 2.4018, "step": 342880 }, { "epoch": 0.6, "learning_rate": 2.0102051849035812e-05, "loss": 2.4445, "step": 342890 }, { "epoch": 0.6, "learning_rate": 2.0101179909108982e-05, "loss": 2.266, "step": 342900 }, { "epoch": 0.6, "learning_rate": 2.0100307969182156e-05, "loss": 2.3186, "step": 342910 }, { "epoch": 0.6, "learning_rate": 2.009943602925533e-05, "loss": 2.2662, "step": 342920 }, { "epoch": 0.6, "learning_rate": 2.0098564089328504e-05, "loss": 2.4012, "step": 342930 }, { "epoch": 0.6, "learning_rate": 2.0097692149401674e-05, "loss": 2.2771, "step": 342940 }, { "epoch": 0.6, "learning_rate": 2.0096820209474848e-05, "loss": 2.5058, "step": 342950 }, { "epoch": 0.6, "learning_rate": 2.009594826954802e-05, "loss": 2.3043, "step": 342960 }, { "epoch": 0.6, "learning_rate": 2.0095076329621195e-05, "loss": 2.3272, "step": 342970 }, { "epoch": 0.6, "learning_rate": 2.009420438969437e-05, "loss": 2.2796, "step": 342980 }, { "epoch": 0.6, "learning_rate": 2.009333244976754e-05, "loss": 2.2553, "step": 342990 }, { "epoch": 0.6, "learning_rate": 2.0092460509840717e-05, "loss": 2.3804, "step": 343000 }, { "epoch": 0.6, "learning_rate": 2.0091588569913887e-05, "loss": 2.2877, "step": 343010 }, { "epoch": 0.6, "learning_rate": 2.009071662998706e-05, "loss": 2.3787, "step": 343020 }, { "epoch": 0.6, "learning_rate": 2.0089844690060235e-05, "loss": 2.3367, "step": 343030 }, { "epoch": 0.6, "learning_rate": 2.008897275013341e-05, "loss": 2.3874, "step": 343040 }, { "epoch": 0.6, "learning_rate": 2.0088100810206582e-05, "loss": 2.2729, "step": 343050 }, { "epoch": 0.6, "learning_rate": 2.0087228870279753e-05, "loss": 2.3187, "step": 343060 }, { "epoch": 0.6, "learning_rate": 2.008635693035293e-05, "loss": 2.2713, "step": 343070 }, { "epoch": 0.6, "learning_rate": 2.00854849904261e-05, "loss": 2.4274, "step": 343080 }, { "epoch": 0.6, "learning_rate": 2.0084613050499274e-05, "loss": 2.2517, "step": 343090 }, { "epoch": 0.6, "learning_rate": 2.0083741110572448e-05, "loss": 2.2646, "step": 343100 }, { "epoch": 0.6, "learning_rate": 2.008286917064562e-05, "loss": 2.2316, "step": 343110 }, { "epoch": 0.6, "learning_rate": 2.0081997230718795e-05, "loss": 2.2589, "step": 343120 }, { "epoch": 0.6, "learning_rate": 2.0081125290791966e-05, "loss": 2.2833, "step": 343130 }, { "epoch": 0.6, "learning_rate": 2.008025335086514e-05, "loss": 2.247, "step": 343140 }, { "epoch": 0.6, "learning_rate": 2.0079381410938313e-05, "loss": 2.381, "step": 343150 }, { "epoch": 0.6, "learning_rate": 2.0078509471011487e-05, "loss": 2.4367, "step": 343160 }, { "epoch": 0.6, "learning_rate": 2.0077637531084657e-05, "loss": 2.4037, "step": 343170 }, { "epoch": 0.6, "learning_rate": 2.007676559115783e-05, "loss": 2.2529, "step": 343180 }, { "epoch": 0.6, "learning_rate": 2.0075893651231005e-05, "loss": 2.3439, "step": 343190 }, { "epoch": 0.6, "learning_rate": 2.007502171130418e-05, "loss": 2.2854, "step": 343200 }, { "epoch": 0.6, "learning_rate": 2.0074149771377352e-05, "loss": 2.4401, "step": 343210 }, { "epoch": 0.6, "learning_rate": 2.0073277831450526e-05, "loss": 2.3239, "step": 343220 }, { "epoch": 0.6, "learning_rate": 2.00724058915237e-05, "loss": 2.3151, "step": 343230 }, { "epoch": 0.6, "learning_rate": 2.007153395159687e-05, "loss": 2.2901, "step": 343240 }, { "epoch": 0.6, "learning_rate": 2.0070662011670044e-05, "loss": 2.3912, "step": 343250 }, { "epoch": 0.6, "learning_rate": 2.0069790071743218e-05, "loss": 2.3642, "step": 343260 }, { "epoch": 0.6, "learning_rate": 2.006891813181639e-05, "loss": 2.3912, "step": 343270 }, { "epoch": 0.6, "learning_rate": 2.0068046191889565e-05, "loss": 2.3578, "step": 343280 }, { "epoch": 0.6, "learning_rate": 2.0067174251962736e-05, "loss": 2.295, "step": 343290 }, { "epoch": 0.6, "learning_rate": 2.0066302312035913e-05, "loss": 2.3181, "step": 343300 }, { "epoch": 0.6, "learning_rate": 2.0065430372109083e-05, "loss": 2.3716, "step": 343310 }, { "epoch": 0.6, "learning_rate": 2.0064558432182257e-05, "loss": 2.44, "step": 343320 }, { "epoch": 0.6, "learning_rate": 2.006368649225543e-05, "loss": 2.4053, "step": 343330 }, { "epoch": 0.6, "learning_rate": 2.0062814552328605e-05, "loss": 2.347, "step": 343340 }, { "epoch": 0.6, "learning_rate": 2.006194261240178e-05, "loss": 2.2775, "step": 343350 }, { "epoch": 0.6, "learning_rate": 2.006107067247495e-05, "loss": 2.254, "step": 343360 }, { "epoch": 0.6, "learning_rate": 2.0060198732548126e-05, "loss": 2.2812, "step": 343370 }, { "epoch": 0.6, "learning_rate": 2.0059326792621296e-05, "loss": 2.2749, "step": 343380 }, { "epoch": 0.6, "learning_rate": 2.005845485269447e-05, "loss": 2.3787, "step": 343390 }, { "epoch": 0.6, "learning_rate": 2.005758291276764e-05, "loss": 2.3895, "step": 343400 }, { "epoch": 0.6, "learning_rate": 2.0056710972840818e-05, "loss": 2.3474, "step": 343410 }, { "epoch": 0.6, "learning_rate": 2.0055839032913988e-05, "loss": 2.2279, "step": 343420 }, { "epoch": 0.6, "learning_rate": 2.0054967092987162e-05, "loss": 2.329, "step": 343430 }, { "epoch": 0.6, "learning_rate": 2.0054095153060336e-05, "loss": 2.3811, "step": 343440 }, { "epoch": 0.6, "learning_rate": 2.005322321313351e-05, "loss": 2.2899, "step": 343450 }, { "epoch": 0.6, "learning_rate": 2.0052351273206683e-05, "loss": 2.3068, "step": 343460 }, { "epoch": 0.6, "learning_rate": 2.0051479333279853e-05, "loss": 2.3113, "step": 343470 }, { "epoch": 0.6, "learning_rate": 2.005060739335303e-05, "loss": 2.4507, "step": 343480 }, { "epoch": 0.6, "learning_rate": 2.00497354534262e-05, "loss": 2.3234, "step": 343490 }, { "epoch": 0.6, "learning_rate": 2.0048863513499375e-05, "loss": 2.2999, "step": 343500 }, { "epoch": 0.6, "learning_rate": 2.004799157357255e-05, "loss": 2.2687, "step": 343510 }, { "epoch": 0.6, "learning_rate": 2.0047119633645722e-05, "loss": 2.429, "step": 343520 }, { "epoch": 0.6, "learning_rate": 2.0046247693718896e-05, "loss": 2.3207, "step": 343530 }, { "epoch": 0.6, "learning_rate": 2.0045375753792066e-05, "loss": 2.4138, "step": 343540 }, { "epoch": 0.6, "learning_rate": 2.004450381386524e-05, "loss": 2.2146, "step": 343550 }, { "epoch": 0.6, "learning_rate": 2.0043631873938414e-05, "loss": 2.39, "step": 343560 }, { "epoch": 0.6, "learning_rate": 2.0042759934011588e-05, "loss": 2.254, "step": 343570 }, { "epoch": 0.6, "learning_rate": 2.0041887994084758e-05, "loss": 2.2674, "step": 343580 }, { "epoch": 0.6, "learning_rate": 2.0041016054157935e-05, "loss": 2.2599, "step": 343590 }, { "epoch": 0.6, "learning_rate": 2.004014411423111e-05, "loss": 2.2571, "step": 343600 }, { "epoch": 0.6, "learning_rate": 2.003927217430428e-05, "loss": 2.3184, "step": 343610 }, { "epoch": 0.6, "learning_rate": 2.0038400234377453e-05, "loss": 2.4391, "step": 343620 }, { "epoch": 0.6, "learning_rate": 2.0037528294450627e-05, "loss": 2.3896, "step": 343630 }, { "epoch": 0.6, "learning_rate": 2.00366563545238e-05, "loss": 2.3646, "step": 343640 }, { "epoch": 0.6, "learning_rate": 2.003578441459697e-05, "loss": 2.3757, "step": 343650 }, { "epoch": 0.6, "learning_rate": 2.0034912474670145e-05, "loss": 2.2369, "step": 343660 }, { "epoch": 0.6, "learning_rate": 2.003404053474332e-05, "loss": 2.3398, "step": 343670 }, { "epoch": 0.6, "learning_rate": 2.0033168594816492e-05, "loss": 2.3956, "step": 343680 }, { "epoch": 0.6, "learning_rate": 2.0032296654889666e-05, "loss": 2.2408, "step": 343690 }, { "epoch": 0.6, "learning_rate": 2.0031424714962837e-05, "loss": 2.2298, "step": 343700 }, { "epoch": 0.6, "learning_rate": 2.0030552775036014e-05, "loss": 2.2659, "step": 343710 }, { "epoch": 0.6, "learning_rate": 2.0029680835109184e-05, "loss": 2.3391, "step": 343720 }, { "epoch": 0.6, "learning_rate": 2.0028808895182358e-05, "loss": 2.3367, "step": 343730 }, { "epoch": 0.6, "learning_rate": 2.002793695525553e-05, "loss": 2.3085, "step": 343740 }, { "epoch": 0.6, "learning_rate": 2.0027065015328705e-05, "loss": 2.3237, "step": 343750 }, { "epoch": 0.6, "learning_rate": 2.002619307540188e-05, "loss": 2.2756, "step": 343760 }, { "epoch": 0.6, "learning_rate": 2.002532113547505e-05, "loss": 2.3863, "step": 343770 }, { "epoch": 0.6, "learning_rate": 2.0024449195548227e-05, "loss": 2.2377, "step": 343780 }, { "epoch": 0.6, "learning_rate": 2.0023577255621397e-05, "loss": 2.4038, "step": 343790 }, { "epoch": 0.6, "learning_rate": 2.002270531569457e-05, "loss": 2.3944, "step": 343800 }, { "epoch": 0.6, "learning_rate": 2.002183337576774e-05, "loss": 2.2655, "step": 343810 }, { "epoch": 0.6, "learning_rate": 2.002096143584092e-05, "loss": 2.1941, "step": 343820 }, { "epoch": 0.6, "learning_rate": 2.0020089495914092e-05, "loss": 2.3272, "step": 343830 }, { "epoch": 0.6, "learning_rate": 2.0019217555987263e-05, "loss": 2.2535, "step": 343840 }, { "epoch": 0.6, "learning_rate": 2.001834561606044e-05, "loss": 2.304, "step": 343850 }, { "epoch": 0.6, "learning_rate": 2.001747367613361e-05, "loss": 2.3538, "step": 343860 }, { "epoch": 0.6, "learning_rate": 2.0016601736206784e-05, "loss": 2.2538, "step": 343870 }, { "epoch": 0.6, "learning_rate": 2.0015729796279954e-05, "loss": 2.2407, "step": 343880 }, { "epoch": 0.6, "learning_rate": 2.001485785635313e-05, "loss": 2.2129, "step": 343890 }, { "epoch": 0.6, "learning_rate": 2.0013985916426302e-05, "loss": 2.3497, "step": 343900 }, { "epoch": 0.6, "learning_rate": 2.0013113976499476e-05, "loss": 2.433, "step": 343910 }, { "epoch": 0.6, "learning_rate": 2.001224203657265e-05, "loss": 2.3011, "step": 343920 }, { "epoch": 0.6, "learning_rate": 2.0011370096645823e-05, "loss": 2.2722, "step": 343930 }, { "epoch": 0.6, "learning_rate": 2.0010498156718997e-05, "loss": 2.3689, "step": 343940 }, { "epoch": 0.6, "learning_rate": 2.0009626216792167e-05, "loss": 2.3368, "step": 343950 }, { "epoch": 0.6, "learning_rate": 2.000875427686534e-05, "loss": 2.3711, "step": 343960 }, { "epoch": 0.6, "learning_rate": 2.0007882336938515e-05, "loss": 2.379, "step": 343970 }, { "epoch": 0.6, "learning_rate": 2.000701039701169e-05, "loss": 2.3641, "step": 343980 }, { "epoch": 0.6, "learning_rate": 2.0006138457084862e-05, "loss": 2.3239, "step": 343990 }, { "epoch": 0.6, "learning_rate": 2.0005266517158036e-05, "loss": 2.2927, "step": 344000 }, { "epoch": 0.6, "learning_rate": 2.000439457723121e-05, "loss": 2.4385, "step": 344010 }, { "epoch": 0.6, "learning_rate": 2.000352263730438e-05, "loss": 2.4148, "step": 344020 }, { "epoch": 0.6, "learning_rate": 2.0002650697377554e-05, "loss": 2.2551, "step": 344030 }, { "epoch": 0.6, "learning_rate": 2.0001778757450728e-05, "loss": 2.3722, "step": 344040 }, { "epoch": 0.6, "learning_rate": 2.00009068175239e-05, "loss": 2.4626, "step": 344050 }, { "epoch": 0.6, "learning_rate": 2.0000034877597072e-05, "loss": 2.3122, "step": 344060 }, { "epoch": 0.6, "learning_rate": 1.9999162937670246e-05, "loss": 2.3392, "step": 344070 }, { "epoch": 0.6, "learning_rate": 1.9998290997743423e-05, "loss": 2.3582, "step": 344080 }, { "epoch": 0.6, "learning_rate": 1.9997419057816593e-05, "loss": 2.3369, "step": 344090 }, { "epoch": 0.6, "learning_rate": 1.9996547117889767e-05, "loss": 2.4265, "step": 344100 }, { "epoch": 0.6, "learning_rate": 1.9995675177962937e-05, "loss": 2.317, "step": 344110 }, { "epoch": 0.6, "learning_rate": 1.9994803238036115e-05, "loss": 2.2944, "step": 344120 }, { "epoch": 0.6, "learning_rate": 1.9993931298109285e-05, "loss": 2.3278, "step": 344130 }, { "epoch": 0.6, "learning_rate": 1.999305935818246e-05, "loss": 2.2587, "step": 344140 }, { "epoch": 0.6, "learning_rate": 1.9992187418255633e-05, "loss": 2.4103, "step": 344150 }, { "epoch": 0.6, "learning_rate": 1.9991315478328806e-05, "loss": 2.4173, "step": 344160 }, { "epoch": 0.6, "learning_rate": 1.999044353840198e-05, "loss": 2.3098, "step": 344170 }, { "epoch": 0.6, "learning_rate": 1.998957159847515e-05, "loss": 2.3136, "step": 344180 }, { "epoch": 0.6, "learning_rate": 1.9988699658548328e-05, "loss": 2.3789, "step": 344190 }, { "epoch": 0.6, "learning_rate": 1.9987827718621498e-05, "loss": 2.3386, "step": 344200 }, { "epoch": 0.6, "learning_rate": 1.9986955778694672e-05, "loss": 2.2411, "step": 344210 }, { "epoch": 0.6, "learning_rate": 1.9986083838767846e-05, "loss": 2.3405, "step": 344220 }, { "epoch": 0.6, "learning_rate": 1.998521189884102e-05, "loss": 2.4213, "step": 344230 }, { "epoch": 0.6, "learning_rate": 1.9984339958914193e-05, "loss": 2.2516, "step": 344240 }, { "epoch": 0.6, "learning_rate": 1.9983468018987363e-05, "loss": 2.3386, "step": 344250 }, { "epoch": 0.6, "learning_rate": 1.998259607906054e-05, "loss": 2.2585, "step": 344260 }, { "epoch": 0.6, "learning_rate": 1.998172413913371e-05, "loss": 2.2863, "step": 344270 }, { "epoch": 0.6, "learning_rate": 1.9980852199206885e-05, "loss": 2.4447, "step": 344280 }, { "epoch": 0.6, "learning_rate": 1.9979980259280055e-05, "loss": 2.2669, "step": 344290 }, { "epoch": 0.6, "learning_rate": 1.9979108319353232e-05, "loss": 2.329, "step": 344300 }, { "epoch": 0.6, "learning_rate": 1.9978236379426403e-05, "loss": 2.2927, "step": 344310 }, { "epoch": 0.6, "learning_rate": 1.9977364439499576e-05, "loss": 2.4112, "step": 344320 }, { "epoch": 0.6, "learning_rate": 1.997649249957275e-05, "loss": 2.4204, "step": 344330 }, { "epoch": 0.6, "learning_rate": 1.9975620559645924e-05, "loss": 2.4236, "step": 344340 }, { "epoch": 0.6, "learning_rate": 1.9974748619719098e-05, "loss": 2.3648, "step": 344350 }, { "epoch": 0.6, "learning_rate": 1.9973876679792268e-05, "loss": 2.3168, "step": 344360 }, { "epoch": 0.6, "learning_rate": 1.9973004739865442e-05, "loss": 2.1646, "step": 344370 }, { "epoch": 0.6, "learning_rate": 1.9972132799938616e-05, "loss": 2.4149, "step": 344380 }, { "epoch": 0.6, "learning_rate": 1.997126086001179e-05, "loss": 2.2952, "step": 344390 }, { "epoch": 0.6, "learning_rate": 1.9970388920084963e-05, "loss": 2.4156, "step": 344400 }, { "epoch": 0.6, "learning_rate": 1.9969516980158137e-05, "loss": 2.375, "step": 344410 }, { "epoch": 0.6, "learning_rate": 1.996864504023131e-05, "loss": 2.3324, "step": 344420 }, { "epoch": 0.6, "learning_rate": 1.996777310030448e-05, "loss": 2.2556, "step": 344430 }, { "epoch": 0.6, "learning_rate": 1.9966901160377655e-05, "loss": 2.2859, "step": 344440 }, { "epoch": 0.6, "learning_rate": 1.996602922045083e-05, "loss": 2.3925, "step": 344450 }, { "epoch": 0.6, "learning_rate": 1.9965157280524002e-05, "loss": 2.2517, "step": 344460 }, { "epoch": 0.6, "learning_rate": 1.9964285340597176e-05, "loss": 2.3853, "step": 344470 }, { "epoch": 0.6, "learning_rate": 1.9963413400670347e-05, "loss": 2.3613, "step": 344480 }, { "epoch": 0.6, "learning_rate": 1.9962541460743524e-05, "loss": 2.5729, "step": 344490 }, { "epoch": 0.6, "learning_rate": 1.9961669520816694e-05, "loss": 2.3846, "step": 344500 }, { "epoch": 0.6, "learning_rate": 1.9960797580889868e-05, "loss": 2.257, "step": 344510 }, { "epoch": 0.6, "learning_rate": 1.995992564096304e-05, "loss": 2.3763, "step": 344520 }, { "epoch": 0.6, "learning_rate": 1.9959053701036215e-05, "loss": 2.3438, "step": 344530 }, { "epoch": 0.6, "learning_rate": 1.9958181761109386e-05, "loss": 2.302, "step": 344540 }, { "epoch": 0.6, "learning_rate": 1.995730982118256e-05, "loss": 2.3483, "step": 344550 }, { "epoch": 0.6, "learning_rate": 1.9956437881255737e-05, "loss": 2.3227, "step": 344560 }, { "epoch": 0.6, "learning_rate": 1.9955565941328907e-05, "loss": 2.3424, "step": 344570 }, { "epoch": 0.6, "learning_rate": 1.995469400140208e-05, "loss": 2.3546, "step": 344580 }, { "epoch": 0.6, "learning_rate": 1.995382206147525e-05, "loss": 2.3271, "step": 344590 }, { "epoch": 0.6, "learning_rate": 1.995295012154843e-05, "loss": 2.3659, "step": 344600 }, { "epoch": 0.6, "learning_rate": 1.99520781816216e-05, "loss": 2.2466, "step": 344610 }, { "epoch": 0.6, "learning_rate": 1.9951206241694773e-05, "loss": 2.2745, "step": 344620 }, { "epoch": 0.6, "learning_rate": 1.9950334301767946e-05, "loss": 2.3244, "step": 344630 }, { "epoch": 0.6, "learning_rate": 1.994946236184112e-05, "loss": 2.3536, "step": 344640 }, { "epoch": 0.6, "learning_rate": 1.9948590421914294e-05, "loss": 2.2948, "step": 344650 }, { "epoch": 0.6, "learning_rate": 1.9947718481987464e-05, "loss": 2.419, "step": 344660 }, { "epoch": 0.6, "learning_rate": 1.994684654206064e-05, "loss": 2.3499, "step": 344670 }, { "epoch": 0.6, "learning_rate": 1.9945974602133812e-05, "loss": 2.332, "step": 344680 }, { "epoch": 0.6, "learning_rate": 1.9945102662206986e-05, "loss": 2.2027, "step": 344690 }, { "epoch": 0.6, "learning_rate": 1.994423072228016e-05, "loss": 2.2927, "step": 344700 }, { "epoch": 0.6, "learning_rate": 1.9943358782353333e-05, "loss": 2.2606, "step": 344710 }, { "epoch": 0.6, "learning_rate": 1.9942486842426507e-05, "loss": 2.1753, "step": 344720 }, { "epoch": 0.6, "learning_rate": 1.9941614902499677e-05, "loss": 2.3006, "step": 344730 }, { "epoch": 0.6, "learning_rate": 1.994074296257285e-05, "loss": 2.3293, "step": 344740 }, { "epoch": 0.6, "learning_rate": 1.9939871022646025e-05, "loss": 2.3565, "step": 344750 }, { "epoch": 0.6, "learning_rate": 1.99389990827192e-05, "loss": 2.2583, "step": 344760 }, { "epoch": 0.6, "learning_rate": 1.993812714279237e-05, "loss": 2.3013, "step": 344770 }, { "epoch": 0.6, "learning_rate": 1.9937255202865546e-05, "loss": 2.3568, "step": 344780 }, { "epoch": 0.6, "learning_rate": 1.9936383262938717e-05, "loss": 2.3378, "step": 344790 }, { "epoch": 0.6, "learning_rate": 1.993551132301189e-05, "loss": 2.4567, "step": 344800 }, { "epoch": 0.6, "learning_rate": 1.9934639383085064e-05, "loss": 2.3154, "step": 344810 }, { "epoch": 0.6, "learning_rate": 1.9933767443158238e-05, "loss": 2.3467, "step": 344820 }, { "epoch": 0.6, "learning_rate": 1.993289550323141e-05, "loss": 2.2186, "step": 344830 }, { "epoch": 0.6, "learning_rate": 1.9932023563304582e-05, "loss": 2.2557, "step": 344840 }, { "epoch": 0.6, "learning_rate": 1.9931151623377756e-05, "loss": 2.4095, "step": 344850 }, { "epoch": 0.6, "learning_rate": 1.993027968345093e-05, "loss": 2.3587, "step": 344860 }, { "epoch": 0.6, "learning_rate": 1.9929407743524103e-05, "loss": 2.2901, "step": 344870 }, { "epoch": 0.6, "learning_rate": 1.9928535803597277e-05, "loss": 2.2152, "step": 344880 }, { "epoch": 0.6, "learning_rate": 1.9927663863670447e-05, "loss": 2.3479, "step": 344890 }, { "epoch": 0.6, "learning_rate": 1.9926791923743625e-05, "loss": 2.2769, "step": 344900 }, { "epoch": 0.6, "learning_rate": 1.9925919983816795e-05, "loss": 2.3829, "step": 344910 }, { "epoch": 0.6, "learning_rate": 1.992504804388997e-05, "loss": 2.4816, "step": 344920 }, { "epoch": 0.6, "learning_rate": 1.9924176103963143e-05, "loss": 2.2979, "step": 344930 }, { "epoch": 0.6, "learning_rate": 1.9923304164036316e-05, "loss": 2.3456, "step": 344940 }, { "epoch": 0.6, "learning_rate": 1.992243222410949e-05, "loss": 2.2483, "step": 344950 }, { "epoch": 0.6, "learning_rate": 1.992156028418266e-05, "loss": 2.3699, "step": 344960 }, { "epoch": 0.6, "learning_rate": 1.9920688344255838e-05, "loss": 2.3935, "step": 344970 }, { "epoch": 0.6, "learning_rate": 1.9919816404329008e-05, "loss": 2.3107, "step": 344980 }, { "epoch": 0.6, "learning_rate": 1.9918944464402182e-05, "loss": 2.3673, "step": 344990 }, { "epoch": 0.6, "learning_rate": 1.9918072524475352e-05, "loss": 2.3251, "step": 345000 }, { "epoch": 0.6, "learning_rate": 1.991720058454853e-05, "loss": 2.3729, "step": 345010 }, { "epoch": 0.6, "learning_rate": 1.99163286446217e-05, "loss": 2.3712, "step": 345020 }, { "epoch": 0.6, "learning_rate": 1.9915456704694873e-05, "loss": 2.2759, "step": 345030 }, { "epoch": 0.6, "learning_rate": 1.9914584764768047e-05, "loss": 2.3497, "step": 345040 }, { "epoch": 0.6, "learning_rate": 1.991371282484122e-05, "loss": 2.3191, "step": 345050 }, { "epoch": 0.6, "learning_rate": 1.9912840884914395e-05, "loss": 2.3711, "step": 345060 }, { "epoch": 0.6, "learning_rate": 1.9911968944987565e-05, "loss": 2.2549, "step": 345070 }, { "epoch": 0.6, "learning_rate": 1.9911097005060742e-05, "loss": 2.3878, "step": 345080 }, { "epoch": 0.6, "learning_rate": 1.9910225065133913e-05, "loss": 2.3586, "step": 345090 }, { "epoch": 0.6, "learning_rate": 1.9909353125207086e-05, "loss": 2.3682, "step": 345100 }, { "epoch": 0.6, "learning_rate": 1.990848118528026e-05, "loss": 2.3796, "step": 345110 }, { "epoch": 0.6, "learning_rate": 1.9907609245353434e-05, "loss": 2.3, "step": 345120 }, { "epoch": 0.6, "learning_rate": 1.9906737305426608e-05, "loss": 2.2874, "step": 345130 }, { "epoch": 0.6, "learning_rate": 1.9905865365499778e-05, "loss": 2.3221, "step": 345140 }, { "epoch": 0.6, "learning_rate": 1.9904993425572952e-05, "loss": 2.3494, "step": 345150 }, { "epoch": 0.6, "learning_rate": 1.9904121485646126e-05, "loss": 2.2688, "step": 345160 }, { "epoch": 0.6, "learning_rate": 1.99032495457193e-05, "loss": 2.4109, "step": 345170 }, { "epoch": 0.6, "learning_rate": 1.9902377605792473e-05, "loss": 2.246, "step": 345180 }, { "epoch": 0.6, "learning_rate": 1.9901505665865647e-05, "loss": 2.3192, "step": 345190 }, { "epoch": 0.6, "learning_rate": 1.990063372593882e-05, "loss": 2.2877, "step": 345200 }, { "epoch": 0.6, "learning_rate": 1.989976178601199e-05, "loss": 2.323, "step": 345210 }, { "epoch": 0.6, "learning_rate": 1.9898889846085165e-05, "loss": 2.4049, "step": 345220 }, { "epoch": 0.6, "learning_rate": 1.989801790615834e-05, "loss": 2.363, "step": 345230 }, { "epoch": 0.6, "learning_rate": 1.9897145966231512e-05, "loss": 2.4095, "step": 345240 }, { "epoch": 0.6, "learning_rate": 1.9896274026304683e-05, "loss": 2.3882, "step": 345250 }, { "epoch": 0.6, "learning_rate": 1.9895402086377857e-05, "loss": 2.2454, "step": 345260 }, { "epoch": 0.6, "learning_rate": 1.989453014645103e-05, "loss": 2.309, "step": 345270 }, { "epoch": 0.6, "learning_rate": 1.9893658206524204e-05, "loss": 2.3518, "step": 345280 }, { "epoch": 0.6, "learning_rate": 1.9892786266597378e-05, "loss": 2.3246, "step": 345290 }, { "epoch": 0.6, "learning_rate": 1.9891914326670548e-05, "loss": 2.3884, "step": 345300 }, { "epoch": 0.6, "learning_rate": 1.9891042386743725e-05, "loss": 2.321, "step": 345310 }, { "epoch": 0.6, "learning_rate": 1.9890170446816896e-05, "loss": 2.3993, "step": 345320 }, { "epoch": 0.6, "learning_rate": 1.988929850689007e-05, "loss": 2.382, "step": 345330 }, { "epoch": 0.6, "learning_rate": 1.9888426566963243e-05, "loss": 2.3398, "step": 345340 }, { "epoch": 0.6, "learning_rate": 1.9887554627036417e-05, "loss": 2.3081, "step": 345350 }, { "epoch": 0.6, "learning_rate": 1.988668268710959e-05, "loss": 2.3151, "step": 345360 }, { "epoch": 0.6, "learning_rate": 1.988581074718276e-05, "loss": 2.4319, "step": 345370 }, { "epoch": 0.6, "learning_rate": 1.988493880725594e-05, "loss": 2.3954, "step": 345380 }, { "epoch": 0.6, "learning_rate": 1.988406686732911e-05, "loss": 2.3205, "step": 345390 }, { "epoch": 0.6, "learning_rate": 1.9883194927402283e-05, "loss": 2.319, "step": 345400 }, { "epoch": 0.6, "learning_rate": 1.9882322987475453e-05, "loss": 2.373, "step": 345410 }, { "epoch": 0.6, "learning_rate": 1.988145104754863e-05, "loss": 2.284, "step": 345420 }, { "epoch": 0.6, "learning_rate": 1.9880579107621804e-05, "loss": 2.3005, "step": 345430 }, { "epoch": 0.6, "learning_rate": 1.9879707167694974e-05, "loss": 2.295, "step": 345440 }, { "epoch": 0.6, "learning_rate": 1.987883522776815e-05, "loss": 2.2089, "step": 345450 }, { "epoch": 0.6, "learning_rate": 1.9877963287841322e-05, "loss": 2.3445, "step": 345460 }, { "epoch": 0.6, "learning_rate": 1.9877091347914496e-05, "loss": 2.309, "step": 345470 }, { "epoch": 0.6, "learning_rate": 1.9876219407987666e-05, "loss": 2.3322, "step": 345480 }, { "epoch": 0.6, "learning_rate": 1.9875347468060843e-05, "loss": 2.3232, "step": 345490 }, { "epoch": 0.6, "learning_rate": 1.9874475528134014e-05, "loss": 2.3262, "step": 345500 }, { "epoch": 0.6, "learning_rate": 1.9873603588207187e-05, "loss": 2.3877, "step": 345510 }, { "epoch": 0.6, "learning_rate": 1.987273164828036e-05, "loss": 2.3491, "step": 345520 }, { "epoch": 0.6, "learning_rate": 1.9871859708353535e-05, "loss": 2.2937, "step": 345530 }, { "epoch": 0.6, "learning_rate": 1.987098776842671e-05, "loss": 2.4053, "step": 345540 }, { "epoch": 0.6, "learning_rate": 1.987011582849988e-05, "loss": 2.2379, "step": 345550 }, { "epoch": 0.6, "learning_rate": 1.9869243888573053e-05, "loss": 2.3566, "step": 345560 }, { "epoch": 0.6, "learning_rate": 1.9868371948646227e-05, "loss": 2.4208, "step": 345570 }, { "epoch": 0.6, "learning_rate": 1.98675000087194e-05, "loss": 2.3083, "step": 345580 }, { "epoch": 0.6, "learning_rate": 1.9866628068792574e-05, "loss": 2.4203, "step": 345590 }, { "epoch": 0.6, "learning_rate": 1.9865756128865748e-05, "loss": 2.2595, "step": 345600 }, { "epoch": 0.6, "learning_rate": 1.986488418893892e-05, "loss": 2.266, "step": 345610 }, { "epoch": 0.6, "learning_rate": 1.9864012249012092e-05, "loss": 2.3753, "step": 345620 }, { "epoch": 0.6, "learning_rate": 1.9863140309085266e-05, "loss": 2.3999, "step": 345630 }, { "epoch": 0.6, "learning_rate": 1.986226836915844e-05, "loss": 2.3362, "step": 345640 }, { "epoch": 0.6, "learning_rate": 1.9861396429231613e-05, "loss": 2.2632, "step": 345650 }, { "epoch": 0.6, "learning_rate": 1.9860524489304787e-05, "loss": 2.3033, "step": 345660 }, { "epoch": 0.6, "learning_rate": 1.9859652549377957e-05, "loss": 2.4042, "step": 345670 }, { "epoch": 0.6, "learning_rate": 1.9858780609451135e-05, "loss": 2.2984, "step": 345680 }, { "epoch": 0.6, "learning_rate": 1.9857908669524305e-05, "loss": 2.4133, "step": 345690 }, { "epoch": 0.6, "learning_rate": 1.985703672959748e-05, "loss": 2.2195, "step": 345700 }, { "epoch": 0.6, "learning_rate": 1.9856164789670653e-05, "loss": 2.3369, "step": 345710 }, { "epoch": 0.6, "learning_rate": 1.9855292849743826e-05, "loss": 2.3068, "step": 345720 }, { "epoch": 0.6, "learning_rate": 1.9854420909816997e-05, "loss": 2.2945, "step": 345730 }, { "epoch": 0.6, "learning_rate": 1.985354896989017e-05, "loss": 2.3755, "step": 345740 }, { "epoch": 0.6, "learning_rate": 1.9852677029963344e-05, "loss": 2.238, "step": 345750 }, { "epoch": 0.6, "learning_rate": 1.9851805090036518e-05, "loss": 2.3775, "step": 345760 }, { "epoch": 0.6, "learning_rate": 1.9850933150109692e-05, "loss": 2.3858, "step": 345770 }, { "epoch": 0.6, "learning_rate": 1.9850061210182862e-05, "loss": 2.2876, "step": 345780 }, { "epoch": 0.6, "learning_rate": 1.984918927025604e-05, "loss": 2.4157, "step": 345790 }, { "epoch": 0.6, "learning_rate": 1.984831733032921e-05, "loss": 2.4465, "step": 345800 }, { "epoch": 0.6, "learning_rate": 1.9847445390402383e-05, "loss": 2.404, "step": 345810 }, { "epoch": 0.6, "learning_rate": 1.9846573450475557e-05, "loss": 2.2842, "step": 345820 }, { "epoch": 0.6, "learning_rate": 1.984570151054873e-05, "loss": 2.4134, "step": 345830 }, { "epoch": 0.6, "learning_rate": 1.9844829570621905e-05, "loss": 2.4017, "step": 345840 }, { "epoch": 0.6, "learning_rate": 1.9843957630695075e-05, "loss": 2.3132, "step": 345850 }, { "epoch": 0.6, "learning_rate": 1.9843085690768252e-05, "loss": 2.3906, "step": 345860 }, { "epoch": 0.6, "learning_rate": 1.9842213750841423e-05, "loss": 2.3513, "step": 345870 }, { "epoch": 0.6, "learning_rate": 1.9841341810914596e-05, "loss": 2.322, "step": 345880 }, { "epoch": 0.6, "learning_rate": 1.9840469870987767e-05, "loss": 2.4202, "step": 345890 }, { "epoch": 0.6, "learning_rate": 1.9839597931060944e-05, "loss": 2.366, "step": 345900 }, { "epoch": 0.6, "learning_rate": 1.9838725991134118e-05, "loss": 2.3909, "step": 345910 }, { "epoch": 0.6, "learning_rate": 1.9837854051207288e-05, "loss": 2.2991, "step": 345920 }, { "epoch": 0.6, "learning_rate": 1.9836982111280462e-05, "loss": 2.2661, "step": 345930 }, { "epoch": 0.6, "learning_rate": 1.9836110171353636e-05, "loss": 2.3354, "step": 345940 }, { "epoch": 0.6, "learning_rate": 1.983523823142681e-05, "loss": 2.2128, "step": 345950 }, { "epoch": 0.6, "learning_rate": 1.983436629149998e-05, "loss": 2.3179, "step": 345960 }, { "epoch": 0.6, "learning_rate": 1.9833494351573154e-05, "loss": 2.402, "step": 345970 }, { "epoch": 0.6, "learning_rate": 1.9832622411646327e-05, "loss": 2.2653, "step": 345980 }, { "epoch": 0.6, "learning_rate": 1.98317504717195e-05, "loss": 2.365, "step": 345990 }, { "epoch": 0.6, "learning_rate": 1.9830878531792675e-05, "loss": 2.3498, "step": 346000 }, { "epoch": 0.6, "learning_rate": 1.983000659186585e-05, "loss": 2.3211, "step": 346010 }, { "epoch": 0.6, "learning_rate": 1.9829134651939022e-05, "loss": 2.1962, "step": 346020 }, { "epoch": 0.6, "learning_rate": 1.9828262712012193e-05, "loss": 2.3663, "step": 346030 }, { "epoch": 0.6, "learning_rate": 1.9827390772085367e-05, "loss": 2.3567, "step": 346040 }, { "epoch": 0.6, "learning_rate": 1.982651883215854e-05, "loss": 2.4552, "step": 346050 }, { "epoch": 0.6, "learning_rate": 1.9825646892231714e-05, "loss": 2.3565, "step": 346060 }, { "epoch": 0.6, "learning_rate": 1.9824774952304888e-05, "loss": 2.3555, "step": 346070 }, { "epoch": 0.6, "learning_rate": 1.9823903012378058e-05, "loss": 2.217, "step": 346080 }, { "epoch": 0.6, "learning_rate": 1.9823031072451235e-05, "loss": 2.329, "step": 346090 }, { "epoch": 0.6, "learning_rate": 1.9822159132524406e-05, "loss": 2.3105, "step": 346100 }, { "epoch": 0.6, "learning_rate": 1.982128719259758e-05, "loss": 2.3658, "step": 346110 }, { "epoch": 0.6, "learning_rate": 1.9820415252670753e-05, "loss": 2.4063, "step": 346120 }, { "epoch": 0.6, "learning_rate": 1.9819543312743927e-05, "loss": 2.2907, "step": 346130 }, { "epoch": 0.6, "learning_rate": 1.9818671372817098e-05, "loss": 2.3145, "step": 346140 }, { "epoch": 0.6, "learning_rate": 1.981779943289027e-05, "loss": 2.367, "step": 346150 }, { "epoch": 0.6, "learning_rate": 1.981692749296345e-05, "loss": 2.4411, "step": 346160 }, { "epoch": 0.6, "learning_rate": 1.981605555303662e-05, "loss": 2.3556, "step": 346170 }, { "epoch": 0.6, "learning_rate": 1.9815183613109793e-05, "loss": 2.3575, "step": 346180 }, { "epoch": 0.6, "learning_rate": 1.9814311673182963e-05, "loss": 2.2792, "step": 346190 }, { "epoch": 0.6, "learning_rate": 1.981343973325614e-05, "loss": 2.4118, "step": 346200 }, { "epoch": 0.6, "learning_rate": 1.981256779332931e-05, "loss": 2.2964, "step": 346210 }, { "epoch": 0.6, "learning_rate": 1.9811695853402484e-05, "loss": 2.3778, "step": 346220 }, { "epoch": 0.6, "learning_rate": 1.9810823913475658e-05, "loss": 2.3689, "step": 346230 }, { "epoch": 0.6, "learning_rate": 1.9809951973548832e-05, "loss": 2.4007, "step": 346240 }, { "epoch": 0.6, "learning_rate": 1.9809080033622006e-05, "loss": 2.4159, "step": 346250 }, { "epoch": 0.6, "learning_rate": 1.9808208093695176e-05, "loss": 2.3522, "step": 346260 }, { "epoch": 0.6, "learning_rate": 1.9807336153768353e-05, "loss": 2.2156, "step": 346270 }, { "epoch": 0.6, "learning_rate": 1.9806464213841524e-05, "loss": 2.459, "step": 346280 }, { "epoch": 0.6, "learning_rate": 1.9805592273914697e-05, "loss": 2.2132, "step": 346290 }, { "epoch": 0.6, "learning_rate": 1.980472033398787e-05, "loss": 2.3219, "step": 346300 }, { "epoch": 0.6, "learning_rate": 1.9803848394061045e-05, "loss": 2.4217, "step": 346310 }, { "epoch": 0.6, "learning_rate": 1.980297645413422e-05, "loss": 2.2231, "step": 346320 }, { "epoch": 0.6, "learning_rate": 1.980210451420739e-05, "loss": 2.3108, "step": 346330 }, { "epoch": 0.6, "learning_rate": 1.9801232574280563e-05, "loss": 2.3381, "step": 346340 }, { "epoch": 0.6, "learning_rate": 1.9800360634353737e-05, "loss": 2.3581, "step": 346350 }, { "epoch": 0.6, "learning_rate": 1.979948869442691e-05, "loss": 2.2898, "step": 346360 }, { "epoch": 0.6, "learning_rate": 1.979861675450008e-05, "loss": 2.2533, "step": 346370 }, { "epoch": 0.6, "learning_rate": 1.9797744814573258e-05, "loss": 2.2698, "step": 346380 }, { "epoch": 0.6, "learning_rate": 1.979687287464643e-05, "loss": 2.315, "step": 346390 }, { "epoch": 0.6, "learning_rate": 1.9796000934719602e-05, "loss": 2.268, "step": 346400 }, { "epoch": 0.6, "learning_rate": 1.9795128994792776e-05, "loss": 2.2339, "step": 346410 }, { "epoch": 0.6, "learning_rate": 1.979425705486595e-05, "loss": 2.3464, "step": 346420 }, { "epoch": 0.6, "learning_rate": 1.9793385114939123e-05, "loss": 2.2631, "step": 346430 }, { "epoch": 0.6, "learning_rate": 1.9792513175012294e-05, "loss": 2.3938, "step": 346440 }, { "epoch": 0.6, "learning_rate": 1.9791641235085467e-05, "loss": 2.2795, "step": 346450 }, { "epoch": 0.6, "learning_rate": 1.979076929515864e-05, "loss": 2.3253, "step": 346460 }, { "epoch": 0.6, "learning_rate": 1.9789897355231815e-05, "loss": 2.3058, "step": 346470 }, { "epoch": 0.6, "learning_rate": 1.978902541530499e-05, "loss": 2.2443, "step": 346480 }, { "epoch": 0.6, "learning_rate": 1.978815347537816e-05, "loss": 2.3242, "step": 346490 }, { "epoch": 0.6, "learning_rate": 1.9787281535451336e-05, "loss": 2.4017, "step": 346500 }, { "epoch": 0.6, "learning_rate": 1.9786409595524507e-05, "loss": 2.3075, "step": 346510 }, { "epoch": 0.6, "learning_rate": 1.978553765559768e-05, "loss": 2.2732, "step": 346520 }, { "epoch": 0.6, "learning_rate": 1.9784665715670854e-05, "loss": 2.3599, "step": 346530 }, { "epoch": 0.6, "learning_rate": 1.9783793775744028e-05, "loss": 2.37, "step": 346540 }, { "epoch": 0.6, "learning_rate": 1.9782921835817202e-05, "loss": 2.4323, "step": 346550 }, { "epoch": 0.6, "learning_rate": 1.9782049895890372e-05, "loss": 2.3594, "step": 346560 }, { "epoch": 0.6, "learning_rate": 1.978117795596355e-05, "loss": 2.3462, "step": 346570 }, { "epoch": 0.6, "learning_rate": 1.978030601603672e-05, "loss": 2.3734, "step": 346580 }, { "epoch": 0.6, "learning_rate": 1.9779434076109893e-05, "loss": 2.2952, "step": 346590 }, { "epoch": 0.6, "learning_rate": 1.9778562136183064e-05, "loss": 2.3508, "step": 346600 }, { "epoch": 0.6, "learning_rate": 1.977769019625624e-05, "loss": 2.2997, "step": 346610 }, { "epoch": 0.6, "learning_rate": 1.977681825632941e-05, "loss": 2.1928, "step": 346620 }, { "epoch": 0.6, "learning_rate": 1.9775946316402585e-05, "loss": 2.3917, "step": 346630 }, { "epoch": 0.6, "learning_rate": 1.977507437647576e-05, "loss": 2.3242, "step": 346640 }, { "epoch": 0.6, "learning_rate": 1.9774202436548933e-05, "loss": 2.2709, "step": 346650 }, { "epoch": 0.6, "learning_rate": 1.9773330496622106e-05, "loss": 2.5074, "step": 346660 }, { "epoch": 0.6, "learning_rate": 1.9772458556695277e-05, "loss": 2.3776, "step": 346670 }, { "epoch": 0.6, "learning_rate": 1.9771586616768454e-05, "loss": 2.331, "step": 346680 }, { "epoch": 0.6, "learning_rate": 1.9770714676841624e-05, "loss": 2.3771, "step": 346690 }, { "epoch": 0.6, "learning_rate": 1.9769842736914798e-05, "loss": 2.3062, "step": 346700 }, { "epoch": 0.6, "learning_rate": 1.9768970796987972e-05, "loss": 2.3647, "step": 346710 }, { "epoch": 0.6, "learning_rate": 1.9768098857061146e-05, "loss": 2.3285, "step": 346720 }, { "epoch": 0.6, "learning_rate": 1.976722691713432e-05, "loss": 2.3026, "step": 346730 }, { "epoch": 0.6, "learning_rate": 1.976635497720749e-05, "loss": 2.383, "step": 346740 }, { "epoch": 0.6, "learning_rate": 1.9765483037280664e-05, "loss": 2.3266, "step": 346750 }, { "epoch": 0.6, "learning_rate": 1.9764611097353837e-05, "loss": 2.3471, "step": 346760 }, { "epoch": 0.6, "learning_rate": 1.976373915742701e-05, "loss": 2.3499, "step": 346770 }, { "epoch": 0.6, "learning_rate": 1.9762867217500185e-05, "loss": 2.3402, "step": 346780 }, { "epoch": 0.6, "learning_rate": 1.976199527757336e-05, "loss": 2.2301, "step": 346790 }, { "epoch": 0.6, "learning_rate": 1.9761123337646532e-05, "loss": 2.3383, "step": 346800 }, { "epoch": 0.6, "learning_rate": 1.9760251397719703e-05, "loss": 2.2863, "step": 346810 }, { "epoch": 0.6, "learning_rate": 1.9759379457792877e-05, "loss": 2.4041, "step": 346820 }, { "epoch": 0.6, "learning_rate": 1.975850751786605e-05, "loss": 2.2899, "step": 346830 }, { "epoch": 0.6, "learning_rate": 1.9757635577939224e-05, "loss": 2.3247, "step": 346840 }, { "epoch": 0.6, "learning_rate": 1.9756763638012395e-05, "loss": 2.3256, "step": 346850 }, { "epoch": 0.6, "learning_rate": 1.975589169808557e-05, "loss": 2.3809, "step": 346860 }, { "epoch": 0.6, "learning_rate": 1.9755019758158742e-05, "loss": 2.3043, "step": 346870 }, { "epoch": 0.6, "learning_rate": 1.9754147818231916e-05, "loss": 2.3306, "step": 346880 }, { "epoch": 0.6, "learning_rate": 1.975327587830509e-05, "loss": 2.2431, "step": 346890 }, { "epoch": 0.6, "learning_rate": 1.975240393837826e-05, "loss": 2.259, "step": 346900 }, { "epoch": 0.6, "learning_rate": 1.9751531998451437e-05, "loss": 2.4287, "step": 346910 }, { "epoch": 0.6, "learning_rate": 1.9750660058524608e-05, "loss": 2.3478, "step": 346920 }, { "epoch": 0.61, "learning_rate": 1.974978811859778e-05, "loss": 2.4424, "step": 346930 }, { "epoch": 0.61, "learning_rate": 1.9748916178670955e-05, "loss": 2.2437, "step": 346940 }, { "epoch": 0.61, "learning_rate": 1.974804423874413e-05, "loss": 2.3451, "step": 346950 }, { "epoch": 0.61, "learning_rate": 1.9747172298817303e-05, "loss": 2.304, "step": 346960 }, { "epoch": 0.61, "learning_rate": 1.9746300358890473e-05, "loss": 2.364, "step": 346970 }, { "epoch": 0.61, "learning_rate": 1.974542841896365e-05, "loss": 2.2997, "step": 346980 }, { "epoch": 0.61, "learning_rate": 1.974455647903682e-05, "loss": 2.3394, "step": 346990 }, { "epoch": 0.61, "learning_rate": 1.9743684539109994e-05, "loss": 2.2296, "step": 347000 }, { "epoch": 0.61, "learning_rate": 1.9742812599183168e-05, "loss": 2.2746, "step": 347010 }, { "epoch": 0.61, "learning_rate": 1.9741940659256342e-05, "loss": 2.3046, "step": 347020 }, { "epoch": 0.61, "learning_rate": 1.9741068719329516e-05, "loss": 2.2803, "step": 347030 }, { "epoch": 0.61, "learning_rate": 1.9740196779402686e-05, "loss": 2.333, "step": 347040 }, { "epoch": 0.61, "learning_rate": 1.9739324839475863e-05, "loss": 2.3762, "step": 347050 }, { "epoch": 0.61, "learning_rate": 1.9738452899549034e-05, "loss": 2.3486, "step": 347060 }, { "epoch": 0.61, "learning_rate": 1.9737580959622207e-05, "loss": 2.3907, "step": 347070 }, { "epoch": 0.61, "learning_rate": 1.9736709019695378e-05, "loss": 2.4936, "step": 347080 }, { "epoch": 0.61, "learning_rate": 1.9735837079768555e-05, "loss": 2.2571, "step": 347090 }, { "epoch": 0.61, "learning_rate": 1.9734965139841725e-05, "loss": 2.325, "step": 347100 }, { "epoch": 0.61, "learning_rate": 1.97340931999149e-05, "loss": 2.329, "step": 347110 }, { "epoch": 0.61, "learning_rate": 1.9733221259988073e-05, "loss": 2.3561, "step": 347120 }, { "epoch": 0.61, "learning_rate": 1.9732349320061247e-05, "loss": 2.3763, "step": 347130 }, { "epoch": 0.61, "learning_rate": 1.973147738013442e-05, "loss": 2.3397, "step": 347140 }, { "epoch": 0.61, "learning_rate": 1.973060544020759e-05, "loss": 2.4157, "step": 347150 }, { "epoch": 0.61, "learning_rate": 1.9729733500280764e-05, "loss": 2.2658, "step": 347160 }, { "epoch": 0.61, "learning_rate": 1.9728861560353938e-05, "loss": 2.2611, "step": 347170 }, { "epoch": 0.61, "learning_rate": 1.9727989620427112e-05, "loss": 2.4498, "step": 347180 }, { "epoch": 0.61, "learning_rate": 1.9727117680500286e-05, "loss": 2.3077, "step": 347190 }, { "epoch": 0.61, "learning_rate": 1.972624574057346e-05, "loss": 2.4089, "step": 347200 }, { "epoch": 0.61, "learning_rate": 1.9725373800646633e-05, "loss": 2.4173, "step": 347210 }, { "epoch": 0.61, "learning_rate": 1.9724501860719804e-05, "loss": 2.2889, "step": 347220 }, { "epoch": 0.61, "learning_rate": 1.9723629920792977e-05, "loss": 2.3736, "step": 347230 }, { "epoch": 0.61, "learning_rate": 1.972275798086615e-05, "loss": 2.3065, "step": 347240 }, { "epoch": 0.61, "learning_rate": 1.9721886040939325e-05, "loss": 2.3988, "step": 347250 }, { "epoch": 0.61, "learning_rate": 1.97210141010125e-05, "loss": 2.2959, "step": 347260 }, { "epoch": 0.61, "learning_rate": 1.972014216108567e-05, "loss": 2.3583, "step": 347270 }, { "epoch": 0.61, "learning_rate": 1.9719270221158846e-05, "loss": 2.3816, "step": 347280 }, { "epoch": 0.61, "learning_rate": 1.9718398281232017e-05, "loss": 2.3017, "step": 347290 }, { "epoch": 0.61, "learning_rate": 1.971752634130519e-05, "loss": 2.4102, "step": 347300 }, { "epoch": 0.61, "learning_rate": 1.9716654401378364e-05, "loss": 2.4661, "step": 347310 }, { "epoch": 0.61, "learning_rate": 1.9715782461451538e-05, "loss": 2.4305, "step": 347320 }, { "epoch": 0.61, "learning_rate": 1.971491052152471e-05, "loss": 2.3561, "step": 347330 }, { "epoch": 0.61, "learning_rate": 1.9714038581597882e-05, "loss": 2.3199, "step": 347340 }, { "epoch": 0.61, "learning_rate": 1.9713166641671056e-05, "loss": 2.3184, "step": 347350 }, { "epoch": 0.61, "learning_rate": 1.971229470174423e-05, "loss": 2.3298, "step": 347360 }, { "epoch": 0.61, "learning_rate": 1.9711422761817403e-05, "loss": 2.3372, "step": 347370 }, { "epoch": 0.61, "learning_rate": 1.9710550821890574e-05, "loss": 2.3951, "step": 347380 }, { "epoch": 0.61, "learning_rate": 1.970967888196375e-05, "loss": 2.4728, "step": 347390 }, { "epoch": 0.61, "learning_rate": 1.970880694203692e-05, "loss": 2.3577, "step": 347400 }, { "epoch": 0.61, "learning_rate": 1.9707935002110095e-05, "loss": 2.364, "step": 347410 }, { "epoch": 0.61, "learning_rate": 1.970706306218327e-05, "loss": 2.3819, "step": 347420 }, { "epoch": 0.61, "learning_rate": 1.9706191122256443e-05, "loss": 2.4356, "step": 347430 }, { "epoch": 0.61, "learning_rate": 1.9705319182329616e-05, "loss": 2.2606, "step": 347440 }, { "epoch": 0.61, "learning_rate": 1.9704447242402787e-05, "loss": 2.4045, "step": 347450 }, { "epoch": 0.61, "learning_rate": 1.9703575302475964e-05, "loss": 2.1837, "step": 347460 }, { "epoch": 0.61, "learning_rate": 1.9702703362549134e-05, "loss": 2.3232, "step": 347470 }, { "epoch": 0.61, "learning_rate": 1.9701831422622308e-05, "loss": 2.3849, "step": 347480 }, { "epoch": 0.61, "learning_rate": 1.970095948269548e-05, "loss": 2.2244, "step": 347490 }, { "epoch": 0.61, "learning_rate": 1.9700087542768656e-05, "loss": 2.2754, "step": 347500 }, { "epoch": 0.61, "learning_rate": 1.969921560284183e-05, "loss": 2.392, "step": 347510 }, { "epoch": 0.61, "learning_rate": 1.9698343662915e-05, "loss": 2.337, "step": 347520 }, { "epoch": 0.61, "learning_rate": 1.9697471722988174e-05, "loss": 2.3556, "step": 347530 }, { "epoch": 0.61, "learning_rate": 1.9696599783061347e-05, "loss": 2.3984, "step": 347540 }, { "epoch": 0.61, "learning_rate": 1.969572784313452e-05, "loss": 2.3359, "step": 347550 }, { "epoch": 0.61, "learning_rate": 1.969485590320769e-05, "loss": 2.3319, "step": 347560 }, { "epoch": 0.61, "learning_rate": 1.9693983963280865e-05, "loss": 2.3353, "step": 347570 }, { "epoch": 0.61, "learning_rate": 1.969311202335404e-05, "loss": 2.3517, "step": 347580 }, { "epoch": 0.61, "learning_rate": 1.9692240083427213e-05, "loss": 2.1911, "step": 347590 }, { "epoch": 0.61, "learning_rate": 1.9691368143500387e-05, "loss": 2.3837, "step": 347600 }, { "epoch": 0.61, "learning_rate": 1.969049620357356e-05, "loss": 2.226, "step": 347610 }, { "epoch": 0.61, "learning_rate": 1.9689624263646734e-05, "loss": 2.3167, "step": 347620 }, { "epoch": 0.61, "learning_rate": 1.9688752323719905e-05, "loss": 2.3305, "step": 347630 }, { "epoch": 0.61, "learning_rate": 1.968788038379308e-05, "loss": 2.4007, "step": 347640 }, { "epoch": 0.61, "learning_rate": 1.9687008443866252e-05, "loss": 2.3188, "step": 347650 }, { "epoch": 0.61, "learning_rate": 1.9686136503939426e-05, "loss": 2.3441, "step": 347660 }, { "epoch": 0.61, "learning_rate": 1.96852645640126e-05, "loss": 2.3455, "step": 347670 }, { "epoch": 0.61, "learning_rate": 1.968439262408577e-05, "loss": 2.4199, "step": 347680 }, { "epoch": 0.61, "learning_rate": 1.9683520684158947e-05, "loss": 2.287, "step": 347690 }, { "epoch": 0.61, "learning_rate": 1.9682648744232118e-05, "loss": 2.3009, "step": 347700 }, { "epoch": 0.61, "learning_rate": 1.968177680430529e-05, "loss": 2.2039, "step": 347710 }, { "epoch": 0.61, "learning_rate": 1.9680904864378465e-05, "loss": 2.3455, "step": 347720 }, { "epoch": 0.61, "learning_rate": 1.968003292445164e-05, "loss": 2.3128, "step": 347730 }, { "epoch": 0.61, "learning_rate": 1.9679160984524813e-05, "loss": 2.244, "step": 347740 }, { "epoch": 0.61, "learning_rate": 1.9678289044597983e-05, "loss": 2.4144, "step": 347750 }, { "epoch": 0.61, "learning_rate": 1.967741710467116e-05, "loss": 2.2185, "step": 347760 }, { "epoch": 0.61, "learning_rate": 1.967654516474433e-05, "loss": 2.3596, "step": 347770 }, { "epoch": 0.61, "learning_rate": 1.9675673224817504e-05, "loss": 2.2852, "step": 347780 }, { "epoch": 0.61, "learning_rate": 1.9674801284890675e-05, "loss": 2.2967, "step": 347790 }, { "epoch": 0.61, "learning_rate": 1.9673929344963852e-05, "loss": 2.4546, "step": 347800 }, { "epoch": 0.61, "learning_rate": 1.9673057405037022e-05, "loss": 2.2723, "step": 347810 }, { "epoch": 0.61, "learning_rate": 1.9672185465110196e-05, "loss": 2.3837, "step": 347820 }, { "epoch": 0.61, "learning_rate": 1.967131352518337e-05, "loss": 2.2945, "step": 347830 }, { "epoch": 0.61, "learning_rate": 1.9670441585256544e-05, "loss": 2.2507, "step": 347840 }, { "epoch": 0.61, "learning_rate": 1.9669569645329717e-05, "loss": 2.3858, "step": 347850 }, { "epoch": 0.61, "learning_rate": 1.9668697705402888e-05, "loss": 2.4893, "step": 347860 }, { "epoch": 0.61, "learning_rate": 1.9667825765476065e-05, "loss": 2.2585, "step": 347870 }, { "epoch": 0.61, "learning_rate": 1.9666953825549235e-05, "loss": 2.456, "step": 347880 }, { "epoch": 0.61, "learning_rate": 1.966608188562241e-05, "loss": 2.3968, "step": 347890 }, { "epoch": 0.61, "learning_rate": 1.9665209945695583e-05, "loss": 2.2927, "step": 347900 }, { "epoch": 0.61, "learning_rate": 1.9664338005768757e-05, "loss": 2.1929, "step": 347910 }, { "epoch": 0.61, "learning_rate": 1.966346606584193e-05, "loss": 2.3806, "step": 347920 }, { "epoch": 0.61, "learning_rate": 1.96625941259151e-05, "loss": 2.3464, "step": 347930 }, { "epoch": 0.61, "learning_rate": 1.9661722185988274e-05, "loss": 2.2692, "step": 347940 }, { "epoch": 0.61, "learning_rate": 1.9660850246061448e-05, "loss": 2.2956, "step": 347950 }, { "epoch": 0.61, "learning_rate": 1.9659978306134622e-05, "loss": 2.3268, "step": 347960 }, { "epoch": 0.61, "learning_rate": 1.9659106366207792e-05, "loss": 2.3439, "step": 347970 }, { "epoch": 0.61, "learning_rate": 1.965823442628097e-05, "loss": 2.1618, "step": 347980 }, { "epoch": 0.61, "learning_rate": 1.9657362486354143e-05, "loss": 2.3664, "step": 347990 }, { "epoch": 0.61, "learning_rate": 1.9656490546427314e-05, "loss": 2.4143, "step": 348000 }, { "epoch": 0.61, "learning_rate": 1.9655618606500487e-05, "loss": 2.3302, "step": 348010 }, { "epoch": 0.61, "learning_rate": 1.965474666657366e-05, "loss": 2.512, "step": 348020 }, { "epoch": 0.61, "learning_rate": 1.9653874726646835e-05, "loss": 2.2961, "step": 348030 }, { "epoch": 0.61, "learning_rate": 1.9653002786720005e-05, "loss": 2.33, "step": 348040 }, { "epoch": 0.61, "learning_rate": 1.965213084679318e-05, "loss": 2.2621, "step": 348050 }, { "epoch": 0.61, "learning_rate": 1.9651258906866353e-05, "loss": 2.2926, "step": 348060 }, { "epoch": 0.61, "learning_rate": 1.9650386966939527e-05, "loss": 2.3802, "step": 348070 }, { "epoch": 0.61, "learning_rate": 1.96495150270127e-05, "loss": 2.273, "step": 348080 }, { "epoch": 0.61, "learning_rate": 1.964864308708587e-05, "loss": 2.3563, "step": 348090 }, { "epoch": 0.61, "learning_rate": 1.9647771147159048e-05, "loss": 2.2456, "step": 348100 }, { "epoch": 0.61, "learning_rate": 1.964689920723222e-05, "loss": 2.2786, "step": 348110 }, { "epoch": 0.61, "learning_rate": 1.9646027267305392e-05, "loss": 2.2797, "step": 348120 }, { "epoch": 0.61, "learning_rate": 1.9645155327378566e-05, "loss": 2.2882, "step": 348130 }, { "epoch": 0.61, "learning_rate": 1.964428338745174e-05, "loss": 2.276, "step": 348140 }, { "epoch": 0.61, "learning_rate": 1.9643411447524913e-05, "loss": 2.2919, "step": 348150 }, { "epoch": 0.61, "learning_rate": 1.9642539507598084e-05, "loss": 2.3483, "step": 348160 }, { "epoch": 0.61, "learning_rate": 1.964166756767126e-05, "loss": 2.3386, "step": 348170 }, { "epoch": 0.61, "learning_rate": 1.964079562774443e-05, "loss": 2.3258, "step": 348180 }, { "epoch": 0.61, "learning_rate": 1.9639923687817605e-05, "loss": 2.4302, "step": 348190 }, { "epoch": 0.61, "learning_rate": 1.9639051747890776e-05, "loss": 2.3778, "step": 348200 }, { "epoch": 0.61, "learning_rate": 1.9638179807963953e-05, "loss": 2.349, "step": 348210 }, { "epoch": 0.61, "learning_rate": 1.9637307868037123e-05, "loss": 2.3031, "step": 348220 }, { "epoch": 0.61, "learning_rate": 1.9636435928110297e-05, "loss": 2.3195, "step": 348230 }, { "epoch": 0.61, "learning_rate": 1.9635563988183474e-05, "loss": 2.2754, "step": 348240 }, { "epoch": 0.61, "learning_rate": 1.9634692048256644e-05, "loss": 2.4747, "step": 348250 }, { "epoch": 0.61, "learning_rate": 1.9633820108329818e-05, "loss": 2.3255, "step": 348260 }, { "epoch": 0.61, "learning_rate": 1.963294816840299e-05, "loss": 2.2432, "step": 348270 }, { "epoch": 0.61, "learning_rate": 1.9632076228476166e-05, "loss": 2.3818, "step": 348280 }, { "epoch": 0.61, "learning_rate": 1.9631204288549336e-05, "loss": 2.3913, "step": 348290 }, { "epoch": 0.61, "learning_rate": 1.963033234862251e-05, "loss": 2.2866, "step": 348300 }, { "epoch": 0.61, "learning_rate": 1.9629460408695684e-05, "loss": 2.4056, "step": 348310 }, { "epoch": 0.61, "learning_rate": 1.9628588468768857e-05, "loss": 2.3573, "step": 348320 }, { "epoch": 0.61, "learning_rate": 1.962771652884203e-05, "loss": 2.411, "step": 348330 }, { "epoch": 0.61, "learning_rate": 1.96268445889152e-05, "loss": 2.287, "step": 348340 }, { "epoch": 0.61, "learning_rate": 1.9625972648988375e-05, "loss": 2.3791, "step": 348350 }, { "epoch": 0.61, "learning_rate": 1.962510070906155e-05, "loss": 2.3293, "step": 348360 }, { "epoch": 0.61, "learning_rate": 1.9624228769134723e-05, "loss": 2.2737, "step": 348370 }, { "epoch": 0.61, "learning_rate": 1.9623356829207897e-05, "loss": 2.2892, "step": 348380 }, { "epoch": 0.61, "learning_rate": 1.962248488928107e-05, "loss": 2.2752, "step": 348390 }, { "epoch": 0.61, "learning_rate": 1.9621612949354244e-05, "loss": 2.3726, "step": 348400 }, { "epoch": 0.61, "learning_rate": 1.9620741009427415e-05, "loss": 2.4426, "step": 348410 }, { "epoch": 0.61, "learning_rate": 1.961986906950059e-05, "loss": 2.355, "step": 348420 }, { "epoch": 0.61, "learning_rate": 1.9618997129573762e-05, "loss": 2.3019, "step": 348430 }, { "epoch": 0.61, "learning_rate": 1.9618125189646936e-05, "loss": 2.4275, "step": 348440 }, { "epoch": 0.61, "learning_rate": 1.9617253249720106e-05, "loss": 2.3699, "step": 348450 }, { "epoch": 0.61, "learning_rate": 1.961638130979328e-05, "loss": 2.4124, "step": 348460 }, { "epoch": 0.61, "learning_rate": 1.9615509369866457e-05, "loss": 2.2578, "step": 348470 }, { "epoch": 0.61, "learning_rate": 1.9614637429939628e-05, "loss": 2.2281, "step": 348480 }, { "epoch": 0.61, "learning_rate": 1.96137654900128e-05, "loss": 2.4282, "step": 348490 }, { "epoch": 0.61, "learning_rate": 1.9612893550085972e-05, "loss": 2.2972, "step": 348500 }, { "epoch": 0.61, "learning_rate": 1.961202161015915e-05, "loss": 2.272, "step": 348510 }, { "epoch": 0.61, "learning_rate": 1.961114967023232e-05, "loss": 2.322, "step": 348520 }, { "epoch": 0.61, "learning_rate": 1.9610277730305493e-05, "loss": 2.309, "step": 348530 }, { "epoch": 0.61, "learning_rate": 1.9609405790378667e-05, "loss": 2.4263, "step": 348540 }, { "epoch": 0.61, "learning_rate": 1.960853385045184e-05, "loss": 2.2665, "step": 348550 }, { "epoch": 0.61, "learning_rate": 1.9607661910525014e-05, "loss": 2.2775, "step": 348560 }, { "epoch": 0.61, "learning_rate": 1.9606789970598185e-05, "loss": 2.4037, "step": 348570 }, { "epoch": 0.61, "learning_rate": 1.9605918030671362e-05, "loss": 2.2849, "step": 348580 }, { "epoch": 0.61, "learning_rate": 1.9605046090744532e-05, "loss": 2.1749, "step": 348590 }, { "epoch": 0.61, "learning_rate": 1.9604174150817706e-05, "loss": 2.2824, "step": 348600 }, { "epoch": 0.61, "learning_rate": 1.960330221089088e-05, "loss": 2.2996, "step": 348610 }, { "epoch": 0.61, "learning_rate": 1.9602430270964054e-05, "loss": 2.3621, "step": 348620 }, { "epoch": 0.61, "learning_rate": 1.9601558331037227e-05, "loss": 2.3527, "step": 348630 }, { "epoch": 0.61, "learning_rate": 1.9600686391110398e-05, "loss": 2.37, "step": 348640 }, { "epoch": 0.61, "learning_rate": 1.9599814451183575e-05, "loss": 2.3497, "step": 348650 }, { "epoch": 0.61, "learning_rate": 1.9598942511256745e-05, "loss": 2.3799, "step": 348660 }, { "epoch": 0.61, "learning_rate": 1.959807057132992e-05, "loss": 2.4079, "step": 348670 }, { "epoch": 0.61, "learning_rate": 1.959719863140309e-05, "loss": 2.2183, "step": 348680 }, { "epoch": 0.61, "learning_rate": 1.9596326691476267e-05, "loss": 2.327, "step": 348690 }, { "epoch": 0.61, "learning_rate": 1.9595454751549437e-05, "loss": 2.3553, "step": 348700 }, { "epoch": 0.61, "learning_rate": 1.959458281162261e-05, "loss": 2.327, "step": 348710 }, { "epoch": 0.61, "learning_rate": 1.9593710871695784e-05, "loss": 2.3447, "step": 348720 }, { "epoch": 0.61, "learning_rate": 1.9592838931768958e-05, "loss": 2.3492, "step": 348730 }, { "epoch": 0.61, "learning_rate": 1.9591966991842132e-05, "loss": 2.4688, "step": 348740 }, { "epoch": 0.61, "learning_rate": 1.9591095051915302e-05, "loss": 2.3513, "step": 348750 }, { "epoch": 0.61, "learning_rate": 1.9590223111988476e-05, "loss": 2.3032, "step": 348760 }, { "epoch": 0.61, "learning_rate": 1.958935117206165e-05, "loss": 2.2229, "step": 348770 }, { "epoch": 0.61, "learning_rate": 1.9588479232134824e-05, "loss": 2.2768, "step": 348780 }, { "epoch": 0.61, "learning_rate": 1.9587607292207997e-05, "loss": 2.3722, "step": 348790 }, { "epoch": 0.61, "learning_rate": 1.958673535228117e-05, "loss": 2.3316, "step": 348800 }, { "epoch": 0.61, "learning_rate": 1.9585863412354345e-05, "loss": 2.3506, "step": 348810 }, { "epoch": 0.61, "learning_rate": 1.9584991472427515e-05, "loss": 2.4009, "step": 348820 }, { "epoch": 0.61, "learning_rate": 1.958411953250069e-05, "loss": 2.0419, "step": 348830 }, { "epoch": 0.61, "learning_rate": 1.9583247592573863e-05, "loss": 2.3824, "step": 348840 }, { "epoch": 0.61, "learning_rate": 1.9582375652647037e-05, "loss": 2.3764, "step": 348850 }, { "epoch": 0.61, "learning_rate": 1.958150371272021e-05, "loss": 2.3366, "step": 348860 }, { "epoch": 0.61, "learning_rate": 1.958063177279338e-05, "loss": 2.3342, "step": 348870 }, { "epoch": 0.61, "learning_rate": 1.9579759832866558e-05, "loss": 2.325, "step": 348880 }, { "epoch": 0.61, "learning_rate": 1.957888789293973e-05, "loss": 2.216, "step": 348890 }, { "epoch": 0.61, "learning_rate": 1.9578015953012902e-05, "loss": 2.2386, "step": 348900 }, { "epoch": 0.61, "learning_rate": 1.9577144013086076e-05, "loss": 2.2859, "step": 348910 }, { "epoch": 0.61, "learning_rate": 1.957627207315925e-05, "loss": 2.2315, "step": 348920 }, { "epoch": 0.61, "learning_rate": 1.957540013323242e-05, "loss": 2.3445, "step": 348930 }, { "epoch": 0.61, "learning_rate": 1.9574528193305594e-05, "loss": 2.2692, "step": 348940 }, { "epoch": 0.61, "learning_rate": 1.9573656253378768e-05, "loss": 2.3105, "step": 348950 }, { "epoch": 0.61, "learning_rate": 1.957278431345194e-05, "loss": 2.2728, "step": 348960 }, { "epoch": 0.61, "learning_rate": 1.9571912373525115e-05, "loss": 2.2129, "step": 348970 }, { "epoch": 0.61, "learning_rate": 1.9571040433598286e-05, "loss": 2.3371, "step": 348980 }, { "epoch": 0.61, "learning_rate": 1.9570168493671463e-05, "loss": 2.2979, "step": 348990 }, { "epoch": 0.61, "learning_rate": 1.9569296553744633e-05, "loss": 2.2564, "step": 349000 }, { "epoch": 0.61, "learning_rate": 1.9568424613817807e-05, "loss": 2.3352, "step": 349010 }, { "epoch": 0.61, "learning_rate": 1.956755267389098e-05, "loss": 2.4582, "step": 349020 }, { "epoch": 0.61, "learning_rate": 1.9566680733964154e-05, "loss": 2.2205, "step": 349030 }, { "epoch": 0.61, "learning_rate": 1.9565808794037328e-05, "loss": 2.3509, "step": 349040 }, { "epoch": 0.61, "learning_rate": 1.95649368541105e-05, "loss": 2.3805, "step": 349050 }, { "epoch": 0.61, "learning_rate": 1.9564064914183676e-05, "loss": 2.4035, "step": 349060 }, { "epoch": 0.61, "learning_rate": 1.9563192974256846e-05, "loss": 2.269, "step": 349070 }, { "epoch": 0.61, "learning_rate": 1.956232103433002e-05, "loss": 2.3075, "step": 349080 }, { "epoch": 0.61, "learning_rate": 1.9561449094403194e-05, "loss": 2.303, "step": 349090 }, { "epoch": 0.61, "learning_rate": 1.9560577154476367e-05, "loss": 2.3936, "step": 349100 }, { "epoch": 0.61, "learning_rate": 1.955970521454954e-05, "loss": 2.3648, "step": 349110 }, { "epoch": 0.61, "learning_rate": 1.955883327462271e-05, "loss": 2.3141, "step": 349120 }, { "epoch": 0.61, "learning_rate": 1.9557961334695885e-05, "loss": 2.3761, "step": 349130 }, { "epoch": 0.61, "learning_rate": 1.955708939476906e-05, "loss": 2.3388, "step": 349140 }, { "epoch": 0.61, "learning_rate": 1.9556217454842233e-05, "loss": 2.3792, "step": 349150 }, { "epoch": 0.61, "learning_rate": 1.9555345514915403e-05, "loss": 2.2915, "step": 349160 }, { "epoch": 0.61, "learning_rate": 1.955447357498858e-05, "loss": 2.4534, "step": 349170 }, { "epoch": 0.61, "learning_rate": 1.955360163506175e-05, "loss": 2.3321, "step": 349180 }, { "epoch": 0.61, "learning_rate": 1.9552729695134925e-05, "loss": 2.3133, "step": 349190 }, { "epoch": 0.61, "learning_rate": 1.95518577552081e-05, "loss": 2.3149, "step": 349200 }, { "epoch": 0.61, "learning_rate": 1.9550985815281272e-05, "loss": 2.3567, "step": 349210 }, { "epoch": 0.61, "learning_rate": 1.9550113875354446e-05, "loss": 2.4076, "step": 349220 }, { "epoch": 0.61, "learning_rate": 1.9549241935427616e-05, "loss": 2.4255, "step": 349230 }, { "epoch": 0.61, "learning_rate": 1.954836999550079e-05, "loss": 2.3211, "step": 349240 }, { "epoch": 0.61, "learning_rate": 1.9547498055573964e-05, "loss": 2.313, "step": 349250 }, { "epoch": 0.61, "learning_rate": 1.9546626115647138e-05, "loss": 2.3468, "step": 349260 }, { "epoch": 0.61, "learning_rate": 1.954575417572031e-05, "loss": 2.2666, "step": 349270 }, { "epoch": 0.61, "learning_rate": 1.9544882235793482e-05, "loss": 2.3386, "step": 349280 }, { "epoch": 0.61, "learning_rate": 1.954401029586666e-05, "loss": 2.3637, "step": 349290 }, { "epoch": 0.61, "learning_rate": 1.954313835593983e-05, "loss": 2.2094, "step": 349300 }, { "epoch": 0.61, "learning_rate": 1.9542266416013003e-05, "loss": 2.4036, "step": 349310 }, { "epoch": 0.61, "learning_rate": 1.9541394476086177e-05, "loss": 2.291, "step": 349320 }, { "epoch": 0.61, "learning_rate": 1.954052253615935e-05, "loss": 2.2336, "step": 349330 }, { "epoch": 0.61, "learning_rate": 1.9539650596232524e-05, "loss": 2.3563, "step": 349340 }, { "epoch": 0.61, "learning_rate": 1.9538778656305695e-05, "loss": 2.2398, "step": 349350 }, { "epoch": 0.61, "learning_rate": 1.9537906716378872e-05, "loss": 2.3627, "step": 349360 }, { "epoch": 0.61, "learning_rate": 1.9537034776452042e-05, "loss": 2.4278, "step": 349370 }, { "epoch": 0.61, "learning_rate": 1.9536162836525216e-05, "loss": 2.3921, "step": 349380 }, { "epoch": 0.61, "learning_rate": 1.9535290896598386e-05, "loss": 2.4734, "step": 349390 }, { "epoch": 0.61, "learning_rate": 1.9534418956671564e-05, "loss": 2.3355, "step": 349400 }, { "epoch": 0.61, "learning_rate": 1.9533547016744734e-05, "loss": 2.3774, "step": 349410 }, { "epoch": 0.61, "learning_rate": 1.9532675076817908e-05, "loss": 2.3457, "step": 349420 }, { "epoch": 0.61, "learning_rate": 1.953180313689108e-05, "loss": 2.3699, "step": 349430 }, { "epoch": 0.61, "learning_rate": 1.9530931196964255e-05, "loss": 2.3234, "step": 349440 }, { "epoch": 0.61, "learning_rate": 1.953005925703743e-05, "loss": 2.3493, "step": 349450 }, { "epoch": 0.61, "learning_rate": 1.95291873171106e-05, "loss": 2.199, "step": 349460 }, { "epoch": 0.61, "learning_rate": 1.9528315377183777e-05, "loss": 2.324, "step": 349470 }, { "epoch": 0.61, "learning_rate": 1.9527443437256947e-05, "loss": 2.164, "step": 349480 }, { "epoch": 0.61, "learning_rate": 1.952657149733012e-05, "loss": 2.2705, "step": 349490 }, { "epoch": 0.61, "learning_rate": 1.9525699557403294e-05, "loss": 2.3047, "step": 349500 }, { "epoch": 0.61, "learning_rate": 1.9524827617476468e-05, "loss": 2.3124, "step": 349510 }, { "epoch": 0.61, "learning_rate": 1.9523955677549642e-05, "loss": 2.3952, "step": 349520 }, { "epoch": 0.61, "learning_rate": 1.9523083737622812e-05, "loss": 2.2955, "step": 349530 }, { "epoch": 0.61, "learning_rate": 1.9522211797695986e-05, "loss": 2.4372, "step": 349540 }, { "epoch": 0.61, "learning_rate": 1.952133985776916e-05, "loss": 2.3494, "step": 349550 }, { "epoch": 0.61, "learning_rate": 1.9520467917842334e-05, "loss": 2.3329, "step": 349560 }, { "epoch": 0.61, "learning_rate": 1.9519595977915504e-05, "loss": 2.419, "step": 349570 }, { "epoch": 0.61, "learning_rate": 1.951872403798868e-05, "loss": 2.3673, "step": 349580 }, { "epoch": 0.61, "learning_rate": 1.9517852098061855e-05, "loss": 2.1396, "step": 349590 }, { "epoch": 0.61, "learning_rate": 1.9516980158135025e-05, "loss": 2.3331, "step": 349600 }, { "epoch": 0.61, "learning_rate": 1.95161082182082e-05, "loss": 2.3822, "step": 349610 }, { "epoch": 0.61, "learning_rate": 1.9515236278281373e-05, "loss": 2.251, "step": 349620 }, { "epoch": 0.61, "learning_rate": 1.9514364338354547e-05, "loss": 2.318, "step": 349630 }, { "epoch": 0.61, "learning_rate": 1.9513492398427717e-05, "loss": 2.3445, "step": 349640 }, { "epoch": 0.61, "learning_rate": 1.951262045850089e-05, "loss": 2.2983, "step": 349650 }, { "epoch": 0.61, "learning_rate": 1.9511748518574065e-05, "loss": 2.4103, "step": 349660 }, { "epoch": 0.61, "learning_rate": 1.951087657864724e-05, "loss": 2.3641, "step": 349670 }, { "epoch": 0.61, "learning_rate": 1.9510004638720412e-05, "loss": 2.2944, "step": 349680 }, { "epoch": 0.61, "learning_rate": 1.9509132698793583e-05, "loss": 2.3306, "step": 349690 }, { "epoch": 0.61, "learning_rate": 1.950826075886676e-05, "loss": 2.3027, "step": 349700 }, { "epoch": 0.61, "learning_rate": 1.950738881893993e-05, "loss": 2.466, "step": 349710 }, { "epoch": 0.61, "learning_rate": 1.9506516879013104e-05, "loss": 2.2951, "step": 349720 }, { "epoch": 0.61, "learning_rate": 1.9505644939086278e-05, "loss": 2.304, "step": 349730 }, { "epoch": 0.61, "learning_rate": 1.950477299915945e-05, "loss": 2.3558, "step": 349740 }, { "epoch": 0.61, "learning_rate": 1.9503901059232625e-05, "loss": 2.2496, "step": 349750 }, { "epoch": 0.61, "learning_rate": 1.9503029119305796e-05, "loss": 2.3607, "step": 349760 }, { "epoch": 0.61, "learning_rate": 1.9502157179378973e-05, "loss": 2.3063, "step": 349770 }, { "epoch": 0.61, "learning_rate": 1.9501285239452143e-05, "loss": 2.2634, "step": 349780 }, { "epoch": 0.61, "learning_rate": 1.9500413299525317e-05, "loss": 2.3102, "step": 349790 }, { "epoch": 0.61, "learning_rate": 1.9499541359598487e-05, "loss": 2.3108, "step": 349800 }, { "epoch": 0.61, "learning_rate": 1.9498669419671664e-05, "loss": 2.4283, "step": 349810 }, { "epoch": 0.61, "learning_rate": 1.9497797479744838e-05, "loss": 2.4004, "step": 349820 }, { "epoch": 0.61, "learning_rate": 1.949692553981801e-05, "loss": 2.3697, "step": 349830 }, { "epoch": 0.61, "learning_rate": 1.9496053599891186e-05, "loss": 2.3559, "step": 349840 }, { "epoch": 0.61, "learning_rate": 1.9495181659964356e-05, "loss": 2.3386, "step": 349850 }, { "epoch": 0.61, "learning_rate": 1.949430972003753e-05, "loss": 2.2405, "step": 349860 }, { "epoch": 0.61, "learning_rate": 1.94934377801107e-05, "loss": 2.3326, "step": 349870 }, { "epoch": 0.61, "learning_rate": 1.9492565840183877e-05, "loss": 2.2626, "step": 349880 }, { "epoch": 0.61, "learning_rate": 1.9491693900257048e-05, "loss": 2.377, "step": 349890 }, { "epoch": 0.61, "learning_rate": 1.949082196033022e-05, "loss": 2.3445, "step": 349900 }, { "epoch": 0.61, "learning_rate": 1.9489950020403395e-05, "loss": 2.3623, "step": 349910 }, { "epoch": 0.61, "learning_rate": 1.948907808047657e-05, "loss": 2.3185, "step": 349920 }, { "epoch": 0.61, "learning_rate": 1.9488206140549743e-05, "loss": 2.288, "step": 349930 }, { "epoch": 0.61, "learning_rate": 1.9487334200622913e-05, "loss": 2.3298, "step": 349940 }, { "epoch": 0.61, "learning_rate": 1.9486462260696087e-05, "loss": 2.3724, "step": 349950 }, { "epoch": 0.61, "learning_rate": 1.948559032076926e-05, "loss": 2.4181, "step": 349960 }, { "epoch": 0.61, "learning_rate": 1.9484718380842435e-05, "loss": 2.292, "step": 349970 }, { "epoch": 0.61, "learning_rate": 1.948384644091561e-05, "loss": 2.3761, "step": 349980 }, { "epoch": 0.61, "learning_rate": 1.9482974500988782e-05, "loss": 2.4397, "step": 349990 }, { "epoch": 0.61, "learning_rate": 1.9482102561061956e-05, "loss": 2.2869, "step": 350000 }, { "epoch": 0.61, "learning_rate": 1.9481230621135126e-05, "loss": 2.3066, "step": 350010 }, { "epoch": 0.61, "learning_rate": 1.94803586812083e-05, "loss": 2.2536, "step": 350020 }, { "epoch": 0.61, "learning_rate": 1.9479486741281474e-05, "loss": 2.2964, "step": 350030 }, { "epoch": 0.61, "learning_rate": 1.9478614801354648e-05, "loss": 2.3702, "step": 350040 }, { "epoch": 0.61, "learning_rate": 1.9477742861427818e-05, "loss": 2.3325, "step": 350050 }, { "epoch": 0.61, "learning_rate": 1.9476870921500992e-05, "loss": 2.2463, "step": 350060 }, { "epoch": 0.61, "learning_rate": 1.947599898157417e-05, "loss": 2.3833, "step": 350070 }, { "epoch": 0.61, "learning_rate": 1.947512704164734e-05, "loss": 2.3213, "step": 350080 }, { "epoch": 0.61, "learning_rate": 1.9474255101720513e-05, "loss": 2.3684, "step": 350090 }, { "epoch": 0.61, "learning_rate": 1.9473383161793687e-05, "loss": 2.2684, "step": 350100 }, { "epoch": 0.61, "learning_rate": 1.947251122186686e-05, "loss": 2.2435, "step": 350110 }, { "epoch": 0.61, "learning_rate": 1.947163928194003e-05, "loss": 2.2816, "step": 350120 }, { "epoch": 0.61, "learning_rate": 1.9470767342013205e-05, "loss": 2.3061, "step": 350130 }, { "epoch": 0.61, "learning_rate": 1.946989540208638e-05, "loss": 2.3099, "step": 350140 }, { "epoch": 0.61, "learning_rate": 1.9469023462159552e-05, "loss": 2.279, "step": 350150 }, { "epoch": 0.61, "learning_rate": 1.9468151522232726e-05, "loss": 2.2579, "step": 350160 }, { "epoch": 0.61, "learning_rate": 1.9467279582305896e-05, "loss": 2.1981, "step": 350170 }, { "epoch": 0.61, "learning_rate": 1.9466407642379074e-05, "loss": 2.3007, "step": 350180 }, { "epoch": 0.61, "learning_rate": 1.9465535702452244e-05, "loss": 2.315, "step": 350190 }, { "epoch": 0.61, "learning_rate": 1.9464663762525418e-05, "loss": 2.3292, "step": 350200 }, { "epoch": 0.61, "learning_rate": 1.946379182259859e-05, "loss": 2.3366, "step": 350210 }, { "epoch": 0.61, "learning_rate": 1.9462919882671765e-05, "loss": 2.2502, "step": 350220 }, { "epoch": 0.61, "learning_rate": 1.946204794274494e-05, "loss": 2.3167, "step": 350230 }, { "epoch": 0.61, "learning_rate": 1.946117600281811e-05, "loss": 2.2639, "step": 350240 }, { "epoch": 0.61, "learning_rate": 1.9460304062891287e-05, "loss": 2.1478, "step": 350250 }, { "epoch": 0.61, "learning_rate": 1.9459432122964457e-05, "loss": 2.4136, "step": 350260 }, { "epoch": 0.61, "learning_rate": 1.945856018303763e-05, "loss": 2.2898, "step": 350270 }, { "epoch": 0.61, "learning_rate": 1.94576882431108e-05, "loss": 2.2185, "step": 350280 }, { "epoch": 0.61, "learning_rate": 1.9456816303183978e-05, "loss": 2.2606, "step": 350290 }, { "epoch": 0.61, "learning_rate": 1.945594436325715e-05, "loss": 2.2317, "step": 350300 }, { "epoch": 0.61, "learning_rate": 1.9455072423330322e-05, "loss": 2.3401, "step": 350310 }, { "epoch": 0.61, "learning_rate": 1.9454200483403496e-05, "loss": 2.2712, "step": 350320 }, { "epoch": 0.61, "learning_rate": 1.945332854347667e-05, "loss": 2.2536, "step": 350330 }, { "epoch": 0.61, "learning_rate": 1.9452456603549844e-05, "loss": 2.2444, "step": 350340 }, { "epoch": 0.61, "learning_rate": 1.9451584663623014e-05, "loss": 2.4018, "step": 350350 }, { "epoch": 0.61, "learning_rate": 1.9450712723696188e-05, "loss": 2.4143, "step": 350360 }, { "epoch": 0.61, "learning_rate": 1.944984078376936e-05, "loss": 2.3022, "step": 350370 }, { "epoch": 0.61, "learning_rate": 1.9448968843842535e-05, "loss": 2.3292, "step": 350380 }, { "epoch": 0.61, "learning_rate": 1.944809690391571e-05, "loss": 2.3109, "step": 350390 }, { "epoch": 0.61, "learning_rate": 1.9447224963988883e-05, "loss": 2.384, "step": 350400 }, { "epoch": 0.61, "learning_rate": 1.9446353024062057e-05, "loss": 2.2911, "step": 350410 }, { "epoch": 0.61, "learning_rate": 1.9445481084135227e-05, "loss": 2.4595, "step": 350420 }, { "epoch": 0.61, "learning_rate": 1.94446091442084e-05, "loss": 2.2783, "step": 350430 }, { "epoch": 0.61, "learning_rate": 1.9443737204281575e-05, "loss": 2.3116, "step": 350440 }, { "epoch": 0.61, "learning_rate": 1.944286526435475e-05, "loss": 2.2664, "step": 350450 }, { "epoch": 0.61, "learning_rate": 1.9441993324427922e-05, "loss": 2.3772, "step": 350460 }, { "epoch": 0.61, "learning_rate": 1.9441121384501093e-05, "loss": 2.2903, "step": 350470 }, { "epoch": 0.61, "learning_rate": 1.944024944457427e-05, "loss": 2.3432, "step": 350480 }, { "epoch": 0.61, "learning_rate": 1.943937750464744e-05, "loss": 2.355, "step": 350490 }, { "epoch": 0.61, "learning_rate": 1.9438505564720614e-05, "loss": 2.2968, "step": 350500 }, { "epoch": 0.61, "learning_rate": 1.9437633624793788e-05, "loss": 2.3936, "step": 350510 }, { "epoch": 0.61, "learning_rate": 1.943676168486696e-05, "loss": 2.3697, "step": 350520 }, { "epoch": 0.61, "learning_rate": 1.9435889744940132e-05, "loss": 2.2605, "step": 350530 }, { "epoch": 0.61, "learning_rate": 1.9435017805013306e-05, "loss": 2.3863, "step": 350540 }, { "epoch": 0.61, "learning_rate": 1.9434145865086483e-05, "loss": 2.3672, "step": 350550 }, { "epoch": 0.61, "learning_rate": 1.9433273925159653e-05, "loss": 2.3713, "step": 350560 }, { "epoch": 0.61, "learning_rate": 1.9432401985232827e-05, "loss": 2.2939, "step": 350570 }, { "epoch": 0.61, "learning_rate": 1.9431530045305997e-05, "loss": 2.4678, "step": 350580 }, { "epoch": 0.61, "learning_rate": 1.9430658105379174e-05, "loss": 2.3789, "step": 350590 }, { "epoch": 0.61, "learning_rate": 1.9429786165452345e-05, "loss": 2.443, "step": 350600 }, { "epoch": 0.61, "learning_rate": 1.942891422552552e-05, "loss": 2.3315, "step": 350610 }, { "epoch": 0.61, "learning_rate": 1.9428042285598692e-05, "loss": 2.277, "step": 350620 }, { "epoch": 0.61, "learning_rate": 1.9427170345671866e-05, "loss": 2.4399, "step": 350630 }, { "epoch": 0.61, "learning_rate": 1.942629840574504e-05, "loss": 2.3914, "step": 350640 }, { "epoch": 0.61, "learning_rate": 1.942542646581821e-05, "loss": 2.3621, "step": 350650 }, { "epoch": 0.61, "learning_rate": 1.9424554525891387e-05, "loss": 2.3896, "step": 350660 }, { "epoch": 0.61, "learning_rate": 1.9423682585964558e-05, "loss": 2.3994, "step": 350670 }, { "epoch": 0.61, "learning_rate": 1.942281064603773e-05, "loss": 2.4933, "step": 350680 }, { "epoch": 0.61, "learning_rate": 1.9421938706110905e-05, "loss": 2.3857, "step": 350690 }, { "epoch": 0.61, "learning_rate": 1.942106676618408e-05, "loss": 2.3293, "step": 350700 }, { "epoch": 0.61, "learning_rate": 1.9420194826257253e-05, "loss": 2.3531, "step": 350710 }, { "epoch": 0.61, "learning_rate": 1.9419322886330423e-05, "loss": 2.2928, "step": 350720 }, { "epoch": 0.61, "learning_rate": 1.9418450946403597e-05, "loss": 2.2813, "step": 350730 }, { "epoch": 0.61, "learning_rate": 1.941757900647677e-05, "loss": 2.4508, "step": 350740 }, { "epoch": 0.61, "learning_rate": 1.9416707066549945e-05, "loss": 2.4032, "step": 350750 }, { "epoch": 0.61, "learning_rate": 1.9415835126623115e-05, "loss": 2.1607, "step": 350760 }, { "epoch": 0.61, "learning_rate": 1.9414963186696292e-05, "loss": 2.4208, "step": 350770 }, { "epoch": 0.61, "learning_rate": 1.9414091246769462e-05, "loss": 2.2934, "step": 350780 }, { "epoch": 0.61, "learning_rate": 1.9413219306842636e-05, "loss": 2.4268, "step": 350790 }, { "epoch": 0.61, "learning_rate": 1.941234736691581e-05, "loss": 2.3817, "step": 350800 }, { "epoch": 0.61, "learning_rate": 1.9411475426988984e-05, "loss": 2.2679, "step": 350810 }, { "epoch": 0.61, "learning_rate": 1.9410603487062158e-05, "loss": 2.3931, "step": 350820 }, { "epoch": 0.61, "learning_rate": 1.9409731547135328e-05, "loss": 2.3632, "step": 350830 }, { "epoch": 0.61, "learning_rate": 1.9408859607208502e-05, "loss": 2.2648, "step": 350840 }, { "epoch": 0.61, "learning_rate": 1.9407987667281675e-05, "loss": 2.3967, "step": 350850 }, { "epoch": 0.61, "learning_rate": 1.940711572735485e-05, "loss": 2.3237, "step": 350860 }, { "epoch": 0.61, "learning_rate": 1.9406243787428023e-05, "loss": 2.3493, "step": 350870 }, { "epoch": 0.61, "learning_rate": 1.9405371847501193e-05, "loss": 2.3353, "step": 350880 }, { "epoch": 0.61, "learning_rate": 1.940449990757437e-05, "loss": 2.3569, "step": 350890 }, { "epoch": 0.61, "learning_rate": 1.940362796764754e-05, "loss": 2.2781, "step": 350900 }, { "epoch": 0.61, "learning_rate": 1.9402756027720715e-05, "loss": 2.3941, "step": 350910 }, { "epoch": 0.61, "learning_rate": 1.940188408779389e-05, "loss": 2.3126, "step": 350920 }, { "epoch": 0.61, "learning_rate": 1.9401012147867062e-05, "loss": 2.3621, "step": 350930 }, { "epoch": 0.61, "learning_rate": 1.9400140207940236e-05, "loss": 2.2582, "step": 350940 }, { "epoch": 0.61, "learning_rate": 1.9399268268013406e-05, "loss": 2.3525, "step": 350950 }, { "epoch": 0.61, "learning_rate": 1.9398396328086584e-05, "loss": 2.1914, "step": 350960 }, { "epoch": 0.61, "learning_rate": 1.9397524388159754e-05, "loss": 2.3354, "step": 350970 }, { "epoch": 0.61, "learning_rate": 1.9396652448232928e-05, "loss": 2.2848, "step": 350980 }, { "epoch": 0.61, "learning_rate": 1.9395780508306098e-05, "loss": 2.3851, "step": 350990 }, { "epoch": 0.61, "learning_rate": 1.9394908568379275e-05, "loss": 2.3634, "step": 351000 }, { "epoch": 0.61, "learning_rate": 1.9394036628452446e-05, "loss": 2.1852, "step": 351010 }, { "epoch": 0.61, "learning_rate": 1.939316468852562e-05, "loss": 2.2594, "step": 351020 }, { "epoch": 0.61, "learning_rate": 1.9392292748598793e-05, "loss": 2.3555, "step": 351030 }, { "epoch": 0.61, "learning_rate": 1.9391420808671967e-05, "loss": 2.2483, "step": 351040 }, { "epoch": 0.61, "learning_rate": 1.939054886874514e-05, "loss": 2.4466, "step": 351050 }, { "epoch": 0.61, "learning_rate": 1.938967692881831e-05, "loss": 2.311, "step": 351060 }, { "epoch": 0.61, "learning_rate": 1.9388804988891488e-05, "loss": 2.2989, "step": 351070 }, { "epoch": 0.61, "learning_rate": 1.938793304896466e-05, "loss": 2.3503, "step": 351080 }, { "epoch": 0.61, "learning_rate": 1.9387061109037832e-05, "loss": 2.3594, "step": 351090 }, { "epoch": 0.61, "learning_rate": 1.9386189169111006e-05, "loss": 2.1794, "step": 351100 }, { "epoch": 0.61, "learning_rate": 1.938531722918418e-05, "loss": 2.3606, "step": 351110 }, { "epoch": 0.61, "learning_rate": 1.9384445289257354e-05, "loss": 2.3213, "step": 351120 }, { "epoch": 0.61, "learning_rate": 1.9383573349330524e-05, "loss": 2.3079, "step": 351130 }, { "epoch": 0.61, "learning_rate": 1.9382701409403698e-05, "loss": 2.3715, "step": 351140 }, { "epoch": 0.61, "learning_rate": 1.938182946947687e-05, "loss": 2.3533, "step": 351150 }, { "epoch": 0.61, "learning_rate": 1.9380957529550045e-05, "loss": 2.3097, "step": 351160 }, { "epoch": 0.61, "learning_rate": 1.938008558962322e-05, "loss": 2.308, "step": 351170 }, { "epoch": 0.61, "learning_rate": 1.9379213649696393e-05, "loss": 2.4096, "step": 351180 }, { "epoch": 0.61, "learning_rate": 1.9378341709769567e-05, "loss": 2.4192, "step": 351190 }, { "epoch": 0.61, "learning_rate": 1.9377469769842737e-05, "loss": 2.2383, "step": 351200 }, { "epoch": 0.61, "learning_rate": 1.937659782991591e-05, "loss": 2.2369, "step": 351210 }, { "epoch": 0.61, "learning_rate": 1.9375725889989085e-05, "loss": 2.2109, "step": 351220 }, { "epoch": 0.61, "learning_rate": 1.937485395006226e-05, "loss": 2.3387, "step": 351230 }, { "epoch": 0.61, "learning_rate": 1.937398201013543e-05, "loss": 2.312, "step": 351240 }, { "epoch": 0.61, "learning_rate": 1.9373110070208603e-05, "loss": 2.3065, "step": 351250 }, { "epoch": 0.61, "learning_rate": 1.9372238130281776e-05, "loss": 2.5074, "step": 351260 }, { "epoch": 0.61, "learning_rate": 1.937136619035495e-05, "loss": 2.3855, "step": 351270 }, { "epoch": 0.61, "learning_rate": 1.9370494250428124e-05, "loss": 2.2574, "step": 351280 }, { "epoch": 0.61, "learning_rate": 1.9369622310501294e-05, "loss": 2.2938, "step": 351290 }, { "epoch": 0.61, "learning_rate": 1.936875037057447e-05, "loss": 2.3534, "step": 351300 }, { "epoch": 0.61, "learning_rate": 1.9367878430647642e-05, "loss": 2.2647, "step": 351310 }, { "epoch": 0.61, "learning_rate": 1.9367006490720816e-05, "loss": 2.2329, "step": 351320 }, { "epoch": 0.61, "learning_rate": 1.936613455079399e-05, "loss": 2.3117, "step": 351330 }, { "epoch": 0.61, "learning_rate": 1.9365262610867163e-05, "loss": 2.3391, "step": 351340 }, { "epoch": 0.61, "learning_rate": 1.9364390670940337e-05, "loss": 2.2818, "step": 351350 }, { "epoch": 0.61, "learning_rate": 1.9363518731013507e-05, "loss": 2.3501, "step": 351360 }, { "epoch": 0.61, "learning_rate": 1.9362646791086684e-05, "loss": 2.3468, "step": 351370 }, { "epoch": 0.61, "learning_rate": 1.9361774851159855e-05, "loss": 2.3496, "step": 351380 }, { "epoch": 0.61, "learning_rate": 1.936090291123303e-05, "loss": 2.2662, "step": 351390 }, { "epoch": 0.61, "learning_rate": 1.93600309713062e-05, "loss": 2.3161, "step": 351400 }, { "epoch": 0.61, "learning_rate": 1.9359159031379376e-05, "loss": 2.2694, "step": 351410 }, { "epoch": 0.61, "learning_rate": 1.935828709145255e-05, "loss": 2.3888, "step": 351420 }, { "epoch": 0.61, "learning_rate": 1.935741515152572e-05, "loss": 2.4068, "step": 351430 }, { "epoch": 0.61, "learning_rate": 1.9356543211598897e-05, "loss": 2.2384, "step": 351440 }, { "epoch": 0.61, "learning_rate": 1.9355671271672068e-05, "loss": 2.319, "step": 351450 }, { "epoch": 0.61, "learning_rate": 1.935479933174524e-05, "loss": 2.1383, "step": 351460 }, { "epoch": 0.61, "learning_rate": 1.9353927391818412e-05, "loss": 2.3237, "step": 351470 }, { "epoch": 0.61, "learning_rate": 1.935305545189159e-05, "loss": 2.3531, "step": 351480 }, { "epoch": 0.61, "learning_rate": 1.935218351196476e-05, "loss": 2.4745, "step": 351490 }, { "epoch": 0.61, "learning_rate": 1.9351311572037933e-05, "loss": 2.3462, "step": 351500 }, { "epoch": 0.61, "learning_rate": 1.9350439632111107e-05, "loss": 2.3345, "step": 351510 }, { "epoch": 0.61, "learning_rate": 1.934956769218428e-05, "loss": 2.1794, "step": 351520 }, { "epoch": 0.61, "learning_rate": 1.9348695752257455e-05, "loss": 2.3027, "step": 351530 }, { "epoch": 0.61, "learning_rate": 1.9347823812330625e-05, "loss": 2.3702, "step": 351540 }, { "epoch": 0.61, "learning_rate": 1.93469518724038e-05, "loss": 2.4399, "step": 351550 }, { "epoch": 0.61, "learning_rate": 1.9346079932476973e-05, "loss": 2.3612, "step": 351560 }, { "epoch": 0.61, "learning_rate": 1.9345207992550146e-05, "loss": 2.2329, "step": 351570 }, { "epoch": 0.61, "learning_rate": 1.934433605262332e-05, "loss": 2.3537, "step": 351580 }, { "epoch": 0.61, "learning_rate": 1.9343464112696494e-05, "loss": 2.2603, "step": 351590 }, { "epoch": 0.61, "learning_rate": 1.9342592172769668e-05, "loss": 2.338, "step": 351600 }, { "epoch": 0.61, "learning_rate": 1.9341720232842838e-05, "loss": 2.3767, "step": 351610 }, { "epoch": 0.61, "learning_rate": 1.9340848292916012e-05, "loss": 2.1545, "step": 351620 }, { "epoch": 0.61, "learning_rate": 1.9339976352989186e-05, "loss": 2.4031, "step": 351630 }, { "epoch": 0.61, "learning_rate": 1.933910441306236e-05, "loss": 2.5121, "step": 351640 }, { "epoch": 0.61, "learning_rate": 1.933823247313553e-05, "loss": 2.3664, "step": 351650 }, { "epoch": 0.61, "learning_rate": 1.9337360533208703e-05, "loss": 2.243, "step": 351660 }, { "epoch": 0.61, "learning_rate": 1.933648859328188e-05, "loss": 2.2896, "step": 351670 }, { "epoch": 0.61, "learning_rate": 1.933561665335505e-05, "loss": 2.3792, "step": 351680 }, { "epoch": 0.61, "learning_rate": 1.9334744713428225e-05, "loss": 2.1943, "step": 351690 }, { "epoch": 0.61, "learning_rate": 1.93338727735014e-05, "loss": 2.4077, "step": 351700 }, { "epoch": 0.61, "learning_rate": 1.9333000833574572e-05, "loss": 2.186, "step": 351710 }, { "epoch": 0.61, "learning_rate": 1.9332128893647743e-05, "loss": 2.2958, "step": 351720 }, { "epoch": 0.61, "learning_rate": 1.9331256953720916e-05, "loss": 2.3836, "step": 351730 }, { "epoch": 0.61, "learning_rate": 1.933038501379409e-05, "loss": 2.2563, "step": 351740 }, { "epoch": 0.61, "learning_rate": 1.9329513073867264e-05, "loss": 2.3357, "step": 351750 }, { "epoch": 0.61, "learning_rate": 1.9328641133940438e-05, "loss": 2.3468, "step": 351760 }, { "epoch": 0.61, "learning_rate": 1.9327769194013608e-05, "loss": 2.36, "step": 351770 }, { "epoch": 0.61, "learning_rate": 1.9326897254086785e-05, "loss": 2.3806, "step": 351780 }, { "epoch": 0.61, "learning_rate": 1.9326025314159956e-05, "loss": 2.3949, "step": 351790 }, { "epoch": 0.61, "learning_rate": 1.932515337423313e-05, "loss": 2.3161, "step": 351800 }, { "epoch": 0.61, "learning_rate": 1.9324281434306303e-05, "loss": 2.3753, "step": 351810 }, { "epoch": 0.61, "learning_rate": 1.9323409494379477e-05, "loss": 2.4087, "step": 351820 }, { "epoch": 0.61, "learning_rate": 1.932253755445265e-05, "loss": 2.4001, "step": 351830 }, { "epoch": 0.61, "learning_rate": 1.932166561452582e-05, "loss": 2.3471, "step": 351840 }, { "epoch": 0.61, "learning_rate": 1.9320793674598998e-05, "loss": 2.3621, "step": 351850 }, { "epoch": 0.61, "learning_rate": 1.931992173467217e-05, "loss": 2.2435, "step": 351860 }, { "epoch": 0.61, "learning_rate": 1.9319049794745342e-05, "loss": 2.3931, "step": 351870 }, { "epoch": 0.61, "learning_rate": 1.9318177854818513e-05, "loss": 2.339, "step": 351880 }, { "epoch": 0.61, "learning_rate": 1.931730591489169e-05, "loss": 2.2032, "step": 351890 }, { "epoch": 0.61, "learning_rate": 1.9316433974964864e-05, "loss": 2.4309, "step": 351900 }, { "epoch": 0.61, "learning_rate": 1.9315562035038034e-05, "loss": 2.3995, "step": 351910 }, { "epoch": 0.61, "learning_rate": 1.9314690095111208e-05, "loss": 2.5287, "step": 351920 }, { "epoch": 0.61, "learning_rate": 1.931381815518438e-05, "loss": 2.3346, "step": 351930 }, { "epoch": 0.61, "learning_rate": 1.9312946215257555e-05, "loss": 2.31, "step": 351940 }, { "epoch": 0.61, "learning_rate": 1.9312074275330726e-05, "loss": 2.2544, "step": 351950 }, { "epoch": 0.61, "learning_rate": 1.93112023354039e-05, "loss": 2.2731, "step": 351960 }, { "epoch": 0.61, "learning_rate": 1.9310330395477073e-05, "loss": 2.309, "step": 351970 }, { "epoch": 0.61, "learning_rate": 1.9309458455550247e-05, "loss": 2.2533, "step": 351980 }, { "epoch": 0.61, "learning_rate": 1.930858651562342e-05, "loss": 2.3054, "step": 351990 }, { "epoch": 0.61, "learning_rate": 1.9307714575696595e-05, "loss": 2.3289, "step": 352000 }, { "epoch": 0.61, "learning_rate": 1.930684263576977e-05, "loss": 2.3502, "step": 352010 }, { "epoch": 0.61, "learning_rate": 1.930597069584294e-05, "loss": 2.2713, "step": 352020 }, { "epoch": 0.61, "learning_rate": 1.9305098755916113e-05, "loss": 2.2883, "step": 352030 }, { "epoch": 0.61, "learning_rate": 1.9304226815989286e-05, "loss": 2.3939, "step": 352040 }, { "epoch": 0.61, "learning_rate": 1.930335487606246e-05, "loss": 2.3443, "step": 352050 }, { "epoch": 0.61, "learning_rate": 1.9302482936135634e-05, "loss": 2.3718, "step": 352060 }, { "epoch": 0.61, "learning_rate": 1.9301610996208804e-05, "loss": 2.2931, "step": 352070 }, { "epoch": 0.61, "learning_rate": 1.930073905628198e-05, "loss": 2.3151, "step": 352080 }, { "epoch": 0.61, "learning_rate": 1.9299867116355152e-05, "loss": 2.3586, "step": 352090 }, { "epoch": 0.61, "learning_rate": 1.9298995176428326e-05, "loss": 2.1977, "step": 352100 }, { "epoch": 0.61, "learning_rate": 1.92981232365015e-05, "loss": 2.3279, "step": 352110 }, { "epoch": 0.61, "learning_rate": 1.9297251296574673e-05, "loss": 2.3613, "step": 352120 }, { "epoch": 0.61, "learning_rate": 1.9296379356647844e-05, "loss": 2.2524, "step": 352130 }, { "epoch": 0.61, "learning_rate": 1.9295507416721017e-05, "loss": 2.2632, "step": 352140 }, { "epoch": 0.61, "learning_rate": 1.9294635476794194e-05, "loss": 2.3043, "step": 352150 }, { "epoch": 0.61, "learning_rate": 1.9293763536867365e-05, "loss": 2.4222, "step": 352160 }, { "epoch": 0.61, "learning_rate": 1.929289159694054e-05, "loss": 2.3303, "step": 352170 }, { "epoch": 0.61, "learning_rate": 1.929201965701371e-05, "loss": 2.3124, "step": 352180 }, { "epoch": 0.61, "learning_rate": 1.9291147717086886e-05, "loss": 2.2757, "step": 352190 }, { "epoch": 0.61, "learning_rate": 1.9290275777160057e-05, "loss": 2.2246, "step": 352200 }, { "epoch": 0.61, "learning_rate": 1.928940383723323e-05, "loss": 2.3697, "step": 352210 }, { "epoch": 0.61, "learning_rate": 1.9288531897306404e-05, "loss": 2.2523, "step": 352220 }, { "epoch": 0.61, "learning_rate": 1.9287659957379578e-05, "loss": 2.2326, "step": 352230 }, { "epoch": 0.61, "learning_rate": 1.928678801745275e-05, "loss": 2.3909, "step": 352240 }, { "epoch": 0.61, "learning_rate": 1.9285916077525922e-05, "loss": 2.3627, "step": 352250 }, { "epoch": 0.61, "learning_rate": 1.92850441375991e-05, "loss": 2.2352, "step": 352260 }, { "epoch": 0.61, "learning_rate": 1.928417219767227e-05, "loss": 2.3287, "step": 352270 }, { "epoch": 0.61, "learning_rate": 1.9283300257745443e-05, "loss": 2.3373, "step": 352280 }, { "epoch": 0.61, "learning_rate": 1.9282428317818617e-05, "loss": 2.2982, "step": 352290 }, { "epoch": 0.61, "learning_rate": 1.928155637789179e-05, "loss": 2.3906, "step": 352300 }, { "epoch": 0.61, "learning_rate": 1.9280684437964965e-05, "loss": 2.3978, "step": 352310 }, { "epoch": 0.61, "learning_rate": 1.9279812498038135e-05, "loss": 2.31, "step": 352320 }, { "epoch": 0.61, "learning_rate": 1.927894055811131e-05, "loss": 2.3508, "step": 352330 }, { "epoch": 0.61, "learning_rate": 1.9278068618184483e-05, "loss": 2.3715, "step": 352340 }, { "epoch": 0.61, "learning_rate": 1.9277196678257656e-05, "loss": 2.3579, "step": 352350 }, { "epoch": 0.61, "learning_rate": 1.9276324738330827e-05, "loss": 2.213, "step": 352360 }, { "epoch": 0.61, "learning_rate": 1.9275452798404004e-05, "loss": 2.3481, "step": 352370 }, { "epoch": 0.61, "learning_rate": 1.9274580858477174e-05, "loss": 2.3682, "step": 352380 }, { "epoch": 0.61, "learning_rate": 1.9273708918550348e-05, "loss": 2.2858, "step": 352390 }, { "epoch": 0.61, "learning_rate": 1.9272836978623522e-05, "loss": 2.2761, "step": 352400 }, { "epoch": 0.61, "learning_rate": 1.9271965038696696e-05, "loss": 2.449, "step": 352410 }, { "epoch": 0.61, "learning_rate": 1.927109309876987e-05, "loss": 2.3858, "step": 352420 }, { "epoch": 0.61, "learning_rate": 1.927022115884304e-05, "loss": 2.3359, "step": 352430 }, { "epoch": 0.61, "learning_rate": 1.9269349218916213e-05, "loss": 2.3807, "step": 352440 }, { "epoch": 0.61, "learning_rate": 1.9268477278989387e-05, "loss": 2.3303, "step": 352450 }, { "epoch": 0.61, "learning_rate": 1.926760533906256e-05, "loss": 2.3351, "step": 352460 }, { "epoch": 0.61, "learning_rate": 1.9266733399135735e-05, "loss": 2.3722, "step": 352470 }, { "epoch": 0.61, "learning_rate": 1.9265861459208905e-05, "loss": 2.3598, "step": 352480 }, { "epoch": 0.61, "learning_rate": 1.9264989519282082e-05, "loss": 2.3633, "step": 352490 }, { "epoch": 0.61, "learning_rate": 1.9264117579355253e-05, "loss": 2.3121, "step": 352500 }, { "epoch": 0.61, "learning_rate": 1.9263245639428426e-05, "loss": 2.2985, "step": 352510 }, { "epoch": 0.61, "learning_rate": 1.92623736995016e-05, "loss": 2.3765, "step": 352520 }, { "epoch": 0.61, "learning_rate": 1.9261501759574774e-05, "loss": 2.3647, "step": 352530 }, { "epoch": 0.61, "learning_rate": 1.9260629819647948e-05, "loss": 2.3487, "step": 352540 }, { "epoch": 0.61, "learning_rate": 1.9259757879721118e-05, "loss": 2.2997, "step": 352550 }, { "epoch": 0.61, "learning_rate": 1.9258885939794295e-05, "loss": 2.3264, "step": 352560 }, { "epoch": 0.61, "learning_rate": 1.9258013999867466e-05, "loss": 2.2198, "step": 352570 }, { "epoch": 0.61, "learning_rate": 1.925714205994064e-05, "loss": 2.3388, "step": 352580 }, { "epoch": 0.61, "learning_rate": 1.925627012001381e-05, "loss": 2.3546, "step": 352590 }, { "epoch": 0.61, "learning_rate": 1.9255398180086987e-05, "loss": 2.4553, "step": 352600 }, { "epoch": 0.61, "learning_rate": 1.9254526240160157e-05, "loss": 2.2963, "step": 352610 }, { "epoch": 0.61, "learning_rate": 1.925365430023333e-05, "loss": 2.2756, "step": 352620 }, { "epoch": 0.61, "learning_rate": 1.9252782360306508e-05, "loss": 2.1609, "step": 352630 }, { "epoch": 0.61, "learning_rate": 1.925191042037968e-05, "loss": 2.3627, "step": 352640 }, { "epoch": 0.61, "learning_rate": 1.9251038480452852e-05, "loss": 2.3473, "step": 352650 }, { "epoch": 0.61, "learning_rate": 1.9250166540526023e-05, "loss": 2.3646, "step": 352660 }, { "epoch": 0.62, "learning_rate": 1.92492946005992e-05, "loss": 2.3062, "step": 352670 }, { "epoch": 0.62, "learning_rate": 1.924842266067237e-05, "loss": 2.3411, "step": 352680 }, { "epoch": 0.62, "learning_rate": 1.9247550720745544e-05, "loss": 2.2752, "step": 352690 }, { "epoch": 0.62, "learning_rate": 1.9246678780818718e-05, "loss": 2.4229, "step": 352700 }, { "epoch": 0.62, "learning_rate": 1.924580684089189e-05, "loss": 2.3005, "step": 352710 }, { "epoch": 0.62, "learning_rate": 1.9244934900965065e-05, "loss": 2.3177, "step": 352720 }, { "epoch": 0.62, "learning_rate": 1.9244062961038236e-05, "loss": 2.349, "step": 352730 }, { "epoch": 0.62, "learning_rate": 1.924319102111141e-05, "loss": 2.4152, "step": 352740 }, { "epoch": 0.62, "learning_rate": 1.9242319081184583e-05, "loss": 2.2336, "step": 352750 }, { "epoch": 0.62, "learning_rate": 1.9241447141257757e-05, "loss": 2.2835, "step": 352760 }, { "epoch": 0.62, "learning_rate": 1.924057520133093e-05, "loss": 2.3763, "step": 352770 }, { "epoch": 0.62, "learning_rate": 1.9239703261404105e-05, "loss": 2.3355, "step": 352780 }, { "epoch": 0.62, "learning_rate": 1.923883132147728e-05, "loss": 2.3411, "step": 352790 }, { "epoch": 0.62, "learning_rate": 1.923795938155045e-05, "loss": 2.4064, "step": 352800 }, { "epoch": 0.62, "learning_rate": 1.9237087441623623e-05, "loss": 2.2678, "step": 352810 }, { "epoch": 0.62, "learning_rate": 1.9236215501696796e-05, "loss": 2.3946, "step": 352820 }, { "epoch": 0.62, "learning_rate": 1.923534356176997e-05, "loss": 2.3436, "step": 352830 }, { "epoch": 0.62, "learning_rate": 1.923447162184314e-05, "loss": 2.3496, "step": 352840 }, { "epoch": 0.62, "learning_rate": 1.9233599681916314e-05, "loss": 2.4113, "step": 352850 }, { "epoch": 0.62, "learning_rate": 1.9232727741989488e-05, "loss": 2.3536, "step": 352860 }, { "epoch": 0.62, "learning_rate": 1.9231855802062662e-05, "loss": 2.3412, "step": 352870 }, { "epoch": 0.62, "learning_rate": 1.9230983862135836e-05, "loss": 2.2557, "step": 352880 }, { "epoch": 0.62, "learning_rate": 1.9230111922209006e-05, "loss": 2.3198, "step": 352890 }, { "epoch": 0.62, "learning_rate": 1.9229239982282183e-05, "loss": 2.3592, "step": 352900 }, { "epoch": 0.62, "learning_rate": 1.9228368042355354e-05, "loss": 2.3016, "step": 352910 }, { "epoch": 0.62, "learning_rate": 1.9227496102428527e-05, "loss": 2.1598, "step": 352920 }, { "epoch": 0.62, "learning_rate": 1.92266241625017e-05, "loss": 2.2319, "step": 352930 }, { "epoch": 0.62, "learning_rate": 1.9225752222574875e-05, "loss": 2.3399, "step": 352940 }, { "epoch": 0.62, "learning_rate": 1.922488028264805e-05, "loss": 2.334, "step": 352950 }, { "epoch": 0.62, "learning_rate": 1.922400834272122e-05, "loss": 2.2906, "step": 352960 }, { "epoch": 0.62, "learning_rate": 1.9223136402794396e-05, "loss": 2.3146, "step": 352970 }, { "epoch": 0.62, "learning_rate": 1.9222264462867567e-05, "loss": 2.3183, "step": 352980 }, { "epoch": 0.62, "learning_rate": 1.922139252294074e-05, "loss": 2.2603, "step": 352990 }, { "epoch": 0.62, "learning_rate": 1.922052058301391e-05, "loss": 2.3446, "step": 353000 }, { "epoch": 0.62, "learning_rate": 1.9219648643087088e-05, "loss": 2.2515, "step": 353010 }, { "epoch": 0.62, "learning_rate": 1.921877670316026e-05, "loss": 2.2003, "step": 353020 }, { "epoch": 0.62, "learning_rate": 1.9217904763233432e-05, "loss": 2.2488, "step": 353030 }, { "epoch": 0.62, "learning_rate": 1.921703282330661e-05, "loss": 2.303, "step": 353040 }, { "epoch": 0.62, "learning_rate": 1.921616088337978e-05, "loss": 2.4693, "step": 353050 }, { "epoch": 0.62, "learning_rate": 1.9215288943452953e-05, "loss": 2.3871, "step": 353060 }, { "epoch": 0.62, "learning_rate": 1.9214417003526124e-05, "loss": 2.42, "step": 353070 }, { "epoch": 0.62, "learning_rate": 1.92135450635993e-05, "loss": 2.336, "step": 353080 }, { "epoch": 0.62, "learning_rate": 1.921267312367247e-05, "loss": 2.398, "step": 353090 }, { "epoch": 0.62, "learning_rate": 1.9211801183745645e-05, "loss": 2.4564, "step": 353100 }, { "epoch": 0.62, "learning_rate": 1.921092924381882e-05, "loss": 2.2654, "step": 353110 }, { "epoch": 0.62, "learning_rate": 1.9210057303891993e-05, "loss": 2.2311, "step": 353120 }, { "epoch": 0.62, "learning_rate": 1.9209185363965166e-05, "loss": 2.279, "step": 353130 }, { "epoch": 0.62, "learning_rate": 1.9208313424038337e-05, "loss": 2.2708, "step": 353140 }, { "epoch": 0.62, "learning_rate": 1.920744148411151e-05, "loss": 2.3183, "step": 353150 }, { "epoch": 0.62, "learning_rate": 1.9206569544184684e-05, "loss": 2.3354, "step": 353160 }, { "epoch": 0.62, "learning_rate": 1.9205697604257858e-05, "loss": 2.3809, "step": 353170 }, { "epoch": 0.62, "learning_rate": 1.9204825664331032e-05, "loss": 2.3224, "step": 353180 }, { "epoch": 0.62, "learning_rate": 1.9203953724404206e-05, "loss": 2.4346, "step": 353190 }, { "epoch": 0.62, "learning_rate": 1.920308178447738e-05, "loss": 2.3689, "step": 353200 }, { "epoch": 0.62, "learning_rate": 1.920220984455055e-05, "loss": 2.3053, "step": 353210 }, { "epoch": 0.62, "learning_rate": 1.9201337904623723e-05, "loss": 2.4265, "step": 353220 }, { "epoch": 0.62, "learning_rate": 1.9200465964696897e-05, "loss": 2.3443, "step": 353230 }, { "epoch": 0.62, "learning_rate": 1.919959402477007e-05, "loss": 2.3631, "step": 353240 }, { "epoch": 0.62, "learning_rate": 1.9198722084843245e-05, "loss": 2.1993, "step": 353250 }, { "epoch": 0.62, "learning_rate": 1.9197850144916415e-05, "loss": 2.2754, "step": 353260 }, { "epoch": 0.62, "learning_rate": 1.9196978204989592e-05, "loss": 2.276, "step": 353270 }, { "epoch": 0.62, "learning_rate": 1.9196106265062763e-05, "loss": 2.2699, "step": 353280 }, { "epoch": 0.62, "learning_rate": 1.9195234325135936e-05, "loss": 2.3672, "step": 353290 }, { "epoch": 0.62, "learning_rate": 1.919436238520911e-05, "loss": 2.2578, "step": 353300 }, { "epoch": 0.62, "learning_rate": 1.9193490445282284e-05, "loss": 2.4329, "step": 353310 }, { "epoch": 0.62, "learning_rate": 1.9192618505355454e-05, "loss": 2.3269, "step": 353320 }, { "epoch": 0.62, "learning_rate": 1.9191746565428628e-05, "loss": 2.2033, "step": 353330 }, { "epoch": 0.62, "learning_rate": 1.9190874625501802e-05, "loss": 2.3143, "step": 353340 }, { "epoch": 0.62, "learning_rate": 1.9190002685574976e-05, "loss": 2.2766, "step": 353350 }, { "epoch": 0.62, "learning_rate": 1.918913074564815e-05, "loss": 2.3377, "step": 353360 }, { "epoch": 0.62, "learning_rate": 1.918825880572132e-05, "loss": 2.3634, "step": 353370 }, { "epoch": 0.62, "learning_rate": 1.9187386865794497e-05, "loss": 2.345, "step": 353380 }, { "epoch": 0.62, "learning_rate": 1.9186514925867667e-05, "loss": 2.5013, "step": 353390 }, { "epoch": 0.62, "learning_rate": 1.918564298594084e-05, "loss": 2.3151, "step": 353400 }, { "epoch": 0.62, "learning_rate": 1.9184771046014015e-05, "loss": 2.2945, "step": 353410 }, { "epoch": 0.62, "learning_rate": 1.918389910608719e-05, "loss": 2.3246, "step": 353420 }, { "epoch": 0.62, "learning_rate": 1.9183027166160362e-05, "loss": 2.3089, "step": 353430 }, { "epoch": 0.62, "learning_rate": 1.9182155226233533e-05, "loss": 2.3661, "step": 353440 }, { "epoch": 0.62, "learning_rate": 1.918128328630671e-05, "loss": 2.2494, "step": 353450 }, { "epoch": 0.62, "learning_rate": 1.918041134637988e-05, "loss": 2.2646, "step": 353460 }, { "epoch": 0.62, "learning_rate": 1.9179539406453054e-05, "loss": 2.3082, "step": 353470 }, { "epoch": 0.62, "learning_rate": 1.9178667466526225e-05, "loss": 2.225, "step": 353480 }, { "epoch": 0.62, "learning_rate": 1.91777955265994e-05, "loss": 2.4318, "step": 353490 }, { "epoch": 0.62, "learning_rate": 1.9176923586672575e-05, "loss": 2.5269, "step": 353500 }, { "epoch": 0.62, "learning_rate": 1.9176051646745746e-05, "loss": 2.3051, "step": 353510 }, { "epoch": 0.62, "learning_rate": 1.917517970681892e-05, "loss": 2.3012, "step": 353520 }, { "epoch": 0.62, "learning_rate": 1.9174307766892093e-05, "loss": 2.3697, "step": 353530 }, { "epoch": 0.62, "learning_rate": 1.9173435826965267e-05, "loss": 2.2762, "step": 353540 }, { "epoch": 0.62, "learning_rate": 1.9172563887038438e-05, "loss": 2.2653, "step": 353550 }, { "epoch": 0.62, "learning_rate": 1.9171691947111615e-05, "loss": 2.2208, "step": 353560 }, { "epoch": 0.62, "learning_rate": 1.9170820007184785e-05, "loss": 2.224, "step": 353570 }, { "epoch": 0.62, "learning_rate": 1.916994806725796e-05, "loss": 2.4121, "step": 353580 }, { "epoch": 0.62, "learning_rate": 1.9169076127331133e-05, "loss": 2.3555, "step": 353590 }, { "epoch": 0.62, "learning_rate": 1.9168204187404306e-05, "loss": 2.3225, "step": 353600 }, { "epoch": 0.62, "learning_rate": 1.916733224747748e-05, "loss": 2.2641, "step": 353610 }, { "epoch": 0.62, "learning_rate": 1.916646030755065e-05, "loss": 2.3468, "step": 353620 }, { "epoch": 0.62, "learning_rate": 1.9165588367623824e-05, "loss": 2.3447, "step": 353630 }, { "epoch": 0.62, "learning_rate": 1.9164716427696998e-05, "loss": 2.3827, "step": 353640 }, { "epoch": 0.62, "learning_rate": 1.9163844487770172e-05, "loss": 2.2022, "step": 353650 }, { "epoch": 0.62, "learning_rate": 1.9162972547843346e-05, "loss": 2.3921, "step": 353660 }, { "epoch": 0.62, "learning_rate": 1.9162100607916516e-05, "loss": 2.3854, "step": 353670 }, { "epoch": 0.62, "learning_rate": 1.9161228667989693e-05, "loss": 2.3662, "step": 353680 }, { "epoch": 0.62, "learning_rate": 1.9160356728062864e-05, "loss": 2.3832, "step": 353690 }, { "epoch": 0.62, "learning_rate": 1.9159484788136037e-05, "loss": 2.288, "step": 353700 }, { "epoch": 0.62, "learning_rate": 1.915861284820921e-05, "loss": 2.3707, "step": 353710 }, { "epoch": 0.62, "learning_rate": 1.9157740908282385e-05, "loss": 2.4449, "step": 353720 }, { "epoch": 0.62, "learning_rate": 1.9156868968355555e-05, "loss": 2.2656, "step": 353730 }, { "epoch": 0.62, "learning_rate": 1.915599702842873e-05, "loss": 2.3816, "step": 353740 }, { "epoch": 0.62, "learning_rate": 1.9155125088501906e-05, "loss": 2.3126, "step": 353750 }, { "epoch": 0.62, "learning_rate": 1.9154253148575077e-05, "loss": 2.3158, "step": 353760 }, { "epoch": 0.62, "learning_rate": 1.915338120864825e-05, "loss": 2.2625, "step": 353770 }, { "epoch": 0.62, "learning_rate": 1.915250926872142e-05, "loss": 2.4002, "step": 353780 }, { "epoch": 0.62, "learning_rate": 1.9151637328794598e-05, "loss": 2.3731, "step": 353790 }, { "epoch": 0.62, "learning_rate": 1.9150765388867768e-05, "loss": 2.329, "step": 353800 }, { "epoch": 0.62, "learning_rate": 1.9149893448940942e-05, "loss": 2.3219, "step": 353810 }, { "epoch": 0.62, "learning_rate": 1.9149021509014116e-05, "loss": 2.368, "step": 353820 }, { "epoch": 0.62, "learning_rate": 1.914814956908729e-05, "loss": 2.3451, "step": 353830 }, { "epoch": 0.62, "learning_rate": 1.9147277629160463e-05, "loss": 2.2592, "step": 353840 }, { "epoch": 0.62, "learning_rate": 1.9146405689233634e-05, "loss": 2.3334, "step": 353850 }, { "epoch": 0.62, "learning_rate": 1.914553374930681e-05, "loss": 2.3908, "step": 353860 }, { "epoch": 0.62, "learning_rate": 1.914466180937998e-05, "loss": 2.4113, "step": 353870 }, { "epoch": 0.62, "learning_rate": 1.9143789869453155e-05, "loss": 2.3422, "step": 353880 }, { "epoch": 0.62, "learning_rate": 1.914291792952633e-05, "loss": 2.3907, "step": 353890 }, { "epoch": 0.62, "learning_rate": 1.9142045989599503e-05, "loss": 2.3747, "step": 353900 }, { "epoch": 0.62, "learning_rate": 1.9141174049672676e-05, "loss": 2.3505, "step": 353910 }, { "epoch": 0.62, "learning_rate": 1.9140302109745847e-05, "loss": 2.3849, "step": 353920 }, { "epoch": 0.62, "learning_rate": 1.913943016981902e-05, "loss": 2.3676, "step": 353930 }, { "epoch": 0.62, "learning_rate": 1.9138558229892194e-05, "loss": 2.3656, "step": 353940 }, { "epoch": 0.62, "learning_rate": 1.9137686289965368e-05, "loss": 2.2841, "step": 353950 }, { "epoch": 0.62, "learning_rate": 1.913681435003854e-05, "loss": 2.1853, "step": 353960 }, { "epoch": 0.62, "learning_rate": 1.9135942410111716e-05, "loss": 2.3183, "step": 353970 }, { "epoch": 0.62, "learning_rate": 1.913507047018489e-05, "loss": 2.2989, "step": 353980 }, { "epoch": 0.62, "learning_rate": 1.913419853025806e-05, "loss": 2.3171, "step": 353990 }, { "epoch": 0.62, "learning_rate": 1.9133326590331233e-05, "loss": 2.3766, "step": 354000 }, { "epoch": 0.62, "learning_rate": 1.9132454650404407e-05, "loss": 2.4828, "step": 354010 }, { "epoch": 0.62, "learning_rate": 1.913158271047758e-05, "loss": 2.3612, "step": 354020 }, { "epoch": 0.62, "learning_rate": 1.913071077055075e-05, "loss": 2.3321, "step": 354030 }, { "epoch": 0.62, "learning_rate": 1.9129838830623925e-05, "loss": 2.3099, "step": 354040 }, { "epoch": 0.62, "learning_rate": 1.91289668906971e-05, "loss": 2.4082, "step": 354050 }, { "epoch": 0.62, "learning_rate": 1.9128094950770273e-05, "loss": 2.1822, "step": 354060 }, { "epoch": 0.62, "learning_rate": 1.9127223010843446e-05, "loss": 2.2898, "step": 354070 }, { "epoch": 0.62, "learning_rate": 1.9126351070916617e-05, "loss": 2.386, "step": 354080 }, { "epoch": 0.62, "learning_rate": 1.9125479130989794e-05, "loss": 2.3076, "step": 354090 }, { "epoch": 0.62, "learning_rate": 1.9124607191062964e-05, "loss": 2.4046, "step": 354100 }, { "epoch": 0.62, "learning_rate": 1.9123735251136138e-05, "loss": 2.2114, "step": 354110 }, { "epoch": 0.62, "learning_rate": 1.9122863311209312e-05, "loss": 2.3992, "step": 354120 }, { "epoch": 0.62, "learning_rate": 1.9121991371282486e-05, "loss": 2.2635, "step": 354130 }, { "epoch": 0.62, "learning_rate": 1.912111943135566e-05, "loss": 2.3602, "step": 354140 }, { "epoch": 0.62, "learning_rate": 1.912024749142883e-05, "loss": 2.3757, "step": 354150 }, { "epoch": 0.62, "learning_rate": 1.9119375551502007e-05, "loss": 2.3524, "step": 354160 }, { "epoch": 0.62, "learning_rate": 1.9118503611575177e-05, "loss": 2.3117, "step": 354170 }, { "epoch": 0.62, "learning_rate": 1.911763167164835e-05, "loss": 2.3155, "step": 354180 }, { "epoch": 0.62, "learning_rate": 1.911675973172152e-05, "loss": 2.3, "step": 354190 }, { "epoch": 0.62, "learning_rate": 1.91158877917947e-05, "loss": 2.2535, "step": 354200 }, { "epoch": 0.62, "learning_rate": 1.911501585186787e-05, "loss": 2.309, "step": 354210 }, { "epoch": 0.62, "learning_rate": 1.9114143911941043e-05, "loss": 2.3784, "step": 354220 }, { "epoch": 0.62, "learning_rate": 1.911327197201422e-05, "loss": 2.2237, "step": 354230 }, { "epoch": 0.62, "learning_rate": 1.911240003208739e-05, "loss": 2.3269, "step": 354240 }, { "epoch": 0.62, "learning_rate": 1.9111528092160564e-05, "loss": 2.3262, "step": 354250 }, { "epoch": 0.62, "learning_rate": 1.9110656152233735e-05, "loss": 2.2644, "step": 354260 }, { "epoch": 0.62, "learning_rate": 1.910978421230691e-05, "loss": 2.3884, "step": 354270 }, { "epoch": 0.62, "learning_rate": 1.9108912272380082e-05, "loss": 2.2694, "step": 354280 }, { "epoch": 0.62, "learning_rate": 1.9108040332453256e-05, "loss": 2.4462, "step": 354290 }, { "epoch": 0.62, "learning_rate": 1.910716839252643e-05, "loss": 2.3721, "step": 354300 }, { "epoch": 0.62, "learning_rate": 1.9106296452599603e-05, "loss": 2.3488, "step": 354310 }, { "epoch": 0.62, "learning_rate": 1.9105424512672777e-05, "loss": 2.3403, "step": 354320 }, { "epoch": 0.62, "learning_rate": 1.9104552572745948e-05, "loss": 2.3967, "step": 354330 }, { "epoch": 0.62, "learning_rate": 1.910368063281912e-05, "loss": 2.4312, "step": 354340 }, { "epoch": 0.62, "learning_rate": 1.9102808692892295e-05, "loss": 2.3752, "step": 354350 }, { "epoch": 0.62, "learning_rate": 1.910193675296547e-05, "loss": 2.3046, "step": 354360 }, { "epoch": 0.62, "learning_rate": 1.9101064813038643e-05, "loss": 2.3323, "step": 354370 }, { "epoch": 0.62, "learning_rate": 1.9100192873111816e-05, "loss": 2.4438, "step": 354380 }, { "epoch": 0.62, "learning_rate": 1.909932093318499e-05, "loss": 2.283, "step": 354390 }, { "epoch": 0.62, "learning_rate": 1.909844899325816e-05, "loss": 2.4127, "step": 354400 }, { "epoch": 0.62, "learning_rate": 1.9097577053331334e-05, "loss": 2.3397, "step": 354410 }, { "epoch": 0.62, "learning_rate": 1.9096705113404508e-05, "loss": 2.3509, "step": 354420 }, { "epoch": 0.62, "learning_rate": 1.9095833173477682e-05, "loss": 2.1679, "step": 354430 }, { "epoch": 0.62, "learning_rate": 1.9094961233550852e-05, "loss": 2.2485, "step": 354440 }, { "epoch": 0.62, "learning_rate": 1.9094089293624026e-05, "loss": 2.3417, "step": 354450 }, { "epoch": 0.62, "learning_rate": 1.90932173536972e-05, "loss": 2.2627, "step": 354460 }, { "epoch": 0.62, "learning_rate": 1.9092345413770374e-05, "loss": 2.3511, "step": 354470 }, { "epoch": 0.62, "learning_rate": 1.9091473473843547e-05, "loss": 2.28, "step": 354480 }, { "epoch": 0.62, "learning_rate": 1.909060153391672e-05, "loss": 2.4491, "step": 354490 }, { "epoch": 0.62, "learning_rate": 1.9089729593989895e-05, "loss": 2.4492, "step": 354500 }, { "epoch": 0.62, "learning_rate": 1.9088857654063065e-05, "loss": 2.2463, "step": 354510 }, { "epoch": 0.62, "learning_rate": 1.908798571413624e-05, "loss": 2.2342, "step": 354520 }, { "epoch": 0.62, "learning_rate": 1.9087113774209413e-05, "loss": 2.2161, "step": 354530 }, { "epoch": 0.62, "learning_rate": 1.9086241834282587e-05, "loss": 2.3297, "step": 354540 }, { "epoch": 0.62, "learning_rate": 1.908536989435576e-05, "loss": 2.3889, "step": 354550 }, { "epoch": 0.62, "learning_rate": 1.908449795442893e-05, "loss": 2.3452, "step": 354560 }, { "epoch": 0.62, "learning_rate": 1.9083626014502108e-05, "loss": 2.3038, "step": 354570 }, { "epoch": 0.62, "learning_rate": 1.9082754074575278e-05, "loss": 2.2697, "step": 354580 }, { "epoch": 0.62, "learning_rate": 1.9081882134648452e-05, "loss": 2.2248, "step": 354590 }, { "epoch": 0.62, "learning_rate": 1.9081010194721626e-05, "loss": 2.212, "step": 354600 }, { "epoch": 0.62, "learning_rate": 1.90801382547948e-05, "loss": 2.4037, "step": 354610 }, { "epoch": 0.62, "learning_rate": 1.9079266314867973e-05, "loss": 2.3444, "step": 354620 }, { "epoch": 0.62, "learning_rate": 1.9078394374941144e-05, "loss": 2.3921, "step": 354630 }, { "epoch": 0.62, "learning_rate": 1.907752243501432e-05, "loss": 2.4174, "step": 354640 }, { "epoch": 0.62, "learning_rate": 1.907665049508749e-05, "loss": 2.2107, "step": 354650 }, { "epoch": 0.62, "learning_rate": 1.9075778555160665e-05, "loss": 2.2698, "step": 354660 }, { "epoch": 0.62, "learning_rate": 1.9074906615233835e-05, "loss": 2.3613, "step": 354670 }, { "epoch": 0.62, "learning_rate": 1.9074034675307013e-05, "loss": 2.3771, "step": 354680 }, { "epoch": 0.62, "learning_rate": 1.9073162735380183e-05, "loss": 2.3813, "step": 354690 }, { "epoch": 0.62, "learning_rate": 1.9072290795453357e-05, "loss": 2.2953, "step": 354700 }, { "epoch": 0.62, "learning_rate": 1.907141885552653e-05, "loss": 2.261, "step": 354710 }, { "epoch": 0.62, "learning_rate": 1.9070546915599704e-05, "loss": 2.3188, "step": 354720 }, { "epoch": 0.62, "learning_rate": 1.9069674975672878e-05, "loss": 2.3335, "step": 354730 }, { "epoch": 0.62, "learning_rate": 1.906880303574605e-05, "loss": 2.3903, "step": 354740 }, { "epoch": 0.62, "learning_rate": 1.9067931095819222e-05, "loss": 2.3928, "step": 354750 }, { "epoch": 0.62, "learning_rate": 1.9067059155892396e-05, "loss": 2.2841, "step": 354760 }, { "epoch": 0.62, "learning_rate": 1.906618721596557e-05, "loss": 2.405, "step": 354770 }, { "epoch": 0.62, "learning_rate": 1.9065315276038743e-05, "loss": 2.3709, "step": 354780 }, { "epoch": 0.62, "learning_rate": 1.9064443336111917e-05, "loss": 2.4336, "step": 354790 }, { "epoch": 0.62, "learning_rate": 1.906357139618509e-05, "loss": 2.3109, "step": 354800 }, { "epoch": 0.62, "learning_rate": 1.906269945625826e-05, "loss": 2.2109, "step": 354810 }, { "epoch": 0.62, "learning_rate": 1.9061827516331435e-05, "loss": 2.251, "step": 354820 }, { "epoch": 0.62, "learning_rate": 1.906095557640461e-05, "loss": 2.4301, "step": 354830 }, { "epoch": 0.62, "learning_rate": 1.9060083636477783e-05, "loss": 2.3077, "step": 354840 }, { "epoch": 0.62, "learning_rate": 1.9059211696550956e-05, "loss": 2.338, "step": 354850 }, { "epoch": 0.62, "learning_rate": 1.9058339756624127e-05, "loss": 2.3101, "step": 354860 }, { "epoch": 0.62, "learning_rate": 1.9057467816697304e-05, "loss": 2.3564, "step": 354870 }, { "epoch": 0.62, "learning_rate": 1.9056595876770474e-05, "loss": 2.3457, "step": 354880 }, { "epoch": 0.62, "learning_rate": 1.9055723936843648e-05, "loss": 2.2535, "step": 354890 }, { "epoch": 0.62, "learning_rate": 1.9054851996916822e-05, "loss": 2.4144, "step": 354900 }, { "epoch": 0.62, "learning_rate": 1.9053980056989996e-05, "loss": 2.4078, "step": 354910 }, { "epoch": 0.62, "learning_rate": 1.9053108117063166e-05, "loss": 2.3171, "step": 354920 }, { "epoch": 0.62, "learning_rate": 1.905223617713634e-05, "loss": 2.3465, "step": 354930 }, { "epoch": 0.62, "learning_rate": 1.9051364237209514e-05, "loss": 2.1954, "step": 354940 }, { "epoch": 0.62, "learning_rate": 1.9050492297282687e-05, "loss": 2.2595, "step": 354950 }, { "epoch": 0.62, "learning_rate": 1.904962035735586e-05, "loss": 2.3364, "step": 354960 }, { "epoch": 0.62, "learning_rate": 1.904874841742903e-05, "loss": 2.3002, "step": 354970 }, { "epoch": 0.62, "learning_rate": 1.904787647750221e-05, "loss": 2.2735, "step": 354980 }, { "epoch": 0.62, "learning_rate": 1.904700453757538e-05, "loss": 2.2518, "step": 354990 }, { "epoch": 0.62, "learning_rate": 1.9046132597648553e-05, "loss": 2.3581, "step": 355000 }, { "epoch": 0.62, "learning_rate": 1.9045260657721727e-05, "loss": 2.4076, "step": 355010 }, { "epoch": 0.62, "learning_rate": 1.90443887177949e-05, "loss": 2.3834, "step": 355020 }, { "epoch": 0.62, "learning_rate": 1.9043516777868074e-05, "loss": 2.4343, "step": 355030 }, { "epoch": 0.62, "learning_rate": 1.9042644837941245e-05, "loss": 2.1516, "step": 355040 }, { "epoch": 0.62, "learning_rate": 1.904177289801442e-05, "loss": 2.4127, "step": 355050 }, { "epoch": 0.62, "learning_rate": 1.9040900958087592e-05, "loss": 2.3384, "step": 355060 }, { "epoch": 0.62, "learning_rate": 1.9040029018160766e-05, "loss": 2.2323, "step": 355070 }, { "epoch": 0.62, "learning_rate": 1.9039157078233936e-05, "loss": 2.2788, "step": 355080 }, { "epoch": 0.62, "learning_rate": 1.9038285138307113e-05, "loss": 2.3994, "step": 355090 }, { "epoch": 0.62, "learning_rate": 1.9037413198380287e-05, "loss": 2.2839, "step": 355100 }, { "epoch": 0.62, "learning_rate": 1.9036541258453458e-05, "loss": 2.2376, "step": 355110 }, { "epoch": 0.62, "learning_rate": 1.903566931852663e-05, "loss": 2.3419, "step": 355120 }, { "epoch": 0.62, "learning_rate": 1.9034797378599805e-05, "loss": 2.33, "step": 355130 }, { "epoch": 0.62, "learning_rate": 1.903392543867298e-05, "loss": 2.219, "step": 355140 }, { "epoch": 0.62, "learning_rate": 1.903305349874615e-05, "loss": 2.3125, "step": 355150 }, { "epoch": 0.62, "learning_rate": 1.9032181558819326e-05, "loss": 2.3388, "step": 355160 }, { "epoch": 0.62, "learning_rate": 1.9031309618892497e-05, "loss": 2.2958, "step": 355170 }, { "epoch": 0.62, "learning_rate": 1.903043767896567e-05, "loss": 2.2924, "step": 355180 }, { "epoch": 0.62, "learning_rate": 1.9029565739038844e-05, "loss": 2.3403, "step": 355190 }, { "epoch": 0.62, "learning_rate": 1.9028693799112018e-05, "loss": 2.2199, "step": 355200 }, { "epoch": 0.62, "learning_rate": 1.9027821859185192e-05, "loss": 2.376, "step": 355210 }, { "epoch": 0.62, "learning_rate": 1.9026949919258362e-05, "loss": 2.2129, "step": 355220 }, { "epoch": 0.62, "learning_rate": 1.9026077979331536e-05, "loss": 2.2406, "step": 355230 }, { "epoch": 0.62, "learning_rate": 1.902520603940471e-05, "loss": 2.2892, "step": 355240 }, { "epoch": 0.62, "learning_rate": 1.9024334099477884e-05, "loss": 2.249, "step": 355250 }, { "epoch": 0.62, "learning_rate": 1.9023462159551057e-05, "loss": 2.3679, "step": 355260 }, { "epoch": 0.62, "learning_rate": 1.9022590219624228e-05, "loss": 2.3768, "step": 355270 }, { "epoch": 0.62, "learning_rate": 1.9021718279697405e-05, "loss": 2.4152, "step": 355280 }, { "epoch": 0.62, "learning_rate": 1.9020846339770575e-05, "loss": 2.3602, "step": 355290 }, { "epoch": 0.62, "learning_rate": 1.901997439984375e-05, "loss": 2.341, "step": 355300 }, { "epoch": 0.62, "learning_rate": 1.9019102459916923e-05, "loss": 2.3147, "step": 355310 }, { "epoch": 0.62, "learning_rate": 1.9018230519990097e-05, "loss": 2.3692, "step": 355320 }, { "epoch": 0.62, "learning_rate": 1.901735858006327e-05, "loss": 2.2406, "step": 355330 }, { "epoch": 0.62, "learning_rate": 1.901648664013644e-05, "loss": 2.3642, "step": 355340 }, { "epoch": 0.62, "learning_rate": 1.9015614700209618e-05, "loss": 2.3261, "step": 355350 }, { "epoch": 0.62, "learning_rate": 1.9014742760282788e-05, "loss": 2.3799, "step": 355360 }, { "epoch": 0.62, "learning_rate": 1.9013870820355962e-05, "loss": 2.295, "step": 355370 }, { "epoch": 0.62, "learning_rate": 1.9012998880429132e-05, "loss": 2.3274, "step": 355380 }, { "epoch": 0.62, "learning_rate": 1.901212694050231e-05, "loss": 2.2983, "step": 355390 }, { "epoch": 0.62, "learning_rate": 1.901125500057548e-05, "loss": 2.3331, "step": 355400 }, { "epoch": 0.62, "learning_rate": 1.9010383060648654e-05, "loss": 2.4162, "step": 355410 }, { "epoch": 0.62, "learning_rate": 1.9009511120721827e-05, "loss": 2.2132, "step": 355420 }, { "epoch": 0.62, "learning_rate": 1.9008639180795e-05, "loss": 2.3849, "step": 355430 }, { "epoch": 0.62, "learning_rate": 1.9007767240868175e-05, "loss": 2.2956, "step": 355440 }, { "epoch": 0.62, "learning_rate": 1.9006895300941345e-05, "loss": 2.3828, "step": 355450 }, { "epoch": 0.62, "learning_rate": 1.9006023361014523e-05, "loss": 2.3925, "step": 355460 }, { "epoch": 0.62, "learning_rate": 1.9005151421087693e-05, "loss": 2.2183, "step": 355470 }, { "epoch": 0.62, "learning_rate": 1.9004279481160867e-05, "loss": 2.2605, "step": 355480 }, { "epoch": 0.62, "learning_rate": 1.900340754123404e-05, "loss": 2.3754, "step": 355490 }, { "epoch": 0.62, "learning_rate": 1.9002535601307214e-05, "loss": 2.4308, "step": 355500 }, { "epoch": 0.62, "learning_rate": 1.9001663661380388e-05, "loss": 2.1994, "step": 355510 }, { "epoch": 0.62, "learning_rate": 1.900079172145356e-05, "loss": 2.3904, "step": 355520 }, { "epoch": 0.62, "learning_rate": 1.8999919781526732e-05, "loss": 2.2106, "step": 355530 }, { "epoch": 0.62, "learning_rate": 1.8999047841599906e-05, "loss": 2.4207, "step": 355540 }, { "epoch": 0.62, "learning_rate": 1.899817590167308e-05, "loss": 2.3091, "step": 355550 }, { "epoch": 0.62, "learning_rate": 1.899730396174625e-05, "loss": 2.2972, "step": 355560 }, { "epoch": 0.62, "learning_rate": 1.8996432021819427e-05, "loss": 2.2926, "step": 355570 }, { "epoch": 0.62, "learning_rate": 1.89955600818926e-05, "loss": 2.3798, "step": 355580 }, { "epoch": 0.62, "learning_rate": 1.899468814196577e-05, "loss": 2.2745, "step": 355590 }, { "epoch": 0.62, "learning_rate": 1.8993816202038945e-05, "loss": 2.2569, "step": 355600 }, { "epoch": 0.62, "learning_rate": 1.899294426211212e-05, "loss": 2.3995, "step": 355610 }, { "epoch": 0.62, "learning_rate": 1.8992072322185293e-05, "loss": 2.2954, "step": 355620 }, { "epoch": 0.62, "learning_rate": 1.8991200382258463e-05, "loss": 2.3473, "step": 355630 }, { "epoch": 0.62, "learning_rate": 1.8990328442331637e-05, "loss": 2.3251, "step": 355640 }, { "epoch": 0.62, "learning_rate": 1.898945650240481e-05, "loss": 2.3648, "step": 355650 }, { "epoch": 0.62, "learning_rate": 1.8988584562477984e-05, "loss": 2.2786, "step": 355660 }, { "epoch": 0.62, "learning_rate": 1.8987712622551158e-05, "loss": 2.2241, "step": 355670 }, { "epoch": 0.62, "learning_rate": 1.898684068262433e-05, "loss": 2.3936, "step": 355680 }, { "epoch": 0.62, "learning_rate": 1.8985968742697506e-05, "loss": 2.2385, "step": 355690 }, { "epoch": 0.62, "learning_rate": 1.8985096802770676e-05, "loss": 2.3769, "step": 355700 }, { "epoch": 0.62, "learning_rate": 1.898422486284385e-05, "loss": 2.369, "step": 355710 }, { "epoch": 0.62, "learning_rate": 1.8983352922917024e-05, "loss": 2.3555, "step": 355720 }, { "epoch": 0.62, "learning_rate": 1.8982480982990197e-05, "loss": 2.3335, "step": 355730 }, { "epoch": 0.62, "learning_rate": 1.898160904306337e-05, "loss": 2.3344, "step": 355740 }, { "epoch": 0.62, "learning_rate": 1.898073710313654e-05, "loss": 2.3169, "step": 355750 }, { "epoch": 0.62, "learning_rate": 1.897986516320972e-05, "loss": 2.3315, "step": 355760 }, { "epoch": 0.62, "learning_rate": 1.897899322328289e-05, "loss": 2.3356, "step": 355770 }, { "epoch": 0.62, "learning_rate": 1.8978121283356063e-05, "loss": 2.2778, "step": 355780 }, { "epoch": 0.62, "learning_rate": 1.8977249343429233e-05, "loss": 2.3119, "step": 355790 }, { "epoch": 0.62, "learning_rate": 1.897637740350241e-05, "loss": 2.3712, "step": 355800 }, { "epoch": 0.62, "learning_rate": 1.897550546357558e-05, "loss": 2.4084, "step": 355810 }, { "epoch": 0.62, "learning_rate": 1.8974633523648755e-05, "loss": 2.2802, "step": 355820 }, { "epoch": 0.62, "learning_rate": 1.8973761583721932e-05, "loss": 2.2729, "step": 355830 }, { "epoch": 0.62, "learning_rate": 1.8972889643795102e-05, "loss": 2.3629, "step": 355840 }, { "epoch": 0.62, "learning_rate": 1.8972017703868276e-05, "loss": 2.4029, "step": 355850 }, { "epoch": 0.62, "learning_rate": 1.8971145763941446e-05, "loss": 2.4025, "step": 355860 }, { "epoch": 0.62, "learning_rate": 1.8970273824014623e-05, "loss": 2.3074, "step": 355870 }, { "epoch": 0.62, "learning_rate": 1.8969401884087794e-05, "loss": 2.302, "step": 355880 }, { "epoch": 0.62, "learning_rate": 1.8968529944160968e-05, "loss": 2.2653, "step": 355890 }, { "epoch": 0.62, "learning_rate": 1.896765800423414e-05, "loss": 2.3767, "step": 355900 }, { "epoch": 0.62, "learning_rate": 1.8966786064307315e-05, "loss": 2.37, "step": 355910 }, { "epoch": 0.62, "learning_rate": 1.896591412438049e-05, "loss": 2.2612, "step": 355920 }, { "epoch": 0.62, "learning_rate": 1.896504218445366e-05, "loss": 2.3536, "step": 355930 }, { "epoch": 0.62, "learning_rate": 1.8964170244526833e-05, "loss": 2.2484, "step": 355940 }, { "epoch": 0.62, "learning_rate": 1.8963298304600007e-05, "loss": 2.4279, "step": 355950 }, { "epoch": 0.62, "learning_rate": 1.896242636467318e-05, "loss": 2.3137, "step": 355960 }, { "epoch": 0.62, "learning_rate": 1.8961554424746354e-05, "loss": 2.3399, "step": 355970 }, { "epoch": 0.62, "learning_rate": 1.8960682484819528e-05, "loss": 2.2973, "step": 355980 }, { "epoch": 0.62, "learning_rate": 1.8959810544892702e-05, "loss": 2.3255, "step": 355990 }, { "epoch": 0.62, "learning_rate": 1.8958938604965872e-05, "loss": 2.4456, "step": 356000 }, { "epoch": 0.62, "learning_rate": 1.8958066665039046e-05, "loss": 2.3713, "step": 356010 }, { "epoch": 0.62, "learning_rate": 1.895719472511222e-05, "loss": 2.2909, "step": 356020 }, { "epoch": 0.62, "learning_rate": 1.8956322785185394e-05, "loss": 2.2822, "step": 356030 }, { "epoch": 0.62, "learning_rate": 1.8955450845258564e-05, "loss": 2.3634, "step": 356040 }, { "epoch": 0.62, "learning_rate": 1.8954578905331738e-05, "loss": 2.3487, "step": 356050 }, { "epoch": 0.62, "learning_rate": 1.8953706965404915e-05, "loss": 2.3828, "step": 356060 }, { "epoch": 0.62, "learning_rate": 1.8952835025478085e-05, "loss": 2.2664, "step": 356070 }, { "epoch": 0.62, "learning_rate": 1.895196308555126e-05, "loss": 2.272, "step": 356080 }, { "epoch": 0.62, "learning_rate": 1.8951091145624433e-05, "loss": 2.291, "step": 356090 }, { "epoch": 0.62, "learning_rate": 1.8950219205697607e-05, "loss": 2.3184, "step": 356100 }, { "epoch": 0.62, "learning_rate": 1.8949347265770777e-05, "loss": 2.3427, "step": 356110 }, { "epoch": 0.62, "learning_rate": 1.894847532584395e-05, "loss": 2.2781, "step": 356120 }, { "epoch": 0.62, "learning_rate": 1.8947603385917124e-05, "loss": 2.3425, "step": 356130 }, { "epoch": 0.62, "learning_rate": 1.8946731445990298e-05, "loss": 2.29, "step": 356140 }, { "epoch": 0.62, "learning_rate": 1.8945859506063472e-05, "loss": 2.2962, "step": 356150 }, { "epoch": 0.62, "learning_rate": 1.8944987566136642e-05, "loss": 2.351, "step": 356160 }, { "epoch": 0.62, "learning_rate": 1.894411562620982e-05, "loss": 2.3372, "step": 356170 }, { "epoch": 0.62, "learning_rate": 1.894324368628299e-05, "loss": 2.2306, "step": 356180 }, { "epoch": 0.62, "learning_rate": 1.8942371746356164e-05, "loss": 2.3605, "step": 356190 }, { "epoch": 0.62, "learning_rate": 1.8941499806429337e-05, "loss": 2.292, "step": 356200 }, { "epoch": 0.62, "learning_rate": 1.894062786650251e-05, "loss": 2.3302, "step": 356210 }, { "epoch": 0.62, "learning_rate": 1.8939755926575685e-05, "loss": 2.2932, "step": 356220 }, { "epoch": 0.62, "learning_rate": 1.8938883986648855e-05, "loss": 2.2445, "step": 356230 }, { "epoch": 0.62, "learning_rate": 1.8938012046722033e-05, "loss": 2.3265, "step": 356240 }, { "epoch": 0.62, "learning_rate": 1.8937140106795203e-05, "loss": 2.2305, "step": 356250 }, { "epoch": 0.62, "learning_rate": 1.8936268166868377e-05, "loss": 2.4182, "step": 356260 }, { "epoch": 0.62, "learning_rate": 1.8935396226941547e-05, "loss": 2.3275, "step": 356270 }, { "epoch": 0.62, "learning_rate": 1.8934524287014724e-05, "loss": 2.3173, "step": 356280 }, { "epoch": 0.62, "learning_rate": 1.8933652347087895e-05, "loss": 2.3298, "step": 356290 }, { "epoch": 0.62, "learning_rate": 1.893278040716107e-05, "loss": 2.3564, "step": 356300 }, { "epoch": 0.62, "learning_rate": 1.8931908467234242e-05, "loss": 2.3315, "step": 356310 }, { "epoch": 0.62, "learning_rate": 1.8931036527307416e-05, "loss": 2.295, "step": 356320 }, { "epoch": 0.62, "learning_rate": 1.893016458738059e-05, "loss": 2.2873, "step": 356330 }, { "epoch": 0.62, "learning_rate": 1.892929264745376e-05, "loss": 2.3073, "step": 356340 }, { "epoch": 0.62, "learning_rate": 1.8928420707526934e-05, "loss": 2.2943, "step": 356350 }, { "epoch": 0.62, "learning_rate": 1.8927548767600108e-05, "loss": 2.3209, "step": 356360 }, { "epoch": 0.62, "learning_rate": 1.892667682767328e-05, "loss": 2.4581, "step": 356370 }, { "epoch": 0.62, "learning_rate": 1.8925804887746455e-05, "loss": 2.2646, "step": 356380 }, { "epoch": 0.62, "learning_rate": 1.892493294781963e-05, "loss": 2.4391, "step": 356390 }, { "epoch": 0.62, "learning_rate": 1.8924061007892803e-05, "loss": 2.3664, "step": 356400 }, { "epoch": 0.62, "learning_rate": 1.8923189067965973e-05, "loss": 2.2986, "step": 356410 }, { "epoch": 0.62, "learning_rate": 1.8922317128039147e-05, "loss": 2.2916, "step": 356420 }, { "epoch": 0.62, "learning_rate": 1.892144518811232e-05, "loss": 2.2781, "step": 356430 }, { "epoch": 0.62, "learning_rate": 1.8920573248185494e-05, "loss": 2.4411, "step": 356440 }, { "epoch": 0.62, "learning_rate": 1.8919701308258668e-05, "loss": 2.3222, "step": 356450 }, { "epoch": 0.62, "learning_rate": 1.891882936833184e-05, "loss": 2.3792, "step": 356460 }, { "epoch": 0.62, "learning_rate": 1.8917957428405016e-05, "loss": 2.2679, "step": 356470 }, { "epoch": 0.62, "learning_rate": 1.8917085488478186e-05, "loss": 2.3436, "step": 356480 }, { "epoch": 0.62, "learning_rate": 1.891621354855136e-05, "loss": 2.3273, "step": 356490 }, { "epoch": 0.62, "learning_rate": 1.8915341608624534e-05, "loss": 2.2842, "step": 356500 }, { "epoch": 0.62, "learning_rate": 1.8914469668697707e-05, "loss": 2.2644, "step": 356510 }, { "epoch": 0.62, "learning_rate": 1.8913597728770878e-05, "loss": 2.3222, "step": 356520 }, { "epoch": 0.62, "learning_rate": 1.891272578884405e-05, "loss": 2.3846, "step": 356530 }, { "epoch": 0.62, "learning_rate": 1.8911853848917225e-05, "loss": 2.298, "step": 356540 }, { "epoch": 0.62, "learning_rate": 1.89109819089904e-05, "loss": 2.2379, "step": 356550 }, { "epoch": 0.62, "learning_rate": 1.8910109969063573e-05, "loss": 2.3168, "step": 356560 }, { "epoch": 0.62, "learning_rate": 1.8909238029136743e-05, "loss": 2.3204, "step": 356570 }, { "epoch": 0.62, "learning_rate": 1.890836608920992e-05, "loss": 2.3687, "step": 356580 }, { "epoch": 0.62, "learning_rate": 1.890749414928309e-05, "loss": 2.2869, "step": 356590 }, { "epoch": 0.62, "learning_rate": 1.8906622209356265e-05, "loss": 2.3444, "step": 356600 }, { "epoch": 0.62, "learning_rate": 1.890575026942944e-05, "loss": 2.3335, "step": 356610 }, { "epoch": 0.62, "learning_rate": 1.8904878329502612e-05, "loss": 2.3575, "step": 356620 }, { "epoch": 0.62, "learning_rate": 1.8904006389575786e-05, "loss": 2.3868, "step": 356630 }, { "epoch": 0.62, "learning_rate": 1.8903134449648956e-05, "loss": 2.3724, "step": 356640 }, { "epoch": 0.62, "learning_rate": 1.8902262509722133e-05, "loss": 2.4142, "step": 356650 }, { "epoch": 0.62, "learning_rate": 1.8901390569795304e-05, "loss": 2.3533, "step": 356660 }, { "epoch": 0.62, "learning_rate": 1.8900518629868478e-05, "loss": 2.3666, "step": 356670 }, { "epoch": 0.62, "learning_rate": 1.889964668994165e-05, "loss": 2.2513, "step": 356680 }, { "epoch": 0.62, "learning_rate": 1.8898774750014825e-05, "loss": 2.3596, "step": 356690 }, { "epoch": 0.62, "learning_rate": 1.8897902810088e-05, "loss": 2.2842, "step": 356700 }, { "epoch": 0.62, "learning_rate": 1.889703087016117e-05, "loss": 2.3803, "step": 356710 }, { "epoch": 0.62, "learning_rate": 1.8896158930234343e-05, "loss": 2.2624, "step": 356720 }, { "epoch": 0.62, "learning_rate": 1.8895286990307517e-05, "loss": 2.2183, "step": 356730 }, { "epoch": 0.62, "learning_rate": 1.889441505038069e-05, "loss": 2.3214, "step": 356740 }, { "epoch": 0.62, "learning_rate": 1.889354311045386e-05, "loss": 2.3432, "step": 356750 }, { "epoch": 0.62, "learning_rate": 1.8892671170527038e-05, "loss": 2.4232, "step": 356760 }, { "epoch": 0.62, "learning_rate": 1.889179923060021e-05, "loss": 2.3673, "step": 356770 }, { "epoch": 0.62, "learning_rate": 1.8890927290673382e-05, "loss": 2.2613, "step": 356780 }, { "epoch": 0.62, "learning_rate": 1.8890055350746556e-05, "loss": 2.4343, "step": 356790 }, { "epoch": 0.62, "learning_rate": 1.888918341081973e-05, "loss": 2.4297, "step": 356800 }, { "epoch": 0.62, "learning_rate": 1.8888311470892904e-05, "loss": 2.3657, "step": 356810 }, { "epoch": 0.62, "learning_rate": 1.8887439530966074e-05, "loss": 2.2492, "step": 356820 }, { "epoch": 0.62, "learning_rate": 1.8886567591039248e-05, "loss": 2.4387, "step": 356830 }, { "epoch": 0.62, "learning_rate": 1.888569565111242e-05, "loss": 2.2978, "step": 356840 }, { "epoch": 0.62, "learning_rate": 1.8884823711185595e-05, "loss": 2.3477, "step": 356850 }, { "epoch": 0.62, "learning_rate": 1.888395177125877e-05, "loss": 2.4384, "step": 356860 }, { "epoch": 0.62, "learning_rate": 1.888307983133194e-05, "loss": 2.3278, "step": 356870 }, { "epoch": 0.62, "learning_rate": 1.8882207891405117e-05, "loss": 2.379, "step": 356880 }, { "epoch": 0.62, "learning_rate": 1.8881335951478287e-05, "loss": 2.4146, "step": 356890 }, { "epoch": 0.62, "learning_rate": 1.888046401155146e-05, "loss": 2.3258, "step": 356900 }, { "epoch": 0.62, "learning_rate": 1.8879592071624634e-05, "loss": 2.4013, "step": 356910 }, { "epoch": 0.62, "learning_rate": 1.8878720131697808e-05, "loss": 2.3681, "step": 356920 }, { "epoch": 0.62, "learning_rate": 1.8877848191770982e-05, "loss": 2.4141, "step": 356930 }, { "epoch": 0.62, "learning_rate": 1.8876976251844152e-05, "loss": 2.3257, "step": 356940 }, { "epoch": 0.62, "learning_rate": 1.887610431191733e-05, "loss": 2.3211, "step": 356950 }, { "epoch": 0.62, "learning_rate": 1.88752323719905e-05, "loss": 2.2529, "step": 356960 }, { "epoch": 0.62, "learning_rate": 1.8874360432063674e-05, "loss": 2.3409, "step": 356970 }, { "epoch": 0.62, "learning_rate": 1.8873488492136844e-05, "loss": 2.244, "step": 356980 }, { "epoch": 0.62, "learning_rate": 1.887261655221002e-05, "loss": 2.2589, "step": 356990 }, { "epoch": 0.62, "learning_rate": 1.887174461228319e-05, "loss": 2.2835, "step": 357000 }, { "epoch": 0.62, "learning_rate": 1.8870872672356365e-05, "loss": 2.42, "step": 357010 }, { "epoch": 0.62, "learning_rate": 1.887000073242954e-05, "loss": 2.3533, "step": 357020 }, { "epoch": 0.62, "learning_rate": 1.8869128792502713e-05, "loss": 2.3023, "step": 357030 }, { "epoch": 0.62, "learning_rate": 1.8868256852575887e-05, "loss": 2.2609, "step": 357040 }, { "epoch": 0.62, "learning_rate": 1.8867384912649057e-05, "loss": 2.3023, "step": 357050 }, { "epoch": 0.62, "learning_rate": 1.8866512972722234e-05, "loss": 2.3084, "step": 357060 }, { "epoch": 0.62, "learning_rate": 1.8865641032795405e-05, "loss": 2.4131, "step": 357070 }, { "epoch": 0.62, "learning_rate": 1.886476909286858e-05, "loss": 2.3842, "step": 357080 }, { "epoch": 0.62, "learning_rate": 1.8863897152941752e-05, "loss": 2.4207, "step": 357090 }, { "epoch": 0.62, "learning_rate": 1.8863025213014926e-05, "loss": 2.3816, "step": 357100 }, { "epoch": 0.62, "learning_rate": 1.88621532730881e-05, "loss": 2.3296, "step": 357110 }, { "epoch": 0.62, "learning_rate": 1.886128133316127e-05, "loss": 2.3944, "step": 357120 }, { "epoch": 0.62, "learning_rate": 1.8860409393234444e-05, "loss": 2.2914, "step": 357130 }, { "epoch": 0.62, "learning_rate": 1.8859537453307618e-05, "loss": 2.2479, "step": 357140 }, { "epoch": 0.62, "learning_rate": 1.885866551338079e-05, "loss": 2.3173, "step": 357150 }, { "epoch": 0.62, "learning_rate": 1.8857793573453962e-05, "loss": 2.3015, "step": 357160 }, { "epoch": 0.62, "learning_rate": 1.885692163352714e-05, "loss": 2.3053, "step": 357170 }, { "epoch": 0.62, "learning_rate": 1.8856049693600313e-05, "loss": 2.2867, "step": 357180 }, { "epoch": 0.62, "learning_rate": 1.8855177753673483e-05, "loss": 2.3839, "step": 357190 }, { "epoch": 0.62, "learning_rate": 1.8854305813746657e-05, "loss": 2.2292, "step": 357200 }, { "epoch": 0.62, "learning_rate": 1.885343387381983e-05, "loss": 2.239, "step": 357210 }, { "epoch": 0.62, "learning_rate": 1.8852561933893004e-05, "loss": 2.2211, "step": 357220 }, { "epoch": 0.62, "learning_rate": 1.8851689993966175e-05, "loss": 2.4452, "step": 357230 }, { "epoch": 0.62, "learning_rate": 1.885081805403935e-05, "loss": 2.2723, "step": 357240 }, { "epoch": 0.62, "learning_rate": 1.8849946114112522e-05, "loss": 2.2954, "step": 357250 }, { "epoch": 0.62, "learning_rate": 1.8849074174185696e-05, "loss": 2.3629, "step": 357260 }, { "epoch": 0.62, "learning_rate": 1.884820223425887e-05, "loss": 2.2766, "step": 357270 }, { "epoch": 0.62, "learning_rate": 1.884733029433204e-05, "loss": 2.3016, "step": 357280 }, { "epoch": 0.62, "learning_rate": 1.8846458354405217e-05, "loss": 2.2859, "step": 357290 }, { "epoch": 0.62, "learning_rate": 1.8845586414478388e-05, "loss": 2.2904, "step": 357300 }, { "epoch": 0.62, "learning_rate": 1.884471447455156e-05, "loss": 2.33, "step": 357310 }, { "epoch": 0.62, "learning_rate": 1.8843842534624735e-05, "loss": 2.3368, "step": 357320 }, { "epoch": 0.62, "learning_rate": 1.884297059469791e-05, "loss": 2.3611, "step": 357330 }, { "epoch": 0.62, "learning_rate": 1.8842098654771083e-05, "loss": 2.2721, "step": 357340 }, { "epoch": 0.62, "learning_rate": 1.8841226714844253e-05, "loss": 2.3709, "step": 357350 }, { "epoch": 0.62, "learning_rate": 1.884035477491743e-05, "loss": 2.4549, "step": 357360 }, { "epoch": 0.62, "learning_rate": 1.88394828349906e-05, "loss": 2.2903, "step": 357370 }, { "epoch": 0.62, "learning_rate": 1.8838610895063775e-05, "loss": 2.2842, "step": 357380 }, { "epoch": 0.62, "learning_rate": 1.8837738955136945e-05, "loss": 2.3938, "step": 357390 }, { "epoch": 0.62, "learning_rate": 1.8836867015210122e-05, "loss": 2.3038, "step": 357400 }, { "epoch": 0.62, "learning_rate": 1.8835995075283296e-05, "loss": 2.244, "step": 357410 }, { "epoch": 0.62, "learning_rate": 1.8835123135356466e-05, "loss": 2.3486, "step": 357420 }, { "epoch": 0.62, "learning_rate": 1.8834251195429643e-05, "loss": 2.4367, "step": 357430 }, { "epoch": 0.62, "learning_rate": 1.8833379255502814e-05, "loss": 2.315, "step": 357440 }, { "epoch": 0.62, "learning_rate": 1.8832507315575988e-05, "loss": 2.2748, "step": 357450 }, { "epoch": 0.62, "learning_rate": 1.8831635375649158e-05, "loss": 2.3412, "step": 357460 }, { "epoch": 0.62, "learning_rate": 1.8830763435722335e-05, "loss": 2.2601, "step": 357470 }, { "epoch": 0.62, "learning_rate": 1.8829891495795505e-05, "loss": 2.3776, "step": 357480 }, { "epoch": 0.62, "learning_rate": 1.882901955586868e-05, "loss": 2.1596, "step": 357490 }, { "epoch": 0.62, "learning_rate": 1.8828147615941853e-05, "loss": 2.2536, "step": 357500 }, { "epoch": 0.62, "learning_rate": 1.8827275676015027e-05, "loss": 2.2292, "step": 357510 }, { "epoch": 0.62, "learning_rate": 1.88264037360882e-05, "loss": 2.3426, "step": 357520 }, { "epoch": 0.62, "learning_rate": 1.882553179616137e-05, "loss": 2.1771, "step": 357530 }, { "epoch": 0.62, "learning_rate": 1.8824659856234545e-05, "loss": 2.4109, "step": 357540 }, { "epoch": 0.62, "learning_rate": 1.882378791630772e-05, "loss": 2.2637, "step": 357550 }, { "epoch": 0.62, "learning_rate": 1.8822915976380892e-05, "loss": 2.3279, "step": 357560 }, { "epoch": 0.62, "learning_rate": 1.8822044036454066e-05, "loss": 2.4886, "step": 357570 }, { "epoch": 0.62, "learning_rate": 1.882117209652724e-05, "loss": 2.2749, "step": 357580 }, { "epoch": 0.62, "learning_rate": 1.8820300156600414e-05, "loss": 2.3402, "step": 357590 }, { "epoch": 0.62, "learning_rate": 1.8819428216673584e-05, "loss": 2.3482, "step": 357600 }, { "epoch": 0.62, "learning_rate": 1.8818556276746758e-05, "loss": 2.3285, "step": 357610 }, { "epoch": 0.62, "learning_rate": 1.881768433681993e-05, "loss": 2.3246, "step": 357620 }, { "epoch": 0.62, "learning_rate": 1.8816812396893105e-05, "loss": 2.3891, "step": 357630 }, { "epoch": 0.62, "learning_rate": 1.8815940456966276e-05, "loss": 2.2494, "step": 357640 }, { "epoch": 0.62, "learning_rate": 1.881506851703945e-05, "loss": 2.2967, "step": 357650 }, { "epoch": 0.62, "learning_rate": 1.8814196577112627e-05, "loss": 2.3517, "step": 357660 }, { "epoch": 0.62, "learning_rate": 1.8813324637185797e-05, "loss": 2.346, "step": 357670 }, { "epoch": 0.62, "learning_rate": 1.881245269725897e-05, "loss": 2.2734, "step": 357680 }, { "epoch": 0.62, "learning_rate": 1.8811580757332144e-05, "loss": 2.275, "step": 357690 }, { "epoch": 0.62, "learning_rate": 1.8810708817405318e-05, "loss": 2.3966, "step": 357700 }, { "epoch": 0.62, "learning_rate": 1.880983687747849e-05, "loss": 2.2174, "step": 357710 }, { "epoch": 0.62, "learning_rate": 1.8808964937551662e-05, "loss": 2.2751, "step": 357720 }, { "epoch": 0.62, "learning_rate": 1.8808092997624836e-05, "loss": 2.1238, "step": 357730 }, { "epoch": 0.62, "learning_rate": 1.880722105769801e-05, "loss": 2.419, "step": 357740 }, { "epoch": 0.62, "learning_rate": 1.8806349117771184e-05, "loss": 2.4245, "step": 357750 }, { "epoch": 0.62, "learning_rate": 1.8805477177844354e-05, "loss": 2.3665, "step": 357760 }, { "epoch": 0.62, "learning_rate": 1.880460523791753e-05, "loss": 2.3478, "step": 357770 }, { "epoch": 0.62, "learning_rate": 1.88037332979907e-05, "loss": 2.3016, "step": 357780 }, { "epoch": 0.62, "learning_rate": 1.8802861358063875e-05, "loss": 2.3211, "step": 357790 }, { "epoch": 0.62, "learning_rate": 1.880198941813705e-05, "loss": 2.3782, "step": 357800 }, { "epoch": 0.62, "learning_rate": 1.8801117478210223e-05, "loss": 2.4556, "step": 357810 }, { "epoch": 0.62, "learning_rate": 1.8800245538283397e-05, "loss": 2.3891, "step": 357820 }, { "epoch": 0.62, "learning_rate": 1.8799373598356567e-05, "loss": 2.2876, "step": 357830 }, { "epoch": 0.62, "learning_rate": 1.8798501658429744e-05, "loss": 2.4269, "step": 357840 }, { "epoch": 0.62, "learning_rate": 1.8797629718502915e-05, "loss": 2.389, "step": 357850 }, { "epoch": 0.62, "learning_rate": 1.879675777857609e-05, "loss": 2.2032, "step": 357860 }, { "epoch": 0.62, "learning_rate": 1.879588583864926e-05, "loss": 2.3393, "step": 357870 }, { "epoch": 0.62, "learning_rate": 1.8795013898722436e-05, "loss": 2.3608, "step": 357880 }, { "epoch": 0.62, "learning_rate": 1.8794141958795606e-05, "loss": 2.4567, "step": 357890 }, { "epoch": 0.62, "learning_rate": 1.879327001886878e-05, "loss": 2.298, "step": 357900 }, { "epoch": 0.62, "learning_rate": 1.8792398078941954e-05, "loss": 2.2986, "step": 357910 }, { "epoch": 0.62, "learning_rate": 1.8791526139015128e-05, "loss": 2.2639, "step": 357920 }, { "epoch": 0.62, "learning_rate": 1.87906541990883e-05, "loss": 2.2596, "step": 357930 }, { "epoch": 0.62, "learning_rate": 1.8789782259161472e-05, "loss": 2.2381, "step": 357940 }, { "epoch": 0.62, "learning_rate": 1.878891031923465e-05, "loss": 2.273, "step": 357950 }, { "epoch": 0.62, "learning_rate": 1.878803837930782e-05, "loss": 2.2738, "step": 357960 }, { "epoch": 0.62, "learning_rate": 1.8787166439380993e-05, "loss": 2.3813, "step": 357970 }, { "epoch": 0.62, "learning_rate": 1.8786294499454167e-05, "loss": 2.3407, "step": 357980 }, { "epoch": 0.62, "learning_rate": 1.878542255952734e-05, "loss": 2.3659, "step": 357990 }, { "epoch": 0.62, "learning_rate": 1.8784550619600514e-05, "loss": 2.3094, "step": 358000 }, { "epoch": 0.62, "learning_rate": 1.8783678679673685e-05, "loss": 2.3836, "step": 358010 }, { "epoch": 0.62, "learning_rate": 1.878280673974686e-05, "loss": 2.3122, "step": 358020 }, { "epoch": 0.62, "learning_rate": 1.8781934799820032e-05, "loss": 2.3104, "step": 358030 }, { "epoch": 0.62, "learning_rate": 1.8781062859893206e-05, "loss": 2.4044, "step": 358040 }, { "epoch": 0.62, "learning_rate": 1.878019091996638e-05, "loss": 2.3289, "step": 358050 }, { "epoch": 0.62, "learning_rate": 1.877931898003955e-05, "loss": 2.3406, "step": 358060 }, { "epoch": 0.62, "learning_rate": 1.8778447040112727e-05, "loss": 2.2568, "step": 358070 }, { "epoch": 0.62, "learning_rate": 1.8777575100185898e-05, "loss": 2.3536, "step": 358080 }, { "epoch": 0.62, "learning_rate": 1.877670316025907e-05, "loss": 2.2192, "step": 358090 }, { "epoch": 0.62, "learning_rate": 1.8775831220332245e-05, "loss": 2.3717, "step": 358100 }, { "epoch": 0.62, "learning_rate": 1.877495928040542e-05, "loss": 2.3312, "step": 358110 }, { "epoch": 0.62, "learning_rate": 1.877408734047859e-05, "loss": 2.2982, "step": 358120 }, { "epoch": 0.62, "learning_rate": 1.8773215400551763e-05, "loss": 2.4005, "step": 358130 }, { "epoch": 0.62, "learning_rate": 1.877234346062494e-05, "loss": 2.3646, "step": 358140 }, { "epoch": 0.62, "learning_rate": 1.877147152069811e-05, "loss": 2.2479, "step": 358150 }, { "epoch": 0.62, "learning_rate": 1.8770599580771285e-05, "loss": 2.3106, "step": 358160 }, { "epoch": 0.62, "learning_rate": 1.8769727640844455e-05, "loss": 2.2372, "step": 358170 }, { "epoch": 0.62, "learning_rate": 1.8768855700917632e-05, "loss": 2.3273, "step": 358180 }, { "epoch": 0.62, "learning_rate": 1.8767983760990802e-05, "loss": 2.2882, "step": 358190 }, { "epoch": 0.62, "learning_rate": 1.8767111821063976e-05, "loss": 2.4046, "step": 358200 }, { "epoch": 0.62, "learning_rate": 1.876623988113715e-05, "loss": 2.3089, "step": 358210 }, { "epoch": 0.62, "learning_rate": 1.8765367941210324e-05, "loss": 2.3903, "step": 358220 }, { "epoch": 0.62, "learning_rate": 1.8764496001283498e-05, "loss": 2.2897, "step": 358230 }, { "epoch": 0.62, "learning_rate": 1.8763624061356668e-05, "loss": 2.3841, "step": 358240 }, { "epoch": 0.62, "learning_rate": 1.8762752121429845e-05, "loss": 2.3597, "step": 358250 }, { "epoch": 0.62, "learning_rate": 1.8761880181503015e-05, "loss": 2.2177, "step": 358260 }, { "epoch": 0.62, "learning_rate": 1.876100824157619e-05, "loss": 2.4074, "step": 358270 }, { "epoch": 0.62, "learning_rate": 1.8760136301649363e-05, "loss": 2.4473, "step": 358280 }, { "epoch": 0.62, "learning_rate": 1.8759264361722537e-05, "loss": 2.3493, "step": 358290 }, { "epoch": 0.62, "learning_rate": 1.875839242179571e-05, "loss": 2.2754, "step": 358300 }, { "epoch": 0.62, "learning_rate": 1.875752048186888e-05, "loss": 2.3765, "step": 358310 }, { "epoch": 0.62, "learning_rate": 1.8756648541942055e-05, "loss": 2.2649, "step": 358320 }, { "epoch": 0.62, "learning_rate": 1.875577660201523e-05, "loss": 2.363, "step": 358330 }, { "epoch": 0.62, "learning_rate": 1.8754904662088402e-05, "loss": 2.2633, "step": 358340 }, { "epoch": 0.62, "learning_rate": 1.8754032722161573e-05, "loss": 2.3136, "step": 358350 }, { "epoch": 0.62, "learning_rate": 1.875316078223475e-05, "loss": 2.2087, "step": 358360 }, { "epoch": 0.62, "learning_rate": 1.875228884230792e-05, "loss": 2.3397, "step": 358370 }, { "epoch": 0.62, "learning_rate": 1.8751416902381094e-05, "loss": 2.2177, "step": 358380 }, { "epoch": 0.62, "learning_rate": 1.8750544962454268e-05, "loss": 2.3647, "step": 358390 }, { "epoch": 0.63, "learning_rate": 1.874967302252744e-05, "loss": 2.3245, "step": 358400 }, { "epoch": 0.63, "learning_rate": 1.8748801082600615e-05, "loss": 2.4044, "step": 358410 }, { "epoch": 0.63, "learning_rate": 1.8747929142673786e-05, "loss": 2.4123, "step": 358420 }, { "epoch": 0.63, "learning_rate": 1.874705720274696e-05, "loss": 2.3928, "step": 358430 }, { "epoch": 0.63, "learning_rate": 1.8746185262820133e-05, "loss": 2.2162, "step": 358440 }, { "epoch": 0.63, "learning_rate": 1.8745313322893307e-05, "loss": 2.26, "step": 358450 }, { "epoch": 0.63, "learning_rate": 1.874444138296648e-05, "loss": 2.3233, "step": 358460 }, { "epoch": 0.63, "learning_rate": 1.874356944303965e-05, "loss": 2.349, "step": 358470 }, { "epoch": 0.63, "learning_rate": 1.8742697503112828e-05, "loss": 2.3334, "step": 358480 }, { "epoch": 0.63, "learning_rate": 1.8741825563186e-05, "loss": 2.3606, "step": 358490 }, { "epoch": 0.63, "learning_rate": 1.8740953623259172e-05, "loss": 2.375, "step": 358500 }, { "epoch": 0.63, "learning_rate": 1.8740081683332346e-05, "loss": 2.2859, "step": 358510 }, { "epoch": 0.63, "learning_rate": 1.873920974340552e-05, "loss": 2.3198, "step": 358520 }, { "epoch": 0.63, "learning_rate": 1.8738337803478694e-05, "loss": 2.3127, "step": 358530 }, { "epoch": 0.63, "learning_rate": 1.8737465863551864e-05, "loss": 2.4314, "step": 358540 }, { "epoch": 0.63, "learning_rate": 1.873659392362504e-05, "loss": 2.3237, "step": 358550 }, { "epoch": 0.63, "learning_rate": 1.873572198369821e-05, "loss": 2.3599, "step": 358560 }, { "epoch": 0.63, "learning_rate": 1.8734850043771385e-05, "loss": 2.2954, "step": 358570 }, { "epoch": 0.63, "learning_rate": 1.8733978103844556e-05, "loss": 2.2484, "step": 358580 }, { "epoch": 0.63, "learning_rate": 1.8733106163917733e-05, "loss": 2.3265, "step": 358590 }, { "epoch": 0.63, "learning_rate": 1.8732234223990903e-05, "loss": 2.2142, "step": 358600 }, { "epoch": 0.63, "learning_rate": 1.8731362284064077e-05, "loss": 2.3286, "step": 358610 }, { "epoch": 0.63, "learning_rate": 1.8730490344137254e-05, "loss": 2.4028, "step": 358620 }, { "epoch": 0.63, "learning_rate": 1.8729618404210425e-05, "loss": 2.2722, "step": 358630 }, { "epoch": 0.63, "learning_rate": 1.87287464642836e-05, "loss": 2.2914, "step": 358640 }, { "epoch": 0.63, "learning_rate": 1.872787452435677e-05, "loss": 2.3324, "step": 358650 }, { "epoch": 0.63, "learning_rate": 1.8727002584429946e-05, "loss": 2.3589, "step": 358660 }, { "epoch": 0.63, "learning_rate": 1.8726130644503116e-05, "loss": 2.3272, "step": 358670 }, { "epoch": 0.63, "learning_rate": 1.872525870457629e-05, "loss": 2.2798, "step": 358680 }, { "epoch": 0.63, "learning_rate": 1.8724386764649464e-05, "loss": 2.3121, "step": 358690 }, { "epoch": 0.63, "learning_rate": 1.8723514824722638e-05, "loss": 2.3859, "step": 358700 }, { "epoch": 0.63, "learning_rate": 1.872264288479581e-05, "loss": 2.1834, "step": 358710 }, { "epoch": 0.63, "learning_rate": 1.8721770944868982e-05, "loss": 2.4517, "step": 358720 }, { "epoch": 0.63, "learning_rate": 1.8720899004942156e-05, "loss": 2.3427, "step": 358730 }, { "epoch": 0.63, "learning_rate": 1.872002706501533e-05, "loss": 2.3583, "step": 358740 }, { "epoch": 0.63, "learning_rate": 1.8719155125088503e-05, "loss": 2.3255, "step": 358750 }, { "epoch": 0.63, "learning_rate": 1.8718283185161677e-05, "loss": 2.2382, "step": 358760 }, { "epoch": 0.63, "learning_rate": 1.871741124523485e-05, "loss": 2.2967, "step": 358770 }, { "epoch": 0.63, "learning_rate": 1.8716539305308024e-05, "loss": 2.3961, "step": 358780 }, { "epoch": 0.63, "learning_rate": 1.8715667365381195e-05, "loss": 2.3348, "step": 358790 }, { "epoch": 0.63, "learning_rate": 1.871479542545437e-05, "loss": 2.3484, "step": 358800 }, { "epoch": 0.63, "learning_rate": 1.8713923485527542e-05, "loss": 2.2435, "step": 358810 }, { "epoch": 0.63, "learning_rate": 1.8713051545600716e-05, "loss": 2.2959, "step": 358820 }, { "epoch": 0.63, "learning_rate": 1.8712179605673886e-05, "loss": 2.3668, "step": 358830 }, { "epoch": 0.63, "learning_rate": 1.871130766574706e-05, "loss": 2.3754, "step": 358840 }, { "epoch": 0.63, "learning_rate": 1.8710435725820234e-05, "loss": 2.3233, "step": 358850 }, { "epoch": 0.63, "learning_rate": 1.8709563785893408e-05, "loss": 2.3475, "step": 358860 }, { "epoch": 0.63, "learning_rate": 1.870869184596658e-05, "loss": 2.1582, "step": 358870 }, { "epoch": 0.63, "learning_rate": 1.8707819906039755e-05, "loss": 2.3534, "step": 358880 }, { "epoch": 0.63, "learning_rate": 1.870694796611293e-05, "loss": 2.3415, "step": 358890 }, { "epoch": 0.63, "learning_rate": 1.87060760261861e-05, "loss": 2.3605, "step": 358900 }, { "epoch": 0.63, "learning_rate": 1.8705204086259273e-05, "loss": 2.2862, "step": 358910 }, { "epoch": 0.63, "learning_rate": 1.8704332146332447e-05, "loss": 2.3182, "step": 358920 }, { "epoch": 0.63, "learning_rate": 1.870346020640562e-05, "loss": 2.3187, "step": 358930 }, { "epoch": 0.63, "learning_rate": 1.8702588266478795e-05, "loss": 2.2725, "step": 358940 }, { "epoch": 0.63, "learning_rate": 1.8701716326551965e-05, "loss": 2.3321, "step": 358950 }, { "epoch": 0.63, "learning_rate": 1.8700844386625142e-05, "loss": 2.2254, "step": 358960 }, { "epoch": 0.63, "learning_rate": 1.8699972446698312e-05, "loss": 2.3909, "step": 358970 }, { "epoch": 0.63, "learning_rate": 1.8699100506771486e-05, "loss": 2.3918, "step": 358980 }, { "epoch": 0.63, "learning_rate": 1.8698228566844657e-05, "loss": 2.2291, "step": 358990 }, { "epoch": 0.63, "learning_rate": 1.8697356626917834e-05, "loss": 2.3377, "step": 359000 }, { "epoch": 0.63, "learning_rate": 1.8696484686991008e-05, "loss": 2.3056, "step": 359010 }, { "epoch": 0.63, "learning_rate": 1.8695612747064178e-05, "loss": 2.3638, "step": 359020 }, { "epoch": 0.63, "learning_rate": 1.8694740807137355e-05, "loss": 2.4012, "step": 359030 }, { "epoch": 0.63, "learning_rate": 1.8693868867210525e-05, "loss": 2.3321, "step": 359040 }, { "epoch": 0.63, "learning_rate": 1.86929969272837e-05, "loss": 2.3501, "step": 359050 }, { "epoch": 0.63, "learning_rate": 1.869212498735687e-05, "loss": 2.3701, "step": 359060 }, { "epoch": 0.63, "learning_rate": 1.8691253047430047e-05, "loss": 2.2844, "step": 359070 }, { "epoch": 0.63, "learning_rate": 1.8690381107503217e-05, "loss": 2.2729, "step": 359080 }, { "epoch": 0.63, "learning_rate": 1.868950916757639e-05, "loss": 2.3677, "step": 359090 }, { "epoch": 0.63, "learning_rate": 1.8688637227649565e-05, "loss": 2.3185, "step": 359100 }, { "epoch": 0.63, "learning_rate": 1.868776528772274e-05, "loss": 2.3237, "step": 359110 }, { "epoch": 0.63, "learning_rate": 1.8686893347795912e-05, "loss": 2.1986, "step": 359120 }, { "epoch": 0.63, "learning_rate": 1.8686021407869083e-05, "loss": 2.3544, "step": 359130 }, { "epoch": 0.63, "learning_rate": 1.8685149467942256e-05, "loss": 2.3469, "step": 359140 }, { "epoch": 0.63, "learning_rate": 1.868427752801543e-05, "loss": 2.2607, "step": 359150 }, { "epoch": 0.63, "learning_rate": 1.8683405588088604e-05, "loss": 2.3729, "step": 359160 }, { "epoch": 0.63, "learning_rate": 1.8682533648161778e-05, "loss": 2.342, "step": 359170 }, { "epoch": 0.63, "learning_rate": 1.868166170823495e-05, "loss": 2.3696, "step": 359180 }, { "epoch": 0.63, "learning_rate": 1.8680789768308125e-05, "loss": 2.2784, "step": 359190 }, { "epoch": 0.63, "learning_rate": 1.8679917828381296e-05, "loss": 2.3106, "step": 359200 }, { "epoch": 0.63, "learning_rate": 1.867904588845447e-05, "loss": 2.3327, "step": 359210 }, { "epoch": 0.63, "learning_rate": 1.8678173948527643e-05, "loss": 2.261, "step": 359220 }, { "epoch": 0.63, "learning_rate": 1.8677302008600817e-05, "loss": 2.1892, "step": 359230 }, { "epoch": 0.63, "learning_rate": 1.867643006867399e-05, "loss": 2.3241, "step": 359240 }, { "epoch": 0.63, "learning_rate": 1.867555812874716e-05, "loss": 2.2214, "step": 359250 }, { "epoch": 0.63, "learning_rate": 1.8674686188820338e-05, "loss": 2.2059, "step": 359260 }, { "epoch": 0.63, "learning_rate": 1.867381424889351e-05, "loss": 2.3417, "step": 359270 }, { "epoch": 0.63, "learning_rate": 1.8672942308966682e-05, "loss": 2.2739, "step": 359280 }, { "epoch": 0.63, "learning_rate": 1.8672070369039856e-05, "loss": 2.3435, "step": 359290 }, { "epoch": 0.63, "learning_rate": 1.867119842911303e-05, "loss": 2.3945, "step": 359300 }, { "epoch": 0.63, "learning_rate": 1.86703264891862e-05, "loss": 2.4295, "step": 359310 }, { "epoch": 0.63, "learning_rate": 1.8669454549259374e-05, "loss": 2.3564, "step": 359320 }, { "epoch": 0.63, "learning_rate": 1.8668582609332548e-05, "loss": 2.3998, "step": 359330 }, { "epoch": 0.63, "learning_rate": 1.866771066940572e-05, "loss": 2.3034, "step": 359340 }, { "epoch": 0.63, "learning_rate": 1.8666838729478895e-05, "loss": 2.3517, "step": 359350 }, { "epoch": 0.63, "learning_rate": 1.8665966789552066e-05, "loss": 2.3221, "step": 359360 }, { "epoch": 0.63, "learning_rate": 1.8665094849625243e-05, "loss": 2.3625, "step": 359370 }, { "epoch": 0.63, "learning_rate": 1.8664222909698413e-05, "loss": 2.4176, "step": 359380 }, { "epoch": 0.63, "learning_rate": 1.8663350969771587e-05, "loss": 2.2456, "step": 359390 }, { "epoch": 0.63, "learning_rate": 1.866247902984476e-05, "loss": 2.4152, "step": 359400 }, { "epoch": 0.63, "learning_rate": 1.8661607089917935e-05, "loss": 2.3181, "step": 359410 }, { "epoch": 0.63, "learning_rate": 1.866073514999111e-05, "loss": 2.3255, "step": 359420 }, { "epoch": 0.63, "learning_rate": 1.865986321006428e-05, "loss": 2.2602, "step": 359430 }, { "epoch": 0.63, "learning_rate": 1.8658991270137456e-05, "loss": 2.3051, "step": 359440 }, { "epoch": 0.63, "learning_rate": 1.8658119330210626e-05, "loss": 2.2182, "step": 359450 }, { "epoch": 0.63, "learning_rate": 1.86572473902838e-05, "loss": 2.3996, "step": 359460 }, { "epoch": 0.63, "learning_rate": 1.865637545035697e-05, "loss": 2.2939, "step": 359470 }, { "epoch": 0.63, "learning_rate": 1.8655503510430148e-05, "loss": 2.3595, "step": 359480 }, { "epoch": 0.63, "learning_rate": 1.865463157050332e-05, "loss": 2.2625, "step": 359490 }, { "epoch": 0.63, "learning_rate": 1.8653759630576492e-05, "loss": 2.375, "step": 359500 }, { "epoch": 0.63, "learning_rate": 1.8652887690649666e-05, "loss": 2.3997, "step": 359510 }, { "epoch": 0.63, "learning_rate": 1.865201575072284e-05, "loss": 2.4011, "step": 359520 }, { "epoch": 0.63, "learning_rate": 1.8651143810796013e-05, "loss": 2.3425, "step": 359530 }, { "epoch": 0.63, "learning_rate": 1.8650271870869183e-05, "loss": 2.3847, "step": 359540 }, { "epoch": 0.63, "learning_rate": 1.864939993094236e-05, "loss": 2.3446, "step": 359550 }, { "epoch": 0.63, "learning_rate": 1.864852799101553e-05, "loss": 2.2814, "step": 359560 }, { "epoch": 0.63, "learning_rate": 1.8647656051088705e-05, "loss": 2.3724, "step": 359570 }, { "epoch": 0.63, "learning_rate": 1.864678411116188e-05, "loss": 2.306, "step": 359580 }, { "epoch": 0.63, "learning_rate": 1.8645912171235052e-05, "loss": 2.2665, "step": 359590 }, { "epoch": 0.63, "learning_rate": 1.8645040231308226e-05, "loss": 2.3301, "step": 359600 }, { "epoch": 0.63, "learning_rate": 1.8644168291381396e-05, "loss": 2.319, "step": 359610 }, { "epoch": 0.63, "learning_rate": 1.864329635145457e-05, "loss": 2.3053, "step": 359620 }, { "epoch": 0.63, "learning_rate": 1.8642424411527744e-05, "loss": 2.2944, "step": 359630 }, { "epoch": 0.63, "learning_rate": 1.8641552471600918e-05, "loss": 2.3189, "step": 359640 }, { "epoch": 0.63, "learning_rate": 1.864068053167409e-05, "loss": 2.3437, "step": 359650 }, { "epoch": 0.63, "learning_rate": 1.8639808591747262e-05, "loss": 2.2602, "step": 359660 }, { "epoch": 0.63, "learning_rate": 1.863893665182044e-05, "loss": 2.3275, "step": 359670 }, { "epoch": 0.63, "learning_rate": 1.863806471189361e-05, "loss": 2.3471, "step": 359680 }, { "epoch": 0.63, "learning_rate": 1.8637192771966783e-05, "loss": 2.2516, "step": 359690 }, { "epoch": 0.63, "learning_rate": 1.8636320832039957e-05, "loss": 2.4334, "step": 359700 }, { "epoch": 0.63, "learning_rate": 1.863544889211313e-05, "loss": 2.2997, "step": 359710 }, { "epoch": 0.63, "learning_rate": 1.86345769521863e-05, "loss": 2.3031, "step": 359720 }, { "epoch": 0.63, "learning_rate": 1.8633705012259475e-05, "loss": 2.2232, "step": 359730 }, { "epoch": 0.63, "learning_rate": 1.8632833072332652e-05, "loss": 2.3528, "step": 359740 }, { "epoch": 0.63, "learning_rate": 1.8631961132405822e-05, "loss": 2.3817, "step": 359750 }, { "epoch": 0.63, "learning_rate": 1.8631089192478996e-05, "loss": 2.315, "step": 359760 }, { "epoch": 0.63, "learning_rate": 1.8630217252552167e-05, "loss": 2.2895, "step": 359770 }, { "epoch": 0.63, "learning_rate": 1.8629345312625344e-05, "loss": 2.3053, "step": 359780 }, { "epoch": 0.63, "learning_rate": 1.8628473372698514e-05, "loss": 2.2577, "step": 359790 }, { "epoch": 0.63, "learning_rate": 1.8627601432771688e-05, "loss": 2.3411, "step": 359800 }, { "epoch": 0.63, "learning_rate": 1.8626729492844862e-05, "loss": 2.3119, "step": 359810 }, { "epoch": 0.63, "learning_rate": 1.8625857552918035e-05, "loss": 2.3855, "step": 359820 }, { "epoch": 0.63, "learning_rate": 1.862498561299121e-05, "loss": 2.3624, "step": 359830 }, { "epoch": 0.63, "learning_rate": 1.862411367306438e-05, "loss": 2.3367, "step": 359840 }, { "epoch": 0.63, "learning_rate": 1.8623241733137557e-05, "loss": 2.2404, "step": 359850 }, { "epoch": 0.63, "learning_rate": 1.8622369793210727e-05, "loss": 2.3829, "step": 359860 }, { "epoch": 0.63, "learning_rate": 1.86214978532839e-05, "loss": 2.2968, "step": 359870 }, { "epoch": 0.63, "learning_rate": 1.8620625913357075e-05, "loss": 2.3606, "step": 359880 }, { "epoch": 0.63, "learning_rate": 1.861975397343025e-05, "loss": 2.3589, "step": 359890 }, { "epoch": 0.63, "learning_rate": 1.8618882033503422e-05, "loss": 2.3698, "step": 359900 }, { "epoch": 0.63, "learning_rate": 1.8618010093576593e-05, "loss": 2.2979, "step": 359910 }, { "epoch": 0.63, "learning_rate": 1.8617138153649766e-05, "loss": 2.2671, "step": 359920 }, { "epoch": 0.63, "learning_rate": 1.861626621372294e-05, "loss": 2.1954, "step": 359930 }, { "epoch": 0.63, "learning_rate": 1.8615394273796114e-05, "loss": 2.3208, "step": 359940 }, { "epoch": 0.63, "learning_rate": 1.8614522333869284e-05, "loss": 2.2864, "step": 359950 }, { "epoch": 0.63, "learning_rate": 1.861365039394246e-05, "loss": 2.3194, "step": 359960 }, { "epoch": 0.63, "learning_rate": 1.8612778454015635e-05, "loss": 2.2356, "step": 359970 }, { "epoch": 0.63, "learning_rate": 1.8611906514088806e-05, "loss": 2.4041, "step": 359980 }, { "epoch": 0.63, "learning_rate": 1.861103457416198e-05, "loss": 2.3567, "step": 359990 }, { "epoch": 0.63, "learning_rate": 1.8610162634235153e-05, "loss": 2.3732, "step": 360000 }, { "epoch": 0.63, "learning_rate": 1.8609290694308327e-05, "loss": 2.288, "step": 360010 }, { "epoch": 0.63, "learning_rate": 1.8608418754381497e-05, "loss": 2.3511, "step": 360020 }, { "epoch": 0.63, "learning_rate": 1.860754681445467e-05, "loss": 2.3299, "step": 360030 }, { "epoch": 0.63, "learning_rate": 1.8606674874527845e-05, "loss": 2.3115, "step": 360040 }, { "epoch": 0.63, "learning_rate": 1.860580293460102e-05, "loss": 2.2577, "step": 360050 }, { "epoch": 0.63, "learning_rate": 1.8604930994674192e-05, "loss": 2.4564, "step": 360060 }, { "epoch": 0.63, "learning_rate": 1.8604059054747363e-05, "loss": 2.33, "step": 360070 }, { "epoch": 0.63, "learning_rate": 1.860318711482054e-05, "loss": 2.283, "step": 360080 }, { "epoch": 0.63, "learning_rate": 1.860231517489371e-05, "loss": 2.3601, "step": 360090 }, { "epoch": 0.63, "learning_rate": 1.8601443234966884e-05, "loss": 2.3077, "step": 360100 }, { "epoch": 0.63, "learning_rate": 1.8600571295040058e-05, "loss": 2.3001, "step": 360110 }, { "epoch": 0.63, "learning_rate": 1.859969935511323e-05, "loss": 2.2787, "step": 360120 }, { "epoch": 0.63, "learning_rate": 1.8598827415186405e-05, "loss": 2.4189, "step": 360130 }, { "epoch": 0.63, "learning_rate": 1.8597955475259576e-05, "loss": 2.392, "step": 360140 }, { "epoch": 0.63, "learning_rate": 1.8597083535332753e-05, "loss": 2.2584, "step": 360150 }, { "epoch": 0.63, "learning_rate": 1.8596211595405923e-05, "loss": 2.2234, "step": 360160 }, { "epoch": 0.63, "learning_rate": 1.8595339655479097e-05, "loss": 2.3709, "step": 360170 }, { "epoch": 0.63, "learning_rate": 1.8594467715552267e-05, "loss": 2.3995, "step": 360180 }, { "epoch": 0.63, "learning_rate": 1.8593595775625445e-05, "loss": 2.4375, "step": 360190 }, { "epoch": 0.63, "learning_rate": 1.8592723835698615e-05, "loss": 2.42, "step": 360200 }, { "epoch": 0.63, "learning_rate": 1.859185189577179e-05, "loss": 2.2037, "step": 360210 }, { "epoch": 0.63, "learning_rate": 1.8590979955844966e-05, "loss": 2.3427, "step": 360220 }, { "epoch": 0.63, "learning_rate": 1.8590108015918136e-05, "loss": 2.2992, "step": 360230 }, { "epoch": 0.63, "learning_rate": 1.858923607599131e-05, "loss": 2.2579, "step": 360240 }, { "epoch": 0.63, "learning_rate": 1.858836413606448e-05, "loss": 2.3106, "step": 360250 }, { "epoch": 0.63, "learning_rate": 1.8587492196137658e-05, "loss": 2.3462, "step": 360260 }, { "epoch": 0.63, "learning_rate": 1.8586620256210828e-05, "loss": 2.1572, "step": 360270 }, { "epoch": 0.63, "learning_rate": 1.8585748316284002e-05, "loss": 2.3359, "step": 360280 }, { "epoch": 0.63, "learning_rate": 1.8584876376357176e-05, "loss": 2.34, "step": 360290 }, { "epoch": 0.63, "learning_rate": 1.858400443643035e-05, "loss": 2.3627, "step": 360300 }, { "epoch": 0.63, "learning_rate": 1.8583132496503523e-05, "loss": 2.3947, "step": 360310 }, { "epoch": 0.63, "learning_rate": 1.8582260556576694e-05, "loss": 2.3286, "step": 360320 }, { "epoch": 0.63, "learning_rate": 1.8581388616649867e-05, "loss": 2.2761, "step": 360330 }, { "epoch": 0.63, "learning_rate": 1.858051667672304e-05, "loss": 2.3497, "step": 360340 }, { "epoch": 0.63, "learning_rate": 1.8579644736796215e-05, "loss": 2.3138, "step": 360350 }, { "epoch": 0.63, "learning_rate": 1.857877279686939e-05, "loss": 2.29, "step": 360360 }, { "epoch": 0.63, "learning_rate": 1.8577900856942562e-05, "loss": 2.3254, "step": 360370 }, { "epoch": 0.63, "learning_rate": 1.8577028917015736e-05, "loss": 2.3712, "step": 360380 }, { "epoch": 0.63, "learning_rate": 1.8576156977088907e-05, "loss": 2.3404, "step": 360390 }, { "epoch": 0.63, "learning_rate": 1.857528503716208e-05, "loss": 2.3092, "step": 360400 }, { "epoch": 0.63, "learning_rate": 1.8574413097235254e-05, "loss": 2.346, "step": 360410 }, { "epoch": 0.63, "learning_rate": 1.8573541157308428e-05, "loss": 2.2189, "step": 360420 }, { "epoch": 0.63, "learning_rate": 1.8572669217381598e-05, "loss": 2.2769, "step": 360430 }, { "epoch": 0.63, "learning_rate": 1.8571797277454772e-05, "loss": 2.4136, "step": 360440 }, { "epoch": 0.63, "learning_rate": 1.8570925337527946e-05, "loss": 2.2848, "step": 360450 }, { "epoch": 0.63, "learning_rate": 1.857005339760112e-05, "loss": 2.2392, "step": 360460 }, { "epoch": 0.63, "learning_rate": 1.8569181457674293e-05, "loss": 2.3603, "step": 360470 }, { "epoch": 0.63, "learning_rate": 1.8568309517747467e-05, "loss": 2.2571, "step": 360480 }, { "epoch": 0.63, "learning_rate": 1.856743757782064e-05, "loss": 2.2838, "step": 360490 }, { "epoch": 0.63, "learning_rate": 1.856656563789381e-05, "loss": 2.3356, "step": 360500 }, { "epoch": 0.63, "learning_rate": 1.8565693697966985e-05, "loss": 2.286, "step": 360510 }, { "epoch": 0.63, "learning_rate": 1.856482175804016e-05, "loss": 2.2508, "step": 360520 }, { "epoch": 0.63, "learning_rate": 1.8563949818113333e-05, "loss": 2.3924, "step": 360530 }, { "epoch": 0.63, "learning_rate": 1.8563077878186506e-05, "loss": 2.2964, "step": 360540 }, { "epoch": 0.63, "learning_rate": 1.8562205938259677e-05, "loss": 2.2557, "step": 360550 }, { "epoch": 0.63, "learning_rate": 1.8561333998332854e-05, "loss": 2.2888, "step": 360560 }, { "epoch": 0.63, "learning_rate": 1.8560462058406024e-05, "loss": 2.3677, "step": 360570 }, { "epoch": 0.63, "learning_rate": 1.8559590118479198e-05, "loss": 2.3288, "step": 360580 }, { "epoch": 0.63, "learning_rate": 1.8558718178552372e-05, "loss": 2.3065, "step": 360590 }, { "epoch": 0.63, "learning_rate": 1.8557846238625546e-05, "loss": 2.4114, "step": 360600 }, { "epoch": 0.63, "learning_rate": 1.855697429869872e-05, "loss": 2.3153, "step": 360610 }, { "epoch": 0.63, "learning_rate": 1.855610235877189e-05, "loss": 2.1661, "step": 360620 }, { "epoch": 0.63, "learning_rate": 1.8555230418845067e-05, "loss": 2.286, "step": 360630 }, { "epoch": 0.63, "learning_rate": 1.8554358478918237e-05, "loss": 2.3571, "step": 360640 }, { "epoch": 0.63, "learning_rate": 1.855348653899141e-05, "loss": 2.3746, "step": 360650 }, { "epoch": 0.63, "learning_rate": 1.855261459906458e-05, "loss": 2.3288, "step": 360660 }, { "epoch": 0.63, "learning_rate": 1.855174265913776e-05, "loss": 2.2811, "step": 360670 }, { "epoch": 0.63, "learning_rate": 1.855087071921093e-05, "loss": 2.3046, "step": 360680 }, { "epoch": 0.63, "learning_rate": 1.8549998779284103e-05, "loss": 2.2881, "step": 360690 }, { "epoch": 0.63, "learning_rate": 1.8549126839357276e-05, "loss": 2.2409, "step": 360700 }, { "epoch": 0.63, "learning_rate": 1.854825489943045e-05, "loss": 2.2205, "step": 360710 }, { "epoch": 0.63, "learning_rate": 1.8547382959503624e-05, "loss": 2.2289, "step": 360720 }, { "epoch": 0.63, "learning_rate": 1.8546511019576794e-05, "loss": 2.3535, "step": 360730 }, { "epoch": 0.63, "learning_rate": 1.8545639079649968e-05, "loss": 2.3324, "step": 360740 }, { "epoch": 0.63, "learning_rate": 1.8544767139723142e-05, "loss": 2.2906, "step": 360750 }, { "epoch": 0.63, "learning_rate": 1.8543895199796316e-05, "loss": 2.3539, "step": 360760 }, { "epoch": 0.63, "learning_rate": 1.854302325986949e-05, "loss": 2.1847, "step": 360770 }, { "epoch": 0.63, "learning_rate": 1.8542151319942663e-05, "loss": 2.2755, "step": 360780 }, { "epoch": 0.63, "learning_rate": 1.8541279380015837e-05, "loss": 2.3457, "step": 360790 }, { "epoch": 0.63, "learning_rate": 1.8540407440089007e-05, "loss": 2.3691, "step": 360800 }, { "epoch": 0.63, "learning_rate": 1.853953550016218e-05, "loss": 2.3274, "step": 360810 }, { "epoch": 0.63, "learning_rate": 1.8538663560235355e-05, "loss": 2.3283, "step": 360820 }, { "epoch": 0.63, "learning_rate": 1.853779162030853e-05, "loss": 2.2455, "step": 360830 }, { "epoch": 0.63, "learning_rate": 1.8536919680381702e-05, "loss": 2.366, "step": 360840 }, { "epoch": 0.63, "learning_rate": 1.8536047740454873e-05, "loss": 2.3236, "step": 360850 }, { "epoch": 0.63, "learning_rate": 1.853517580052805e-05, "loss": 2.2706, "step": 360860 }, { "epoch": 0.63, "learning_rate": 1.853430386060122e-05, "loss": 2.2441, "step": 360870 }, { "epoch": 0.63, "learning_rate": 1.8533431920674394e-05, "loss": 2.3922, "step": 360880 }, { "epoch": 0.63, "learning_rate": 1.8532559980747568e-05, "loss": 2.2907, "step": 360890 }, { "epoch": 0.63, "learning_rate": 1.853168804082074e-05, "loss": 2.3204, "step": 360900 }, { "epoch": 0.63, "learning_rate": 1.8530816100893912e-05, "loss": 2.3452, "step": 360910 }, { "epoch": 0.63, "learning_rate": 1.8529944160967086e-05, "loss": 2.2749, "step": 360920 }, { "epoch": 0.63, "learning_rate": 1.852907222104026e-05, "loss": 2.3858, "step": 360930 }, { "epoch": 0.63, "learning_rate": 1.8528200281113433e-05, "loss": 2.2931, "step": 360940 }, { "epoch": 0.63, "learning_rate": 1.8527328341186607e-05, "loss": 2.3081, "step": 360950 }, { "epoch": 0.63, "learning_rate": 1.8526456401259778e-05, "loss": 2.4349, "step": 360960 }, { "epoch": 0.63, "learning_rate": 1.8525584461332955e-05, "loss": 2.2887, "step": 360970 }, { "epoch": 0.63, "learning_rate": 1.8524712521406125e-05, "loss": 2.3103, "step": 360980 }, { "epoch": 0.63, "learning_rate": 1.85238405814793e-05, "loss": 2.1988, "step": 360990 }, { "epoch": 0.63, "learning_rate": 1.8522968641552473e-05, "loss": 2.2717, "step": 361000 }, { "epoch": 0.63, "learning_rate": 1.8522096701625646e-05, "loss": 2.2511, "step": 361010 }, { "epoch": 0.63, "learning_rate": 1.852122476169882e-05, "loss": 2.3657, "step": 361020 }, { "epoch": 0.63, "learning_rate": 1.852035282177199e-05, "loss": 2.4178, "step": 361030 }, { "epoch": 0.63, "learning_rate": 1.8519480881845168e-05, "loss": 2.3081, "step": 361040 }, { "epoch": 0.63, "learning_rate": 1.8518608941918338e-05, "loss": 2.3095, "step": 361050 }, { "epoch": 0.63, "learning_rate": 1.8517737001991512e-05, "loss": 2.2493, "step": 361060 }, { "epoch": 0.63, "learning_rate": 1.8516865062064682e-05, "loss": 2.3023, "step": 361070 }, { "epoch": 0.63, "learning_rate": 1.851599312213786e-05, "loss": 2.4155, "step": 361080 }, { "epoch": 0.63, "learning_rate": 1.8515121182211033e-05, "loss": 2.2709, "step": 361090 }, { "epoch": 0.63, "learning_rate": 1.8514249242284204e-05, "loss": 2.464, "step": 361100 }, { "epoch": 0.63, "learning_rate": 1.8513377302357377e-05, "loss": 2.2663, "step": 361110 }, { "epoch": 0.63, "learning_rate": 1.851250536243055e-05, "loss": 2.2881, "step": 361120 }, { "epoch": 0.63, "learning_rate": 1.8511633422503725e-05, "loss": 2.3069, "step": 361130 }, { "epoch": 0.63, "learning_rate": 1.8510761482576895e-05, "loss": 2.2969, "step": 361140 }, { "epoch": 0.63, "learning_rate": 1.8509889542650072e-05, "loss": 2.347, "step": 361150 }, { "epoch": 0.63, "learning_rate": 1.8509017602723243e-05, "loss": 2.2506, "step": 361160 }, { "epoch": 0.63, "learning_rate": 1.8508145662796417e-05, "loss": 2.2809, "step": 361170 }, { "epoch": 0.63, "learning_rate": 1.850727372286959e-05, "loss": 2.3252, "step": 361180 }, { "epoch": 0.63, "learning_rate": 1.8506401782942764e-05, "loss": 2.292, "step": 361190 }, { "epoch": 0.63, "learning_rate": 1.8505529843015938e-05, "loss": 2.4414, "step": 361200 }, { "epoch": 0.63, "learning_rate": 1.8504657903089108e-05, "loss": 2.229, "step": 361210 }, { "epoch": 0.63, "learning_rate": 1.8503785963162282e-05, "loss": 2.3169, "step": 361220 }, { "epoch": 0.63, "learning_rate": 1.8502914023235456e-05, "loss": 2.3462, "step": 361230 }, { "epoch": 0.63, "learning_rate": 1.850204208330863e-05, "loss": 2.1588, "step": 361240 }, { "epoch": 0.63, "learning_rate": 1.8501170143381803e-05, "loss": 2.3438, "step": 361250 }, { "epoch": 0.63, "learning_rate": 1.8500298203454974e-05, "loss": 2.3765, "step": 361260 }, { "epoch": 0.63, "learning_rate": 1.849942626352815e-05, "loss": 2.3038, "step": 361270 }, { "epoch": 0.63, "learning_rate": 1.849855432360132e-05, "loss": 2.3187, "step": 361280 }, { "epoch": 0.63, "learning_rate": 1.8497682383674495e-05, "loss": 2.3048, "step": 361290 }, { "epoch": 0.63, "learning_rate": 1.849681044374767e-05, "loss": 2.4213, "step": 361300 }, { "epoch": 0.63, "learning_rate": 1.8495938503820843e-05, "loss": 2.3012, "step": 361310 }, { "epoch": 0.63, "learning_rate": 1.8495066563894016e-05, "loss": 2.4008, "step": 361320 }, { "epoch": 0.63, "learning_rate": 1.8494194623967187e-05, "loss": 2.3819, "step": 361330 }, { "epoch": 0.63, "learning_rate": 1.8493322684040364e-05, "loss": 2.3264, "step": 361340 }, { "epoch": 0.63, "learning_rate": 1.8492450744113534e-05, "loss": 2.3574, "step": 361350 }, { "epoch": 0.63, "learning_rate": 1.8491578804186708e-05, "loss": 2.2984, "step": 361360 }, { "epoch": 0.63, "learning_rate": 1.849070686425988e-05, "loss": 2.3348, "step": 361370 }, { "epoch": 0.63, "learning_rate": 1.8489834924333056e-05, "loss": 2.348, "step": 361380 }, { "epoch": 0.63, "learning_rate": 1.8488962984406226e-05, "loss": 2.3978, "step": 361390 }, { "epoch": 0.63, "learning_rate": 1.84880910444794e-05, "loss": 2.3527, "step": 361400 }, { "epoch": 0.63, "learning_rate": 1.8487219104552573e-05, "loss": 2.3589, "step": 361410 }, { "epoch": 0.63, "learning_rate": 1.8486347164625747e-05, "loss": 2.3695, "step": 361420 }, { "epoch": 0.63, "learning_rate": 1.848547522469892e-05, "loss": 2.2988, "step": 361430 }, { "epoch": 0.63, "learning_rate": 1.848460328477209e-05, "loss": 2.374, "step": 361440 }, { "epoch": 0.63, "learning_rate": 1.848373134484527e-05, "loss": 2.2941, "step": 361450 }, { "epoch": 0.63, "learning_rate": 1.848285940491844e-05, "loss": 2.2719, "step": 361460 }, { "epoch": 0.63, "learning_rate": 1.8481987464991613e-05, "loss": 2.2661, "step": 361470 }, { "epoch": 0.63, "learning_rate": 1.8481115525064786e-05, "loss": 2.3959, "step": 361480 }, { "epoch": 0.63, "learning_rate": 1.848024358513796e-05, "loss": 2.1818, "step": 361490 }, { "epoch": 0.63, "learning_rate": 1.8479371645211134e-05, "loss": 2.3334, "step": 361500 }, { "epoch": 0.63, "learning_rate": 1.8478499705284304e-05, "loss": 2.3807, "step": 361510 }, { "epoch": 0.63, "learning_rate": 1.8477627765357478e-05, "loss": 2.256, "step": 361520 }, { "epoch": 0.63, "learning_rate": 1.8476755825430652e-05, "loss": 2.413, "step": 361530 }, { "epoch": 0.63, "learning_rate": 1.8475883885503826e-05, "loss": 2.309, "step": 361540 }, { "epoch": 0.63, "learning_rate": 1.8475011945576996e-05, "loss": 2.2885, "step": 361550 }, { "epoch": 0.63, "learning_rate": 1.8474140005650173e-05, "loss": 2.2779, "step": 361560 }, { "epoch": 0.63, "learning_rate": 1.8473268065723347e-05, "loss": 2.2148, "step": 361570 }, { "epoch": 0.63, "learning_rate": 1.8472396125796517e-05, "loss": 2.3665, "step": 361580 }, { "epoch": 0.63, "learning_rate": 1.847152418586969e-05, "loss": 2.3712, "step": 361590 }, { "epoch": 0.63, "learning_rate": 1.8470652245942865e-05, "loss": 2.2866, "step": 361600 }, { "epoch": 0.63, "learning_rate": 1.846978030601604e-05, "loss": 2.3562, "step": 361610 }, { "epoch": 0.63, "learning_rate": 1.846890836608921e-05, "loss": 2.3832, "step": 361620 }, { "epoch": 0.63, "learning_rate": 1.8468036426162383e-05, "loss": 2.3077, "step": 361630 }, { "epoch": 0.63, "learning_rate": 1.8467164486235557e-05, "loss": 2.2947, "step": 361640 }, { "epoch": 0.63, "learning_rate": 1.846629254630873e-05, "loss": 2.3049, "step": 361650 }, { "epoch": 0.63, "learning_rate": 1.8465420606381904e-05, "loss": 2.3427, "step": 361660 }, { "epoch": 0.63, "learning_rate": 1.8464548666455075e-05, "loss": 2.3639, "step": 361670 }, { "epoch": 0.63, "learning_rate": 1.846367672652825e-05, "loss": 2.2975, "step": 361680 }, { "epoch": 0.63, "learning_rate": 1.8462804786601422e-05, "loss": 2.3418, "step": 361690 }, { "epoch": 0.63, "learning_rate": 1.8461932846674596e-05, "loss": 2.3347, "step": 361700 }, { "epoch": 0.63, "learning_rate": 1.846106090674777e-05, "loss": 2.3171, "step": 361710 }, { "epoch": 0.63, "learning_rate": 1.8460188966820943e-05, "loss": 2.2863, "step": 361720 }, { "epoch": 0.63, "learning_rate": 1.8459317026894117e-05, "loss": 2.3751, "step": 361730 }, { "epoch": 0.63, "learning_rate": 1.8458445086967288e-05, "loss": 2.3661, "step": 361740 }, { "epoch": 0.63, "learning_rate": 1.8457573147040465e-05, "loss": 2.3832, "step": 361750 }, { "epoch": 0.63, "learning_rate": 1.8456701207113635e-05, "loss": 2.345, "step": 361760 }, { "epoch": 0.63, "learning_rate": 1.845582926718681e-05, "loss": 2.3231, "step": 361770 }, { "epoch": 0.63, "learning_rate": 1.845495732725998e-05, "loss": 2.3407, "step": 361780 }, { "epoch": 0.63, "learning_rate": 1.8454085387333156e-05, "loss": 2.3608, "step": 361790 }, { "epoch": 0.63, "learning_rate": 1.8453213447406327e-05, "loss": 2.3469, "step": 361800 }, { "epoch": 0.63, "learning_rate": 1.84523415074795e-05, "loss": 2.2818, "step": 361810 }, { "epoch": 0.63, "learning_rate": 1.8451469567552678e-05, "loss": 2.3559, "step": 361820 }, { "epoch": 0.63, "learning_rate": 1.8450597627625848e-05, "loss": 2.307, "step": 361830 }, { "epoch": 0.63, "learning_rate": 1.8449725687699022e-05, "loss": 2.3975, "step": 361840 }, { "epoch": 0.63, "learning_rate": 1.8448853747772192e-05, "loss": 2.3443, "step": 361850 }, { "epoch": 0.63, "learning_rate": 1.844798180784537e-05, "loss": 2.4522, "step": 361860 }, { "epoch": 0.63, "learning_rate": 1.844710986791854e-05, "loss": 2.2418, "step": 361870 }, { "epoch": 0.63, "learning_rate": 1.8446237927991714e-05, "loss": 2.3127, "step": 361880 }, { "epoch": 0.63, "learning_rate": 1.8445365988064887e-05, "loss": 2.3262, "step": 361890 }, { "epoch": 0.63, "learning_rate": 1.844449404813806e-05, "loss": 2.4218, "step": 361900 }, { "epoch": 0.63, "learning_rate": 1.8443622108211235e-05, "loss": 2.3423, "step": 361910 }, { "epoch": 0.63, "learning_rate": 1.8442750168284405e-05, "loss": 2.2733, "step": 361920 }, { "epoch": 0.63, "learning_rate": 1.844187822835758e-05, "loss": 2.3319, "step": 361930 }, { "epoch": 0.63, "learning_rate": 1.8441006288430753e-05, "loss": 2.3034, "step": 361940 }, { "epoch": 0.63, "learning_rate": 1.8440134348503927e-05, "loss": 2.2386, "step": 361950 }, { "epoch": 0.63, "learning_rate": 1.84392624085771e-05, "loss": 2.3755, "step": 361960 }, { "epoch": 0.63, "learning_rate": 1.8438390468650274e-05, "loss": 2.3366, "step": 361970 }, { "epoch": 0.63, "learning_rate": 1.8437518528723448e-05, "loss": 2.3444, "step": 361980 }, { "epoch": 0.63, "learning_rate": 1.8436646588796618e-05, "loss": 2.2518, "step": 361990 }, { "epoch": 0.63, "learning_rate": 1.8435774648869792e-05, "loss": 2.2812, "step": 362000 }, { "epoch": 0.63, "learning_rate": 1.8434902708942966e-05, "loss": 2.475, "step": 362010 }, { "epoch": 0.63, "learning_rate": 1.843403076901614e-05, "loss": 2.3884, "step": 362020 }, { "epoch": 0.63, "learning_rate": 1.843315882908931e-05, "loss": 2.3722, "step": 362030 }, { "epoch": 0.63, "learning_rate": 1.8432286889162484e-05, "loss": 2.341, "step": 362040 }, { "epoch": 0.63, "learning_rate": 1.843141494923566e-05, "loss": 2.3463, "step": 362050 }, { "epoch": 0.63, "learning_rate": 1.843054300930883e-05, "loss": 2.3512, "step": 362060 }, { "epoch": 0.63, "learning_rate": 1.8429671069382005e-05, "loss": 2.337, "step": 362070 }, { "epoch": 0.63, "learning_rate": 1.842879912945518e-05, "loss": 2.2999, "step": 362080 }, { "epoch": 0.63, "learning_rate": 1.8427927189528353e-05, "loss": 2.4729, "step": 362090 }, { "epoch": 0.63, "learning_rate": 1.8427055249601523e-05, "loss": 2.2979, "step": 362100 }, { "epoch": 0.63, "learning_rate": 1.8426183309674697e-05, "loss": 2.3759, "step": 362110 }, { "epoch": 0.63, "learning_rate": 1.842531136974787e-05, "loss": 2.4013, "step": 362120 }, { "epoch": 0.63, "learning_rate": 1.8424439429821044e-05, "loss": 2.2556, "step": 362130 }, { "epoch": 0.63, "learning_rate": 1.8423567489894218e-05, "loss": 2.436, "step": 362140 }, { "epoch": 0.63, "learning_rate": 1.842269554996739e-05, "loss": 2.39, "step": 362150 }, { "epoch": 0.63, "learning_rate": 1.8421823610040566e-05, "loss": 2.2751, "step": 362160 }, { "epoch": 0.63, "learning_rate": 1.8420951670113736e-05, "loss": 2.374, "step": 362170 }, { "epoch": 0.63, "learning_rate": 1.842007973018691e-05, "loss": 2.3209, "step": 362180 }, { "epoch": 0.63, "learning_rate": 1.8419207790260083e-05, "loss": 2.3542, "step": 362190 }, { "epoch": 0.63, "learning_rate": 1.8418335850333257e-05, "loss": 2.2894, "step": 362200 }, { "epoch": 0.63, "learning_rate": 1.841746391040643e-05, "loss": 2.3352, "step": 362210 }, { "epoch": 0.63, "learning_rate": 1.84165919704796e-05, "loss": 2.3838, "step": 362220 }, { "epoch": 0.63, "learning_rate": 1.841572003055278e-05, "loss": 2.3561, "step": 362230 }, { "epoch": 0.63, "learning_rate": 1.841484809062595e-05, "loss": 2.3292, "step": 362240 }, { "epoch": 0.63, "learning_rate": 1.8413976150699123e-05, "loss": 2.3576, "step": 362250 }, { "epoch": 0.63, "learning_rate": 1.8413104210772293e-05, "loss": 2.3898, "step": 362260 }, { "epoch": 0.63, "learning_rate": 1.841223227084547e-05, "loss": 2.2975, "step": 362270 }, { "epoch": 0.63, "learning_rate": 1.841136033091864e-05, "loss": 2.2989, "step": 362280 }, { "epoch": 0.63, "learning_rate": 1.8410488390991814e-05, "loss": 2.4415, "step": 362290 }, { "epoch": 0.63, "learning_rate": 1.8409616451064988e-05, "loss": 2.3472, "step": 362300 }, { "epoch": 0.63, "learning_rate": 1.8408744511138162e-05, "loss": 2.4003, "step": 362310 }, { "epoch": 0.63, "learning_rate": 1.8407872571211336e-05, "loss": 2.4506, "step": 362320 }, { "epoch": 0.63, "learning_rate": 1.8407000631284506e-05, "loss": 2.2518, "step": 362330 }, { "epoch": 0.63, "learning_rate": 1.8406128691357683e-05, "loss": 2.3446, "step": 362340 }, { "epoch": 0.63, "learning_rate": 1.8405256751430854e-05, "loss": 2.3936, "step": 362350 }, { "epoch": 0.63, "learning_rate": 1.8404384811504027e-05, "loss": 2.1847, "step": 362360 }, { "epoch": 0.63, "learning_rate": 1.84035128715772e-05, "loss": 2.3369, "step": 362370 }, { "epoch": 0.63, "learning_rate": 1.8402640931650375e-05, "loss": 2.2943, "step": 362380 }, { "epoch": 0.63, "learning_rate": 1.840176899172355e-05, "loss": 2.3666, "step": 362390 }, { "epoch": 0.63, "learning_rate": 1.840089705179672e-05, "loss": 2.2852, "step": 362400 }, { "epoch": 0.63, "learning_rate": 1.8400025111869893e-05, "loss": 2.3782, "step": 362410 }, { "epoch": 0.63, "learning_rate": 1.8399153171943067e-05, "loss": 2.2461, "step": 362420 }, { "epoch": 0.63, "learning_rate": 1.839828123201624e-05, "loss": 2.2125, "step": 362430 }, { "epoch": 0.63, "learning_rate": 1.8397409292089414e-05, "loss": 2.2789, "step": 362440 }, { "epoch": 0.63, "learning_rate": 1.8396537352162585e-05, "loss": 2.3167, "step": 362450 }, { "epoch": 0.63, "learning_rate": 1.839566541223576e-05, "loss": 2.239, "step": 362460 }, { "epoch": 0.63, "learning_rate": 1.8394793472308932e-05, "loss": 2.3318, "step": 362470 }, { "epoch": 0.63, "learning_rate": 1.8393921532382106e-05, "loss": 2.3444, "step": 362480 }, { "epoch": 0.63, "learning_rate": 1.839304959245528e-05, "loss": 2.3545, "step": 362490 }, { "epoch": 0.63, "learning_rate": 1.8392177652528453e-05, "loss": 2.2901, "step": 362500 }, { "epoch": 0.63, "learning_rate": 1.8391305712601624e-05, "loss": 2.2948, "step": 362510 }, { "epoch": 0.63, "learning_rate": 1.8390433772674798e-05, "loss": 2.2451, "step": 362520 }, { "epoch": 0.63, "learning_rate": 1.838956183274797e-05, "loss": 2.3153, "step": 362530 }, { "epoch": 0.63, "learning_rate": 1.8388689892821145e-05, "loss": 2.3389, "step": 362540 }, { "epoch": 0.63, "learning_rate": 1.838781795289432e-05, "loss": 2.2955, "step": 362550 }, { "epoch": 0.63, "learning_rate": 1.838694601296749e-05, "loss": 2.3483, "step": 362560 }, { "epoch": 0.63, "learning_rate": 1.8386074073040666e-05, "loss": 2.3644, "step": 362570 }, { "epoch": 0.63, "learning_rate": 1.8385202133113837e-05, "loss": 2.352, "step": 362580 }, { "epoch": 0.63, "learning_rate": 1.838433019318701e-05, "loss": 2.2643, "step": 362590 }, { "epoch": 0.63, "learning_rate": 1.8383458253260184e-05, "loss": 2.3986, "step": 362600 }, { "epoch": 0.63, "learning_rate": 1.8382586313333358e-05, "loss": 2.3314, "step": 362610 }, { "epoch": 0.63, "learning_rate": 1.8381714373406532e-05, "loss": 2.2787, "step": 362620 }, { "epoch": 0.63, "learning_rate": 1.8380842433479702e-05, "loss": 2.1369, "step": 362630 }, { "epoch": 0.63, "learning_rate": 1.837997049355288e-05, "loss": 2.3216, "step": 362640 }, { "epoch": 0.63, "learning_rate": 1.837909855362605e-05, "loss": 2.3882, "step": 362650 }, { "epoch": 0.63, "learning_rate": 1.8378226613699224e-05, "loss": 2.3317, "step": 362660 }, { "epoch": 0.63, "learning_rate": 1.8377354673772397e-05, "loss": 2.2067, "step": 362670 }, { "epoch": 0.63, "learning_rate": 1.837648273384557e-05, "loss": 2.3192, "step": 362680 }, { "epoch": 0.63, "learning_rate": 1.8375610793918745e-05, "loss": 2.3808, "step": 362690 }, { "epoch": 0.63, "learning_rate": 1.8374738853991915e-05, "loss": 2.2739, "step": 362700 }, { "epoch": 0.63, "learning_rate": 1.837386691406509e-05, "loss": 2.344, "step": 362710 }, { "epoch": 0.63, "learning_rate": 1.8372994974138263e-05, "loss": 2.2452, "step": 362720 }, { "epoch": 0.63, "learning_rate": 1.8372123034211437e-05, "loss": 2.3909, "step": 362730 }, { "epoch": 0.63, "learning_rate": 1.8371251094284607e-05, "loss": 2.3464, "step": 362740 }, { "epoch": 0.63, "learning_rate": 1.8370379154357784e-05, "loss": 2.3803, "step": 362750 }, { "epoch": 0.63, "learning_rate": 1.8369507214430954e-05, "loss": 2.3126, "step": 362760 }, { "epoch": 0.63, "learning_rate": 1.8368635274504128e-05, "loss": 2.3878, "step": 362770 }, { "epoch": 0.63, "learning_rate": 1.8367763334577302e-05, "loss": 2.2028, "step": 362780 }, { "epoch": 0.63, "learning_rate": 1.8366891394650476e-05, "loss": 2.3559, "step": 362790 }, { "epoch": 0.63, "learning_rate": 1.836601945472365e-05, "loss": 2.4134, "step": 362800 }, { "epoch": 0.63, "learning_rate": 1.836514751479682e-05, "loss": 2.348, "step": 362810 }, { "epoch": 0.63, "learning_rate": 1.8364275574869994e-05, "loss": 2.2767, "step": 362820 }, { "epoch": 0.63, "learning_rate": 1.8363403634943167e-05, "loss": 2.3503, "step": 362830 }, { "epoch": 0.63, "learning_rate": 1.836253169501634e-05, "loss": 2.2389, "step": 362840 }, { "epoch": 0.63, "learning_rate": 1.8361659755089515e-05, "loss": 2.244, "step": 362850 }, { "epoch": 0.63, "learning_rate": 1.8360787815162685e-05, "loss": 2.2318, "step": 362860 }, { "epoch": 0.63, "learning_rate": 1.8359915875235863e-05, "loss": 2.3474, "step": 362870 }, { "epoch": 0.63, "learning_rate": 1.8359043935309033e-05, "loss": 2.3259, "step": 362880 }, { "epoch": 0.63, "learning_rate": 1.8358171995382207e-05, "loss": 2.2732, "step": 362890 }, { "epoch": 0.63, "learning_rate": 1.835730005545538e-05, "loss": 2.3559, "step": 362900 }, { "epoch": 0.63, "learning_rate": 1.8356428115528554e-05, "loss": 2.1897, "step": 362910 }, { "epoch": 0.63, "learning_rate": 1.8355556175601728e-05, "loss": 2.4102, "step": 362920 }, { "epoch": 0.63, "learning_rate": 1.83546842356749e-05, "loss": 2.2931, "step": 362930 }, { "epoch": 0.63, "learning_rate": 1.8353812295748076e-05, "loss": 2.516, "step": 362940 }, { "epoch": 0.63, "learning_rate": 1.8352940355821246e-05, "loss": 2.301, "step": 362950 }, { "epoch": 0.63, "learning_rate": 1.835206841589442e-05, "loss": 2.4497, "step": 362960 }, { "epoch": 0.63, "learning_rate": 1.835119647596759e-05, "loss": 2.3997, "step": 362970 }, { "epoch": 0.63, "learning_rate": 1.8350324536040767e-05, "loss": 2.3569, "step": 362980 }, { "epoch": 0.63, "learning_rate": 1.8349452596113938e-05, "loss": 2.322, "step": 362990 }, { "epoch": 0.63, "learning_rate": 1.834858065618711e-05, "loss": 2.2911, "step": 363000 }, { "epoch": 0.63, "learning_rate": 1.8347708716260285e-05, "loss": 2.4045, "step": 363010 }, { "epoch": 0.63, "learning_rate": 1.834683677633346e-05, "loss": 2.2449, "step": 363020 }, { "epoch": 0.63, "learning_rate": 1.8345964836406633e-05, "loss": 2.3566, "step": 363030 }, { "epoch": 0.63, "learning_rate": 1.8345092896479803e-05, "loss": 2.3384, "step": 363040 }, { "epoch": 0.63, "learning_rate": 1.834422095655298e-05, "loss": 2.2829, "step": 363050 }, { "epoch": 0.63, "learning_rate": 1.834334901662615e-05, "loss": 2.3699, "step": 363060 }, { "epoch": 0.63, "learning_rate": 1.8342477076699324e-05, "loss": 2.3466, "step": 363070 }, { "epoch": 0.63, "learning_rate": 1.8341605136772498e-05, "loss": 2.3861, "step": 363080 }, { "epoch": 0.63, "learning_rate": 1.8340733196845672e-05, "loss": 2.294, "step": 363090 }, { "epoch": 0.63, "learning_rate": 1.8339861256918846e-05, "loss": 2.2751, "step": 363100 }, { "epoch": 0.63, "learning_rate": 1.8338989316992016e-05, "loss": 2.2994, "step": 363110 }, { "epoch": 0.63, "learning_rate": 1.833811737706519e-05, "loss": 2.2483, "step": 363120 }, { "epoch": 0.63, "learning_rate": 1.8337245437138364e-05, "loss": 2.3436, "step": 363130 }, { "epoch": 0.63, "learning_rate": 1.8336373497211537e-05, "loss": 2.4314, "step": 363140 }, { "epoch": 0.63, "learning_rate": 1.8335501557284708e-05, "loss": 2.3045, "step": 363150 }, { "epoch": 0.63, "learning_rate": 1.8334629617357885e-05, "loss": 2.4326, "step": 363160 }, { "epoch": 0.63, "learning_rate": 1.833375767743106e-05, "loss": 2.2938, "step": 363170 }, { "epoch": 0.63, "learning_rate": 1.833288573750423e-05, "loss": 2.287, "step": 363180 }, { "epoch": 0.63, "learning_rate": 1.8332013797577403e-05, "loss": 2.2727, "step": 363190 }, { "epoch": 0.63, "learning_rate": 1.8331141857650577e-05, "loss": 2.1824, "step": 363200 }, { "epoch": 0.63, "learning_rate": 1.833026991772375e-05, "loss": 2.3568, "step": 363210 }, { "epoch": 0.63, "learning_rate": 1.832939797779692e-05, "loss": 2.3095, "step": 363220 }, { "epoch": 0.63, "learning_rate": 1.8328526037870095e-05, "loss": 2.3564, "step": 363230 }, { "epoch": 0.63, "learning_rate": 1.8327654097943268e-05, "loss": 2.3835, "step": 363240 }, { "epoch": 0.63, "learning_rate": 1.8326782158016442e-05, "loss": 2.3905, "step": 363250 }, { "epoch": 0.63, "learning_rate": 1.8325910218089616e-05, "loss": 2.3704, "step": 363260 }, { "epoch": 0.63, "learning_rate": 1.832503827816279e-05, "loss": 2.3259, "step": 363270 }, { "epoch": 0.63, "learning_rate": 1.8324166338235963e-05, "loss": 2.3024, "step": 363280 }, { "epoch": 0.63, "learning_rate": 1.8323294398309134e-05, "loss": 2.2366, "step": 363290 }, { "epoch": 0.63, "learning_rate": 1.8322422458382308e-05, "loss": 2.2365, "step": 363300 }, { "epoch": 0.63, "learning_rate": 1.832155051845548e-05, "loss": 2.4501, "step": 363310 }, { "epoch": 0.63, "learning_rate": 1.8320678578528655e-05, "loss": 2.2054, "step": 363320 }, { "epoch": 0.63, "learning_rate": 1.831980663860183e-05, "loss": 2.371, "step": 363330 }, { "epoch": 0.63, "learning_rate": 1.8318934698675e-05, "loss": 2.2317, "step": 363340 }, { "epoch": 0.63, "learning_rate": 1.8318062758748176e-05, "loss": 2.371, "step": 363350 }, { "epoch": 0.63, "learning_rate": 1.8317190818821347e-05, "loss": 2.3532, "step": 363360 }, { "epoch": 0.63, "learning_rate": 1.831631887889452e-05, "loss": 2.2312, "step": 363370 }, { "epoch": 0.63, "learning_rate": 1.831544693896769e-05, "loss": 2.3283, "step": 363380 }, { "epoch": 0.63, "learning_rate": 1.8314574999040868e-05, "loss": 2.2321, "step": 363390 }, { "epoch": 0.63, "learning_rate": 1.8313703059114042e-05, "loss": 2.3447, "step": 363400 }, { "epoch": 0.63, "learning_rate": 1.8312831119187212e-05, "loss": 2.2785, "step": 363410 }, { "epoch": 0.63, "learning_rate": 1.831195917926039e-05, "loss": 2.4025, "step": 363420 }, { "epoch": 0.63, "learning_rate": 1.831108723933356e-05, "loss": 2.3223, "step": 363430 }, { "epoch": 0.63, "learning_rate": 1.8310215299406734e-05, "loss": 2.3351, "step": 363440 }, { "epoch": 0.63, "learning_rate": 1.8309343359479904e-05, "loss": 2.2572, "step": 363450 }, { "epoch": 0.63, "learning_rate": 1.830847141955308e-05, "loss": 2.3675, "step": 363460 }, { "epoch": 0.63, "learning_rate": 1.830759947962625e-05, "loss": 2.3752, "step": 363470 }, { "epoch": 0.63, "learning_rate": 1.8306727539699425e-05, "loss": 2.3946, "step": 363480 }, { "epoch": 0.63, "learning_rate": 1.83058555997726e-05, "loss": 2.3287, "step": 363490 }, { "epoch": 0.63, "learning_rate": 1.8304983659845773e-05, "loss": 2.376, "step": 363500 }, { "epoch": 0.63, "learning_rate": 1.8304111719918947e-05, "loss": 2.3053, "step": 363510 }, { "epoch": 0.63, "learning_rate": 1.8303239779992117e-05, "loss": 2.34, "step": 363520 }, { "epoch": 0.63, "learning_rate": 1.830236784006529e-05, "loss": 2.3543, "step": 363530 }, { "epoch": 0.63, "learning_rate": 1.8301495900138464e-05, "loss": 2.4111, "step": 363540 }, { "epoch": 0.63, "learning_rate": 1.8300623960211638e-05, "loss": 2.2978, "step": 363550 }, { "epoch": 0.63, "learning_rate": 1.8299752020284812e-05, "loss": 2.3233, "step": 363560 }, { "epoch": 0.63, "learning_rate": 1.8298880080357986e-05, "loss": 2.3206, "step": 363570 }, { "epoch": 0.63, "learning_rate": 1.829800814043116e-05, "loss": 2.3594, "step": 363580 }, { "epoch": 0.63, "learning_rate": 1.829713620050433e-05, "loss": 2.3115, "step": 363590 }, { "epoch": 0.63, "learning_rate": 1.8296264260577504e-05, "loss": 2.4035, "step": 363600 }, { "epoch": 0.63, "learning_rate": 1.8295392320650677e-05, "loss": 2.3637, "step": 363610 }, { "epoch": 0.63, "learning_rate": 1.829452038072385e-05, "loss": 2.3469, "step": 363620 }, { "epoch": 0.63, "learning_rate": 1.829364844079702e-05, "loss": 2.4554, "step": 363630 }, { "epoch": 0.63, "learning_rate": 1.8292776500870195e-05, "loss": 2.3518, "step": 363640 }, { "epoch": 0.63, "learning_rate": 1.8291904560943373e-05, "loss": 2.3506, "step": 363650 }, { "epoch": 0.63, "learning_rate": 1.8291032621016543e-05, "loss": 2.3324, "step": 363660 }, { "epoch": 0.63, "learning_rate": 1.8290160681089717e-05, "loss": 2.3305, "step": 363670 }, { "epoch": 0.63, "learning_rate": 1.828928874116289e-05, "loss": 2.5168, "step": 363680 }, { "epoch": 0.63, "learning_rate": 1.8288416801236064e-05, "loss": 2.355, "step": 363690 }, { "epoch": 0.63, "learning_rate": 1.8287544861309235e-05, "loss": 2.37, "step": 363700 }, { "epoch": 0.63, "learning_rate": 1.828667292138241e-05, "loss": 2.2828, "step": 363710 }, { "epoch": 0.63, "learning_rate": 1.8285800981455582e-05, "loss": 2.3839, "step": 363720 }, { "epoch": 0.63, "learning_rate": 1.8284929041528756e-05, "loss": 2.2915, "step": 363730 }, { "epoch": 0.63, "learning_rate": 1.828405710160193e-05, "loss": 2.2886, "step": 363740 }, { "epoch": 0.63, "learning_rate": 1.82831851616751e-05, "loss": 2.3123, "step": 363750 }, { "epoch": 0.63, "learning_rate": 1.8282313221748277e-05, "loss": 2.3696, "step": 363760 }, { "epoch": 0.63, "learning_rate": 1.8281441281821448e-05, "loss": 2.4275, "step": 363770 }, { "epoch": 0.63, "learning_rate": 1.828056934189462e-05, "loss": 2.222, "step": 363780 }, { "epoch": 0.63, "learning_rate": 1.8279697401967795e-05, "loss": 2.3662, "step": 363790 }, { "epoch": 0.63, "learning_rate": 1.827882546204097e-05, "loss": 2.3833, "step": 363800 }, { "epoch": 0.63, "learning_rate": 1.8277953522114143e-05, "loss": 2.5125, "step": 363810 }, { "epoch": 0.63, "learning_rate": 1.8277081582187313e-05, "loss": 2.3399, "step": 363820 }, { "epoch": 0.63, "learning_rate": 1.827620964226049e-05, "loss": 2.2916, "step": 363830 }, { "epoch": 0.63, "learning_rate": 1.827533770233366e-05, "loss": 2.4504, "step": 363840 }, { "epoch": 0.63, "learning_rate": 1.8274465762406834e-05, "loss": 2.255, "step": 363850 }, { "epoch": 0.63, "learning_rate": 1.8273593822480005e-05, "loss": 2.2991, "step": 363860 }, { "epoch": 0.63, "learning_rate": 1.8272721882553182e-05, "loss": 2.3093, "step": 363870 }, { "epoch": 0.63, "learning_rate": 1.8271849942626352e-05, "loss": 2.2988, "step": 363880 }, { "epoch": 0.63, "learning_rate": 1.8270978002699526e-05, "loss": 2.2733, "step": 363890 }, { "epoch": 0.63, "learning_rate": 1.82701060627727e-05, "loss": 2.2278, "step": 363900 }, { "epoch": 0.63, "learning_rate": 1.8269234122845874e-05, "loss": 2.2722, "step": 363910 }, { "epoch": 0.63, "learning_rate": 1.8268362182919047e-05, "loss": 2.3292, "step": 363920 }, { "epoch": 0.63, "learning_rate": 1.8267490242992218e-05, "loss": 2.3608, "step": 363930 }, { "epoch": 0.63, "learning_rate": 1.8266618303065395e-05, "loss": 2.3281, "step": 363940 }, { "epoch": 0.63, "learning_rate": 1.8265746363138565e-05, "loss": 2.3579, "step": 363950 }, { "epoch": 0.63, "learning_rate": 1.826487442321174e-05, "loss": 2.3801, "step": 363960 }, { "epoch": 0.63, "learning_rate": 1.8264002483284913e-05, "loss": 2.373, "step": 363970 }, { "epoch": 0.63, "learning_rate": 1.8263130543358087e-05, "loss": 2.3094, "step": 363980 }, { "epoch": 0.63, "learning_rate": 1.826225860343126e-05, "loss": 2.3824, "step": 363990 }, { "epoch": 0.63, "learning_rate": 1.826138666350443e-05, "loss": 2.2528, "step": 364000 }, { "epoch": 0.63, "learning_rate": 1.8260514723577605e-05, "loss": 2.3227, "step": 364010 }, { "epoch": 0.63, "learning_rate": 1.8259642783650778e-05, "loss": 2.3468, "step": 364020 }, { "epoch": 0.63, "learning_rate": 1.8258770843723952e-05, "loss": 2.4083, "step": 364030 }, { "epoch": 0.63, "learning_rate": 1.8257898903797126e-05, "loss": 2.3193, "step": 364040 }, { "epoch": 0.63, "learning_rate": 1.8257026963870296e-05, "loss": 2.2975, "step": 364050 }, { "epoch": 0.63, "learning_rate": 1.8256155023943473e-05, "loss": 2.3813, "step": 364060 }, { "epoch": 0.63, "learning_rate": 1.8255283084016644e-05, "loss": 2.3657, "step": 364070 }, { "epoch": 0.63, "learning_rate": 1.8254411144089818e-05, "loss": 2.3212, "step": 364080 }, { "epoch": 0.63, "learning_rate": 1.825353920416299e-05, "loss": 2.2754, "step": 364090 }, { "epoch": 0.63, "learning_rate": 1.8252667264236165e-05, "loss": 2.3801, "step": 364100 }, { "epoch": 0.63, "learning_rate": 1.8251795324309335e-05, "loss": 2.2545, "step": 364110 }, { "epoch": 0.63, "learning_rate": 1.825092338438251e-05, "loss": 2.3241, "step": 364120 }, { "epoch": 0.63, "learning_rate": 1.8250051444455686e-05, "loss": 2.3435, "step": 364130 }, { "epoch": 0.64, "learning_rate": 1.8249179504528857e-05, "loss": 2.3407, "step": 364140 }, { "epoch": 0.64, "learning_rate": 1.824830756460203e-05, "loss": 2.3138, "step": 364150 }, { "epoch": 0.64, "learning_rate": 1.82474356246752e-05, "loss": 2.2713, "step": 364160 }, { "epoch": 0.64, "learning_rate": 1.8246563684748378e-05, "loss": 2.2934, "step": 364170 }, { "epoch": 0.64, "learning_rate": 1.824569174482155e-05, "loss": 2.1927, "step": 364180 }, { "epoch": 0.64, "learning_rate": 1.8244819804894722e-05, "loss": 2.3016, "step": 364190 }, { "epoch": 0.64, "learning_rate": 1.8243947864967896e-05, "loss": 2.2639, "step": 364200 }, { "epoch": 0.64, "learning_rate": 1.824307592504107e-05, "loss": 2.297, "step": 364210 }, { "epoch": 0.64, "learning_rate": 1.8242203985114244e-05, "loss": 2.3051, "step": 364220 }, { "epoch": 0.64, "learning_rate": 1.8241332045187414e-05, "loss": 2.3162, "step": 364230 }, { "epoch": 0.64, "learning_rate": 1.824046010526059e-05, "loss": 2.2759, "step": 364240 }, { "epoch": 0.64, "learning_rate": 1.823958816533376e-05, "loss": 2.2967, "step": 364250 }, { "epoch": 0.64, "learning_rate": 1.8238716225406935e-05, "loss": 2.1801, "step": 364260 }, { "epoch": 0.64, "learning_rate": 1.823784428548011e-05, "loss": 2.3135, "step": 364270 }, { "epoch": 0.64, "learning_rate": 1.8236972345553283e-05, "loss": 2.341, "step": 364280 }, { "epoch": 0.64, "learning_rate": 1.8236100405626457e-05, "loss": 2.2946, "step": 364290 }, { "epoch": 0.64, "learning_rate": 1.8235228465699627e-05, "loss": 2.2877, "step": 364300 }, { "epoch": 0.64, "learning_rate": 1.82343565257728e-05, "loss": 2.4199, "step": 364310 }, { "epoch": 0.64, "learning_rate": 1.8233484585845974e-05, "loss": 2.3001, "step": 364320 }, { "epoch": 0.64, "learning_rate": 1.8232612645919148e-05, "loss": 2.2729, "step": 364330 }, { "epoch": 0.64, "learning_rate": 1.823174070599232e-05, "loss": 2.2408, "step": 364340 }, { "epoch": 0.64, "learning_rate": 1.8230868766065496e-05, "loss": 2.3648, "step": 364350 }, { "epoch": 0.64, "learning_rate": 1.8229996826138666e-05, "loss": 2.3252, "step": 364360 }, { "epoch": 0.64, "learning_rate": 1.822912488621184e-05, "loss": 2.3134, "step": 364370 }, { "epoch": 0.64, "learning_rate": 1.8228252946285014e-05, "loss": 2.2363, "step": 364380 }, { "epoch": 0.64, "learning_rate": 1.8227381006358187e-05, "loss": 2.4006, "step": 364390 }, { "epoch": 0.64, "learning_rate": 1.822650906643136e-05, "loss": 2.2096, "step": 364400 }, { "epoch": 0.64, "learning_rate": 1.822563712650453e-05, "loss": 2.4477, "step": 364410 }, { "epoch": 0.64, "learning_rate": 1.8224765186577705e-05, "loss": 2.3947, "step": 364420 }, { "epoch": 0.64, "learning_rate": 1.822389324665088e-05, "loss": 2.3234, "step": 364430 }, { "epoch": 0.64, "learning_rate": 1.8223021306724053e-05, "loss": 2.2953, "step": 364440 }, { "epoch": 0.64, "learning_rate": 1.8222149366797227e-05, "loss": 2.3255, "step": 364450 }, { "epoch": 0.64, "learning_rate": 1.8221277426870397e-05, "loss": 2.2307, "step": 364460 }, { "epoch": 0.64, "learning_rate": 1.8220405486943574e-05, "loss": 2.3489, "step": 364470 }, { "epoch": 0.64, "learning_rate": 1.8219533547016745e-05, "loss": 2.3096, "step": 364480 }, { "epoch": 0.64, "learning_rate": 1.821866160708992e-05, "loss": 2.3205, "step": 364490 }, { "epoch": 0.64, "learning_rate": 1.8217789667163092e-05, "loss": 2.3753, "step": 364500 }, { "epoch": 0.64, "learning_rate": 1.8216917727236266e-05, "loss": 2.3458, "step": 364510 }, { "epoch": 0.64, "learning_rate": 1.821604578730944e-05, "loss": 2.3418, "step": 364520 }, { "epoch": 0.64, "learning_rate": 1.821517384738261e-05, "loss": 2.1469, "step": 364530 }, { "epoch": 0.64, "learning_rate": 1.8214301907455787e-05, "loss": 2.2734, "step": 364540 }, { "epoch": 0.64, "learning_rate": 1.8213429967528958e-05, "loss": 2.4429, "step": 364550 }, { "epoch": 0.64, "learning_rate": 1.821255802760213e-05, "loss": 2.4409, "step": 364560 }, { "epoch": 0.64, "learning_rate": 1.8211686087675302e-05, "loss": 2.3156, "step": 364570 }, { "epoch": 0.64, "learning_rate": 1.821081414774848e-05, "loss": 2.357, "step": 364580 }, { "epoch": 0.64, "learning_rate": 1.820994220782165e-05, "loss": 2.323, "step": 364590 }, { "epoch": 0.64, "learning_rate": 1.8209070267894823e-05, "loss": 2.2813, "step": 364600 }, { "epoch": 0.64, "learning_rate": 1.8208198327967997e-05, "loss": 2.3322, "step": 364610 }, { "epoch": 0.64, "learning_rate": 1.820732638804117e-05, "loss": 2.2938, "step": 364620 }, { "epoch": 0.64, "learning_rate": 1.8206454448114344e-05, "loss": 2.275, "step": 364630 }, { "epoch": 0.64, "learning_rate": 1.8205582508187515e-05, "loss": 2.3858, "step": 364640 }, { "epoch": 0.64, "learning_rate": 1.8204710568260692e-05, "loss": 2.2759, "step": 364650 }, { "epoch": 0.64, "learning_rate": 1.8203838628333862e-05, "loss": 2.3633, "step": 364660 }, { "epoch": 0.64, "learning_rate": 1.8202966688407036e-05, "loss": 2.1981, "step": 364670 }, { "epoch": 0.64, "learning_rate": 1.820209474848021e-05, "loss": 2.3377, "step": 364680 }, { "epoch": 0.64, "learning_rate": 1.8201222808553384e-05, "loss": 2.3744, "step": 364690 }, { "epoch": 0.64, "learning_rate": 1.8200350868626557e-05, "loss": 2.2666, "step": 364700 }, { "epoch": 0.64, "learning_rate": 1.8199478928699728e-05, "loss": 2.2875, "step": 364710 }, { "epoch": 0.64, "learning_rate": 1.81986069887729e-05, "loss": 2.3435, "step": 364720 }, { "epoch": 0.64, "learning_rate": 1.8197735048846075e-05, "loss": 2.327, "step": 364730 }, { "epoch": 0.64, "learning_rate": 1.819686310891925e-05, "loss": 2.3991, "step": 364740 }, { "epoch": 0.64, "learning_rate": 1.8195991168992423e-05, "loss": 2.3667, "step": 364750 }, { "epoch": 0.64, "learning_rate": 1.8195119229065597e-05, "loss": 2.2182, "step": 364760 }, { "epoch": 0.64, "learning_rate": 1.819424728913877e-05, "loss": 2.312, "step": 364770 }, { "epoch": 0.64, "learning_rate": 1.819337534921194e-05, "loss": 2.3867, "step": 364780 }, { "epoch": 0.64, "learning_rate": 1.8192503409285115e-05, "loss": 2.355, "step": 364790 }, { "epoch": 0.64, "learning_rate": 1.819163146935829e-05, "loss": 2.2799, "step": 364800 }, { "epoch": 0.64, "learning_rate": 1.8190759529431462e-05, "loss": 2.1998, "step": 364810 }, { "epoch": 0.64, "learning_rate": 1.8189887589504632e-05, "loss": 2.3861, "step": 364820 }, { "epoch": 0.64, "learning_rate": 1.8189015649577806e-05, "loss": 2.3634, "step": 364830 }, { "epoch": 0.64, "learning_rate": 1.818814370965098e-05, "loss": 2.2827, "step": 364840 }, { "epoch": 0.64, "learning_rate": 1.8187271769724154e-05, "loss": 2.3099, "step": 364850 }, { "epoch": 0.64, "learning_rate": 1.8186399829797328e-05, "loss": 2.2527, "step": 364860 }, { "epoch": 0.64, "learning_rate": 1.81855278898705e-05, "loss": 2.3219, "step": 364870 }, { "epoch": 0.64, "learning_rate": 1.8184655949943675e-05, "loss": 2.3424, "step": 364880 }, { "epoch": 0.64, "learning_rate": 1.8183784010016845e-05, "loss": 2.3601, "step": 364890 }, { "epoch": 0.64, "learning_rate": 1.818291207009002e-05, "loss": 2.2019, "step": 364900 }, { "epoch": 0.64, "learning_rate": 1.8182040130163193e-05, "loss": 2.2618, "step": 364910 }, { "epoch": 0.64, "learning_rate": 1.8181168190236367e-05, "loss": 2.3455, "step": 364920 }, { "epoch": 0.64, "learning_rate": 1.818029625030954e-05, "loss": 2.2322, "step": 364930 }, { "epoch": 0.64, "learning_rate": 1.817942431038271e-05, "loss": 2.3264, "step": 364940 }, { "epoch": 0.64, "learning_rate": 1.8178552370455888e-05, "loss": 2.1749, "step": 364950 }, { "epoch": 0.64, "learning_rate": 1.817768043052906e-05, "loss": 2.2802, "step": 364960 }, { "epoch": 0.64, "learning_rate": 1.8176808490602232e-05, "loss": 2.1598, "step": 364970 }, { "epoch": 0.64, "learning_rate": 1.8175936550675403e-05, "loss": 2.2529, "step": 364980 }, { "epoch": 0.64, "learning_rate": 1.817506461074858e-05, "loss": 2.2416, "step": 364990 }, { "epoch": 0.64, "learning_rate": 1.8174192670821754e-05, "loss": 2.3488, "step": 365000 }, { "epoch": 0.64, "learning_rate": 1.8173320730894924e-05, "loss": 2.334, "step": 365010 }, { "epoch": 0.64, "learning_rate": 1.81724487909681e-05, "loss": 2.4309, "step": 365020 }, { "epoch": 0.64, "learning_rate": 1.817157685104127e-05, "loss": 2.211, "step": 365030 }, { "epoch": 0.64, "learning_rate": 1.8170704911114445e-05, "loss": 2.2794, "step": 365040 }, { "epoch": 0.64, "learning_rate": 1.8169832971187616e-05, "loss": 2.2431, "step": 365050 }, { "epoch": 0.64, "learning_rate": 1.8168961031260793e-05, "loss": 2.3766, "step": 365060 }, { "epoch": 0.64, "learning_rate": 1.8168089091333963e-05, "loss": 2.306, "step": 365070 }, { "epoch": 0.64, "learning_rate": 1.8167217151407137e-05, "loss": 2.3155, "step": 365080 }, { "epoch": 0.64, "learning_rate": 1.816634521148031e-05, "loss": 2.358, "step": 365090 }, { "epoch": 0.64, "learning_rate": 1.8165473271553484e-05, "loss": 2.2592, "step": 365100 }, { "epoch": 0.64, "learning_rate": 1.8164601331626658e-05, "loss": 2.4451, "step": 365110 }, { "epoch": 0.64, "learning_rate": 1.816372939169983e-05, "loss": 2.247, "step": 365120 }, { "epoch": 0.64, "learning_rate": 1.8162857451773002e-05, "loss": 2.375, "step": 365130 }, { "epoch": 0.64, "learning_rate": 1.8161985511846176e-05, "loss": 2.2855, "step": 365140 }, { "epoch": 0.64, "learning_rate": 1.816111357191935e-05, "loss": 2.2778, "step": 365150 }, { "epoch": 0.64, "learning_rate": 1.8160241631992524e-05, "loss": 2.3418, "step": 365160 }, { "epoch": 0.64, "learning_rate": 1.8159369692065697e-05, "loss": 2.3203, "step": 365170 }, { "epoch": 0.64, "learning_rate": 1.815849775213887e-05, "loss": 2.3179, "step": 365180 }, { "epoch": 0.64, "learning_rate": 1.815762581221204e-05, "loss": 2.2526, "step": 365190 }, { "epoch": 0.64, "learning_rate": 1.8156753872285215e-05, "loss": 2.3804, "step": 365200 }, { "epoch": 0.64, "learning_rate": 1.815588193235839e-05, "loss": 2.2074, "step": 365210 }, { "epoch": 0.64, "learning_rate": 1.8155009992431563e-05, "loss": 2.3762, "step": 365220 }, { "epoch": 0.64, "learning_rate": 1.8154138052504733e-05, "loss": 2.408, "step": 365230 }, { "epoch": 0.64, "learning_rate": 1.8153266112577907e-05, "loss": 2.3609, "step": 365240 }, { "epoch": 0.64, "learning_rate": 1.8152394172651084e-05, "loss": 2.3435, "step": 365250 }, { "epoch": 0.64, "learning_rate": 1.8151522232724255e-05, "loss": 2.3621, "step": 365260 }, { "epoch": 0.64, "learning_rate": 1.815065029279743e-05, "loss": 2.3359, "step": 365270 }, { "epoch": 0.64, "learning_rate": 1.8149778352870602e-05, "loss": 2.1998, "step": 365280 }, { "epoch": 0.64, "learning_rate": 1.8148906412943776e-05, "loss": 2.3272, "step": 365290 }, { "epoch": 0.64, "learning_rate": 1.8148034473016946e-05, "loss": 2.3719, "step": 365300 }, { "epoch": 0.64, "learning_rate": 1.814716253309012e-05, "loss": 2.3375, "step": 365310 }, { "epoch": 0.64, "learning_rate": 1.8146290593163294e-05, "loss": 2.42, "step": 365320 }, { "epoch": 0.64, "learning_rate": 1.8145418653236468e-05, "loss": 2.3294, "step": 365330 }, { "epoch": 0.64, "learning_rate": 1.814454671330964e-05, "loss": 2.3689, "step": 365340 }, { "epoch": 0.64, "learning_rate": 1.8143674773382812e-05, "loss": 2.2013, "step": 365350 }, { "epoch": 0.64, "learning_rate": 1.814280283345599e-05, "loss": 2.3836, "step": 365360 }, { "epoch": 0.64, "learning_rate": 1.814193089352916e-05, "loss": 2.324, "step": 365370 }, { "epoch": 0.64, "learning_rate": 1.8141058953602333e-05, "loss": 2.2682, "step": 365380 }, { "epoch": 0.64, "learning_rate": 1.8140187013675507e-05, "loss": 2.367, "step": 365390 }, { "epoch": 0.64, "learning_rate": 1.813931507374868e-05, "loss": 2.3515, "step": 365400 }, { "epoch": 0.64, "learning_rate": 1.8138443133821854e-05, "loss": 2.226, "step": 365410 }, { "epoch": 0.64, "learning_rate": 1.8137571193895025e-05, "loss": 2.3157, "step": 365420 }, { "epoch": 0.64, "learning_rate": 1.8136699253968202e-05, "loss": 2.3486, "step": 365430 }, { "epoch": 0.64, "learning_rate": 1.8135827314041372e-05, "loss": 2.354, "step": 365440 }, { "epoch": 0.64, "learning_rate": 1.8134955374114546e-05, "loss": 2.3805, "step": 365450 }, { "epoch": 0.64, "learning_rate": 1.8134083434187716e-05, "loss": 2.3854, "step": 365460 }, { "epoch": 0.64, "learning_rate": 1.8133211494260894e-05, "loss": 2.3555, "step": 365470 }, { "epoch": 0.64, "learning_rate": 1.8132339554334067e-05, "loss": 2.2931, "step": 365480 }, { "epoch": 0.64, "learning_rate": 1.8131467614407238e-05, "loss": 2.5155, "step": 365490 }, { "epoch": 0.64, "learning_rate": 1.813059567448041e-05, "loss": 2.2672, "step": 365500 }, { "epoch": 0.64, "learning_rate": 1.8129723734553585e-05, "loss": 2.4609, "step": 365510 }, { "epoch": 0.64, "learning_rate": 1.812885179462676e-05, "loss": 2.2929, "step": 365520 }, { "epoch": 0.64, "learning_rate": 1.812797985469993e-05, "loss": 2.3108, "step": 365530 }, { "epoch": 0.64, "learning_rate": 1.8127107914773107e-05, "loss": 2.2786, "step": 365540 }, { "epoch": 0.64, "learning_rate": 1.8126235974846277e-05, "loss": 2.4305, "step": 365550 }, { "epoch": 0.64, "learning_rate": 1.812536403491945e-05, "loss": 2.2135, "step": 365560 }, { "epoch": 0.64, "learning_rate": 1.8124492094992625e-05, "loss": 2.3245, "step": 365570 }, { "epoch": 0.64, "learning_rate": 1.81236201550658e-05, "loss": 2.2409, "step": 365580 }, { "epoch": 0.64, "learning_rate": 1.8122748215138972e-05, "loss": 2.3919, "step": 365590 }, { "epoch": 0.64, "learning_rate": 1.8121876275212142e-05, "loss": 2.2739, "step": 365600 }, { "epoch": 0.64, "learning_rate": 1.8121004335285316e-05, "loss": 2.3931, "step": 365610 }, { "epoch": 0.64, "learning_rate": 1.812013239535849e-05, "loss": 2.2801, "step": 365620 }, { "epoch": 0.64, "learning_rate": 1.8119260455431664e-05, "loss": 2.3051, "step": 365630 }, { "epoch": 0.64, "learning_rate": 1.8118388515504838e-05, "loss": 2.2404, "step": 365640 }, { "epoch": 0.64, "learning_rate": 1.8117516575578008e-05, "loss": 2.2554, "step": 365650 }, { "epoch": 0.64, "learning_rate": 1.8116644635651185e-05, "loss": 2.167, "step": 365660 }, { "epoch": 0.64, "learning_rate": 1.8115772695724355e-05, "loss": 2.2468, "step": 365670 }, { "epoch": 0.64, "learning_rate": 1.811490075579753e-05, "loss": 2.2517, "step": 365680 }, { "epoch": 0.64, "learning_rate": 1.8114028815870703e-05, "loss": 2.3684, "step": 365690 }, { "epoch": 0.64, "learning_rate": 1.8113156875943877e-05, "loss": 2.3554, "step": 365700 }, { "epoch": 0.64, "learning_rate": 1.8112284936017047e-05, "loss": 2.3183, "step": 365710 }, { "epoch": 0.64, "learning_rate": 1.811141299609022e-05, "loss": 2.315, "step": 365720 }, { "epoch": 0.64, "learning_rate": 1.8110541056163398e-05, "loss": 2.297, "step": 365730 }, { "epoch": 0.64, "learning_rate": 1.810966911623657e-05, "loss": 2.3822, "step": 365740 }, { "epoch": 0.64, "learning_rate": 1.8108797176309742e-05, "loss": 2.4429, "step": 365750 }, { "epoch": 0.64, "learning_rate": 1.8107925236382913e-05, "loss": 2.2189, "step": 365760 }, { "epoch": 0.64, "learning_rate": 1.810705329645609e-05, "loss": 2.3305, "step": 365770 }, { "epoch": 0.64, "learning_rate": 1.810618135652926e-05, "loss": 2.3011, "step": 365780 }, { "epoch": 0.64, "learning_rate": 1.8105309416602434e-05, "loss": 2.3394, "step": 365790 }, { "epoch": 0.64, "learning_rate": 1.8104437476675608e-05, "loss": 2.272, "step": 365800 }, { "epoch": 0.64, "learning_rate": 1.810356553674878e-05, "loss": 2.2718, "step": 365810 }, { "epoch": 0.64, "learning_rate": 1.8102693596821955e-05, "loss": 2.2438, "step": 365820 }, { "epoch": 0.64, "learning_rate": 1.8101821656895126e-05, "loss": 2.2762, "step": 365830 }, { "epoch": 0.64, "learning_rate": 1.8100949716968303e-05, "loss": 2.2704, "step": 365840 }, { "epoch": 0.64, "learning_rate": 1.8100077777041473e-05, "loss": 2.3083, "step": 365850 }, { "epoch": 0.64, "learning_rate": 1.8099205837114647e-05, "loss": 2.3868, "step": 365860 }, { "epoch": 0.64, "learning_rate": 1.809833389718782e-05, "loss": 2.1597, "step": 365870 }, { "epoch": 0.64, "learning_rate": 1.8097461957260994e-05, "loss": 2.3584, "step": 365880 }, { "epoch": 0.64, "learning_rate": 1.8096590017334168e-05, "loss": 2.2935, "step": 365890 }, { "epoch": 0.64, "learning_rate": 1.809571807740734e-05, "loss": 2.3426, "step": 365900 }, { "epoch": 0.64, "learning_rate": 1.8094846137480512e-05, "loss": 2.4063, "step": 365910 }, { "epoch": 0.64, "learning_rate": 1.8093974197553686e-05, "loss": 2.2775, "step": 365920 }, { "epoch": 0.64, "learning_rate": 1.809310225762686e-05, "loss": 2.3403, "step": 365930 }, { "epoch": 0.64, "learning_rate": 1.809223031770003e-05, "loss": 2.3854, "step": 365940 }, { "epoch": 0.64, "learning_rate": 1.8091358377773207e-05, "loss": 2.2881, "step": 365950 }, { "epoch": 0.64, "learning_rate": 1.8090486437846378e-05, "loss": 2.3447, "step": 365960 }, { "epoch": 0.64, "learning_rate": 1.808961449791955e-05, "loss": 2.3196, "step": 365970 }, { "epoch": 0.64, "learning_rate": 1.8088742557992725e-05, "loss": 2.3801, "step": 365980 }, { "epoch": 0.64, "learning_rate": 1.80878706180659e-05, "loss": 2.3133, "step": 365990 }, { "epoch": 0.64, "learning_rate": 1.8086998678139073e-05, "loss": 2.3152, "step": 366000 }, { "epoch": 0.64, "learning_rate": 1.8086126738212243e-05, "loss": 2.2818, "step": 366010 }, { "epoch": 0.64, "learning_rate": 1.8085254798285417e-05, "loss": 2.2855, "step": 366020 }, { "epoch": 0.64, "learning_rate": 1.808438285835859e-05, "loss": 2.4015, "step": 366030 }, { "epoch": 0.64, "learning_rate": 1.8083510918431765e-05, "loss": 2.3098, "step": 366040 }, { "epoch": 0.64, "learning_rate": 1.808263897850494e-05, "loss": 2.366, "step": 366050 }, { "epoch": 0.64, "learning_rate": 1.808176703857811e-05, "loss": 2.3207, "step": 366060 }, { "epoch": 0.64, "learning_rate": 1.8080895098651286e-05, "loss": 2.4126, "step": 366070 }, { "epoch": 0.64, "learning_rate": 1.8080023158724456e-05, "loss": 2.3586, "step": 366080 }, { "epoch": 0.64, "learning_rate": 1.807915121879763e-05, "loss": 2.2742, "step": 366090 }, { "epoch": 0.64, "learning_rate": 1.8078279278870804e-05, "loss": 2.2679, "step": 366100 }, { "epoch": 0.64, "learning_rate": 1.8077407338943978e-05, "loss": 2.3185, "step": 366110 }, { "epoch": 0.64, "learning_rate": 1.807653539901715e-05, "loss": 2.243, "step": 366120 }, { "epoch": 0.64, "learning_rate": 1.8075663459090322e-05, "loss": 2.2526, "step": 366130 }, { "epoch": 0.64, "learning_rate": 1.80747915191635e-05, "loss": 2.368, "step": 366140 }, { "epoch": 0.64, "learning_rate": 1.807391957923667e-05, "loss": 2.3412, "step": 366150 }, { "epoch": 0.64, "learning_rate": 1.8073047639309843e-05, "loss": 2.4722, "step": 366160 }, { "epoch": 0.64, "learning_rate": 1.8072175699383013e-05, "loss": 2.2742, "step": 366170 }, { "epoch": 0.64, "learning_rate": 1.807130375945619e-05, "loss": 2.3399, "step": 366180 }, { "epoch": 0.64, "learning_rate": 1.807043181952936e-05, "loss": 2.1444, "step": 366190 }, { "epoch": 0.64, "learning_rate": 1.8069559879602535e-05, "loss": 2.3074, "step": 366200 }, { "epoch": 0.64, "learning_rate": 1.8068687939675712e-05, "loss": 2.33, "step": 366210 }, { "epoch": 0.64, "learning_rate": 1.8067815999748882e-05, "loss": 2.2563, "step": 366220 }, { "epoch": 0.64, "learning_rate": 1.8066944059822056e-05, "loss": 2.2633, "step": 366230 }, { "epoch": 0.64, "learning_rate": 1.8066072119895226e-05, "loss": 2.3339, "step": 366240 }, { "epoch": 0.64, "learning_rate": 1.8065200179968404e-05, "loss": 2.2759, "step": 366250 }, { "epoch": 0.64, "learning_rate": 1.8064328240041574e-05, "loss": 2.3839, "step": 366260 }, { "epoch": 0.64, "learning_rate": 1.8063456300114748e-05, "loss": 2.3094, "step": 366270 }, { "epoch": 0.64, "learning_rate": 1.806258436018792e-05, "loss": 2.3467, "step": 366280 }, { "epoch": 0.64, "learning_rate": 1.8061712420261095e-05, "loss": 2.221, "step": 366290 }, { "epoch": 0.64, "learning_rate": 1.806084048033427e-05, "loss": 2.3069, "step": 366300 }, { "epoch": 0.64, "learning_rate": 1.805996854040744e-05, "loss": 2.3046, "step": 366310 }, { "epoch": 0.64, "learning_rate": 1.8059096600480613e-05, "loss": 2.4411, "step": 366320 }, { "epoch": 0.64, "learning_rate": 1.8058224660553787e-05, "loss": 2.2848, "step": 366330 }, { "epoch": 0.64, "learning_rate": 1.805735272062696e-05, "loss": 2.3552, "step": 366340 }, { "epoch": 0.64, "learning_rate": 1.8056480780700135e-05, "loss": 2.3911, "step": 366350 }, { "epoch": 0.64, "learning_rate": 1.805560884077331e-05, "loss": 2.2975, "step": 366360 }, { "epoch": 0.64, "learning_rate": 1.8054736900846482e-05, "loss": 2.3226, "step": 366370 }, { "epoch": 0.64, "learning_rate": 1.8053864960919652e-05, "loss": 2.3752, "step": 366380 }, { "epoch": 0.64, "learning_rate": 1.8052993020992826e-05, "loss": 2.2751, "step": 366390 }, { "epoch": 0.64, "learning_rate": 1.8052121081066e-05, "loss": 2.247, "step": 366400 }, { "epoch": 0.64, "learning_rate": 1.8051249141139174e-05, "loss": 2.3006, "step": 366410 }, { "epoch": 0.64, "learning_rate": 1.8050377201212344e-05, "loss": 2.2676, "step": 366420 }, { "epoch": 0.64, "learning_rate": 1.8049505261285518e-05, "loss": 2.2878, "step": 366430 }, { "epoch": 0.64, "learning_rate": 1.8048633321358692e-05, "loss": 2.2327, "step": 366440 }, { "epoch": 0.64, "learning_rate": 1.8047761381431865e-05, "loss": 2.3243, "step": 366450 }, { "epoch": 0.64, "learning_rate": 1.804688944150504e-05, "loss": 2.2575, "step": 366460 }, { "epoch": 0.64, "learning_rate": 1.8046017501578213e-05, "loss": 2.3724, "step": 366470 }, { "epoch": 0.64, "learning_rate": 1.8045145561651387e-05, "loss": 2.3156, "step": 366480 }, { "epoch": 0.64, "learning_rate": 1.8044273621724557e-05, "loss": 2.2972, "step": 366490 }, { "epoch": 0.64, "learning_rate": 1.804340168179773e-05, "loss": 2.3457, "step": 366500 }, { "epoch": 0.64, "learning_rate": 1.8042529741870905e-05, "loss": 2.3348, "step": 366510 }, { "epoch": 0.64, "learning_rate": 1.804165780194408e-05, "loss": 2.2909, "step": 366520 }, { "epoch": 0.64, "learning_rate": 1.8040785862017252e-05, "loss": 2.3104, "step": 366530 }, { "epoch": 0.64, "learning_rate": 1.8039913922090423e-05, "loss": 2.3939, "step": 366540 }, { "epoch": 0.64, "learning_rate": 1.80390419821636e-05, "loss": 2.3492, "step": 366550 }, { "epoch": 0.64, "learning_rate": 1.803817004223677e-05, "loss": 2.4067, "step": 366560 }, { "epoch": 0.64, "learning_rate": 1.8037298102309944e-05, "loss": 2.2796, "step": 366570 }, { "epoch": 0.64, "learning_rate": 1.8036426162383114e-05, "loss": 2.2979, "step": 366580 }, { "epoch": 0.64, "learning_rate": 1.803555422245629e-05, "loss": 2.4105, "step": 366590 }, { "epoch": 0.64, "learning_rate": 1.8034682282529465e-05, "loss": 2.3129, "step": 366600 }, { "epoch": 0.64, "learning_rate": 1.8033810342602636e-05, "loss": 2.3748, "step": 366610 }, { "epoch": 0.64, "learning_rate": 1.8032938402675813e-05, "loss": 2.2936, "step": 366620 }, { "epoch": 0.64, "learning_rate": 1.8032066462748983e-05, "loss": 2.3588, "step": 366630 }, { "epoch": 0.64, "learning_rate": 1.8031194522822157e-05, "loss": 2.2269, "step": 366640 }, { "epoch": 0.64, "learning_rate": 1.8030322582895327e-05, "loss": 2.252, "step": 366650 }, { "epoch": 0.64, "learning_rate": 1.8029450642968504e-05, "loss": 2.3524, "step": 366660 }, { "epoch": 0.64, "learning_rate": 1.8028578703041675e-05, "loss": 2.4, "step": 366670 }, { "epoch": 0.64, "learning_rate": 1.802770676311485e-05, "loss": 2.2691, "step": 366680 }, { "epoch": 0.64, "learning_rate": 1.8026834823188022e-05, "loss": 2.3402, "step": 366690 }, { "epoch": 0.64, "learning_rate": 1.8025962883261196e-05, "loss": 2.2516, "step": 366700 }, { "epoch": 0.64, "learning_rate": 1.802509094333437e-05, "loss": 2.3277, "step": 366710 }, { "epoch": 0.64, "learning_rate": 1.802421900340754e-05, "loss": 2.313, "step": 366720 }, { "epoch": 0.64, "learning_rate": 1.8023347063480717e-05, "loss": 2.2978, "step": 366730 }, { "epoch": 0.64, "learning_rate": 1.8022475123553888e-05, "loss": 2.2247, "step": 366740 }, { "epoch": 0.64, "learning_rate": 1.802160318362706e-05, "loss": 2.3042, "step": 366750 }, { "epoch": 0.64, "learning_rate": 1.8020731243700235e-05, "loss": 2.2642, "step": 366760 }, { "epoch": 0.64, "learning_rate": 1.801985930377341e-05, "loss": 2.249, "step": 366770 }, { "epoch": 0.64, "learning_rate": 1.8018987363846583e-05, "loss": 2.3493, "step": 366780 }, { "epoch": 0.64, "learning_rate": 1.8018115423919753e-05, "loss": 2.3282, "step": 366790 }, { "epoch": 0.64, "learning_rate": 1.8017243483992927e-05, "loss": 2.403, "step": 366800 }, { "epoch": 0.64, "learning_rate": 1.80163715440661e-05, "loss": 2.259, "step": 366810 }, { "epoch": 0.64, "learning_rate": 1.8015499604139275e-05, "loss": 2.3331, "step": 366820 }, { "epoch": 0.64, "learning_rate": 1.801462766421245e-05, "loss": 2.3919, "step": 366830 }, { "epoch": 0.64, "learning_rate": 1.801375572428562e-05, "loss": 2.3615, "step": 366840 }, { "epoch": 0.64, "learning_rate": 1.8012883784358796e-05, "loss": 2.2782, "step": 366850 }, { "epoch": 0.64, "learning_rate": 1.8012011844431966e-05, "loss": 2.2357, "step": 366860 }, { "epoch": 0.64, "learning_rate": 1.801113990450514e-05, "loss": 2.3851, "step": 366870 }, { "epoch": 0.64, "learning_rate": 1.8010267964578314e-05, "loss": 2.2684, "step": 366880 }, { "epoch": 0.64, "learning_rate": 1.8009396024651488e-05, "loss": 2.3203, "step": 366890 }, { "epoch": 0.64, "learning_rate": 1.8008524084724658e-05, "loss": 2.3701, "step": 366900 }, { "epoch": 0.64, "learning_rate": 1.8007652144797832e-05, "loss": 2.2405, "step": 366910 }, { "epoch": 0.64, "learning_rate": 1.8006780204871006e-05, "loss": 2.3398, "step": 366920 }, { "epoch": 0.64, "learning_rate": 1.800590826494418e-05, "loss": 2.299, "step": 366930 }, { "epoch": 0.64, "learning_rate": 1.8005036325017353e-05, "loss": 2.3422, "step": 366940 }, { "epoch": 0.64, "learning_rate": 1.8004164385090523e-05, "loss": 2.2719, "step": 366950 }, { "epoch": 0.64, "learning_rate": 1.80032924451637e-05, "loss": 2.306, "step": 366960 }, { "epoch": 0.64, "learning_rate": 1.800242050523687e-05, "loss": 2.3691, "step": 366970 }, { "epoch": 0.64, "learning_rate": 1.8001548565310045e-05, "loss": 2.3415, "step": 366980 }, { "epoch": 0.64, "learning_rate": 1.800067662538322e-05, "loss": 2.3881, "step": 366990 }, { "epoch": 0.64, "learning_rate": 1.7999804685456392e-05, "loss": 2.272, "step": 367000 }, { "epoch": 0.64, "learning_rate": 1.7998932745529566e-05, "loss": 2.3458, "step": 367010 }, { "epoch": 0.64, "learning_rate": 1.7998060805602736e-05, "loss": 2.3743, "step": 367020 }, { "epoch": 0.64, "learning_rate": 1.7997188865675914e-05, "loss": 2.2767, "step": 367030 }, { "epoch": 0.64, "learning_rate": 1.7996316925749084e-05, "loss": 2.3521, "step": 367040 }, { "epoch": 0.64, "learning_rate": 1.7995444985822258e-05, "loss": 2.362, "step": 367050 }, { "epoch": 0.64, "learning_rate": 1.7994573045895428e-05, "loss": 2.4004, "step": 367060 }, { "epoch": 0.64, "learning_rate": 1.7993701105968605e-05, "loss": 2.254, "step": 367070 }, { "epoch": 0.64, "learning_rate": 1.799282916604178e-05, "loss": 2.3756, "step": 367080 }, { "epoch": 0.64, "learning_rate": 1.799195722611495e-05, "loss": 2.2689, "step": 367090 }, { "epoch": 0.64, "learning_rate": 1.7991085286188123e-05, "loss": 2.3543, "step": 367100 }, { "epoch": 0.64, "learning_rate": 1.7990213346261297e-05, "loss": 2.3548, "step": 367110 }, { "epoch": 0.64, "learning_rate": 1.798934140633447e-05, "loss": 2.1875, "step": 367120 }, { "epoch": 0.64, "learning_rate": 1.798846946640764e-05, "loss": 2.257, "step": 367130 }, { "epoch": 0.64, "learning_rate": 1.798759752648082e-05, "loss": 2.2737, "step": 367140 }, { "epoch": 0.64, "learning_rate": 1.798672558655399e-05, "loss": 2.3268, "step": 367150 }, { "epoch": 0.64, "learning_rate": 1.7985853646627162e-05, "loss": 2.2289, "step": 367160 }, { "epoch": 0.64, "learning_rate": 1.7984981706700336e-05, "loss": 2.3061, "step": 367170 }, { "epoch": 0.64, "learning_rate": 1.798410976677351e-05, "loss": 2.29, "step": 367180 }, { "epoch": 0.64, "learning_rate": 1.7983237826846684e-05, "loss": 2.2574, "step": 367190 }, { "epoch": 0.64, "learning_rate": 1.7982365886919854e-05, "loss": 2.3941, "step": 367200 }, { "epoch": 0.64, "learning_rate": 1.7981493946993028e-05, "loss": 2.3758, "step": 367210 }, { "epoch": 0.64, "learning_rate": 1.7980622007066202e-05, "loss": 2.2931, "step": 367220 }, { "epoch": 0.64, "learning_rate": 1.7979750067139375e-05, "loss": 2.3633, "step": 367230 }, { "epoch": 0.64, "learning_rate": 1.797887812721255e-05, "loss": 2.287, "step": 367240 }, { "epoch": 0.64, "learning_rate": 1.797800618728572e-05, "loss": 2.3715, "step": 367250 }, { "epoch": 0.64, "learning_rate": 1.7977134247358897e-05, "loss": 2.3147, "step": 367260 }, { "epoch": 0.64, "learning_rate": 1.7976262307432067e-05, "loss": 2.2337, "step": 367270 }, { "epoch": 0.64, "learning_rate": 1.797539036750524e-05, "loss": 2.3572, "step": 367280 }, { "epoch": 0.64, "learning_rate": 1.7974518427578415e-05, "loss": 2.2335, "step": 367290 }, { "epoch": 0.64, "learning_rate": 1.797364648765159e-05, "loss": 2.358, "step": 367300 }, { "epoch": 0.64, "learning_rate": 1.797277454772476e-05, "loss": 2.3659, "step": 367310 }, { "epoch": 0.64, "learning_rate": 1.7971902607797933e-05, "loss": 2.3677, "step": 367320 }, { "epoch": 0.64, "learning_rate": 1.797103066787111e-05, "loss": 2.2867, "step": 367330 }, { "epoch": 0.64, "learning_rate": 1.797015872794428e-05, "loss": 2.3042, "step": 367340 }, { "epoch": 0.64, "learning_rate": 1.7969286788017454e-05, "loss": 2.1841, "step": 367350 }, { "epoch": 0.64, "learning_rate": 1.7968414848090624e-05, "loss": 2.1709, "step": 367360 }, { "epoch": 0.64, "learning_rate": 1.79675429081638e-05, "loss": 2.4265, "step": 367370 }, { "epoch": 0.64, "learning_rate": 1.7966670968236972e-05, "loss": 2.279, "step": 367380 }, { "epoch": 0.64, "learning_rate": 1.7965799028310146e-05, "loss": 2.3271, "step": 367390 }, { "epoch": 0.64, "learning_rate": 1.796492708838332e-05, "loss": 2.3749, "step": 367400 }, { "epoch": 0.64, "learning_rate": 1.7964055148456493e-05, "loss": 2.3127, "step": 367410 }, { "epoch": 0.64, "learning_rate": 1.7963183208529667e-05, "loss": 2.168, "step": 367420 }, { "epoch": 0.64, "learning_rate": 1.7962311268602837e-05, "loss": 2.4241, "step": 367430 }, { "epoch": 0.64, "learning_rate": 1.7961439328676014e-05, "loss": 2.369, "step": 367440 }, { "epoch": 0.64, "learning_rate": 1.7960567388749185e-05, "loss": 2.3671, "step": 367450 }, { "epoch": 0.64, "learning_rate": 1.795969544882236e-05, "loss": 2.353, "step": 367460 }, { "epoch": 0.64, "learning_rate": 1.7958823508895532e-05, "loss": 2.229, "step": 367470 }, { "epoch": 0.64, "learning_rate": 1.7957951568968706e-05, "loss": 2.4086, "step": 367480 }, { "epoch": 0.64, "learning_rate": 1.795707962904188e-05, "loss": 2.2235, "step": 367490 }, { "epoch": 0.64, "learning_rate": 1.795620768911505e-05, "loss": 2.257, "step": 367500 }, { "epoch": 0.64, "learning_rate": 1.7955335749188224e-05, "loss": 2.253, "step": 367510 }, { "epoch": 0.64, "learning_rate": 1.7954463809261398e-05, "loss": 2.3455, "step": 367520 }, { "epoch": 0.64, "learning_rate": 1.795359186933457e-05, "loss": 2.2418, "step": 367530 }, { "epoch": 0.64, "learning_rate": 1.7952719929407742e-05, "loss": 2.3326, "step": 367540 }, { "epoch": 0.64, "learning_rate": 1.795184798948092e-05, "loss": 2.3227, "step": 367550 }, { "epoch": 0.64, "learning_rate": 1.7950976049554093e-05, "loss": 2.4294, "step": 367560 }, { "epoch": 0.64, "learning_rate": 1.7950104109627263e-05, "loss": 2.262, "step": 367570 }, { "epoch": 0.64, "learning_rate": 1.7949232169700437e-05, "loss": 2.2688, "step": 367580 }, { "epoch": 0.64, "learning_rate": 1.794836022977361e-05, "loss": 2.3297, "step": 367590 }, { "epoch": 0.64, "learning_rate": 1.7947488289846785e-05, "loss": 2.3365, "step": 367600 }, { "epoch": 0.64, "learning_rate": 1.7946616349919955e-05, "loss": 2.2786, "step": 367610 }, { "epoch": 0.64, "learning_rate": 1.794574440999313e-05, "loss": 2.3415, "step": 367620 }, { "epoch": 0.64, "learning_rate": 1.7944872470066303e-05, "loss": 2.3366, "step": 367630 }, { "epoch": 0.64, "learning_rate": 1.7944000530139476e-05, "loss": 2.3095, "step": 367640 }, { "epoch": 0.64, "learning_rate": 1.794312859021265e-05, "loss": 2.3437, "step": 367650 }, { "epoch": 0.64, "learning_rate": 1.7942256650285824e-05, "loss": 2.3398, "step": 367660 }, { "epoch": 0.64, "learning_rate": 1.7941384710358998e-05, "loss": 2.3077, "step": 367670 }, { "epoch": 0.64, "learning_rate": 1.7940512770432168e-05, "loss": 2.3164, "step": 367680 }, { "epoch": 0.64, "learning_rate": 1.7939640830505342e-05, "loss": 2.286, "step": 367690 }, { "epoch": 0.64, "learning_rate": 1.7938768890578516e-05, "loss": 2.3361, "step": 367700 }, { "epoch": 0.64, "learning_rate": 1.793789695065169e-05, "loss": 2.346, "step": 367710 }, { "epoch": 0.64, "learning_rate": 1.7937025010724863e-05, "loss": 2.286, "step": 367720 }, { "epoch": 0.64, "learning_rate": 1.7936153070798033e-05, "loss": 2.3006, "step": 367730 }, { "epoch": 0.64, "learning_rate": 1.793528113087121e-05, "loss": 2.3208, "step": 367740 }, { "epoch": 0.64, "learning_rate": 1.793440919094438e-05, "loss": 2.2563, "step": 367750 }, { "epoch": 0.64, "learning_rate": 1.7933537251017555e-05, "loss": 2.3289, "step": 367760 }, { "epoch": 0.64, "learning_rate": 1.7932665311090725e-05, "loss": 2.3873, "step": 367770 }, { "epoch": 0.64, "learning_rate": 1.7931793371163902e-05, "loss": 2.3812, "step": 367780 }, { "epoch": 0.64, "learning_rate": 1.7930921431237073e-05, "loss": 2.1399, "step": 367790 }, { "epoch": 0.64, "learning_rate": 1.7930049491310246e-05, "loss": 2.3676, "step": 367800 }, { "epoch": 0.64, "learning_rate": 1.7929177551383424e-05, "loss": 2.3703, "step": 367810 }, { "epoch": 0.64, "learning_rate": 1.7928305611456594e-05, "loss": 2.2461, "step": 367820 }, { "epoch": 0.64, "learning_rate": 1.7927433671529768e-05, "loss": 2.4244, "step": 367830 }, { "epoch": 0.64, "learning_rate": 1.7926561731602938e-05, "loss": 2.3608, "step": 367840 }, { "epoch": 0.64, "learning_rate": 1.7925689791676115e-05, "loss": 2.1651, "step": 367850 }, { "epoch": 0.64, "learning_rate": 1.7924817851749286e-05, "loss": 2.1991, "step": 367860 }, { "epoch": 0.64, "learning_rate": 1.792394591182246e-05, "loss": 2.3632, "step": 367870 }, { "epoch": 0.64, "learning_rate": 1.7923073971895633e-05, "loss": 2.3254, "step": 367880 }, { "epoch": 0.64, "learning_rate": 1.7922202031968807e-05, "loss": 2.3457, "step": 367890 }, { "epoch": 0.64, "learning_rate": 1.792133009204198e-05, "loss": 2.456, "step": 367900 }, { "epoch": 0.64, "learning_rate": 1.792045815211515e-05, "loss": 2.3348, "step": 367910 }, { "epoch": 0.64, "learning_rate": 1.7919586212188325e-05, "loss": 2.2944, "step": 367920 }, { "epoch": 0.64, "learning_rate": 1.79187142722615e-05, "loss": 2.3344, "step": 367930 }, { "epoch": 0.64, "learning_rate": 1.7917842332334672e-05, "loss": 2.3258, "step": 367940 }, { "epoch": 0.64, "learning_rate": 1.7916970392407846e-05, "loss": 2.3802, "step": 367950 }, { "epoch": 0.64, "learning_rate": 1.791609845248102e-05, "loss": 2.3447, "step": 367960 }, { "epoch": 0.64, "learning_rate": 1.7915226512554194e-05, "loss": 2.42, "step": 367970 }, { "epoch": 0.64, "learning_rate": 1.7914354572627364e-05, "loss": 2.3699, "step": 367980 }, { "epoch": 0.64, "learning_rate": 1.7913482632700538e-05, "loss": 2.3382, "step": 367990 }, { "epoch": 0.64, "learning_rate": 1.7912610692773712e-05, "loss": 2.3039, "step": 368000 }, { "epoch": 0.64, "learning_rate": 1.7911738752846885e-05, "loss": 2.3909, "step": 368010 }, { "epoch": 0.64, "learning_rate": 1.7910866812920056e-05, "loss": 2.2862, "step": 368020 }, { "epoch": 0.64, "learning_rate": 1.790999487299323e-05, "loss": 2.312, "step": 368030 }, { "epoch": 0.64, "learning_rate": 1.7909122933066403e-05, "loss": 2.3084, "step": 368040 }, { "epoch": 0.64, "learning_rate": 1.7908250993139577e-05, "loss": 2.3159, "step": 368050 }, { "epoch": 0.64, "learning_rate": 1.790737905321275e-05, "loss": 2.3951, "step": 368060 }, { "epoch": 0.64, "learning_rate": 1.7906507113285925e-05, "loss": 2.2927, "step": 368070 }, { "epoch": 0.64, "learning_rate": 1.79056351733591e-05, "loss": 2.2806, "step": 368080 }, { "epoch": 0.64, "learning_rate": 1.790476323343227e-05, "loss": 2.2613, "step": 368090 }, { "epoch": 0.64, "learning_rate": 1.7903891293505443e-05, "loss": 2.378, "step": 368100 }, { "epoch": 0.64, "learning_rate": 1.7903019353578616e-05, "loss": 2.1855, "step": 368110 }, { "epoch": 0.64, "learning_rate": 1.790214741365179e-05, "loss": 2.3562, "step": 368120 }, { "epoch": 0.64, "learning_rate": 1.7901275473724964e-05, "loss": 2.235, "step": 368130 }, { "epoch": 0.64, "learning_rate": 1.7900403533798134e-05, "loss": 2.2346, "step": 368140 }, { "epoch": 0.64, "learning_rate": 1.789953159387131e-05, "loss": 2.325, "step": 368150 }, { "epoch": 0.64, "learning_rate": 1.7898659653944482e-05, "loss": 2.3711, "step": 368160 }, { "epoch": 0.64, "learning_rate": 1.7897787714017656e-05, "loss": 2.3881, "step": 368170 }, { "epoch": 0.64, "learning_rate": 1.789691577409083e-05, "loss": 2.3227, "step": 368180 }, { "epoch": 0.64, "learning_rate": 1.7896043834164003e-05, "loss": 2.3164, "step": 368190 }, { "epoch": 0.64, "learning_rate": 1.7895171894237177e-05, "loss": 2.2621, "step": 368200 }, { "epoch": 0.64, "learning_rate": 1.7894299954310347e-05, "loss": 2.3882, "step": 368210 }, { "epoch": 0.64, "learning_rate": 1.7893428014383524e-05, "loss": 2.4207, "step": 368220 }, { "epoch": 0.64, "learning_rate": 1.7892556074456695e-05, "loss": 2.3441, "step": 368230 }, { "epoch": 0.64, "learning_rate": 1.789168413452987e-05, "loss": 2.2926, "step": 368240 }, { "epoch": 0.64, "learning_rate": 1.789081219460304e-05, "loss": 2.2808, "step": 368250 }, { "epoch": 0.64, "learning_rate": 1.7889940254676216e-05, "loss": 2.3045, "step": 368260 }, { "epoch": 0.64, "learning_rate": 1.7889068314749387e-05, "loss": 2.2529, "step": 368270 }, { "epoch": 0.64, "learning_rate": 1.788819637482256e-05, "loss": 2.2644, "step": 368280 }, { "epoch": 0.64, "learning_rate": 1.7887324434895734e-05, "loss": 2.4422, "step": 368290 }, { "epoch": 0.64, "learning_rate": 1.7886452494968908e-05, "loss": 2.2784, "step": 368300 }, { "epoch": 0.64, "learning_rate": 1.788558055504208e-05, "loss": 2.36, "step": 368310 }, { "epoch": 0.64, "learning_rate": 1.7884708615115252e-05, "loss": 2.332, "step": 368320 }, { "epoch": 0.64, "learning_rate": 1.788383667518843e-05, "loss": 2.3854, "step": 368330 }, { "epoch": 0.64, "learning_rate": 1.78829647352616e-05, "loss": 2.3409, "step": 368340 }, { "epoch": 0.64, "learning_rate": 1.7882092795334773e-05, "loss": 2.2649, "step": 368350 }, { "epoch": 0.64, "learning_rate": 1.7881220855407947e-05, "loss": 2.2047, "step": 368360 }, { "epoch": 0.64, "learning_rate": 1.788034891548112e-05, "loss": 2.318, "step": 368370 }, { "epoch": 0.64, "learning_rate": 1.7879476975554295e-05, "loss": 2.4245, "step": 368380 }, { "epoch": 0.64, "learning_rate": 1.7878605035627465e-05, "loss": 2.3921, "step": 368390 }, { "epoch": 0.64, "learning_rate": 1.787773309570064e-05, "loss": 2.3492, "step": 368400 }, { "epoch": 0.64, "learning_rate": 1.7876861155773813e-05, "loss": 2.211, "step": 368410 }, { "epoch": 0.64, "learning_rate": 1.7875989215846986e-05, "loss": 2.2346, "step": 368420 }, { "epoch": 0.64, "learning_rate": 1.787511727592016e-05, "loss": 2.4325, "step": 368430 }, { "epoch": 0.64, "learning_rate": 1.787424533599333e-05, "loss": 2.264, "step": 368440 }, { "epoch": 0.64, "learning_rate": 1.7873373396066508e-05, "loss": 2.2759, "step": 368450 }, { "epoch": 0.64, "learning_rate": 1.7872501456139678e-05, "loss": 2.3691, "step": 368460 }, { "epoch": 0.64, "learning_rate": 1.7871629516212852e-05, "loss": 2.3228, "step": 368470 }, { "epoch": 0.64, "learning_rate": 1.7870757576286026e-05, "loss": 2.3104, "step": 368480 }, { "epoch": 0.64, "learning_rate": 1.78698856363592e-05, "loss": 2.2349, "step": 368490 }, { "epoch": 0.64, "learning_rate": 1.786901369643237e-05, "loss": 2.3386, "step": 368500 }, { "epoch": 0.64, "learning_rate": 1.7868141756505543e-05, "loss": 2.2408, "step": 368510 }, { "epoch": 0.64, "learning_rate": 1.7867269816578717e-05, "loss": 2.2836, "step": 368520 }, { "epoch": 0.64, "learning_rate": 1.786639787665189e-05, "loss": 2.3632, "step": 368530 }, { "epoch": 0.64, "learning_rate": 1.7865525936725065e-05, "loss": 2.3333, "step": 368540 }, { "epoch": 0.64, "learning_rate": 1.7864653996798235e-05, "loss": 2.2414, "step": 368550 }, { "epoch": 0.64, "learning_rate": 1.7863782056871412e-05, "loss": 2.2204, "step": 368560 }, { "epoch": 0.64, "learning_rate": 1.7862910116944583e-05, "loss": 2.322, "step": 368570 }, { "epoch": 0.64, "learning_rate": 1.7862038177017756e-05, "loss": 2.2235, "step": 368580 }, { "epoch": 0.64, "learning_rate": 1.786116623709093e-05, "loss": 2.3417, "step": 368590 }, { "epoch": 0.64, "learning_rate": 1.7860294297164104e-05, "loss": 2.2092, "step": 368600 }, { "epoch": 0.64, "learning_rate": 1.7859422357237278e-05, "loss": 2.2998, "step": 368610 }, { "epoch": 0.64, "learning_rate": 1.7858550417310448e-05, "loss": 2.2887, "step": 368620 }, { "epoch": 0.64, "learning_rate": 1.7857678477383625e-05, "loss": 2.4211, "step": 368630 }, { "epoch": 0.64, "learning_rate": 1.7856806537456796e-05, "loss": 2.3275, "step": 368640 }, { "epoch": 0.64, "learning_rate": 1.785593459752997e-05, "loss": 2.3667, "step": 368650 }, { "epoch": 0.64, "learning_rate": 1.785506265760314e-05, "loss": 2.2972, "step": 368660 }, { "epoch": 0.64, "learning_rate": 1.7854190717676317e-05, "loss": 2.3442, "step": 368670 }, { "epoch": 0.64, "learning_rate": 1.785331877774949e-05, "loss": 2.3916, "step": 368680 }, { "epoch": 0.64, "learning_rate": 1.785244683782266e-05, "loss": 2.3442, "step": 368690 }, { "epoch": 0.64, "learning_rate": 1.7851574897895835e-05, "loss": 2.3497, "step": 368700 }, { "epoch": 0.64, "learning_rate": 1.785070295796901e-05, "loss": 2.2394, "step": 368710 }, { "epoch": 0.64, "learning_rate": 1.7849831018042182e-05, "loss": 2.3626, "step": 368720 }, { "epoch": 0.64, "learning_rate": 1.7848959078115353e-05, "loss": 2.3445, "step": 368730 }, { "epoch": 0.64, "learning_rate": 1.784808713818853e-05, "loss": 2.3113, "step": 368740 }, { "epoch": 0.64, "learning_rate": 1.78472151982617e-05, "loss": 2.3132, "step": 368750 }, { "epoch": 0.64, "learning_rate": 1.7846343258334874e-05, "loss": 2.3148, "step": 368760 }, { "epoch": 0.64, "learning_rate": 1.7845471318408048e-05, "loss": 2.402, "step": 368770 }, { "epoch": 0.64, "learning_rate": 1.7844599378481222e-05, "loss": 2.369, "step": 368780 }, { "epoch": 0.64, "learning_rate": 1.7843727438554395e-05, "loss": 2.2295, "step": 368790 }, { "epoch": 0.64, "learning_rate": 1.7842855498627566e-05, "loss": 2.3758, "step": 368800 }, { "epoch": 0.64, "learning_rate": 1.784198355870074e-05, "loss": 2.2951, "step": 368810 }, { "epoch": 0.64, "learning_rate": 1.7841111618773913e-05, "loss": 2.4163, "step": 368820 }, { "epoch": 0.64, "learning_rate": 1.7840239678847087e-05, "loss": 2.2301, "step": 368830 }, { "epoch": 0.64, "learning_rate": 1.783936773892026e-05, "loss": 2.1994, "step": 368840 }, { "epoch": 0.64, "learning_rate": 1.783849579899343e-05, "loss": 2.3791, "step": 368850 }, { "epoch": 0.64, "learning_rate": 1.783762385906661e-05, "loss": 2.3319, "step": 368860 }, { "epoch": 0.64, "learning_rate": 1.783675191913978e-05, "loss": 2.3782, "step": 368870 }, { "epoch": 0.64, "learning_rate": 1.7835879979212953e-05, "loss": 2.3813, "step": 368880 }, { "epoch": 0.64, "learning_rate": 1.7835008039286126e-05, "loss": 2.3615, "step": 368890 }, { "epoch": 0.64, "learning_rate": 1.78341360993593e-05, "loss": 2.4141, "step": 368900 }, { "epoch": 0.64, "learning_rate": 1.7833264159432474e-05, "loss": 2.3158, "step": 368910 }, { "epoch": 0.64, "learning_rate": 1.7832392219505644e-05, "loss": 2.4034, "step": 368920 }, { "epoch": 0.64, "learning_rate": 1.783152027957882e-05, "loss": 2.3277, "step": 368930 }, { "epoch": 0.64, "learning_rate": 1.7830648339651992e-05, "loss": 2.4612, "step": 368940 }, { "epoch": 0.64, "learning_rate": 1.7829776399725166e-05, "loss": 2.4041, "step": 368950 }, { "epoch": 0.64, "learning_rate": 1.7828904459798336e-05, "loss": 2.3308, "step": 368960 }, { "epoch": 0.64, "learning_rate": 1.7828032519871513e-05, "loss": 2.363, "step": 368970 }, { "epoch": 0.64, "learning_rate": 1.7827160579944684e-05, "loss": 2.3721, "step": 368980 }, { "epoch": 0.64, "learning_rate": 1.7826288640017857e-05, "loss": 2.3667, "step": 368990 }, { "epoch": 0.64, "learning_rate": 1.782541670009103e-05, "loss": 2.4719, "step": 369000 }, { "epoch": 0.64, "learning_rate": 1.7824544760164205e-05, "loss": 2.36, "step": 369010 }, { "epoch": 0.64, "learning_rate": 1.782367282023738e-05, "loss": 2.4146, "step": 369020 }, { "epoch": 0.64, "learning_rate": 1.782280088031055e-05, "loss": 2.3774, "step": 369030 }, { "epoch": 0.64, "learning_rate": 1.7821928940383726e-05, "loss": 2.4443, "step": 369040 }, { "epoch": 0.64, "learning_rate": 1.7821057000456897e-05, "loss": 2.326, "step": 369050 }, { "epoch": 0.64, "learning_rate": 1.782018506053007e-05, "loss": 2.2697, "step": 369060 }, { "epoch": 0.64, "learning_rate": 1.7819313120603244e-05, "loss": 2.4126, "step": 369070 }, { "epoch": 0.64, "learning_rate": 1.7818441180676418e-05, "loss": 2.2164, "step": 369080 }, { "epoch": 0.64, "learning_rate": 1.781756924074959e-05, "loss": 2.2859, "step": 369090 }, { "epoch": 0.64, "learning_rate": 1.7816697300822762e-05, "loss": 2.3145, "step": 369100 }, { "epoch": 0.64, "learning_rate": 1.7815825360895936e-05, "loss": 2.3207, "step": 369110 }, { "epoch": 0.64, "learning_rate": 1.781495342096911e-05, "loss": 2.4036, "step": 369120 }, { "epoch": 0.64, "learning_rate": 1.7814081481042283e-05, "loss": 2.3486, "step": 369130 }, { "epoch": 0.64, "learning_rate": 1.7813209541115454e-05, "loss": 2.2428, "step": 369140 }, { "epoch": 0.64, "learning_rate": 1.781233760118863e-05, "loss": 2.2797, "step": 369150 }, { "epoch": 0.64, "learning_rate": 1.7811465661261805e-05, "loss": 2.2507, "step": 369160 }, { "epoch": 0.64, "learning_rate": 1.7810593721334975e-05, "loss": 2.2805, "step": 369170 }, { "epoch": 0.64, "learning_rate": 1.780972178140815e-05, "loss": 2.2444, "step": 369180 }, { "epoch": 0.64, "learning_rate": 1.7808849841481323e-05, "loss": 2.1706, "step": 369190 }, { "epoch": 0.64, "learning_rate": 1.7807977901554496e-05, "loss": 2.2623, "step": 369200 }, { "epoch": 0.64, "learning_rate": 1.7807105961627667e-05, "loss": 2.1896, "step": 369210 }, { "epoch": 0.64, "learning_rate": 1.780623402170084e-05, "loss": 2.3336, "step": 369220 }, { "epoch": 0.64, "learning_rate": 1.7805362081774014e-05, "loss": 2.2889, "step": 369230 }, { "epoch": 0.64, "learning_rate": 1.7804490141847188e-05, "loss": 2.3541, "step": 369240 }, { "epoch": 0.64, "learning_rate": 1.7803618201920362e-05, "loss": 2.2982, "step": 369250 }, { "epoch": 0.64, "learning_rate": 1.7802746261993536e-05, "loss": 2.2622, "step": 369260 }, { "epoch": 0.64, "learning_rate": 1.780187432206671e-05, "loss": 2.2707, "step": 369270 }, { "epoch": 0.64, "learning_rate": 1.780100238213988e-05, "loss": 2.3084, "step": 369280 }, { "epoch": 0.64, "learning_rate": 1.7800130442213054e-05, "loss": 2.4211, "step": 369290 }, { "epoch": 0.64, "learning_rate": 1.7799258502286227e-05, "loss": 2.2738, "step": 369300 }, { "epoch": 0.64, "learning_rate": 1.77983865623594e-05, "loss": 2.385, "step": 369310 }, { "epoch": 0.64, "learning_rate": 1.7797514622432575e-05, "loss": 2.2564, "step": 369320 }, { "epoch": 0.64, "learning_rate": 1.7796642682505745e-05, "loss": 2.3884, "step": 369330 }, { "epoch": 0.64, "learning_rate": 1.7795770742578922e-05, "loss": 2.2844, "step": 369340 }, { "epoch": 0.64, "learning_rate": 1.7794898802652093e-05, "loss": 2.3888, "step": 369350 }, { "epoch": 0.64, "learning_rate": 1.7794026862725267e-05, "loss": 2.3435, "step": 369360 }, { "epoch": 0.64, "learning_rate": 1.7793154922798437e-05, "loss": 2.3638, "step": 369370 }, { "epoch": 0.64, "learning_rate": 1.7792282982871614e-05, "loss": 2.3414, "step": 369380 }, { "epoch": 0.64, "learning_rate": 1.7791411042944784e-05, "loss": 2.2875, "step": 369390 }, { "epoch": 0.64, "learning_rate": 1.7790539103017958e-05, "loss": 2.3827, "step": 369400 }, { "epoch": 0.64, "learning_rate": 1.7789667163091135e-05, "loss": 2.3168, "step": 369410 }, { "epoch": 0.64, "learning_rate": 1.7788795223164306e-05, "loss": 2.2211, "step": 369420 }, { "epoch": 0.64, "learning_rate": 1.778792328323748e-05, "loss": 2.3653, "step": 369430 }, { "epoch": 0.64, "learning_rate": 1.778705134331065e-05, "loss": 2.2435, "step": 369440 }, { "epoch": 0.64, "learning_rate": 1.7786179403383827e-05, "loss": 2.3074, "step": 369450 }, { "epoch": 0.64, "learning_rate": 1.7785307463456997e-05, "loss": 2.2124, "step": 369460 }, { "epoch": 0.64, "learning_rate": 1.778443552353017e-05, "loss": 2.2884, "step": 369470 }, { "epoch": 0.64, "learning_rate": 1.7783563583603345e-05, "loss": 2.347, "step": 369480 }, { "epoch": 0.64, "learning_rate": 1.778269164367652e-05, "loss": 2.2763, "step": 369490 }, { "epoch": 0.64, "learning_rate": 1.7781819703749693e-05, "loss": 2.3867, "step": 369500 }, { "epoch": 0.64, "learning_rate": 1.7780947763822863e-05, "loss": 2.3154, "step": 369510 }, { "epoch": 0.64, "learning_rate": 1.778007582389604e-05, "loss": 2.3286, "step": 369520 }, { "epoch": 0.64, "learning_rate": 1.777920388396921e-05, "loss": 2.2546, "step": 369530 }, { "epoch": 0.64, "learning_rate": 1.7778331944042384e-05, "loss": 2.2882, "step": 369540 }, { "epoch": 0.64, "learning_rate": 1.7777460004115558e-05, "loss": 2.3391, "step": 369550 }, { "epoch": 0.64, "learning_rate": 1.7776588064188732e-05, "loss": 2.2383, "step": 369560 }, { "epoch": 0.64, "learning_rate": 1.7775716124261906e-05, "loss": 2.3395, "step": 369570 }, { "epoch": 0.64, "learning_rate": 1.7774844184335076e-05, "loss": 2.2882, "step": 369580 }, { "epoch": 0.64, "learning_rate": 1.777397224440825e-05, "loss": 2.4327, "step": 369590 }, { "epoch": 0.64, "learning_rate": 1.7773100304481423e-05, "loss": 2.3689, "step": 369600 }, { "epoch": 0.64, "learning_rate": 1.7772228364554597e-05, "loss": 2.3834, "step": 369610 }, { "epoch": 0.64, "learning_rate": 1.7771356424627768e-05, "loss": 2.2051, "step": 369620 }, { "epoch": 0.64, "learning_rate": 1.777048448470094e-05, "loss": 2.2881, "step": 369630 }, { "epoch": 0.64, "learning_rate": 1.776961254477412e-05, "loss": 2.3591, "step": 369640 }, { "epoch": 0.64, "learning_rate": 1.776874060484729e-05, "loss": 2.3073, "step": 369650 }, { "epoch": 0.64, "learning_rate": 1.7767868664920463e-05, "loss": 2.2239, "step": 369660 }, { "epoch": 0.64, "learning_rate": 1.7766996724993636e-05, "loss": 2.2545, "step": 369670 }, { "epoch": 0.64, "learning_rate": 1.776612478506681e-05, "loss": 2.3264, "step": 369680 }, { "epoch": 0.64, "learning_rate": 1.776525284513998e-05, "loss": 2.3352, "step": 369690 }, { "epoch": 0.64, "learning_rate": 1.7764380905213154e-05, "loss": 2.2401, "step": 369700 }, { "epoch": 0.64, "learning_rate": 1.7763508965286328e-05, "loss": 2.2319, "step": 369710 }, { "epoch": 0.64, "learning_rate": 1.7762637025359502e-05, "loss": 2.2851, "step": 369720 }, { "epoch": 0.64, "learning_rate": 1.7761765085432676e-05, "loss": 2.2507, "step": 369730 }, { "epoch": 0.64, "learning_rate": 1.7760893145505846e-05, "loss": 2.3865, "step": 369740 }, { "epoch": 0.64, "learning_rate": 1.7760021205579023e-05, "loss": 2.2771, "step": 369750 }, { "epoch": 0.64, "learning_rate": 1.7759149265652194e-05, "loss": 2.3587, "step": 369760 }, { "epoch": 0.64, "learning_rate": 1.7758277325725367e-05, "loss": 2.2979, "step": 369770 }, { "epoch": 0.64, "learning_rate": 1.775740538579854e-05, "loss": 2.2304, "step": 369780 }, { "epoch": 0.64, "learning_rate": 1.7756533445871715e-05, "loss": 2.3358, "step": 369790 }, { "epoch": 0.64, "learning_rate": 1.775566150594489e-05, "loss": 2.2538, "step": 369800 }, { "epoch": 0.64, "learning_rate": 1.775478956601806e-05, "loss": 2.3843, "step": 369810 }, { "epoch": 0.64, "learning_rate": 1.7753917626091236e-05, "loss": 2.4124, "step": 369820 }, { "epoch": 0.64, "learning_rate": 1.7753045686164407e-05, "loss": 2.2591, "step": 369830 }, { "epoch": 0.64, "learning_rate": 1.775217374623758e-05, "loss": 2.4166, "step": 369840 }, { "epoch": 0.64, "learning_rate": 1.775130180631075e-05, "loss": 2.3105, "step": 369850 }, { "epoch": 0.64, "learning_rate": 1.7750429866383928e-05, "loss": 2.3787, "step": 369860 }, { "epoch": 0.65, "learning_rate": 1.7749557926457098e-05, "loss": 2.2947, "step": 369870 }, { "epoch": 0.65, "learning_rate": 1.7748685986530272e-05, "loss": 2.3224, "step": 369880 }, { "epoch": 0.65, "learning_rate": 1.7747814046603446e-05, "loss": 2.4279, "step": 369890 }, { "epoch": 0.65, "learning_rate": 1.774694210667662e-05, "loss": 2.329, "step": 369900 }, { "epoch": 0.65, "learning_rate": 1.7746070166749793e-05, "loss": 2.2247, "step": 369910 }, { "epoch": 0.65, "learning_rate": 1.7745198226822964e-05, "loss": 2.3777, "step": 369920 }, { "epoch": 0.65, "learning_rate": 1.774432628689614e-05, "loss": 2.3755, "step": 369930 }, { "epoch": 0.65, "learning_rate": 1.774345434696931e-05, "loss": 2.2608, "step": 369940 }, { "epoch": 0.65, "learning_rate": 1.7742582407042485e-05, "loss": 2.3021, "step": 369950 }, { "epoch": 0.65, "learning_rate": 1.774171046711566e-05, "loss": 2.2289, "step": 369960 }, { "epoch": 0.65, "learning_rate": 1.7740838527188833e-05, "loss": 2.2099, "step": 369970 }, { "epoch": 0.65, "learning_rate": 1.7739966587262006e-05, "loss": 2.26, "step": 369980 }, { "epoch": 0.65, "learning_rate": 1.7739094647335177e-05, "loss": 2.274, "step": 369990 }, { "epoch": 0.65, "learning_rate": 1.773822270740835e-05, "loss": 2.3244, "step": 370000 }, { "epoch": 0.65, "learning_rate": 1.7737350767481524e-05, "loss": 2.2632, "step": 370010 }, { "epoch": 0.65, "learning_rate": 1.7736478827554698e-05, "loss": 2.3939, "step": 370020 }, { "epoch": 0.65, "learning_rate": 1.7735606887627872e-05, "loss": 2.3382, "step": 370030 }, { "epoch": 0.65, "learning_rate": 1.7734734947701042e-05, "loss": 2.3621, "step": 370040 }, { "epoch": 0.65, "learning_rate": 1.773386300777422e-05, "loss": 2.2565, "step": 370050 }, { "epoch": 0.65, "learning_rate": 1.773299106784739e-05, "loss": 2.4254, "step": 370060 }, { "epoch": 0.65, "learning_rate": 1.7732119127920564e-05, "loss": 2.311, "step": 370070 }, { "epoch": 0.65, "learning_rate": 1.7731247187993737e-05, "loss": 2.2329, "step": 370080 }, { "epoch": 0.65, "learning_rate": 1.773037524806691e-05, "loss": 2.4797, "step": 370090 }, { "epoch": 0.65, "learning_rate": 1.772950330814008e-05, "loss": 2.3116, "step": 370100 }, { "epoch": 0.65, "learning_rate": 1.7728631368213255e-05, "loss": 2.3503, "step": 370110 }, { "epoch": 0.65, "learning_rate": 1.772775942828643e-05, "loss": 2.3393, "step": 370120 }, { "epoch": 0.65, "learning_rate": 1.7726887488359603e-05, "loss": 2.196, "step": 370130 }, { "epoch": 0.65, "learning_rate": 1.7726015548432777e-05, "loss": 2.2822, "step": 370140 }, { "epoch": 0.65, "learning_rate": 1.7725143608505947e-05, "loss": 2.4321, "step": 370150 }, { "epoch": 0.65, "learning_rate": 1.7724271668579124e-05, "loss": 2.3233, "step": 370160 }, { "epoch": 0.65, "learning_rate": 1.7723399728652294e-05, "loss": 2.2055, "step": 370170 }, { "epoch": 0.65, "learning_rate": 1.7722527788725468e-05, "loss": 2.2871, "step": 370180 }, { "epoch": 0.65, "learning_rate": 1.7721655848798642e-05, "loss": 2.4087, "step": 370190 }, { "epoch": 0.65, "learning_rate": 1.7720783908871816e-05, "loss": 2.3625, "step": 370200 }, { "epoch": 0.65, "learning_rate": 1.771991196894499e-05, "loss": 2.4035, "step": 370210 }, { "epoch": 0.65, "learning_rate": 1.771904002901816e-05, "loss": 2.2698, "step": 370220 }, { "epoch": 0.65, "learning_rate": 1.7718168089091337e-05, "loss": 2.388, "step": 370230 }, { "epoch": 0.65, "learning_rate": 1.7717296149164507e-05, "loss": 2.4066, "step": 370240 }, { "epoch": 0.65, "learning_rate": 1.771642420923768e-05, "loss": 2.2796, "step": 370250 }, { "epoch": 0.65, "learning_rate": 1.7715552269310855e-05, "loss": 2.3435, "step": 370260 }, { "epoch": 0.65, "learning_rate": 1.771468032938403e-05, "loss": 2.36, "step": 370270 }, { "epoch": 0.65, "learning_rate": 1.7713808389457203e-05, "loss": 2.3887, "step": 370280 }, { "epoch": 0.65, "learning_rate": 1.7712936449530373e-05, "loss": 2.2423, "step": 370290 }, { "epoch": 0.65, "learning_rate": 1.7712064509603547e-05, "loss": 2.3067, "step": 370300 }, { "epoch": 0.65, "learning_rate": 1.771119256967672e-05, "loss": 2.3575, "step": 370310 }, { "epoch": 0.65, "learning_rate": 1.7710320629749894e-05, "loss": 2.2633, "step": 370320 }, { "epoch": 0.65, "learning_rate": 1.7709448689823065e-05, "loss": 2.4374, "step": 370330 }, { "epoch": 0.65, "learning_rate": 1.7708576749896242e-05, "loss": 2.2198, "step": 370340 }, { "epoch": 0.65, "learning_rate": 1.7707704809969412e-05, "loss": 2.3312, "step": 370350 }, { "epoch": 0.65, "learning_rate": 1.7706832870042586e-05, "loss": 2.2861, "step": 370360 }, { "epoch": 0.65, "learning_rate": 1.770596093011576e-05, "loss": 2.3456, "step": 370370 }, { "epoch": 0.65, "learning_rate": 1.7705088990188933e-05, "loss": 2.2607, "step": 370380 }, { "epoch": 0.65, "learning_rate": 1.7704217050262107e-05, "loss": 2.2255, "step": 370390 }, { "epoch": 0.65, "learning_rate": 1.7703345110335278e-05, "loss": 2.4565, "step": 370400 }, { "epoch": 0.65, "learning_rate": 1.770247317040845e-05, "loss": 2.4806, "step": 370410 }, { "epoch": 0.65, "learning_rate": 1.7701601230481625e-05, "loss": 2.3009, "step": 370420 }, { "epoch": 0.65, "learning_rate": 1.77007292905548e-05, "loss": 2.2122, "step": 370430 }, { "epoch": 0.65, "learning_rate": 1.7699857350627973e-05, "loss": 2.4172, "step": 370440 }, { "epoch": 0.65, "learning_rate": 1.7698985410701143e-05, "loss": 2.2513, "step": 370450 }, { "epoch": 0.65, "learning_rate": 1.769811347077432e-05, "loss": 2.3113, "step": 370460 }, { "epoch": 0.65, "learning_rate": 1.769724153084749e-05, "loss": 2.3123, "step": 370470 }, { "epoch": 0.65, "learning_rate": 1.7696369590920664e-05, "loss": 2.3212, "step": 370480 }, { "epoch": 0.65, "learning_rate": 1.7695497650993838e-05, "loss": 2.2689, "step": 370490 }, { "epoch": 0.65, "learning_rate": 1.7694625711067012e-05, "loss": 2.2172, "step": 370500 }, { "epoch": 0.65, "learning_rate": 1.7693753771140186e-05, "loss": 2.2679, "step": 370510 }, { "epoch": 0.65, "learning_rate": 1.7692881831213356e-05, "loss": 2.3171, "step": 370520 }, { "epoch": 0.65, "learning_rate": 1.7692009891286533e-05, "loss": 2.2862, "step": 370530 }, { "epoch": 0.65, "learning_rate": 1.7691137951359704e-05, "loss": 2.4039, "step": 370540 }, { "epoch": 0.65, "learning_rate": 1.7690266011432877e-05, "loss": 2.2765, "step": 370550 }, { "epoch": 0.65, "learning_rate": 1.7689394071506048e-05, "loss": 2.3129, "step": 370560 }, { "epoch": 0.65, "learning_rate": 1.7688522131579225e-05, "loss": 2.4061, "step": 370570 }, { "epoch": 0.65, "learning_rate": 1.7687650191652395e-05, "loss": 2.1991, "step": 370580 }, { "epoch": 0.65, "learning_rate": 1.768677825172557e-05, "loss": 2.2112, "step": 370590 }, { "epoch": 0.65, "learning_rate": 1.7685906311798743e-05, "loss": 2.3288, "step": 370600 }, { "epoch": 0.65, "learning_rate": 1.7685034371871917e-05, "loss": 2.3209, "step": 370610 }, { "epoch": 0.65, "learning_rate": 1.768416243194509e-05, "loss": 2.3014, "step": 370620 }, { "epoch": 0.65, "learning_rate": 1.768329049201826e-05, "loss": 2.3462, "step": 370630 }, { "epoch": 0.65, "learning_rate": 1.7682418552091438e-05, "loss": 2.3546, "step": 370640 }, { "epoch": 0.65, "learning_rate": 1.7681546612164608e-05, "loss": 2.3164, "step": 370650 }, { "epoch": 0.65, "learning_rate": 1.7680674672237782e-05, "loss": 2.267, "step": 370660 }, { "epoch": 0.65, "learning_rate": 1.7679802732310956e-05, "loss": 2.3593, "step": 370670 }, { "epoch": 0.65, "learning_rate": 1.767893079238413e-05, "loss": 2.2887, "step": 370680 }, { "epoch": 0.65, "learning_rate": 1.7678058852457303e-05, "loss": 2.2009, "step": 370690 }, { "epoch": 0.65, "learning_rate": 1.7677186912530474e-05, "loss": 2.2936, "step": 370700 }, { "epoch": 0.65, "learning_rate": 1.7676314972603648e-05, "loss": 2.3846, "step": 370710 }, { "epoch": 0.65, "learning_rate": 1.767544303267682e-05, "loss": 2.3564, "step": 370720 }, { "epoch": 0.65, "learning_rate": 1.7674571092749995e-05, "loss": 2.3787, "step": 370730 }, { "epoch": 0.65, "learning_rate": 1.7673699152823165e-05, "loss": 2.2604, "step": 370740 }, { "epoch": 0.65, "learning_rate": 1.7672827212896343e-05, "loss": 2.2662, "step": 370750 }, { "epoch": 0.65, "learning_rate": 1.7671955272969516e-05, "loss": 2.3025, "step": 370760 }, { "epoch": 0.65, "learning_rate": 1.7671083333042687e-05, "loss": 2.1967, "step": 370770 }, { "epoch": 0.65, "learning_rate": 1.767021139311586e-05, "loss": 2.3038, "step": 370780 }, { "epoch": 0.65, "learning_rate": 1.7669339453189034e-05, "loss": 2.3484, "step": 370790 }, { "epoch": 0.65, "learning_rate": 1.7668467513262208e-05, "loss": 2.3774, "step": 370800 }, { "epoch": 0.65, "learning_rate": 1.766759557333538e-05, "loss": 2.2763, "step": 370810 }, { "epoch": 0.65, "learning_rate": 1.7666723633408552e-05, "loss": 2.2612, "step": 370820 }, { "epoch": 0.65, "learning_rate": 1.7665851693481726e-05, "loss": 2.3135, "step": 370830 }, { "epoch": 0.65, "learning_rate": 1.76649797535549e-05, "loss": 2.374, "step": 370840 }, { "epoch": 0.65, "learning_rate": 1.7664107813628074e-05, "loss": 2.3194, "step": 370850 }, { "epoch": 0.65, "learning_rate": 1.7663235873701247e-05, "loss": 2.3507, "step": 370860 }, { "epoch": 0.65, "learning_rate": 1.766236393377442e-05, "loss": 2.3134, "step": 370870 }, { "epoch": 0.65, "learning_rate": 1.766149199384759e-05, "loss": 2.3215, "step": 370880 }, { "epoch": 0.65, "learning_rate": 1.7660620053920765e-05, "loss": 2.3635, "step": 370890 }, { "epoch": 0.65, "learning_rate": 1.765974811399394e-05, "loss": 2.242, "step": 370900 }, { "epoch": 0.65, "learning_rate": 1.7658876174067113e-05, "loss": 2.3449, "step": 370910 }, { "epoch": 0.65, "learning_rate": 1.7658004234140287e-05, "loss": 2.3786, "step": 370920 }, { "epoch": 0.65, "learning_rate": 1.7657132294213457e-05, "loss": 2.278, "step": 370930 }, { "epoch": 0.65, "learning_rate": 1.7656260354286634e-05, "loss": 2.3438, "step": 370940 }, { "epoch": 0.65, "learning_rate": 1.7655388414359804e-05, "loss": 2.3442, "step": 370950 }, { "epoch": 0.65, "learning_rate": 1.7654516474432978e-05, "loss": 2.3106, "step": 370960 }, { "epoch": 0.65, "learning_rate": 1.765364453450615e-05, "loss": 2.325, "step": 370970 }, { "epoch": 0.65, "learning_rate": 1.7652772594579326e-05, "loss": 2.3443, "step": 370980 }, { "epoch": 0.65, "learning_rate": 1.76519006546525e-05, "loss": 2.1722, "step": 370990 }, { "epoch": 0.65, "learning_rate": 1.765102871472567e-05, "loss": 2.2283, "step": 371000 }, { "epoch": 0.65, "learning_rate": 1.7650156774798847e-05, "loss": 2.431, "step": 371010 }, { "epoch": 0.65, "learning_rate": 1.7649284834872017e-05, "loss": 2.4093, "step": 371020 }, { "epoch": 0.65, "learning_rate": 1.764841289494519e-05, "loss": 2.3049, "step": 371030 }, { "epoch": 0.65, "learning_rate": 1.764754095501836e-05, "loss": 2.3776, "step": 371040 }, { "epoch": 0.65, "learning_rate": 1.764666901509154e-05, "loss": 2.3385, "step": 371050 }, { "epoch": 0.65, "learning_rate": 1.764579707516471e-05, "loss": 2.3941, "step": 371060 }, { "epoch": 0.65, "learning_rate": 1.7644925135237883e-05, "loss": 2.2083, "step": 371070 }, { "epoch": 0.65, "learning_rate": 1.7644053195311057e-05, "loss": 2.3242, "step": 371080 }, { "epoch": 0.65, "learning_rate": 1.764318125538423e-05, "loss": 2.297, "step": 371090 }, { "epoch": 0.65, "learning_rate": 1.7642309315457404e-05, "loss": 2.3655, "step": 371100 }, { "epoch": 0.65, "learning_rate": 1.7641437375530575e-05, "loss": 2.1917, "step": 371110 }, { "epoch": 0.65, "learning_rate": 1.7640565435603752e-05, "loss": 2.2931, "step": 371120 }, { "epoch": 0.65, "learning_rate": 1.7639693495676922e-05, "loss": 2.3209, "step": 371130 }, { "epoch": 0.65, "learning_rate": 1.7638821555750096e-05, "loss": 2.2303, "step": 371140 }, { "epoch": 0.65, "learning_rate": 1.763794961582327e-05, "loss": 2.2936, "step": 371150 }, { "epoch": 0.65, "learning_rate": 1.7637077675896443e-05, "loss": 2.327, "step": 371160 }, { "epoch": 0.65, "learning_rate": 1.7636205735969617e-05, "loss": 2.2869, "step": 371170 }, { "epoch": 0.65, "learning_rate": 1.7635333796042788e-05, "loss": 2.3378, "step": 371180 }, { "epoch": 0.65, "learning_rate": 1.763446185611596e-05, "loss": 2.4664, "step": 371190 }, { "epoch": 0.65, "learning_rate": 1.7633589916189135e-05, "loss": 2.327, "step": 371200 }, { "epoch": 0.65, "learning_rate": 1.763271797626231e-05, "loss": 2.2822, "step": 371210 }, { "epoch": 0.65, "learning_rate": 1.763184603633548e-05, "loss": 2.2801, "step": 371220 }, { "epoch": 0.65, "learning_rate": 1.7630974096408653e-05, "loss": 2.261, "step": 371230 }, { "epoch": 0.65, "learning_rate": 1.763010215648183e-05, "loss": 2.2964, "step": 371240 }, { "epoch": 0.65, "learning_rate": 1.7629230216555e-05, "loss": 2.2874, "step": 371250 }, { "epoch": 0.65, "learning_rate": 1.7628358276628174e-05, "loss": 2.2124, "step": 371260 }, { "epoch": 0.65, "learning_rate": 1.7627486336701348e-05, "loss": 2.3527, "step": 371270 }, { "epoch": 0.65, "learning_rate": 1.7626614396774522e-05, "loss": 2.5046, "step": 371280 }, { "epoch": 0.65, "learning_rate": 1.7625742456847692e-05, "loss": 2.3006, "step": 371290 }, { "epoch": 0.65, "learning_rate": 1.7624870516920866e-05, "loss": 2.303, "step": 371300 }, { "epoch": 0.65, "learning_rate": 1.762399857699404e-05, "loss": 2.2374, "step": 371310 }, { "epoch": 0.65, "learning_rate": 1.7623126637067214e-05, "loss": 2.3162, "step": 371320 }, { "epoch": 0.65, "learning_rate": 1.7622254697140387e-05, "loss": 2.3567, "step": 371330 }, { "epoch": 0.65, "learning_rate": 1.7621382757213558e-05, "loss": 2.3249, "step": 371340 }, { "epoch": 0.65, "learning_rate": 1.7620510817286735e-05, "loss": 2.3162, "step": 371350 }, { "epoch": 0.65, "learning_rate": 1.7619638877359905e-05, "loss": 2.3289, "step": 371360 }, { "epoch": 0.65, "learning_rate": 1.761876693743308e-05, "loss": 2.3284, "step": 371370 }, { "epoch": 0.65, "learning_rate": 1.7617894997506253e-05, "loss": 2.2324, "step": 371380 }, { "epoch": 0.65, "learning_rate": 1.7617023057579427e-05, "loss": 2.2335, "step": 371390 }, { "epoch": 0.65, "learning_rate": 1.76161511176526e-05, "loss": 2.2398, "step": 371400 }, { "epoch": 0.65, "learning_rate": 1.761527917772577e-05, "loss": 2.3343, "step": 371410 }, { "epoch": 0.65, "learning_rate": 1.7614407237798948e-05, "loss": 2.2295, "step": 371420 }, { "epoch": 0.65, "learning_rate": 1.7613535297872118e-05, "loss": 2.3623, "step": 371430 }, { "epoch": 0.65, "learning_rate": 1.7612663357945292e-05, "loss": 2.305, "step": 371440 }, { "epoch": 0.65, "learning_rate": 1.7611791418018462e-05, "loss": 2.4074, "step": 371450 }, { "epoch": 0.65, "learning_rate": 1.761091947809164e-05, "loss": 2.2019, "step": 371460 }, { "epoch": 0.65, "learning_rate": 1.7610047538164813e-05, "loss": 2.3942, "step": 371470 }, { "epoch": 0.65, "learning_rate": 1.7609175598237984e-05, "loss": 2.3559, "step": 371480 }, { "epoch": 0.65, "learning_rate": 1.7608303658311158e-05, "loss": 2.3557, "step": 371490 }, { "epoch": 0.65, "learning_rate": 1.760743171838433e-05, "loss": 2.4407, "step": 371500 }, { "epoch": 0.65, "learning_rate": 1.7606559778457505e-05, "loss": 2.315, "step": 371510 }, { "epoch": 0.65, "learning_rate": 1.7605687838530675e-05, "loss": 2.3227, "step": 371520 }, { "epoch": 0.65, "learning_rate": 1.7604815898603853e-05, "loss": 2.3339, "step": 371530 }, { "epoch": 0.65, "learning_rate": 1.7603943958677023e-05, "loss": 2.2679, "step": 371540 }, { "epoch": 0.65, "learning_rate": 1.7603072018750197e-05, "loss": 2.2643, "step": 371550 }, { "epoch": 0.65, "learning_rate": 1.760220007882337e-05, "loss": 2.298, "step": 371560 }, { "epoch": 0.65, "learning_rate": 1.7601328138896544e-05, "loss": 2.2919, "step": 371570 }, { "epoch": 0.65, "learning_rate": 1.7600456198969718e-05, "loss": 2.2973, "step": 371580 }, { "epoch": 0.65, "learning_rate": 1.759958425904289e-05, "loss": 2.2101, "step": 371590 }, { "epoch": 0.65, "learning_rate": 1.7598712319116062e-05, "loss": 2.4638, "step": 371600 }, { "epoch": 0.65, "learning_rate": 1.7597840379189236e-05, "loss": 2.3596, "step": 371610 }, { "epoch": 0.65, "learning_rate": 1.759696843926241e-05, "loss": 2.2795, "step": 371620 }, { "epoch": 0.65, "learning_rate": 1.7596096499335584e-05, "loss": 2.3502, "step": 371630 }, { "epoch": 0.65, "learning_rate": 1.7595224559408754e-05, "loss": 2.3543, "step": 371640 }, { "epoch": 0.65, "learning_rate": 1.759435261948193e-05, "loss": 2.3654, "step": 371650 }, { "epoch": 0.65, "learning_rate": 1.75934806795551e-05, "loss": 2.3328, "step": 371660 }, { "epoch": 0.65, "learning_rate": 1.7592608739628275e-05, "loss": 2.2413, "step": 371670 }, { "epoch": 0.65, "learning_rate": 1.759173679970145e-05, "loss": 2.44, "step": 371680 }, { "epoch": 0.65, "learning_rate": 1.7590864859774623e-05, "loss": 2.302, "step": 371690 }, { "epoch": 0.65, "learning_rate": 1.7589992919847793e-05, "loss": 2.2912, "step": 371700 }, { "epoch": 0.65, "learning_rate": 1.7589120979920967e-05, "loss": 2.22, "step": 371710 }, { "epoch": 0.65, "learning_rate": 1.7588249039994144e-05, "loss": 2.3259, "step": 371720 }, { "epoch": 0.65, "learning_rate": 1.7587377100067314e-05, "loss": 2.3416, "step": 371730 }, { "epoch": 0.65, "learning_rate": 1.7586505160140488e-05, "loss": 2.3268, "step": 371740 }, { "epoch": 0.65, "learning_rate": 1.758563322021366e-05, "loss": 2.1969, "step": 371750 }, { "epoch": 0.65, "learning_rate": 1.7584761280286836e-05, "loss": 2.3818, "step": 371760 }, { "epoch": 0.65, "learning_rate": 1.7583889340360006e-05, "loss": 2.3673, "step": 371770 }, { "epoch": 0.65, "learning_rate": 1.758301740043318e-05, "loss": 2.3631, "step": 371780 }, { "epoch": 0.65, "learning_rate": 1.7582145460506354e-05, "loss": 2.1989, "step": 371790 }, { "epoch": 0.65, "learning_rate": 1.7581273520579527e-05, "loss": 2.4348, "step": 371800 }, { "epoch": 0.65, "learning_rate": 1.75804015806527e-05, "loss": 2.3426, "step": 371810 }, { "epoch": 0.65, "learning_rate": 1.757952964072587e-05, "loss": 2.3844, "step": 371820 }, { "epoch": 0.65, "learning_rate": 1.757865770079905e-05, "loss": 2.4072, "step": 371830 }, { "epoch": 0.65, "learning_rate": 1.757778576087222e-05, "loss": 2.2462, "step": 371840 }, { "epoch": 0.65, "learning_rate": 1.7576913820945393e-05, "loss": 2.3043, "step": 371850 }, { "epoch": 0.65, "learning_rate": 1.7576041881018567e-05, "loss": 2.3309, "step": 371860 }, { "epoch": 0.65, "learning_rate": 1.757516994109174e-05, "loss": 2.302, "step": 371870 }, { "epoch": 0.65, "learning_rate": 1.7574298001164914e-05, "loss": 2.2999, "step": 371880 }, { "epoch": 0.65, "learning_rate": 1.7573426061238085e-05, "loss": 2.1417, "step": 371890 }, { "epoch": 0.65, "learning_rate": 1.757255412131126e-05, "loss": 2.3544, "step": 371900 }, { "epoch": 0.65, "learning_rate": 1.7571682181384432e-05, "loss": 2.366, "step": 371910 }, { "epoch": 0.65, "learning_rate": 1.7570810241457606e-05, "loss": 2.2548, "step": 371920 }, { "epoch": 0.65, "learning_rate": 1.7569938301530776e-05, "loss": 2.3589, "step": 371930 }, { "epoch": 0.65, "learning_rate": 1.7569066361603953e-05, "loss": 2.341, "step": 371940 }, { "epoch": 0.65, "learning_rate": 1.7568194421677124e-05, "loss": 2.2189, "step": 371950 }, { "epoch": 0.65, "learning_rate": 1.7567322481750298e-05, "loss": 2.2896, "step": 371960 }, { "epoch": 0.65, "learning_rate": 1.756645054182347e-05, "loss": 2.2614, "step": 371970 }, { "epoch": 0.65, "learning_rate": 1.7565578601896645e-05, "loss": 2.3149, "step": 371980 }, { "epoch": 0.65, "learning_rate": 1.756470666196982e-05, "loss": 2.3862, "step": 371990 }, { "epoch": 0.65, "learning_rate": 1.756383472204299e-05, "loss": 2.4479, "step": 372000 }, { "epoch": 0.65, "learning_rate": 1.7562962782116163e-05, "loss": 2.4254, "step": 372010 }, { "epoch": 0.65, "learning_rate": 1.7562090842189337e-05, "loss": 2.3855, "step": 372020 }, { "epoch": 0.65, "learning_rate": 1.756121890226251e-05, "loss": 2.2567, "step": 372030 }, { "epoch": 0.65, "learning_rate": 1.7560346962335684e-05, "loss": 2.3238, "step": 372040 }, { "epoch": 0.65, "learning_rate": 1.7559475022408858e-05, "loss": 2.3768, "step": 372050 }, { "epoch": 0.65, "learning_rate": 1.7558603082482032e-05, "loss": 2.3478, "step": 372060 }, { "epoch": 0.65, "learning_rate": 1.7557731142555202e-05, "loss": 2.2849, "step": 372070 }, { "epoch": 0.65, "learning_rate": 1.7556859202628376e-05, "loss": 2.2397, "step": 372080 }, { "epoch": 0.65, "learning_rate": 1.755598726270155e-05, "loss": 2.3863, "step": 372090 }, { "epoch": 0.65, "learning_rate": 1.7555115322774724e-05, "loss": 2.3784, "step": 372100 }, { "epoch": 0.65, "learning_rate": 1.7554243382847897e-05, "loss": 2.3065, "step": 372110 }, { "epoch": 0.65, "learning_rate": 1.7553371442921068e-05, "loss": 2.2135, "step": 372120 }, { "epoch": 0.65, "learning_rate": 1.7552499502994245e-05, "loss": 2.3052, "step": 372130 }, { "epoch": 0.65, "learning_rate": 1.7551627563067415e-05, "loss": 2.3721, "step": 372140 }, { "epoch": 0.65, "learning_rate": 1.755075562314059e-05, "loss": 2.2691, "step": 372150 }, { "epoch": 0.65, "learning_rate": 1.754988368321376e-05, "loss": 2.3498, "step": 372160 }, { "epoch": 0.65, "learning_rate": 1.7549011743286937e-05, "loss": 2.3579, "step": 372170 }, { "epoch": 0.65, "learning_rate": 1.7548139803360107e-05, "loss": 2.2975, "step": 372180 }, { "epoch": 0.65, "learning_rate": 1.754726786343328e-05, "loss": 2.3789, "step": 372190 }, { "epoch": 0.65, "learning_rate": 1.7546395923506458e-05, "loss": 2.4001, "step": 372200 }, { "epoch": 0.65, "learning_rate": 1.7545523983579628e-05, "loss": 2.3051, "step": 372210 }, { "epoch": 0.65, "learning_rate": 1.7544652043652802e-05, "loss": 2.3472, "step": 372220 }, { "epoch": 0.65, "learning_rate": 1.7543780103725972e-05, "loss": 2.2406, "step": 372230 }, { "epoch": 0.65, "learning_rate": 1.754290816379915e-05, "loss": 2.2747, "step": 372240 }, { "epoch": 0.65, "learning_rate": 1.754203622387232e-05, "loss": 2.4564, "step": 372250 }, { "epoch": 0.65, "learning_rate": 1.7541164283945494e-05, "loss": 2.2556, "step": 372260 }, { "epoch": 0.65, "learning_rate": 1.7540292344018668e-05, "loss": 2.2518, "step": 372270 }, { "epoch": 0.65, "learning_rate": 1.753942040409184e-05, "loss": 2.316, "step": 372280 }, { "epoch": 0.65, "learning_rate": 1.7538548464165015e-05, "loss": 2.3016, "step": 372290 }, { "epoch": 0.65, "learning_rate": 1.7537676524238185e-05, "loss": 2.2717, "step": 372300 }, { "epoch": 0.65, "learning_rate": 1.753680458431136e-05, "loss": 2.3264, "step": 372310 }, { "epoch": 0.65, "learning_rate": 1.7535932644384533e-05, "loss": 2.3851, "step": 372320 }, { "epoch": 0.65, "learning_rate": 1.7535060704457707e-05, "loss": 2.2758, "step": 372330 }, { "epoch": 0.65, "learning_rate": 1.753418876453088e-05, "loss": 2.3088, "step": 372340 }, { "epoch": 0.65, "learning_rate": 1.7533316824604054e-05, "loss": 2.2786, "step": 372350 }, { "epoch": 0.65, "learning_rate": 1.7532444884677228e-05, "loss": 2.2592, "step": 372360 }, { "epoch": 0.65, "learning_rate": 1.75315729447504e-05, "loss": 2.307, "step": 372370 }, { "epoch": 0.65, "learning_rate": 1.7530701004823572e-05, "loss": 2.2841, "step": 372380 }, { "epoch": 0.65, "learning_rate": 1.7529829064896746e-05, "loss": 2.3202, "step": 372390 }, { "epoch": 0.65, "learning_rate": 1.752895712496992e-05, "loss": 2.3118, "step": 372400 }, { "epoch": 0.65, "learning_rate": 1.752808518504309e-05, "loss": 2.4117, "step": 372410 }, { "epoch": 0.65, "learning_rate": 1.7527213245116264e-05, "loss": 2.2676, "step": 372420 }, { "epoch": 0.65, "learning_rate": 1.7526341305189438e-05, "loss": 2.3092, "step": 372430 }, { "epoch": 0.65, "learning_rate": 1.752546936526261e-05, "loss": 2.206, "step": 372440 }, { "epoch": 0.65, "learning_rate": 1.7524597425335785e-05, "loss": 2.3917, "step": 372450 }, { "epoch": 0.65, "learning_rate": 1.752372548540896e-05, "loss": 2.337, "step": 372460 }, { "epoch": 0.65, "learning_rate": 1.7522853545482133e-05, "loss": 2.2318, "step": 372470 }, { "epoch": 0.65, "learning_rate": 1.7521981605555303e-05, "loss": 2.2777, "step": 372480 }, { "epoch": 0.65, "learning_rate": 1.7521109665628477e-05, "loss": 2.416, "step": 372490 }, { "epoch": 0.65, "learning_rate": 1.752023772570165e-05, "loss": 2.2748, "step": 372500 }, { "epoch": 0.65, "learning_rate": 1.7519365785774824e-05, "loss": 2.2223, "step": 372510 }, { "epoch": 0.65, "learning_rate": 1.7518493845847998e-05, "loss": 2.3051, "step": 372520 }, { "epoch": 0.65, "learning_rate": 1.751762190592117e-05, "loss": 2.3469, "step": 372530 }, { "epoch": 0.65, "learning_rate": 1.7516749965994346e-05, "loss": 2.2605, "step": 372540 }, { "epoch": 0.65, "learning_rate": 1.7515878026067516e-05, "loss": 2.2371, "step": 372550 }, { "epoch": 0.65, "learning_rate": 1.751500608614069e-05, "loss": 2.2077, "step": 372560 }, { "epoch": 0.65, "learning_rate": 1.751413414621386e-05, "loss": 2.2909, "step": 372570 }, { "epoch": 0.65, "learning_rate": 1.7513262206287037e-05, "loss": 2.3106, "step": 372580 }, { "epoch": 0.65, "learning_rate": 1.751239026636021e-05, "loss": 2.2767, "step": 372590 }, { "epoch": 0.65, "learning_rate": 1.751151832643338e-05, "loss": 2.3592, "step": 372600 }, { "epoch": 0.65, "learning_rate": 1.751064638650656e-05, "loss": 2.267, "step": 372610 }, { "epoch": 0.65, "learning_rate": 1.750977444657973e-05, "loss": 2.4342, "step": 372620 }, { "epoch": 0.65, "learning_rate": 1.7508902506652903e-05, "loss": 2.3065, "step": 372630 }, { "epoch": 0.65, "learning_rate": 1.7508030566726073e-05, "loss": 2.3863, "step": 372640 }, { "epoch": 0.65, "learning_rate": 1.750715862679925e-05, "loss": 2.333, "step": 372650 }, { "epoch": 0.65, "learning_rate": 1.750628668687242e-05, "loss": 2.2243, "step": 372660 }, { "epoch": 0.65, "learning_rate": 1.7505414746945595e-05, "loss": 2.2993, "step": 372670 }, { "epoch": 0.65, "learning_rate": 1.750454280701877e-05, "loss": 2.2689, "step": 372680 }, { "epoch": 0.65, "learning_rate": 1.7503670867091942e-05, "loss": 2.2965, "step": 372690 }, { "epoch": 0.65, "learning_rate": 1.7502798927165116e-05, "loss": 2.3676, "step": 372700 }, { "epoch": 0.65, "learning_rate": 1.7501926987238286e-05, "loss": 2.3242, "step": 372710 }, { "epoch": 0.65, "learning_rate": 1.7501055047311463e-05, "loss": 2.3336, "step": 372720 }, { "epoch": 0.65, "learning_rate": 1.7500183107384634e-05, "loss": 2.2547, "step": 372730 }, { "epoch": 0.65, "learning_rate": 1.7499311167457808e-05, "loss": 2.3349, "step": 372740 }, { "epoch": 0.65, "learning_rate": 1.749843922753098e-05, "loss": 2.3466, "step": 372750 }, { "epoch": 0.65, "learning_rate": 1.7497567287604155e-05, "loss": 2.3472, "step": 372760 }, { "epoch": 0.65, "learning_rate": 1.749669534767733e-05, "loss": 2.2814, "step": 372770 }, { "epoch": 0.65, "learning_rate": 1.74958234077505e-05, "loss": 2.1919, "step": 372780 }, { "epoch": 0.65, "learning_rate": 1.7494951467823673e-05, "loss": 2.2973, "step": 372790 }, { "epoch": 0.65, "learning_rate": 1.7494079527896847e-05, "loss": 2.2995, "step": 372800 }, { "epoch": 0.65, "learning_rate": 1.749320758797002e-05, "loss": 2.4064, "step": 372810 }, { "epoch": 0.65, "learning_rate": 1.7492335648043194e-05, "loss": 2.3066, "step": 372820 }, { "epoch": 0.65, "learning_rate": 1.7491463708116365e-05, "loss": 2.2554, "step": 372830 }, { "epoch": 0.65, "learning_rate": 1.7490591768189542e-05, "loss": 2.2835, "step": 372840 }, { "epoch": 0.65, "learning_rate": 1.7489719828262712e-05, "loss": 2.2159, "step": 372850 }, { "epoch": 0.65, "learning_rate": 1.7488847888335886e-05, "loss": 2.2778, "step": 372860 }, { "epoch": 0.65, "learning_rate": 1.748797594840906e-05, "loss": 2.3493, "step": 372870 }, { "epoch": 0.65, "learning_rate": 1.7487104008482234e-05, "loss": 2.3558, "step": 372880 }, { "epoch": 0.65, "learning_rate": 1.7486232068555404e-05, "loss": 2.3521, "step": 372890 }, { "epoch": 0.65, "learning_rate": 1.7485360128628578e-05, "loss": 2.4681, "step": 372900 }, { "epoch": 0.65, "learning_rate": 1.748448818870175e-05, "loss": 2.3534, "step": 372910 }, { "epoch": 0.65, "learning_rate": 1.7483616248774925e-05, "loss": 2.2469, "step": 372920 }, { "epoch": 0.65, "learning_rate": 1.74827443088481e-05, "loss": 2.3529, "step": 372930 }, { "epoch": 0.65, "learning_rate": 1.748187236892127e-05, "loss": 2.4499, "step": 372940 }, { "epoch": 0.65, "learning_rate": 1.7481000428994447e-05, "loss": 2.2027, "step": 372950 }, { "epoch": 0.65, "learning_rate": 1.7480128489067617e-05, "loss": 2.3176, "step": 372960 }, { "epoch": 0.65, "learning_rate": 1.747925654914079e-05, "loss": 2.3257, "step": 372970 }, { "epoch": 0.65, "learning_rate": 1.7478384609213965e-05, "loss": 2.3154, "step": 372980 }, { "epoch": 0.65, "learning_rate": 1.7477512669287138e-05, "loss": 2.3043, "step": 372990 }, { "epoch": 0.65, "learning_rate": 1.7476640729360312e-05, "loss": 2.2656, "step": 373000 }, { "epoch": 0.65, "learning_rate": 1.7475768789433482e-05, "loss": 2.2873, "step": 373010 }, { "epoch": 0.65, "learning_rate": 1.747489684950666e-05, "loss": 2.3961, "step": 373020 }, { "epoch": 0.65, "learning_rate": 1.747402490957983e-05, "loss": 2.3715, "step": 373030 }, { "epoch": 0.65, "learning_rate": 1.7473152969653004e-05, "loss": 2.3923, "step": 373040 }, { "epoch": 0.65, "learning_rate": 1.7472281029726174e-05, "loss": 2.2976, "step": 373050 }, { "epoch": 0.65, "learning_rate": 1.747140908979935e-05, "loss": 2.2999, "step": 373060 }, { "epoch": 0.65, "learning_rate": 1.7470537149872525e-05, "loss": 2.3421, "step": 373070 }, { "epoch": 0.65, "learning_rate": 1.7469665209945695e-05, "loss": 2.315, "step": 373080 }, { "epoch": 0.65, "learning_rate": 1.746879327001887e-05, "loss": 2.2424, "step": 373090 }, { "epoch": 0.65, "learning_rate": 1.7467921330092043e-05, "loss": 2.4253, "step": 373100 }, { "epoch": 0.65, "learning_rate": 1.7467049390165217e-05, "loss": 2.2811, "step": 373110 }, { "epoch": 0.65, "learning_rate": 1.7466177450238387e-05, "loss": 2.3278, "step": 373120 }, { "epoch": 0.65, "learning_rate": 1.7465305510311564e-05, "loss": 2.4897, "step": 373130 }, { "epoch": 0.65, "learning_rate": 1.7464433570384735e-05, "loss": 2.3432, "step": 373140 }, { "epoch": 0.65, "learning_rate": 1.746356163045791e-05, "loss": 2.1801, "step": 373150 }, { "epoch": 0.65, "learning_rate": 1.7462689690531082e-05, "loss": 2.3321, "step": 373160 }, { "epoch": 0.65, "learning_rate": 1.7461817750604256e-05, "loss": 2.2781, "step": 373170 }, { "epoch": 0.65, "learning_rate": 1.746094581067743e-05, "loss": 2.3275, "step": 373180 }, { "epoch": 0.65, "learning_rate": 1.74600738707506e-05, "loss": 2.3598, "step": 373190 }, { "epoch": 0.65, "learning_rate": 1.7459201930823774e-05, "loss": 2.3743, "step": 373200 }, { "epoch": 0.65, "learning_rate": 1.7458329990896948e-05, "loss": 2.3779, "step": 373210 }, { "epoch": 0.65, "learning_rate": 1.745745805097012e-05, "loss": 2.3379, "step": 373220 }, { "epoch": 0.65, "learning_rate": 1.7456586111043295e-05, "loss": 2.3007, "step": 373230 }, { "epoch": 0.65, "learning_rate": 1.7455714171116466e-05, "loss": 2.3621, "step": 373240 }, { "epoch": 0.65, "learning_rate": 1.7454842231189643e-05, "loss": 2.3149, "step": 373250 }, { "epoch": 0.65, "learning_rate": 1.7453970291262813e-05, "loss": 2.318, "step": 373260 }, { "epoch": 0.65, "learning_rate": 1.7453098351335987e-05, "loss": 2.3639, "step": 373270 }, { "epoch": 0.65, "learning_rate": 1.745222641140916e-05, "loss": 2.2292, "step": 373280 }, { "epoch": 0.65, "learning_rate": 1.7451354471482334e-05, "loss": 2.3201, "step": 373290 }, { "epoch": 0.65, "learning_rate": 1.7450482531555505e-05, "loss": 2.3256, "step": 373300 }, { "epoch": 0.65, "learning_rate": 1.744961059162868e-05, "loss": 2.2712, "step": 373310 }, { "epoch": 0.65, "learning_rate": 1.7448738651701856e-05, "loss": 2.3388, "step": 373320 }, { "epoch": 0.65, "learning_rate": 1.7447866711775026e-05, "loss": 2.2446, "step": 373330 }, { "epoch": 0.65, "learning_rate": 1.74469947718482e-05, "loss": 2.3177, "step": 373340 }, { "epoch": 0.65, "learning_rate": 1.744612283192137e-05, "loss": 2.2232, "step": 373350 }, { "epoch": 0.65, "learning_rate": 1.7445250891994547e-05, "loss": 2.3634, "step": 373360 }, { "epoch": 0.65, "learning_rate": 1.7444378952067718e-05, "loss": 2.4204, "step": 373370 }, { "epoch": 0.65, "learning_rate": 1.744350701214089e-05, "loss": 2.3996, "step": 373380 }, { "epoch": 0.65, "learning_rate": 1.7442635072214065e-05, "loss": 2.3631, "step": 373390 }, { "epoch": 0.65, "learning_rate": 1.744176313228724e-05, "loss": 2.2957, "step": 373400 }, { "epoch": 0.65, "learning_rate": 1.7440891192360413e-05, "loss": 2.2455, "step": 373410 }, { "epoch": 0.65, "learning_rate": 1.7440019252433583e-05, "loss": 2.267, "step": 373420 }, { "epoch": 0.65, "learning_rate": 1.743914731250676e-05, "loss": 2.3671, "step": 373430 }, { "epoch": 0.65, "learning_rate": 1.743827537257993e-05, "loss": 2.4207, "step": 373440 }, { "epoch": 0.65, "learning_rate": 1.7437403432653105e-05, "loss": 2.3101, "step": 373450 }, { "epoch": 0.65, "learning_rate": 1.743653149272628e-05, "loss": 2.3518, "step": 373460 }, { "epoch": 0.65, "learning_rate": 1.7435659552799452e-05, "loss": 2.34, "step": 373470 }, { "epoch": 0.65, "learning_rate": 1.7434787612872626e-05, "loss": 2.424, "step": 373480 }, { "epoch": 0.65, "learning_rate": 1.7433915672945796e-05, "loss": 2.3586, "step": 373490 }, { "epoch": 0.65, "learning_rate": 1.743304373301897e-05, "loss": 2.1928, "step": 373500 }, { "epoch": 0.65, "learning_rate": 1.7432171793092144e-05, "loss": 2.4004, "step": 373510 }, { "epoch": 0.65, "learning_rate": 1.7431299853165318e-05, "loss": 2.2558, "step": 373520 }, { "epoch": 0.65, "learning_rate": 1.7430427913238488e-05, "loss": 2.3058, "step": 373530 }, { "epoch": 0.65, "learning_rate": 1.7429555973311665e-05, "loss": 2.4519, "step": 373540 }, { "epoch": 0.65, "learning_rate": 1.742868403338484e-05, "loss": 2.4026, "step": 373550 }, { "epoch": 0.65, "learning_rate": 1.742781209345801e-05, "loss": 2.3349, "step": 373560 }, { "epoch": 0.65, "learning_rate": 1.7426940153531183e-05, "loss": 2.3704, "step": 373570 }, { "epoch": 0.65, "learning_rate": 1.7426068213604357e-05, "loss": 2.392, "step": 373580 }, { "epoch": 0.65, "learning_rate": 1.742519627367753e-05, "loss": 2.3762, "step": 373590 }, { "epoch": 0.65, "learning_rate": 1.74243243337507e-05, "loss": 2.4013, "step": 373600 }, { "epoch": 0.65, "learning_rate": 1.7423452393823875e-05, "loss": 2.3578, "step": 373610 }, { "epoch": 0.65, "learning_rate": 1.742258045389705e-05, "loss": 2.3003, "step": 373620 }, { "epoch": 0.65, "learning_rate": 1.7421708513970222e-05, "loss": 2.2573, "step": 373630 }, { "epoch": 0.65, "learning_rate": 1.7420836574043396e-05, "loss": 2.3049, "step": 373640 }, { "epoch": 0.65, "learning_rate": 1.741996463411657e-05, "loss": 2.2666, "step": 373650 }, { "epoch": 0.65, "learning_rate": 1.7419092694189744e-05, "loss": 2.4651, "step": 373660 }, { "epoch": 0.65, "learning_rate": 1.7418220754262914e-05, "loss": 2.2863, "step": 373670 }, { "epoch": 0.65, "learning_rate": 1.7417348814336088e-05, "loss": 2.2345, "step": 373680 }, { "epoch": 0.65, "learning_rate": 1.741647687440926e-05, "loss": 2.3521, "step": 373690 }, { "epoch": 0.65, "learning_rate": 1.7415604934482435e-05, "loss": 2.3704, "step": 373700 }, { "epoch": 0.65, "learning_rate": 1.741473299455561e-05, "loss": 2.2968, "step": 373710 }, { "epoch": 0.65, "learning_rate": 1.741386105462878e-05, "loss": 2.3135, "step": 373720 }, { "epoch": 0.65, "learning_rate": 1.7412989114701957e-05, "loss": 2.4003, "step": 373730 }, { "epoch": 0.65, "learning_rate": 1.7412117174775127e-05, "loss": 2.2722, "step": 373740 }, { "epoch": 0.65, "learning_rate": 1.74112452348483e-05, "loss": 2.3592, "step": 373750 }, { "epoch": 0.65, "learning_rate": 1.741037329492147e-05, "loss": 2.2797, "step": 373760 }, { "epoch": 0.65, "learning_rate": 1.740950135499465e-05, "loss": 2.3997, "step": 373770 }, { "epoch": 0.65, "learning_rate": 1.740862941506782e-05, "loss": 2.4342, "step": 373780 }, { "epoch": 0.65, "learning_rate": 1.7407757475140992e-05, "loss": 2.3969, "step": 373790 }, { "epoch": 0.65, "learning_rate": 1.740688553521417e-05, "loss": 2.3881, "step": 373800 }, { "epoch": 0.65, "learning_rate": 1.740601359528734e-05, "loss": 2.313, "step": 373810 }, { "epoch": 0.65, "learning_rate": 1.7405141655360514e-05, "loss": 2.3547, "step": 373820 }, { "epoch": 0.65, "learning_rate": 1.7404269715433684e-05, "loss": 2.3012, "step": 373830 }, { "epoch": 0.65, "learning_rate": 1.740339777550686e-05, "loss": 2.2383, "step": 373840 }, { "epoch": 0.65, "learning_rate": 1.7402525835580032e-05, "loss": 2.1674, "step": 373850 }, { "epoch": 0.65, "learning_rate": 1.7401653895653205e-05, "loss": 2.2048, "step": 373860 }, { "epoch": 0.65, "learning_rate": 1.740078195572638e-05, "loss": 2.3003, "step": 373870 }, { "epoch": 0.65, "learning_rate": 1.7399910015799553e-05, "loss": 2.3214, "step": 373880 }, { "epoch": 0.65, "learning_rate": 1.7399038075872727e-05, "loss": 2.3273, "step": 373890 }, { "epoch": 0.65, "learning_rate": 1.7398166135945897e-05, "loss": 2.3571, "step": 373900 }, { "epoch": 0.65, "learning_rate": 1.7397294196019074e-05, "loss": 2.3899, "step": 373910 }, { "epoch": 0.65, "learning_rate": 1.7396422256092245e-05, "loss": 2.3666, "step": 373920 }, { "epoch": 0.65, "learning_rate": 1.739555031616542e-05, "loss": 2.4038, "step": 373930 }, { "epoch": 0.65, "learning_rate": 1.7394678376238592e-05, "loss": 2.4005, "step": 373940 }, { "epoch": 0.65, "learning_rate": 1.7393806436311766e-05, "loss": 2.4216, "step": 373950 }, { "epoch": 0.65, "learning_rate": 1.739293449638494e-05, "loss": 2.3705, "step": 373960 }, { "epoch": 0.65, "learning_rate": 1.739206255645811e-05, "loss": 2.3098, "step": 373970 }, { "epoch": 0.65, "learning_rate": 1.7391190616531284e-05, "loss": 2.3332, "step": 373980 }, { "epoch": 0.65, "learning_rate": 1.7390318676604458e-05, "loss": 2.4013, "step": 373990 }, { "epoch": 0.65, "learning_rate": 1.738944673667763e-05, "loss": 2.41, "step": 374000 }, { "epoch": 0.65, "learning_rate": 1.7388574796750802e-05, "loss": 2.2885, "step": 374010 }, { "epoch": 0.65, "learning_rate": 1.7387702856823976e-05, "loss": 2.2966, "step": 374020 }, { "epoch": 0.65, "learning_rate": 1.738683091689715e-05, "loss": 2.3146, "step": 374030 }, { "epoch": 0.65, "learning_rate": 1.7385958976970323e-05, "loss": 2.3443, "step": 374040 }, { "epoch": 0.65, "learning_rate": 1.7385087037043497e-05, "loss": 2.2406, "step": 374050 }, { "epoch": 0.65, "learning_rate": 1.738421509711667e-05, "loss": 2.2729, "step": 374060 }, { "epoch": 0.65, "learning_rate": 1.7383343157189844e-05, "loss": 2.324, "step": 374070 }, { "epoch": 0.65, "learning_rate": 1.7382471217263015e-05, "loss": 2.1703, "step": 374080 }, { "epoch": 0.65, "learning_rate": 1.738159927733619e-05, "loss": 2.3066, "step": 374090 }, { "epoch": 0.65, "learning_rate": 1.7380727337409362e-05, "loss": 2.4341, "step": 374100 }, { "epoch": 0.65, "learning_rate": 1.7379855397482536e-05, "loss": 2.4535, "step": 374110 }, { "epoch": 0.65, "learning_rate": 1.737898345755571e-05, "loss": 2.2809, "step": 374120 }, { "epoch": 0.65, "learning_rate": 1.737811151762888e-05, "loss": 2.2911, "step": 374130 }, { "epoch": 0.65, "learning_rate": 1.7377239577702057e-05, "loss": 2.3692, "step": 374140 }, { "epoch": 0.65, "learning_rate": 1.7376367637775228e-05, "loss": 2.2563, "step": 374150 }, { "epoch": 0.65, "learning_rate": 1.73754956978484e-05, "loss": 2.2293, "step": 374160 }, { "epoch": 0.65, "learning_rate": 1.7374623757921575e-05, "loss": 2.2924, "step": 374170 }, { "epoch": 0.65, "learning_rate": 1.737375181799475e-05, "loss": 2.3663, "step": 374180 }, { "epoch": 0.65, "learning_rate": 1.7372879878067923e-05, "loss": 2.2274, "step": 374190 }, { "epoch": 0.65, "learning_rate": 1.7372007938141093e-05, "loss": 2.3177, "step": 374200 }, { "epoch": 0.65, "learning_rate": 1.737113599821427e-05, "loss": 2.4265, "step": 374210 }, { "epoch": 0.65, "learning_rate": 1.737026405828744e-05, "loss": 2.2235, "step": 374220 }, { "epoch": 0.65, "learning_rate": 1.7369392118360615e-05, "loss": 2.3965, "step": 374230 }, { "epoch": 0.65, "learning_rate": 1.7368520178433785e-05, "loss": 2.4046, "step": 374240 }, { "epoch": 0.65, "learning_rate": 1.7367648238506962e-05, "loss": 2.2179, "step": 374250 }, { "epoch": 0.65, "learning_rate": 1.7366776298580133e-05, "loss": 2.3943, "step": 374260 }, { "epoch": 0.65, "learning_rate": 1.7365904358653306e-05, "loss": 2.3989, "step": 374270 }, { "epoch": 0.65, "learning_rate": 1.736503241872648e-05, "loss": 2.377, "step": 374280 }, { "epoch": 0.65, "learning_rate": 1.7364160478799654e-05, "loss": 2.2611, "step": 374290 }, { "epoch": 0.65, "learning_rate": 1.7363288538872828e-05, "loss": 2.3294, "step": 374300 }, { "epoch": 0.65, "learning_rate": 1.7362416598945998e-05, "loss": 2.3451, "step": 374310 }, { "epoch": 0.65, "learning_rate": 1.7361544659019175e-05, "loss": 2.2755, "step": 374320 }, { "epoch": 0.65, "learning_rate": 1.7360672719092346e-05, "loss": 2.2364, "step": 374330 }, { "epoch": 0.65, "learning_rate": 1.735980077916552e-05, "loss": 2.1976, "step": 374340 }, { "epoch": 0.65, "learning_rate": 1.7358928839238693e-05, "loss": 2.4126, "step": 374350 }, { "epoch": 0.65, "learning_rate": 1.7358056899311867e-05, "loss": 2.2175, "step": 374360 }, { "epoch": 0.65, "learning_rate": 1.735718495938504e-05, "loss": 2.267, "step": 374370 }, { "epoch": 0.65, "learning_rate": 1.735631301945821e-05, "loss": 2.3936, "step": 374380 }, { "epoch": 0.65, "learning_rate": 1.7355441079531385e-05, "loss": 2.3762, "step": 374390 }, { "epoch": 0.65, "learning_rate": 1.735456913960456e-05, "loss": 2.3761, "step": 374400 }, { "epoch": 0.65, "learning_rate": 1.7353697199677732e-05, "loss": 2.3198, "step": 374410 }, { "epoch": 0.65, "learning_rate": 1.7352825259750906e-05, "loss": 2.3694, "step": 374420 }, { "epoch": 0.65, "learning_rate": 1.7351953319824076e-05, "loss": 2.299, "step": 374430 }, { "epoch": 0.65, "learning_rate": 1.7351081379897254e-05, "loss": 2.3049, "step": 374440 }, { "epoch": 0.65, "learning_rate": 1.7350209439970424e-05, "loss": 2.3566, "step": 374450 }, { "epoch": 0.65, "learning_rate": 1.7349337500043598e-05, "loss": 2.3334, "step": 374460 }, { "epoch": 0.65, "learning_rate": 1.734846556011677e-05, "loss": 2.312, "step": 374470 }, { "epoch": 0.65, "learning_rate": 1.7347593620189945e-05, "loss": 2.3148, "step": 374480 }, { "epoch": 0.65, "learning_rate": 1.7346721680263116e-05, "loss": 2.3428, "step": 374490 }, { "epoch": 0.65, "learning_rate": 1.734584974033629e-05, "loss": 2.3231, "step": 374500 }, { "epoch": 0.65, "learning_rate": 1.7344977800409463e-05, "loss": 2.3114, "step": 374510 }, { "epoch": 0.65, "learning_rate": 1.7344105860482637e-05, "loss": 2.3261, "step": 374520 }, { "epoch": 0.65, "learning_rate": 1.734323392055581e-05, "loss": 2.3153, "step": 374530 }, { "epoch": 0.65, "learning_rate": 1.734236198062898e-05, "loss": 2.3029, "step": 374540 }, { "epoch": 0.65, "learning_rate": 1.734149004070216e-05, "loss": 2.3046, "step": 374550 }, { "epoch": 0.65, "learning_rate": 1.734061810077533e-05, "loss": 2.3822, "step": 374560 }, { "epoch": 0.65, "learning_rate": 1.7339746160848502e-05, "loss": 2.2613, "step": 374570 }, { "epoch": 0.65, "learning_rate": 1.7338874220921676e-05, "loss": 2.3893, "step": 374580 }, { "epoch": 0.65, "learning_rate": 1.733800228099485e-05, "loss": 2.2694, "step": 374590 }, { "epoch": 0.65, "learning_rate": 1.7337130341068024e-05, "loss": 2.3245, "step": 374600 }, { "epoch": 0.65, "learning_rate": 1.7336258401141194e-05, "loss": 2.2862, "step": 374610 }, { "epoch": 0.65, "learning_rate": 1.733538646121437e-05, "loss": 2.2589, "step": 374620 }, { "epoch": 0.65, "learning_rate": 1.7334514521287542e-05, "loss": 2.3161, "step": 374630 }, { "epoch": 0.65, "learning_rate": 1.7333642581360715e-05, "loss": 2.2456, "step": 374640 }, { "epoch": 0.65, "learning_rate": 1.7332770641433886e-05, "loss": 2.3364, "step": 374650 }, { "epoch": 0.65, "learning_rate": 1.7331898701507063e-05, "loss": 2.2508, "step": 374660 }, { "epoch": 0.65, "learning_rate": 1.7331026761580237e-05, "loss": 2.5146, "step": 374670 }, { "epoch": 0.65, "learning_rate": 1.7330154821653407e-05, "loss": 2.3277, "step": 374680 }, { "epoch": 0.65, "learning_rate": 1.732928288172658e-05, "loss": 2.3392, "step": 374690 }, { "epoch": 0.65, "learning_rate": 1.7328410941799755e-05, "loss": 2.3929, "step": 374700 }, { "epoch": 0.65, "learning_rate": 1.732753900187293e-05, "loss": 2.511, "step": 374710 }, { "epoch": 0.65, "learning_rate": 1.73266670619461e-05, "loss": 2.3608, "step": 374720 }, { "epoch": 0.65, "learning_rate": 1.7325795122019276e-05, "loss": 2.2086, "step": 374730 }, { "epoch": 0.65, "learning_rate": 1.7324923182092446e-05, "loss": 2.3095, "step": 374740 }, { "epoch": 0.65, "learning_rate": 1.732405124216562e-05, "loss": 2.248, "step": 374750 }, { "epoch": 0.65, "learning_rate": 1.7323179302238794e-05, "loss": 2.358, "step": 374760 }, { "epoch": 0.65, "learning_rate": 1.7322307362311968e-05, "loss": 2.2984, "step": 374770 }, { "epoch": 0.65, "learning_rate": 1.732143542238514e-05, "loss": 2.3026, "step": 374780 }, { "epoch": 0.65, "learning_rate": 1.7320563482458312e-05, "loss": 2.3117, "step": 374790 }, { "epoch": 0.65, "learning_rate": 1.7319691542531486e-05, "loss": 2.3087, "step": 374800 }, { "epoch": 0.65, "learning_rate": 1.731881960260466e-05, "loss": 2.3497, "step": 374810 }, { "epoch": 0.65, "learning_rate": 1.7317947662677833e-05, "loss": 2.3721, "step": 374820 }, { "epoch": 0.65, "learning_rate": 1.7317075722751007e-05, "loss": 2.3091, "step": 374830 }, { "epoch": 0.65, "learning_rate": 1.7316203782824177e-05, "loss": 2.1705, "step": 374840 }, { "epoch": 0.65, "learning_rate": 1.7315331842897354e-05, "loss": 2.3314, "step": 374850 }, { "epoch": 0.65, "learning_rate": 1.7314459902970525e-05, "loss": 2.3381, "step": 374860 }, { "epoch": 0.65, "learning_rate": 1.73135879630437e-05, "loss": 2.3172, "step": 374870 }, { "epoch": 0.65, "learning_rate": 1.7312716023116872e-05, "loss": 2.3045, "step": 374880 }, { "epoch": 0.65, "learning_rate": 1.7311844083190046e-05, "loss": 2.3178, "step": 374890 }, { "epoch": 0.65, "learning_rate": 1.731097214326322e-05, "loss": 2.2515, "step": 374900 }, { "epoch": 0.65, "learning_rate": 1.731010020333639e-05, "loss": 2.2482, "step": 374910 }, { "epoch": 0.65, "learning_rate": 1.7309228263409567e-05, "loss": 2.305, "step": 374920 }, { "epoch": 0.65, "learning_rate": 1.7308356323482738e-05, "loss": 2.3845, "step": 374930 }, { "epoch": 0.65, "learning_rate": 1.730748438355591e-05, "loss": 2.4019, "step": 374940 }, { "epoch": 0.65, "learning_rate": 1.7306612443629082e-05, "loss": 2.2868, "step": 374950 }, { "epoch": 0.65, "learning_rate": 1.730574050370226e-05, "loss": 2.3032, "step": 374960 }, { "epoch": 0.65, "learning_rate": 1.730486856377543e-05, "loss": 2.386, "step": 374970 }, { "epoch": 0.65, "learning_rate": 1.7303996623848603e-05, "loss": 2.3372, "step": 374980 }, { "epoch": 0.65, "learning_rate": 1.7303124683921777e-05, "loss": 2.3868, "step": 374990 }, { "epoch": 0.65, "learning_rate": 1.730225274399495e-05, "loss": 2.2661, "step": 375000 }, { "epoch": 0.65, "learning_rate": 1.7301380804068125e-05, "loss": 2.3923, "step": 375010 }, { "epoch": 0.65, "learning_rate": 1.7300508864141295e-05, "loss": 2.3158, "step": 375020 }, { "epoch": 0.65, "learning_rate": 1.7299636924214472e-05, "loss": 2.3635, "step": 375030 }, { "epoch": 0.65, "learning_rate": 1.7298764984287643e-05, "loss": 2.2966, "step": 375040 }, { "epoch": 0.65, "learning_rate": 1.7297893044360816e-05, "loss": 2.3397, "step": 375050 }, { "epoch": 0.65, "learning_rate": 1.729702110443399e-05, "loss": 2.3367, "step": 375060 }, { "epoch": 0.65, "learning_rate": 1.7296149164507164e-05, "loss": 2.3709, "step": 375070 }, { "epoch": 0.65, "learning_rate": 1.7295277224580338e-05, "loss": 2.3933, "step": 375080 }, { "epoch": 0.65, "learning_rate": 1.7294405284653508e-05, "loss": 2.3343, "step": 375090 }, { "epoch": 0.65, "learning_rate": 1.7293533344726682e-05, "loss": 2.3145, "step": 375100 }, { "epoch": 0.65, "learning_rate": 1.7292661404799856e-05, "loss": 2.2912, "step": 375110 }, { "epoch": 0.65, "learning_rate": 1.729178946487303e-05, "loss": 2.3528, "step": 375120 }, { "epoch": 0.65, "learning_rate": 1.72909175249462e-05, "loss": 2.2858, "step": 375130 }, { "epoch": 0.65, "learning_rate": 1.7290045585019377e-05, "loss": 2.3195, "step": 375140 }, { "epoch": 0.65, "learning_rate": 1.728917364509255e-05, "loss": 2.375, "step": 375150 }, { "epoch": 0.65, "learning_rate": 1.728830170516572e-05, "loss": 2.406, "step": 375160 }, { "epoch": 0.65, "learning_rate": 1.7287429765238895e-05, "loss": 2.3075, "step": 375170 }, { "epoch": 0.65, "learning_rate": 1.728655782531207e-05, "loss": 2.2648, "step": 375180 }, { "epoch": 0.65, "learning_rate": 1.7285685885385242e-05, "loss": 2.2603, "step": 375190 }, { "epoch": 0.65, "learning_rate": 1.7284813945458413e-05, "loss": 2.271, "step": 375200 }, { "epoch": 0.65, "learning_rate": 1.7283942005531586e-05, "loss": 2.3146, "step": 375210 }, { "epoch": 0.65, "learning_rate": 1.728307006560476e-05, "loss": 2.3687, "step": 375220 }, { "epoch": 0.65, "learning_rate": 1.7282198125677934e-05, "loss": 2.2732, "step": 375230 }, { "epoch": 0.65, "learning_rate": 1.7281326185751108e-05, "loss": 2.438, "step": 375240 }, { "epoch": 0.65, "learning_rate": 1.728045424582428e-05, "loss": 2.2992, "step": 375250 }, { "epoch": 0.65, "learning_rate": 1.7279582305897455e-05, "loss": 2.3415, "step": 375260 }, { "epoch": 0.65, "learning_rate": 1.7278710365970626e-05, "loss": 2.3668, "step": 375270 }, { "epoch": 0.65, "learning_rate": 1.72778384260438e-05, "loss": 2.3799, "step": 375280 }, { "epoch": 0.65, "learning_rate": 1.7276966486116973e-05, "loss": 2.2112, "step": 375290 }, { "epoch": 0.65, "learning_rate": 1.7276094546190147e-05, "loss": 2.2837, "step": 375300 }, { "epoch": 0.65, "learning_rate": 1.727522260626332e-05, "loss": 2.3902, "step": 375310 }, { "epoch": 0.65, "learning_rate": 1.727435066633649e-05, "loss": 2.3204, "step": 375320 }, { "epoch": 0.65, "learning_rate": 1.727347872640967e-05, "loss": 2.2798, "step": 375330 }, { "epoch": 0.65, "learning_rate": 1.727260678648284e-05, "loss": 2.3685, "step": 375340 }, { "epoch": 0.65, "learning_rate": 1.7271734846556012e-05, "loss": 2.2907, "step": 375350 }, { "epoch": 0.65, "learning_rate": 1.7270862906629183e-05, "loss": 2.1992, "step": 375360 }, { "epoch": 0.65, "learning_rate": 1.726999096670236e-05, "loss": 2.2205, "step": 375370 }, { "epoch": 0.65, "learning_rate": 1.726911902677553e-05, "loss": 2.3384, "step": 375380 }, { "epoch": 0.65, "learning_rate": 1.7268247086848704e-05, "loss": 2.3895, "step": 375390 }, { "epoch": 0.65, "learning_rate": 1.726737514692188e-05, "loss": 2.3233, "step": 375400 }, { "epoch": 0.65, "learning_rate": 1.7266503206995052e-05, "loss": 2.2806, "step": 375410 }, { "epoch": 0.65, "learning_rate": 1.7265631267068225e-05, "loss": 2.2383, "step": 375420 }, { "epoch": 0.65, "learning_rate": 1.7264759327141396e-05, "loss": 2.3107, "step": 375430 }, { "epoch": 0.65, "learning_rate": 1.7263887387214573e-05, "loss": 2.304, "step": 375440 }, { "epoch": 0.65, "learning_rate": 1.7263015447287743e-05, "loss": 2.4387, "step": 375450 }, { "epoch": 0.65, "learning_rate": 1.7262143507360917e-05, "loss": 2.3266, "step": 375460 }, { "epoch": 0.65, "learning_rate": 1.726127156743409e-05, "loss": 2.3417, "step": 375470 }, { "epoch": 0.65, "learning_rate": 1.7260399627507265e-05, "loss": 2.2888, "step": 375480 }, { "epoch": 0.65, "learning_rate": 1.725952768758044e-05, "loss": 2.2479, "step": 375490 }, { "epoch": 0.65, "learning_rate": 1.725865574765361e-05, "loss": 2.4127, "step": 375500 }, { "epoch": 0.65, "learning_rate": 1.7257783807726786e-05, "loss": 2.309, "step": 375510 }, { "epoch": 0.65, "learning_rate": 1.7256911867799956e-05, "loss": 2.3385, "step": 375520 }, { "epoch": 0.65, "learning_rate": 1.725603992787313e-05, "loss": 2.3173, "step": 375530 }, { "epoch": 0.65, "learning_rate": 1.7255167987946304e-05, "loss": 2.3823, "step": 375540 }, { "epoch": 0.65, "learning_rate": 1.7254296048019478e-05, "loss": 2.3379, "step": 375550 }, { "epoch": 0.65, "learning_rate": 1.725342410809265e-05, "loss": 2.2879, "step": 375560 }, { "epoch": 0.65, "learning_rate": 1.7252552168165822e-05, "loss": 2.3568, "step": 375570 }, { "epoch": 0.65, "learning_rate": 1.7251680228238996e-05, "loss": 2.4165, "step": 375580 }, { "epoch": 0.65, "learning_rate": 1.725080828831217e-05, "loss": 2.2293, "step": 375590 }, { "epoch": 0.66, "learning_rate": 1.7249936348385343e-05, "loss": 2.2643, "step": 375600 }, { "epoch": 0.66, "learning_rate": 1.7249064408458514e-05, "loss": 2.2292, "step": 375610 }, { "epoch": 0.66, "learning_rate": 1.7248192468531687e-05, "loss": 2.3175, "step": 375620 }, { "epoch": 0.66, "learning_rate": 1.7247320528604864e-05, "loss": 2.4241, "step": 375630 }, { "epoch": 0.66, "learning_rate": 1.7246448588678035e-05, "loss": 2.4184, "step": 375640 }, { "epoch": 0.66, "learning_rate": 1.724557664875121e-05, "loss": 2.2992, "step": 375650 }, { "epoch": 0.66, "learning_rate": 1.7244704708824382e-05, "loss": 2.2606, "step": 375660 }, { "epoch": 0.66, "learning_rate": 1.7243832768897556e-05, "loss": 2.3886, "step": 375670 }, { "epoch": 0.66, "learning_rate": 1.7242960828970727e-05, "loss": 2.3281, "step": 375680 }, { "epoch": 0.66, "learning_rate": 1.72420888890439e-05, "loss": 2.256, "step": 375690 }, { "epoch": 0.66, "learning_rate": 1.7241216949117074e-05, "loss": 2.2784, "step": 375700 }, { "epoch": 0.66, "learning_rate": 1.7240345009190248e-05, "loss": 2.1952, "step": 375710 }, { "epoch": 0.66, "learning_rate": 1.723947306926342e-05, "loss": 2.3177, "step": 375720 }, { "epoch": 0.66, "learning_rate": 1.7238601129336592e-05, "loss": 2.269, "step": 375730 }, { "epoch": 0.66, "learning_rate": 1.723772918940977e-05, "loss": 2.3198, "step": 375740 }, { "epoch": 0.66, "learning_rate": 1.723685724948294e-05, "loss": 2.2882, "step": 375750 }, { "epoch": 0.66, "learning_rate": 1.7235985309556113e-05, "loss": 2.4664, "step": 375760 }, { "epoch": 0.66, "learning_rate": 1.7235113369629287e-05, "loss": 2.2876, "step": 375770 }, { "epoch": 0.66, "learning_rate": 1.723424142970246e-05, "loss": 2.3938, "step": 375780 }, { "epoch": 0.66, "learning_rate": 1.7233369489775635e-05, "loss": 2.3803, "step": 375790 }, { "epoch": 0.66, "learning_rate": 1.7232497549848805e-05, "loss": 2.2911, "step": 375800 }, { "epoch": 0.66, "learning_rate": 1.7231625609921982e-05, "loss": 2.3454, "step": 375810 }, { "epoch": 0.66, "learning_rate": 1.7230753669995153e-05, "loss": 2.3849, "step": 375820 }, { "epoch": 0.66, "learning_rate": 1.7229881730068326e-05, "loss": 2.3189, "step": 375830 }, { "epoch": 0.66, "learning_rate": 1.7229009790141497e-05, "loss": 2.3178, "step": 375840 }, { "epoch": 0.66, "learning_rate": 1.7228137850214674e-05, "loss": 2.39, "step": 375850 }, { "epoch": 0.66, "learning_rate": 1.7227265910287844e-05, "loss": 2.2492, "step": 375860 }, { "epoch": 0.66, "learning_rate": 1.7226393970361018e-05, "loss": 2.2546, "step": 375870 }, { "epoch": 0.66, "learning_rate": 1.7225522030434192e-05, "loss": 2.25, "step": 375880 }, { "epoch": 0.66, "learning_rate": 1.7224650090507366e-05, "loss": 2.3295, "step": 375890 }, { "epoch": 0.66, "learning_rate": 1.722377815058054e-05, "loss": 2.3812, "step": 375900 }, { "epoch": 0.66, "learning_rate": 1.722290621065371e-05, "loss": 2.3599, "step": 375910 }, { "epoch": 0.66, "learning_rate": 1.7222034270726887e-05, "loss": 2.2841, "step": 375920 }, { "epoch": 0.66, "learning_rate": 1.7221162330800057e-05, "loss": 2.3279, "step": 375930 }, { "epoch": 0.66, "learning_rate": 1.722029039087323e-05, "loss": 2.2333, "step": 375940 }, { "epoch": 0.66, "learning_rate": 1.7219418450946405e-05, "loss": 2.3255, "step": 375950 }, { "epoch": 0.66, "learning_rate": 1.721854651101958e-05, "loss": 2.3555, "step": 375960 }, { "epoch": 0.66, "learning_rate": 1.7217674571092752e-05, "loss": 2.2656, "step": 375970 }, { "epoch": 0.66, "learning_rate": 1.7216802631165923e-05, "loss": 2.4115, "step": 375980 }, { "epoch": 0.66, "learning_rate": 1.7215930691239096e-05, "loss": 2.2956, "step": 375990 }, { "epoch": 0.66, "learning_rate": 1.721505875131227e-05, "loss": 2.3194, "step": 376000 }, { "epoch": 0.66, "learning_rate": 1.7214186811385444e-05, "loss": 2.3228, "step": 376010 }, { "epoch": 0.66, "learning_rate": 1.7213314871458618e-05, "loss": 2.4089, "step": 376020 }, { "epoch": 0.66, "learning_rate": 1.7212442931531788e-05, "loss": 2.2939, "step": 376030 }, { "epoch": 0.66, "learning_rate": 1.7211570991604965e-05, "loss": 2.4491, "step": 376040 }, { "epoch": 0.66, "learning_rate": 1.7210699051678136e-05, "loss": 2.3837, "step": 376050 }, { "epoch": 0.66, "learning_rate": 1.720982711175131e-05, "loss": 2.321, "step": 376060 }, { "epoch": 0.66, "learning_rate": 1.7208955171824483e-05, "loss": 2.3258, "step": 376070 }, { "epoch": 0.66, "learning_rate": 1.7208083231897657e-05, "loss": 2.4234, "step": 376080 }, { "epoch": 0.66, "learning_rate": 1.7207211291970827e-05, "loss": 2.2667, "step": 376090 }, { "epoch": 0.66, "learning_rate": 1.7206339352044e-05, "loss": 2.3498, "step": 376100 }, { "epoch": 0.66, "learning_rate": 1.7205467412117175e-05, "loss": 2.3615, "step": 376110 }, { "epoch": 0.66, "learning_rate": 1.720459547219035e-05, "loss": 2.3519, "step": 376120 }, { "epoch": 0.66, "learning_rate": 1.7203723532263522e-05, "loss": 2.2793, "step": 376130 }, { "epoch": 0.66, "learning_rate": 1.7202851592336693e-05, "loss": 2.3378, "step": 376140 }, { "epoch": 0.66, "learning_rate": 1.720197965240987e-05, "loss": 2.4385, "step": 376150 }, { "epoch": 0.66, "learning_rate": 1.720110771248304e-05, "loss": 2.29, "step": 376160 }, { "epoch": 0.66, "learning_rate": 1.7200235772556214e-05, "loss": 2.3251, "step": 376170 }, { "epoch": 0.66, "learning_rate": 1.7199363832629388e-05, "loss": 2.2812, "step": 376180 }, { "epoch": 0.66, "learning_rate": 1.7198491892702562e-05, "loss": 2.3325, "step": 376190 }, { "epoch": 0.66, "learning_rate": 1.7197619952775735e-05, "loss": 2.1982, "step": 376200 }, { "epoch": 0.66, "learning_rate": 1.7196748012848906e-05, "loss": 2.248, "step": 376210 }, { "epoch": 0.66, "learning_rate": 1.7195876072922083e-05, "loss": 2.2284, "step": 376220 }, { "epoch": 0.66, "learning_rate": 1.7195004132995253e-05, "loss": 2.2671, "step": 376230 }, { "epoch": 0.66, "learning_rate": 1.7194132193068427e-05, "loss": 2.3553, "step": 376240 }, { "epoch": 0.66, "learning_rate": 1.71932602531416e-05, "loss": 2.3795, "step": 376250 }, { "epoch": 0.66, "learning_rate": 1.7192388313214775e-05, "loss": 2.2452, "step": 376260 }, { "epoch": 0.66, "learning_rate": 1.719151637328795e-05, "loss": 2.3192, "step": 376270 }, { "epoch": 0.66, "learning_rate": 1.719064443336112e-05, "loss": 2.2991, "step": 376280 }, { "epoch": 0.66, "learning_rate": 1.7189772493434293e-05, "loss": 2.3045, "step": 376290 }, { "epoch": 0.66, "learning_rate": 1.7188900553507466e-05, "loss": 2.3769, "step": 376300 }, { "epoch": 0.66, "learning_rate": 1.718802861358064e-05, "loss": 2.4355, "step": 376310 }, { "epoch": 0.66, "learning_rate": 1.718715667365381e-05, "loss": 2.2772, "step": 376320 }, { "epoch": 0.66, "learning_rate": 1.7186284733726988e-05, "loss": 2.33, "step": 376330 }, { "epoch": 0.66, "learning_rate": 1.7185412793800158e-05, "loss": 2.2936, "step": 376340 }, { "epoch": 0.66, "learning_rate": 1.7184540853873332e-05, "loss": 2.3024, "step": 376350 }, { "epoch": 0.66, "learning_rate": 1.7183668913946506e-05, "loss": 2.3339, "step": 376360 }, { "epoch": 0.66, "learning_rate": 1.718279697401968e-05, "loss": 2.4032, "step": 376370 }, { "epoch": 0.66, "learning_rate": 1.7181925034092853e-05, "loss": 2.2299, "step": 376380 }, { "epoch": 0.66, "learning_rate": 1.7181053094166024e-05, "loss": 2.2654, "step": 376390 }, { "epoch": 0.66, "learning_rate": 1.7180181154239197e-05, "loss": 2.2119, "step": 376400 }, { "epoch": 0.66, "learning_rate": 1.717930921431237e-05, "loss": 2.3239, "step": 376410 }, { "epoch": 0.66, "learning_rate": 1.7178437274385545e-05, "loss": 2.2742, "step": 376420 }, { "epoch": 0.66, "learning_rate": 1.717756533445872e-05, "loss": 2.2986, "step": 376430 }, { "epoch": 0.66, "learning_rate": 1.7176693394531892e-05, "loss": 2.3, "step": 376440 }, { "epoch": 0.66, "learning_rate": 1.7175821454605066e-05, "loss": 2.2809, "step": 376450 }, { "epoch": 0.66, "learning_rate": 1.7174949514678237e-05, "loss": 2.2113, "step": 376460 }, { "epoch": 0.66, "learning_rate": 1.717407757475141e-05, "loss": 2.3567, "step": 376470 }, { "epoch": 0.66, "learning_rate": 1.7173205634824584e-05, "loss": 2.2627, "step": 376480 }, { "epoch": 0.66, "learning_rate": 1.7172333694897758e-05, "loss": 2.2996, "step": 376490 }, { "epoch": 0.66, "learning_rate": 1.717146175497093e-05, "loss": 2.3617, "step": 376500 }, { "epoch": 0.66, "learning_rate": 1.7170589815044102e-05, "loss": 2.3106, "step": 376510 }, { "epoch": 0.66, "learning_rate": 1.716971787511728e-05, "loss": 2.3109, "step": 376520 }, { "epoch": 0.66, "learning_rate": 1.716884593519045e-05, "loss": 2.3088, "step": 376530 }, { "epoch": 0.66, "learning_rate": 1.7167973995263623e-05, "loss": 2.3279, "step": 376540 }, { "epoch": 0.66, "learning_rate": 1.7167102055336794e-05, "loss": 2.3396, "step": 376550 }, { "epoch": 0.66, "learning_rate": 1.716623011540997e-05, "loss": 2.2212, "step": 376560 }, { "epoch": 0.66, "learning_rate": 1.716535817548314e-05, "loss": 2.3122, "step": 376570 }, { "epoch": 0.66, "learning_rate": 1.7164486235556315e-05, "loss": 2.2867, "step": 376580 }, { "epoch": 0.66, "learning_rate": 1.716361429562949e-05, "loss": 2.262, "step": 376590 }, { "epoch": 0.66, "learning_rate": 1.7162742355702663e-05, "loss": 2.4606, "step": 376600 }, { "epoch": 0.66, "learning_rate": 1.7161870415775836e-05, "loss": 2.319, "step": 376610 }, { "epoch": 0.66, "learning_rate": 1.7160998475849007e-05, "loss": 2.3659, "step": 376620 }, { "epoch": 0.66, "learning_rate": 1.7160126535922184e-05, "loss": 2.3698, "step": 376630 }, { "epoch": 0.66, "learning_rate": 1.7159254595995354e-05, "loss": 2.3712, "step": 376640 }, { "epoch": 0.66, "learning_rate": 1.7158382656068528e-05, "loss": 2.3056, "step": 376650 }, { "epoch": 0.66, "learning_rate": 1.7157510716141702e-05, "loss": 2.2843, "step": 376660 }, { "epoch": 0.66, "learning_rate": 1.7156638776214876e-05, "loss": 2.3583, "step": 376670 }, { "epoch": 0.66, "learning_rate": 1.715576683628805e-05, "loss": 2.3201, "step": 376680 }, { "epoch": 0.66, "learning_rate": 1.715489489636122e-05, "loss": 2.4041, "step": 376690 }, { "epoch": 0.66, "learning_rate": 1.7154022956434393e-05, "loss": 2.3372, "step": 376700 }, { "epoch": 0.66, "learning_rate": 1.7153151016507567e-05, "loss": 2.4112, "step": 376710 }, { "epoch": 0.66, "learning_rate": 1.715227907658074e-05, "loss": 2.2633, "step": 376720 }, { "epoch": 0.66, "learning_rate": 1.715140713665391e-05, "loss": 2.3954, "step": 376730 }, { "epoch": 0.66, "learning_rate": 1.715053519672709e-05, "loss": 2.3131, "step": 376740 }, { "epoch": 0.66, "learning_rate": 1.7149663256800262e-05, "loss": 2.3413, "step": 376750 }, { "epoch": 0.66, "learning_rate": 1.7148791316873433e-05, "loss": 2.2829, "step": 376760 }, { "epoch": 0.66, "learning_rate": 1.7147919376946606e-05, "loss": 2.1798, "step": 376770 }, { "epoch": 0.66, "learning_rate": 1.714704743701978e-05, "loss": 2.2614, "step": 376780 }, { "epoch": 0.66, "learning_rate": 1.7146175497092954e-05, "loss": 2.283, "step": 376790 }, { "epoch": 0.66, "learning_rate": 1.7145303557166124e-05, "loss": 2.2649, "step": 376800 }, { "epoch": 0.66, "learning_rate": 1.7144431617239298e-05, "loss": 2.3022, "step": 376810 }, { "epoch": 0.66, "learning_rate": 1.7143559677312472e-05, "loss": 2.2907, "step": 376820 }, { "epoch": 0.66, "learning_rate": 1.7142687737385646e-05, "loss": 2.3141, "step": 376830 }, { "epoch": 0.66, "learning_rate": 1.714181579745882e-05, "loss": 2.3376, "step": 376840 }, { "epoch": 0.66, "learning_rate": 1.7140943857531993e-05, "loss": 2.418, "step": 376850 }, { "epoch": 0.66, "learning_rate": 1.7140071917605167e-05, "loss": 2.3139, "step": 376860 }, { "epoch": 0.66, "learning_rate": 1.7139199977678337e-05, "loss": 2.2822, "step": 376870 }, { "epoch": 0.66, "learning_rate": 1.713832803775151e-05, "loss": 2.3465, "step": 376880 }, { "epoch": 0.66, "learning_rate": 1.7137456097824685e-05, "loss": 2.274, "step": 376890 }, { "epoch": 0.66, "learning_rate": 1.713658415789786e-05, "loss": 2.3388, "step": 376900 }, { "epoch": 0.66, "learning_rate": 1.7135712217971032e-05, "loss": 2.2683, "step": 376910 }, { "epoch": 0.66, "learning_rate": 1.7134840278044203e-05, "loss": 2.2526, "step": 376920 }, { "epoch": 0.66, "learning_rate": 1.713396833811738e-05, "loss": 2.3153, "step": 376930 }, { "epoch": 0.66, "learning_rate": 1.713309639819055e-05, "loss": 2.3301, "step": 376940 }, { "epoch": 0.66, "learning_rate": 1.7132224458263724e-05, "loss": 2.4038, "step": 376950 }, { "epoch": 0.66, "learning_rate": 1.7131352518336895e-05, "loss": 2.3335, "step": 376960 }, { "epoch": 0.66, "learning_rate": 1.7130480578410072e-05, "loss": 2.3305, "step": 376970 }, { "epoch": 0.66, "learning_rate": 1.7129608638483245e-05, "loss": 2.3115, "step": 376980 }, { "epoch": 0.66, "learning_rate": 1.7128736698556416e-05, "loss": 2.3609, "step": 376990 }, { "epoch": 0.66, "learning_rate": 1.7127864758629593e-05, "loss": 2.2604, "step": 377000 }, { "epoch": 0.66, "learning_rate": 1.7126992818702763e-05, "loss": 2.279, "step": 377010 }, { "epoch": 0.66, "learning_rate": 1.7126120878775937e-05, "loss": 2.3645, "step": 377020 }, { "epoch": 0.66, "learning_rate": 1.7125248938849108e-05, "loss": 2.3025, "step": 377030 }, { "epoch": 0.66, "learning_rate": 1.7124376998922285e-05, "loss": 2.1676, "step": 377040 }, { "epoch": 0.66, "learning_rate": 1.7123505058995455e-05, "loss": 2.3451, "step": 377050 }, { "epoch": 0.66, "learning_rate": 1.712263311906863e-05, "loss": 2.3725, "step": 377060 }, { "epoch": 0.66, "learning_rate": 1.7121761179141803e-05, "loss": 2.2315, "step": 377070 }, { "epoch": 0.66, "learning_rate": 1.7120889239214976e-05, "loss": 2.2598, "step": 377080 }, { "epoch": 0.66, "learning_rate": 1.712001729928815e-05, "loss": 2.2407, "step": 377090 }, { "epoch": 0.66, "learning_rate": 1.711914535936132e-05, "loss": 2.3115, "step": 377100 }, { "epoch": 0.66, "learning_rate": 1.7118273419434498e-05, "loss": 2.3715, "step": 377110 }, { "epoch": 0.66, "learning_rate": 1.7117401479507668e-05, "loss": 2.38, "step": 377120 }, { "epoch": 0.66, "learning_rate": 1.7116529539580842e-05, "loss": 2.392, "step": 377130 }, { "epoch": 0.66, "learning_rate": 1.7115657599654016e-05, "loss": 2.3416, "step": 377140 }, { "epoch": 0.66, "learning_rate": 1.711478565972719e-05, "loss": 2.1535, "step": 377150 }, { "epoch": 0.66, "learning_rate": 1.7113913719800363e-05, "loss": 2.3792, "step": 377160 }, { "epoch": 0.66, "learning_rate": 1.7113041779873534e-05, "loss": 2.2359, "step": 377170 }, { "epoch": 0.66, "learning_rate": 1.7112169839946707e-05, "loss": 2.2679, "step": 377180 }, { "epoch": 0.66, "learning_rate": 1.711129790001988e-05, "loss": 2.3482, "step": 377190 }, { "epoch": 0.66, "learning_rate": 1.7110425960093055e-05, "loss": 2.3144, "step": 377200 }, { "epoch": 0.66, "learning_rate": 1.7109554020166225e-05, "loss": 2.2572, "step": 377210 }, { "epoch": 0.66, "learning_rate": 1.71086820802394e-05, "loss": 2.3864, "step": 377220 }, { "epoch": 0.66, "learning_rate": 1.7107810140312576e-05, "loss": 2.3612, "step": 377230 }, { "epoch": 0.66, "learning_rate": 1.7106938200385747e-05, "loss": 2.3038, "step": 377240 }, { "epoch": 0.66, "learning_rate": 1.710606626045892e-05, "loss": 2.3396, "step": 377250 }, { "epoch": 0.66, "learning_rate": 1.7105194320532094e-05, "loss": 2.2442, "step": 377260 }, { "epoch": 0.66, "learning_rate": 1.7104322380605268e-05, "loss": 2.267, "step": 377270 }, { "epoch": 0.66, "learning_rate": 1.7103450440678438e-05, "loss": 2.4166, "step": 377280 }, { "epoch": 0.66, "learning_rate": 1.7102578500751612e-05, "loss": 2.2742, "step": 377290 }, { "epoch": 0.66, "learning_rate": 1.7101706560824786e-05, "loss": 2.3426, "step": 377300 }, { "epoch": 0.66, "learning_rate": 1.710083462089796e-05, "loss": 2.327, "step": 377310 }, { "epoch": 0.66, "learning_rate": 1.7099962680971133e-05, "loss": 2.3988, "step": 377320 }, { "epoch": 0.66, "learning_rate": 1.7099090741044304e-05, "loss": 2.2704, "step": 377330 }, { "epoch": 0.66, "learning_rate": 1.709821880111748e-05, "loss": 2.3464, "step": 377340 }, { "epoch": 0.66, "learning_rate": 1.709734686119065e-05, "loss": 2.3414, "step": 377350 }, { "epoch": 0.66, "learning_rate": 1.7096474921263825e-05, "loss": 2.3453, "step": 377360 }, { "epoch": 0.66, "learning_rate": 1.7095602981337e-05, "loss": 2.3095, "step": 377370 }, { "epoch": 0.66, "learning_rate": 1.7094731041410173e-05, "loss": 2.3575, "step": 377380 }, { "epoch": 0.66, "learning_rate": 1.7093859101483346e-05, "loss": 2.2285, "step": 377390 }, { "epoch": 0.66, "learning_rate": 1.7092987161556517e-05, "loss": 2.3102, "step": 377400 }, { "epoch": 0.66, "learning_rate": 1.7092115221629694e-05, "loss": 2.3551, "step": 377410 }, { "epoch": 0.66, "learning_rate": 1.7091243281702864e-05, "loss": 2.3226, "step": 377420 }, { "epoch": 0.66, "learning_rate": 1.7090371341776038e-05, "loss": 2.2741, "step": 377430 }, { "epoch": 0.66, "learning_rate": 1.708949940184921e-05, "loss": 2.2649, "step": 377440 }, { "epoch": 0.66, "learning_rate": 1.7088627461922386e-05, "loss": 2.3195, "step": 377450 }, { "epoch": 0.66, "learning_rate": 1.7087755521995556e-05, "loss": 2.3501, "step": 377460 }, { "epoch": 0.66, "learning_rate": 1.708688358206873e-05, "loss": 2.4342, "step": 377470 }, { "epoch": 0.66, "learning_rate": 1.7086011642141903e-05, "loss": 2.3165, "step": 377480 }, { "epoch": 0.66, "learning_rate": 1.7085139702215077e-05, "loss": 2.394, "step": 377490 }, { "epoch": 0.66, "learning_rate": 1.708426776228825e-05, "loss": 2.3717, "step": 377500 }, { "epoch": 0.66, "learning_rate": 1.708339582236142e-05, "loss": 2.4768, "step": 377510 }, { "epoch": 0.66, "learning_rate": 1.70825238824346e-05, "loss": 2.2463, "step": 377520 }, { "epoch": 0.66, "learning_rate": 1.708165194250777e-05, "loss": 2.3012, "step": 377530 }, { "epoch": 0.66, "learning_rate": 1.7080780002580943e-05, "loss": 2.1724, "step": 377540 }, { "epoch": 0.66, "learning_rate": 1.7079908062654116e-05, "loss": 2.4287, "step": 377550 }, { "epoch": 0.66, "learning_rate": 1.707903612272729e-05, "loss": 2.3515, "step": 377560 }, { "epoch": 0.66, "learning_rate": 1.7078164182800464e-05, "loss": 2.3111, "step": 377570 }, { "epoch": 0.66, "learning_rate": 1.7077292242873634e-05, "loss": 2.293, "step": 377580 }, { "epoch": 0.66, "learning_rate": 1.7076420302946808e-05, "loss": 2.3878, "step": 377590 }, { "epoch": 0.66, "learning_rate": 1.7075548363019982e-05, "loss": 2.3848, "step": 377600 }, { "epoch": 0.66, "learning_rate": 1.7074676423093156e-05, "loss": 2.3543, "step": 377610 }, { "epoch": 0.66, "learning_rate": 1.707380448316633e-05, "loss": 2.2992, "step": 377620 }, { "epoch": 0.66, "learning_rate": 1.70729325432395e-05, "loss": 2.3942, "step": 377630 }, { "epoch": 0.66, "learning_rate": 1.7072060603312677e-05, "loss": 2.4457, "step": 377640 }, { "epoch": 0.66, "learning_rate": 1.7071188663385847e-05, "loss": 2.3576, "step": 377650 }, { "epoch": 0.66, "learning_rate": 1.707031672345902e-05, "loss": 2.3072, "step": 377660 }, { "epoch": 0.66, "learning_rate": 1.7069444783532195e-05, "loss": 2.4321, "step": 377670 }, { "epoch": 0.66, "learning_rate": 1.706857284360537e-05, "loss": 2.3622, "step": 377680 }, { "epoch": 0.66, "learning_rate": 1.706770090367854e-05, "loss": 2.2443, "step": 377690 }, { "epoch": 0.66, "learning_rate": 1.7066828963751713e-05, "loss": 2.2599, "step": 377700 }, { "epoch": 0.66, "learning_rate": 1.706595702382489e-05, "loss": 2.3395, "step": 377710 }, { "epoch": 0.66, "learning_rate": 1.706508508389806e-05, "loss": 2.3461, "step": 377720 }, { "epoch": 0.66, "learning_rate": 1.7064213143971234e-05, "loss": 2.2846, "step": 377730 }, { "epoch": 0.66, "learning_rate": 1.7063341204044405e-05, "loss": 2.2761, "step": 377740 }, { "epoch": 0.66, "learning_rate": 1.7062469264117582e-05, "loss": 2.3283, "step": 377750 }, { "epoch": 0.66, "learning_rate": 1.7061597324190752e-05, "loss": 2.3882, "step": 377760 }, { "epoch": 0.66, "learning_rate": 1.7060725384263926e-05, "loss": 2.4112, "step": 377770 }, { "epoch": 0.66, "learning_rate": 1.70598534443371e-05, "loss": 2.1841, "step": 377780 }, { "epoch": 0.66, "learning_rate": 1.7058981504410273e-05, "loss": 2.3539, "step": 377790 }, { "epoch": 0.66, "learning_rate": 1.7058109564483447e-05, "loss": 2.3053, "step": 377800 }, { "epoch": 0.66, "learning_rate": 1.7057237624556618e-05, "loss": 2.3519, "step": 377810 }, { "epoch": 0.66, "learning_rate": 1.7056365684629795e-05, "loss": 2.3156, "step": 377820 }, { "epoch": 0.66, "learning_rate": 1.7055493744702965e-05, "loss": 2.3775, "step": 377830 }, { "epoch": 0.66, "learning_rate": 1.705462180477614e-05, "loss": 2.3189, "step": 377840 }, { "epoch": 0.66, "learning_rate": 1.7053749864849313e-05, "loss": 2.4247, "step": 377850 }, { "epoch": 0.66, "learning_rate": 1.7052877924922486e-05, "loss": 2.315, "step": 377860 }, { "epoch": 0.66, "learning_rate": 1.705200598499566e-05, "loss": 2.3539, "step": 377870 }, { "epoch": 0.66, "learning_rate": 1.705113404506883e-05, "loss": 2.341, "step": 377880 }, { "epoch": 0.66, "learning_rate": 1.7050262105142004e-05, "loss": 2.283, "step": 377890 }, { "epoch": 0.66, "learning_rate": 1.7049390165215178e-05, "loss": 2.2999, "step": 377900 }, { "epoch": 0.66, "learning_rate": 1.7048518225288352e-05, "loss": 2.3354, "step": 377910 }, { "epoch": 0.66, "learning_rate": 1.7047646285361522e-05, "loss": 2.3697, "step": 377920 }, { "epoch": 0.66, "learning_rate": 1.70467743454347e-05, "loss": 2.3228, "step": 377930 }, { "epoch": 0.66, "learning_rate": 1.704590240550787e-05, "loss": 2.4005, "step": 377940 }, { "epoch": 0.66, "learning_rate": 1.7045030465581044e-05, "loss": 2.4584, "step": 377950 }, { "epoch": 0.66, "learning_rate": 1.7044158525654217e-05, "loss": 2.383, "step": 377960 }, { "epoch": 0.66, "learning_rate": 1.704328658572739e-05, "loss": 2.2226, "step": 377970 }, { "epoch": 0.66, "learning_rate": 1.7042414645800565e-05, "loss": 2.3378, "step": 377980 }, { "epoch": 0.66, "learning_rate": 1.7041542705873735e-05, "loss": 2.3098, "step": 377990 }, { "epoch": 0.66, "learning_rate": 1.704067076594691e-05, "loss": 2.3501, "step": 378000 }, { "epoch": 0.66, "learning_rate": 1.7039798826020083e-05, "loss": 2.358, "step": 378010 }, { "epoch": 0.66, "learning_rate": 1.7038926886093257e-05, "loss": 2.3389, "step": 378020 }, { "epoch": 0.66, "learning_rate": 1.703805494616643e-05, "loss": 2.2295, "step": 378030 }, { "epoch": 0.66, "learning_rate": 1.7037183006239604e-05, "loss": 2.2579, "step": 378040 }, { "epoch": 0.66, "learning_rate": 1.7036311066312778e-05, "loss": 2.1863, "step": 378050 }, { "epoch": 0.66, "learning_rate": 1.7035439126385948e-05, "loss": 2.3936, "step": 378060 }, { "epoch": 0.66, "learning_rate": 1.7034567186459122e-05, "loss": 2.2308, "step": 378070 }, { "epoch": 0.66, "learning_rate": 1.7033695246532296e-05, "loss": 2.3567, "step": 378080 }, { "epoch": 0.66, "learning_rate": 1.703282330660547e-05, "loss": 2.2988, "step": 378090 }, { "epoch": 0.66, "learning_rate": 1.7031951366678643e-05, "loss": 2.3501, "step": 378100 }, { "epoch": 0.66, "learning_rate": 1.7031079426751814e-05, "loss": 2.196, "step": 378110 }, { "epoch": 0.66, "learning_rate": 1.703020748682499e-05, "loss": 2.4058, "step": 378120 }, { "epoch": 0.66, "learning_rate": 1.702933554689816e-05, "loss": 2.3401, "step": 378130 }, { "epoch": 0.66, "learning_rate": 1.7028463606971335e-05, "loss": 2.2765, "step": 378140 }, { "epoch": 0.66, "learning_rate": 1.7027591667044505e-05, "loss": 2.2141, "step": 378150 }, { "epoch": 0.66, "learning_rate": 1.7026719727117683e-05, "loss": 2.3435, "step": 378160 }, { "epoch": 0.66, "learning_rate": 1.7025847787190853e-05, "loss": 2.0845, "step": 378170 }, { "epoch": 0.66, "learning_rate": 1.7024975847264027e-05, "loss": 2.272, "step": 378180 }, { "epoch": 0.66, "learning_rate": 1.70241039073372e-05, "loss": 2.2385, "step": 378190 }, { "epoch": 0.66, "learning_rate": 1.7023231967410374e-05, "loss": 2.3478, "step": 378200 }, { "epoch": 0.66, "learning_rate": 1.7022360027483548e-05, "loss": 2.2371, "step": 378210 }, { "epoch": 0.66, "learning_rate": 1.702148808755672e-05, "loss": 2.2299, "step": 378220 }, { "epoch": 0.66, "learning_rate": 1.7020616147629896e-05, "loss": 2.3502, "step": 378230 }, { "epoch": 0.66, "learning_rate": 1.7019744207703066e-05, "loss": 2.2712, "step": 378240 }, { "epoch": 0.66, "learning_rate": 1.701887226777624e-05, "loss": 2.3855, "step": 378250 }, { "epoch": 0.66, "learning_rate": 1.7018000327849414e-05, "loss": 2.2109, "step": 378260 }, { "epoch": 0.66, "learning_rate": 1.7017128387922587e-05, "loss": 2.1532, "step": 378270 }, { "epoch": 0.66, "learning_rate": 1.701625644799576e-05, "loss": 2.2835, "step": 378280 }, { "epoch": 0.66, "learning_rate": 1.701538450806893e-05, "loss": 2.3264, "step": 378290 }, { "epoch": 0.66, "learning_rate": 1.701451256814211e-05, "loss": 2.2487, "step": 378300 }, { "epoch": 0.66, "learning_rate": 1.701364062821528e-05, "loss": 2.3217, "step": 378310 }, { "epoch": 0.66, "learning_rate": 1.7012768688288453e-05, "loss": 2.3613, "step": 378320 }, { "epoch": 0.66, "learning_rate": 1.7011896748361627e-05, "loss": 2.436, "step": 378330 }, { "epoch": 0.66, "learning_rate": 1.70110248084348e-05, "loss": 2.4444, "step": 378340 }, { "epoch": 0.66, "learning_rate": 1.7010152868507974e-05, "loss": 2.337, "step": 378350 }, { "epoch": 0.66, "learning_rate": 1.7009280928581144e-05, "loss": 2.2757, "step": 378360 }, { "epoch": 0.66, "learning_rate": 1.7008408988654318e-05, "loss": 2.3246, "step": 378370 }, { "epoch": 0.66, "learning_rate": 1.7007537048727492e-05, "loss": 2.2979, "step": 378380 }, { "epoch": 0.66, "learning_rate": 1.7006665108800666e-05, "loss": 2.3299, "step": 378390 }, { "epoch": 0.66, "learning_rate": 1.7005793168873836e-05, "loss": 2.3018, "step": 378400 }, { "epoch": 0.66, "learning_rate": 1.700492122894701e-05, "loss": 2.243, "step": 378410 }, { "epoch": 0.66, "learning_rate": 1.7004049289020184e-05, "loss": 2.3251, "step": 378420 }, { "epoch": 0.66, "learning_rate": 1.7003177349093357e-05, "loss": 2.385, "step": 378430 }, { "epoch": 0.66, "learning_rate": 1.700230540916653e-05, "loss": 2.3255, "step": 378440 }, { "epoch": 0.66, "learning_rate": 1.7001433469239705e-05, "loss": 2.3163, "step": 378450 }, { "epoch": 0.66, "learning_rate": 1.700056152931288e-05, "loss": 2.2536, "step": 378460 }, { "epoch": 0.66, "learning_rate": 1.699968958938605e-05, "loss": 2.3505, "step": 378470 }, { "epoch": 0.66, "learning_rate": 1.6998817649459223e-05, "loss": 2.2433, "step": 378480 }, { "epoch": 0.66, "learning_rate": 1.6997945709532397e-05, "loss": 2.2847, "step": 378490 }, { "epoch": 0.66, "learning_rate": 1.699707376960557e-05, "loss": 2.3007, "step": 378500 }, { "epoch": 0.66, "learning_rate": 1.6996201829678744e-05, "loss": 2.2345, "step": 378510 }, { "epoch": 0.66, "learning_rate": 1.6995329889751915e-05, "loss": 2.2071, "step": 378520 }, { "epoch": 0.66, "learning_rate": 1.6994457949825092e-05, "loss": 2.2815, "step": 378530 }, { "epoch": 0.66, "learning_rate": 1.6993586009898262e-05, "loss": 2.381, "step": 378540 }, { "epoch": 0.66, "learning_rate": 1.6992714069971436e-05, "loss": 2.2736, "step": 378550 }, { "epoch": 0.66, "learning_rate": 1.6991842130044606e-05, "loss": 2.3192, "step": 378560 }, { "epoch": 0.66, "learning_rate": 1.6990970190117783e-05, "loss": 2.3101, "step": 378570 }, { "epoch": 0.66, "learning_rate": 1.6990098250190957e-05, "loss": 2.2067, "step": 378580 }, { "epoch": 0.66, "learning_rate": 1.6989226310264128e-05, "loss": 2.3342, "step": 378590 }, { "epoch": 0.66, "learning_rate": 1.6988354370337305e-05, "loss": 2.2857, "step": 378600 }, { "epoch": 0.66, "learning_rate": 1.6987482430410475e-05, "loss": 2.2346, "step": 378610 }, { "epoch": 0.66, "learning_rate": 1.698661049048365e-05, "loss": 2.2118, "step": 378620 }, { "epoch": 0.66, "learning_rate": 1.698573855055682e-05, "loss": 2.2459, "step": 378630 }, { "epoch": 0.66, "learning_rate": 1.6984866610629996e-05, "loss": 2.2423, "step": 378640 }, { "epoch": 0.66, "learning_rate": 1.6983994670703167e-05, "loss": 2.1942, "step": 378650 }, { "epoch": 0.66, "learning_rate": 1.698312273077634e-05, "loss": 2.3597, "step": 378660 }, { "epoch": 0.66, "learning_rate": 1.6982250790849514e-05, "loss": 2.3653, "step": 378670 }, { "epoch": 0.66, "learning_rate": 1.6981378850922688e-05, "loss": 2.3409, "step": 378680 }, { "epoch": 0.66, "learning_rate": 1.6980506910995862e-05, "loss": 2.377, "step": 378690 }, { "epoch": 0.66, "learning_rate": 1.6979634971069032e-05, "loss": 2.3434, "step": 378700 }, { "epoch": 0.66, "learning_rate": 1.697876303114221e-05, "loss": 2.4115, "step": 378710 }, { "epoch": 0.66, "learning_rate": 1.697789109121538e-05, "loss": 2.3286, "step": 378720 }, { "epoch": 0.66, "learning_rate": 1.6977019151288554e-05, "loss": 2.4143, "step": 378730 }, { "epoch": 0.66, "learning_rate": 1.6976147211361727e-05, "loss": 2.3572, "step": 378740 }, { "epoch": 0.66, "learning_rate": 1.69752752714349e-05, "loss": 2.3128, "step": 378750 }, { "epoch": 0.66, "learning_rate": 1.6974403331508075e-05, "loss": 2.3076, "step": 378760 }, { "epoch": 0.66, "learning_rate": 1.6973531391581245e-05, "loss": 2.2322, "step": 378770 }, { "epoch": 0.66, "learning_rate": 1.697265945165442e-05, "loss": 2.2124, "step": 378780 }, { "epoch": 0.66, "learning_rate": 1.6971787511727593e-05, "loss": 2.2525, "step": 378790 }, { "epoch": 0.66, "learning_rate": 1.6970915571800767e-05, "loss": 2.3409, "step": 378800 }, { "epoch": 0.66, "learning_rate": 1.6970043631873937e-05, "loss": 2.2854, "step": 378810 }, { "epoch": 0.66, "learning_rate": 1.696917169194711e-05, "loss": 2.2584, "step": 378820 }, { "epoch": 0.66, "learning_rate": 1.6968299752020288e-05, "loss": 2.3947, "step": 378830 }, { "epoch": 0.66, "learning_rate": 1.6967427812093458e-05, "loss": 2.3206, "step": 378840 }, { "epoch": 0.66, "learning_rate": 1.6966555872166632e-05, "loss": 2.2515, "step": 378850 }, { "epoch": 0.66, "learning_rate": 1.6965683932239806e-05, "loss": 2.3863, "step": 378860 }, { "epoch": 0.66, "learning_rate": 1.696481199231298e-05, "loss": 2.3666, "step": 378870 }, { "epoch": 0.66, "learning_rate": 1.696394005238615e-05, "loss": 2.2851, "step": 378880 }, { "epoch": 0.66, "learning_rate": 1.6963068112459324e-05, "loss": 2.3509, "step": 378890 }, { "epoch": 0.66, "learning_rate": 1.6962196172532498e-05, "loss": 2.304, "step": 378900 }, { "epoch": 0.66, "learning_rate": 1.696132423260567e-05, "loss": 2.2751, "step": 378910 }, { "epoch": 0.66, "learning_rate": 1.6960452292678845e-05, "loss": 2.4239, "step": 378920 }, { "epoch": 0.66, "learning_rate": 1.6959580352752015e-05, "loss": 2.3318, "step": 378930 }, { "epoch": 0.66, "learning_rate": 1.6958708412825193e-05, "loss": 2.4103, "step": 378940 }, { "epoch": 0.66, "learning_rate": 1.6957836472898363e-05, "loss": 2.2837, "step": 378950 }, { "epoch": 0.66, "learning_rate": 1.6956964532971537e-05, "loss": 2.2952, "step": 378960 }, { "epoch": 0.66, "learning_rate": 1.695609259304471e-05, "loss": 2.3179, "step": 378970 }, { "epoch": 0.66, "learning_rate": 1.6955220653117884e-05, "loss": 2.3301, "step": 378980 }, { "epoch": 0.66, "learning_rate": 1.6954348713191058e-05, "loss": 2.3146, "step": 378990 }, { "epoch": 0.66, "learning_rate": 1.695347677326423e-05, "loss": 2.2709, "step": 379000 }, { "epoch": 0.66, "learning_rate": 1.6952604833337406e-05, "loss": 2.3873, "step": 379010 }, { "epoch": 0.66, "learning_rate": 1.6951732893410576e-05, "loss": 2.2461, "step": 379020 }, { "epoch": 0.66, "learning_rate": 1.695086095348375e-05, "loss": 2.2695, "step": 379030 }, { "epoch": 0.66, "learning_rate": 1.694998901355692e-05, "loss": 2.258, "step": 379040 }, { "epoch": 0.66, "learning_rate": 1.6949117073630097e-05, "loss": 2.2391, "step": 379050 }, { "epoch": 0.66, "learning_rate": 1.694824513370327e-05, "loss": 2.3418, "step": 379060 }, { "epoch": 0.66, "learning_rate": 1.694737319377644e-05, "loss": 2.3444, "step": 379070 }, { "epoch": 0.66, "learning_rate": 1.6946501253849615e-05, "loss": 2.3456, "step": 379080 }, { "epoch": 0.66, "learning_rate": 1.694562931392279e-05, "loss": 2.2599, "step": 379090 }, { "epoch": 0.66, "learning_rate": 1.6944757373995963e-05, "loss": 2.3778, "step": 379100 }, { "epoch": 0.66, "learning_rate": 1.6943885434069133e-05, "loss": 2.3186, "step": 379110 }, { "epoch": 0.66, "learning_rate": 1.694301349414231e-05, "loss": 2.3225, "step": 379120 }, { "epoch": 0.66, "learning_rate": 1.694214155421548e-05, "loss": 2.3823, "step": 379130 }, { "epoch": 0.66, "learning_rate": 1.6941269614288654e-05, "loss": 2.4048, "step": 379140 }, { "epoch": 0.66, "learning_rate": 1.6940397674361828e-05, "loss": 2.3883, "step": 379150 }, { "epoch": 0.66, "learning_rate": 1.6939525734435002e-05, "loss": 2.2612, "step": 379160 }, { "epoch": 0.66, "learning_rate": 1.6938653794508176e-05, "loss": 2.2646, "step": 379170 }, { "epoch": 0.66, "learning_rate": 1.6937781854581346e-05, "loss": 2.4043, "step": 379180 }, { "epoch": 0.66, "learning_rate": 1.693690991465452e-05, "loss": 2.398, "step": 379190 }, { "epoch": 0.66, "learning_rate": 1.6936037974727694e-05, "loss": 2.3605, "step": 379200 }, { "epoch": 0.66, "learning_rate": 1.6935166034800867e-05, "loss": 2.3411, "step": 379210 }, { "epoch": 0.66, "learning_rate": 1.693429409487404e-05, "loss": 2.2971, "step": 379220 }, { "epoch": 0.66, "learning_rate": 1.6933422154947215e-05, "loss": 2.3472, "step": 379230 }, { "epoch": 0.66, "learning_rate": 1.693255021502039e-05, "loss": 2.2476, "step": 379240 }, { "epoch": 0.66, "learning_rate": 1.693167827509356e-05, "loss": 2.2115, "step": 379250 }, { "epoch": 0.66, "learning_rate": 1.6930806335166733e-05, "loss": 2.0942, "step": 379260 }, { "epoch": 0.66, "learning_rate": 1.6929934395239907e-05, "loss": 2.2882, "step": 379270 }, { "epoch": 0.66, "learning_rate": 1.692906245531308e-05, "loss": 2.2856, "step": 379280 }, { "epoch": 0.66, "learning_rate": 1.692819051538625e-05, "loss": 2.2941, "step": 379290 }, { "epoch": 0.66, "learning_rate": 1.6927318575459425e-05, "loss": 2.2769, "step": 379300 }, { "epoch": 0.66, "learning_rate": 1.6926446635532602e-05, "loss": 2.211, "step": 379310 }, { "epoch": 0.66, "learning_rate": 1.6925574695605772e-05, "loss": 2.3323, "step": 379320 }, { "epoch": 0.66, "learning_rate": 1.6924702755678946e-05, "loss": 2.3426, "step": 379330 }, { "epoch": 0.66, "learning_rate": 1.6923830815752116e-05, "loss": 2.324, "step": 379340 }, { "epoch": 0.66, "learning_rate": 1.6922958875825293e-05, "loss": 2.3215, "step": 379350 }, { "epoch": 0.66, "learning_rate": 1.6922086935898464e-05, "loss": 2.2698, "step": 379360 }, { "epoch": 0.66, "learning_rate": 1.6921214995971638e-05, "loss": 2.3085, "step": 379370 }, { "epoch": 0.66, "learning_rate": 1.692034305604481e-05, "loss": 2.416, "step": 379380 }, { "epoch": 0.66, "learning_rate": 1.6919471116117985e-05, "loss": 2.3383, "step": 379390 }, { "epoch": 0.66, "learning_rate": 1.691859917619116e-05, "loss": 2.2851, "step": 379400 }, { "epoch": 0.66, "learning_rate": 1.691772723626433e-05, "loss": 2.21, "step": 379410 }, { "epoch": 0.66, "learning_rate": 1.6916855296337506e-05, "loss": 2.3843, "step": 379420 }, { "epoch": 0.66, "learning_rate": 1.6915983356410677e-05, "loss": 2.3665, "step": 379430 }, { "epoch": 0.66, "learning_rate": 1.691511141648385e-05, "loss": 2.3412, "step": 379440 }, { "epoch": 0.66, "learning_rate": 1.6914239476557024e-05, "loss": 2.2974, "step": 379450 }, { "epoch": 0.66, "learning_rate": 1.6913367536630198e-05, "loss": 2.3731, "step": 379460 }, { "epoch": 0.66, "learning_rate": 1.6912495596703372e-05, "loss": 2.3744, "step": 379470 }, { "epoch": 0.66, "learning_rate": 1.6911623656776542e-05, "loss": 2.3232, "step": 379480 }, { "epoch": 0.66, "learning_rate": 1.6910751716849716e-05, "loss": 2.3349, "step": 379490 }, { "epoch": 0.66, "learning_rate": 1.690987977692289e-05, "loss": 2.3764, "step": 379500 }, { "epoch": 0.66, "learning_rate": 1.6909007836996064e-05, "loss": 2.2937, "step": 379510 }, { "epoch": 0.66, "learning_rate": 1.6908135897069234e-05, "loss": 2.2463, "step": 379520 }, { "epoch": 0.66, "learning_rate": 1.690726395714241e-05, "loss": 2.3538, "step": 379530 }, { "epoch": 0.66, "learning_rate": 1.690639201721558e-05, "loss": 2.3329, "step": 379540 }, { "epoch": 0.66, "learning_rate": 1.6905520077288755e-05, "loss": 2.2844, "step": 379550 }, { "epoch": 0.66, "learning_rate": 1.690464813736193e-05, "loss": 2.2214, "step": 379560 }, { "epoch": 0.66, "learning_rate": 1.6903776197435103e-05, "loss": 2.3034, "step": 379570 }, { "epoch": 0.66, "learning_rate": 1.6902904257508277e-05, "loss": 2.3338, "step": 379580 }, { "epoch": 0.66, "learning_rate": 1.6902032317581447e-05, "loss": 2.304, "step": 379590 }, { "epoch": 0.66, "learning_rate": 1.690116037765462e-05, "loss": 2.3782, "step": 379600 }, { "epoch": 0.66, "learning_rate": 1.6900288437727795e-05, "loss": 2.2751, "step": 379610 }, { "epoch": 0.66, "learning_rate": 1.6899416497800968e-05, "loss": 2.2085, "step": 379620 }, { "epoch": 0.66, "learning_rate": 1.6898544557874142e-05, "loss": 2.3334, "step": 379630 }, { "epoch": 0.66, "learning_rate": 1.6897672617947316e-05, "loss": 2.3679, "step": 379640 }, { "epoch": 0.66, "learning_rate": 1.689680067802049e-05, "loss": 2.3393, "step": 379650 }, { "epoch": 0.66, "learning_rate": 1.689592873809366e-05, "loss": 2.2648, "step": 379660 }, { "epoch": 0.66, "learning_rate": 1.6895056798166834e-05, "loss": 2.2886, "step": 379670 }, { "epoch": 0.66, "learning_rate": 1.6894184858240008e-05, "loss": 2.3278, "step": 379680 }, { "epoch": 0.66, "learning_rate": 1.689331291831318e-05, "loss": 2.3329, "step": 379690 }, { "epoch": 0.66, "learning_rate": 1.6892440978386355e-05, "loss": 2.4276, "step": 379700 }, { "epoch": 0.66, "learning_rate": 1.6891569038459525e-05, "loss": 2.2105, "step": 379710 }, { "epoch": 0.66, "learning_rate": 1.6890697098532703e-05, "loss": 2.2439, "step": 379720 }, { "epoch": 0.66, "learning_rate": 1.6889825158605873e-05, "loss": 2.3772, "step": 379730 }, { "epoch": 0.66, "learning_rate": 1.6888953218679047e-05, "loss": 2.2888, "step": 379740 }, { "epoch": 0.66, "learning_rate": 1.6888081278752217e-05, "loss": 2.2695, "step": 379750 }, { "epoch": 0.66, "learning_rate": 1.6887209338825394e-05, "loss": 2.3107, "step": 379760 }, { "epoch": 0.66, "learning_rate": 1.6886337398898565e-05, "loss": 2.2761, "step": 379770 }, { "epoch": 0.66, "learning_rate": 1.688546545897174e-05, "loss": 2.457, "step": 379780 }, { "epoch": 0.66, "learning_rate": 1.6884593519044916e-05, "loss": 2.2228, "step": 379790 }, { "epoch": 0.66, "learning_rate": 1.6883721579118086e-05, "loss": 2.2323, "step": 379800 }, { "epoch": 0.66, "learning_rate": 1.688284963919126e-05, "loss": 2.2534, "step": 379810 }, { "epoch": 0.66, "learning_rate": 1.688197769926443e-05, "loss": 2.4035, "step": 379820 }, { "epoch": 0.66, "learning_rate": 1.6881105759337607e-05, "loss": 2.253, "step": 379830 }, { "epoch": 0.66, "learning_rate": 1.6880233819410778e-05, "loss": 2.2852, "step": 379840 }, { "epoch": 0.66, "learning_rate": 1.687936187948395e-05, "loss": 2.2404, "step": 379850 }, { "epoch": 0.66, "learning_rate": 1.6878489939557125e-05, "loss": 2.246, "step": 379860 }, { "epoch": 0.66, "learning_rate": 1.68776179996303e-05, "loss": 2.3661, "step": 379870 }, { "epoch": 0.66, "learning_rate": 1.6876746059703473e-05, "loss": 2.3608, "step": 379880 }, { "epoch": 0.66, "learning_rate": 1.6875874119776643e-05, "loss": 2.3421, "step": 379890 }, { "epoch": 0.66, "learning_rate": 1.687500217984982e-05, "loss": 2.3161, "step": 379900 }, { "epoch": 0.66, "learning_rate": 1.687413023992299e-05, "loss": 2.2616, "step": 379910 }, { "epoch": 0.66, "learning_rate": 1.6873258299996164e-05, "loss": 2.371, "step": 379920 }, { "epoch": 0.66, "learning_rate": 1.6872386360069338e-05, "loss": 2.2775, "step": 379930 }, { "epoch": 0.66, "learning_rate": 1.6871514420142512e-05, "loss": 2.4206, "step": 379940 }, { "epoch": 0.66, "learning_rate": 1.6870642480215686e-05, "loss": 2.2278, "step": 379950 }, { "epoch": 0.66, "learning_rate": 1.6869770540288856e-05, "loss": 2.3837, "step": 379960 }, { "epoch": 0.66, "learning_rate": 1.686889860036203e-05, "loss": 2.3524, "step": 379970 }, { "epoch": 0.66, "learning_rate": 1.6868026660435204e-05, "loss": 2.1719, "step": 379980 }, { "epoch": 0.66, "learning_rate": 1.6867154720508377e-05, "loss": 2.3342, "step": 379990 }, { "epoch": 0.66, "learning_rate": 1.6866282780581548e-05, "loss": 2.2199, "step": 380000 }, { "epoch": 0.66, "learning_rate": 1.686541084065472e-05, "loss": 2.2453, "step": 380010 }, { "epoch": 0.66, "learning_rate": 1.6864538900727895e-05, "loss": 2.3465, "step": 380020 }, { "epoch": 0.66, "learning_rate": 1.686366696080107e-05, "loss": 2.3753, "step": 380030 }, { "epoch": 0.66, "learning_rate": 1.6862795020874243e-05, "loss": 2.264, "step": 380040 }, { "epoch": 0.66, "learning_rate": 1.6861923080947417e-05, "loss": 2.2893, "step": 380050 }, { "epoch": 0.66, "learning_rate": 1.686105114102059e-05, "loss": 2.3556, "step": 380060 }, { "epoch": 0.66, "learning_rate": 1.686017920109376e-05, "loss": 2.3086, "step": 380070 }, { "epoch": 0.66, "learning_rate": 1.6859307261166935e-05, "loss": 2.4279, "step": 380080 }, { "epoch": 0.66, "learning_rate": 1.685843532124011e-05, "loss": 2.3985, "step": 380090 }, { "epoch": 0.66, "learning_rate": 1.6857563381313282e-05, "loss": 2.4798, "step": 380100 }, { "epoch": 0.66, "learning_rate": 1.6856691441386456e-05, "loss": 2.374, "step": 380110 }, { "epoch": 0.66, "learning_rate": 1.6855819501459626e-05, "loss": 2.3818, "step": 380120 }, { "epoch": 0.66, "learning_rate": 1.6854947561532803e-05, "loss": 2.322, "step": 380130 }, { "epoch": 0.66, "learning_rate": 1.6854075621605974e-05, "loss": 2.2352, "step": 380140 }, { "epoch": 0.66, "learning_rate": 1.6853203681679148e-05, "loss": 2.3014, "step": 380150 }, { "epoch": 0.66, "learning_rate": 1.6852331741752318e-05, "loss": 2.3552, "step": 380160 }, { "epoch": 0.66, "learning_rate": 1.6851459801825495e-05, "loss": 2.3067, "step": 380170 }, { "epoch": 0.66, "learning_rate": 1.685058786189867e-05, "loss": 2.293, "step": 380180 }, { "epoch": 0.66, "learning_rate": 1.684971592197184e-05, "loss": 2.3342, "step": 380190 }, { "epoch": 0.66, "learning_rate": 1.6848843982045016e-05, "loss": 2.2725, "step": 380200 }, { "epoch": 0.66, "learning_rate": 1.6847972042118187e-05, "loss": 2.3857, "step": 380210 }, { "epoch": 0.66, "learning_rate": 1.684710010219136e-05, "loss": 2.301, "step": 380220 }, { "epoch": 0.66, "learning_rate": 1.684622816226453e-05, "loss": 2.261, "step": 380230 }, { "epoch": 0.66, "learning_rate": 1.6845356222337708e-05, "loss": 2.2199, "step": 380240 }, { "epoch": 0.66, "learning_rate": 1.684448428241088e-05, "loss": 2.2441, "step": 380250 }, { "epoch": 0.66, "learning_rate": 1.6843612342484052e-05, "loss": 2.2964, "step": 380260 }, { "epoch": 0.66, "learning_rate": 1.6842740402557226e-05, "loss": 2.3813, "step": 380270 }, { "epoch": 0.66, "learning_rate": 1.68418684626304e-05, "loss": 2.2666, "step": 380280 }, { "epoch": 0.66, "learning_rate": 1.6840996522703574e-05, "loss": 2.2191, "step": 380290 }, { "epoch": 0.66, "learning_rate": 1.6840124582776744e-05, "loss": 2.2023, "step": 380300 }, { "epoch": 0.66, "learning_rate": 1.683925264284992e-05, "loss": 2.2864, "step": 380310 }, { "epoch": 0.66, "learning_rate": 1.683838070292309e-05, "loss": 2.1695, "step": 380320 }, { "epoch": 0.66, "learning_rate": 1.6837508762996265e-05, "loss": 2.2855, "step": 380330 }, { "epoch": 0.66, "learning_rate": 1.683663682306944e-05, "loss": 2.2957, "step": 380340 }, { "epoch": 0.66, "learning_rate": 1.6835764883142613e-05, "loss": 2.2979, "step": 380350 }, { "epoch": 0.66, "learning_rate": 1.6834892943215787e-05, "loss": 2.1446, "step": 380360 }, { "epoch": 0.66, "learning_rate": 1.6834021003288957e-05, "loss": 2.3181, "step": 380370 }, { "epoch": 0.66, "learning_rate": 1.683314906336213e-05, "loss": 2.4133, "step": 380380 }, { "epoch": 0.66, "learning_rate": 1.6832277123435305e-05, "loss": 2.3067, "step": 380390 }, { "epoch": 0.66, "learning_rate": 1.6831405183508478e-05, "loss": 2.4126, "step": 380400 }, { "epoch": 0.66, "learning_rate": 1.6830533243581652e-05, "loss": 2.3352, "step": 380410 }, { "epoch": 0.66, "learning_rate": 1.6829661303654822e-05, "loss": 2.3426, "step": 380420 }, { "epoch": 0.66, "learning_rate": 1.6828789363728e-05, "loss": 2.3011, "step": 380430 }, { "epoch": 0.66, "learning_rate": 1.682791742380117e-05, "loss": 2.3111, "step": 380440 }, { "epoch": 0.66, "learning_rate": 1.6827045483874344e-05, "loss": 2.3269, "step": 380450 }, { "epoch": 0.66, "learning_rate": 1.6826173543947518e-05, "loss": 2.3305, "step": 380460 }, { "epoch": 0.66, "learning_rate": 1.682530160402069e-05, "loss": 2.26, "step": 380470 }, { "epoch": 0.66, "learning_rate": 1.682442966409386e-05, "loss": 2.3864, "step": 380480 }, { "epoch": 0.66, "learning_rate": 1.6823557724167035e-05, "loss": 2.4437, "step": 380490 }, { "epoch": 0.66, "learning_rate": 1.682268578424021e-05, "loss": 2.3511, "step": 380500 }, { "epoch": 0.66, "learning_rate": 1.6821813844313383e-05, "loss": 2.2302, "step": 380510 }, { "epoch": 0.66, "learning_rate": 1.6820941904386557e-05, "loss": 2.2709, "step": 380520 }, { "epoch": 0.66, "learning_rate": 1.6820069964459727e-05, "loss": 2.335, "step": 380530 }, { "epoch": 0.66, "learning_rate": 1.6819198024532904e-05, "loss": 2.3432, "step": 380540 }, { "epoch": 0.66, "learning_rate": 1.6818326084606075e-05, "loss": 2.3193, "step": 380550 }, { "epoch": 0.66, "learning_rate": 1.681745414467925e-05, "loss": 2.2562, "step": 380560 }, { "epoch": 0.66, "learning_rate": 1.6816582204752422e-05, "loss": 2.3672, "step": 380570 }, { "epoch": 0.66, "learning_rate": 1.6815710264825596e-05, "loss": 2.3591, "step": 380580 }, { "epoch": 0.66, "learning_rate": 1.681483832489877e-05, "loss": 2.3295, "step": 380590 }, { "epoch": 0.66, "learning_rate": 1.681396638497194e-05, "loss": 2.3628, "step": 380600 }, { "epoch": 0.66, "learning_rate": 1.6813094445045117e-05, "loss": 2.2017, "step": 380610 }, { "epoch": 0.66, "learning_rate": 1.6812222505118288e-05, "loss": 2.3686, "step": 380620 }, { "epoch": 0.66, "learning_rate": 1.681135056519146e-05, "loss": 2.5002, "step": 380630 }, { "epoch": 0.66, "learning_rate": 1.6810478625264632e-05, "loss": 2.3416, "step": 380640 }, { "epoch": 0.66, "learning_rate": 1.680960668533781e-05, "loss": 2.4275, "step": 380650 }, { "epoch": 0.66, "learning_rate": 1.6808734745410983e-05, "loss": 2.4328, "step": 380660 }, { "epoch": 0.66, "learning_rate": 1.6807862805484153e-05, "loss": 2.2948, "step": 380670 }, { "epoch": 0.66, "learning_rate": 1.6806990865557327e-05, "loss": 2.0997, "step": 380680 }, { "epoch": 0.66, "learning_rate": 1.68061189256305e-05, "loss": 2.2759, "step": 380690 }, { "epoch": 0.66, "learning_rate": 1.6805246985703674e-05, "loss": 2.3087, "step": 380700 }, { "epoch": 0.66, "learning_rate": 1.6804375045776845e-05, "loss": 2.2831, "step": 380710 }, { "epoch": 0.66, "learning_rate": 1.6803503105850022e-05, "loss": 2.3341, "step": 380720 }, { "epoch": 0.66, "learning_rate": 1.6802631165923192e-05, "loss": 2.3705, "step": 380730 }, { "epoch": 0.66, "learning_rate": 1.6801759225996366e-05, "loss": 2.3316, "step": 380740 }, { "epoch": 0.66, "learning_rate": 1.680088728606954e-05, "loss": 2.2298, "step": 380750 }, { "epoch": 0.66, "learning_rate": 1.6800015346142714e-05, "loss": 2.3516, "step": 380760 }, { "epoch": 0.66, "learning_rate": 1.6799143406215887e-05, "loss": 2.2961, "step": 380770 }, { "epoch": 0.66, "learning_rate": 1.6798271466289058e-05, "loss": 2.3607, "step": 380780 }, { "epoch": 0.66, "learning_rate": 1.679739952636223e-05, "loss": 2.3258, "step": 380790 }, { "epoch": 0.66, "learning_rate": 1.6796527586435405e-05, "loss": 2.3854, "step": 380800 }, { "epoch": 0.66, "learning_rate": 1.679565564650858e-05, "loss": 2.3771, "step": 380810 }, { "epoch": 0.66, "learning_rate": 1.6794783706581753e-05, "loss": 2.3544, "step": 380820 }, { "epoch": 0.66, "learning_rate": 1.6793911766654927e-05, "loss": 2.2574, "step": 380830 }, { "epoch": 0.66, "learning_rate": 1.67930398267281e-05, "loss": 2.3378, "step": 380840 }, { "epoch": 0.66, "learning_rate": 1.679216788680127e-05, "loss": 2.3562, "step": 380850 }, { "epoch": 0.66, "learning_rate": 1.6791295946874445e-05, "loss": 2.2562, "step": 380860 }, { "epoch": 0.66, "learning_rate": 1.679042400694762e-05, "loss": 2.3436, "step": 380870 }, { "epoch": 0.66, "learning_rate": 1.6789552067020792e-05, "loss": 2.3967, "step": 380880 }, { "epoch": 0.66, "learning_rate": 1.6788680127093963e-05, "loss": 2.3783, "step": 380890 }, { "epoch": 0.66, "learning_rate": 1.6787808187167136e-05, "loss": 2.3623, "step": 380900 }, { "epoch": 0.66, "learning_rate": 1.6786936247240313e-05, "loss": 2.3202, "step": 380910 }, { "epoch": 0.66, "learning_rate": 1.6786064307313484e-05, "loss": 2.324, "step": 380920 }, { "epoch": 0.66, "learning_rate": 1.6785192367386658e-05, "loss": 2.3425, "step": 380930 }, { "epoch": 0.66, "learning_rate": 1.6784320427459828e-05, "loss": 2.2164, "step": 380940 }, { "epoch": 0.66, "learning_rate": 1.6783448487533005e-05, "loss": 2.231, "step": 380950 }, { "epoch": 0.66, "learning_rate": 1.6782576547606176e-05, "loss": 2.1572, "step": 380960 }, { "epoch": 0.66, "learning_rate": 1.678170460767935e-05, "loss": 2.2973, "step": 380970 }, { "epoch": 0.66, "learning_rate": 1.6780832667752523e-05, "loss": 2.4303, "step": 380980 }, { "epoch": 0.66, "learning_rate": 1.6779960727825697e-05, "loss": 2.3217, "step": 380990 }, { "epoch": 0.66, "learning_rate": 1.677908878789887e-05, "loss": 2.3767, "step": 381000 }, { "epoch": 0.66, "learning_rate": 1.677821684797204e-05, "loss": 2.3417, "step": 381010 }, { "epoch": 0.66, "learning_rate": 1.6777344908045218e-05, "loss": 2.3221, "step": 381020 }, { "epoch": 0.66, "learning_rate": 1.677647296811839e-05, "loss": 2.3262, "step": 381030 }, { "epoch": 0.66, "learning_rate": 1.6775601028191562e-05, "loss": 2.3885, "step": 381040 }, { "epoch": 0.66, "learning_rate": 1.6774729088264736e-05, "loss": 2.3872, "step": 381050 }, { "epoch": 0.66, "learning_rate": 1.677385714833791e-05, "loss": 2.3479, "step": 381060 }, { "epoch": 0.66, "learning_rate": 1.6772985208411084e-05, "loss": 2.3253, "step": 381070 }, { "epoch": 0.66, "learning_rate": 1.6772113268484254e-05, "loss": 2.4009, "step": 381080 }, { "epoch": 0.66, "learning_rate": 1.6771241328557428e-05, "loss": 2.2152, "step": 381090 }, { "epoch": 0.66, "learning_rate": 1.67703693886306e-05, "loss": 2.3132, "step": 381100 }, { "epoch": 0.66, "learning_rate": 1.6769497448703775e-05, "loss": 2.3162, "step": 381110 }, { "epoch": 0.66, "learning_rate": 1.6768625508776946e-05, "loss": 2.2663, "step": 381120 }, { "epoch": 0.66, "learning_rate": 1.6767753568850123e-05, "loss": 2.3349, "step": 381130 }, { "epoch": 0.66, "learning_rate": 1.6766881628923297e-05, "loss": 2.2674, "step": 381140 }, { "epoch": 0.66, "learning_rate": 1.6766009688996467e-05, "loss": 2.2741, "step": 381150 }, { "epoch": 0.66, "learning_rate": 1.676513774906964e-05, "loss": 2.3111, "step": 381160 }, { "epoch": 0.66, "learning_rate": 1.6764265809142815e-05, "loss": 2.3165, "step": 381170 }, { "epoch": 0.66, "learning_rate": 1.6763393869215988e-05, "loss": 2.3744, "step": 381180 }, { "epoch": 0.66, "learning_rate": 1.676252192928916e-05, "loss": 2.4097, "step": 381190 }, { "epoch": 0.66, "learning_rate": 1.6761649989362332e-05, "loss": 2.2289, "step": 381200 }, { "epoch": 0.66, "learning_rate": 1.6760778049435506e-05, "loss": 2.2472, "step": 381210 }, { "epoch": 0.66, "learning_rate": 1.675990610950868e-05, "loss": 2.3248, "step": 381220 }, { "epoch": 0.66, "learning_rate": 1.6759034169581854e-05, "loss": 2.3774, "step": 381230 }, { "epoch": 0.66, "learning_rate": 1.6758162229655028e-05, "loss": 2.3381, "step": 381240 }, { "epoch": 0.66, "learning_rate": 1.67572902897282e-05, "loss": 2.3237, "step": 381250 }, { "epoch": 0.66, "learning_rate": 1.675641834980137e-05, "loss": 2.3035, "step": 381260 }, { "epoch": 0.66, "learning_rate": 1.6755546409874545e-05, "loss": 2.3845, "step": 381270 }, { "epoch": 0.66, "learning_rate": 1.675467446994772e-05, "loss": 2.3683, "step": 381280 }, { "epoch": 0.66, "learning_rate": 1.6753802530020893e-05, "loss": 2.3038, "step": 381290 }, { "epoch": 0.66, "learning_rate": 1.6752930590094067e-05, "loss": 2.2709, "step": 381300 }, { "epoch": 0.66, "learning_rate": 1.6752058650167237e-05, "loss": 2.3742, "step": 381310 }, { "epoch": 0.66, "learning_rate": 1.6751186710240414e-05, "loss": 2.3038, "step": 381320 }, { "epoch": 0.66, "learning_rate": 1.6750314770313585e-05, "loss": 2.222, "step": 381330 }, { "epoch": 0.67, "learning_rate": 1.674944283038676e-05, "loss": 2.2368, "step": 381340 }, { "epoch": 0.67, "learning_rate": 1.674857089045993e-05, "loss": 2.3053, "step": 381350 }, { "epoch": 0.67, "learning_rate": 1.6747698950533106e-05, "loss": 2.3416, "step": 381360 }, { "epoch": 0.67, "learning_rate": 1.6746827010606276e-05, "loss": 2.2818, "step": 381370 }, { "epoch": 0.67, "learning_rate": 1.674595507067945e-05, "loss": 2.2532, "step": 381380 }, { "epoch": 0.67, "learning_rate": 1.6745083130752627e-05, "loss": 2.4118, "step": 381390 }, { "epoch": 0.67, "learning_rate": 1.6744211190825798e-05, "loss": 2.4454, "step": 381400 }, { "epoch": 0.67, "learning_rate": 1.674333925089897e-05, "loss": 2.3, "step": 381410 }, { "epoch": 0.67, "learning_rate": 1.6742467310972142e-05, "loss": 2.2294, "step": 381420 }, { "epoch": 0.67, "learning_rate": 1.674159537104532e-05, "loss": 2.2648, "step": 381430 }, { "epoch": 0.67, "learning_rate": 1.674072343111849e-05, "loss": 2.2745, "step": 381440 }, { "epoch": 0.67, "learning_rate": 1.6739851491191663e-05, "loss": 2.2487, "step": 381450 }, { "epoch": 0.67, "learning_rate": 1.6738979551264837e-05, "loss": 2.2755, "step": 381460 }, { "epoch": 0.67, "learning_rate": 1.673810761133801e-05, "loss": 2.2893, "step": 381470 }, { "epoch": 0.67, "learning_rate": 1.6737235671411184e-05, "loss": 2.1717, "step": 381480 }, { "epoch": 0.67, "learning_rate": 1.6736363731484355e-05, "loss": 2.4332, "step": 381490 }, { "epoch": 0.67, "learning_rate": 1.6735491791557532e-05, "loss": 2.2192, "step": 381500 }, { "epoch": 0.67, "learning_rate": 1.6734619851630702e-05, "loss": 2.1958, "step": 381510 }, { "epoch": 0.67, "learning_rate": 1.6733747911703876e-05, "loss": 2.3331, "step": 381520 }, { "epoch": 0.67, "learning_rate": 1.673287597177705e-05, "loss": 2.2132, "step": 381530 }, { "epoch": 0.67, "learning_rate": 1.6732004031850224e-05, "loss": 2.3302, "step": 381540 }, { "epoch": 0.67, "learning_rate": 1.6731132091923397e-05, "loss": 2.2009, "step": 381550 }, { "epoch": 0.67, "learning_rate": 1.6730260151996568e-05, "loss": 2.105, "step": 381560 }, { "epoch": 0.67, "learning_rate": 1.672938821206974e-05, "loss": 2.4053, "step": 381570 }, { "epoch": 0.67, "learning_rate": 1.6728516272142915e-05, "loss": 2.3903, "step": 381580 }, { "epoch": 0.67, "learning_rate": 1.672764433221609e-05, "loss": 2.276, "step": 381590 }, { "epoch": 0.67, "learning_rate": 1.672677239228926e-05, "loss": 2.2543, "step": 381600 }, { "epoch": 0.67, "learning_rate": 1.6725900452362433e-05, "loss": 2.3436, "step": 381610 }, { "epoch": 0.67, "learning_rate": 1.6725028512435607e-05, "loss": 2.3895, "step": 381620 }, { "epoch": 0.67, "learning_rate": 1.672415657250878e-05, "loss": 2.2618, "step": 381630 }, { "epoch": 0.67, "learning_rate": 1.6723284632581955e-05, "loss": 2.2718, "step": 381640 }, { "epoch": 0.67, "learning_rate": 1.672241269265513e-05, "loss": 2.4499, "step": 381650 }, { "epoch": 0.67, "learning_rate": 1.6721540752728302e-05, "loss": 2.4074, "step": 381660 }, { "epoch": 0.67, "learning_rate": 1.6720668812801473e-05, "loss": 2.4393, "step": 381670 }, { "epoch": 0.67, "learning_rate": 1.6719796872874646e-05, "loss": 2.3612, "step": 381680 }, { "epoch": 0.67, "learning_rate": 1.671892493294782e-05, "loss": 2.4161, "step": 381690 }, { "epoch": 0.67, "learning_rate": 1.6718052993020994e-05, "loss": 2.2755, "step": 381700 }, { "epoch": 0.67, "learning_rate": 1.6717181053094168e-05, "loss": 2.2729, "step": 381710 }, { "epoch": 0.67, "learning_rate": 1.6716309113167338e-05, "loss": 2.2601, "step": 381720 }, { "epoch": 0.67, "learning_rate": 1.6715437173240515e-05, "loss": 2.2911, "step": 381730 }, { "epoch": 0.67, "learning_rate": 1.6714565233313686e-05, "loss": 2.3988, "step": 381740 }, { "epoch": 0.67, "learning_rate": 1.671369329338686e-05, "loss": 2.2675, "step": 381750 }, { "epoch": 0.67, "learning_rate": 1.6712821353460033e-05, "loss": 2.2826, "step": 381760 }, { "epoch": 0.67, "learning_rate": 1.6711949413533207e-05, "loss": 2.3825, "step": 381770 }, { "epoch": 0.67, "learning_rate": 1.671107747360638e-05, "loss": 2.3493, "step": 381780 }, { "epoch": 0.67, "learning_rate": 1.671020553367955e-05, "loss": 2.2755, "step": 381790 }, { "epoch": 0.67, "learning_rate": 1.6709333593752728e-05, "loss": 2.3891, "step": 381800 }, { "epoch": 0.67, "learning_rate": 1.67084616538259e-05, "loss": 2.3658, "step": 381810 }, { "epoch": 0.67, "learning_rate": 1.6707589713899072e-05, "loss": 2.2783, "step": 381820 }, { "epoch": 0.67, "learning_rate": 1.6706717773972243e-05, "loss": 2.2849, "step": 381830 }, { "epoch": 0.67, "learning_rate": 1.670584583404542e-05, "loss": 2.2321, "step": 381840 }, { "epoch": 0.67, "learning_rate": 1.670497389411859e-05, "loss": 2.3126, "step": 381850 }, { "epoch": 0.67, "learning_rate": 1.6704101954191764e-05, "loss": 2.292, "step": 381860 }, { "epoch": 0.67, "learning_rate": 1.6703230014264938e-05, "loss": 2.3183, "step": 381870 }, { "epoch": 0.67, "learning_rate": 1.670235807433811e-05, "loss": 2.3744, "step": 381880 }, { "epoch": 0.67, "learning_rate": 1.6701486134411285e-05, "loss": 2.2655, "step": 381890 }, { "epoch": 0.67, "learning_rate": 1.6700614194484456e-05, "loss": 2.1732, "step": 381900 }, { "epoch": 0.67, "learning_rate": 1.6699742254557633e-05, "loss": 2.262, "step": 381910 }, { "epoch": 0.67, "learning_rate": 1.6698870314630803e-05, "loss": 2.2914, "step": 381920 }, { "epoch": 0.67, "learning_rate": 1.6697998374703977e-05, "loss": 2.4012, "step": 381930 }, { "epoch": 0.67, "learning_rate": 1.669712643477715e-05, "loss": 2.2583, "step": 381940 }, { "epoch": 0.67, "learning_rate": 1.6696254494850325e-05, "loss": 2.4114, "step": 381950 }, { "epoch": 0.67, "learning_rate": 1.6695382554923498e-05, "loss": 2.3333, "step": 381960 }, { "epoch": 0.67, "learning_rate": 1.669451061499667e-05, "loss": 2.3752, "step": 381970 }, { "epoch": 0.67, "learning_rate": 1.6693638675069842e-05, "loss": 2.3554, "step": 381980 }, { "epoch": 0.67, "learning_rate": 1.6692766735143016e-05, "loss": 2.3027, "step": 381990 }, { "epoch": 0.67, "learning_rate": 1.669189479521619e-05, "loss": 2.2993, "step": 382000 }, { "epoch": 0.67, "learning_rate": 1.6691022855289364e-05, "loss": 2.2655, "step": 382010 }, { "epoch": 0.67, "learning_rate": 1.6690150915362534e-05, "loss": 2.3321, "step": 382020 }, { "epoch": 0.67, "learning_rate": 1.668927897543571e-05, "loss": 2.4447, "step": 382030 }, { "epoch": 0.67, "learning_rate": 1.668840703550888e-05, "loss": 2.2549, "step": 382040 }, { "epoch": 0.67, "learning_rate": 1.6687535095582055e-05, "loss": 2.2789, "step": 382050 }, { "epoch": 0.67, "learning_rate": 1.668666315565523e-05, "loss": 2.241, "step": 382060 }, { "epoch": 0.67, "learning_rate": 1.6685791215728403e-05, "loss": 2.4286, "step": 382070 }, { "epoch": 0.67, "learning_rate": 1.6684919275801573e-05, "loss": 2.2884, "step": 382080 }, { "epoch": 0.67, "learning_rate": 1.6684047335874747e-05, "loss": 2.1699, "step": 382090 }, { "epoch": 0.67, "learning_rate": 1.668317539594792e-05, "loss": 2.3215, "step": 382100 }, { "epoch": 0.67, "learning_rate": 1.6682303456021095e-05, "loss": 2.3163, "step": 382110 }, { "epoch": 0.67, "learning_rate": 1.668143151609427e-05, "loss": 2.3717, "step": 382120 }, { "epoch": 0.67, "learning_rate": 1.668055957616744e-05, "loss": 2.3204, "step": 382130 }, { "epoch": 0.67, "learning_rate": 1.6679687636240616e-05, "loss": 2.3044, "step": 382140 }, { "epoch": 0.67, "learning_rate": 1.6678815696313786e-05, "loss": 2.4487, "step": 382150 }, { "epoch": 0.67, "learning_rate": 1.667794375638696e-05, "loss": 2.2324, "step": 382160 }, { "epoch": 0.67, "learning_rate": 1.6677071816460134e-05, "loss": 2.3678, "step": 382170 }, { "epoch": 0.67, "learning_rate": 1.6676199876533308e-05, "loss": 2.2596, "step": 382180 }, { "epoch": 0.67, "learning_rate": 1.667532793660648e-05, "loss": 2.4041, "step": 382190 }, { "epoch": 0.67, "learning_rate": 1.6674455996679652e-05, "loss": 2.2751, "step": 382200 }, { "epoch": 0.67, "learning_rate": 1.667358405675283e-05, "loss": 2.4896, "step": 382210 }, { "epoch": 0.67, "learning_rate": 1.6672712116826e-05, "loss": 2.3489, "step": 382220 }, { "epoch": 0.67, "learning_rate": 1.6671840176899173e-05, "loss": 2.3743, "step": 382230 }, { "epoch": 0.67, "learning_rate": 1.6670968236972344e-05, "loss": 2.3014, "step": 382240 }, { "epoch": 0.67, "learning_rate": 1.667009629704552e-05, "loss": 2.2474, "step": 382250 }, { "epoch": 0.67, "learning_rate": 1.6669224357118694e-05, "loss": 2.2287, "step": 382260 }, { "epoch": 0.67, "learning_rate": 1.6668352417191865e-05, "loss": 2.2225, "step": 382270 }, { "epoch": 0.67, "learning_rate": 1.666748047726504e-05, "loss": 2.3907, "step": 382280 }, { "epoch": 0.67, "learning_rate": 1.6666608537338212e-05, "loss": 2.2739, "step": 382290 }, { "epoch": 0.67, "learning_rate": 1.6665736597411386e-05, "loss": 2.2625, "step": 382300 }, { "epoch": 0.67, "learning_rate": 1.6664864657484557e-05, "loss": 2.3299, "step": 382310 }, { "epoch": 0.67, "learning_rate": 1.6663992717557734e-05, "loss": 2.2718, "step": 382320 }, { "epoch": 0.67, "learning_rate": 1.6663120777630904e-05, "loss": 2.3455, "step": 382330 }, { "epoch": 0.67, "learning_rate": 1.6662248837704078e-05, "loss": 2.2265, "step": 382340 }, { "epoch": 0.67, "learning_rate": 1.666137689777725e-05, "loss": 2.2434, "step": 382350 }, { "epoch": 0.67, "learning_rate": 1.6660504957850425e-05, "loss": 2.3076, "step": 382360 }, { "epoch": 0.67, "learning_rate": 1.66596330179236e-05, "loss": 2.3977, "step": 382370 }, { "epoch": 0.67, "learning_rate": 1.665876107799677e-05, "loss": 2.2089, "step": 382380 }, { "epoch": 0.67, "learning_rate": 1.6657889138069943e-05, "loss": 2.3769, "step": 382390 }, { "epoch": 0.67, "learning_rate": 1.6657017198143117e-05, "loss": 2.3012, "step": 382400 }, { "epoch": 0.67, "learning_rate": 1.665614525821629e-05, "loss": 2.2935, "step": 382410 }, { "epoch": 0.67, "learning_rate": 1.6655273318289465e-05, "loss": 2.3588, "step": 382420 }, { "epoch": 0.67, "learning_rate": 1.665440137836264e-05, "loss": 2.3297, "step": 382430 }, { "epoch": 0.67, "learning_rate": 1.6653529438435812e-05, "loss": 2.2667, "step": 382440 }, { "epoch": 0.67, "learning_rate": 1.6652657498508983e-05, "loss": 2.2719, "step": 382450 }, { "epoch": 0.67, "learning_rate": 1.6651785558582156e-05, "loss": 2.3995, "step": 382460 }, { "epoch": 0.67, "learning_rate": 1.665091361865533e-05, "loss": 2.4098, "step": 382470 }, { "epoch": 0.67, "learning_rate": 1.6650041678728504e-05, "loss": 2.3312, "step": 382480 }, { "epoch": 0.67, "learning_rate": 1.6649169738801678e-05, "loss": 2.2773, "step": 382490 }, { "epoch": 0.67, "learning_rate": 1.6648297798874848e-05, "loss": 2.244, "step": 382500 }, { "epoch": 0.67, "learning_rate": 1.6647425858948025e-05, "loss": 2.4912, "step": 382510 }, { "epoch": 0.67, "learning_rate": 1.6646553919021196e-05, "loss": 2.265, "step": 382520 }, { "epoch": 0.67, "learning_rate": 1.664568197909437e-05, "loss": 2.3089, "step": 382530 }, { "epoch": 0.67, "learning_rate": 1.664481003916754e-05, "loss": 2.3269, "step": 382540 }, { "epoch": 0.67, "learning_rate": 1.6643938099240717e-05, "loss": 2.3592, "step": 382550 }, { "epoch": 0.67, "learning_rate": 1.6643066159313887e-05, "loss": 2.3655, "step": 382560 }, { "epoch": 0.67, "learning_rate": 1.664219421938706e-05, "loss": 2.2792, "step": 382570 }, { "epoch": 0.67, "learning_rate": 1.6641322279460235e-05, "loss": 2.373, "step": 382580 }, { "epoch": 0.67, "learning_rate": 1.664045033953341e-05, "loss": 2.2498, "step": 382590 }, { "epoch": 0.67, "learning_rate": 1.6639578399606582e-05, "loss": 2.3309, "step": 382600 }, { "epoch": 0.67, "learning_rate": 1.6638706459679753e-05, "loss": 2.3463, "step": 382610 }, { "epoch": 0.67, "learning_rate": 1.663783451975293e-05, "loss": 2.3639, "step": 382620 }, { "epoch": 0.67, "learning_rate": 1.66369625798261e-05, "loss": 2.3404, "step": 382630 }, { "epoch": 0.67, "learning_rate": 1.6636090639899274e-05, "loss": 2.2475, "step": 382640 }, { "epoch": 0.67, "learning_rate": 1.6635218699972448e-05, "loss": 2.2402, "step": 382650 }, { "epoch": 0.67, "learning_rate": 1.663434676004562e-05, "loss": 2.3129, "step": 382660 }, { "epoch": 0.67, "learning_rate": 1.6633474820118795e-05, "loss": 2.2532, "step": 382670 }, { "epoch": 0.67, "learning_rate": 1.6632602880191966e-05, "loss": 2.3686, "step": 382680 }, { "epoch": 0.67, "learning_rate": 1.6631730940265143e-05, "loss": 2.4257, "step": 382690 }, { "epoch": 0.67, "learning_rate": 1.6630859000338313e-05, "loss": 2.2681, "step": 382700 }, { "epoch": 0.67, "learning_rate": 1.6629987060411487e-05, "loss": 2.1637, "step": 382710 }, { "epoch": 0.67, "learning_rate": 1.6629115120484657e-05, "loss": 2.327, "step": 382720 }, { "epoch": 0.67, "learning_rate": 1.6628243180557835e-05, "loss": 2.4227, "step": 382730 }, { "epoch": 0.67, "learning_rate": 1.662737124063101e-05, "loss": 2.1907, "step": 382740 }, { "epoch": 0.67, "learning_rate": 1.662649930070418e-05, "loss": 2.2382, "step": 382750 }, { "epoch": 0.67, "learning_rate": 1.6625627360777352e-05, "loss": 2.3263, "step": 382760 }, { "epoch": 0.67, "learning_rate": 1.6624755420850526e-05, "loss": 2.3531, "step": 382770 }, { "epoch": 0.67, "learning_rate": 1.66238834809237e-05, "loss": 2.2461, "step": 382780 }, { "epoch": 0.67, "learning_rate": 1.662301154099687e-05, "loss": 2.2548, "step": 382790 }, { "epoch": 0.67, "learning_rate": 1.6622139601070044e-05, "loss": 2.5073, "step": 382800 }, { "epoch": 0.67, "learning_rate": 1.6621267661143218e-05, "loss": 2.3713, "step": 382810 }, { "epoch": 0.67, "learning_rate": 1.6620395721216392e-05, "loss": 2.327, "step": 382820 }, { "epoch": 0.67, "learning_rate": 1.6619523781289565e-05, "loss": 2.3477, "step": 382830 }, { "epoch": 0.67, "learning_rate": 1.661865184136274e-05, "loss": 2.2649, "step": 382840 }, { "epoch": 0.67, "learning_rate": 1.6617779901435913e-05, "loss": 2.4099, "step": 382850 }, { "epoch": 0.67, "learning_rate": 1.6616907961509083e-05, "loss": 2.3712, "step": 382860 }, { "epoch": 0.67, "learning_rate": 1.6616036021582257e-05, "loss": 2.31, "step": 382870 }, { "epoch": 0.67, "learning_rate": 1.661516408165543e-05, "loss": 2.285, "step": 382880 }, { "epoch": 0.67, "learning_rate": 1.6614292141728605e-05, "loss": 2.3086, "step": 382890 }, { "epoch": 0.67, "learning_rate": 1.661342020180178e-05, "loss": 2.1909, "step": 382900 }, { "epoch": 0.67, "learning_rate": 1.661254826187495e-05, "loss": 2.3121, "step": 382910 }, { "epoch": 0.67, "learning_rate": 1.6611676321948126e-05, "loss": 2.427, "step": 382920 }, { "epoch": 0.67, "learning_rate": 1.6610804382021296e-05, "loss": 2.242, "step": 382930 }, { "epoch": 0.67, "learning_rate": 1.660993244209447e-05, "loss": 2.2848, "step": 382940 }, { "epoch": 0.67, "learning_rate": 1.660906050216764e-05, "loss": 2.3428, "step": 382950 }, { "epoch": 0.67, "learning_rate": 1.6608188562240818e-05, "loss": 2.321, "step": 382960 }, { "epoch": 0.67, "learning_rate": 1.6607316622313988e-05, "loss": 2.3361, "step": 382970 }, { "epoch": 0.67, "learning_rate": 1.6606444682387162e-05, "loss": 2.2707, "step": 382980 }, { "epoch": 0.67, "learning_rate": 1.660557274246034e-05, "loss": 2.2898, "step": 382990 }, { "epoch": 0.67, "learning_rate": 1.660470080253351e-05, "loss": 2.4615, "step": 383000 }, { "epoch": 0.67, "learning_rate": 1.6603828862606683e-05, "loss": 2.2185, "step": 383010 }, { "epoch": 0.67, "learning_rate": 1.6602956922679854e-05, "loss": 2.3627, "step": 383020 }, { "epoch": 0.67, "learning_rate": 1.660208498275303e-05, "loss": 2.3078, "step": 383030 }, { "epoch": 0.67, "learning_rate": 1.66012130428262e-05, "loss": 2.3984, "step": 383040 }, { "epoch": 0.67, "learning_rate": 1.6600341102899375e-05, "loss": 2.2819, "step": 383050 }, { "epoch": 0.67, "learning_rate": 1.659946916297255e-05, "loss": 2.2993, "step": 383060 }, { "epoch": 0.67, "learning_rate": 1.6598597223045722e-05, "loss": 2.3649, "step": 383070 }, { "epoch": 0.67, "learning_rate": 1.6597725283118896e-05, "loss": 2.304, "step": 383080 }, { "epoch": 0.67, "learning_rate": 1.6596853343192067e-05, "loss": 2.3458, "step": 383090 }, { "epoch": 0.67, "learning_rate": 1.6595981403265244e-05, "loss": 2.2676, "step": 383100 }, { "epoch": 0.67, "learning_rate": 1.6595109463338414e-05, "loss": 2.3454, "step": 383110 }, { "epoch": 0.67, "learning_rate": 1.6594237523411588e-05, "loss": 2.2956, "step": 383120 }, { "epoch": 0.67, "learning_rate": 1.659336558348476e-05, "loss": 2.3739, "step": 383130 }, { "epoch": 0.67, "learning_rate": 1.6592493643557935e-05, "loss": 2.2492, "step": 383140 }, { "epoch": 0.67, "learning_rate": 1.659162170363111e-05, "loss": 2.2938, "step": 383150 }, { "epoch": 0.67, "learning_rate": 1.659074976370428e-05, "loss": 2.2257, "step": 383160 }, { "epoch": 0.67, "learning_rate": 1.6589877823777453e-05, "loss": 2.2181, "step": 383170 }, { "epoch": 0.67, "learning_rate": 1.6589005883850627e-05, "loss": 2.272, "step": 383180 }, { "epoch": 0.67, "learning_rate": 1.65881339439238e-05, "loss": 2.2944, "step": 383190 }, { "epoch": 0.67, "learning_rate": 1.658726200399697e-05, "loss": 2.3857, "step": 383200 }, { "epoch": 0.67, "learning_rate": 1.6586390064070145e-05, "loss": 2.2274, "step": 383210 }, { "epoch": 0.67, "learning_rate": 1.6585518124143322e-05, "loss": 2.3581, "step": 383220 }, { "epoch": 0.67, "learning_rate": 1.6584646184216493e-05, "loss": 2.2171, "step": 383230 }, { "epoch": 0.67, "learning_rate": 1.6583774244289666e-05, "loss": 2.3184, "step": 383240 }, { "epoch": 0.67, "learning_rate": 1.658290230436284e-05, "loss": 2.3655, "step": 383250 }, { "epoch": 0.67, "learning_rate": 1.6582030364436014e-05, "loss": 2.3681, "step": 383260 }, { "epoch": 0.67, "learning_rate": 1.6581158424509184e-05, "loss": 2.3302, "step": 383270 }, { "epoch": 0.67, "learning_rate": 1.6580286484582358e-05, "loss": 2.2612, "step": 383280 }, { "epoch": 0.67, "learning_rate": 1.6579414544655532e-05, "loss": 2.3644, "step": 383290 }, { "epoch": 0.67, "learning_rate": 1.6578542604728706e-05, "loss": 2.2808, "step": 383300 }, { "epoch": 0.67, "learning_rate": 1.657767066480188e-05, "loss": 2.2947, "step": 383310 }, { "epoch": 0.67, "learning_rate": 1.657679872487505e-05, "loss": 2.388, "step": 383320 }, { "epoch": 0.67, "learning_rate": 1.6575926784948227e-05, "loss": 2.3094, "step": 383330 }, { "epoch": 0.67, "learning_rate": 1.6575054845021397e-05, "loss": 2.3513, "step": 383340 }, { "epoch": 0.67, "learning_rate": 1.657418290509457e-05, "loss": 2.3885, "step": 383350 }, { "epoch": 0.67, "learning_rate": 1.6573310965167745e-05, "loss": 2.4149, "step": 383360 }, { "epoch": 0.67, "learning_rate": 1.657243902524092e-05, "loss": 2.2335, "step": 383370 }, { "epoch": 0.67, "learning_rate": 1.6571567085314092e-05, "loss": 2.2693, "step": 383380 }, { "epoch": 0.67, "learning_rate": 1.6570695145387263e-05, "loss": 2.317, "step": 383390 }, { "epoch": 0.67, "learning_rate": 1.656982320546044e-05, "loss": 2.227, "step": 383400 }, { "epoch": 0.67, "learning_rate": 1.656895126553361e-05, "loss": 2.4342, "step": 383410 }, { "epoch": 0.67, "learning_rate": 1.6568079325606784e-05, "loss": 2.3441, "step": 383420 }, { "epoch": 0.67, "learning_rate": 1.6567207385679954e-05, "loss": 2.3078, "step": 383430 }, { "epoch": 0.67, "learning_rate": 1.656633544575313e-05, "loss": 2.2717, "step": 383440 }, { "epoch": 0.67, "learning_rate": 1.6565463505826302e-05, "loss": 2.2535, "step": 383450 }, { "epoch": 0.67, "learning_rate": 1.6564591565899476e-05, "loss": 2.3508, "step": 383460 }, { "epoch": 0.67, "learning_rate": 1.656371962597265e-05, "loss": 2.2249, "step": 383470 }, { "epoch": 0.67, "learning_rate": 1.6562847686045823e-05, "loss": 2.3052, "step": 383480 }, { "epoch": 0.67, "learning_rate": 1.6561975746118997e-05, "loss": 2.2736, "step": 383490 }, { "epoch": 0.67, "learning_rate": 1.6561103806192167e-05, "loss": 2.3362, "step": 383500 }, { "epoch": 0.67, "learning_rate": 1.6560231866265345e-05, "loss": 2.4029, "step": 383510 }, { "epoch": 0.67, "learning_rate": 1.6559359926338515e-05, "loss": 2.3601, "step": 383520 }, { "epoch": 0.67, "learning_rate": 1.655848798641169e-05, "loss": 2.4466, "step": 383530 }, { "epoch": 0.67, "learning_rate": 1.6557616046484862e-05, "loss": 2.2657, "step": 383540 }, { "epoch": 0.67, "learning_rate": 1.6556744106558036e-05, "loss": 2.3483, "step": 383550 }, { "epoch": 0.67, "learning_rate": 1.655587216663121e-05, "loss": 2.2738, "step": 383560 }, { "epoch": 0.67, "learning_rate": 1.655500022670438e-05, "loss": 2.2752, "step": 383570 }, { "epoch": 0.67, "learning_rate": 1.6554128286777554e-05, "loss": 2.1125, "step": 383580 }, { "epoch": 0.67, "learning_rate": 1.6553256346850728e-05, "loss": 2.2682, "step": 383590 }, { "epoch": 0.67, "learning_rate": 1.6552384406923902e-05, "loss": 2.2447, "step": 383600 }, { "epoch": 0.67, "learning_rate": 1.6551512466997075e-05, "loss": 2.2187, "step": 383610 }, { "epoch": 0.67, "learning_rate": 1.655064052707025e-05, "loss": 2.3112, "step": 383620 }, { "epoch": 0.67, "learning_rate": 1.6549768587143423e-05, "loss": 2.337, "step": 383630 }, { "epoch": 0.67, "learning_rate": 1.6548896647216593e-05, "loss": 2.3681, "step": 383640 }, { "epoch": 0.67, "learning_rate": 1.6548024707289767e-05, "loss": 2.2993, "step": 383650 }, { "epoch": 0.67, "learning_rate": 1.654715276736294e-05, "loss": 2.3044, "step": 383660 }, { "epoch": 0.67, "learning_rate": 1.6546280827436115e-05, "loss": 2.2956, "step": 383670 }, { "epoch": 0.67, "learning_rate": 1.6545408887509285e-05, "loss": 2.3278, "step": 383680 }, { "epoch": 0.67, "learning_rate": 1.654453694758246e-05, "loss": 2.3542, "step": 383690 }, { "epoch": 0.67, "learning_rate": 1.6543665007655633e-05, "loss": 2.3193, "step": 383700 }, { "epoch": 0.67, "learning_rate": 1.6542793067728806e-05, "loss": 2.3365, "step": 383710 }, { "epoch": 0.67, "learning_rate": 1.654192112780198e-05, "loss": 2.326, "step": 383720 }, { "epoch": 0.67, "learning_rate": 1.654104918787515e-05, "loss": 2.3246, "step": 383730 }, { "epoch": 0.67, "learning_rate": 1.6540177247948328e-05, "loss": 2.3278, "step": 383740 }, { "epoch": 0.67, "learning_rate": 1.6539305308021498e-05, "loss": 2.3247, "step": 383750 }, { "epoch": 0.67, "learning_rate": 1.6538433368094672e-05, "loss": 2.3438, "step": 383760 }, { "epoch": 0.67, "learning_rate": 1.6537561428167846e-05, "loss": 2.3283, "step": 383770 }, { "epoch": 0.67, "learning_rate": 1.653668948824102e-05, "loss": 2.2961, "step": 383780 }, { "epoch": 0.67, "learning_rate": 1.6535817548314193e-05, "loss": 2.3763, "step": 383790 }, { "epoch": 0.67, "learning_rate": 1.6534945608387364e-05, "loss": 2.329, "step": 383800 }, { "epoch": 0.67, "learning_rate": 1.653407366846054e-05, "loss": 2.2488, "step": 383810 }, { "epoch": 0.67, "learning_rate": 1.653320172853371e-05, "loss": 2.2662, "step": 383820 }, { "epoch": 0.67, "learning_rate": 1.6532329788606885e-05, "loss": 2.2902, "step": 383830 }, { "epoch": 0.67, "learning_rate": 1.653145784868006e-05, "loss": 2.2629, "step": 383840 }, { "epoch": 0.67, "learning_rate": 1.6530585908753232e-05, "loss": 2.1779, "step": 383850 }, { "epoch": 0.67, "learning_rate": 1.6529713968826406e-05, "loss": 2.2899, "step": 383860 }, { "epoch": 0.67, "learning_rate": 1.6528842028899577e-05, "loss": 2.3404, "step": 383870 }, { "epoch": 0.67, "learning_rate": 1.652797008897275e-05, "loss": 2.3683, "step": 383880 }, { "epoch": 0.67, "learning_rate": 1.6527098149045924e-05, "loss": 2.1878, "step": 383890 }, { "epoch": 0.67, "learning_rate": 1.6526226209119098e-05, "loss": 2.3709, "step": 383900 }, { "epoch": 0.67, "learning_rate": 1.6525354269192268e-05, "loss": 2.2331, "step": 383910 }, { "epoch": 0.67, "learning_rate": 1.6524482329265445e-05, "loss": 2.2887, "step": 383920 }, { "epoch": 0.67, "learning_rate": 1.6523610389338616e-05, "loss": 2.1949, "step": 383930 }, { "epoch": 0.67, "learning_rate": 1.652273844941179e-05, "loss": 2.2646, "step": 383940 }, { "epoch": 0.67, "learning_rate": 1.6521866509484963e-05, "loss": 2.3897, "step": 383950 }, { "epoch": 0.67, "learning_rate": 1.6520994569558137e-05, "loss": 2.3245, "step": 383960 }, { "epoch": 0.67, "learning_rate": 1.652012262963131e-05, "loss": 2.3813, "step": 383970 }, { "epoch": 0.67, "learning_rate": 1.651925068970448e-05, "loss": 2.2748, "step": 383980 }, { "epoch": 0.67, "learning_rate": 1.6518378749777655e-05, "loss": 2.4129, "step": 383990 }, { "epoch": 0.67, "learning_rate": 1.651750680985083e-05, "loss": 2.3229, "step": 384000 }, { "epoch": 0.67, "learning_rate": 1.6516634869924003e-05, "loss": 2.2889, "step": 384010 }, { "epoch": 0.67, "learning_rate": 1.6515762929997176e-05, "loss": 2.1643, "step": 384020 }, { "epoch": 0.67, "learning_rate": 1.651489099007035e-05, "loss": 2.3087, "step": 384030 }, { "epoch": 0.67, "learning_rate": 1.6514019050143524e-05, "loss": 2.2223, "step": 384040 }, { "epoch": 0.67, "learning_rate": 1.6513147110216694e-05, "loss": 2.3804, "step": 384050 }, { "epoch": 0.67, "learning_rate": 1.6512275170289868e-05, "loss": 2.417, "step": 384060 }, { "epoch": 0.67, "learning_rate": 1.6511403230363042e-05, "loss": 2.1915, "step": 384070 }, { "epoch": 0.67, "learning_rate": 1.6510531290436216e-05, "loss": 2.3911, "step": 384080 }, { "epoch": 0.67, "learning_rate": 1.650965935050939e-05, "loss": 2.3231, "step": 384090 }, { "epoch": 0.67, "learning_rate": 1.650878741058256e-05, "loss": 2.3895, "step": 384100 }, { "epoch": 0.67, "learning_rate": 1.6507915470655737e-05, "loss": 2.3471, "step": 384110 }, { "epoch": 0.67, "learning_rate": 1.6507043530728907e-05, "loss": 2.2365, "step": 384120 }, { "epoch": 0.67, "learning_rate": 1.650617159080208e-05, "loss": 2.2926, "step": 384130 }, { "epoch": 0.67, "learning_rate": 1.650529965087525e-05, "loss": 2.3215, "step": 384140 }, { "epoch": 0.67, "learning_rate": 1.650442771094843e-05, "loss": 2.286, "step": 384150 }, { "epoch": 0.67, "learning_rate": 1.65035557710216e-05, "loss": 2.429, "step": 384160 }, { "epoch": 0.67, "learning_rate": 1.6502683831094773e-05, "loss": 2.3624, "step": 384170 }, { "epoch": 0.67, "learning_rate": 1.6501811891167946e-05, "loss": 2.3039, "step": 384180 }, { "epoch": 0.67, "learning_rate": 1.650093995124112e-05, "loss": 2.2557, "step": 384190 }, { "epoch": 0.67, "learning_rate": 1.6500068011314294e-05, "loss": 2.4242, "step": 384200 }, { "epoch": 0.67, "learning_rate": 1.6499196071387464e-05, "loss": 2.341, "step": 384210 }, { "epoch": 0.67, "learning_rate": 1.649832413146064e-05, "loss": 2.2176, "step": 384220 }, { "epoch": 0.67, "learning_rate": 1.6497452191533812e-05, "loss": 2.3336, "step": 384230 }, { "epoch": 0.67, "learning_rate": 1.6496580251606986e-05, "loss": 2.2281, "step": 384240 }, { "epoch": 0.67, "learning_rate": 1.649570831168016e-05, "loss": 2.238, "step": 384250 }, { "epoch": 0.67, "learning_rate": 1.6494836371753333e-05, "loss": 2.2991, "step": 384260 }, { "epoch": 0.67, "learning_rate": 1.6493964431826507e-05, "loss": 2.2564, "step": 384270 }, { "epoch": 0.67, "learning_rate": 1.6493092491899677e-05, "loss": 2.332, "step": 384280 }, { "epoch": 0.67, "learning_rate": 1.6492220551972855e-05, "loss": 2.2224, "step": 384290 }, { "epoch": 0.67, "learning_rate": 1.6491348612046025e-05, "loss": 2.3799, "step": 384300 }, { "epoch": 0.67, "learning_rate": 1.64904766721192e-05, "loss": 2.313, "step": 384310 }, { "epoch": 0.67, "learning_rate": 1.6489604732192372e-05, "loss": 2.3546, "step": 384320 }, { "epoch": 0.67, "learning_rate": 1.6488732792265546e-05, "loss": 2.3152, "step": 384330 }, { "epoch": 0.67, "learning_rate": 1.648786085233872e-05, "loss": 2.3331, "step": 384340 }, { "epoch": 0.67, "learning_rate": 1.648698891241189e-05, "loss": 2.2596, "step": 384350 }, { "epoch": 0.67, "learning_rate": 1.6486116972485064e-05, "loss": 2.3657, "step": 384360 }, { "epoch": 0.67, "learning_rate": 1.6485245032558238e-05, "loss": 2.3099, "step": 384370 }, { "epoch": 0.67, "learning_rate": 1.6484373092631412e-05, "loss": 2.2383, "step": 384380 }, { "epoch": 0.67, "learning_rate": 1.6483501152704582e-05, "loss": 2.3243, "step": 384390 }, { "epoch": 0.67, "learning_rate": 1.6482629212777756e-05, "loss": 2.2838, "step": 384400 }, { "epoch": 0.67, "learning_rate": 1.648175727285093e-05, "loss": 2.3511, "step": 384410 }, { "epoch": 0.67, "learning_rate": 1.6480885332924103e-05, "loss": 2.3273, "step": 384420 }, { "epoch": 0.67, "learning_rate": 1.6480013392997277e-05, "loss": 2.2138, "step": 384430 }, { "epoch": 0.67, "learning_rate": 1.647914145307045e-05, "loss": 2.3739, "step": 384440 }, { "epoch": 0.67, "learning_rate": 1.6478269513143625e-05, "loss": 2.3068, "step": 384450 }, { "epoch": 0.67, "learning_rate": 1.6477397573216795e-05, "loss": 2.2871, "step": 384460 }, { "epoch": 0.67, "learning_rate": 1.647652563328997e-05, "loss": 2.3211, "step": 384470 }, { "epoch": 0.67, "learning_rate": 1.6475653693363143e-05, "loss": 2.3166, "step": 384480 }, { "epoch": 0.67, "learning_rate": 1.6474781753436316e-05, "loss": 2.3668, "step": 384490 }, { "epoch": 0.67, "learning_rate": 1.647390981350949e-05, "loss": 2.3507, "step": 384500 }, { "epoch": 0.67, "learning_rate": 1.647303787358266e-05, "loss": 2.3186, "step": 384510 }, { "epoch": 0.67, "learning_rate": 1.6472165933655838e-05, "loss": 2.3062, "step": 384520 }, { "epoch": 0.67, "learning_rate": 1.6471293993729008e-05, "loss": 2.3427, "step": 384530 }, { "epoch": 0.67, "learning_rate": 1.6470422053802182e-05, "loss": 2.2379, "step": 384540 }, { "epoch": 0.67, "learning_rate": 1.6469550113875352e-05, "loss": 2.2514, "step": 384550 }, { "epoch": 0.67, "learning_rate": 1.646867817394853e-05, "loss": 2.2184, "step": 384560 }, { "epoch": 0.67, "learning_rate": 1.6467806234021703e-05, "loss": 2.3732, "step": 384570 }, { "epoch": 0.67, "learning_rate": 1.6466934294094874e-05, "loss": 2.3661, "step": 384580 }, { "epoch": 0.67, "learning_rate": 1.646606235416805e-05, "loss": 2.2352, "step": 384590 }, { "epoch": 0.67, "learning_rate": 1.646519041424122e-05, "loss": 2.2022, "step": 384600 }, { "epoch": 0.67, "learning_rate": 1.6464318474314395e-05, "loss": 2.21, "step": 384610 }, { "epoch": 0.67, "learning_rate": 1.6463446534387565e-05, "loss": 2.3543, "step": 384620 }, { "epoch": 0.67, "learning_rate": 1.6462574594460742e-05, "loss": 2.3119, "step": 384630 }, { "epoch": 0.67, "learning_rate": 1.6461702654533913e-05, "loss": 2.2795, "step": 384640 }, { "epoch": 0.67, "learning_rate": 1.6460830714607087e-05, "loss": 2.2887, "step": 384650 }, { "epoch": 0.67, "learning_rate": 1.645995877468026e-05, "loss": 2.29, "step": 384660 }, { "epoch": 0.67, "learning_rate": 1.6459086834753434e-05, "loss": 2.2528, "step": 384670 }, { "epoch": 0.67, "learning_rate": 1.6458214894826608e-05, "loss": 2.2412, "step": 384680 }, { "epoch": 0.67, "learning_rate": 1.6457342954899778e-05, "loss": 2.2968, "step": 384690 }, { "epoch": 0.67, "learning_rate": 1.6456471014972955e-05, "loss": 2.2801, "step": 384700 }, { "epoch": 0.67, "learning_rate": 1.6455599075046126e-05, "loss": 2.1281, "step": 384710 }, { "epoch": 0.67, "learning_rate": 1.64547271351193e-05, "loss": 2.2011, "step": 384720 }, { "epoch": 0.67, "learning_rate": 1.6453855195192473e-05, "loss": 2.3534, "step": 384730 }, { "epoch": 0.67, "learning_rate": 1.6452983255265647e-05, "loss": 2.2849, "step": 384740 }, { "epoch": 0.67, "learning_rate": 1.645211131533882e-05, "loss": 2.2978, "step": 384750 }, { "epoch": 0.67, "learning_rate": 1.645123937541199e-05, "loss": 2.3677, "step": 384760 }, { "epoch": 0.67, "learning_rate": 1.6450367435485165e-05, "loss": 2.3098, "step": 384770 }, { "epoch": 0.67, "learning_rate": 1.644949549555834e-05, "loss": 2.3067, "step": 384780 }, { "epoch": 0.67, "learning_rate": 1.6448623555631513e-05, "loss": 2.3002, "step": 384790 }, { "epoch": 0.67, "learning_rate": 1.6447751615704683e-05, "loss": 2.3699, "step": 384800 }, { "epoch": 0.67, "learning_rate": 1.6446879675777857e-05, "loss": 2.3006, "step": 384810 }, { "epoch": 0.67, "learning_rate": 1.6446007735851034e-05, "loss": 2.2576, "step": 384820 }, { "epoch": 0.67, "learning_rate": 1.6445135795924204e-05, "loss": 2.3797, "step": 384830 }, { "epoch": 0.67, "learning_rate": 1.6444263855997378e-05, "loss": 2.2982, "step": 384840 }, { "epoch": 0.67, "learning_rate": 1.6443391916070552e-05, "loss": 2.2108, "step": 384850 }, { "epoch": 0.67, "learning_rate": 1.6442519976143726e-05, "loss": 2.3165, "step": 384860 }, { "epoch": 0.67, "learning_rate": 1.6441648036216896e-05, "loss": 2.2098, "step": 384870 }, { "epoch": 0.67, "learning_rate": 1.644077609629007e-05, "loss": 2.2942, "step": 384880 }, { "epoch": 0.67, "learning_rate": 1.6439904156363243e-05, "loss": 2.4215, "step": 384890 }, { "epoch": 0.67, "learning_rate": 1.6439032216436417e-05, "loss": 2.1985, "step": 384900 }, { "epoch": 0.67, "learning_rate": 1.643816027650959e-05, "loss": 2.3555, "step": 384910 }, { "epoch": 0.67, "learning_rate": 1.643728833658276e-05, "loss": 2.2582, "step": 384920 }, { "epoch": 0.67, "learning_rate": 1.643641639665594e-05, "loss": 2.2876, "step": 384930 }, { "epoch": 0.67, "learning_rate": 1.643554445672911e-05, "loss": 2.4529, "step": 384940 }, { "epoch": 0.67, "learning_rate": 1.6434672516802283e-05, "loss": 2.3395, "step": 384950 }, { "epoch": 0.67, "learning_rate": 1.6433800576875456e-05, "loss": 2.2897, "step": 384960 }, { "epoch": 0.67, "learning_rate": 1.643292863694863e-05, "loss": 2.4071, "step": 384970 }, { "epoch": 0.67, "learning_rate": 1.6432056697021804e-05, "loss": 2.3255, "step": 384980 }, { "epoch": 0.67, "learning_rate": 1.6431184757094974e-05, "loss": 2.3323, "step": 384990 }, { "epoch": 0.67, "learning_rate": 1.643031281716815e-05, "loss": 2.2351, "step": 385000 }, { "epoch": 0.67, "learning_rate": 1.6429440877241322e-05, "loss": 2.3315, "step": 385010 }, { "epoch": 0.67, "learning_rate": 1.6428568937314496e-05, "loss": 2.3603, "step": 385020 }, { "epoch": 0.67, "learning_rate": 1.6427696997387666e-05, "loss": 2.3197, "step": 385030 }, { "epoch": 0.67, "learning_rate": 1.6426825057460843e-05, "loss": 2.2585, "step": 385040 }, { "epoch": 0.67, "learning_rate": 1.6425953117534017e-05, "loss": 2.2167, "step": 385050 }, { "epoch": 0.67, "learning_rate": 1.6425081177607187e-05, "loss": 2.352, "step": 385060 }, { "epoch": 0.67, "learning_rate": 1.642420923768036e-05, "loss": 2.2672, "step": 385070 }, { "epoch": 0.67, "learning_rate": 1.6423337297753535e-05, "loss": 2.3062, "step": 385080 }, { "epoch": 0.67, "learning_rate": 1.642246535782671e-05, "loss": 2.349, "step": 385090 }, { "epoch": 0.67, "learning_rate": 1.642159341789988e-05, "loss": 2.3555, "step": 385100 }, { "epoch": 0.67, "learning_rate": 1.6420721477973056e-05, "loss": 2.2681, "step": 385110 }, { "epoch": 0.67, "learning_rate": 1.6419849538046227e-05, "loss": 2.4067, "step": 385120 }, { "epoch": 0.67, "learning_rate": 1.64189775981194e-05, "loss": 2.2577, "step": 385130 }, { "epoch": 0.67, "learning_rate": 1.6418105658192574e-05, "loss": 2.3237, "step": 385140 }, { "epoch": 0.67, "learning_rate": 1.6417233718265748e-05, "loss": 2.2397, "step": 385150 }, { "epoch": 0.67, "learning_rate": 1.6416361778338922e-05, "loss": 2.3509, "step": 385160 }, { "epoch": 0.67, "learning_rate": 1.6415489838412092e-05, "loss": 2.3446, "step": 385170 }, { "epoch": 0.67, "learning_rate": 1.6414617898485266e-05, "loss": 2.2651, "step": 385180 }, { "epoch": 0.67, "learning_rate": 1.641374595855844e-05, "loss": 2.2793, "step": 385190 }, { "epoch": 0.67, "learning_rate": 1.6412874018631613e-05, "loss": 2.403, "step": 385200 }, { "epoch": 0.67, "learning_rate": 1.6412002078704787e-05, "loss": 2.3456, "step": 385210 }, { "epoch": 0.67, "learning_rate": 1.641113013877796e-05, "loss": 2.1723, "step": 385220 }, { "epoch": 0.67, "learning_rate": 1.6410258198851135e-05, "loss": 2.249, "step": 385230 }, { "epoch": 0.67, "learning_rate": 1.6409386258924305e-05, "loss": 2.266, "step": 385240 }, { "epoch": 0.67, "learning_rate": 1.640851431899748e-05, "loss": 2.4174, "step": 385250 }, { "epoch": 0.67, "learning_rate": 1.6407642379070653e-05, "loss": 2.4106, "step": 385260 }, { "epoch": 0.67, "learning_rate": 1.6406770439143826e-05, "loss": 2.2748, "step": 385270 }, { "epoch": 0.67, "learning_rate": 1.6405898499216997e-05, "loss": 2.4139, "step": 385280 }, { "epoch": 0.67, "learning_rate": 1.640502655929017e-05, "loss": 2.3249, "step": 385290 }, { "epoch": 0.67, "learning_rate": 1.6404154619363348e-05, "loss": 2.3214, "step": 385300 }, { "epoch": 0.67, "learning_rate": 1.6403282679436518e-05, "loss": 2.4261, "step": 385310 }, { "epoch": 0.67, "learning_rate": 1.6402410739509692e-05, "loss": 2.2295, "step": 385320 }, { "epoch": 0.67, "learning_rate": 1.6401538799582862e-05, "loss": 2.2841, "step": 385330 }, { "epoch": 0.67, "learning_rate": 1.640066685965604e-05, "loss": 2.2783, "step": 385340 }, { "epoch": 0.67, "learning_rate": 1.639979491972921e-05, "loss": 2.2538, "step": 385350 }, { "epoch": 0.67, "learning_rate": 1.6398922979802384e-05, "loss": 2.3461, "step": 385360 }, { "epoch": 0.67, "learning_rate": 1.6398051039875557e-05, "loss": 2.2454, "step": 385370 }, { "epoch": 0.67, "learning_rate": 1.639717909994873e-05, "loss": 2.3445, "step": 385380 }, { "epoch": 0.67, "learning_rate": 1.6396307160021905e-05, "loss": 2.3208, "step": 385390 }, { "epoch": 0.67, "learning_rate": 1.6395435220095075e-05, "loss": 2.3916, "step": 385400 }, { "epoch": 0.67, "learning_rate": 1.6394563280168252e-05, "loss": 2.4126, "step": 385410 }, { "epoch": 0.67, "learning_rate": 1.6393691340241423e-05, "loss": 2.3623, "step": 385420 }, { "epoch": 0.67, "learning_rate": 1.6392819400314597e-05, "loss": 2.2613, "step": 385430 }, { "epoch": 0.67, "learning_rate": 1.639194746038777e-05, "loss": 2.1604, "step": 385440 }, { "epoch": 0.67, "learning_rate": 1.6391075520460944e-05, "loss": 2.3776, "step": 385450 }, { "epoch": 0.67, "learning_rate": 1.6390203580534118e-05, "loss": 2.2632, "step": 385460 }, { "epoch": 0.67, "learning_rate": 1.6389331640607288e-05, "loss": 2.3779, "step": 385470 }, { "epoch": 0.67, "learning_rate": 1.6388459700680462e-05, "loss": 2.3125, "step": 385480 }, { "epoch": 0.67, "learning_rate": 1.6387587760753636e-05, "loss": 2.261, "step": 385490 }, { "epoch": 0.67, "learning_rate": 1.638671582082681e-05, "loss": 2.3167, "step": 385500 }, { "epoch": 0.67, "learning_rate": 1.638584388089998e-05, "loss": 2.2813, "step": 385510 }, { "epoch": 0.67, "learning_rate": 1.6384971940973157e-05, "loss": 2.3636, "step": 385520 }, { "epoch": 0.67, "learning_rate": 1.6384100001046327e-05, "loss": 2.3255, "step": 385530 }, { "epoch": 0.67, "learning_rate": 1.63832280611195e-05, "loss": 2.3207, "step": 385540 }, { "epoch": 0.67, "learning_rate": 1.6382356121192675e-05, "loss": 2.3033, "step": 385550 }, { "epoch": 0.67, "learning_rate": 1.638148418126585e-05, "loss": 2.2208, "step": 385560 }, { "epoch": 0.67, "learning_rate": 1.6380612241339023e-05, "loss": 2.3159, "step": 385570 }, { "epoch": 0.67, "learning_rate": 1.6379740301412193e-05, "loss": 2.3398, "step": 385580 }, { "epoch": 0.67, "learning_rate": 1.6378868361485367e-05, "loss": 2.3172, "step": 385590 }, { "epoch": 0.67, "learning_rate": 1.637799642155854e-05, "loss": 2.3732, "step": 385600 }, { "epoch": 0.67, "learning_rate": 1.6377124481631714e-05, "loss": 2.4041, "step": 385610 }, { "epoch": 0.67, "learning_rate": 1.6376252541704888e-05, "loss": 2.2254, "step": 385620 }, { "epoch": 0.67, "learning_rate": 1.6375380601778062e-05, "loss": 2.4214, "step": 385630 }, { "epoch": 0.67, "learning_rate": 1.6374508661851236e-05, "loss": 2.2592, "step": 385640 }, { "epoch": 0.67, "learning_rate": 1.6373636721924406e-05, "loss": 2.2787, "step": 385650 }, { "epoch": 0.67, "learning_rate": 1.637276478199758e-05, "loss": 2.2956, "step": 385660 }, { "epoch": 0.67, "learning_rate": 1.6371892842070753e-05, "loss": 2.3091, "step": 385670 }, { "epoch": 0.67, "learning_rate": 1.6371020902143927e-05, "loss": 2.3977, "step": 385680 }, { "epoch": 0.67, "learning_rate": 1.63701489622171e-05, "loss": 2.3555, "step": 385690 }, { "epoch": 0.67, "learning_rate": 1.636927702229027e-05, "loss": 2.3177, "step": 385700 }, { "epoch": 0.67, "learning_rate": 1.636840508236345e-05, "loss": 2.4001, "step": 385710 }, { "epoch": 0.67, "learning_rate": 1.636753314243662e-05, "loss": 2.3269, "step": 385720 }, { "epoch": 0.67, "learning_rate": 1.6366661202509793e-05, "loss": 2.2939, "step": 385730 }, { "epoch": 0.67, "learning_rate": 1.6365789262582963e-05, "loss": 2.3137, "step": 385740 }, { "epoch": 0.67, "learning_rate": 1.636491732265614e-05, "loss": 2.3548, "step": 385750 }, { "epoch": 0.67, "learning_rate": 1.636404538272931e-05, "loss": 2.3632, "step": 385760 }, { "epoch": 0.67, "learning_rate": 1.6363173442802484e-05, "loss": 2.4345, "step": 385770 }, { "epoch": 0.67, "learning_rate": 1.636230150287566e-05, "loss": 2.2999, "step": 385780 }, { "epoch": 0.67, "learning_rate": 1.6361429562948832e-05, "loss": 2.3895, "step": 385790 }, { "epoch": 0.67, "learning_rate": 1.6360557623022006e-05, "loss": 2.3951, "step": 385800 }, { "epoch": 0.67, "learning_rate": 1.6359685683095176e-05, "loss": 2.3259, "step": 385810 }, { "epoch": 0.67, "learning_rate": 1.6358813743168353e-05, "loss": 2.2434, "step": 385820 }, { "epoch": 0.67, "learning_rate": 1.6357941803241524e-05, "loss": 2.3368, "step": 385830 }, { "epoch": 0.67, "learning_rate": 1.6357069863314697e-05, "loss": 2.2976, "step": 385840 }, { "epoch": 0.67, "learning_rate": 1.635619792338787e-05, "loss": 2.284, "step": 385850 }, { "epoch": 0.67, "learning_rate": 1.6355325983461045e-05, "loss": 2.2439, "step": 385860 }, { "epoch": 0.67, "learning_rate": 1.635445404353422e-05, "loss": 2.2904, "step": 385870 }, { "epoch": 0.67, "learning_rate": 1.635358210360739e-05, "loss": 2.2547, "step": 385880 }, { "epoch": 0.67, "learning_rate": 1.6352710163680566e-05, "loss": 2.3589, "step": 385890 }, { "epoch": 0.67, "learning_rate": 1.6351838223753737e-05, "loss": 2.3053, "step": 385900 }, { "epoch": 0.67, "learning_rate": 1.635096628382691e-05, "loss": 2.2555, "step": 385910 }, { "epoch": 0.67, "learning_rate": 1.6350094343900084e-05, "loss": 2.2956, "step": 385920 }, { "epoch": 0.67, "learning_rate": 1.6349222403973258e-05, "loss": 2.3162, "step": 385930 }, { "epoch": 0.67, "learning_rate": 1.6348350464046432e-05, "loss": 2.3408, "step": 385940 }, { "epoch": 0.67, "learning_rate": 1.6347478524119602e-05, "loss": 2.2444, "step": 385950 }, { "epoch": 0.67, "learning_rate": 1.6346606584192776e-05, "loss": 2.2127, "step": 385960 }, { "epoch": 0.67, "learning_rate": 1.634573464426595e-05, "loss": 2.2073, "step": 385970 }, { "epoch": 0.67, "learning_rate": 1.6344862704339123e-05, "loss": 2.1937, "step": 385980 }, { "epoch": 0.67, "learning_rate": 1.6343990764412294e-05, "loss": 2.3366, "step": 385990 }, { "epoch": 0.67, "learning_rate": 1.6343118824485468e-05, "loss": 2.3472, "step": 386000 }, { "epoch": 0.67, "learning_rate": 1.634224688455864e-05, "loss": 2.4187, "step": 386010 }, { "epoch": 0.67, "learning_rate": 1.6341374944631815e-05, "loss": 2.3379, "step": 386020 }, { "epoch": 0.67, "learning_rate": 1.634050300470499e-05, "loss": 2.3374, "step": 386030 }, { "epoch": 0.67, "learning_rate": 1.6339631064778163e-05, "loss": 2.2241, "step": 386040 }, { "epoch": 0.67, "learning_rate": 1.6338759124851336e-05, "loss": 2.289, "step": 386050 }, { "epoch": 0.67, "learning_rate": 1.6337887184924507e-05, "loss": 2.2513, "step": 386060 }, { "epoch": 0.67, "learning_rate": 1.633701524499768e-05, "loss": 2.3366, "step": 386070 }, { "epoch": 0.67, "learning_rate": 1.6336143305070854e-05, "loss": 2.3317, "step": 386080 }, { "epoch": 0.67, "learning_rate": 1.6335271365144028e-05, "loss": 2.2743, "step": 386090 }, { "epoch": 0.67, "learning_rate": 1.6334399425217202e-05, "loss": 2.3952, "step": 386100 }, { "epoch": 0.67, "learning_rate": 1.6333527485290372e-05, "loss": 2.3662, "step": 386110 }, { "epoch": 0.67, "learning_rate": 1.633265554536355e-05, "loss": 2.3667, "step": 386120 }, { "epoch": 0.67, "learning_rate": 1.633178360543672e-05, "loss": 2.3576, "step": 386130 }, { "epoch": 0.67, "learning_rate": 1.6330911665509894e-05, "loss": 2.2789, "step": 386140 }, { "epoch": 0.67, "learning_rate": 1.6330039725583067e-05, "loss": 2.2935, "step": 386150 }, { "epoch": 0.67, "learning_rate": 1.632916778565624e-05, "loss": 2.2922, "step": 386160 }, { "epoch": 0.67, "learning_rate": 1.6328295845729415e-05, "loss": 2.2855, "step": 386170 }, { "epoch": 0.67, "learning_rate": 1.6327423905802585e-05, "loss": 2.4108, "step": 386180 }, { "epoch": 0.67, "learning_rate": 1.6326551965875762e-05, "loss": 2.3397, "step": 386190 }, { "epoch": 0.67, "learning_rate": 1.6325680025948933e-05, "loss": 2.2701, "step": 386200 }, { "epoch": 0.67, "learning_rate": 1.6324808086022107e-05, "loss": 2.3671, "step": 386210 }, { "epoch": 0.67, "learning_rate": 1.6323936146095277e-05, "loss": 2.3247, "step": 386220 }, { "epoch": 0.67, "learning_rate": 1.6323064206168454e-05, "loss": 2.3158, "step": 386230 }, { "epoch": 0.67, "learning_rate": 1.6322192266241624e-05, "loss": 2.3157, "step": 386240 }, { "epoch": 0.67, "learning_rate": 1.6321320326314798e-05, "loss": 2.281, "step": 386250 }, { "epoch": 0.67, "learning_rate": 1.6320448386387972e-05, "loss": 2.4329, "step": 386260 }, { "epoch": 0.67, "learning_rate": 1.6319576446461146e-05, "loss": 2.3614, "step": 386270 }, { "epoch": 0.67, "learning_rate": 1.631870450653432e-05, "loss": 2.342, "step": 386280 }, { "epoch": 0.67, "learning_rate": 1.631783256660749e-05, "loss": 2.3859, "step": 386290 }, { "epoch": 0.67, "learning_rate": 1.6316960626680667e-05, "loss": 2.4238, "step": 386300 }, { "epoch": 0.67, "learning_rate": 1.6316088686753837e-05, "loss": 2.2738, "step": 386310 }, { "epoch": 0.67, "learning_rate": 1.631521674682701e-05, "loss": 2.3811, "step": 386320 }, { "epoch": 0.67, "learning_rate": 1.6314344806900185e-05, "loss": 2.2698, "step": 386330 }, { "epoch": 0.67, "learning_rate": 1.631347286697336e-05, "loss": 2.2429, "step": 386340 }, { "epoch": 0.67, "learning_rate": 1.6312600927046533e-05, "loss": 2.3438, "step": 386350 }, { "epoch": 0.67, "learning_rate": 1.6311728987119703e-05, "loss": 2.3092, "step": 386360 }, { "epoch": 0.67, "learning_rate": 1.6310857047192877e-05, "loss": 2.3755, "step": 386370 }, { "epoch": 0.67, "learning_rate": 1.630998510726605e-05, "loss": 2.3667, "step": 386380 }, { "epoch": 0.67, "learning_rate": 1.6309113167339224e-05, "loss": 2.39, "step": 386390 }, { "epoch": 0.67, "learning_rate": 1.6308241227412398e-05, "loss": 2.2362, "step": 386400 }, { "epoch": 0.67, "learning_rate": 1.630736928748557e-05, "loss": 2.3752, "step": 386410 }, { "epoch": 0.67, "learning_rate": 1.6306497347558746e-05, "loss": 2.4639, "step": 386420 }, { "epoch": 0.67, "learning_rate": 1.6305625407631916e-05, "loss": 2.3282, "step": 386430 }, { "epoch": 0.67, "learning_rate": 1.630475346770509e-05, "loss": 2.352, "step": 386440 }, { "epoch": 0.67, "learning_rate": 1.6303881527778263e-05, "loss": 2.3803, "step": 386450 }, { "epoch": 0.67, "learning_rate": 1.6303009587851437e-05, "loss": 2.2347, "step": 386460 }, { "epoch": 0.67, "learning_rate": 1.6302137647924608e-05, "loss": 2.3141, "step": 386470 }, { "epoch": 0.67, "learning_rate": 1.630126570799778e-05, "loss": 2.3596, "step": 386480 }, { "epoch": 0.67, "learning_rate": 1.6300393768070955e-05, "loss": 2.2752, "step": 386490 }, { "epoch": 0.67, "learning_rate": 1.629952182814413e-05, "loss": 2.306, "step": 386500 }, { "epoch": 0.67, "learning_rate": 1.6298649888217303e-05, "loss": 2.4311, "step": 386510 }, { "epoch": 0.67, "learning_rate": 1.6297777948290473e-05, "loss": 2.3405, "step": 386520 }, { "epoch": 0.67, "learning_rate": 1.629690600836365e-05, "loss": 2.3042, "step": 386530 }, { "epoch": 0.67, "learning_rate": 1.629603406843682e-05, "loss": 2.3447, "step": 386540 }, { "epoch": 0.67, "learning_rate": 1.6295162128509994e-05, "loss": 2.2854, "step": 386550 }, { "epoch": 0.67, "learning_rate": 1.6294290188583168e-05, "loss": 2.2284, "step": 386560 }, { "epoch": 0.67, "learning_rate": 1.6293418248656342e-05, "loss": 2.2605, "step": 386570 }, { "epoch": 0.67, "learning_rate": 1.6292546308729516e-05, "loss": 2.3753, "step": 386580 }, { "epoch": 0.67, "learning_rate": 1.6291674368802686e-05, "loss": 2.2278, "step": 386590 }, { "epoch": 0.67, "learning_rate": 1.6290802428875863e-05, "loss": 2.3057, "step": 386600 }, { "epoch": 0.67, "learning_rate": 1.6289930488949034e-05, "loss": 2.3556, "step": 386610 }, { "epoch": 0.67, "learning_rate": 1.6289058549022207e-05, "loss": 2.3263, "step": 386620 }, { "epoch": 0.67, "learning_rate": 1.6288186609095378e-05, "loss": 2.2824, "step": 386630 }, { "epoch": 0.67, "learning_rate": 1.6287314669168555e-05, "loss": 2.3695, "step": 386640 }, { "epoch": 0.67, "learning_rate": 1.628644272924173e-05, "loss": 2.1703, "step": 386650 }, { "epoch": 0.67, "learning_rate": 1.62855707893149e-05, "loss": 2.328, "step": 386660 }, { "epoch": 0.67, "learning_rate": 1.6284698849388073e-05, "loss": 2.3304, "step": 386670 }, { "epoch": 0.67, "learning_rate": 1.6283826909461247e-05, "loss": 2.1823, "step": 386680 }, { "epoch": 0.67, "learning_rate": 1.628295496953442e-05, "loss": 2.3588, "step": 386690 }, { "epoch": 0.67, "learning_rate": 1.628208302960759e-05, "loss": 2.4082, "step": 386700 }, { "epoch": 0.67, "learning_rate": 1.6281211089680768e-05, "loss": 2.3514, "step": 386710 }, { "epoch": 0.67, "learning_rate": 1.628033914975394e-05, "loss": 2.3155, "step": 386720 }, { "epoch": 0.67, "learning_rate": 1.6279467209827112e-05, "loss": 2.2995, "step": 386730 }, { "epoch": 0.67, "learning_rate": 1.6278595269900286e-05, "loss": 2.2435, "step": 386740 }, { "epoch": 0.67, "learning_rate": 1.627772332997346e-05, "loss": 2.281, "step": 386750 }, { "epoch": 0.67, "learning_rate": 1.6276851390046633e-05, "loss": 2.3669, "step": 386760 }, { "epoch": 0.67, "learning_rate": 1.6275979450119804e-05, "loss": 2.2698, "step": 386770 }, { "epoch": 0.67, "learning_rate": 1.6275107510192978e-05, "loss": 2.3557, "step": 386780 }, { "epoch": 0.67, "learning_rate": 1.627423557026615e-05, "loss": 2.3314, "step": 386790 }, { "epoch": 0.67, "learning_rate": 1.6273363630339325e-05, "loss": 2.2671, "step": 386800 }, { "epoch": 0.67, "learning_rate": 1.62724916904125e-05, "loss": 2.3079, "step": 386810 }, { "epoch": 0.67, "learning_rate": 1.6271619750485673e-05, "loss": 2.2319, "step": 386820 }, { "epoch": 0.67, "learning_rate": 1.6270747810558846e-05, "loss": 2.3525, "step": 386830 }, { "epoch": 0.67, "learning_rate": 1.6269875870632017e-05, "loss": 2.394, "step": 386840 }, { "epoch": 0.67, "learning_rate": 1.626900393070519e-05, "loss": 2.3832, "step": 386850 }, { "epoch": 0.67, "learning_rate": 1.6268131990778364e-05, "loss": 2.2328, "step": 386860 }, { "epoch": 0.67, "learning_rate": 1.6267260050851538e-05, "loss": 2.3464, "step": 386870 }, { "epoch": 0.67, "learning_rate": 1.626638811092471e-05, "loss": 2.4198, "step": 386880 }, { "epoch": 0.67, "learning_rate": 1.6265516170997882e-05, "loss": 2.273, "step": 386890 }, { "epoch": 0.67, "learning_rate": 1.626464423107106e-05, "loss": 2.2415, "step": 386900 }, { "epoch": 0.67, "learning_rate": 1.626377229114423e-05, "loss": 2.3243, "step": 386910 }, { "epoch": 0.67, "learning_rate": 1.6262900351217404e-05, "loss": 2.3539, "step": 386920 }, { "epoch": 0.67, "learning_rate": 1.6262028411290574e-05, "loss": 2.3748, "step": 386930 }, { "epoch": 0.67, "learning_rate": 1.626115647136375e-05, "loss": 2.2985, "step": 386940 }, { "epoch": 0.67, "learning_rate": 1.626028453143692e-05, "loss": 2.2816, "step": 386950 }, { "epoch": 0.67, "learning_rate": 1.6259412591510095e-05, "loss": 2.3641, "step": 386960 }, { "epoch": 0.67, "learning_rate": 1.625854065158327e-05, "loss": 2.2918, "step": 386970 }, { "epoch": 0.67, "learning_rate": 1.6257668711656443e-05, "loss": 2.3491, "step": 386980 }, { "epoch": 0.67, "learning_rate": 1.6256796771729617e-05, "loss": 2.3451, "step": 386990 }, { "epoch": 0.67, "learning_rate": 1.6255924831802787e-05, "loss": 2.3667, "step": 387000 }, { "epoch": 0.67, "learning_rate": 1.6255052891875964e-05, "loss": 2.2892, "step": 387010 }, { "epoch": 0.67, "learning_rate": 1.6254180951949135e-05, "loss": 2.2838, "step": 387020 }, { "epoch": 0.67, "learning_rate": 1.6253309012022308e-05, "loss": 2.328, "step": 387030 }, { "epoch": 0.67, "learning_rate": 1.6252437072095482e-05, "loss": 2.1384, "step": 387040 }, { "epoch": 0.67, "learning_rate": 1.6251565132168656e-05, "loss": 2.4142, "step": 387050 }, { "epoch": 0.67, "learning_rate": 1.625069319224183e-05, "loss": 2.2928, "step": 387060 }, { "epoch": 0.68, "learning_rate": 1.6249821252315e-05, "loss": 2.3024, "step": 387070 }, { "epoch": 0.68, "learning_rate": 1.6248949312388177e-05, "loss": 2.2663, "step": 387080 }, { "epoch": 0.68, "learning_rate": 1.6248077372461348e-05, "loss": 2.1834, "step": 387090 }, { "epoch": 0.68, "learning_rate": 1.624720543253452e-05, "loss": 2.3416, "step": 387100 }, { "epoch": 0.68, "learning_rate": 1.624633349260769e-05, "loss": 2.3492, "step": 387110 }, { "epoch": 0.68, "learning_rate": 1.624546155268087e-05, "loss": 2.2675, "step": 387120 }, { "epoch": 0.68, "learning_rate": 1.6244589612754043e-05, "loss": 2.2827, "step": 387130 }, { "epoch": 0.68, "learning_rate": 1.6243717672827213e-05, "loss": 2.3195, "step": 387140 }, { "epoch": 0.68, "learning_rate": 1.6242845732900387e-05, "loss": 2.4508, "step": 387150 }, { "epoch": 0.68, "learning_rate": 1.624197379297356e-05, "loss": 2.426, "step": 387160 }, { "epoch": 0.68, "learning_rate": 1.6241101853046734e-05, "loss": 2.4835, "step": 387170 }, { "epoch": 0.68, "learning_rate": 1.6240229913119905e-05, "loss": 2.3315, "step": 387180 }, { "epoch": 0.68, "learning_rate": 1.623935797319308e-05, "loss": 2.2216, "step": 387190 }, { "epoch": 0.68, "learning_rate": 1.6238486033266252e-05, "loss": 2.322, "step": 387200 }, { "epoch": 0.68, "learning_rate": 1.6237614093339426e-05, "loss": 2.2465, "step": 387210 }, { "epoch": 0.68, "learning_rate": 1.62367421534126e-05, "loss": 2.3499, "step": 387220 }, { "epoch": 0.68, "learning_rate": 1.6235870213485774e-05, "loss": 2.3219, "step": 387230 }, { "epoch": 0.68, "learning_rate": 1.6234998273558947e-05, "loss": 2.1485, "step": 387240 }, { "epoch": 0.68, "learning_rate": 1.6234126333632118e-05, "loss": 2.3783, "step": 387250 }, { "epoch": 0.68, "learning_rate": 1.623325439370529e-05, "loss": 2.2715, "step": 387260 }, { "epoch": 0.68, "learning_rate": 1.6232382453778465e-05, "loss": 2.4805, "step": 387270 }, { "epoch": 0.68, "learning_rate": 1.623151051385164e-05, "loss": 2.3308, "step": 387280 }, { "epoch": 0.68, "learning_rate": 1.6230638573924813e-05, "loss": 2.2245, "step": 387290 }, { "epoch": 0.68, "learning_rate": 1.6229766633997983e-05, "loss": 2.3253, "step": 387300 }, { "epoch": 0.68, "learning_rate": 1.622889469407116e-05, "loss": 2.3687, "step": 387310 }, { "epoch": 0.68, "learning_rate": 1.622802275414433e-05, "loss": 2.2319, "step": 387320 }, { "epoch": 0.68, "learning_rate": 1.6227150814217504e-05, "loss": 2.3558, "step": 387330 }, { "epoch": 0.68, "learning_rate": 1.6226278874290675e-05, "loss": 2.3656, "step": 387340 }, { "epoch": 0.68, "learning_rate": 1.6225406934363852e-05, "loss": 2.3759, "step": 387350 }, { "epoch": 0.68, "learning_rate": 1.6224534994437022e-05, "loss": 2.3565, "step": 387360 }, { "epoch": 0.68, "learning_rate": 1.6223663054510196e-05, "loss": 2.1966, "step": 387370 }, { "epoch": 0.68, "learning_rate": 1.6222791114583373e-05, "loss": 2.4492, "step": 387380 }, { "epoch": 0.68, "learning_rate": 1.6221919174656544e-05, "loss": 2.3403, "step": 387390 }, { "epoch": 0.68, "learning_rate": 1.6221047234729717e-05, "loss": 2.2344, "step": 387400 }, { "epoch": 0.68, "learning_rate": 1.6220175294802888e-05, "loss": 2.3281, "step": 387410 }, { "epoch": 0.68, "learning_rate": 1.6219303354876065e-05, "loss": 2.3207, "step": 387420 }, { "epoch": 0.68, "learning_rate": 1.6218431414949235e-05, "loss": 2.4075, "step": 387430 }, { "epoch": 0.68, "learning_rate": 1.621755947502241e-05, "loss": 2.3208, "step": 387440 }, { "epoch": 0.68, "learning_rate": 1.6216687535095583e-05, "loss": 2.2137, "step": 387450 }, { "epoch": 0.68, "learning_rate": 1.6215815595168757e-05, "loss": 2.1981, "step": 387460 }, { "epoch": 0.68, "learning_rate": 1.621494365524193e-05, "loss": 2.2527, "step": 387470 }, { "epoch": 0.68, "learning_rate": 1.62140717153151e-05, "loss": 2.3457, "step": 387480 }, { "epoch": 0.68, "learning_rate": 1.6213199775388278e-05, "loss": 2.2895, "step": 387490 }, { "epoch": 0.68, "learning_rate": 1.621232783546145e-05, "loss": 2.3069, "step": 387500 }, { "epoch": 0.68, "learning_rate": 1.6211455895534622e-05, "loss": 2.4264, "step": 387510 }, { "epoch": 0.68, "learning_rate": 1.6210583955607796e-05, "loss": 2.2451, "step": 387520 }, { "epoch": 0.68, "learning_rate": 1.620971201568097e-05, "loss": 2.2731, "step": 387530 }, { "epoch": 0.68, "learning_rate": 1.6208840075754143e-05, "loss": 2.2984, "step": 387540 }, { "epoch": 0.68, "learning_rate": 1.6207968135827314e-05, "loss": 2.3826, "step": 387550 }, { "epoch": 0.68, "learning_rate": 1.6207096195900488e-05, "loss": 2.1888, "step": 387560 }, { "epoch": 0.68, "learning_rate": 1.620622425597366e-05, "loss": 2.3541, "step": 387570 }, { "epoch": 0.68, "learning_rate": 1.6205352316046835e-05, "loss": 2.2529, "step": 387580 }, { "epoch": 0.68, "learning_rate": 1.6204480376120006e-05, "loss": 2.3685, "step": 387590 }, { "epoch": 0.68, "learning_rate": 1.620360843619318e-05, "loss": 2.2792, "step": 387600 }, { "epoch": 0.68, "learning_rate": 1.6202736496266353e-05, "loss": 2.322, "step": 387610 }, { "epoch": 0.68, "learning_rate": 1.6201864556339527e-05, "loss": 2.2865, "step": 387620 }, { "epoch": 0.68, "learning_rate": 1.62009926164127e-05, "loss": 2.3068, "step": 387630 }, { "epoch": 0.68, "learning_rate": 1.6200120676485874e-05, "loss": 2.3107, "step": 387640 }, { "epoch": 0.68, "learning_rate": 1.6199248736559048e-05, "loss": 2.2491, "step": 387650 }, { "epoch": 0.68, "learning_rate": 1.619837679663222e-05, "loss": 2.3052, "step": 387660 }, { "epoch": 0.68, "learning_rate": 1.6197504856705392e-05, "loss": 2.1886, "step": 387670 }, { "epoch": 0.68, "learning_rate": 1.6196632916778566e-05, "loss": 2.3736, "step": 387680 }, { "epoch": 0.68, "learning_rate": 1.619576097685174e-05, "loss": 2.2945, "step": 387690 }, { "epoch": 0.68, "learning_rate": 1.6194889036924914e-05, "loss": 2.29, "step": 387700 }, { "epoch": 0.68, "learning_rate": 1.6194017096998084e-05, "loss": 2.2418, "step": 387710 }, { "epoch": 0.68, "learning_rate": 1.619314515707126e-05, "loss": 2.2644, "step": 387720 }, { "epoch": 0.68, "learning_rate": 1.619227321714443e-05, "loss": 2.2217, "step": 387730 }, { "epoch": 0.68, "learning_rate": 1.6191401277217605e-05, "loss": 2.439, "step": 387740 }, { "epoch": 0.68, "learning_rate": 1.619052933729078e-05, "loss": 2.2994, "step": 387750 }, { "epoch": 0.68, "learning_rate": 1.6189657397363953e-05, "loss": 2.3447, "step": 387760 }, { "epoch": 0.68, "learning_rate": 1.6188785457437127e-05, "loss": 2.3121, "step": 387770 }, { "epoch": 0.68, "learning_rate": 1.6187913517510297e-05, "loss": 2.3786, "step": 387780 }, { "epoch": 0.68, "learning_rate": 1.6187041577583474e-05, "loss": 2.3283, "step": 387790 }, { "epoch": 0.68, "learning_rate": 1.6186169637656645e-05, "loss": 2.234, "step": 387800 }, { "epoch": 0.68, "learning_rate": 1.6185297697729818e-05, "loss": 2.273, "step": 387810 }, { "epoch": 0.68, "learning_rate": 1.618442575780299e-05, "loss": 2.3731, "step": 387820 }, { "epoch": 0.68, "learning_rate": 1.6183553817876166e-05, "loss": 2.2657, "step": 387830 }, { "epoch": 0.68, "learning_rate": 1.6182681877949336e-05, "loss": 2.301, "step": 387840 }, { "epoch": 0.68, "learning_rate": 1.618180993802251e-05, "loss": 2.3414, "step": 387850 }, { "epoch": 0.68, "learning_rate": 1.6180937998095684e-05, "loss": 2.3473, "step": 387860 }, { "epoch": 0.68, "learning_rate": 1.6180066058168858e-05, "loss": 2.2701, "step": 387870 }, { "epoch": 0.68, "learning_rate": 1.617919411824203e-05, "loss": 2.2662, "step": 387880 }, { "epoch": 0.68, "learning_rate": 1.61783221783152e-05, "loss": 2.2227, "step": 387890 }, { "epoch": 0.68, "learning_rate": 1.617745023838838e-05, "loss": 2.3756, "step": 387900 }, { "epoch": 0.68, "learning_rate": 1.617657829846155e-05, "loss": 2.2146, "step": 387910 }, { "epoch": 0.68, "learning_rate": 1.6175706358534723e-05, "loss": 2.1405, "step": 387920 }, { "epoch": 0.68, "learning_rate": 1.6174834418607897e-05, "loss": 2.2591, "step": 387930 }, { "epoch": 0.68, "learning_rate": 1.617396247868107e-05, "loss": 2.3837, "step": 387940 }, { "epoch": 0.68, "learning_rate": 1.6173090538754244e-05, "loss": 2.3438, "step": 387950 }, { "epoch": 0.68, "learning_rate": 1.6172218598827415e-05, "loss": 2.1956, "step": 387960 }, { "epoch": 0.68, "learning_rate": 1.617134665890059e-05, "loss": 2.3103, "step": 387970 }, { "epoch": 0.68, "learning_rate": 1.6170474718973762e-05, "loss": 2.2559, "step": 387980 }, { "epoch": 0.68, "learning_rate": 1.6169602779046936e-05, "loss": 2.318, "step": 387990 }, { "epoch": 0.68, "learning_rate": 1.616873083912011e-05, "loss": 2.2611, "step": 388000 }, { "epoch": 0.68, "learning_rate": 1.6167858899193284e-05, "loss": 2.3522, "step": 388010 }, { "epoch": 0.68, "learning_rate": 1.6166986959266457e-05, "loss": 2.3061, "step": 388020 }, { "epoch": 0.68, "learning_rate": 1.6166115019339628e-05, "loss": 2.301, "step": 388030 }, { "epoch": 0.68, "learning_rate": 1.61652430794128e-05, "loss": 2.3692, "step": 388040 }, { "epoch": 0.68, "learning_rate": 1.6164371139485975e-05, "loss": 2.2659, "step": 388050 }, { "epoch": 0.68, "learning_rate": 1.616349919955915e-05, "loss": 2.2612, "step": 388060 }, { "epoch": 0.68, "learning_rate": 1.616262725963232e-05, "loss": 2.3319, "step": 388070 }, { "epoch": 0.68, "learning_rate": 1.6161755319705493e-05, "loss": 2.1819, "step": 388080 }, { "epoch": 0.68, "learning_rate": 1.6160883379778667e-05, "loss": 2.3007, "step": 388090 }, { "epoch": 0.68, "learning_rate": 1.616001143985184e-05, "loss": 2.1902, "step": 388100 }, { "epoch": 0.68, "learning_rate": 1.6159139499925014e-05, "loss": 2.3051, "step": 388110 }, { "epoch": 0.68, "learning_rate": 1.6158267559998185e-05, "loss": 2.4543, "step": 388120 }, { "epoch": 0.68, "learning_rate": 1.6157395620071362e-05, "loss": 2.4128, "step": 388130 }, { "epoch": 0.68, "learning_rate": 1.6156523680144532e-05, "loss": 2.2664, "step": 388140 }, { "epoch": 0.68, "learning_rate": 1.6155651740217706e-05, "loss": 2.3513, "step": 388150 }, { "epoch": 0.68, "learning_rate": 1.615477980029088e-05, "loss": 2.3014, "step": 388160 }, { "epoch": 0.68, "learning_rate": 1.6153907860364054e-05, "loss": 2.2532, "step": 388170 }, { "epoch": 0.68, "learning_rate": 1.6153035920437227e-05, "loss": 2.237, "step": 388180 }, { "epoch": 0.68, "learning_rate": 1.6152163980510398e-05, "loss": 2.1962, "step": 388190 }, { "epoch": 0.68, "learning_rate": 1.6151292040583575e-05, "loss": 2.3498, "step": 388200 }, { "epoch": 0.68, "learning_rate": 1.6150420100656745e-05, "loss": 2.3133, "step": 388210 }, { "epoch": 0.68, "learning_rate": 1.614954816072992e-05, "loss": 2.2698, "step": 388220 }, { "epoch": 0.68, "learning_rate": 1.614867622080309e-05, "loss": 2.3502, "step": 388230 }, { "epoch": 0.68, "learning_rate": 1.6147804280876267e-05, "loss": 2.3797, "step": 388240 }, { "epoch": 0.68, "learning_rate": 1.614693234094944e-05, "loss": 2.3822, "step": 388250 }, { "epoch": 0.68, "learning_rate": 1.614606040102261e-05, "loss": 2.3534, "step": 388260 }, { "epoch": 0.68, "learning_rate": 1.6145188461095785e-05, "loss": 2.2668, "step": 388270 }, { "epoch": 0.68, "learning_rate": 1.614431652116896e-05, "loss": 2.305, "step": 388280 }, { "epoch": 0.68, "learning_rate": 1.6143444581242132e-05, "loss": 2.1329, "step": 388290 }, { "epoch": 0.68, "learning_rate": 1.6142572641315303e-05, "loss": 2.2608, "step": 388300 }, { "epoch": 0.68, "learning_rate": 1.614170070138848e-05, "loss": 2.2579, "step": 388310 }, { "epoch": 0.68, "learning_rate": 1.614082876146165e-05, "loss": 2.3078, "step": 388320 }, { "epoch": 0.68, "learning_rate": 1.6139956821534824e-05, "loss": 2.3155, "step": 388330 }, { "epoch": 0.68, "learning_rate": 1.6139084881607998e-05, "loss": 2.2566, "step": 388340 }, { "epoch": 0.68, "learning_rate": 1.613821294168117e-05, "loss": 2.3231, "step": 388350 }, { "epoch": 0.68, "learning_rate": 1.6137341001754345e-05, "loss": 2.3343, "step": 388360 }, { "epoch": 0.68, "learning_rate": 1.6136469061827516e-05, "loss": 2.2462, "step": 388370 }, { "epoch": 0.68, "learning_rate": 1.613559712190069e-05, "loss": 2.3064, "step": 388380 }, { "epoch": 0.68, "learning_rate": 1.6134725181973863e-05, "loss": 2.2149, "step": 388390 }, { "epoch": 0.68, "learning_rate": 1.6133853242047037e-05, "loss": 2.1952, "step": 388400 }, { "epoch": 0.68, "learning_rate": 1.613298130212021e-05, "loss": 2.4144, "step": 388410 }, { "epoch": 0.68, "learning_rate": 1.6132109362193384e-05, "loss": 2.2785, "step": 388420 }, { "epoch": 0.68, "learning_rate": 1.6131237422266558e-05, "loss": 2.3872, "step": 388430 }, { "epoch": 0.68, "learning_rate": 1.613036548233973e-05, "loss": 2.3137, "step": 388440 }, { "epoch": 0.68, "learning_rate": 1.6129493542412902e-05, "loss": 2.231, "step": 388450 }, { "epoch": 0.68, "learning_rate": 1.6128621602486076e-05, "loss": 2.3571, "step": 388460 }, { "epoch": 0.68, "learning_rate": 1.612774966255925e-05, "loss": 2.3547, "step": 388470 }, { "epoch": 0.68, "learning_rate": 1.6126877722632424e-05, "loss": 2.3144, "step": 388480 }, { "epoch": 0.68, "learning_rate": 1.6126005782705594e-05, "loss": 2.276, "step": 388490 }, { "epoch": 0.68, "learning_rate": 1.612513384277877e-05, "loss": 2.2616, "step": 388500 }, { "epoch": 0.68, "learning_rate": 1.612426190285194e-05, "loss": 2.2892, "step": 388510 }, { "epoch": 0.68, "learning_rate": 1.6123389962925115e-05, "loss": 2.3387, "step": 388520 }, { "epoch": 0.68, "learning_rate": 1.6122518022998286e-05, "loss": 2.328, "step": 388530 }, { "epoch": 0.68, "learning_rate": 1.6121646083071463e-05, "loss": 2.2679, "step": 388540 }, { "epoch": 0.68, "learning_rate": 1.6120774143144633e-05, "loss": 2.3201, "step": 388550 }, { "epoch": 0.68, "learning_rate": 1.6119902203217807e-05, "loss": 2.3339, "step": 388560 }, { "epoch": 0.68, "learning_rate": 1.611903026329098e-05, "loss": 2.2255, "step": 388570 }, { "epoch": 0.68, "learning_rate": 1.6118158323364155e-05, "loss": 2.2482, "step": 388580 }, { "epoch": 0.68, "learning_rate": 1.6117286383437328e-05, "loss": 2.2781, "step": 388590 }, { "epoch": 0.68, "learning_rate": 1.61164144435105e-05, "loss": 2.3049, "step": 388600 }, { "epoch": 0.68, "learning_rate": 1.6115542503583676e-05, "loss": 2.2597, "step": 388610 }, { "epoch": 0.68, "learning_rate": 1.6114670563656846e-05, "loss": 2.402, "step": 388620 }, { "epoch": 0.68, "learning_rate": 1.611379862373002e-05, "loss": 2.2346, "step": 388630 }, { "epoch": 0.68, "learning_rate": 1.6112926683803194e-05, "loss": 2.3401, "step": 388640 }, { "epoch": 0.68, "learning_rate": 1.6112054743876368e-05, "loss": 2.3761, "step": 388650 }, { "epoch": 0.68, "learning_rate": 1.611118280394954e-05, "loss": 2.3552, "step": 388660 }, { "epoch": 0.68, "learning_rate": 1.611031086402271e-05, "loss": 2.2666, "step": 388670 }, { "epoch": 0.68, "learning_rate": 1.610943892409589e-05, "loss": 2.2, "step": 388680 }, { "epoch": 0.68, "learning_rate": 1.610856698416906e-05, "loss": 2.2532, "step": 388690 }, { "epoch": 0.68, "learning_rate": 1.6107695044242233e-05, "loss": 2.3067, "step": 388700 }, { "epoch": 0.68, "learning_rate": 1.6106823104315403e-05, "loss": 2.3247, "step": 388710 }, { "epoch": 0.68, "learning_rate": 1.610595116438858e-05, "loss": 2.3331, "step": 388720 }, { "epoch": 0.68, "learning_rate": 1.6105079224461754e-05, "loss": 2.3182, "step": 388730 }, { "epoch": 0.68, "learning_rate": 1.6104207284534925e-05, "loss": 2.2404, "step": 388740 }, { "epoch": 0.68, "learning_rate": 1.61033353446081e-05, "loss": 2.2583, "step": 388750 }, { "epoch": 0.68, "learning_rate": 1.6102463404681272e-05, "loss": 2.3171, "step": 388760 }, { "epoch": 0.68, "learning_rate": 1.6101591464754446e-05, "loss": 2.2435, "step": 388770 }, { "epoch": 0.68, "learning_rate": 1.6100719524827616e-05, "loss": 2.3029, "step": 388780 }, { "epoch": 0.68, "learning_rate": 1.609984758490079e-05, "loss": 2.3802, "step": 388790 }, { "epoch": 0.68, "learning_rate": 1.6098975644973964e-05, "loss": 2.451, "step": 388800 }, { "epoch": 0.68, "learning_rate": 1.6098103705047138e-05, "loss": 2.1918, "step": 388810 }, { "epoch": 0.68, "learning_rate": 1.609723176512031e-05, "loss": 2.349, "step": 388820 }, { "epoch": 0.68, "learning_rate": 1.6096359825193485e-05, "loss": 2.3639, "step": 388830 }, { "epoch": 0.68, "learning_rate": 1.609548788526666e-05, "loss": 2.3476, "step": 388840 }, { "epoch": 0.68, "learning_rate": 1.609461594533983e-05, "loss": 2.2742, "step": 388850 }, { "epoch": 0.68, "learning_rate": 1.6093744005413003e-05, "loss": 2.3243, "step": 388860 }, { "epoch": 0.68, "learning_rate": 1.6092872065486177e-05, "loss": 2.3389, "step": 388870 }, { "epoch": 0.68, "learning_rate": 1.609200012555935e-05, "loss": 2.3322, "step": 388880 }, { "epoch": 0.68, "learning_rate": 1.6091128185632524e-05, "loss": 2.2602, "step": 388890 }, { "epoch": 0.68, "learning_rate": 1.6090256245705695e-05, "loss": 2.331, "step": 388900 }, { "epoch": 0.68, "learning_rate": 1.6089384305778872e-05, "loss": 2.2849, "step": 388910 }, { "epoch": 0.68, "learning_rate": 1.6088512365852042e-05, "loss": 2.2565, "step": 388920 }, { "epoch": 0.68, "learning_rate": 1.6087640425925216e-05, "loss": 2.3292, "step": 388930 }, { "epoch": 0.68, "learning_rate": 1.6086768485998387e-05, "loss": 2.3168, "step": 388940 }, { "epoch": 0.68, "learning_rate": 1.6085896546071564e-05, "loss": 2.3152, "step": 388950 }, { "epoch": 0.68, "learning_rate": 1.6085024606144734e-05, "loss": 2.4024, "step": 388960 }, { "epoch": 0.68, "learning_rate": 1.6084152666217908e-05, "loss": 2.3341, "step": 388970 }, { "epoch": 0.68, "learning_rate": 1.6083280726291085e-05, "loss": 2.3144, "step": 388980 }, { "epoch": 0.68, "learning_rate": 1.6082408786364255e-05, "loss": 2.3894, "step": 388990 }, { "epoch": 0.68, "learning_rate": 1.608153684643743e-05, "loss": 2.2611, "step": 389000 }, { "epoch": 0.68, "learning_rate": 1.60806649065106e-05, "loss": 2.3188, "step": 389010 }, { "epoch": 0.68, "learning_rate": 1.6079792966583777e-05, "loss": 2.3349, "step": 389020 }, { "epoch": 0.68, "learning_rate": 1.6078921026656947e-05, "loss": 2.2778, "step": 389030 }, { "epoch": 0.68, "learning_rate": 1.607804908673012e-05, "loss": 2.2993, "step": 389040 }, { "epoch": 0.68, "learning_rate": 1.6077177146803295e-05, "loss": 2.344, "step": 389050 }, { "epoch": 0.68, "learning_rate": 1.607630520687647e-05, "loss": 2.3117, "step": 389060 }, { "epoch": 0.68, "learning_rate": 1.6075433266949642e-05, "loss": 2.2752, "step": 389070 }, { "epoch": 0.68, "learning_rate": 1.6074561327022813e-05, "loss": 2.3101, "step": 389080 }, { "epoch": 0.68, "learning_rate": 1.607368938709599e-05, "loss": 2.2775, "step": 389090 }, { "epoch": 0.68, "learning_rate": 1.607281744716916e-05, "loss": 2.3851, "step": 389100 }, { "epoch": 0.68, "learning_rate": 1.6071945507242334e-05, "loss": 2.2854, "step": 389110 }, { "epoch": 0.68, "learning_rate": 1.6071073567315508e-05, "loss": 2.3641, "step": 389120 }, { "epoch": 0.68, "learning_rate": 1.607020162738868e-05, "loss": 2.2385, "step": 389130 }, { "epoch": 0.68, "learning_rate": 1.6069329687461855e-05, "loss": 2.3743, "step": 389140 }, { "epoch": 0.68, "learning_rate": 1.6068457747535026e-05, "loss": 2.2683, "step": 389150 }, { "epoch": 0.68, "learning_rate": 1.60675858076082e-05, "loss": 2.2131, "step": 389160 }, { "epoch": 0.68, "learning_rate": 1.6066713867681373e-05, "loss": 2.4416, "step": 389170 }, { "epoch": 0.68, "learning_rate": 1.6065841927754547e-05, "loss": 2.3581, "step": 389180 }, { "epoch": 0.68, "learning_rate": 1.6064969987827717e-05, "loss": 2.2665, "step": 389190 }, { "epoch": 0.68, "learning_rate": 1.606409804790089e-05, "loss": 2.2276, "step": 389200 }, { "epoch": 0.68, "learning_rate": 1.6063226107974068e-05, "loss": 2.2475, "step": 389210 }, { "epoch": 0.68, "learning_rate": 1.606235416804724e-05, "loss": 2.2552, "step": 389220 }, { "epoch": 0.68, "learning_rate": 1.6061482228120412e-05, "loss": 2.2502, "step": 389230 }, { "epoch": 0.68, "learning_rate": 1.6060610288193586e-05, "loss": 2.3266, "step": 389240 }, { "epoch": 0.68, "learning_rate": 1.605973834826676e-05, "loss": 2.3435, "step": 389250 }, { "epoch": 0.68, "learning_rate": 1.605886640833993e-05, "loss": 2.362, "step": 389260 }, { "epoch": 0.68, "learning_rate": 1.6057994468413104e-05, "loss": 2.2992, "step": 389270 }, { "epoch": 0.68, "learning_rate": 1.6057122528486278e-05, "loss": 2.2862, "step": 389280 }, { "epoch": 0.68, "learning_rate": 1.605625058855945e-05, "loss": 2.1968, "step": 389290 }, { "epoch": 0.68, "learning_rate": 1.6055378648632625e-05, "loss": 2.3302, "step": 389300 }, { "epoch": 0.68, "learning_rate": 1.6054506708705796e-05, "loss": 2.246, "step": 389310 }, { "epoch": 0.68, "learning_rate": 1.6053634768778973e-05, "loss": 2.2914, "step": 389320 }, { "epoch": 0.68, "learning_rate": 1.6052762828852143e-05, "loss": 2.3186, "step": 389330 }, { "epoch": 0.68, "learning_rate": 1.6051890888925317e-05, "loss": 2.3414, "step": 389340 }, { "epoch": 0.68, "learning_rate": 1.605101894899849e-05, "loss": 2.3009, "step": 389350 }, { "epoch": 0.68, "learning_rate": 1.6050147009071665e-05, "loss": 2.3298, "step": 389360 }, { "epoch": 0.68, "learning_rate": 1.6049275069144838e-05, "loss": 2.3557, "step": 389370 }, { "epoch": 0.68, "learning_rate": 1.604840312921801e-05, "loss": 2.2774, "step": 389380 }, { "epoch": 0.68, "learning_rate": 1.6047531189291186e-05, "loss": 2.2147, "step": 389390 }, { "epoch": 0.68, "learning_rate": 1.6046659249364356e-05, "loss": 2.37, "step": 389400 }, { "epoch": 0.68, "learning_rate": 1.604578730943753e-05, "loss": 2.4498, "step": 389410 }, { "epoch": 0.68, "learning_rate": 1.60449153695107e-05, "loss": 2.2915, "step": 389420 }, { "epoch": 0.68, "learning_rate": 1.6044043429583878e-05, "loss": 2.2791, "step": 389430 }, { "epoch": 0.68, "learning_rate": 1.6043171489657048e-05, "loss": 2.1935, "step": 389440 }, { "epoch": 0.68, "learning_rate": 1.604229954973022e-05, "loss": 2.4071, "step": 389450 }, { "epoch": 0.68, "learning_rate": 1.6041427609803395e-05, "loss": 2.2599, "step": 389460 }, { "epoch": 0.68, "learning_rate": 1.604055566987657e-05, "loss": 2.2515, "step": 389470 }, { "epoch": 0.68, "learning_rate": 1.6039683729949743e-05, "loss": 2.3087, "step": 389480 }, { "epoch": 0.68, "learning_rate": 1.6038811790022913e-05, "loss": 2.2876, "step": 389490 }, { "epoch": 0.68, "learning_rate": 1.603793985009609e-05, "loss": 2.3833, "step": 389500 }, { "epoch": 0.68, "learning_rate": 1.603706791016926e-05, "loss": 2.3058, "step": 389510 }, { "epoch": 0.68, "learning_rate": 1.6036195970242435e-05, "loss": 2.37, "step": 389520 }, { "epoch": 0.68, "learning_rate": 1.603532403031561e-05, "loss": 2.3089, "step": 389530 }, { "epoch": 0.68, "learning_rate": 1.6034452090388782e-05, "loss": 2.3132, "step": 389540 }, { "epoch": 0.68, "learning_rate": 1.6033580150461956e-05, "loss": 2.317, "step": 389550 }, { "epoch": 0.68, "learning_rate": 1.6032708210535126e-05, "loss": 2.3946, "step": 389560 }, { "epoch": 0.68, "learning_rate": 1.60318362706083e-05, "loss": 2.4033, "step": 389570 }, { "epoch": 0.68, "learning_rate": 1.6030964330681474e-05, "loss": 2.402, "step": 389580 }, { "epoch": 0.68, "learning_rate": 1.6030092390754648e-05, "loss": 2.2994, "step": 389590 }, { "epoch": 0.68, "learning_rate": 1.602922045082782e-05, "loss": 2.292, "step": 389600 }, { "epoch": 0.68, "learning_rate": 1.6028348510900995e-05, "loss": 2.4072, "step": 389610 }, { "epoch": 0.68, "learning_rate": 1.602747657097417e-05, "loss": 2.2963, "step": 389620 }, { "epoch": 0.68, "learning_rate": 1.602660463104734e-05, "loss": 2.3369, "step": 389630 }, { "epoch": 0.68, "learning_rate": 1.6025732691120513e-05, "loss": 2.3152, "step": 389640 }, { "epoch": 0.68, "learning_rate": 1.6024860751193687e-05, "loss": 2.3498, "step": 389650 }, { "epoch": 0.68, "learning_rate": 1.602398881126686e-05, "loss": 2.3316, "step": 389660 }, { "epoch": 0.68, "learning_rate": 1.602311687134003e-05, "loss": 2.2151, "step": 389670 }, { "epoch": 0.68, "learning_rate": 1.6022244931413205e-05, "loss": 2.2316, "step": 389680 }, { "epoch": 0.68, "learning_rate": 1.602137299148638e-05, "loss": 2.4338, "step": 389690 }, { "epoch": 0.68, "learning_rate": 1.6020501051559552e-05, "loss": 2.2665, "step": 389700 }, { "epoch": 0.68, "learning_rate": 1.6019629111632726e-05, "loss": 2.3353, "step": 389710 }, { "epoch": 0.68, "learning_rate": 1.6018757171705897e-05, "loss": 2.3065, "step": 389720 }, { "epoch": 0.68, "learning_rate": 1.6017885231779074e-05, "loss": 2.2952, "step": 389730 }, { "epoch": 0.68, "learning_rate": 1.6017013291852244e-05, "loss": 2.3506, "step": 389740 }, { "epoch": 0.68, "learning_rate": 1.6016141351925418e-05, "loss": 2.3162, "step": 389750 }, { "epoch": 0.68, "learning_rate": 1.601526941199859e-05, "loss": 2.3108, "step": 389760 }, { "epoch": 0.68, "learning_rate": 1.6014397472071765e-05, "loss": 2.3401, "step": 389770 }, { "epoch": 0.68, "learning_rate": 1.601352553214494e-05, "loss": 2.3904, "step": 389780 }, { "epoch": 0.68, "learning_rate": 1.601265359221811e-05, "loss": 2.3693, "step": 389790 }, { "epoch": 0.68, "learning_rate": 1.6011781652291287e-05, "loss": 2.2605, "step": 389800 }, { "epoch": 0.68, "learning_rate": 1.6010909712364457e-05, "loss": 2.3071, "step": 389810 }, { "epoch": 0.68, "learning_rate": 1.601003777243763e-05, "loss": 2.2686, "step": 389820 }, { "epoch": 0.68, "learning_rate": 1.6009165832510805e-05, "loss": 2.3455, "step": 389830 }, { "epoch": 0.68, "learning_rate": 1.600829389258398e-05, "loss": 2.3946, "step": 389840 }, { "epoch": 0.68, "learning_rate": 1.6007421952657152e-05, "loss": 2.3746, "step": 389850 }, { "epoch": 0.68, "learning_rate": 1.6006550012730323e-05, "loss": 2.2865, "step": 389860 }, { "epoch": 0.68, "learning_rate": 1.6005678072803496e-05, "loss": 2.2246, "step": 389870 }, { "epoch": 0.68, "learning_rate": 1.600480613287667e-05, "loss": 2.3543, "step": 389880 }, { "epoch": 0.68, "learning_rate": 1.6003934192949844e-05, "loss": 2.4073, "step": 389890 }, { "epoch": 0.68, "learning_rate": 1.6003062253023014e-05, "loss": 2.3762, "step": 389900 }, { "epoch": 0.68, "learning_rate": 1.600219031309619e-05, "loss": 2.24, "step": 389910 }, { "epoch": 0.68, "learning_rate": 1.6001318373169362e-05, "loss": 2.339, "step": 389920 }, { "epoch": 0.68, "learning_rate": 1.6000446433242536e-05, "loss": 2.3584, "step": 389930 }, { "epoch": 0.68, "learning_rate": 1.599957449331571e-05, "loss": 2.2874, "step": 389940 }, { "epoch": 0.68, "learning_rate": 1.5998702553388883e-05, "loss": 2.3044, "step": 389950 }, { "epoch": 0.68, "learning_rate": 1.5997830613462057e-05, "loss": 2.3621, "step": 389960 }, { "epoch": 0.68, "learning_rate": 1.5996958673535227e-05, "loss": 2.2493, "step": 389970 }, { "epoch": 0.68, "learning_rate": 1.59960867336084e-05, "loss": 2.2918, "step": 389980 }, { "epoch": 0.68, "learning_rate": 1.5995214793681575e-05, "loss": 2.2018, "step": 389990 }, { "epoch": 0.68, "learning_rate": 1.599434285375475e-05, "loss": 2.4768, "step": 390000 }, { "epoch": 0.68, "learning_rate": 1.5993470913827922e-05, "loss": 2.3249, "step": 390010 }, { "epoch": 0.68, "learning_rate": 1.5992598973901096e-05, "loss": 2.2317, "step": 390020 }, { "epoch": 0.68, "learning_rate": 1.599172703397427e-05, "loss": 2.2826, "step": 390030 }, { "epoch": 0.68, "learning_rate": 1.599085509404744e-05, "loss": 2.2686, "step": 390040 }, { "epoch": 0.68, "learning_rate": 1.5989983154120614e-05, "loss": 2.3737, "step": 390050 }, { "epoch": 0.68, "learning_rate": 1.5989111214193788e-05, "loss": 2.1848, "step": 390060 }, { "epoch": 0.68, "learning_rate": 1.598823927426696e-05, "loss": 2.3313, "step": 390070 }, { "epoch": 0.68, "learning_rate": 1.5987367334340135e-05, "loss": 2.2864, "step": 390080 }, { "epoch": 0.68, "learning_rate": 1.5986495394413306e-05, "loss": 2.3846, "step": 390090 }, { "epoch": 0.68, "learning_rate": 1.5985623454486483e-05, "loss": 2.3401, "step": 390100 }, { "epoch": 0.68, "learning_rate": 1.5984751514559653e-05, "loss": 2.3837, "step": 390110 }, { "epoch": 0.68, "learning_rate": 1.5983879574632827e-05, "loss": 2.3641, "step": 390120 }, { "epoch": 0.68, "learning_rate": 1.5983007634705997e-05, "loss": 2.2847, "step": 390130 }, { "epoch": 0.68, "learning_rate": 1.5982135694779175e-05, "loss": 2.3647, "step": 390140 }, { "epoch": 0.68, "learning_rate": 1.5981263754852345e-05, "loss": 2.3037, "step": 390150 }, { "epoch": 0.68, "learning_rate": 1.598039181492552e-05, "loss": 2.34, "step": 390160 }, { "epoch": 0.68, "learning_rate": 1.5979519874998692e-05, "loss": 2.407, "step": 390170 }, { "epoch": 0.68, "learning_rate": 1.5978647935071866e-05, "loss": 2.2737, "step": 390180 }, { "epoch": 0.68, "learning_rate": 1.597777599514504e-05, "loss": 2.3041, "step": 390190 }, { "epoch": 0.68, "learning_rate": 1.597690405521821e-05, "loss": 2.4365, "step": 390200 }, { "epoch": 0.68, "learning_rate": 1.5976032115291388e-05, "loss": 2.3545, "step": 390210 }, { "epoch": 0.68, "learning_rate": 1.5975160175364558e-05, "loss": 2.3361, "step": 390220 }, { "epoch": 0.68, "learning_rate": 1.597428823543773e-05, "loss": 2.308, "step": 390230 }, { "epoch": 0.68, "learning_rate": 1.5973416295510905e-05, "loss": 2.3629, "step": 390240 }, { "epoch": 0.68, "learning_rate": 1.597254435558408e-05, "loss": 2.2241, "step": 390250 }, { "epoch": 0.68, "learning_rate": 1.5971672415657253e-05, "loss": 2.2521, "step": 390260 }, { "epoch": 0.68, "learning_rate": 1.5970800475730423e-05, "loss": 2.2772, "step": 390270 }, { "epoch": 0.68, "learning_rate": 1.59699285358036e-05, "loss": 2.324, "step": 390280 }, { "epoch": 0.68, "learning_rate": 1.596905659587677e-05, "loss": 2.2756, "step": 390290 }, { "epoch": 0.68, "learning_rate": 1.5968184655949945e-05, "loss": 2.4016, "step": 390300 }, { "epoch": 0.68, "learning_rate": 1.5967312716023115e-05, "loss": 2.3166, "step": 390310 }, { "epoch": 0.68, "learning_rate": 1.5966440776096292e-05, "loss": 2.43, "step": 390320 }, { "epoch": 0.68, "learning_rate": 1.5965568836169466e-05, "loss": 2.3729, "step": 390330 }, { "epoch": 0.68, "learning_rate": 1.5964696896242636e-05, "loss": 2.3252, "step": 390340 }, { "epoch": 0.68, "learning_rate": 1.596382495631581e-05, "loss": 2.244, "step": 390350 }, { "epoch": 0.68, "learning_rate": 1.5962953016388984e-05, "loss": 2.3535, "step": 390360 }, { "epoch": 0.68, "learning_rate": 1.5962081076462158e-05, "loss": 2.2126, "step": 390370 }, { "epoch": 0.68, "learning_rate": 1.5961209136535328e-05, "loss": 2.2382, "step": 390380 }, { "epoch": 0.68, "learning_rate": 1.5960337196608502e-05, "loss": 2.3077, "step": 390390 }, { "epoch": 0.68, "learning_rate": 1.5959465256681676e-05, "loss": 2.2771, "step": 390400 }, { "epoch": 0.68, "learning_rate": 1.595859331675485e-05, "loss": 2.3879, "step": 390410 }, { "epoch": 0.68, "learning_rate": 1.5957721376828023e-05, "loss": 2.3372, "step": 390420 }, { "epoch": 0.68, "learning_rate": 1.5956849436901197e-05, "loss": 2.3069, "step": 390430 }, { "epoch": 0.68, "learning_rate": 1.595597749697437e-05, "loss": 2.2456, "step": 390440 }, { "epoch": 0.68, "learning_rate": 1.595510555704754e-05, "loss": 2.1769, "step": 390450 }, { "epoch": 0.68, "learning_rate": 1.5954233617120715e-05, "loss": 2.2579, "step": 390460 }, { "epoch": 0.68, "learning_rate": 1.595336167719389e-05, "loss": 2.2818, "step": 390470 }, { "epoch": 0.68, "learning_rate": 1.5952489737267062e-05, "loss": 2.3678, "step": 390480 }, { "epoch": 0.68, "learning_rate": 1.5951617797340236e-05, "loss": 2.3031, "step": 390490 }, { "epoch": 0.68, "learning_rate": 1.5950745857413407e-05, "loss": 2.3205, "step": 390500 }, { "epoch": 0.68, "learning_rate": 1.5949873917486584e-05, "loss": 2.3239, "step": 390510 }, { "epoch": 0.68, "learning_rate": 1.5949001977559754e-05, "loss": 2.4075, "step": 390520 }, { "epoch": 0.68, "learning_rate": 1.5948130037632928e-05, "loss": 2.3097, "step": 390530 }, { "epoch": 0.68, "learning_rate": 1.59472580977061e-05, "loss": 2.2551, "step": 390540 }, { "epoch": 0.68, "learning_rate": 1.5946386157779275e-05, "loss": 2.3264, "step": 390550 }, { "epoch": 0.68, "learning_rate": 1.594551421785245e-05, "loss": 2.2655, "step": 390560 }, { "epoch": 0.68, "learning_rate": 1.594464227792562e-05, "loss": 2.2184, "step": 390570 }, { "epoch": 0.68, "learning_rate": 1.5943770337998797e-05, "loss": 2.2413, "step": 390580 }, { "epoch": 0.68, "learning_rate": 1.5942898398071967e-05, "loss": 2.356, "step": 390590 }, { "epoch": 0.68, "learning_rate": 1.594202645814514e-05, "loss": 2.3301, "step": 390600 }, { "epoch": 0.68, "learning_rate": 1.594115451821831e-05, "loss": 2.2759, "step": 390610 }, { "epoch": 0.68, "learning_rate": 1.594028257829149e-05, "loss": 2.2273, "step": 390620 }, { "epoch": 0.68, "learning_rate": 1.593941063836466e-05, "loss": 2.3807, "step": 390630 }, { "epoch": 0.68, "learning_rate": 1.5938538698437833e-05, "loss": 2.3054, "step": 390640 }, { "epoch": 0.68, "learning_rate": 1.5937666758511006e-05, "loss": 2.2265, "step": 390650 }, { "epoch": 0.68, "learning_rate": 1.593679481858418e-05, "loss": 2.2518, "step": 390660 }, { "epoch": 0.68, "learning_rate": 1.5935922878657354e-05, "loss": 2.3048, "step": 390670 }, { "epoch": 0.68, "learning_rate": 1.5935050938730524e-05, "loss": 2.3092, "step": 390680 }, { "epoch": 0.68, "learning_rate": 1.59341789988037e-05, "loss": 2.4397, "step": 390690 }, { "epoch": 0.68, "learning_rate": 1.5933307058876872e-05, "loss": 2.2872, "step": 390700 }, { "epoch": 0.68, "learning_rate": 1.5932435118950046e-05, "loss": 2.3086, "step": 390710 }, { "epoch": 0.68, "learning_rate": 1.593156317902322e-05, "loss": 2.3189, "step": 390720 }, { "epoch": 0.68, "learning_rate": 1.5930691239096393e-05, "loss": 2.3358, "step": 390730 }, { "epoch": 0.68, "learning_rate": 1.5929819299169567e-05, "loss": 2.341, "step": 390740 }, { "epoch": 0.68, "learning_rate": 1.5928947359242737e-05, "loss": 2.3128, "step": 390750 }, { "epoch": 0.68, "learning_rate": 1.592807541931591e-05, "loss": 2.3712, "step": 390760 }, { "epoch": 0.68, "learning_rate": 1.5927203479389085e-05, "loss": 2.3202, "step": 390770 }, { "epoch": 0.68, "learning_rate": 1.592633153946226e-05, "loss": 2.3053, "step": 390780 }, { "epoch": 0.68, "learning_rate": 1.592545959953543e-05, "loss": 2.2493, "step": 390790 }, { "epoch": 0.68, "learning_rate": 1.5924587659608603e-05, "loss": 2.2907, "step": 390800 }, { "epoch": 0.68, "learning_rate": 1.592371571968178e-05, "loss": 2.4087, "step": 390810 }, { "epoch": 0.68, "learning_rate": 1.592284377975495e-05, "loss": 2.29, "step": 390820 }, { "epoch": 0.68, "learning_rate": 1.5921971839828124e-05, "loss": 2.3427, "step": 390830 }, { "epoch": 0.68, "learning_rate": 1.5921099899901298e-05, "loss": 2.3398, "step": 390840 }, { "epoch": 0.68, "learning_rate": 1.592022795997447e-05, "loss": 2.2975, "step": 390850 }, { "epoch": 0.68, "learning_rate": 1.5919356020047642e-05, "loss": 2.4008, "step": 390860 }, { "epoch": 0.68, "learning_rate": 1.5918484080120816e-05, "loss": 2.3011, "step": 390870 }, { "epoch": 0.68, "learning_rate": 1.591761214019399e-05, "loss": 2.2187, "step": 390880 }, { "epoch": 0.68, "learning_rate": 1.5916740200267163e-05, "loss": 2.1479, "step": 390890 }, { "epoch": 0.68, "learning_rate": 1.5915868260340337e-05, "loss": 2.4636, "step": 390900 }, { "epoch": 0.68, "learning_rate": 1.5914996320413507e-05, "loss": 2.2456, "step": 390910 }, { "epoch": 0.68, "learning_rate": 1.5914124380486685e-05, "loss": 2.3569, "step": 390920 }, { "epoch": 0.68, "learning_rate": 1.5913252440559855e-05, "loss": 2.3442, "step": 390930 }, { "epoch": 0.68, "learning_rate": 1.591238050063303e-05, "loss": 2.2646, "step": 390940 }, { "epoch": 0.68, "learning_rate": 1.5911508560706202e-05, "loss": 2.3772, "step": 390950 }, { "epoch": 0.68, "learning_rate": 1.5910636620779376e-05, "loss": 2.2648, "step": 390960 }, { "epoch": 0.68, "learning_rate": 1.590976468085255e-05, "loss": 2.2739, "step": 390970 }, { "epoch": 0.68, "learning_rate": 1.590889274092572e-05, "loss": 2.1613, "step": 390980 }, { "epoch": 0.68, "learning_rate": 1.5908020800998898e-05, "loss": 2.3222, "step": 390990 }, { "epoch": 0.68, "learning_rate": 1.5907148861072068e-05, "loss": 2.3008, "step": 391000 }, { "epoch": 0.68, "learning_rate": 1.590627692114524e-05, "loss": 2.2727, "step": 391010 }, { "epoch": 0.68, "learning_rate": 1.5905404981218412e-05, "loss": 2.3853, "step": 391020 }, { "epoch": 0.68, "learning_rate": 1.590453304129159e-05, "loss": 2.3491, "step": 391030 }, { "epoch": 0.68, "learning_rate": 1.590366110136476e-05, "loss": 2.262, "step": 391040 }, { "epoch": 0.68, "learning_rate": 1.5902789161437933e-05, "loss": 2.3055, "step": 391050 }, { "epoch": 0.68, "learning_rate": 1.5901917221511107e-05, "loss": 2.3221, "step": 391060 }, { "epoch": 0.68, "learning_rate": 1.590104528158428e-05, "loss": 2.3747, "step": 391070 }, { "epoch": 0.68, "learning_rate": 1.5900173341657455e-05, "loss": 2.37, "step": 391080 }, { "epoch": 0.68, "learning_rate": 1.5899301401730625e-05, "loss": 2.3406, "step": 391090 }, { "epoch": 0.68, "learning_rate": 1.5898429461803802e-05, "loss": 2.3394, "step": 391100 }, { "epoch": 0.68, "learning_rate": 1.5897557521876973e-05, "loss": 2.266, "step": 391110 }, { "epoch": 0.68, "learning_rate": 1.5896685581950146e-05, "loss": 2.2881, "step": 391120 }, { "epoch": 0.68, "learning_rate": 1.589581364202332e-05, "loss": 2.3114, "step": 391130 }, { "epoch": 0.68, "learning_rate": 1.5894941702096494e-05, "loss": 2.303, "step": 391140 }, { "epoch": 0.68, "learning_rate": 1.5894069762169668e-05, "loss": 2.3888, "step": 391150 }, { "epoch": 0.68, "learning_rate": 1.5893197822242838e-05, "loss": 2.3135, "step": 391160 }, { "epoch": 0.68, "learning_rate": 1.5892325882316012e-05, "loss": 2.2574, "step": 391170 }, { "epoch": 0.68, "learning_rate": 1.5891453942389186e-05, "loss": 2.302, "step": 391180 }, { "epoch": 0.68, "learning_rate": 1.589058200246236e-05, "loss": 2.3527, "step": 391190 }, { "epoch": 0.68, "learning_rate": 1.5889710062535533e-05, "loss": 2.3467, "step": 391200 }, { "epoch": 0.68, "learning_rate": 1.5888838122608707e-05, "loss": 2.3434, "step": 391210 }, { "epoch": 0.68, "learning_rate": 1.588796618268188e-05, "loss": 2.4504, "step": 391220 }, { "epoch": 0.68, "learning_rate": 1.588709424275505e-05, "loss": 2.3672, "step": 391230 }, { "epoch": 0.68, "learning_rate": 1.5886222302828225e-05, "loss": 2.4139, "step": 391240 }, { "epoch": 0.68, "learning_rate": 1.58853503629014e-05, "loss": 2.2881, "step": 391250 }, { "epoch": 0.68, "learning_rate": 1.5884478422974572e-05, "loss": 2.3084, "step": 391260 }, { "epoch": 0.68, "learning_rate": 1.5883606483047743e-05, "loss": 2.3502, "step": 391270 }, { "epoch": 0.68, "learning_rate": 1.5882734543120917e-05, "loss": 2.2187, "step": 391280 }, { "epoch": 0.68, "learning_rate": 1.5881862603194094e-05, "loss": 2.249, "step": 391290 }, { "epoch": 0.68, "learning_rate": 1.5880990663267264e-05, "loss": 2.1938, "step": 391300 }, { "epoch": 0.68, "learning_rate": 1.5880118723340438e-05, "loss": 2.2939, "step": 391310 }, { "epoch": 0.68, "learning_rate": 1.5879246783413608e-05, "loss": 2.3734, "step": 391320 }, { "epoch": 0.68, "learning_rate": 1.5878374843486785e-05, "loss": 2.3384, "step": 391330 }, { "epoch": 0.68, "learning_rate": 1.5877502903559956e-05, "loss": 2.4195, "step": 391340 }, { "epoch": 0.68, "learning_rate": 1.587663096363313e-05, "loss": 2.0815, "step": 391350 }, { "epoch": 0.68, "learning_rate": 1.5875759023706303e-05, "loss": 2.3929, "step": 391360 }, { "epoch": 0.68, "learning_rate": 1.5874887083779477e-05, "loss": 2.2279, "step": 391370 }, { "epoch": 0.68, "learning_rate": 1.587401514385265e-05, "loss": 2.3749, "step": 391380 }, { "epoch": 0.68, "learning_rate": 1.587314320392582e-05, "loss": 2.1414, "step": 391390 }, { "epoch": 0.68, "learning_rate": 1.5872271263999e-05, "loss": 2.3219, "step": 391400 }, { "epoch": 0.68, "learning_rate": 1.587139932407217e-05, "loss": 2.2351, "step": 391410 }, { "epoch": 0.68, "learning_rate": 1.5870527384145343e-05, "loss": 2.2712, "step": 391420 }, { "epoch": 0.68, "learning_rate": 1.5869655444218516e-05, "loss": 2.2513, "step": 391430 }, { "epoch": 0.68, "learning_rate": 1.586878350429169e-05, "loss": 2.3922, "step": 391440 }, { "epoch": 0.68, "learning_rate": 1.5867911564364864e-05, "loss": 2.2051, "step": 391450 }, { "epoch": 0.68, "learning_rate": 1.5867039624438034e-05, "loss": 2.3934, "step": 391460 }, { "epoch": 0.68, "learning_rate": 1.586616768451121e-05, "loss": 2.2629, "step": 391470 }, { "epoch": 0.68, "learning_rate": 1.5865295744584382e-05, "loss": 2.2959, "step": 391480 }, { "epoch": 0.68, "learning_rate": 1.5864423804657556e-05, "loss": 2.3307, "step": 391490 }, { "epoch": 0.68, "learning_rate": 1.5863551864730726e-05, "loss": 2.1836, "step": 391500 }, { "epoch": 0.68, "learning_rate": 1.5862679924803903e-05, "loss": 2.2554, "step": 391510 }, { "epoch": 0.68, "learning_rate": 1.5861807984877073e-05, "loss": 2.2118, "step": 391520 }, { "epoch": 0.68, "learning_rate": 1.5860936044950247e-05, "loss": 2.381, "step": 391530 }, { "epoch": 0.68, "learning_rate": 1.586006410502342e-05, "loss": 2.3692, "step": 391540 }, { "epoch": 0.68, "learning_rate": 1.5859192165096595e-05, "loss": 2.1428, "step": 391550 }, { "epoch": 0.68, "learning_rate": 1.585832022516977e-05, "loss": 2.4009, "step": 391560 }, { "epoch": 0.68, "learning_rate": 1.585744828524294e-05, "loss": 2.3524, "step": 391570 }, { "epoch": 0.68, "learning_rate": 1.5856576345316113e-05, "loss": 2.3244, "step": 391580 }, { "epoch": 0.68, "learning_rate": 1.5855704405389286e-05, "loss": 2.3223, "step": 391590 }, { "epoch": 0.68, "learning_rate": 1.585483246546246e-05, "loss": 2.2617, "step": 391600 }, { "epoch": 0.68, "learning_rate": 1.5853960525535634e-05, "loss": 2.275, "step": 391610 }, { "epoch": 0.68, "learning_rate": 1.5853088585608808e-05, "loss": 2.3008, "step": 391620 }, { "epoch": 0.68, "learning_rate": 1.585221664568198e-05, "loss": 2.2634, "step": 391630 }, { "epoch": 0.68, "learning_rate": 1.5851344705755152e-05, "loss": 2.2399, "step": 391640 }, { "epoch": 0.68, "learning_rate": 1.5850472765828326e-05, "loss": 2.2583, "step": 391650 }, { "epoch": 0.68, "learning_rate": 1.58496008259015e-05, "loss": 2.3183, "step": 391660 }, { "epoch": 0.68, "learning_rate": 1.5848728885974673e-05, "loss": 2.159, "step": 391670 }, { "epoch": 0.68, "learning_rate": 1.5847856946047847e-05, "loss": 2.1771, "step": 391680 }, { "epoch": 0.68, "learning_rate": 1.5846985006121017e-05, "loss": 2.3488, "step": 391690 }, { "epoch": 0.68, "learning_rate": 1.5846113066194195e-05, "loss": 2.3316, "step": 391700 }, { "epoch": 0.68, "learning_rate": 1.5845241126267365e-05, "loss": 2.3274, "step": 391710 }, { "epoch": 0.68, "learning_rate": 1.584436918634054e-05, "loss": 2.4284, "step": 391720 }, { "epoch": 0.68, "learning_rate": 1.584349724641371e-05, "loss": 2.2582, "step": 391730 }, { "epoch": 0.68, "learning_rate": 1.5842625306486886e-05, "loss": 2.3055, "step": 391740 }, { "epoch": 0.68, "learning_rate": 1.5841753366560057e-05, "loss": 2.3306, "step": 391750 }, { "epoch": 0.68, "learning_rate": 1.584088142663323e-05, "loss": 2.3548, "step": 391760 }, { "epoch": 0.68, "learning_rate": 1.5840009486706404e-05, "loss": 2.3519, "step": 391770 }, { "epoch": 0.68, "learning_rate": 1.5839137546779578e-05, "loss": 2.3234, "step": 391780 }, { "epoch": 0.68, "learning_rate": 1.5838265606852752e-05, "loss": 2.2974, "step": 391790 }, { "epoch": 0.68, "learning_rate": 1.5837393666925922e-05, "loss": 2.2581, "step": 391800 }, { "epoch": 0.68, "learning_rate": 1.58365217269991e-05, "loss": 2.2507, "step": 391810 }, { "epoch": 0.68, "learning_rate": 1.583564978707227e-05, "loss": 2.1494, "step": 391820 }, { "epoch": 0.68, "learning_rate": 1.5834777847145443e-05, "loss": 2.2824, "step": 391830 }, { "epoch": 0.68, "learning_rate": 1.5833905907218617e-05, "loss": 2.3391, "step": 391840 }, { "epoch": 0.68, "learning_rate": 1.583303396729179e-05, "loss": 2.2957, "step": 391850 }, { "epoch": 0.68, "learning_rate": 1.5832162027364965e-05, "loss": 2.3626, "step": 391860 }, { "epoch": 0.68, "learning_rate": 1.5831290087438135e-05, "loss": 2.3594, "step": 391870 }, { "epoch": 0.68, "learning_rate": 1.5830418147511312e-05, "loss": 2.3654, "step": 391880 }, { "epoch": 0.68, "learning_rate": 1.5829546207584483e-05, "loss": 2.2537, "step": 391890 }, { "epoch": 0.68, "learning_rate": 1.5828674267657656e-05, "loss": 2.2806, "step": 391900 }, { "epoch": 0.68, "learning_rate": 1.582780232773083e-05, "loss": 2.3088, "step": 391910 }, { "epoch": 0.68, "learning_rate": 1.5826930387804004e-05, "loss": 2.273, "step": 391920 }, { "epoch": 0.68, "learning_rate": 1.5826058447877178e-05, "loss": 2.2114, "step": 391930 }, { "epoch": 0.68, "learning_rate": 1.5825186507950348e-05, "loss": 2.2731, "step": 391940 }, { "epoch": 0.68, "learning_rate": 1.5824314568023522e-05, "loss": 2.3592, "step": 391950 }, { "epoch": 0.68, "learning_rate": 1.5823442628096696e-05, "loss": 2.3905, "step": 391960 }, { "epoch": 0.68, "learning_rate": 1.582257068816987e-05, "loss": 2.2106, "step": 391970 }, { "epoch": 0.68, "learning_rate": 1.582169874824304e-05, "loss": 2.2491, "step": 391980 }, { "epoch": 0.68, "learning_rate": 1.5820826808316214e-05, "loss": 2.2564, "step": 391990 }, { "epoch": 0.68, "learning_rate": 1.5819954868389387e-05, "loss": 2.2582, "step": 392000 }, { "epoch": 0.68, "learning_rate": 1.581908292846256e-05, "loss": 2.0975, "step": 392010 }, { "epoch": 0.68, "learning_rate": 1.5818210988535735e-05, "loss": 2.291, "step": 392020 }, { "epoch": 0.68, "learning_rate": 1.581733904860891e-05, "loss": 2.1803, "step": 392030 }, { "epoch": 0.68, "learning_rate": 1.5816467108682082e-05, "loss": 2.3194, "step": 392040 }, { "epoch": 0.68, "learning_rate": 1.5815595168755253e-05, "loss": 2.1958, "step": 392050 }, { "epoch": 0.68, "learning_rate": 1.5814723228828427e-05, "loss": 2.3078, "step": 392060 }, { "epoch": 0.68, "learning_rate": 1.58138512889016e-05, "loss": 2.2691, "step": 392070 }, { "epoch": 0.68, "learning_rate": 1.5812979348974774e-05, "loss": 2.2867, "step": 392080 }, { "epoch": 0.68, "learning_rate": 1.5812107409047948e-05, "loss": 2.4097, "step": 392090 }, { "epoch": 0.68, "learning_rate": 1.5811235469121118e-05, "loss": 2.2522, "step": 392100 }, { "epoch": 0.68, "learning_rate": 1.5810363529194295e-05, "loss": 2.2104, "step": 392110 }, { "epoch": 0.68, "learning_rate": 1.5809491589267466e-05, "loss": 2.351, "step": 392120 }, { "epoch": 0.68, "learning_rate": 1.580861964934064e-05, "loss": 2.3567, "step": 392130 }, { "epoch": 0.68, "learning_rate": 1.5807747709413813e-05, "loss": 2.2424, "step": 392140 }, { "epoch": 0.68, "learning_rate": 1.5806875769486987e-05, "loss": 2.1597, "step": 392150 }, { "epoch": 0.68, "learning_rate": 1.580600382956016e-05, "loss": 2.3506, "step": 392160 }, { "epoch": 0.68, "learning_rate": 1.580513188963333e-05, "loss": 2.2791, "step": 392170 }, { "epoch": 0.68, "learning_rate": 1.580425994970651e-05, "loss": 2.1875, "step": 392180 }, { "epoch": 0.68, "learning_rate": 1.580338800977968e-05, "loss": 2.312, "step": 392190 }, { "epoch": 0.68, "learning_rate": 1.5802516069852853e-05, "loss": 2.206, "step": 392200 }, { "epoch": 0.68, "learning_rate": 1.5801644129926023e-05, "loss": 2.3332, "step": 392210 }, { "epoch": 0.68, "learning_rate": 1.58007721899992e-05, "loss": 2.2836, "step": 392220 }, { "epoch": 0.68, "learning_rate": 1.579990025007237e-05, "loss": 2.3922, "step": 392230 }, { "epoch": 0.68, "learning_rate": 1.5799028310145544e-05, "loss": 2.266, "step": 392240 }, { "epoch": 0.68, "learning_rate": 1.5798156370218718e-05, "loss": 2.4304, "step": 392250 }, { "epoch": 0.68, "learning_rate": 1.5797284430291892e-05, "loss": 2.3437, "step": 392260 }, { "epoch": 0.68, "learning_rate": 1.5796412490365066e-05, "loss": 2.3491, "step": 392270 }, { "epoch": 0.68, "learning_rate": 1.5795540550438236e-05, "loss": 2.2224, "step": 392280 }, { "epoch": 0.68, "learning_rate": 1.5794668610511413e-05, "loss": 2.2815, "step": 392290 }, { "epoch": 0.68, "learning_rate": 1.5793796670584583e-05, "loss": 2.254, "step": 392300 }, { "epoch": 0.68, "learning_rate": 1.5792924730657757e-05, "loss": 2.2111, "step": 392310 }, { "epoch": 0.68, "learning_rate": 1.579205279073093e-05, "loss": 2.2964, "step": 392320 }, { "epoch": 0.68, "learning_rate": 1.5791180850804105e-05, "loss": 2.2012, "step": 392330 }, { "epoch": 0.68, "learning_rate": 1.579030891087728e-05, "loss": 2.2447, "step": 392340 }, { "epoch": 0.68, "learning_rate": 1.578943697095045e-05, "loss": 2.3899, "step": 392350 }, { "epoch": 0.68, "learning_rate": 1.5788565031023623e-05, "loss": 2.3952, "step": 392360 }, { "epoch": 0.68, "learning_rate": 1.5787693091096796e-05, "loss": 2.3136, "step": 392370 }, { "epoch": 0.68, "learning_rate": 1.578682115116997e-05, "loss": 2.2071, "step": 392380 }, { "epoch": 0.68, "learning_rate": 1.578594921124314e-05, "loss": 2.3228, "step": 392390 }, { "epoch": 0.68, "learning_rate": 1.5785077271316318e-05, "loss": 2.3382, "step": 392400 }, { "epoch": 0.68, "learning_rate": 1.578420533138949e-05, "loss": 2.3968, "step": 392410 }, { "epoch": 0.68, "learning_rate": 1.5783333391462662e-05, "loss": 2.3238, "step": 392420 }, { "epoch": 0.68, "learning_rate": 1.5782461451535836e-05, "loss": 2.4164, "step": 392430 }, { "epoch": 0.68, "learning_rate": 1.578158951160901e-05, "loss": 2.2935, "step": 392440 }, { "epoch": 0.68, "learning_rate": 1.5780717571682183e-05, "loss": 2.1633, "step": 392450 }, { "epoch": 0.68, "learning_rate": 1.5779845631755354e-05, "loss": 2.3777, "step": 392460 }, { "epoch": 0.68, "learning_rate": 1.5778973691828527e-05, "loss": 2.3679, "step": 392470 }, { "epoch": 0.68, "learning_rate": 1.57781017519017e-05, "loss": 2.2691, "step": 392480 }, { "epoch": 0.68, "learning_rate": 1.5777229811974875e-05, "loss": 2.2483, "step": 392490 }, { "epoch": 0.68, "learning_rate": 1.577635787204805e-05, "loss": 2.3063, "step": 392500 }, { "epoch": 0.68, "learning_rate": 1.577548593212122e-05, "loss": 2.2587, "step": 392510 }, { "epoch": 0.68, "learning_rate": 1.5774613992194396e-05, "loss": 2.2477, "step": 392520 }, { "epoch": 0.68, "learning_rate": 1.5773742052267567e-05, "loss": 2.3698, "step": 392530 }, { "epoch": 0.68, "learning_rate": 1.577287011234074e-05, "loss": 2.2894, "step": 392540 }, { "epoch": 0.68, "learning_rate": 1.5771998172413914e-05, "loss": 2.3499, "step": 392550 }, { "epoch": 0.68, "learning_rate": 1.5771126232487088e-05, "loss": 2.3456, "step": 392560 }, { "epoch": 0.68, "learning_rate": 1.5770254292560262e-05, "loss": 2.3276, "step": 392570 }, { "epoch": 0.68, "learning_rate": 1.5769382352633432e-05, "loss": 2.3749, "step": 392580 }, { "epoch": 0.68, "learning_rate": 1.576851041270661e-05, "loss": 2.2454, "step": 392590 }, { "epoch": 0.68, "learning_rate": 1.576763847277978e-05, "loss": 2.2309, "step": 392600 }, { "epoch": 0.68, "learning_rate": 1.5766766532852953e-05, "loss": 2.2784, "step": 392610 }, { "epoch": 0.68, "learning_rate": 1.5765894592926124e-05, "loss": 2.3178, "step": 392620 }, { "epoch": 0.68, "learning_rate": 1.57650226529993e-05, "loss": 2.3932, "step": 392630 }, { "epoch": 0.68, "learning_rate": 1.5764150713072475e-05, "loss": 2.3966, "step": 392640 }, { "epoch": 0.68, "learning_rate": 1.5763278773145645e-05, "loss": 2.3525, "step": 392650 }, { "epoch": 0.68, "learning_rate": 1.576240683321882e-05, "loss": 2.3864, "step": 392660 }, { "epoch": 0.68, "learning_rate": 1.5761534893291993e-05, "loss": 2.2953, "step": 392670 }, { "epoch": 0.68, "learning_rate": 1.5760662953365166e-05, "loss": 2.2973, "step": 392680 }, { "epoch": 0.68, "learning_rate": 1.5759791013438337e-05, "loss": 2.2768, "step": 392690 }, { "epoch": 0.68, "learning_rate": 1.5758919073511514e-05, "loss": 2.3058, "step": 392700 }, { "epoch": 0.68, "learning_rate": 1.5758047133584684e-05, "loss": 2.323, "step": 392710 }, { "epoch": 0.68, "learning_rate": 1.5757175193657858e-05, "loss": 2.3241, "step": 392720 }, { "epoch": 0.68, "learning_rate": 1.5756303253731032e-05, "loss": 2.3068, "step": 392730 }, { "epoch": 0.68, "learning_rate": 1.5755431313804206e-05, "loss": 2.3078, "step": 392740 }, { "epoch": 0.68, "learning_rate": 1.575455937387738e-05, "loss": 2.2829, "step": 392750 }, { "epoch": 0.68, "learning_rate": 1.575368743395055e-05, "loss": 2.2243, "step": 392760 }, { "epoch": 0.68, "learning_rate": 1.5752815494023724e-05, "loss": 2.3625, "step": 392770 }, { "epoch": 0.68, "learning_rate": 1.5751943554096897e-05, "loss": 2.2287, "step": 392780 }, { "epoch": 0.68, "learning_rate": 1.575107161417007e-05, "loss": 2.3678, "step": 392790 }, { "epoch": 0.68, "learning_rate": 1.5750199674243245e-05, "loss": 2.2152, "step": 392800 }, { "epoch": 0.69, "learning_rate": 1.574932773431642e-05, "loss": 2.3582, "step": 392810 }, { "epoch": 0.69, "learning_rate": 1.5748455794389592e-05, "loss": 2.2649, "step": 392820 }, { "epoch": 0.69, "learning_rate": 1.5747583854462763e-05, "loss": 2.2394, "step": 392830 }, { "epoch": 0.69, "learning_rate": 1.5746711914535937e-05, "loss": 2.2726, "step": 392840 }, { "epoch": 0.69, "learning_rate": 1.574583997460911e-05, "loss": 2.183, "step": 392850 }, { "epoch": 0.69, "learning_rate": 1.5744968034682284e-05, "loss": 2.2805, "step": 392860 }, { "epoch": 0.69, "learning_rate": 1.5744096094755454e-05, "loss": 2.2444, "step": 392870 }, { "epoch": 0.69, "learning_rate": 1.5743224154828628e-05, "loss": 2.3211, "step": 392880 }, { "epoch": 0.69, "learning_rate": 1.5742352214901805e-05, "loss": 2.2253, "step": 392890 }, { "epoch": 0.69, "learning_rate": 1.5741480274974976e-05, "loss": 2.3672, "step": 392900 }, { "epoch": 0.69, "learning_rate": 1.574060833504815e-05, "loss": 2.3297, "step": 392910 }, { "epoch": 0.69, "learning_rate": 1.573973639512132e-05, "loss": 2.2338, "step": 392920 }, { "epoch": 0.69, "learning_rate": 1.5738864455194497e-05, "loss": 2.2223, "step": 392930 }, { "epoch": 0.69, "learning_rate": 1.5737992515267667e-05, "loss": 2.246, "step": 392940 }, { "epoch": 0.69, "learning_rate": 1.573712057534084e-05, "loss": 2.3785, "step": 392950 }, { "epoch": 0.69, "learning_rate": 1.5736248635414015e-05, "loss": 2.3309, "step": 392960 }, { "epoch": 0.69, "learning_rate": 1.573537669548719e-05, "loss": 2.2634, "step": 392970 }, { "epoch": 0.69, "learning_rate": 1.5734504755560363e-05, "loss": 2.4528, "step": 392980 }, { "epoch": 0.69, "learning_rate": 1.5733632815633533e-05, "loss": 2.2897, "step": 392990 }, { "epoch": 0.69, "learning_rate": 1.573276087570671e-05, "loss": 2.2529, "step": 393000 }, { "epoch": 0.69, "learning_rate": 1.573188893577988e-05, "loss": 2.3341, "step": 393010 }, { "epoch": 0.69, "learning_rate": 1.5731016995853054e-05, "loss": 2.2444, "step": 393020 }, { "epoch": 0.69, "learning_rate": 1.5730145055926228e-05, "loss": 2.3314, "step": 393030 }, { "epoch": 0.69, "learning_rate": 1.5729273115999402e-05, "loss": 2.3303, "step": 393040 }, { "epoch": 0.69, "learning_rate": 1.5728401176072576e-05, "loss": 2.3383, "step": 393050 }, { "epoch": 0.69, "learning_rate": 1.5727529236145746e-05, "loss": 2.2323, "step": 393060 }, { "epoch": 0.69, "learning_rate": 1.5726657296218923e-05, "loss": 2.3111, "step": 393070 }, { "epoch": 0.69, "learning_rate": 1.5725785356292093e-05, "loss": 2.4157, "step": 393080 }, { "epoch": 0.69, "learning_rate": 1.5724913416365267e-05, "loss": 2.3736, "step": 393090 }, { "epoch": 0.69, "learning_rate": 1.5724041476438438e-05, "loss": 2.3733, "step": 393100 }, { "epoch": 0.69, "learning_rate": 1.5723169536511615e-05, "loss": 2.2952, "step": 393110 }, { "epoch": 0.69, "learning_rate": 1.5722297596584785e-05, "loss": 2.2612, "step": 393120 }, { "epoch": 0.69, "learning_rate": 1.572142565665796e-05, "loss": 2.2233, "step": 393130 }, { "epoch": 0.69, "learning_rate": 1.5720553716731133e-05, "loss": 2.2468, "step": 393140 }, { "epoch": 0.69, "learning_rate": 1.5719681776804306e-05, "loss": 2.3753, "step": 393150 }, { "epoch": 0.69, "learning_rate": 1.571880983687748e-05, "loss": 2.3325, "step": 393160 }, { "epoch": 0.69, "learning_rate": 1.571793789695065e-05, "loss": 2.3534, "step": 393170 }, { "epoch": 0.69, "learning_rate": 1.5717065957023824e-05, "loss": 2.3322, "step": 393180 }, { "epoch": 0.69, "learning_rate": 1.5716194017096998e-05, "loss": 2.3921, "step": 393190 }, { "epoch": 0.69, "learning_rate": 1.5715322077170172e-05, "loss": 2.3428, "step": 393200 }, { "epoch": 0.69, "learning_rate": 1.5714450137243346e-05, "loss": 2.3986, "step": 393210 }, { "epoch": 0.69, "learning_rate": 1.571357819731652e-05, "loss": 2.4193, "step": 393220 }, { "epoch": 0.69, "learning_rate": 1.5712706257389693e-05, "loss": 2.297, "step": 393230 }, { "epoch": 0.69, "learning_rate": 1.5711834317462864e-05, "loss": 2.2234, "step": 393240 }, { "epoch": 0.69, "learning_rate": 1.5710962377536037e-05, "loss": 2.334, "step": 393250 }, { "epoch": 0.69, "learning_rate": 1.571009043760921e-05, "loss": 2.2369, "step": 393260 }, { "epoch": 0.69, "learning_rate": 1.5709218497682385e-05, "loss": 2.3147, "step": 393270 }, { "epoch": 0.69, "learning_rate": 1.570834655775556e-05, "loss": 2.2475, "step": 393280 }, { "epoch": 0.69, "learning_rate": 1.570747461782873e-05, "loss": 2.1974, "step": 393290 }, { "epoch": 0.69, "learning_rate": 1.5706602677901906e-05, "loss": 2.2721, "step": 393300 }, { "epoch": 0.69, "learning_rate": 1.5705730737975077e-05, "loss": 2.2605, "step": 393310 }, { "epoch": 0.69, "learning_rate": 1.570485879804825e-05, "loss": 2.3117, "step": 393320 }, { "epoch": 0.69, "learning_rate": 1.5703986858121424e-05, "loss": 2.3696, "step": 393330 }, { "epoch": 0.69, "learning_rate": 1.5703114918194598e-05, "loss": 2.2218, "step": 393340 }, { "epoch": 0.69, "learning_rate": 1.570224297826777e-05, "loss": 2.4, "step": 393350 }, { "epoch": 0.69, "learning_rate": 1.5701371038340942e-05, "loss": 2.4373, "step": 393360 }, { "epoch": 0.69, "learning_rate": 1.570049909841412e-05, "loss": 2.1649, "step": 393370 }, { "epoch": 0.69, "learning_rate": 1.569962715848729e-05, "loss": 2.199, "step": 393380 }, { "epoch": 0.69, "learning_rate": 1.5698755218560463e-05, "loss": 2.2797, "step": 393390 }, { "epoch": 0.69, "learning_rate": 1.5697883278633634e-05, "loss": 2.2641, "step": 393400 }, { "epoch": 0.69, "learning_rate": 1.569701133870681e-05, "loss": 2.4265, "step": 393410 }, { "epoch": 0.69, "learning_rate": 1.569613939877998e-05, "loss": 2.1443, "step": 393420 }, { "epoch": 0.69, "learning_rate": 1.5695267458853155e-05, "loss": 2.4062, "step": 393430 }, { "epoch": 0.69, "learning_rate": 1.569439551892633e-05, "loss": 2.3335, "step": 393440 }, { "epoch": 0.69, "learning_rate": 1.5693523578999503e-05, "loss": 2.1734, "step": 393450 }, { "epoch": 0.69, "learning_rate": 1.5692651639072676e-05, "loss": 2.324, "step": 393460 }, { "epoch": 0.69, "learning_rate": 1.5691779699145847e-05, "loss": 2.3696, "step": 393470 }, { "epoch": 0.69, "learning_rate": 1.5690907759219024e-05, "loss": 2.2167, "step": 393480 }, { "epoch": 0.69, "learning_rate": 1.5690035819292194e-05, "loss": 2.3352, "step": 393490 }, { "epoch": 0.69, "learning_rate": 1.5689163879365368e-05, "loss": 2.3783, "step": 393500 }, { "epoch": 0.69, "learning_rate": 1.5688291939438542e-05, "loss": 2.3169, "step": 393510 }, { "epoch": 0.69, "learning_rate": 1.5687419999511716e-05, "loss": 2.2479, "step": 393520 }, { "epoch": 0.69, "learning_rate": 1.568654805958489e-05, "loss": 2.4021, "step": 393530 }, { "epoch": 0.69, "learning_rate": 1.568567611965806e-05, "loss": 2.3149, "step": 393540 }, { "epoch": 0.69, "learning_rate": 1.5684804179731234e-05, "loss": 2.3804, "step": 393550 }, { "epoch": 0.69, "learning_rate": 1.5683932239804407e-05, "loss": 2.3314, "step": 393560 }, { "epoch": 0.69, "learning_rate": 1.568306029987758e-05, "loss": 2.4249, "step": 393570 }, { "epoch": 0.69, "learning_rate": 1.568218835995075e-05, "loss": 2.2635, "step": 393580 }, { "epoch": 0.69, "learning_rate": 1.5681316420023925e-05, "loss": 2.3269, "step": 393590 }, { "epoch": 0.69, "learning_rate": 1.56804444800971e-05, "loss": 2.3827, "step": 393600 }, { "epoch": 0.69, "learning_rate": 1.5679572540170273e-05, "loss": 2.357, "step": 393610 }, { "epoch": 0.69, "learning_rate": 1.5678700600243447e-05, "loss": 2.3891, "step": 393620 }, { "epoch": 0.69, "learning_rate": 1.567782866031662e-05, "loss": 2.2876, "step": 393630 }, { "epoch": 0.69, "learning_rate": 1.5676956720389794e-05, "loss": 2.3675, "step": 393640 }, { "epoch": 0.69, "learning_rate": 1.5676084780462964e-05, "loss": 2.2496, "step": 393650 }, { "epoch": 0.69, "learning_rate": 1.5675212840536138e-05, "loss": 2.3112, "step": 393660 }, { "epoch": 0.69, "learning_rate": 1.5674340900609312e-05, "loss": 2.4226, "step": 393670 }, { "epoch": 0.69, "learning_rate": 1.5673468960682486e-05, "loss": 2.2863, "step": 393680 }, { "epoch": 0.69, "learning_rate": 1.567259702075566e-05, "loss": 2.4124, "step": 393690 }, { "epoch": 0.69, "learning_rate": 1.567172508082883e-05, "loss": 2.3001, "step": 393700 }, { "epoch": 0.69, "learning_rate": 1.5670853140902007e-05, "loss": 2.2604, "step": 393710 }, { "epoch": 0.69, "learning_rate": 1.5669981200975177e-05, "loss": 2.3939, "step": 393720 }, { "epoch": 0.69, "learning_rate": 1.566910926104835e-05, "loss": 2.2902, "step": 393730 }, { "epoch": 0.69, "learning_rate": 1.5668237321121525e-05, "loss": 2.3638, "step": 393740 }, { "epoch": 0.69, "learning_rate": 1.56673653811947e-05, "loss": 2.3554, "step": 393750 }, { "epoch": 0.69, "learning_rate": 1.5666493441267873e-05, "loss": 2.3898, "step": 393760 }, { "epoch": 0.69, "learning_rate": 1.5665621501341043e-05, "loss": 2.3239, "step": 393770 }, { "epoch": 0.69, "learning_rate": 1.566474956141422e-05, "loss": 2.2882, "step": 393780 }, { "epoch": 0.69, "learning_rate": 1.566387762148739e-05, "loss": 2.3299, "step": 393790 }, { "epoch": 0.69, "learning_rate": 1.5663005681560564e-05, "loss": 2.3978, "step": 393800 }, { "epoch": 0.69, "learning_rate": 1.5662133741633735e-05, "loss": 2.271, "step": 393810 }, { "epoch": 0.69, "learning_rate": 1.5661261801706912e-05, "loss": 2.3018, "step": 393820 }, { "epoch": 0.69, "learning_rate": 1.5660389861780082e-05, "loss": 2.3367, "step": 393830 }, { "epoch": 0.69, "learning_rate": 1.5659517921853256e-05, "loss": 2.2692, "step": 393840 }, { "epoch": 0.69, "learning_rate": 1.565864598192643e-05, "loss": 2.2265, "step": 393850 }, { "epoch": 0.69, "learning_rate": 1.5657774041999603e-05, "loss": 2.2946, "step": 393860 }, { "epoch": 0.69, "learning_rate": 1.5656902102072777e-05, "loss": 2.221, "step": 393870 }, { "epoch": 0.69, "learning_rate": 1.5656030162145948e-05, "loss": 2.3346, "step": 393880 }, { "epoch": 0.69, "learning_rate": 1.5655158222219125e-05, "loss": 2.2784, "step": 393890 }, { "epoch": 0.69, "learning_rate": 1.5654286282292295e-05, "loss": 2.2723, "step": 393900 }, { "epoch": 0.69, "learning_rate": 1.565341434236547e-05, "loss": 2.2093, "step": 393910 }, { "epoch": 0.69, "learning_rate": 1.5652542402438643e-05, "loss": 2.2655, "step": 393920 }, { "epoch": 0.69, "learning_rate": 1.5651670462511816e-05, "loss": 2.3587, "step": 393930 }, { "epoch": 0.69, "learning_rate": 1.565079852258499e-05, "loss": 2.3487, "step": 393940 }, { "epoch": 0.69, "learning_rate": 1.564992658265816e-05, "loss": 2.3593, "step": 393950 }, { "epoch": 0.69, "learning_rate": 1.5649054642731334e-05, "loss": 2.326, "step": 393960 }, { "epoch": 0.69, "learning_rate": 1.5648182702804508e-05, "loss": 2.3346, "step": 393970 }, { "epoch": 0.69, "learning_rate": 1.5647310762877682e-05, "loss": 2.2808, "step": 393980 }, { "epoch": 0.69, "learning_rate": 1.5646438822950856e-05, "loss": 2.236, "step": 393990 }, { "epoch": 0.69, "learning_rate": 1.564556688302403e-05, "loss": 2.2877, "step": 394000 }, { "epoch": 0.69, "learning_rate": 1.5644694943097203e-05, "loss": 2.2897, "step": 394010 }, { "epoch": 0.69, "learning_rate": 1.5643823003170374e-05, "loss": 2.2505, "step": 394020 }, { "epoch": 0.69, "learning_rate": 1.5642951063243547e-05, "loss": 2.2065, "step": 394030 }, { "epoch": 0.69, "learning_rate": 1.564207912331672e-05, "loss": 2.2808, "step": 394040 }, { "epoch": 0.69, "learning_rate": 1.5641207183389895e-05, "loss": 2.4624, "step": 394050 }, { "epoch": 0.69, "learning_rate": 1.5640335243463065e-05, "loss": 2.4113, "step": 394060 }, { "epoch": 0.69, "learning_rate": 1.563946330353624e-05, "loss": 2.4141, "step": 394070 }, { "epoch": 0.69, "learning_rate": 1.5638591363609413e-05, "loss": 2.2436, "step": 394080 }, { "epoch": 0.69, "learning_rate": 1.5637719423682587e-05, "loss": 2.4314, "step": 394090 }, { "epoch": 0.69, "learning_rate": 1.563684748375576e-05, "loss": 2.2061, "step": 394100 }, { "epoch": 0.69, "learning_rate": 1.563597554382893e-05, "loss": 2.2542, "step": 394110 }, { "epoch": 0.69, "learning_rate": 1.5635103603902108e-05, "loss": 2.1864, "step": 394120 }, { "epoch": 0.69, "learning_rate": 1.563423166397528e-05, "loss": 2.3405, "step": 394130 }, { "epoch": 0.69, "learning_rate": 1.5633359724048452e-05, "loss": 2.2129, "step": 394140 }, { "epoch": 0.69, "learning_rate": 1.5632487784121626e-05, "loss": 2.4347, "step": 394150 }, { "epoch": 0.69, "learning_rate": 1.56316158441948e-05, "loss": 2.316, "step": 394160 }, { "epoch": 0.69, "learning_rate": 1.5630743904267973e-05, "loss": 2.226, "step": 394170 }, { "epoch": 0.69, "learning_rate": 1.5629871964341144e-05, "loss": 2.2035, "step": 394180 }, { "epoch": 0.69, "learning_rate": 1.562900002441432e-05, "loss": 2.28, "step": 394190 }, { "epoch": 0.69, "learning_rate": 1.562812808448749e-05, "loss": 2.3183, "step": 394200 }, { "epoch": 0.69, "learning_rate": 1.5627256144560665e-05, "loss": 2.3663, "step": 394210 }, { "epoch": 0.69, "learning_rate": 1.5626384204633835e-05, "loss": 2.4345, "step": 394220 }, { "epoch": 0.69, "learning_rate": 1.5625512264707013e-05, "loss": 2.2684, "step": 394230 }, { "epoch": 0.69, "learning_rate": 1.5624640324780186e-05, "loss": 2.2658, "step": 394240 }, { "epoch": 0.69, "learning_rate": 1.5623768384853357e-05, "loss": 2.3504, "step": 394250 }, { "epoch": 0.69, "learning_rate": 1.562289644492653e-05, "loss": 2.2816, "step": 394260 }, { "epoch": 0.69, "learning_rate": 1.5622024504999704e-05, "loss": 2.2944, "step": 394270 }, { "epoch": 0.69, "learning_rate": 1.5621152565072878e-05, "loss": 2.3261, "step": 394280 }, { "epoch": 0.69, "learning_rate": 1.562028062514605e-05, "loss": 2.3688, "step": 394290 }, { "epoch": 0.69, "learning_rate": 1.5619408685219226e-05, "loss": 2.3641, "step": 394300 }, { "epoch": 0.69, "learning_rate": 1.5618536745292396e-05, "loss": 2.3835, "step": 394310 }, { "epoch": 0.69, "learning_rate": 1.561766480536557e-05, "loss": 2.3628, "step": 394320 }, { "epoch": 0.69, "learning_rate": 1.5616792865438744e-05, "loss": 2.2645, "step": 394330 }, { "epoch": 0.69, "learning_rate": 1.5615920925511917e-05, "loss": 2.3923, "step": 394340 }, { "epoch": 0.69, "learning_rate": 1.561504898558509e-05, "loss": 2.1688, "step": 394350 }, { "epoch": 0.69, "learning_rate": 1.561417704565826e-05, "loss": 2.2958, "step": 394360 }, { "epoch": 0.69, "learning_rate": 1.5613305105731435e-05, "loss": 2.3899, "step": 394370 }, { "epoch": 0.69, "learning_rate": 1.561243316580461e-05, "loss": 2.412, "step": 394380 }, { "epoch": 0.69, "learning_rate": 1.5611561225877783e-05, "loss": 2.2463, "step": 394390 }, { "epoch": 0.69, "learning_rate": 1.5610689285950957e-05, "loss": 2.321, "step": 394400 }, { "epoch": 0.69, "learning_rate": 1.560981734602413e-05, "loss": 2.3217, "step": 394410 }, { "epoch": 0.69, "learning_rate": 1.5608945406097304e-05, "loss": 2.3434, "step": 394420 }, { "epoch": 0.69, "learning_rate": 1.5608073466170474e-05, "loss": 2.3581, "step": 394430 }, { "epoch": 0.69, "learning_rate": 1.5607201526243648e-05, "loss": 2.275, "step": 394440 }, { "epoch": 0.69, "learning_rate": 1.5606329586316822e-05, "loss": 2.3837, "step": 394450 }, { "epoch": 0.69, "learning_rate": 1.5605457646389996e-05, "loss": 2.4262, "step": 394460 }, { "epoch": 0.69, "learning_rate": 1.5604585706463166e-05, "loss": 2.262, "step": 394470 }, { "epoch": 0.69, "learning_rate": 1.560371376653634e-05, "loss": 2.2909, "step": 394480 }, { "epoch": 0.69, "learning_rate": 1.5602841826609517e-05, "loss": 2.2969, "step": 394490 }, { "epoch": 0.69, "learning_rate": 1.5601969886682687e-05, "loss": 2.3265, "step": 394500 }, { "epoch": 0.69, "learning_rate": 1.560109794675586e-05, "loss": 2.2174, "step": 394510 }, { "epoch": 0.69, "learning_rate": 1.560022600682903e-05, "loss": 2.279, "step": 394520 }, { "epoch": 0.69, "learning_rate": 1.559935406690221e-05, "loss": 2.3344, "step": 394530 }, { "epoch": 0.69, "learning_rate": 1.559848212697538e-05, "loss": 2.3447, "step": 394540 }, { "epoch": 0.69, "learning_rate": 1.5597610187048553e-05, "loss": 2.3354, "step": 394550 }, { "epoch": 0.69, "learning_rate": 1.5596738247121727e-05, "loss": 2.136, "step": 394560 }, { "epoch": 0.69, "learning_rate": 1.55958663071949e-05, "loss": 2.4076, "step": 394570 }, { "epoch": 0.69, "learning_rate": 1.5594994367268074e-05, "loss": 2.2347, "step": 394580 }, { "epoch": 0.69, "learning_rate": 1.5594122427341245e-05, "loss": 2.2667, "step": 394590 }, { "epoch": 0.69, "learning_rate": 1.5593250487414422e-05, "loss": 2.3372, "step": 394600 }, { "epoch": 0.69, "learning_rate": 1.5592378547487592e-05, "loss": 2.3842, "step": 394610 }, { "epoch": 0.69, "learning_rate": 1.5591506607560766e-05, "loss": 2.2961, "step": 394620 }, { "epoch": 0.69, "learning_rate": 1.559063466763394e-05, "loss": 2.2801, "step": 394630 }, { "epoch": 0.69, "learning_rate": 1.5589762727707113e-05, "loss": 2.388, "step": 394640 }, { "epoch": 0.69, "learning_rate": 1.5588890787780287e-05, "loss": 2.2325, "step": 394650 }, { "epoch": 0.69, "learning_rate": 1.5588018847853458e-05, "loss": 2.3225, "step": 394660 }, { "epoch": 0.69, "learning_rate": 1.5587146907926635e-05, "loss": 2.2987, "step": 394670 }, { "epoch": 0.69, "learning_rate": 1.5586274967999805e-05, "loss": 2.3647, "step": 394680 }, { "epoch": 0.69, "learning_rate": 1.558540302807298e-05, "loss": 2.3401, "step": 394690 }, { "epoch": 0.69, "learning_rate": 1.558453108814615e-05, "loss": 2.3465, "step": 394700 }, { "epoch": 0.69, "learning_rate": 1.5583659148219326e-05, "loss": 2.3885, "step": 394710 }, { "epoch": 0.69, "learning_rate": 1.55827872082925e-05, "loss": 2.3566, "step": 394720 }, { "epoch": 0.69, "learning_rate": 1.558191526836567e-05, "loss": 2.299, "step": 394730 }, { "epoch": 0.69, "learning_rate": 1.5581043328438844e-05, "loss": 2.1961, "step": 394740 }, { "epoch": 0.69, "learning_rate": 1.5580171388512018e-05, "loss": 2.2944, "step": 394750 }, { "epoch": 0.69, "learning_rate": 1.5579299448585192e-05, "loss": 2.2664, "step": 394760 }, { "epoch": 0.69, "learning_rate": 1.5578427508658362e-05, "loss": 2.299, "step": 394770 }, { "epoch": 0.69, "learning_rate": 1.5577555568731536e-05, "loss": 2.4043, "step": 394780 }, { "epoch": 0.69, "learning_rate": 1.557668362880471e-05, "loss": 2.2369, "step": 394790 }, { "epoch": 0.69, "learning_rate": 1.5575811688877884e-05, "loss": 2.3919, "step": 394800 }, { "epoch": 0.69, "learning_rate": 1.5574939748951057e-05, "loss": 2.2028, "step": 394810 }, { "epoch": 0.69, "learning_rate": 1.557406780902423e-05, "loss": 2.2179, "step": 394820 }, { "epoch": 0.69, "learning_rate": 1.5573195869097405e-05, "loss": 2.3701, "step": 394830 }, { "epoch": 0.69, "learning_rate": 1.5572323929170575e-05, "loss": 2.2566, "step": 394840 }, { "epoch": 0.69, "learning_rate": 1.557145198924375e-05, "loss": 2.3268, "step": 394850 }, { "epoch": 0.69, "learning_rate": 1.5570580049316923e-05, "loss": 2.2484, "step": 394860 }, { "epoch": 0.69, "learning_rate": 1.5569708109390097e-05, "loss": 2.2993, "step": 394870 }, { "epoch": 0.69, "learning_rate": 1.556883616946327e-05, "loss": 2.3486, "step": 394880 }, { "epoch": 0.69, "learning_rate": 1.556796422953644e-05, "loss": 2.3381, "step": 394890 }, { "epoch": 0.69, "learning_rate": 1.5567092289609618e-05, "loss": 2.3471, "step": 394900 }, { "epoch": 0.69, "learning_rate": 1.556622034968279e-05, "loss": 2.3526, "step": 394910 }, { "epoch": 0.69, "learning_rate": 1.5565348409755962e-05, "loss": 2.3438, "step": 394920 }, { "epoch": 0.69, "learning_rate": 1.5564476469829136e-05, "loss": 2.3181, "step": 394930 }, { "epoch": 0.69, "learning_rate": 1.556360452990231e-05, "loss": 2.2979, "step": 394940 }, { "epoch": 0.69, "learning_rate": 1.556273258997548e-05, "loss": 2.4284, "step": 394950 }, { "epoch": 0.69, "learning_rate": 1.5561860650048654e-05, "loss": 2.2853, "step": 394960 }, { "epoch": 0.69, "learning_rate": 1.556098871012183e-05, "loss": 2.3633, "step": 394970 }, { "epoch": 0.69, "learning_rate": 1.5560116770195e-05, "loss": 2.3276, "step": 394980 }, { "epoch": 0.69, "learning_rate": 1.5559244830268175e-05, "loss": 2.2887, "step": 394990 }, { "epoch": 0.69, "learning_rate": 1.5558372890341345e-05, "loss": 2.376, "step": 395000 }, { "epoch": 0.69, "learning_rate": 1.5557500950414523e-05, "loss": 2.3267, "step": 395010 }, { "epoch": 0.69, "learning_rate": 1.5556629010487693e-05, "loss": 2.3067, "step": 395020 }, { "epoch": 0.69, "learning_rate": 1.5555757070560867e-05, "loss": 2.3042, "step": 395030 }, { "epoch": 0.69, "learning_rate": 1.555488513063404e-05, "loss": 2.3333, "step": 395040 }, { "epoch": 0.69, "learning_rate": 1.5554013190707214e-05, "loss": 2.333, "step": 395050 }, { "epoch": 0.69, "learning_rate": 1.5553141250780388e-05, "loss": 2.3083, "step": 395060 }, { "epoch": 0.69, "learning_rate": 1.555226931085356e-05, "loss": 2.2561, "step": 395070 }, { "epoch": 0.69, "learning_rate": 1.5551397370926736e-05, "loss": 2.351, "step": 395080 }, { "epoch": 0.69, "learning_rate": 1.5550525430999906e-05, "loss": 2.3132, "step": 395090 }, { "epoch": 0.69, "learning_rate": 1.554965349107308e-05, "loss": 2.2365, "step": 395100 }, { "epoch": 0.69, "learning_rate": 1.5548781551146254e-05, "loss": 2.28, "step": 395110 }, { "epoch": 0.69, "learning_rate": 1.5547909611219427e-05, "loss": 2.2771, "step": 395120 }, { "epoch": 0.69, "learning_rate": 1.55470376712926e-05, "loss": 2.3436, "step": 395130 }, { "epoch": 0.69, "learning_rate": 1.554616573136577e-05, "loss": 2.2564, "step": 395140 }, { "epoch": 0.69, "learning_rate": 1.5545293791438945e-05, "loss": 2.2285, "step": 395150 }, { "epoch": 0.69, "learning_rate": 1.554442185151212e-05, "loss": 2.3812, "step": 395160 }, { "epoch": 0.69, "learning_rate": 1.5543549911585293e-05, "loss": 2.3396, "step": 395170 }, { "epoch": 0.69, "learning_rate": 1.5542677971658463e-05, "loss": 2.4031, "step": 395180 }, { "epoch": 0.69, "learning_rate": 1.5541806031731637e-05, "loss": 2.3025, "step": 395190 }, { "epoch": 0.69, "learning_rate": 1.554093409180481e-05, "loss": 2.2801, "step": 395200 }, { "epoch": 0.69, "learning_rate": 1.5540062151877984e-05, "loss": 2.2484, "step": 395210 }, { "epoch": 0.69, "learning_rate": 1.5539190211951158e-05, "loss": 2.2389, "step": 395220 }, { "epoch": 0.69, "learning_rate": 1.5538318272024332e-05, "loss": 2.2409, "step": 395230 }, { "epoch": 0.69, "learning_rate": 1.5537446332097506e-05, "loss": 2.1979, "step": 395240 }, { "epoch": 0.69, "learning_rate": 1.5536574392170676e-05, "loss": 2.278, "step": 395250 }, { "epoch": 0.69, "learning_rate": 1.553570245224385e-05, "loss": 2.3018, "step": 395260 }, { "epoch": 0.69, "learning_rate": 1.5534830512317024e-05, "loss": 2.3161, "step": 395270 }, { "epoch": 0.69, "learning_rate": 1.5533958572390197e-05, "loss": 2.3074, "step": 395280 }, { "epoch": 0.69, "learning_rate": 1.553308663246337e-05, "loss": 2.3141, "step": 395290 }, { "epoch": 0.69, "learning_rate": 1.553221469253654e-05, "loss": 2.3614, "step": 395300 }, { "epoch": 0.69, "learning_rate": 1.553134275260972e-05, "loss": 2.289, "step": 395310 }, { "epoch": 0.69, "learning_rate": 1.553047081268289e-05, "loss": 2.301, "step": 395320 }, { "epoch": 0.69, "learning_rate": 1.5529598872756063e-05, "loss": 2.3211, "step": 395330 }, { "epoch": 0.69, "learning_rate": 1.5528726932829237e-05, "loss": 2.3457, "step": 395340 }, { "epoch": 0.69, "learning_rate": 1.552785499290241e-05, "loss": 2.3753, "step": 395350 }, { "epoch": 0.69, "learning_rate": 1.5526983052975584e-05, "loss": 2.3055, "step": 395360 }, { "epoch": 0.69, "learning_rate": 1.5526111113048755e-05, "loss": 2.3308, "step": 395370 }, { "epoch": 0.69, "learning_rate": 1.5525239173121932e-05, "loss": 2.4514, "step": 395380 }, { "epoch": 0.69, "learning_rate": 1.5524367233195102e-05, "loss": 2.369, "step": 395390 }, { "epoch": 0.69, "learning_rate": 1.5523495293268276e-05, "loss": 2.3788, "step": 395400 }, { "epoch": 0.69, "learning_rate": 1.5522623353341446e-05, "loss": 2.3803, "step": 395410 }, { "epoch": 0.69, "learning_rate": 1.5521751413414623e-05, "loss": 2.2862, "step": 395420 }, { "epoch": 0.69, "learning_rate": 1.5520879473487794e-05, "loss": 2.2683, "step": 395430 }, { "epoch": 0.69, "learning_rate": 1.5520007533560968e-05, "loss": 2.3677, "step": 395440 }, { "epoch": 0.69, "learning_rate": 1.551913559363414e-05, "loss": 2.2608, "step": 395450 }, { "epoch": 0.69, "learning_rate": 1.5518263653707315e-05, "loss": 2.1581, "step": 395460 }, { "epoch": 0.69, "learning_rate": 1.551739171378049e-05, "loss": 2.3565, "step": 395470 }, { "epoch": 0.69, "learning_rate": 1.551651977385366e-05, "loss": 2.3942, "step": 395480 }, { "epoch": 0.69, "learning_rate": 1.5515647833926836e-05, "loss": 2.3058, "step": 395490 }, { "epoch": 0.69, "learning_rate": 1.5514775894000007e-05, "loss": 2.3014, "step": 395500 }, { "epoch": 0.69, "learning_rate": 1.551390395407318e-05, "loss": 2.2742, "step": 395510 }, { "epoch": 0.69, "learning_rate": 1.5513032014146354e-05, "loss": 2.2299, "step": 395520 }, { "epoch": 0.69, "learning_rate": 1.5512160074219528e-05, "loss": 2.305, "step": 395530 }, { "epoch": 0.69, "learning_rate": 1.5511288134292702e-05, "loss": 2.3825, "step": 395540 }, { "epoch": 0.69, "learning_rate": 1.5510416194365872e-05, "loss": 2.4033, "step": 395550 }, { "epoch": 0.69, "learning_rate": 1.5509544254439046e-05, "loss": 2.3164, "step": 395560 }, { "epoch": 0.69, "learning_rate": 1.550867231451222e-05, "loss": 2.3531, "step": 395570 }, { "epoch": 0.69, "learning_rate": 1.5507800374585394e-05, "loss": 2.2184, "step": 395580 }, { "epoch": 0.69, "learning_rate": 1.5506928434658567e-05, "loss": 2.3198, "step": 395590 }, { "epoch": 0.69, "learning_rate": 1.550605649473174e-05, "loss": 2.3531, "step": 395600 }, { "epoch": 0.69, "learning_rate": 1.5505184554804915e-05, "loss": 2.3231, "step": 395610 }, { "epoch": 0.69, "learning_rate": 1.5504312614878085e-05, "loss": 2.2097, "step": 395620 }, { "epoch": 0.69, "learning_rate": 1.550344067495126e-05, "loss": 2.2134, "step": 395630 }, { "epoch": 0.69, "learning_rate": 1.5502568735024433e-05, "loss": 2.3955, "step": 395640 }, { "epoch": 0.69, "learning_rate": 1.5501696795097607e-05, "loss": 2.2632, "step": 395650 }, { "epoch": 0.69, "learning_rate": 1.5500824855170777e-05, "loss": 2.2248, "step": 395660 }, { "epoch": 0.69, "learning_rate": 1.549995291524395e-05, "loss": 2.3556, "step": 395670 }, { "epoch": 0.69, "learning_rate": 1.5499080975317125e-05, "loss": 2.2602, "step": 395680 }, { "epoch": 0.69, "learning_rate": 1.54982090353903e-05, "loss": 2.2735, "step": 395690 }, { "epoch": 0.69, "learning_rate": 1.5497337095463472e-05, "loss": 2.32, "step": 395700 }, { "epoch": 0.69, "learning_rate": 1.5496465155536642e-05, "loss": 2.2308, "step": 395710 }, { "epoch": 0.69, "learning_rate": 1.549559321560982e-05, "loss": 2.2699, "step": 395720 }, { "epoch": 0.69, "learning_rate": 1.549472127568299e-05, "loss": 2.3635, "step": 395730 }, { "epoch": 0.69, "learning_rate": 1.5493849335756164e-05, "loss": 2.3517, "step": 395740 }, { "epoch": 0.69, "learning_rate": 1.5492977395829338e-05, "loss": 2.3426, "step": 395750 }, { "epoch": 0.69, "learning_rate": 1.549210545590251e-05, "loss": 2.28, "step": 395760 }, { "epoch": 0.69, "learning_rate": 1.5491233515975685e-05, "loss": 2.4201, "step": 395770 }, { "epoch": 0.69, "learning_rate": 1.5490361576048855e-05, "loss": 2.2772, "step": 395780 }, { "epoch": 0.69, "learning_rate": 1.5489489636122033e-05, "loss": 2.4159, "step": 395790 }, { "epoch": 0.69, "learning_rate": 1.5488617696195203e-05, "loss": 2.3472, "step": 395800 }, { "epoch": 0.69, "learning_rate": 1.5487745756268377e-05, "loss": 2.2485, "step": 395810 }, { "epoch": 0.69, "learning_rate": 1.5486873816341547e-05, "loss": 2.2883, "step": 395820 }, { "epoch": 0.69, "learning_rate": 1.5486001876414724e-05, "loss": 2.3535, "step": 395830 }, { "epoch": 0.69, "learning_rate": 1.5485129936487898e-05, "loss": 2.2573, "step": 395840 }, { "epoch": 0.69, "learning_rate": 1.548425799656107e-05, "loss": 2.2468, "step": 395850 }, { "epoch": 0.69, "learning_rate": 1.5483386056634246e-05, "loss": 2.3805, "step": 395860 }, { "epoch": 0.69, "learning_rate": 1.5482514116707416e-05, "loss": 2.1986, "step": 395870 }, { "epoch": 0.69, "learning_rate": 1.548164217678059e-05, "loss": 2.3739, "step": 395880 }, { "epoch": 0.69, "learning_rate": 1.548077023685376e-05, "loss": 2.262, "step": 395890 }, { "epoch": 0.69, "learning_rate": 1.5479898296926937e-05, "loss": 2.3751, "step": 395900 }, { "epoch": 0.69, "learning_rate": 1.5479026357000108e-05, "loss": 2.3785, "step": 395910 }, { "epoch": 0.69, "learning_rate": 1.547815441707328e-05, "loss": 2.3951, "step": 395920 }, { "epoch": 0.69, "learning_rate": 1.5477282477146455e-05, "loss": 2.3301, "step": 395930 }, { "epoch": 0.69, "learning_rate": 1.547641053721963e-05, "loss": 2.2652, "step": 395940 }, { "epoch": 0.69, "learning_rate": 1.5475538597292803e-05, "loss": 2.2359, "step": 395950 }, { "epoch": 0.69, "learning_rate": 1.5474666657365973e-05, "loss": 2.4125, "step": 395960 }, { "epoch": 0.69, "learning_rate": 1.5473794717439147e-05, "loss": 2.2798, "step": 395970 }, { "epoch": 0.69, "learning_rate": 1.547292277751232e-05, "loss": 2.3076, "step": 395980 }, { "epoch": 0.69, "learning_rate": 1.5472050837585495e-05, "loss": 2.2653, "step": 395990 }, { "epoch": 0.69, "learning_rate": 1.5471178897658668e-05, "loss": 2.277, "step": 396000 }, { "epoch": 0.69, "learning_rate": 1.5470306957731842e-05, "loss": 2.3755, "step": 396010 }, { "epoch": 0.69, "learning_rate": 1.5469435017805016e-05, "loss": 2.2765, "step": 396020 }, { "epoch": 0.69, "learning_rate": 1.5468563077878186e-05, "loss": 2.3161, "step": 396030 }, { "epoch": 0.69, "learning_rate": 1.546769113795136e-05, "loss": 2.4009, "step": 396040 }, { "epoch": 0.69, "learning_rate": 1.5466819198024534e-05, "loss": 2.2029, "step": 396050 }, { "epoch": 0.69, "learning_rate": 1.5465947258097708e-05, "loss": 2.3889, "step": 396060 }, { "epoch": 0.69, "learning_rate": 1.546507531817088e-05, "loss": 2.3063, "step": 396070 }, { "epoch": 0.69, "learning_rate": 1.546420337824405e-05, "loss": 2.2994, "step": 396080 }, { "epoch": 0.69, "learning_rate": 1.546333143831723e-05, "loss": 2.2075, "step": 396090 }, { "epoch": 0.69, "learning_rate": 1.54624594983904e-05, "loss": 2.3803, "step": 396100 }, { "epoch": 0.69, "learning_rate": 1.5461587558463573e-05, "loss": 2.3699, "step": 396110 }, { "epoch": 0.69, "learning_rate": 1.5460715618536743e-05, "loss": 2.2639, "step": 396120 }, { "epoch": 0.69, "learning_rate": 1.545984367860992e-05, "loss": 2.1862, "step": 396130 }, { "epoch": 0.69, "learning_rate": 1.545897173868309e-05, "loss": 2.2633, "step": 396140 }, { "epoch": 0.69, "learning_rate": 1.5458099798756265e-05, "loss": 2.3473, "step": 396150 }, { "epoch": 0.69, "learning_rate": 1.545722785882944e-05, "loss": 2.3035, "step": 396160 }, { "epoch": 0.69, "learning_rate": 1.5456355918902612e-05, "loss": 2.4039, "step": 396170 }, { "epoch": 0.69, "learning_rate": 1.5455483978975786e-05, "loss": 2.2843, "step": 396180 }, { "epoch": 0.69, "learning_rate": 1.5454612039048956e-05, "loss": 2.3618, "step": 396190 }, { "epoch": 0.69, "learning_rate": 1.5453740099122134e-05, "loss": 2.3015, "step": 396200 }, { "epoch": 0.69, "learning_rate": 1.5452868159195304e-05, "loss": 2.3223, "step": 396210 }, { "epoch": 0.69, "learning_rate": 1.5451996219268478e-05, "loss": 2.3696, "step": 396220 }, { "epoch": 0.69, "learning_rate": 1.545112427934165e-05, "loss": 2.1819, "step": 396230 }, { "epoch": 0.69, "learning_rate": 1.5450252339414825e-05, "loss": 2.3864, "step": 396240 }, { "epoch": 0.69, "learning_rate": 1.5449380399488e-05, "loss": 2.2728, "step": 396250 }, { "epoch": 0.69, "learning_rate": 1.544850845956117e-05, "loss": 2.1907, "step": 396260 }, { "epoch": 0.69, "learning_rate": 1.5447636519634347e-05, "loss": 2.2569, "step": 396270 }, { "epoch": 0.69, "learning_rate": 1.5446764579707517e-05, "loss": 2.1923, "step": 396280 }, { "epoch": 0.69, "learning_rate": 1.544589263978069e-05, "loss": 2.2929, "step": 396290 }, { "epoch": 0.69, "learning_rate": 1.544502069985386e-05, "loss": 2.2554, "step": 396300 }, { "epoch": 0.69, "learning_rate": 1.5444148759927038e-05, "loss": 2.4119, "step": 396310 }, { "epoch": 0.69, "learning_rate": 1.5443276820000212e-05, "loss": 2.312, "step": 396320 }, { "epoch": 0.69, "learning_rate": 1.5442404880073382e-05, "loss": 2.2583, "step": 396330 }, { "epoch": 0.69, "learning_rate": 1.5441532940146556e-05, "loss": 2.3277, "step": 396340 }, { "epoch": 0.69, "learning_rate": 1.544066100021973e-05, "loss": 2.3189, "step": 396350 }, { "epoch": 0.69, "learning_rate": 1.5439789060292904e-05, "loss": 2.3145, "step": 396360 }, { "epoch": 0.69, "learning_rate": 1.5438917120366074e-05, "loss": 2.4206, "step": 396370 }, { "epoch": 0.69, "learning_rate": 1.5438045180439248e-05, "loss": 2.2821, "step": 396380 }, { "epoch": 0.69, "learning_rate": 1.543717324051242e-05, "loss": 2.4179, "step": 396390 }, { "epoch": 0.69, "learning_rate": 1.5436301300585595e-05, "loss": 2.2795, "step": 396400 }, { "epoch": 0.69, "learning_rate": 1.543542936065877e-05, "loss": 2.2551, "step": 396410 }, { "epoch": 0.69, "learning_rate": 1.5434557420731943e-05, "loss": 2.2993, "step": 396420 }, { "epoch": 0.69, "learning_rate": 1.5433685480805117e-05, "loss": 2.2638, "step": 396430 }, { "epoch": 0.69, "learning_rate": 1.5432813540878287e-05, "loss": 2.4121, "step": 396440 }, { "epoch": 0.69, "learning_rate": 1.543194160095146e-05, "loss": 2.4194, "step": 396450 }, { "epoch": 0.69, "learning_rate": 1.5431069661024635e-05, "loss": 2.2919, "step": 396460 }, { "epoch": 0.69, "learning_rate": 1.543019772109781e-05, "loss": 2.2703, "step": 396470 }, { "epoch": 0.69, "learning_rate": 1.5429325781170982e-05, "loss": 2.3149, "step": 396480 }, { "epoch": 0.69, "learning_rate": 1.5428453841244153e-05, "loss": 2.3277, "step": 396490 }, { "epoch": 0.69, "learning_rate": 1.542758190131733e-05, "loss": 2.446, "step": 396500 }, { "epoch": 0.69, "learning_rate": 1.54267099613905e-05, "loss": 2.3854, "step": 396510 }, { "epoch": 0.69, "learning_rate": 1.5425838021463674e-05, "loss": 2.2283, "step": 396520 }, { "epoch": 0.69, "learning_rate": 1.5424966081536848e-05, "loss": 2.2674, "step": 396530 }, { "epoch": 0.69, "learning_rate": 1.542409414161002e-05, "loss": 2.379, "step": 396540 }, { "epoch": 0.69, "learning_rate": 1.5423222201683192e-05, "loss": 2.3307, "step": 396550 }, { "epoch": 0.69, "learning_rate": 1.5422350261756366e-05, "loss": 2.2013, "step": 396560 }, { "epoch": 0.69, "learning_rate": 1.5421478321829543e-05, "loss": 2.4225, "step": 396570 }, { "epoch": 0.69, "learning_rate": 1.5420606381902713e-05, "loss": 2.3182, "step": 396580 }, { "epoch": 0.69, "learning_rate": 1.5419734441975887e-05, "loss": 2.2513, "step": 396590 }, { "epoch": 0.69, "learning_rate": 1.5418862502049057e-05, "loss": 2.3567, "step": 396600 }, { "epoch": 0.69, "learning_rate": 1.5417990562122234e-05, "loss": 2.1942, "step": 396610 }, { "epoch": 0.69, "learning_rate": 1.5417118622195405e-05, "loss": 2.3136, "step": 396620 }, { "epoch": 0.69, "learning_rate": 1.541624668226858e-05, "loss": 2.2089, "step": 396630 }, { "epoch": 0.69, "learning_rate": 1.5415374742341752e-05, "loss": 2.3091, "step": 396640 }, { "epoch": 0.69, "learning_rate": 1.5414502802414926e-05, "loss": 2.2761, "step": 396650 }, { "epoch": 0.69, "learning_rate": 1.54136308624881e-05, "loss": 2.2758, "step": 396660 }, { "epoch": 0.69, "learning_rate": 1.541275892256127e-05, "loss": 2.2872, "step": 396670 }, { "epoch": 0.69, "learning_rate": 1.5411886982634447e-05, "loss": 2.3283, "step": 396680 }, { "epoch": 0.69, "learning_rate": 1.5411015042707618e-05, "loss": 2.3407, "step": 396690 }, { "epoch": 0.69, "learning_rate": 1.541014310278079e-05, "loss": 2.175, "step": 396700 }, { "epoch": 0.69, "learning_rate": 1.5409271162853965e-05, "loss": 2.4709, "step": 396710 }, { "epoch": 0.69, "learning_rate": 1.540839922292714e-05, "loss": 2.3246, "step": 396720 }, { "epoch": 0.69, "learning_rate": 1.5407527283000313e-05, "loss": 2.3841, "step": 396730 }, { "epoch": 0.69, "learning_rate": 1.5406655343073483e-05, "loss": 2.2988, "step": 396740 }, { "epoch": 0.69, "learning_rate": 1.5405783403146657e-05, "loss": 2.3253, "step": 396750 }, { "epoch": 0.69, "learning_rate": 1.540491146321983e-05, "loss": 2.2669, "step": 396760 }, { "epoch": 0.69, "learning_rate": 1.5404039523293005e-05, "loss": 2.1275, "step": 396770 }, { "epoch": 0.69, "learning_rate": 1.5403167583366175e-05, "loss": 2.2495, "step": 396780 }, { "epoch": 0.69, "learning_rate": 1.5402295643439352e-05, "loss": 2.3549, "step": 396790 }, { "epoch": 0.69, "learning_rate": 1.5401423703512526e-05, "loss": 2.3201, "step": 396800 }, { "epoch": 0.69, "learning_rate": 1.5400551763585696e-05, "loss": 2.3674, "step": 396810 }, { "epoch": 0.69, "learning_rate": 1.539967982365887e-05, "loss": 2.2574, "step": 396820 }, { "epoch": 0.69, "learning_rate": 1.5398807883732044e-05, "loss": 2.2853, "step": 396830 }, { "epoch": 0.69, "learning_rate": 1.5397935943805218e-05, "loss": 2.3814, "step": 396840 }, { "epoch": 0.69, "learning_rate": 1.5397064003878388e-05, "loss": 2.3429, "step": 396850 }, { "epoch": 0.69, "learning_rate": 1.539619206395156e-05, "loss": 2.329, "step": 396860 }, { "epoch": 0.69, "learning_rate": 1.5395320124024735e-05, "loss": 2.4073, "step": 396870 }, { "epoch": 0.69, "learning_rate": 1.539444818409791e-05, "loss": 2.2175, "step": 396880 }, { "epoch": 0.69, "learning_rate": 1.5393576244171083e-05, "loss": 2.2429, "step": 396890 }, { "epoch": 0.69, "learning_rate": 1.5392704304244253e-05, "loss": 2.3169, "step": 396900 }, { "epoch": 0.69, "learning_rate": 1.539183236431743e-05, "loss": 2.3209, "step": 396910 }, { "epoch": 0.69, "learning_rate": 1.53909604243906e-05, "loss": 2.3308, "step": 396920 }, { "epoch": 0.69, "learning_rate": 1.5390088484463775e-05, "loss": 2.2785, "step": 396930 }, { "epoch": 0.69, "learning_rate": 1.538921654453695e-05, "loss": 2.3832, "step": 396940 }, { "epoch": 0.69, "learning_rate": 1.5388344604610122e-05, "loss": 2.4079, "step": 396950 }, { "epoch": 0.69, "learning_rate": 1.5387472664683296e-05, "loss": 2.3713, "step": 396960 }, { "epoch": 0.69, "learning_rate": 1.5386600724756466e-05, "loss": 2.2909, "step": 396970 }, { "epoch": 0.69, "learning_rate": 1.5385728784829644e-05, "loss": 2.2836, "step": 396980 }, { "epoch": 0.69, "learning_rate": 1.5384856844902814e-05, "loss": 2.2994, "step": 396990 }, { "epoch": 0.69, "learning_rate": 1.5383984904975988e-05, "loss": 2.2853, "step": 397000 }, { "epoch": 0.69, "learning_rate": 1.5383112965049158e-05, "loss": 2.2705, "step": 397010 }, { "epoch": 0.69, "learning_rate": 1.5382241025122335e-05, "loss": 2.3626, "step": 397020 }, { "epoch": 0.69, "learning_rate": 1.5381369085195506e-05, "loss": 2.3657, "step": 397030 }, { "epoch": 0.69, "learning_rate": 1.538049714526868e-05, "loss": 2.2865, "step": 397040 }, { "epoch": 0.69, "learning_rate": 1.5379625205341853e-05, "loss": 2.3215, "step": 397050 }, { "epoch": 0.69, "learning_rate": 1.5378753265415027e-05, "loss": 2.2779, "step": 397060 }, { "epoch": 0.69, "learning_rate": 1.53778813254882e-05, "loss": 2.318, "step": 397070 }, { "epoch": 0.69, "learning_rate": 1.537700938556137e-05, "loss": 2.2654, "step": 397080 }, { "epoch": 0.69, "learning_rate": 1.5376137445634548e-05, "loss": 2.3914, "step": 397090 }, { "epoch": 0.69, "learning_rate": 1.537526550570772e-05, "loss": 2.2859, "step": 397100 }, { "epoch": 0.69, "learning_rate": 1.5374393565780892e-05, "loss": 2.2715, "step": 397110 }, { "epoch": 0.69, "learning_rate": 1.5373521625854066e-05, "loss": 2.2473, "step": 397120 }, { "epoch": 0.69, "learning_rate": 1.537264968592724e-05, "loss": 2.2281, "step": 397130 }, { "epoch": 0.69, "learning_rate": 1.5371777746000414e-05, "loss": 2.286, "step": 397140 }, { "epoch": 0.69, "learning_rate": 1.5370905806073584e-05, "loss": 2.4335, "step": 397150 }, { "epoch": 0.69, "learning_rate": 1.5370033866146758e-05, "loss": 2.2875, "step": 397160 }, { "epoch": 0.69, "learning_rate": 1.536916192621993e-05, "loss": 2.3389, "step": 397170 }, { "epoch": 0.69, "learning_rate": 1.5368289986293105e-05, "loss": 2.3979, "step": 397180 }, { "epoch": 0.69, "learning_rate": 1.536741804636628e-05, "loss": 2.34, "step": 397190 }, { "epoch": 0.69, "learning_rate": 1.5366546106439453e-05, "loss": 2.2795, "step": 397200 }, { "epoch": 0.69, "learning_rate": 1.5365674166512627e-05, "loss": 2.3282, "step": 397210 }, { "epoch": 0.69, "learning_rate": 1.5364802226585797e-05, "loss": 2.3454, "step": 397220 }, { "epoch": 0.69, "learning_rate": 1.536393028665897e-05, "loss": 2.252, "step": 397230 }, { "epoch": 0.69, "learning_rate": 1.5363058346732145e-05, "loss": 2.2852, "step": 397240 }, { "epoch": 0.69, "learning_rate": 1.536218640680532e-05, "loss": 2.362, "step": 397250 }, { "epoch": 0.69, "learning_rate": 1.536131446687849e-05, "loss": 2.2083, "step": 397260 }, { "epoch": 0.69, "learning_rate": 1.5360442526951663e-05, "loss": 2.2981, "step": 397270 }, { "epoch": 0.69, "learning_rate": 1.535957058702484e-05, "loss": 2.3123, "step": 397280 }, { "epoch": 0.69, "learning_rate": 1.535869864709801e-05, "loss": 2.314, "step": 397290 }, { "epoch": 0.69, "learning_rate": 1.5357826707171184e-05, "loss": 2.304, "step": 397300 }, { "epoch": 0.69, "learning_rate": 1.5356954767244354e-05, "loss": 2.2802, "step": 397310 }, { "epoch": 0.69, "learning_rate": 1.535608282731753e-05, "loss": 2.2816, "step": 397320 }, { "epoch": 0.69, "learning_rate": 1.5355210887390702e-05, "loss": 2.2673, "step": 397330 }, { "epoch": 0.69, "learning_rate": 1.5354338947463876e-05, "loss": 2.2474, "step": 397340 }, { "epoch": 0.69, "learning_rate": 1.535346700753705e-05, "loss": 2.4621, "step": 397350 }, { "epoch": 0.69, "learning_rate": 1.5352595067610223e-05, "loss": 2.3762, "step": 397360 }, { "epoch": 0.69, "learning_rate": 1.5351723127683397e-05, "loss": 2.2136, "step": 397370 }, { "epoch": 0.69, "learning_rate": 1.5350851187756567e-05, "loss": 2.3029, "step": 397380 }, { "epoch": 0.69, "learning_rate": 1.5349979247829744e-05, "loss": 2.3313, "step": 397390 }, { "epoch": 0.69, "learning_rate": 1.5349107307902915e-05, "loss": 2.2845, "step": 397400 }, { "epoch": 0.69, "learning_rate": 1.534823536797609e-05, "loss": 2.3748, "step": 397410 }, { "epoch": 0.69, "learning_rate": 1.5347363428049262e-05, "loss": 2.3053, "step": 397420 }, { "epoch": 0.69, "learning_rate": 1.5346491488122436e-05, "loss": 2.3873, "step": 397430 }, { "epoch": 0.69, "learning_rate": 1.534561954819561e-05, "loss": 2.2546, "step": 397440 }, { "epoch": 0.69, "learning_rate": 1.534474760826878e-05, "loss": 2.4081, "step": 397450 }, { "epoch": 0.69, "learning_rate": 1.5343875668341957e-05, "loss": 2.3718, "step": 397460 }, { "epoch": 0.69, "learning_rate": 1.5343003728415128e-05, "loss": 2.4268, "step": 397470 }, { "epoch": 0.69, "learning_rate": 1.53421317884883e-05, "loss": 2.356, "step": 397480 }, { "epoch": 0.69, "learning_rate": 1.5341259848561472e-05, "loss": 2.4205, "step": 397490 }, { "epoch": 0.69, "learning_rate": 1.534038790863465e-05, "loss": 2.2566, "step": 397500 }, { "epoch": 0.69, "learning_rate": 1.533951596870782e-05, "loss": 2.3289, "step": 397510 }, { "epoch": 0.69, "learning_rate": 1.5338644028780993e-05, "loss": 2.2578, "step": 397520 }, { "epoch": 0.69, "learning_rate": 1.5337772088854167e-05, "loss": 2.3334, "step": 397530 }, { "epoch": 0.69, "learning_rate": 1.533690014892734e-05, "loss": 2.3298, "step": 397540 }, { "epoch": 0.69, "learning_rate": 1.5336028209000515e-05, "loss": 2.141, "step": 397550 }, { "epoch": 0.69, "learning_rate": 1.5335156269073685e-05, "loss": 2.2419, "step": 397560 }, { "epoch": 0.69, "learning_rate": 1.533428432914686e-05, "loss": 2.2974, "step": 397570 }, { "epoch": 0.69, "learning_rate": 1.5333412389220032e-05, "loss": 2.3032, "step": 397580 }, { "epoch": 0.69, "learning_rate": 1.5332540449293206e-05, "loss": 2.3134, "step": 397590 }, { "epoch": 0.69, "learning_rate": 1.533166850936638e-05, "loss": 2.3651, "step": 397600 }, { "epoch": 0.69, "learning_rate": 1.5330796569439554e-05, "loss": 2.3105, "step": 397610 }, { "epoch": 0.69, "learning_rate": 1.5329924629512728e-05, "loss": 2.3277, "step": 397620 }, { "epoch": 0.69, "learning_rate": 1.5329052689585898e-05, "loss": 2.3321, "step": 397630 }, { "epoch": 0.69, "learning_rate": 1.532818074965907e-05, "loss": 2.2878, "step": 397640 }, { "epoch": 0.69, "learning_rate": 1.5327308809732245e-05, "loss": 2.2543, "step": 397650 }, { "epoch": 0.69, "learning_rate": 1.532643686980542e-05, "loss": 2.3129, "step": 397660 }, { "epoch": 0.69, "learning_rate": 1.5325564929878593e-05, "loss": 2.2757, "step": 397670 }, { "epoch": 0.69, "learning_rate": 1.5324692989951763e-05, "loss": 2.2983, "step": 397680 }, { "epoch": 0.69, "learning_rate": 1.532382105002494e-05, "loss": 2.2269, "step": 397690 }, { "epoch": 0.69, "learning_rate": 1.532294911009811e-05, "loss": 2.2703, "step": 397700 }, { "epoch": 0.69, "learning_rate": 1.5322077170171285e-05, "loss": 2.2738, "step": 397710 }, { "epoch": 0.69, "learning_rate": 1.532120523024446e-05, "loss": 2.2162, "step": 397720 }, { "epoch": 0.69, "learning_rate": 1.5320333290317632e-05, "loss": 2.3062, "step": 397730 }, { "epoch": 0.69, "learning_rate": 1.5319461350390803e-05, "loss": 2.4196, "step": 397740 }, { "epoch": 0.69, "learning_rate": 1.5318589410463976e-05, "loss": 2.4371, "step": 397750 }, { "epoch": 0.69, "learning_rate": 1.531771747053715e-05, "loss": 2.345, "step": 397760 }, { "epoch": 0.69, "learning_rate": 1.5316845530610324e-05, "loss": 2.3785, "step": 397770 }, { "epoch": 0.69, "learning_rate": 1.5315973590683498e-05, "loss": 2.3155, "step": 397780 }, { "epoch": 0.69, "learning_rate": 1.5315101650756668e-05, "loss": 2.2764, "step": 397790 }, { "epoch": 0.69, "learning_rate": 1.5314229710829845e-05, "loss": 2.3887, "step": 397800 }, { "epoch": 0.69, "learning_rate": 1.5313357770903016e-05, "loss": 2.3019, "step": 397810 }, { "epoch": 0.69, "learning_rate": 1.531248583097619e-05, "loss": 2.3632, "step": 397820 }, { "epoch": 0.69, "learning_rate": 1.5311613891049363e-05, "loss": 2.3322, "step": 397830 }, { "epoch": 0.69, "learning_rate": 1.5310741951122537e-05, "loss": 2.3158, "step": 397840 }, { "epoch": 0.69, "learning_rate": 1.530987001119571e-05, "loss": 2.2786, "step": 397850 }, { "epoch": 0.69, "learning_rate": 1.530899807126888e-05, "loss": 2.2971, "step": 397860 }, { "epoch": 0.69, "learning_rate": 1.5308126131342058e-05, "loss": 2.2399, "step": 397870 }, { "epoch": 0.69, "learning_rate": 1.530725419141523e-05, "loss": 2.2705, "step": 397880 }, { "epoch": 0.69, "learning_rate": 1.5306382251488402e-05, "loss": 2.2576, "step": 397890 }, { "epoch": 0.69, "learning_rate": 1.5305510311561576e-05, "loss": 2.321, "step": 397900 }, { "epoch": 0.69, "learning_rate": 1.530463837163475e-05, "loss": 2.2492, "step": 397910 }, { "epoch": 0.69, "learning_rate": 1.5303766431707924e-05, "loss": 2.3147, "step": 397920 }, { "epoch": 0.69, "learning_rate": 1.5302894491781094e-05, "loss": 2.2829, "step": 397930 }, { "epoch": 0.69, "learning_rate": 1.5302022551854268e-05, "loss": 2.2388, "step": 397940 }, { "epoch": 0.69, "learning_rate": 1.530115061192744e-05, "loss": 2.3234, "step": 397950 }, { "epoch": 0.69, "learning_rate": 1.5300278672000615e-05, "loss": 2.2323, "step": 397960 }, { "epoch": 0.69, "learning_rate": 1.5299406732073786e-05, "loss": 2.3307, "step": 397970 }, { "epoch": 0.69, "learning_rate": 1.529853479214696e-05, "loss": 2.2935, "step": 397980 }, { "epoch": 0.69, "learning_rate": 1.5297662852220133e-05, "loss": 2.2337, "step": 397990 }, { "epoch": 0.69, "learning_rate": 1.5296790912293307e-05, "loss": 2.3382, "step": 398000 }, { "epoch": 0.69, "learning_rate": 1.529591897236648e-05, "loss": 2.226, "step": 398010 }, { "epoch": 0.69, "learning_rate": 1.5295047032439655e-05, "loss": 2.1419, "step": 398020 }, { "epoch": 0.69, "learning_rate": 1.529417509251283e-05, "loss": 2.3141, "step": 398030 }, { "epoch": 0.69, "learning_rate": 1.5293303152586e-05, "loss": 2.3895, "step": 398040 }, { "epoch": 0.69, "learning_rate": 1.5292431212659173e-05, "loss": 2.3832, "step": 398050 }, { "epoch": 0.69, "learning_rate": 1.5291559272732346e-05, "loss": 2.4115, "step": 398060 }, { "epoch": 0.69, "learning_rate": 1.529068733280552e-05, "loss": 2.238, "step": 398070 }, { "epoch": 0.69, "learning_rate": 1.5289815392878694e-05, "loss": 2.4244, "step": 398080 }, { "epoch": 0.69, "learning_rate": 1.5288943452951864e-05, "loss": 2.435, "step": 398090 }, { "epoch": 0.69, "learning_rate": 1.528807151302504e-05, "loss": 2.3677, "step": 398100 }, { "epoch": 0.69, "learning_rate": 1.5287199573098212e-05, "loss": 2.415, "step": 398110 }, { "epoch": 0.69, "learning_rate": 1.5286327633171386e-05, "loss": 2.293, "step": 398120 }, { "epoch": 0.69, "learning_rate": 1.528545569324456e-05, "loss": 2.2891, "step": 398130 }, { "epoch": 0.69, "learning_rate": 1.5284583753317733e-05, "loss": 2.3227, "step": 398140 }, { "epoch": 0.69, "learning_rate": 1.5283711813390907e-05, "loss": 2.2517, "step": 398150 }, { "epoch": 0.69, "learning_rate": 1.5282839873464077e-05, "loss": 2.3309, "step": 398160 }, { "epoch": 0.69, "learning_rate": 1.5281967933537254e-05, "loss": 2.3424, "step": 398170 }, { "epoch": 0.69, "learning_rate": 1.5281095993610425e-05, "loss": 2.2622, "step": 398180 }, { "epoch": 0.69, "learning_rate": 1.52802240536836e-05, "loss": 2.3076, "step": 398190 }, { "epoch": 0.69, "learning_rate": 1.527935211375677e-05, "loss": 2.3092, "step": 398200 }, { "epoch": 0.69, "learning_rate": 1.5278480173829946e-05, "loss": 2.328, "step": 398210 }, { "epoch": 0.69, "learning_rate": 1.5277608233903116e-05, "loss": 2.2264, "step": 398220 }, { "epoch": 0.69, "learning_rate": 1.527673629397629e-05, "loss": 2.3936, "step": 398230 }, { "epoch": 0.69, "learning_rate": 1.5275864354049464e-05, "loss": 2.2692, "step": 398240 }, { "epoch": 0.69, "learning_rate": 1.5274992414122638e-05, "loss": 2.3768, "step": 398250 }, { "epoch": 0.69, "learning_rate": 1.527412047419581e-05, "loss": 2.2573, "step": 398260 }, { "epoch": 0.69, "learning_rate": 1.5273248534268982e-05, "loss": 2.4525, "step": 398270 }, { "epoch": 0.69, "learning_rate": 1.527237659434216e-05, "loss": 2.4224, "step": 398280 }, { "epoch": 0.69, "learning_rate": 1.527150465441533e-05, "loss": 2.2197, "step": 398290 }, { "epoch": 0.69, "learning_rate": 1.5270632714488503e-05, "loss": 2.3149, "step": 398300 }, { "epoch": 0.69, "learning_rate": 1.5269760774561677e-05, "loss": 2.1988, "step": 398310 }, { "epoch": 0.69, "learning_rate": 1.526888883463485e-05, "loss": 2.3999, "step": 398320 }, { "epoch": 0.69, "learning_rate": 1.5268016894708025e-05, "loss": 2.2879, "step": 398330 }, { "epoch": 0.69, "learning_rate": 1.5267144954781195e-05, "loss": 2.3095, "step": 398340 }, { "epoch": 0.69, "learning_rate": 1.526627301485437e-05, "loss": 2.29, "step": 398350 }, { "epoch": 0.69, "learning_rate": 1.5265401074927542e-05, "loss": 2.1799, "step": 398360 }, { "epoch": 0.69, "learning_rate": 1.5264529135000716e-05, "loss": 2.3708, "step": 398370 }, { "epoch": 0.69, "learning_rate": 1.5263657195073887e-05, "loss": 2.328, "step": 398380 }, { "epoch": 0.69, "learning_rate": 1.5262785255147064e-05, "loss": 2.2672, "step": 398390 }, { "epoch": 0.69, "learning_rate": 1.5261913315220238e-05, "loss": 2.2802, "step": 398400 }, { "epoch": 0.69, "learning_rate": 1.5261041375293408e-05, "loss": 2.3122, "step": 398410 }, { "epoch": 0.69, "learning_rate": 1.526016943536658e-05, "loss": 2.1281, "step": 398420 }, { "epoch": 0.69, "learning_rate": 1.5259297495439755e-05, "loss": 2.3292, "step": 398430 }, { "epoch": 0.69, "learning_rate": 1.525842555551293e-05, "loss": 2.3434, "step": 398440 }, { "epoch": 0.69, "learning_rate": 1.5257553615586101e-05, "loss": 2.2391, "step": 398450 }, { "epoch": 0.69, "learning_rate": 1.5256681675659273e-05, "loss": 2.2508, "step": 398460 }, { "epoch": 0.69, "learning_rate": 1.5255809735732449e-05, "loss": 2.3562, "step": 398470 }, { "epoch": 0.69, "learning_rate": 1.5254937795805621e-05, "loss": 2.3362, "step": 398480 }, { "epoch": 0.69, "learning_rate": 1.5254065855878793e-05, "loss": 2.2035, "step": 398490 }, { "epoch": 0.69, "learning_rate": 1.5253193915951967e-05, "loss": 2.4258, "step": 398500 }, { "epoch": 0.69, "learning_rate": 1.525232197602514e-05, "loss": 2.3688, "step": 398510 }, { "epoch": 0.69, "learning_rate": 1.5251450036098314e-05, "loss": 2.2958, "step": 398520 }, { "epoch": 0.69, "learning_rate": 1.5250578096171486e-05, "loss": 2.2612, "step": 398530 }, { "epoch": 0.7, "learning_rate": 1.5249706156244662e-05, "loss": 2.2705, "step": 398540 }, { "epoch": 0.7, "learning_rate": 1.5248834216317834e-05, "loss": 2.2602, "step": 398550 }, { "epoch": 0.7, "learning_rate": 1.5247962276391006e-05, "loss": 2.1693, "step": 398560 }, { "epoch": 0.7, "learning_rate": 1.5247090336464178e-05, "loss": 2.3598, "step": 398570 }, { "epoch": 0.7, "learning_rate": 1.5246218396537354e-05, "loss": 2.3635, "step": 398580 }, { "epoch": 0.7, "learning_rate": 1.5245346456610526e-05, "loss": 2.328, "step": 398590 }, { "epoch": 0.7, "learning_rate": 1.52444745166837e-05, "loss": 2.2707, "step": 398600 }, { "epoch": 0.7, "learning_rate": 1.5243602576756871e-05, "loss": 2.3478, "step": 398610 }, { "epoch": 0.7, "learning_rate": 1.5242730636830047e-05, "loss": 2.3767, "step": 398620 }, { "epoch": 0.7, "learning_rate": 1.5241858696903219e-05, "loss": 2.17, "step": 398630 }, { "epoch": 0.7, "learning_rate": 1.5240986756976391e-05, "loss": 2.2585, "step": 398640 }, { "epoch": 0.7, "learning_rate": 1.5240114817049563e-05, "loss": 2.2552, "step": 398650 }, { "epoch": 0.7, "learning_rate": 1.5239242877122739e-05, "loss": 2.304, "step": 398660 }, { "epoch": 0.7, "learning_rate": 1.5238370937195912e-05, "loss": 2.3271, "step": 398670 }, { "epoch": 0.7, "learning_rate": 1.5237498997269084e-05, "loss": 2.4087, "step": 398680 }, { "epoch": 0.7, "learning_rate": 1.523662705734226e-05, "loss": 2.2433, "step": 398690 }, { "epoch": 0.7, "learning_rate": 1.5235755117415432e-05, "loss": 2.3141, "step": 398700 }, { "epoch": 0.7, "learning_rate": 1.5234883177488604e-05, "loss": 2.3355, "step": 398710 }, { "epoch": 0.7, "learning_rate": 1.5234011237561776e-05, "loss": 2.3807, "step": 398720 }, { "epoch": 0.7, "learning_rate": 1.5233139297634952e-05, "loss": 2.2294, "step": 398730 }, { "epoch": 0.7, "learning_rate": 1.5232267357708124e-05, "loss": 2.1472, "step": 398740 }, { "epoch": 0.7, "learning_rate": 1.5231395417781297e-05, "loss": 2.2988, "step": 398750 }, { "epoch": 0.7, "learning_rate": 1.523052347785447e-05, "loss": 2.3928, "step": 398760 }, { "epoch": 0.7, "learning_rate": 1.5229651537927645e-05, "loss": 2.3178, "step": 398770 }, { "epoch": 0.7, "learning_rate": 1.5228779598000817e-05, "loss": 2.3277, "step": 398780 }, { "epoch": 0.7, "learning_rate": 1.5227907658073989e-05, "loss": 2.1567, "step": 398790 }, { "epoch": 0.7, "learning_rate": 1.5227035718147165e-05, "loss": 2.2519, "step": 398800 }, { "epoch": 0.7, "learning_rate": 1.5226163778220337e-05, "loss": 2.2675, "step": 398810 }, { "epoch": 0.7, "learning_rate": 1.5225291838293509e-05, "loss": 2.2054, "step": 398820 }, { "epoch": 0.7, "learning_rate": 1.5224419898366683e-05, "loss": 2.3419, "step": 398830 }, { "epoch": 0.7, "learning_rate": 1.5223547958439858e-05, "loss": 2.1841, "step": 398840 }, { "epoch": 0.7, "learning_rate": 1.522267601851303e-05, "loss": 2.2743, "step": 398850 }, { "epoch": 0.7, "learning_rate": 1.5221804078586202e-05, "loss": 2.3222, "step": 398860 }, { "epoch": 0.7, "learning_rate": 1.5220932138659374e-05, "loss": 2.2289, "step": 398870 }, { "epoch": 0.7, "learning_rate": 1.522006019873255e-05, "loss": 2.3902, "step": 398880 }, { "epoch": 0.7, "learning_rate": 1.5219188258805722e-05, "loss": 2.2041, "step": 398890 }, { "epoch": 0.7, "learning_rate": 1.5218316318878894e-05, "loss": 2.1734, "step": 398900 }, { "epoch": 0.7, "learning_rate": 1.5217444378952068e-05, "loss": 2.3725, "step": 398910 }, { "epoch": 0.7, "learning_rate": 1.5216572439025243e-05, "loss": 2.3601, "step": 398920 }, { "epoch": 0.7, "learning_rate": 1.5215700499098415e-05, "loss": 2.2902, "step": 398930 }, { "epoch": 0.7, "learning_rate": 1.5214828559171587e-05, "loss": 2.3189, "step": 398940 }, { "epoch": 0.7, "learning_rate": 1.5213956619244763e-05, "loss": 2.1762, "step": 398950 }, { "epoch": 0.7, "learning_rate": 1.5213084679317935e-05, "loss": 2.3245, "step": 398960 }, { "epoch": 0.7, "learning_rate": 1.5212212739391107e-05, "loss": 2.343, "step": 398970 }, { "epoch": 0.7, "learning_rate": 1.521134079946428e-05, "loss": 2.3868, "step": 398980 }, { "epoch": 0.7, "learning_rate": 1.5210468859537454e-05, "loss": 2.3304, "step": 398990 }, { "epoch": 0.7, "learning_rate": 1.5209596919610628e-05, "loss": 2.3113, "step": 399000 }, { "epoch": 0.7, "learning_rate": 1.52087249796838e-05, "loss": 2.0861, "step": 399010 }, { "epoch": 0.7, "learning_rate": 1.5207853039756972e-05, "loss": 2.2944, "step": 399020 }, { "epoch": 0.7, "learning_rate": 1.5206981099830148e-05, "loss": 2.4091, "step": 399030 }, { "epoch": 0.7, "learning_rate": 1.520610915990332e-05, "loss": 2.2496, "step": 399040 }, { "epoch": 0.7, "learning_rate": 1.5205237219976492e-05, "loss": 2.3181, "step": 399050 }, { "epoch": 0.7, "learning_rate": 1.5204365280049667e-05, "loss": 2.2907, "step": 399060 }, { "epoch": 0.7, "learning_rate": 1.520349334012284e-05, "loss": 2.2826, "step": 399070 }, { "epoch": 0.7, "learning_rate": 1.5202621400196013e-05, "loss": 2.2661, "step": 399080 }, { "epoch": 0.7, "learning_rate": 1.5201749460269185e-05, "loss": 2.2618, "step": 399090 }, { "epoch": 0.7, "learning_rate": 1.520087752034236e-05, "loss": 2.3369, "step": 399100 }, { "epoch": 0.7, "learning_rate": 1.5200005580415533e-05, "loss": 2.3886, "step": 399110 }, { "epoch": 0.7, "learning_rate": 1.5199133640488705e-05, "loss": 2.3669, "step": 399120 }, { "epoch": 0.7, "learning_rate": 1.5198261700561877e-05, "loss": 2.2292, "step": 399130 }, { "epoch": 0.7, "learning_rate": 1.5197389760635052e-05, "loss": 2.2915, "step": 399140 }, { "epoch": 0.7, "learning_rate": 1.5196517820708226e-05, "loss": 2.286, "step": 399150 }, { "epoch": 0.7, "learning_rate": 1.5195645880781398e-05, "loss": 2.3198, "step": 399160 }, { "epoch": 0.7, "learning_rate": 1.519477394085457e-05, "loss": 2.2054, "step": 399170 }, { "epoch": 0.7, "learning_rate": 1.5193902000927746e-05, "loss": 2.3742, "step": 399180 }, { "epoch": 0.7, "learning_rate": 1.5193030061000918e-05, "loss": 2.2231, "step": 399190 }, { "epoch": 0.7, "learning_rate": 1.519215812107409e-05, "loss": 2.3406, "step": 399200 }, { "epoch": 0.7, "learning_rate": 1.5191286181147265e-05, "loss": 2.2697, "step": 399210 }, { "epoch": 0.7, "learning_rate": 1.5190414241220438e-05, "loss": 2.2328, "step": 399220 }, { "epoch": 0.7, "learning_rate": 1.5189542301293611e-05, "loss": 2.2116, "step": 399230 }, { "epoch": 0.7, "learning_rate": 1.5188670361366783e-05, "loss": 2.1739, "step": 399240 }, { "epoch": 0.7, "learning_rate": 1.5187798421439959e-05, "loss": 2.3312, "step": 399250 }, { "epoch": 0.7, "learning_rate": 1.5186926481513131e-05, "loss": 2.3088, "step": 399260 }, { "epoch": 0.7, "learning_rate": 1.5186054541586303e-05, "loss": 2.4505, "step": 399270 }, { "epoch": 0.7, "learning_rate": 1.5185182601659475e-05, "loss": 2.3479, "step": 399280 }, { "epoch": 0.7, "learning_rate": 1.518431066173265e-05, "loss": 2.3414, "step": 399290 }, { "epoch": 0.7, "learning_rate": 1.5183438721805823e-05, "loss": 2.2441, "step": 399300 }, { "epoch": 0.7, "learning_rate": 1.5182566781878996e-05, "loss": 2.2602, "step": 399310 }, { "epoch": 0.7, "learning_rate": 1.518169484195217e-05, "loss": 2.2562, "step": 399320 }, { "epoch": 0.7, "learning_rate": 1.5180822902025344e-05, "loss": 2.3237, "step": 399330 }, { "epoch": 0.7, "learning_rate": 1.5179950962098516e-05, "loss": 2.2518, "step": 399340 }, { "epoch": 0.7, "learning_rate": 1.5179079022171688e-05, "loss": 2.3438, "step": 399350 }, { "epoch": 0.7, "learning_rate": 1.5178207082244864e-05, "loss": 2.2361, "step": 399360 }, { "epoch": 0.7, "learning_rate": 1.5177335142318036e-05, "loss": 2.4049, "step": 399370 }, { "epoch": 0.7, "learning_rate": 1.5176463202391208e-05, "loss": 2.2407, "step": 399380 }, { "epoch": 0.7, "learning_rate": 1.5175591262464381e-05, "loss": 2.2378, "step": 399390 }, { "epoch": 0.7, "learning_rate": 1.5174719322537557e-05, "loss": 2.1391, "step": 399400 }, { "epoch": 0.7, "learning_rate": 1.5173847382610729e-05, "loss": 2.3556, "step": 399410 }, { "epoch": 0.7, "learning_rate": 1.5172975442683901e-05, "loss": 2.3587, "step": 399420 }, { "epoch": 0.7, "learning_rate": 1.5172103502757073e-05, "loss": 2.3495, "step": 399430 }, { "epoch": 0.7, "learning_rate": 1.5171231562830249e-05, "loss": 2.266, "step": 399440 }, { "epoch": 0.7, "learning_rate": 1.517035962290342e-05, "loss": 2.3385, "step": 399450 }, { "epoch": 0.7, "learning_rate": 1.5169487682976594e-05, "loss": 2.3987, "step": 399460 }, { "epoch": 0.7, "learning_rate": 1.5168615743049768e-05, "loss": 2.1875, "step": 399470 }, { "epoch": 0.7, "learning_rate": 1.5167743803122942e-05, "loss": 2.2809, "step": 399480 }, { "epoch": 0.7, "learning_rate": 1.5166871863196114e-05, "loss": 2.1601, "step": 399490 }, { "epoch": 0.7, "learning_rate": 1.5165999923269286e-05, "loss": 2.3426, "step": 399500 }, { "epoch": 0.7, "learning_rate": 1.5165127983342462e-05, "loss": 2.2558, "step": 399510 }, { "epoch": 0.7, "learning_rate": 1.5164256043415634e-05, "loss": 2.3171, "step": 399520 }, { "epoch": 0.7, "learning_rate": 1.5163384103488806e-05, "loss": 2.2165, "step": 399530 }, { "epoch": 0.7, "learning_rate": 1.516251216356198e-05, "loss": 2.2667, "step": 399540 }, { "epoch": 0.7, "learning_rate": 1.5161640223635153e-05, "loss": 2.2008, "step": 399550 }, { "epoch": 0.7, "learning_rate": 1.5160768283708327e-05, "loss": 2.3407, "step": 399560 }, { "epoch": 0.7, "learning_rate": 1.5159896343781499e-05, "loss": 2.2799, "step": 399570 }, { "epoch": 0.7, "learning_rate": 1.5159024403854671e-05, "loss": 2.3064, "step": 399580 }, { "epoch": 0.7, "learning_rate": 1.5158152463927847e-05, "loss": 2.2539, "step": 399590 }, { "epoch": 0.7, "learning_rate": 1.5157280524001019e-05, "loss": 2.2829, "step": 399600 }, { "epoch": 0.7, "learning_rate": 1.515640858407419e-05, "loss": 2.265, "step": 399610 }, { "epoch": 0.7, "learning_rate": 1.5155536644147366e-05, "loss": 2.3754, "step": 399620 }, { "epoch": 0.7, "learning_rate": 1.5154664704220538e-05, "loss": 2.3593, "step": 399630 }, { "epoch": 0.7, "learning_rate": 1.5153792764293712e-05, "loss": 2.2924, "step": 399640 }, { "epoch": 0.7, "learning_rate": 1.5152920824366884e-05, "loss": 2.262, "step": 399650 }, { "epoch": 0.7, "learning_rate": 1.515204888444006e-05, "loss": 2.2722, "step": 399660 }, { "epoch": 0.7, "learning_rate": 1.5151176944513232e-05, "loss": 2.317, "step": 399670 }, { "epoch": 0.7, "learning_rate": 1.5150305004586404e-05, "loss": 2.2415, "step": 399680 }, { "epoch": 0.7, "learning_rate": 1.5149433064659576e-05, "loss": 2.2741, "step": 399690 }, { "epoch": 0.7, "learning_rate": 1.5148561124732751e-05, "loss": 2.3447, "step": 399700 }, { "epoch": 0.7, "learning_rate": 1.5147689184805925e-05, "loss": 2.2687, "step": 399710 }, { "epoch": 0.7, "learning_rate": 1.5146817244879097e-05, "loss": 2.3792, "step": 399720 }, { "epoch": 0.7, "learning_rate": 1.5145945304952273e-05, "loss": 2.3499, "step": 399730 }, { "epoch": 0.7, "learning_rate": 1.5145073365025445e-05, "loss": 2.3838, "step": 399740 }, { "epoch": 0.7, "learning_rate": 1.5144201425098617e-05, "loss": 2.1788, "step": 399750 }, { "epoch": 0.7, "learning_rate": 1.5143329485171789e-05, "loss": 2.3289, "step": 399760 }, { "epoch": 0.7, "learning_rate": 1.5142457545244964e-05, "loss": 2.3245, "step": 399770 }, { "epoch": 0.7, "learning_rate": 1.5141585605318136e-05, "loss": 2.2909, "step": 399780 }, { "epoch": 0.7, "learning_rate": 1.514071366539131e-05, "loss": 2.3831, "step": 399790 }, { "epoch": 0.7, "learning_rate": 1.5139841725464482e-05, "loss": 2.3554, "step": 399800 }, { "epoch": 0.7, "learning_rate": 1.5138969785537658e-05, "loss": 2.2683, "step": 399810 }, { "epoch": 0.7, "learning_rate": 1.513809784561083e-05, "loss": 2.1912, "step": 399820 }, { "epoch": 0.7, "learning_rate": 1.5137225905684002e-05, "loss": 2.202, "step": 399830 }, { "epoch": 0.7, "learning_rate": 1.5136353965757174e-05, "loss": 2.403, "step": 399840 }, { "epoch": 0.7, "learning_rate": 1.513548202583035e-05, "loss": 2.322, "step": 399850 }, { "epoch": 0.7, "learning_rate": 1.5134610085903522e-05, "loss": 2.3893, "step": 399860 }, { "epoch": 0.7, "learning_rate": 1.5133738145976695e-05, "loss": 2.2471, "step": 399870 }, { "epoch": 0.7, "learning_rate": 1.513286620604987e-05, "loss": 2.2812, "step": 399880 }, { "epoch": 0.7, "learning_rate": 1.5131994266123043e-05, "loss": 2.424, "step": 399890 }, { "epoch": 0.7, "learning_rate": 1.5131122326196215e-05, "loss": 2.4303, "step": 399900 }, { "epoch": 0.7, "learning_rate": 1.5130250386269387e-05, "loss": 2.3253, "step": 399910 }, { "epoch": 0.7, "learning_rate": 1.5129378446342562e-05, "loss": 2.303, "step": 399920 }, { "epoch": 0.7, "learning_rate": 1.5128506506415735e-05, "loss": 2.2859, "step": 399930 }, { "epoch": 0.7, "learning_rate": 1.5127634566488907e-05, "loss": 2.4975, "step": 399940 }, { "epoch": 0.7, "learning_rate": 1.512676262656208e-05, "loss": 2.2584, "step": 399950 }, { "epoch": 0.7, "learning_rate": 1.5125890686635256e-05, "loss": 2.2841, "step": 399960 }, { "epoch": 0.7, "learning_rate": 1.5125018746708428e-05, "loss": 2.4113, "step": 399970 }, { "epoch": 0.7, "learning_rate": 1.51241468067816e-05, "loss": 2.3934, "step": 399980 }, { "epoch": 0.7, "learning_rate": 1.5123274866854775e-05, "loss": 2.3295, "step": 399990 }, { "epoch": 0.7, "learning_rate": 1.5122402926927948e-05, "loss": 2.2265, "step": 400000 }, { "epoch": 0.7, "learning_rate": 1.512153098700112e-05, "loss": 2.2558, "step": 400010 }, { "epoch": 0.7, "learning_rate": 1.5120659047074293e-05, "loss": 2.3104, "step": 400020 }, { "epoch": 0.7, "learning_rate": 1.5119787107147467e-05, "loss": 2.3432, "step": 400030 }, { "epoch": 0.7, "learning_rate": 1.5118915167220641e-05, "loss": 2.2026, "step": 400040 }, { "epoch": 0.7, "learning_rate": 1.5118043227293813e-05, "loss": 2.3438, "step": 400050 }, { "epoch": 0.7, "learning_rate": 1.5117171287366985e-05, "loss": 2.2399, "step": 400060 }, { "epoch": 0.7, "learning_rate": 1.511629934744016e-05, "loss": 2.2797, "step": 400070 }, { "epoch": 0.7, "learning_rate": 1.5115427407513333e-05, "loss": 2.2995, "step": 400080 }, { "epoch": 0.7, "learning_rate": 1.5114555467586505e-05, "loss": 2.4303, "step": 400090 }, { "epoch": 0.7, "learning_rate": 1.5113683527659678e-05, "loss": 2.319, "step": 400100 }, { "epoch": 0.7, "learning_rate": 1.5112811587732852e-05, "loss": 2.3175, "step": 400110 }, { "epoch": 0.7, "learning_rate": 1.5111939647806026e-05, "loss": 2.4791, "step": 400120 }, { "epoch": 0.7, "learning_rate": 1.5111067707879198e-05, "loss": 2.2435, "step": 400130 }, { "epoch": 0.7, "learning_rate": 1.5110195767952374e-05, "loss": 2.3577, "step": 400140 }, { "epoch": 0.7, "learning_rate": 1.5109323828025546e-05, "loss": 2.3702, "step": 400150 }, { "epoch": 0.7, "learning_rate": 1.5108451888098718e-05, "loss": 2.2402, "step": 400160 }, { "epoch": 0.7, "learning_rate": 1.510757994817189e-05, "loss": 2.2862, "step": 400170 }, { "epoch": 0.7, "learning_rate": 1.5106708008245065e-05, "loss": 2.2193, "step": 400180 }, { "epoch": 0.7, "learning_rate": 1.5105836068318239e-05, "loss": 2.1555, "step": 400190 }, { "epoch": 0.7, "learning_rate": 1.5104964128391411e-05, "loss": 2.2112, "step": 400200 }, { "epoch": 0.7, "learning_rate": 1.5104092188464583e-05, "loss": 2.4192, "step": 400210 }, { "epoch": 0.7, "learning_rate": 1.5103220248537759e-05, "loss": 2.3441, "step": 400220 }, { "epoch": 0.7, "learning_rate": 1.510234830861093e-05, "loss": 2.2329, "step": 400230 }, { "epoch": 0.7, "learning_rate": 1.5101476368684103e-05, "loss": 2.4366, "step": 400240 }, { "epoch": 0.7, "learning_rate": 1.5100604428757278e-05, "loss": 2.3247, "step": 400250 }, { "epoch": 0.7, "learning_rate": 1.509973248883045e-05, "loss": 2.2826, "step": 400260 }, { "epoch": 0.7, "learning_rate": 1.5098860548903624e-05, "loss": 2.2887, "step": 400270 }, { "epoch": 0.7, "learning_rate": 1.5097988608976796e-05, "loss": 2.3439, "step": 400280 }, { "epoch": 0.7, "learning_rate": 1.5097116669049972e-05, "loss": 2.3632, "step": 400290 }, { "epoch": 0.7, "learning_rate": 1.5096244729123144e-05, "loss": 2.2308, "step": 400300 }, { "epoch": 0.7, "learning_rate": 1.5095372789196316e-05, "loss": 2.2254, "step": 400310 }, { "epoch": 0.7, "learning_rate": 1.5094500849269488e-05, "loss": 2.3112, "step": 400320 }, { "epoch": 0.7, "learning_rate": 1.5093628909342663e-05, "loss": 2.4018, "step": 400330 }, { "epoch": 0.7, "learning_rate": 1.5092756969415835e-05, "loss": 2.3322, "step": 400340 }, { "epoch": 0.7, "learning_rate": 1.509188502948901e-05, "loss": 2.3031, "step": 400350 }, { "epoch": 0.7, "learning_rate": 1.5091013089562181e-05, "loss": 2.2672, "step": 400360 }, { "epoch": 0.7, "learning_rate": 1.5090141149635357e-05, "loss": 2.252, "step": 400370 }, { "epoch": 0.7, "learning_rate": 1.5089269209708529e-05, "loss": 2.3581, "step": 400380 }, { "epoch": 0.7, "learning_rate": 1.50883972697817e-05, "loss": 2.3934, "step": 400390 }, { "epoch": 0.7, "learning_rate": 1.5087525329854876e-05, "loss": 2.2679, "step": 400400 }, { "epoch": 0.7, "learning_rate": 1.5086653389928048e-05, "loss": 2.3268, "step": 400410 }, { "epoch": 0.7, "learning_rate": 1.508578145000122e-05, "loss": 2.353, "step": 400420 }, { "epoch": 0.7, "learning_rate": 1.5084909510074394e-05, "loss": 2.2451, "step": 400430 }, { "epoch": 0.7, "learning_rate": 1.508403757014757e-05, "loss": 2.2552, "step": 400440 }, { "epoch": 0.7, "learning_rate": 1.5083165630220742e-05, "loss": 2.2241, "step": 400450 }, { "epoch": 0.7, "learning_rate": 1.5082293690293914e-05, "loss": 2.3158, "step": 400460 }, { "epoch": 0.7, "learning_rate": 1.5081421750367086e-05, "loss": 2.3128, "step": 400470 }, { "epoch": 0.7, "learning_rate": 1.5080549810440261e-05, "loss": 2.3517, "step": 400480 }, { "epoch": 0.7, "learning_rate": 1.5079677870513433e-05, "loss": 2.2926, "step": 400490 }, { "epoch": 0.7, "learning_rate": 1.5078805930586607e-05, "loss": 2.3091, "step": 400500 }, { "epoch": 0.7, "learning_rate": 1.507793399065978e-05, "loss": 2.1556, "step": 400510 }, { "epoch": 0.7, "learning_rate": 1.5077062050732955e-05, "loss": 2.3562, "step": 400520 }, { "epoch": 0.7, "learning_rate": 1.5076190110806127e-05, "loss": 2.3799, "step": 400530 }, { "epoch": 0.7, "learning_rate": 1.5075318170879299e-05, "loss": 2.4081, "step": 400540 }, { "epoch": 0.7, "learning_rate": 1.5074446230952474e-05, "loss": 2.2503, "step": 400550 }, { "epoch": 0.7, "learning_rate": 1.5073574291025646e-05, "loss": 2.2873, "step": 400560 }, { "epoch": 0.7, "learning_rate": 1.5072702351098819e-05, "loss": 2.3453, "step": 400570 }, { "epoch": 0.7, "learning_rate": 1.5071830411171992e-05, "loss": 2.2834, "step": 400580 }, { "epoch": 0.7, "learning_rate": 1.5070958471245166e-05, "loss": 2.2758, "step": 400590 }, { "epoch": 0.7, "learning_rate": 1.507008653131834e-05, "loss": 2.1469, "step": 400600 }, { "epoch": 0.7, "learning_rate": 1.5069214591391512e-05, "loss": 2.2566, "step": 400610 }, { "epoch": 0.7, "learning_rate": 1.5068342651464684e-05, "loss": 2.1736, "step": 400620 }, { "epoch": 0.7, "learning_rate": 1.506747071153786e-05, "loss": 2.336, "step": 400630 }, { "epoch": 0.7, "learning_rate": 1.5066598771611032e-05, "loss": 2.181, "step": 400640 }, { "epoch": 0.7, "learning_rate": 1.5065726831684204e-05, "loss": 2.234, "step": 400650 }, { "epoch": 0.7, "learning_rate": 1.5064854891757379e-05, "loss": 2.2929, "step": 400660 }, { "epoch": 0.7, "learning_rate": 1.5063982951830551e-05, "loss": 2.2963, "step": 400670 }, { "epoch": 0.7, "learning_rate": 1.5063111011903725e-05, "loss": 2.3096, "step": 400680 }, { "epoch": 0.7, "learning_rate": 1.5062239071976897e-05, "loss": 2.3106, "step": 400690 }, { "epoch": 0.7, "learning_rate": 1.5061367132050072e-05, "loss": 2.2022, "step": 400700 }, { "epoch": 0.7, "learning_rate": 1.5060495192123245e-05, "loss": 2.3847, "step": 400710 }, { "epoch": 0.7, "learning_rate": 1.5059623252196417e-05, "loss": 2.2776, "step": 400720 }, { "epoch": 0.7, "learning_rate": 1.5058751312269589e-05, "loss": 2.2245, "step": 400730 }, { "epoch": 0.7, "learning_rate": 1.5057879372342764e-05, "loss": 2.4228, "step": 400740 }, { "epoch": 0.7, "learning_rate": 1.5057007432415938e-05, "loss": 2.3049, "step": 400750 }, { "epoch": 0.7, "learning_rate": 1.505613549248911e-05, "loss": 2.2536, "step": 400760 }, { "epoch": 0.7, "learning_rate": 1.5055263552562282e-05, "loss": 2.2973, "step": 400770 }, { "epoch": 0.7, "learning_rate": 1.5054391612635458e-05, "loss": 2.3622, "step": 400780 }, { "epoch": 0.7, "learning_rate": 1.505351967270863e-05, "loss": 2.3559, "step": 400790 }, { "epoch": 0.7, "learning_rate": 1.5052647732781802e-05, "loss": 2.3914, "step": 400800 }, { "epoch": 0.7, "learning_rate": 1.5051775792854977e-05, "loss": 2.2839, "step": 400810 }, { "epoch": 0.7, "learning_rate": 1.505090385292815e-05, "loss": 2.2659, "step": 400820 }, { "epoch": 0.7, "learning_rate": 1.5050031913001323e-05, "loss": 2.3192, "step": 400830 }, { "epoch": 0.7, "learning_rate": 1.5049159973074495e-05, "loss": 2.4039, "step": 400840 }, { "epoch": 0.7, "learning_rate": 1.504828803314767e-05, "loss": 2.2961, "step": 400850 }, { "epoch": 0.7, "learning_rate": 1.5047416093220843e-05, "loss": 2.2537, "step": 400860 }, { "epoch": 0.7, "learning_rate": 1.5046544153294015e-05, "loss": 2.2784, "step": 400870 }, { "epoch": 0.7, "learning_rate": 1.5045672213367187e-05, "loss": 2.2748, "step": 400880 }, { "epoch": 0.7, "learning_rate": 1.5044800273440362e-05, "loss": 2.3528, "step": 400890 }, { "epoch": 0.7, "learning_rate": 1.5043928333513534e-05, "loss": 2.2669, "step": 400900 }, { "epoch": 0.7, "learning_rate": 1.5043056393586708e-05, "loss": 2.219, "step": 400910 }, { "epoch": 0.7, "learning_rate": 1.5042184453659884e-05, "loss": 2.3566, "step": 400920 }, { "epoch": 0.7, "learning_rate": 1.5041312513733056e-05, "loss": 2.3912, "step": 400930 }, { "epoch": 0.7, "learning_rate": 1.5040440573806228e-05, "loss": 2.3176, "step": 400940 }, { "epoch": 0.7, "learning_rate": 1.50395686338794e-05, "loss": 2.2482, "step": 400950 }, { "epoch": 0.7, "learning_rate": 1.5038696693952575e-05, "loss": 2.3404, "step": 400960 }, { "epoch": 0.7, "learning_rate": 1.5037824754025747e-05, "loss": 2.3542, "step": 400970 }, { "epoch": 0.7, "learning_rate": 1.503695281409892e-05, "loss": 2.3866, "step": 400980 }, { "epoch": 0.7, "learning_rate": 1.5036080874172093e-05, "loss": 2.2588, "step": 400990 }, { "epoch": 0.7, "learning_rate": 1.5035208934245269e-05, "loss": 2.4393, "step": 401000 }, { "epoch": 0.7, "learning_rate": 1.503433699431844e-05, "loss": 2.3049, "step": 401010 }, { "epoch": 0.7, "learning_rate": 1.5033465054391613e-05, "loss": 2.2878, "step": 401020 }, { "epoch": 0.7, "learning_rate": 1.5032593114464785e-05, "loss": 2.3208, "step": 401030 }, { "epoch": 0.7, "learning_rate": 1.503172117453796e-05, "loss": 2.2407, "step": 401040 }, { "epoch": 0.7, "learning_rate": 1.5030849234611132e-05, "loss": 2.4005, "step": 401050 }, { "epoch": 0.7, "learning_rate": 1.5029977294684306e-05, "loss": 2.4162, "step": 401060 }, { "epoch": 0.7, "learning_rate": 1.502910535475748e-05, "loss": 2.2772, "step": 401070 }, { "epoch": 0.7, "learning_rate": 1.5028233414830654e-05, "loss": 2.2609, "step": 401080 }, { "epoch": 0.7, "learning_rate": 1.5027361474903826e-05, "loss": 2.2989, "step": 401090 }, { "epoch": 0.7, "learning_rate": 1.5026489534976998e-05, "loss": 2.3655, "step": 401100 }, { "epoch": 0.7, "learning_rate": 1.5025617595050173e-05, "loss": 2.3431, "step": 401110 }, { "epoch": 0.7, "learning_rate": 1.5024745655123345e-05, "loss": 2.3721, "step": 401120 }, { "epoch": 0.7, "learning_rate": 1.5023873715196517e-05, "loss": 2.3714, "step": 401130 }, { "epoch": 0.7, "learning_rate": 1.5023001775269691e-05, "loss": 2.2265, "step": 401140 }, { "epoch": 0.7, "learning_rate": 1.5022129835342865e-05, "loss": 2.2432, "step": 401150 }, { "epoch": 0.7, "learning_rate": 1.5021257895416039e-05, "loss": 2.2426, "step": 401160 }, { "epoch": 0.7, "learning_rate": 1.5020385955489211e-05, "loss": 2.3351, "step": 401170 }, { "epoch": 0.7, "learning_rate": 1.5019514015562386e-05, "loss": 2.294, "step": 401180 }, { "epoch": 0.7, "learning_rate": 1.5018642075635558e-05, "loss": 2.3279, "step": 401190 }, { "epoch": 0.7, "learning_rate": 1.501777013570873e-05, "loss": 2.3737, "step": 401200 }, { "epoch": 0.7, "learning_rate": 1.5016898195781903e-05, "loss": 2.3627, "step": 401210 }, { "epoch": 0.7, "learning_rate": 1.5016026255855078e-05, "loss": 2.1763, "step": 401220 }, { "epoch": 0.7, "learning_rate": 1.5015154315928252e-05, "loss": 2.3371, "step": 401230 }, { "epoch": 0.7, "learning_rate": 1.5014282376001424e-05, "loss": 2.2448, "step": 401240 }, { "epoch": 0.7, "learning_rate": 1.5013410436074596e-05, "loss": 2.4475, "step": 401250 }, { "epoch": 0.7, "learning_rate": 1.5012538496147771e-05, "loss": 2.3353, "step": 401260 }, { "epoch": 0.7, "learning_rate": 1.5011666556220943e-05, "loss": 2.2933, "step": 401270 }, { "epoch": 0.7, "learning_rate": 1.5010794616294116e-05, "loss": 2.3298, "step": 401280 }, { "epoch": 0.7, "learning_rate": 1.5009922676367288e-05, "loss": 2.2345, "step": 401290 }, { "epoch": 0.7, "learning_rate": 1.5009050736440463e-05, "loss": 2.2295, "step": 401300 }, { "epoch": 0.7, "learning_rate": 1.5008178796513637e-05, "loss": 2.2706, "step": 401310 }, { "epoch": 0.7, "learning_rate": 1.5007306856586809e-05, "loss": 2.2174, "step": 401320 }, { "epoch": 0.7, "learning_rate": 1.5006434916659984e-05, "loss": 2.32, "step": 401330 }, { "epoch": 0.7, "learning_rate": 1.5005562976733156e-05, "loss": 2.2256, "step": 401340 }, { "epoch": 0.7, "learning_rate": 1.5004691036806329e-05, "loss": 2.1894, "step": 401350 }, { "epoch": 0.7, "learning_rate": 1.50038190968795e-05, "loss": 2.2735, "step": 401360 }, { "epoch": 0.7, "learning_rate": 1.5002947156952676e-05, "loss": 2.3745, "step": 401370 }, { "epoch": 0.7, "learning_rate": 1.5002075217025848e-05, "loss": 2.2702, "step": 401380 }, { "epoch": 0.7, "learning_rate": 1.5001203277099022e-05, "loss": 2.2919, "step": 401390 }, { "epoch": 0.7, "learning_rate": 1.5000331337172194e-05, "loss": 2.3258, "step": 401400 }, { "epoch": 0.7, "learning_rate": 1.499945939724537e-05, "loss": 2.3299, "step": 401410 }, { "epoch": 0.7, "learning_rate": 1.4998587457318542e-05, "loss": 2.2997, "step": 401420 }, { "epoch": 0.7, "learning_rate": 1.4997715517391714e-05, "loss": 2.2505, "step": 401430 }, { "epoch": 0.7, "learning_rate": 1.4996843577464886e-05, "loss": 2.4142, "step": 401440 }, { "epoch": 0.7, "learning_rate": 1.4995971637538061e-05, "loss": 2.3535, "step": 401450 }, { "epoch": 0.7, "learning_rate": 1.4995099697611233e-05, "loss": 2.3525, "step": 401460 }, { "epoch": 0.7, "learning_rate": 1.4994227757684407e-05, "loss": 2.248, "step": 401470 }, { "epoch": 0.7, "learning_rate": 1.4993355817757582e-05, "loss": 2.35, "step": 401480 }, { "epoch": 0.7, "learning_rate": 1.4992483877830755e-05, "loss": 2.3696, "step": 401490 }, { "epoch": 0.7, "learning_rate": 1.4991611937903927e-05, "loss": 2.2609, "step": 401500 }, { "epoch": 0.7, "learning_rate": 1.4990739997977099e-05, "loss": 2.3561, "step": 401510 }, { "epoch": 0.7, "learning_rate": 1.4989868058050274e-05, "loss": 2.2433, "step": 401520 }, { "epoch": 0.7, "learning_rate": 1.4988996118123446e-05, "loss": 2.3131, "step": 401530 }, { "epoch": 0.7, "learning_rate": 1.498812417819662e-05, "loss": 2.2956, "step": 401540 }, { "epoch": 0.7, "learning_rate": 1.4987252238269792e-05, "loss": 2.3202, "step": 401550 }, { "epoch": 0.7, "learning_rate": 1.4986380298342968e-05, "loss": 2.3046, "step": 401560 }, { "epoch": 0.7, "learning_rate": 1.498550835841614e-05, "loss": 2.2931, "step": 401570 }, { "epoch": 0.7, "learning_rate": 1.4984636418489312e-05, "loss": 2.4354, "step": 401580 }, { "epoch": 0.7, "learning_rate": 1.4983764478562487e-05, "loss": 2.229, "step": 401590 }, { "epoch": 0.7, "learning_rate": 1.498289253863566e-05, "loss": 2.3572, "step": 401600 }, { "epoch": 0.7, "learning_rate": 1.4982020598708831e-05, "loss": 2.2381, "step": 401610 }, { "epoch": 0.7, "learning_rate": 1.4981148658782005e-05, "loss": 2.4016, "step": 401620 }, { "epoch": 0.7, "learning_rate": 1.4980276718855179e-05, "loss": 2.4185, "step": 401630 }, { "epoch": 0.7, "learning_rate": 1.4979404778928353e-05, "loss": 2.2682, "step": 401640 }, { "epoch": 0.7, "learning_rate": 1.4978532839001525e-05, "loss": 2.2275, "step": 401650 }, { "epoch": 0.7, "learning_rate": 1.4977660899074697e-05, "loss": 2.4249, "step": 401660 }, { "epoch": 0.7, "learning_rate": 1.4976788959147872e-05, "loss": 2.3111, "step": 401670 }, { "epoch": 0.7, "learning_rate": 1.4975917019221044e-05, "loss": 2.374, "step": 401680 }, { "epoch": 0.7, "learning_rate": 1.4975045079294216e-05, "loss": 2.493, "step": 401690 }, { "epoch": 0.7, "learning_rate": 1.497417313936739e-05, "loss": 2.3374, "step": 401700 }, { "epoch": 0.7, "learning_rate": 1.4973301199440564e-05, "loss": 2.3457, "step": 401710 }, { "epoch": 0.7, "learning_rate": 1.4972429259513738e-05, "loss": 2.4315, "step": 401720 }, { "epoch": 0.7, "learning_rate": 1.497155731958691e-05, "loss": 2.3647, "step": 401730 }, { "epoch": 0.7, "learning_rate": 1.4970685379660085e-05, "loss": 2.3469, "step": 401740 }, { "epoch": 0.7, "learning_rate": 1.4969813439733257e-05, "loss": 2.3887, "step": 401750 }, { "epoch": 0.7, "learning_rate": 1.496894149980643e-05, "loss": 2.3686, "step": 401760 }, { "epoch": 0.7, "learning_rate": 1.4968069559879601e-05, "loss": 2.303, "step": 401770 }, { "epoch": 0.7, "learning_rate": 1.4967197619952777e-05, "loss": 2.3221, "step": 401780 }, { "epoch": 0.7, "learning_rate": 1.496632568002595e-05, "loss": 2.1624, "step": 401790 }, { "epoch": 0.7, "learning_rate": 1.4965453740099123e-05, "loss": 2.2366, "step": 401800 }, { "epoch": 0.7, "learning_rate": 1.4964581800172295e-05, "loss": 2.299, "step": 401810 }, { "epoch": 0.7, "learning_rate": 1.496370986024547e-05, "loss": 2.3569, "step": 401820 }, { "epoch": 0.7, "learning_rate": 1.4962837920318642e-05, "loss": 2.2562, "step": 401830 }, { "epoch": 0.7, "learning_rate": 1.4961965980391814e-05, "loss": 2.2854, "step": 401840 }, { "epoch": 0.7, "learning_rate": 1.496109404046499e-05, "loss": 2.295, "step": 401850 }, { "epoch": 0.7, "learning_rate": 1.4960222100538162e-05, "loss": 2.2469, "step": 401860 }, { "epoch": 0.7, "learning_rate": 1.4959350160611336e-05, "loss": 2.245, "step": 401870 }, { "epoch": 0.7, "learning_rate": 1.4958478220684508e-05, "loss": 2.1099, "step": 401880 }, { "epoch": 0.7, "learning_rate": 1.4957606280757683e-05, "loss": 2.2834, "step": 401890 }, { "epoch": 0.7, "learning_rate": 1.4956734340830855e-05, "loss": 2.2836, "step": 401900 }, { "epoch": 0.7, "learning_rate": 1.4955862400904027e-05, "loss": 2.2892, "step": 401910 }, { "epoch": 0.7, "learning_rate": 1.49549904609772e-05, "loss": 2.3819, "step": 401920 }, { "epoch": 0.7, "learning_rate": 1.4954118521050375e-05, "loss": 2.3125, "step": 401930 }, { "epoch": 0.7, "learning_rate": 1.4953246581123547e-05, "loss": 2.3021, "step": 401940 }, { "epoch": 0.7, "learning_rate": 1.4952374641196721e-05, "loss": 2.2966, "step": 401950 }, { "epoch": 0.7, "learning_rate": 1.4951502701269893e-05, "loss": 2.3441, "step": 401960 }, { "epoch": 0.7, "learning_rate": 1.4950630761343068e-05, "loss": 2.1984, "step": 401970 }, { "epoch": 0.7, "learning_rate": 1.494975882141624e-05, "loss": 2.269, "step": 401980 }, { "epoch": 0.7, "learning_rate": 1.4948886881489413e-05, "loss": 2.3389, "step": 401990 }, { "epoch": 0.7, "learning_rate": 1.4948014941562588e-05, "loss": 2.3479, "step": 402000 }, { "epoch": 0.7, "learning_rate": 1.494714300163576e-05, "loss": 2.2671, "step": 402010 }, { "epoch": 0.7, "learning_rate": 1.4946271061708932e-05, "loss": 2.3166, "step": 402020 }, { "epoch": 0.7, "learning_rate": 1.4945399121782106e-05, "loss": 2.4144, "step": 402030 }, { "epoch": 0.7, "learning_rate": 1.4944527181855281e-05, "loss": 2.1952, "step": 402040 }, { "epoch": 0.7, "learning_rate": 1.4943655241928453e-05, "loss": 2.2193, "step": 402050 }, { "epoch": 0.7, "learning_rate": 1.4942783302001626e-05, "loss": 2.3611, "step": 402060 }, { "epoch": 0.7, "learning_rate": 1.4941911362074798e-05, "loss": 2.3603, "step": 402070 }, { "epoch": 0.7, "learning_rate": 1.4941039422147973e-05, "loss": 2.3544, "step": 402080 }, { "epoch": 0.7, "learning_rate": 1.4940167482221145e-05, "loss": 2.2841, "step": 402090 }, { "epoch": 0.7, "learning_rate": 1.4939295542294319e-05, "loss": 2.2035, "step": 402100 }, { "epoch": 0.7, "learning_rate": 1.4938423602367493e-05, "loss": 2.3199, "step": 402110 }, { "epoch": 0.7, "learning_rate": 1.4937551662440666e-05, "loss": 2.3762, "step": 402120 }, { "epoch": 0.7, "learning_rate": 1.4936679722513839e-05, "loss": 2.301, "step": 402130 }, { "epoch": 0.7, "learning_rate": 1.493580778258701e-05, "loss": 2.4507, "step": 402140 }, { "epoch": 0.7, "learning_rate": 1.4934935842660186e-05, "loss": 2.3771, "step": 402150 }, { "epoch": 0.7, "learning_rate": 1.4934063902733358e-05, "loss": 2.2751, "step": 402160 }, { "epoch": 0.7, "learning_rate": 1.493319196280653e-05, "loss": 2.2724, "step": 402170 }, { "epoch": 0.7, "learning_rate": 1.4932320022879704e-05, "loss": 2.4229, "step": 402180 }, { "epoch": 0.7, "learning_rate": 1.4931448082952878e-05, "loss": 2.3139, "step": 402190 }, { "epoch": 0.7, "learning_rate": 1.4930576143026052e-05, "loss": 2.3176, "step": 402200 }, { "epoch": 0.7, "learning_rate": 1.4929704203099224e-05, "loss": 2.3241, "step": 402210 }, { "epoch": 0.7, "learning_rate": 1.4928832263172396e-05, "loss": 2.4747, "step": 402220 }, { "epoch": 0.7, "learning_rate": 1.4927960323245571e-05, "loss": 2.2529, "step": 402230 }, { "epoch": 0.7, "learning_rate": 1.4927088383318743e-05, "loss": 2.2225, "step": 402240 }, { "epoch": 0.7, "learning_rate": 1.4926216443391915e-05, "loss": 2.2393, "step": 402250 }, { "epoch": 0.7, "learning_rate": 1.492534450346509e-05, "loss": 2.3659, "step": 402260 }, { "epoch": 0.7, "learning_rate": 1.4924472563538265e-05, "loss": 2.2129, "step": 402270 }, { "epoch": 0.7, "learning_rate": 1.4923600623611437e-05, "loss": 2.3242, "step": 402280 }, { "epoch": 0.7, "learning_rate": 1.4922728683684609e-05, "loss": 2.3423, "step": 402290 }, { "epoch": 0.7, "learning_rate": 1.4921856743757784e-05, "loss": 2.4096, "step": 402300 }, { "epoch": 0.7, "learning_rate": 1.4920984803830956e-05, "loss": 2.3049, "step": 402310 }, { "epoch": 0.7, "learning_rate": 1.4920112863904128e-05, "loss": 2.2676, "step": 402320 }, { "epoch": 0.7, "learning_rate": 1.49192409239773e-05, "loss": 2.2346, "step": 402330 }, { "epoch": 0.7, "learning_rate": 1.4918368984050476e-05, "loss": 2.2865, "step": 402340 }, { "epoch": 0.7, "learning_rate": 1.491749704412365e-05, "loss": 2.3214, "step": 402350 }, { "epoch": 0.7, "learning_rate": 1.4916625104196822e-05, "loss": 2.3431, "step": 402360 }, { "epoch": 0.7, "learning_rate": 1.4915753164269994e-05, "loss": 2.3429, "step": 402370 }, { "epoch": 0.7, "learning_rate": 1.491488122434317e-05, "loss": 2.3089, "step": 402380 }, { "epoch": 0.7, "learning_rate": 1.4914009284416341e-05, "loss": 2.2511, "step": 402390 }, { "epoch": 0.7, "learning_rate": 1.4913137344489513e-05, "loss": 2.105, "step": 402400 }, { "epoch": 0.7, "learning_rate": 1.4912265404562689e-05, "loss": 2.2628, "step": 402410 }, { "epoch": 0.7, "learning_rate": 1.4911393464635861e-05, "loss": 2.2927, "step": 402420 }, { "epoch": 0.7, "learning_rate": 1.4910521524709035e-05, "loss": 2.3772, "step": 402430 }, { "epoch": 0.7, "learning_rate": 1.4909649584782207e-05, "loss": 2.2567, "step": 402440 }, { "epoch": 0.7, "learning_rate": 1.4908777644855382e-05, "loss": 2.3654, "step": 402450 }, { "epoch": 0.7, "learning_rate": 1.4907905704928554e-05, "loss": 2.3402, "step": 402460 }, { "epoch": 0.7, "learning_rate": 1.4907033765001726e-05, "loss": 2.2457, "step": 402470 }, { "epoch": 0.7, "learning_rate": 1.4906161825074898e-05, "loss": 2.4582, "step": 402480 }, { "epoch": 0.7, "learning_rate": 1.4905289885148074e-05, "loss": 2.1535, "step": 402490 }, { "epoch": 0.7, "learning_rate": 1.4904417945221246e-05, "loss": 2.3923, "step": 402500 }, { "epoch": 0.7, "learning_rate": 1.490354600529442e-05, "loss": 2.3615, "step": 402510 }, { "epoch": 0.7, "learning_rate": 1.4902674065367595e-05, "loss": 2.3886, "step": 402520 }, { "epoch": 0.7, "learning_rate": 1.4901802125440767e-05, "loss": 2.2895, "step": 402530 }, { "epoch": 0.7, "learning_rate": 1.490093018551394e-05, "loss": 2.3563, "step": 402540 }, { "epoch": 0.7, "learning_rate": 1.4900058245587111e-05, "loss": 2.2678, "step": 402550 }, { "epoch": 0.7, "learning_rate": 1.4899186305660287e-05, "loss": 2.2645, "step": 402560 }, { "epoch": 0.7, "learning_rate": 1.4898314365733459e-05, "loss": 2.2359, "step": 402570 }, { "epoch": 0.7, "learning_rate": 1.4897442425806633e-05, "loss": 2.2964, "step": 402580 }, { "epoch": 0.7, "learning_rate": 1.4896570485879805e-05, "loss": 2.308, "step": 402590 }, { "epoch": 0.7, "learning_rate": 1.489569854595298e-05, "loss": 2.4024, "step": 402600 }, { "epoch": 0.7, "learning_rate": 1.4894826606026152e-05, "loss": 2.2477, "step": 402610 }, { "epoch": 0.7, "learning_rate": 1.4893954666099324e-05, "loss": 2.3617, "step": 402620 }, { "epoch": 0.7, "learning_rate": 1.4893082726172497e-05, "loss": 2.2477, "step": 402630 }, { "epoch": 0.7, "learning_rate": 1.4892210786245672e-05, "loss": 2.2847, "step": 402640 }, { "epoch": 0.7, "learning_rate": 1.4891338846318844e-05, "loss": 2.21, "step": 402650 }, { "epoch": 0.7, "learning_rate": 1.4890466906392018e-05, "loss": 2.3918, "step": 402660 }, { "epoch": 0.7, "learning_rate": 1.4889594966465192e-05, "loss": 2.3722, "step": 402670 }, { "epoch": 0.7, "learning_rate": 1.4888723026538365e-05, "loss": 2.2617, "step": 402680 }, { "epoch": 0.7, "learning_rate": 1.4887851086611537e-05, "loss": 2.3492, "step": 402690 }, { "epoch": 0.7, "learning_rate": 1.488697914668471e-05, "loss": 2.3192, "step": 402700 }, { "epoch": 0.7, "learning_rate": 1.4886107206757885e-05, "loss": 2.2869, "step": 402710 }, { "epoch": 0.7, "learning_rate": 1.4885235266831057e-05, "loss": 2.2716, "step": 402720 }, { "epoch": 0.7, "learning_rate": 1.488436332690423e-05, "loss": 2.1945, "step": 402730 }, { "epoch": 0.7, "learning_rate": 1.4883491386977403e-05, "loss": 2.3466, "step": 402740 }, { "epoch": 0.7, "learning_rate": 1.4882619447050577e-05, "loss": 2.3043, "step": 402750 }, { "epoch": 0.7, "learning_rate": 1.488174750712375e-05, "loss": 2.391, "step": 402760 }, { "epoch": 0.7, "learning_rate": 1.4880875567196923e-05, "loss": 2.2504, "step": 402770 }, { "epoch": 0.7, "learning_rate": 1.4880003627270098e-05, "loss": 2.2986, "step": 402780 }, { "epoch": 0.7, "learning_rate": 1.487913168734327e-05, "loss": 2.2819, "step": 402790 }, { "epoch": 0.7, "learning_rate": 1.4878259747416442e-05, "loss": 2.2186, "step": 402800 }, { "epoch": 0.7, "learning_rate": 1.4877387807489614e-05, "loss": 2.211, "step": 402810 }, { "epoch": 0.7, "learning_rate": 1.487651586756279e-05, "loss": 2.2764, "step": 402820 }, { "epoch": 0.7, "learning_rate": 1.4875643927635963e-05, "loss": 2.2068, "step": 402830 }, { "epoch": 0.7, "learning_rate": 1.4874771987709136e-05, "loss": 2.3025, "step": 402840 }, { "epoch": 0.7, "learning_rate": 1.4873900047782308e-05, "loss": 2.3346, "step": 402850 }, { "epoch": 0.7, "learning_rate": 1.4873028107855483e-05, "loss": 2.2278, "step": 402860 }, { "epoch": 0.7, "learning_rate": 1.4872156167928655e-05, "loss": 2.3399, "step": 402870 }, { "epoch": 0.7, "learning_rate": 1.4871284228001827e-05, "loss": 2.2974, "step": 402880 }, { "epoch": 0.7, "learning_rate": 1.4870412288075001e-05, "loss": 2.2443, "step": 402890 }, { "epoch": 0.7, "learning_rate": 1.4869540348148175e-05, "loss": 2.369, "step": 402900 }, { "epoch": 0.7, "learning_rate": 1.4868668408221349e-05, "loss": 2.2771, "step": 402910 }, { "epoch": 0.7, "learning_rate": 1.486779646829452e-05, "loss": 2.3354, "step": 402920 }, { "epoch": 0.7, "learning_rate": 1.4866924528367696e-05, "loss": 2.3038, "step": 402930 }, { "epoch": 0.7, "learning_rate": 1.4866052588440868e-05, "loss": 2.3768, "step": 402940 }, { "epoch": 0.7, "learning_rate": 1.486518064851404e-05, "loss": 2.2394, "step": 402950 }, { "epoch": 0.7, "learning_rate": 1.4864308708587212e-05, "loss": 2.3156, "step": 402960 }, { "epoch": 0.7, "learning_rate": 1.4863436768660388e-05, "loss": 2.3541, "step": 402970 }, { "epoch": 0.7, "learning_rate": 1.486256482873356e-05, "loss": 2.3227, "step": 402980 }, { "epoch": 0.7, "learning_rate": 1.4861692888806734e-05, "loss": 2.3144, "step": 402990 }, { "epoch": 0.7, "learning_rate": 1.4860820948879906e-05, "loss": 2.1914, "step": 403000 }, { "epoch": 0.7, "learning_rate": 1.4859949008953081e-05, "loss": 2.2744, "step": 403010 }, { "epoch": 0.7, "learning_rate": 1.4859077069026253e-05, "loss": 2.2181, "step": 403020 }, { "epoch": 0.7, "learning_rate": 1.4858205129099425e-05, "loss": 2.305, "step": 403030 }, { "epoch": 0.7, "learning_rate": 1.48573331891726e-05, "loss": 2.3908, "step": 403040 }, { "epoch": 0.7, "learning_rate": 1.4856461249245773e-05, "loss": 2.289, "step": 403050 }, { "epoch": 0.7, "learning_rate": 1.4855589309318945e-05, "loss": 2.2859, "step": 403060 }, { "epoch": 0.7, "learning_rate": 1.4854717369392119e-05, "loss": 2.2698, "step": 403070 }, { "epoch": 0.7, "learning_rate": 1.4853845429465294e-05, "loss": 2.2977, "step": 403080 }, { "epoch": 0.7, "learning_rate": 1.4852973489538466e-05, "loss": 2.2656, "step": 403090 }, { "epoch": 0.7, "learning_rate": 1.4852101549611638e-05, "loss": 2.3393, "step": 403100 }, { "epoch": 0.7, "learning_rate": 1.485122960968481e-05, "loss": 2.2813, "step": 403110 }, { "epoch": 0.7, "learning_rate": 1.4850357669757986e-05, "loss": 2.1651, "step": 403120 }, { "epoch": 0.7, "learning_rate": 1.4849485729831158e-05, "loss": 2.3131, "step": 403130 }, { "epoch": 0.7, "learning_rate": 1.4848613789904332e-05, "loss": 2.3648, "step": 403140 }, { "epoch": 0.7, "learning_rate": 1.4847741849977504e-05, "loss": 2.4047, "step": 403150 }, { "epoch": 0.7, "learning_rate": 1.484686991005068e-05, "loss": 2.147, "step": 403160 }, { "epoch": 0.7, "learning_rate": 1.4845997970123851e-05, "loss": 2.3275, "step": 403170 }, { "epoch": 0.7, "learning_rate": 1.4845126030197023e-05, "loss": 2.3493, "step": 403180 }, { "epoch": 0.7, "learning_rate": 1.4844254090270199e-05, "loss": 2.3929, "step": 403190 }, { "epoch": 0.7, "learning_rate": 1.4843382150343371e-05, "loss": 2.405, "step": 403200 }, { "epoch": 0.7, "learning_rate": 1.4842510210416543e-05, "loss": 2.2641, "step": 403210 }, { "epoch": 0.7, "learning_rate": 1.4841638270489717e-05, "loss": 2.3638, "step": 403220 }, { "epoch": 0.7, "learning_rate": 1.484076633056289e-05, "loss": 2.2606, "step": 403230 }, { "epoch": 0.7, "learning_rate": 1.4839894390636064e-05, "loss": 2.2041, "step": 403240 }, { "epoch": 0.7, "learning_rate": 1.4839022450709236e-05, "loss": 2.3283, "step": 403250 }, { "epoch": 0.7, "learning_rate": 1.4838150510782408e-05, "loss": 2.3704, "step": 403260 }, { "epoch": 0.7, "learning_rate": 1.4837278570855584e-05, "loss": 2.3204, "step": 403270 }, { "epoch": 0.7, "learning_rate": 1.4836406630928756e-05, "loss": 2.4268, "step": 403280 }, { "epoch": 0.7, "learning_rate": 1.4835534691001928e-05, "loss": 2.247, "step": 403290 }, { "epoch": 0.7, "learning_rate": 1.4834662751075102e-05, "loss": 2.3306, "step": 403300 }, { "epoch": 0.7, "learning_rate": 1.4833790811148277e-05, "loss": 2.3726, "step": 403310 }, { "epoch": 0.7, "learning_rate": 1.483291887122145e-05, "loss": 2.2505, "step": 403320 }, { "epoch": 0.7, "learning_rate": 1.4832046931294621e-05, "loss": 2.2739, "step": 403330 }, { "epoch": 0.7, "learning_rate": 1.4831174991367797e-05, "loss": 2.3703, "step": 403340 }, { "epoch": 0.7, "learning_rate": 1.4830303051440969e-05, "loss": 2.1819, "step": 403350 }, { "epoch": 0.7, "learning_rate": 1.4829431111514141e-05, "loss": 2.2324, "step": 403360 }, { "epoch": 0.7, "learning_rate": 1.4828559171587313e-05, "loss": 2.3182, "step": 403370 }, { "epoch": 0.7, "learning_rate": 1.4827687231660489e-05, "loss": 2.3734, "step": 403380 }, { "epoch": 0.7, "learning_rate": 1.4826815291733662e-05, "loss": 2.2756, "step": 403390 }, { "epoch": 0.7, "learning_rate": 1.4825943351806834e-05, "loss": 2.3313, "step": 403400 }, { "epoch": 0.7, "learning_rate": 1.4825071411880007e-05, "loss": 2.3865, "step": 403410 }, { "epoch": 0.7, "learning_rate": 1.4824199471953182e-05, "loss": 2.3286, "step": 403420 }, { "epoch": 0.7, "learning_rate": 1.4823327532026354e-05, "loss": 2.3766, "step": 403430 }, { "epoch": 0.7, "learning_rate": 1.4822455592099526e-05, "loss": 2.2864, "step": 403440 }, { "epoch": 0.7, "learning_rate": 1.4821583652172702e-05, "loss": 2.3434, "step": 403450 }, { "epoch": 0.7, "learning_rate": 1.4820711712245874e-05, "loss": 2.308, "step": 403460 }, { "epoch": 0.7, "learning_rate": 1.4819839772319047e-05, "loss": 2.3884, "step": 403470 }, { "epoch": 0.7, "learning_rate": 1.481896783239222e-05, "loss": 2.2191, "step": 403480 }, { "epoch": 0.7, "learning_rate": 1.4818095892465395e-05, "loss": 2.3903, "step": 403490 }, { "epoch": 0.7, "learning_rate": 1.4817223952538567e-05, "loss": 2.3731, "step": 403500 }, { "epoch": 0.7, "learning_rate": 1.481635201261174e-05, "loss": 2.3489, "step": 403510 }, { "epoch": 0.7, "learning_rate": 1.4815480072684911e-05, "loss": 2.277, "step": 403520 }, { "epoch": 0.7, "learning_rate": 1.4814608132758087e-05, "loss": 2.2992, "step": 403530 }, { "epoch": 0.7, "learning_rate": 1.4813736192831259e-05, "loss": 2.294, "step": 403540 }, { "epoch": 0.7, "learning_rate": 1.4812864252904433e-05, "loss": 2.3183, "step": 403550 }, { "epoch": 0.7, "learning_rate": 1.4811992312977605e-05, "loss": 2.3045, "step": 403560 }, { "epoch": 0.7, "learning_rate": 1.481112037305078e-05, "loss": 2.2758, "step": 403570 }, { "epoch": 0.7, "learning_rate": 1.4810248433123952e-05, "loss": 2.3286, "step": 403580 }, { "epoch": 0.7, "learning_rate": 1.4809376493197124e-05, "loss": 2.2508, "step": 403590 }, { "epoch": 0.7, "learning_rate": 1.48085045532703e-05, "loss": 2.3015, "step": 403600 }, { "epoch": 0.7, "learning_rate": 1.4807632613343472e-05, "loss": 2.3567, "step": 403610 }, { "epoch": 0.7, "learning_rate": 1.4806760673416646e-05, "loss": 2.2523, "step": 403620 }, { "epoch": 0.7, "learning_rate": 1.4805888733489818e-05, "loss": 2.29, "step": 403630 }, { "epoch": 0.7, "learning_rate": 1.4805016793562993e-05, "loss": 2.2832, "step": 403640 }, { "epoch": 0.7, "learning_rate": 1.4804144853636165e-05, "loss": 2.3941, "step": 403650 }, { "epoch": 0.7, "learning_rate": 1.4803272913709337e-05, "loss": 2.347, "step": 403660 }, { "epoch": 0.7, "learning_rate": 1.480240097378251e-05, "loss": 2.3361, "step": 403670 }, { "epoch": 0.7, "learning_rate": 1.4801529033855685e-05, "loss": 2.2824, "step": 403680 }, { "epoch": 0.7, "learning_rate": 1.4800657093928857e-05, "loss": 2.2824, "step": 403690 }, { "epoch": 0.7, "learning_rate": 1.479978515400203e-05, "loss": 2.3557, "step": 403700 }, { "epoch": 0.7, "learning_rate": 1.4798913214075204e-05, "loss": 2.3189, "step": 403710 }, { "epoch": 0.7, "learning_rate": 1.4798041274148378e-05, "loss": 2.3162, "step": 403720 }, { "epoch": 0.7, "learning_rate": 1.479716933422155e-05, "loss": 2.2994, "step": 403730 }, { "epoch": 0.7, "learning_rate": 1.4796297394294722e-05, "loss": 2.3294, "step": 403740 }, { "epoch": 0.7, "learning_rate": 1.4795425454367898e-05, "loss": 2.3543, "step": 403750 }, { "epoch": 0.7, "learning_rate": 1.479455351444107e-05, "loss": 2.3779, "step": 403760 }, { "epoch": 0.7, "learning_rate": 1.4793681574514242e-05, "loss": 2.2753, "step": 403770 }, { "epoch": 0.7, "learning_rate": 1.4792809634587416e-05, "loss": 2.2847, "step": 403780 }, { "epoch": 0.7, "learning_rate": 1.479193769466059e-05, "loss": 2.3245, "step": 403790 }, { "epoch": 0.7, "learning_rate": 1.4791065754733763e-05, "loss": 2.3493, "step": 403800 }, { "epoch": 0.7, "learning_rate": 1.4790193814806935e-05, "loss": 2.3645, "step": 403810 }, { "epoch": 0.7, "learning_rate": 1.4789321874880107e-05, "loss": 2.4687, "step": 403820 }, { "epoch": 0.7, "learning_rate": 1.4788449934953283e-05, "loss": 2.302, "step": 403830 }, { "epoch": 0.7, "learning_rate": 1.4787577995026455e-05, "loss": 2.3528, "step": 403840 }, { "epoch": 0.7, "learning_rate": 1.4786706055099627e-05, "loss": 2.2615, "step": 403850 }, { "epoch": 0.7, "learning_rate": 1.4785834115172802e-05, "loss": 2.2823, "step": 403860 }, { "epoch": 0.7, "learning_rate": 1.4784962175245976e-05, "loss": 2.2736, "step": 403870 }, { "epoch": 0.7, "learning_rate": 1.4784090235319148e-05, "loss": 2.3577, "step": 403880 }, { "epoch": 0.7, "learning_rate": 1.478321829539232e-05, "loss": 2.2179, "step": 403890 }, { "epoch": 0.7, "learning_rate": 1.4782346355465496e-05, "loss": 2.4429, "step": 403900 }, { "epoch": 0.7, "learning_rate": 1.4781474415538668e-05, "loss": 2.3053, "step": 403910 }, { "epoch": 0.7, "learning_rate": 1.478060247561184e-05, "loss": 2.2781, "step": 403920 }, { "epoch": 0.7, "learning_rate": 1.4779730535685014e-05, "loss": 2.4213, "step": 403930 }, { "epoch": 0.7, "learning_rate": 1.4778858595758188e-05, "loss": 2.4395, "step": 403940 }, { "epoch": 0.7, "learning_rate": 1.4777986655831361e-05, "loss": 2.2535, "step": 403950 }, { "epoch": 0.7, "learning_rate": 1.4777114715904533e-05, "loss": 2.2925, "step": 403960 }, { "epoch": 0.7, "learning_rate": 1.4776242775977705e-05, "loss": 2.3395, "step": 403970 }, { "epoch": 0.7, "learning_rate": 1.4775370836050881e-05, "loss": 2.2903, "step": 403980 }, { "epoch": 0.7, "learning_rate": 1.4774498896124053e-05, "loss": 2.3215, "step": 403990 }, { "epoch": 0.7, "learning_rate": 1.4773626956197225e-05, "loss": 2.2772, "step": 404000 }, { "epoch": 0.7, "learning_rate": 1.47727550162704e-05, "loss": 2.3939, "step": 404010 }, { "epoch": 0.7, "learning_rate": 1.4771883076343573e-05, "loss": 2.2796, "step": 404020 }, { "epoch": 0.7, "learning_rate": 1.4771011136416746e-05, "loss": 2.2946, "step": 404030 }, { "epoch": 0.7, "learning_rate": 1.4770139196489918e-05, "loss": 2.2736, "step": 404040 }, { "epoch": 0.7, "learning_rate": 1.4769267256563094e-05, "loss": 2.2854, "step": 404050 }, { "epoch": 0.7, "learning_rate": 1.4768395316636266e-05, "loss": 2.3291, "step": 404060 }, { "epoch": 0.7, "learning_rate": 1.4767523376709438e-05, "loss": 2.2812, "step": 404070 }, { "epoch": 0.7, "learning_rate": 1.476665143678261e-05, "loss": 2.317, "step": 404080 }, { "epoch": 0.7, "learning_rate": 1.4765779496855786e-05, "loss": 2.2407, "step": 404090 }, { "epoch": 0.7, "learning_rate": 1.4764907556928958e-05, "loss": 2.2345, "step": 404100 }, { "epoch": 0.7, "learning_rate": 1.4764035617002131e-05, "loss": 2.3509, "step": 404110 }, { "epoch": 0.7, "learning_rate": 1.4763163677075307e-05, "loss": 2.194, "step": 404120 }, { "epoch": 0.7, "learning_rate": 1.4762291737148479e-05, "loss": 2.4011, "step": 404130 }, { "epoch": 0.7, "learning_rate": 1.4761419797221651e-05, "loss": 2.2844, "step": 404140 }, { "epoch": 0.7, "learning_rate": 1.4760547857294823e-05, "loss": 2.3464, "step": 404150 }, { "epoch": 0.7, "learning_rate": 1.4759675917367999e-05, "loss": 2.2672, "step": 404160 }, { "epoch": 0.7, "learning_rate": 1.475880397744117e-05, "loss": 2.2867, "step": 404170 }, { "epoch": 0.7, "learning_rate": 1.4757932037514344e-05, "loss": 2.3923, "step": 404180 }, { "epoch": 0.7, "learning_rate": 1.4757060097587517e-05, "loss": 2.2955, "step": 404190 }, { "epoch": 0.7, "learning_rate": 1.4756188157660692e-05, "loss": 2.292, "step": 404200 }, { "epoch": 0.7, "learning_rate": 1.4755316217733864e-05, "loss": 2.267, "step": 404210 }, { "epoch": 0.7, "learning_rate": 1.4754444277807036e-05, "loss": 2.2697, "step": 404220 }, { "epoch": 0.7, "learning_rate": 1.4753572337880208e-05, "loss": 2.294, "step": 404230 }, { "epoch": 0.7, "learning_rate": 1.4752700397953384e-05, "loss": 2.2056, "step": 404240 }, { "epoch": 0.7, "learning_rate": 1.4751828458026556e-05, "loss": 2.2641, "step": 404250 }, { "epoch": 0.7, "learning_rate": 1.475095651809973e-05, "loss": 2.3967, "step": 404260 }, { "epoch": 0.7, "learning_rate": 1.4750084578172903e-05, "loss": 2.3665, "step": 404270 }, { "epoch": 0.71, "learning_rate": 1.4749212638246077e-05, "loss": 2.2526, "step": 404280 }, { "epoch": 0.71, "learning_rate": 1.474834069831925e-05, "loss": 2.3094, "step": 404290 }, { "epoch": 0.71, "learning_rate": 1.4747468758392421e-05, "loss": 2.2828, "step": 404300 }, { "epoch": 0.71, "learning_rate": 1.4746596818465597e-05, "loss": 2.3039, "step": 404310 }, { "epoch": 0.71, "learning_rate": 1.4745724878538769e-05, "loss": 2.4298, "step": 404320 }, { "epoch": 0.71, "learning_rate": 1.4744852938611941e-05, "loss": 2.3901, "step": 404330 }, { "epoch": 0.71, "learning_rate": 1.4743980998685115e-05, "loss": 2.4151, "step": 404340 }, { "epoch": 0.71, "learning_rate": 1.474310905875829e-05, "loss": 2.3485, "step": 404350 }, { "epoch": 0.71, "learning_rate": 1.4742237118831462e-05, "loss": 2.2297, "step": 404360 }, { "epoch": 0.71, "learning_rate": 1.4741365178904634e-05, "loss": 2.3955, "step": 404370 }, { "epoch": 0.71, "learning_rate": 1.474049323897781e-05, "loss": 2.3048, "step": 404380 }, { "epoch": 0.71, "learning_rate": 1.4739621299050982e-05, "loss": 2.3284, "step": 404390 }, { "epoch": 0.71, "learning_rate": 1.4738749359124154e-05, "loss": 2.2376, "step": 404400 }, { "epoch": 0.71, "learning_rate": 1.4737877419197326e-05, "loss": 2.2969, "step": 404410 }, { "epoch": 0.71, "learning_rate": 1.4737005479270501e-05, "loss": 2.3709, "step": 404420 }, { "epoch": 0.71, "learning_rate": 1.4736133539343675e-05, "loss": 2.2556, "step": 404430 }, { "epoch": 0.71, "learning_rate": 1.4735261599416847e-05, "loss": 2.21, "step": 404440 }, { "epoch": 0.71, "learning_rate": 1.473438965949002e-05, "loss": 2.255, "step": 404450 }, { "epoch": 0.71, "learning_rate": 1.4733517719563195e-05, "loss": 2.1935, "step": 404460 }, { "epoch": 0.71, "learning_rate": 1.4732645779636367e-05, "loss": 2.3582, "step": 404470 }, { "epoch": 0.71, "learning_rate": 1.4731773839709539e-05, "loss": 2.268, "step": 404480 }, { "epoch": 0.71, "learning_rate": 1.4730901899782713e-05, "loss": 2.3245, "step": 404490 }, { "epoch": 0.71, "learning_rate": 1.4730029959855886e-05, "loss": 2.3566, "step": 404500 }, { "epoch": 0.71, "learning_rate": 1.472915801992906e-05, "loss": 2.3303, "step": 404510 }, { "epoch": 0.71, "learning_rate": 1.4728286080002232e-05, "loss": 2.3134, "step": 404520 }, { "epoch": 0.71, "learning_rate": 1.4727414140075408e-05, "loss": 2.316, "step": 404530 }, { "epoch": 0.71, "learning_rate": 1.472654220014858e-05, "loss": 2.3314, "step": 404540 }, { "epoch": 0.71, "learning_rate": 1.4725670260221752e-05, "loss": 2.2756, "step": 404550 }, { "epoch": 0.71, "learning_rate": 1.4724798320294924e-05, "loss": 2.3111, "step": 404560 }, { "epoch": 0.71, "learning_rate": 1.47239263803681e-05, "loss": 2.2404, "step": 404570 }, { "epoch": 0.71, "learning_rate": 1.4723054440441272e-05, "loss": 2.2482, "step": 404580 }, { "epoch": 0.71, "learning_rate": 1.4722182500514445e-05, "loss": 2.2734, "step": 404590 }, { "epoch": 0.71, "learning_rate": 1.4721310560587617e-05, "loss": 2.1869, "step": 404600 }, { "epoch": 0.71, "learning_rate": 1.4720438620660793e-05, "loss": 2.2696, "step": 404610 }, { "epoch": 0.71, "learning_rate": 1.4719566680733965e-05, "loss": 2.3672, "step": 404620 }, { "epoch": 0.71, "learning_rate": 1.4718694740807137e-05, "loss": 2.2506, "step": 404630 }, { "epoch": 0.71, "learning_rate": 1.4717822800880313e-05, "loss": 2.3698, "step": 404640 }, { "epoch": 0.71, "learning_rate": 1.4716950860953485e-05, "loss": 2.3726, "step": 404650 }, { "epoch": 0.71, "learning_rate": 1.4716078921026658e-05, "loss": 2.2425, "step": 404660 }, { "epoch": 0.71, "learning_rate": 1.471520698109983e-05, "loss": 2.3471, "step": 404670 }, { "epoch": 0.71, "learning_rate": 1.4714335041173006e-05, "loss": 2.2781, "step": 404680 }, { "epoch": 0.71, "learning_rate": 1.4713463101246178e-05, "loss": 2.2313, "step": 404690 }, { "epoch": 0.71, "learning_rate": 1.471259116131935e-05, "loss": 2.2636, "step": 404700 }, { "epoch": 0.71, "learning_rate": 1.4711719221392522e-05, "loss": 2.3778, "step": 404710 }, { "epoch": 0.71, "learning_rate": 1.4710847281465698e-05, "loss": 2.3587, "step": 404720 }, { "epoch": 0.71, "learning_rate": 1.470997534153887e-05, "loss": 2.3345, "step": 404730 }, { "epoch": 0.71, "learning_rate": 1.4709103401612043e-05, "loss": 2.3122, "step": 404740 }, { "epoch": 0.71, "learning_rate": 1.4708231461685215e-05, "loss": 2.3332, "step": 404750 }, { "epoch": 0.71, "learning_rate": 1.4707359521758391e-05, "loss": 2.2986, "step": 404760 }, { "epoch": 0.71, "learning_rate": 1.4706487581831563e-05, "loss": 2.2207, "step": 404770 }, { "epoch": 0.71, "learning_rate": 1.4705615641904735e-05, "loss": 2.2933, "step": 404780 }, { "epoch": 0.71, "learning_rate": 1.470474370197791e-05, "loss": 2.3005, "step": 404790 }, { "epoch": 0.71, "learning_rate": 1.4703871762051083e-05, "loss": 2.3285, "step": 404800 }, { "epoch": 0.71, "learning_rate": 1.4702999822124255e-05, "loss": 2.4306, "step": 404810 }, { "epoch": 0.71, "learning_rate": 1.4702127882197429e-05, "loss": 2.185, "step": 404820 }, { "epoch": 0.71, "learning_rate": 1.4701255942270602e-05, "loss": 2.3834, "step": 404830 }, { "epoch": 0.71, "learning_rate": 1.4700384002343776e-05, "loss": 2.3335, "step": 404840 }, { "epoch": 0.71, "learning_rate": 1.4699512062416948e-05, "loss": 2.3367, "step": 404850 }, { "epoch": 0.71, "learning_rate": 1.469864012249012e-05, "loss": 2.3473, "step": 404860 }, { "epoch": 0.71, "learning_rate": 1.4697768182563296e-05, "loss": 2.2252, "step": 404870 }, { "epoch": 0.71, "learning_rate": 1.4696896242636468e-05, "loss": 2.3771, "step": 404880 }, { "epoch": 0.71, "learning_rate": 1.469602430270964e-05, "loss": 2.325, "step": 404890 }, { "epoch": 0.71, "learning_rate": 1.4695152362782814e-05, "loss": 2.331, "step": 404900 }, { "epoch": 0.71, "learning_rate": 1.4694280422855989e-05, "loss": 2.3362, "step": 404910 }, { "epoch": 0.71, "learning_rate": 1.4693408482929161e-05, "loss": 2.3556, "step": 404920 }, { "epoch": 0.71, "learning_rate": 1.4692536543002333e-05, "loss": 2.3203, "step": 404930 }, { "epoch": 0.71, "learning_rate": 1.4691664603075509e-05, "loss": 2.4027, "step": 404940 }, { "epoch": 0.71, "learning_rate": 1.469079266314868e-05, "loss": 2.2577, "step": 404950 }, { "epoch": 0.71, "learning_rate": 1.4689920723221853e-05, "loss": 2.2799, "step": 404960 }, { "epoch": 0.71, "learning_rate": 1.4689048783295027e-05, "loss": 2.271, "step": 404970 }, { "epoch": 0.71, "learning_rate": 1.46881768433682e-05, "loss": 2.3234, "step": 404980 }, { "epoch": 0.71, "learning_rate": 1.4687304903441374e-05, "loss": 2.2289, "step": 404990 }, { "epoch": 0.71, "learning_rate": 1.4686432963514546e-05, "loss": 2.2303, "step": 405000 }, { "epoch": 0.71, "learning_rate": 1.4685561023587718e-05, "loss": 2.3355, "step": 405010 }, { "epoch": 0.71, "learning_rate": 1.4684689083660894e-05, "loss": 2.3081, "step": 405020 }, { "epoch": 0.71, "learning_rate": 1.4683817143734066e-05, "loss": 2.2528, "step": 405030 }, { "epoch": 0.71, "learning_rate": 1.4682945203807238e-05, "loss": 2.3264, "step": 405040 }, { "epoch": 0.71, "learning_rate": 1.4682073263880413e-05, "loss": 2.3082, "step": 405050 }, { "epoch": 0.71, "learning_rate": 1.4681201323953585e-05, "loss": 2.3139, "step": 405060 }, { "epoch": 0.71, "learning_rate": 1.468032938402676e-05, "loss": 2.1947, "step": 405070 }, { "epoch": 0.71, "learning_rate": 1.4679457444099931e-05, "loss": 2.336, "step": 405080 }, { "epoch": 0.71, "learning_rate": 1.4678585504173107e-05, "loss": 2.3672, "step": 405090 }, { "epoch": 0.71, "learning_rate": 1.4677713564246279e-05, "loss": 2.2876, "step": 405100 }, { "epoch": 0.71, "learning_rate": 1.4676841624319451e-05, "loss": 2.2318, "step": 405110 }, { "epoch": 0.71, "learning_rate": 1.4675969684392623e-05, "loss": 2.2785, "step": 405120 }, { "epoch": 0.71, "learning_rate": 1.4675097744465798e-05, "loss": 2.26, "step": 405130 }, { "epoch": 0.71, "learning_rate": 1.467422580453897e-05, "loss": 2.2721, "step": 405140 }, { "epoch": 0.71, "learning_rate": 1.4673353864612144e-05, "loss": 2.3147, "step": 405150 }, { "epoch": 0.71, "learning_rate": 1.4672481924685316e-05, "loss": 2.2652, "step": 405160 }, { "epoch": 0.71, "learning_rate": 1.4671609984758492e-05, "loss": 2.3489, "step": 405170 }, { "epoch": 0.71, "learning_rate": 1.4670738044831664e-05, "loss": 2.2394, "step": 405180 }, { "epoch": 0.71, "learning_rate": 1.4669866104904836e-05, "loss": 2.392, "step": 405190 }, { "epoch": 0.71, "learning_rate": 1.4668994164978011e-05, "loss": 2.1843, "step": 405200 }, { "epoch": 0.71, "learning_rate": 1.4668122225051184e-05, "loss": 2.3436, "step": 405210 }, { "epoch": 0.71, "learning_rate": 1.4667250285124357e-05, "loss": 2.3696, "step": 405220 }, { "epoch": 0.71, "learning_rate": 1.466637834519753e-05, "loss": 2.167, "step": 405230 }, { "epoch": 0.71, "learning_rate": 1.4665506405270705e-05, "loss": 2.325, "step": 405240 }, { "epoch": 0.71, "learning_rate": 1.4664634465343877e-05, "loss": 2.2067, "step": 405250 }, { "epoch": 0.71, "learning_rate": 1.4663762525417049e-05, "loss": 2.4072, "step": 405260 }, { "epoch": 0.71, "learning_rate": 1.4662890585490221e-05, "loss": 2.33, "step": 405270 }, { "epoch": 0.71, "learning_rate": 1.4662018645563397e-05, "loss": 2.3152, "step": 405280 }, { "epoch": 0.71, "learning_rate": 1.4661146705636569e-05, "loss": 2.247, "step": 405290 }, { "epoch": 0.71, "learning_rate": 1.4660274765709742e-05, "loss": 2.3903, "step": 405300 }, { "epoch": 0.71, "learning_rate": 1.4659402825782916e-05, "loss": 2.3047, "step": 405310 }, { "epoch": 0.71, "learning_rate": 1.465853088585609e-05, "loss": 2.2341, "step": 405320 }, { "epoch": 0.71, "learning_rate": 1.4657658945929262e-05, "loss": 2.2593, "step": 405330 }, { "epoch": 0.71, "learning_rate": 1.4656787006002434e-05, "loss": 2.2686, "step": 405340 }, { "epoch": 0.71, "learning_rate": 1.465591506607561e-05, "loss": 2.3717, "step": 405350 }, { "epoch": 0.71, "learning_rate": 1.4655043126148782e-05, "loss": 2.3166, "step": 405360 }, { "epoch": 0.71, "learning_rate": 1.4654171186221954e-05, "loss": 2.3889, "step": 405370 }, { "epoch": 0.71, "learning_rate": 1.4653299246295127e-05, "loss": 2.2835, "step": 405380 }, { "epoch": 0.71, "learning_rate": 1.4652427306368303e-05, "loss": 2.2791, "step": 405390 }, { "epoch": 0.71, "learning_rate": 1.4651555366441475e-05, "loss": 2.3842, "step": 405400 }, { "epoch": 0.71, "learning_rate": 1.4650683426514647e-05, "loss": 2.3392, "step": 405410 }, { "epoch": 0.71, "learning_rate": 1.4649811486587819e-05, "loss": 2.3122, "step": 405420 }, { "epoch": 0.71, "learning_rate": 1.4648939546660995e-05, "loss": 2.3388, "step": 405430 }, { "epoch": 0.71, "learning_rate": 1.4648067606734167e-05, "loss": 2.3371, "step": 405440 }, { "epoch": 0.71, "learning_rate": 1.4647195666807339e-05, "loss": 2.342, "step": 405450 }, { "epoch": 0.71, "learning_rate": 1.4646323726880514e-05, "loss": 2.2974, "step": 405460 }, { "epoch": 0.71, "learning_rate": 1.4645451786953688e-05, "loss": 2.2981, "step": 405470 }, { "epoch": 0.71, "learning_rate": 1.464457984702686e-05, "loss": 2.2609, "step": 405480 }, { "epoch": 0.71, "learning_rate": 1.4643707907100032e-05, "loss": 2.3585, "step": 405490 }, { "epoch": 0.71, "learning_rate": 1.4642835967173208e-05, "loss": 2.2998, "step": 405500 }, { "epoch": 0.71, "learning_rate": 1.464196402724638e-05, "loss": 2.3295, "step": 405510 }, { "epoch": 0.71, "learning_rate": 1.4641092087319552e-05, "loss": 2.3237, "step": 405520 }, { "epoch": 0.71, "learning_rate": 1.4640220147392726e-05, "loss": 2.2822, "step": 405530 }, { "epoch": 0.71, "learning_rate": 1.46393482074659e-05, "loss": 2.259, "step": 405540 }, { "epoch": 0.71, "learning_rate": 1.4638476267539073e-05, "loss": 2.2917, "step": 405550 }, { "epoch": 0.71, "learning_rate": 1.4637604327612245e-05, "loss": 2.2778, "step": 405560 }, { "epoch": 0.71, "learning_rate": 1.463673238768542e-05, "loss": 2.2588, "step": 405570 }, { "epoch": 0.71, "learning_rate": 1.4635860447758593e-05, "loss": 2.3896, "step": 405580 }, { "epoch": 0.71, "learning_rate": 1.4634988507831765e-05, "loss": 2.2729, "step": 405590 }, { "epoch": 0.71, "learning_rate": 1.4634116567904937e-05, "loss": 2.2293, "step": 405600 }, { "epoch": 0.71, "learning_rate": 1.4633244627978112e-05, "loss": 2.2916, "step": 405610 }, { "epoch": 0.71, "learning_rate": 1.4632372688051284e-05, "loss": 2.341, "step": 405620 }, { "epoch": 0.71, "learning_rate": 1.4631500748124458e-05, "loss": 2.3481, "step": 405630 }, { "epoch": 0.71, "learning_rate": 1.463062880819763e-05, "loss": 2.3005, "step": 405640 }, { "epoch": 0.71, "learning_rate": 1.4629756868270806e-05, "loss": 2.2919, "step": 405650 }, { "epoch": 0.71, "learning_rate": 1.4628884928343978e-05, "loss": 2.2994, "step": 405660 }, { "epoch": 0.71, "learning_rate": 1.462801298841715e-05, "loss": 2.1775, "step": 405670 }, { "epoch": 0.71, "learning_rate": 1.4627141048490322e-05, "loss": 2.2564, "step": 405680 }, { "epoch": 0.71, "learning_rate": 1.4626269108563497e-05, "loss": 2.3848, "step": 405690 }, { "epoch": 0.71, "learning_rate": 1.4625397168636671e-05, "loss": 2.3866, "step": 405700 }, { "epoch": 0.71, "learning_rate": 1.4624525228709843e-05, "loss": 2.3366, "step": 405710 }, { "epoch": 0.71, "learning_rate": 1.4623653288783019e-05, "loss": 2.2779, "step": 405720 }, { "epoch": 0.71, "learning_rate": 1.462278134885619e-05, "loss": 2.3646, "step": 405730 }, { "epoch": 0.71, "learning_rate": 1.4621909408929363e-05, "loss": 2.3205, "step": 405740 }, { "epoch": 0.71, "learning_rate": 1.4621037469002535e-05, "loss": 2.3229, "step": 405750 }, { "epoch": 0.71, "learning_rate": 1.462016552907571e-05, "loss": 2.2258, "step": 405760 }, { "epoch": 0.71, "learning_rate": 1.4619293589148882e-05, "loss": 2.2275, "step": 405770 }, { "epoch": 0.71, "learning_rate": 1.4618421649222056e-05, "loss": 2.3233, "step": 405780 }, { "epoch": 0.71, "learning_rate": 1.4617549709295228e-05, "loss": 2.4321, "step": 405790 }, { "epoch": 0.71, "learning_rate": 1.4616677769368404e-05, "loss": 2.2646, "step": 405800 }, { "epoch": 0.71, "learning_rate": 1.4615805829441576e-05, "loss": 2.3205, "step": 405810 }, { "epoch": 0.71, "learning_rate": 1.4614933889514748e-05, "loss": 2.3677, "step": 405820 }, { "epoch": 0.71, "learning_rate": 1.461406194958792e-05, "loss": 2.3217, "step": 405830 }, { "epoch": 0.71, "learning_rate": 1.4613190009661095e-05, "loss": 2.2297, "step": 405840 }, { "epoch": 0.71, "learning_rate": 1.4612318069734268e-05, "loss": 2.1955, "step": 405850 }, { "epoch": 0.71, "learning_rate": 1.4611446129807441e-05, "loss": 2.3676, "step": 405860 }, { "epoch": 0.71, "learning_rate": 1.4610574189880615e-05, "loss": 2.2545, "step": 405870 }, { "epoch": 0.71, "learning_rate": 1.4609702249953789e-05, "loss": 2.3455, "step": 405880 }, { "epoch": 0.71, "learning_rate": 1.4608830310026961e-05, "loss": 2.2587, "step": 405890 }, { "epoch": 0.71, "learning_rate": 1.4607958370100133e-05, "loss": 2.3584, "step": 405900 }, { "epoch": 0.71, "learning_rate": 1.4607086430173308e-05, "loss": 2.2252, "step": 405910 }, { "epoch": 0.71, "learning_rate": 1.460621449024648e-05, "loss": 2.3208, "step": 405920 }, { "epoch": 0.71, "learning_rate": 1.4605342550319653e-05, "loss": 2.3625, "step": 405930 }, { "epoch": 0.71, "learning_rate": 1.4604470610392826e-05, "loss": 2.2457, "step": 405940 }, { "epoch": 0.71, "learning_rate": 1.4603598670466002e-05, "loss": 2.2162, "step": 405950 }, { "epoch": 0.71, "learning_rate": 1.4602726730539174e-05, "loss": 2.2952, "step": 405960 }, { "epoch": 0.71, "learning_rate": 1.4601854790612346e-05, "loss": 2.3628, "step": 405970 }, { "epoch": 0.71, "learning_rate": 1.4600982850685521e-05, "loss": 2.3549, "step": 405980 }, { "epoch": 0.71, "learning_rate": 1.4600110910758694e-05, "loss": 2.3194, "step": 405990 }, { "epoch": 0.71, "learning_rate": 1.4599238970831866e-05, "loss": 2.3571, "step": 406000 }, { "epoch": 0.71, "learning_rate": 1.459836703090504e-05, "loss": 2.3875, "step": 406010 }, { "epoch": 0.71, "learning_rate": 1.4597495090978213e-05, "loss": 2.3327, "step": 406020 }, { "epoch": 0.71, "learning_rate": 1.4596623151051387e-05, "loss": 2.2434, "step": 406030 }, { "epoch": 0.71, "learning_rate": 1.4595751211124559e-05, "loss": 2.2908, "step": 406040 }, { "epoch": 0.71, "learning_rate": 1.4594879271197731e-05, "loss": 2.2484, "step": 406050 }, { "epoch": 0.71, "learning_rate": 1.4594007331270907e-05, "loss": 2.2777, "step": 406060 }, { "epoch": 0.71, "learning_rate": 1.4593135391344079e-05, "loss": 2.3066, "step": 406070 }, { "epoch": 0.71, "learning_rate": 1.459226345141725e-05, "loss": 2.2157, "step": 406080 }, { "epoch": 0.71, "learning_rate": 1.4591391511490424e-05, "loss": 2.2501, "step": 406090 }, { "epoch": 0.71, "learning_rate": 1.4590519571563598e-05, "loss": 2.3046, "step": 406100 }, { "epoch": 0.71, "learning_rate": 1.4589647631636772e-05, "loss": 2.3513, "step": 406110 }, { "epoch": 0.71, "learning_rate": 1.4588775691709944e-05, "loss": 2.302, "step": 406120 }, { "epoch": 0.71, "learning_rate": 1.458790375178312e-05, "loss": 2.3496, "step": 406130 }, { "epoch": 0.71, "learning_rate": 1.4587031811856292e-05, "loss": 2.3269, "step": 406140 }, { "epoch": 0.71, "learning_rate": 1.4586159871929464e-05, "loss": 2.3033, "step": 406150 }, { "epoch": 0.71, "learning_rate": 1.4585287932002636e-05, "loss": 2.2392, "step": 406160 }, { "epoch": 0.71, "learning_rate": 1.4584415992075811e-05, "loss": 2.2866, "step": 406170 }, { "epoch": 0.71, "learning_rate": 1.4583544052148983e-05, "loss": 2.3122, "step": 406180 }, { "epoch": 0.71, "learning_rate": 1.4582672112222157e-05, "loss": 2.3633, "step": 406190 }, { "epoch": 0.71, "learning_rate": 1.4581800172295329e-05, "loss": 2.427, "step": 406200 }, { "epoch": 0.71, "learning_rate": 1.4580928232368505e-05, "loss": 2.4307, "step": 406210 }, { "epoch": 0.71, "learning_rate": 1.4580056292441677e-05, "loss": 2.3017, "step": 406220 }, { "epoch": 0.71, "learning_rate": 1.4579184352514849e-05, "loss": 2.3263, "step": 406230 }, { "epoch": 0.71, "learning_rate": 1.4578312412588024e-05, "loss": 2.3203, "step": 406240 }, { "epoch": 0.71, "learning_rate": 1.4577440472661196e-05, "loss": 2.2139, "step": 406250 }, { "epoch": 0.71, "learning_rate": 1.457656853273437e-05, "loss": 2.1539, "step": 406260 }, { "epoch": 0.71, "learning_rate": 1.4575696592807542e-05, "loss": 2.3035, "step": 406270 }, { "epoch": 0.71, "learning_rate": 1.4574824652880718e-05, "loss": 2.3462, "step": 406280 }, { "epoch": 0.71, "learning_rate": 1.457395271295389e-05, "loss": 2.2276, "step": 406290 }, { "epoch": 0.71, "learning_rate": 1.4573080773027062e-05, "loss": 2.3536, "step": 406300 }, { "epoch": 0.71, "learning_rate": 1.4572208833100234e-05, "loss": 2.2612, "step": 406310 }, { "epoch": 0.71, "learning_rate": 1.457133689317341e-05, "loss": 2.3002, "step": 406320 }, { "epoch": 0.71, "learning_rate": 1.4570464953246581e-05, "loss": 2.2195, "step": 406330 }, { "epoch": 0.71, "learning_rate": 1.4569593013319755e-05, "loss": 2.2572, "step": 406340 }, { "epoch": 0.71, "learning_rate": 1.4568721073392927e-05, "loss": 2.3544, "step": 406350 }, { "epoch": 0.71, "learning_rate": 1.4567849133466103e-05, "loss": 2.1754, "step": 406360 }, { "epoch": 0.71, "learning_rate": 1.4566977193539275e-05, "loss": 2.1899, "step": 406370 }, { "epoch": 0.71, "learning_rate": 1.4566105253612447e-05, "loss": 2.2235, "step": 406380 }, { "epoch": 0.71, "learning_rate": 1.4565233313685622e-05, "loss": 2.2945, "step": 406390 }, { "epoch": 0.71, "learning_rate": 1.4564361373758794e-05, "loss": 2.3305, "step": 406400 }, { "epoch": 0.71, "learning_rate": 1.4563489433831966e-05, "loss": 2.2789, "step": 406410 }, { "epoch": 0.71, "learning_rate": 1.456261749390514e-05, "loss": 2.327, "step": 406420 }, { "epoch": 0.71, "learning_rate": 1.4561745553978316e-05, "loss": 2.1705, "step": 406430 }, { "epoch": 0.71, "learning_rate": 1.4560873614051488e-05, "loss": 2.3384, "step": 406440 }, { "epoch": 0.71, "learning_rate": 1.456000167412466e-05, "loss": 2.1935, "step": 406450 }, { "epoch": 0.71, "learning_rate": 1.4559129734197832e-05, "loss": 2.2937, "step": 406460 }, { "epoch": 0.71, "learning_rate": 1.4558257794271007e-05, "loss": 2.2786, "step": 406470 }, { "epoch": 0.71, "learning_rate": 1.455738585434418e-05, "loss": 2.2411, "step": 406480 }, { "epoch": 0.71, "learning_rate": 1.4556513914417352e-05, "loss": 2.3001, "step": 406490 }, { "epoch": 0.71, "learning_rate": 1.4555641974490527e-05, "loss": 2.3357, "step": 406500 }, { "epoch": 0.71, "learning_rate": 1.45547700345637e-05, "loss": 2.3119, "step": 406510 }, { "epoch": 0.71, "learning_rate": 1.4553898094636873e-05, "loss": 2.3392, "step": 406520 }, { "epoch": 0.71, "learning_rate": 1.4553026154710045e-05, "loss": 2.2411, "step": 406530 }, { "epoch": 0.71, "learning_rate": 1.455215421478322e-05, "loss": 2.2285, "step": 406540 }, { "epoch": 0.71, "learning_rate": 1.4551282274856392e-05, "loss": 2.3513, "step": 406550 }, { "epoch": 0.71, "learning_rate": 1.4550410334929565e-05, "loss": 2.3249, "step": 406560 }, { "epoch": 0.71, "learning_rate": 1.4549538395002738e-05, "loss": 2.2917, "step": 406570 }, { "epoch": 0.71, "learning_rate": 1.4548666455075912e-05, "loss": 2.3717, "step": 406580 }, { "epoch": 0.71, "learning_rate": 1.4547794515149086e-05, "loss": 2.185, "step": 406590 }, { "epoch": 0.71, "learning_rate": 1.4546922575222258e-05, "loss": 2.2745, "step": 406600 }, { "epoch": 0.71, "learning_rate": 1.454605063529543e-05, "loss": 2.2326, "step": 406610 }, { "epoch": 0.71, "learning_rate": 1.4545178695368605e-05, "loss": 2.3097, "step": 406620 }, { "epoch": 0.71, "learning_rate": 1.4544306755441778e-05, "loss": 2.1192, "step": 406630 }, { "epoch": 0.71, "learning_rate": 1.454343481551495e-05, "loss": 2.3642, "step": 406640 }, { "epoch": 0.71, "learning_rate": 1.4542562875588125e-05, "loss": 2.4093, "step": 406650 }, { "epoch": 0.71, "learning_rate": 1.4541690935661297e-05, "loss": 2.2512, "step": 406660 }, { "epoch": 0.71, "learning_rate": 1.4540818995734471e-05, "loss": 2.2511, "step": 406670 }, { "epoch": 0.71, "learning_rate": 1.4539947055807643e-05, "loss": 2.2553, "step": 406680 }, { "epoch": 0.71, "learning_rate": 1.4539075115880818e-05, "loss": 2.3681, "step": 406690 }, { "epoch": 0.71, "learning_rate": 1.453820317595399e-05, "loss": 2.3349, "step": 406700 }, { "epoch": 0.71, "learning_rate": 1.4537331236027163e-05, "loss": 2.286, "step": 406710 }, { "epoch": 0.71, "learning_rate": 1.4536459296100335e-05, "loss": 2.3432, "step": 406720 }, { "epoch": 0.71, "learning_rate": 1.453558735617351e-05, "loss": 2.2672, "step": 406730 }, { "epoch": 0.71, "learning_rate": 1.4534715416246684e-05, "loss": 2.3193, "step": 406740 }, { "epoch": 0.71, "learning_rate": 1.4533843476319856e-05, "loss": 2.3213, "step": 406750 }, { "epoch": 0.71, "learning_rate": 1.4532971536393028e-05, "loss": 2.3073, "step": 406760 }, { "epoch": 0.71, "learning_rate": 1.4532099596466204e-05, "loss": 2.3808, "step": 406770 }, { "epoch": 0.71, "learning_rate": 1.4531227656539376e-05, "loss": 2.282, "step": 406780 }, { "epoch": 0.71, "learning_rate": 1.4530355716612548e-05, "loss": 2.3605, "step": 406790 }, { "epoch": 0.71, "learning_rate": 1.4529483776685723e-05, "loss": 2.2274, "step": 406800 }, { "epoch": 0.71, "learning_rate": 1.4528611836758895e-05, "loss": 2.2345, "step": 406810 }, { "epoch": 0.71, "learning_rate": 1.4527739896832069e-05, "loss": 2.3542, "step": 406820 }, { "epoch": 0.71, "learning_rate": 1.4526867956905241e-05, "loss": 2.3284, "step": 406830 }, { "epoch": 0.71, "learning_rate": 1.4525996016978417e-05, "loss": 2.3225, "step": 406840 }, { "epoch": 0.71, "learning_rate": 1.4525124077051589e-05, "loss": 2.3539, "step": 406850 }, { "epoch": 0.71, "learning_rate": 1.452425213712476e-05, "loss": 2.2642, "step": 406860 }, { "epoch": 0.71, "learning_rate": 1.4523380197197933e-05, "loss": 2.1956, "step": 406870 }, { "epoch": 0.71, "learning_rate": 1.4522508257271108e-05, "loss": 2.3357, "step": 406880 }, { "epoch": 0.71, "learning_rate": 1.452163631734428e-05, "loss": 2.2694, "step": 406890 }, { "epoch": 0.71, "learning_rate": 1.4520764377417454e-05, "loss": 2.2282, "step": 406900 }, { "epoch": 0.71, "learning_rate": 1.4519892437490628e-05, "loss": 2.2994, "step": 406910 }, { "epoch": 0.71, "learning_rate": 1.4519020497563802e-05, "loss": 2.27, "step": 406920 }, { "epoch": 0.71, "learning_rate": 1.4518148557636974e-05, "loss": 2.2855, "step": 406930 }, { "epoch": 0.71, "learning_rate": 1.4517276617710146e-05, "loss": 2.4237, "step": 406940 }, { "epoch": 0.71, "learning_rate": 1.4516404677783321e-05, "loss": 2.3458, "step": 406950 }, { "epoch": 0.71, "learning_rate": 1.4515532737856493e-05, "loss": 2.308, "step": 406960 }, { "epoch": 0.71, "learning_rate": 1.4514660797929665e-05, "loss": 2.303, "step": 406970 }, { "epoch": 0.71, "learning_rate": 1.4513788858002839e-05, "loss": 2.2444, "step": 406980 }, { "epoch": 0.71, "learning_rate": 1.4512916918076015e-05, "loss": 2.1528, "step": 406990 }, { "epoch": 0.71, "learning_rate": 1.4512044978149187e-05, "loss": 2.3256, "step": 407000 }, { "epoch": 0.71, "learning_rate": 1.4511173038222359e-05, "loss": 2.354, "step": 407010 }, { "epoch": 0.71, "learning_rate": 1.451030109829553e-05, "loss": 2.4322, "step": 407020 }, { "epoch": 0.71, "learning_rate": 1.4509429158368706e-05, "loss": 2.355, "step": 407030 }, { "epoch": 0.71, "learning_rate": 1.4508557218441878e-05, "loss": 2.263, "step": 407040 }, { "epoch": 0.71, "learning_rate": 1.4507685278515052e-05, "loss": 2.2444, "step": 407050 }, { "epoch": 0.71, "learning_rate": 1.4506813338588226e-05, "loss": 2.2639, "step": 407060 }, { "epoch": 0.71, "learning_rate": 1.45059413986614e-05, "loss": 2.3254, "step": 407070 }, { "epoch": 0.71, "learning_rate": 1.4505069458734572e-05, "loss": 2.2285, "step": 407080 }, { "epoch": 0.71, "learning_rate": 1.4504197518807744e-05, "loss": 2.1984, "step": 407090 }, { "epoch": 0.71, "learning_rate": 1.450332557888092e-05, "loss": 2.4729, "step": 407100 }, { "epoch": 0.71, "learning_rate": 1.4502453638954091e-05, "loss": 2.2883, "step": 407110 }, { "epoch": 0.71, "learning_rate": 1.4501581699027263e-05, "loss": 2.238, "step": 407120 }, { "epoch": 0.71, "learning_rate": 1.4500709759100437e-05, "loss": 2.2113, "step": 407130 }, { "epoch": 0.71, "learning_rate": 1.4499837819173611e-05, "loss": 2.3442, "step": 407140 }, { "epoch": 0.71, "learning_rate": 1.4498965879246785e-05, "loss": 2.2011, "step": 407150 }, { "epoch": 0.71, "learning_rate": 1.4498093939319957e-05, "loss": 2.407, "step": 407160 }, { "epoch": 0.71, "learning_rate": 1.4497221999393132e-05, "loss": 2.361, "step": 407170 }, { "epoch": 0.71, "learning_rate": 1.4496350059466304e-05, "loss": 2.2028, "step": 407180 }, { "epoch": 0.71, "learning_rate": 1.4495478119539476e-05, "loss": 2.3988, "step": 407190 }, { "epoch": 0.71, "learning_rate": 1.4494606179612649e-05, "loss": 2.2833, "step": 407200 }, { "epoch": 0.71, "learning_rate": 1.4493734239685824e-05, "loss": 2.3814, "step": 407210 }, { "epoch": 0.71, "learning_rate": 1.4492862299758996e-05, "loss": 2.3984, "step": 407220 }, { "epoch": 0.71, "learning_rate": 1.449199035983217e-05, "loss": 2.4355, "step": 407230 }, { "epoch": 0.71, "learning_rate": 1.4491118419905342e-05, "loss": 2.3801, "step": 407240 }, { "epoch": 0.71, "learning_rate": 1.4490246479978517e-05, "loss": 2.3082, "step": 407250 }, { "epoch": 0.71, "learning_rate": 1.448937454005169e-05, "loss": 2.3526, "step": 407260 }, { "epoch": 0.71, "learning_rate": 1.4488502600124862e-05, "loss": 2.2429, "step": 407270 }, { "epoch": 0.71, "learning_rate": 1.4487630660198034e-05, "loss": 2.3291, "step": 407280 }, { "epoch": 0.71, "learning_rate": 1.4486758720271209e-05, "loss": 2.2962, "step": 407290 }, { "epoch": 0.71, "learning_rate": 1.4485886780344383e-05, "loss": 2.228, "step": 407300 }, { "epoch": 0.71, "learning_rate": 1.4485014840417555e-05, "loss": 2.3131, "step": 407310 }, { "epoch": 0.71, "learning_rate": 1.448414290049073e-05, "loss": 2.2817, "step": 407320 }, { "epoch": 0.71, "learning_rate": 1.4483270960563902e-05, "loss": 2.3272, "step": 407330 }, { "epoch": 0.71, "learning_rate": 1.4482399020637075e-05, "loss": 2.3096, "step": 407340 }, { "epoch": 0.71, "learning_rate": 1.4481527080710247e-05, "loss": 2.3315, "step": 407350 }, { "epoch": 0.71, "learning_rate": 1.4480655140783422e-05, "loss": 2.3018, "step": 407360 }, { "epoch": 0.71, "learning_rate": 1.4479783200856594e-05, "loss": 2.322, "step": 407370 }, { "epoch": 0.71, "learning_rate": 1.4478911260929768e-05, "loss": 2.3497, "step": 407380 }, { "epoch": 0.71, "learning_rate": 1.447803932100294e-05, "loss": 2.2925, "step": 407390 }, { "epoch": 0.71, "learning_rate": 1.4477167381076115e-05, "loss": 2.2791, "step": 407400 }, { "epoch": 0.71, "learning_rate": 1.4476295441149288e-05, "loss": 2.3135, "step": 407410 }, { "epoch": 0.71, "learning_rate": 1.447542350122246e-05, "loss": 2.2977, "step": 407420 }, { "epoch": 0.71, "learning_rate": 1.4474551561295635e-05, "loss": 2.3538, "step": 407430 }, { "epoch": 0.71, "learning_rate": 1.4473679621368807e-05, "loss": 2.3209, "step": 407440 }, { "epoch": 0.71, "learning_rate": 1.447280768144198e-05, "loss": 2.2611, "step": 407450 }, { "epoch": 0.71, "learning_rate": 1.4471935741515153e-05, "loss": 2.2475, "step": 407460 }, { "epoch": 0.71, "learning_rate": 1.4471063801588328e-05, "loss": 2.389, "step": 407470 }, { "epoch": 0.71, "learning_rate": 1.44701918616615e-05, "loss": 2.2823, "step": 407480 }, { "epoch": 0.71, "learning_rate": 1.4469319921734673e-05, "loss": 2.2456, "step": 407490 }, { "epoch": 0.71, "learning_rate": 1.4468447981807845e-05, "loss": 2.2022, "step": 407500 }, { "epoch": 0.71, "learning_rate": 1.446757604188102e-05, "loss": 2.3355, "step": 407510 }, { "epoch": 0.71, "learning_rate": 1.4466704101954192e-05, "loss": 2.3167, "step": 407520 }, { "epoch": 0.71, "learning_rate": 1.4465832162027364e-05, "loss": 2.2937, "step": 407530 }, { "epoch": 0.71, "learning_rate": 1.4464960222100538e-05, "loss": 2.308, "step": 407540 }, { "epoch": 0.71, "learning_rate": 1.4464088282173714e-05, "loss": 2.3358, "step": 407550 }, { "epoch": 0.71, "learning_rate": 1.4463216342246886e-05, "loss": 2.3867, "step": 407560 }, { "epoch": 0.71, "learning_rate": 1.4462344402320058e-05, "loss": 2.2005, "step": 407570 }, { "epoch": 0.71, "learning_rate": 1.4461472462393233e-05, "loss": 2.2486, "step": 407580 }, { "epoch": 0.71, "learning_rate": 1.4460600522466405e-05, "loss": 2.3812, "step": 407590 }, { "epoch": 0.71, "learning_rate": 1.4459728582539577e-05, "loss": 2.2572, "step": 407600 }, { "epoch": 0.71, "learning_rate": 1.4458856642612751e-05, "loss": 2.3243, "step": 407610 }, { "epoch": 0.71, "learning_rate": 1.4457984702685925e-05, "loss": 2.1795, "step": 407620 }, { "epoch": 0.71, "learning_rate": 1.4457112762759099e-05, "loss": 2.3515, "step": 407630 }, { "epoch": 0.71, "learning_rate": 1.445624082283227e-05, "loss": 2.3927, "step": 407640 }, { "epoch": 0.71, "learning_rate": 1.4455368882905443e-05, "loss": 2.3575, "step": 407650 }, { "epoch": 0.71, "learning_rate": 1.4454496942978618e-05, "loss": 2.3282, "step": 407660 }, { "epoch": 0.71, "learning_rate": 1.445362500305179e-05, "loss": 2.1839, "step": 407670 }, { "epoch": 0.71, "learning_rate": 1.4452753063124962e-05, "loss": 2.2535, "step": 407680 }, { "epoch": 0.71, "learning_rate": 1.4451881123198136e-05, "loss": 2.4169, "step": 407690 }, { "epoch": 0.71, "learning_rate": 1.445100918327131e-05, "loss": 2.2609, "step": 407700 }, { "epoch": 0.71, "learning_rate": 1.4450137243344484e-05, "loss": 2.2888, "step": 407710 }, { "epoch": 0.71, "learning_rate": 1.4449265303417656e-05, "loss": 2.1859, "step": 407720 }, { "epoch": 0.71, "learning_rate": 1.4448393363490831e-05, "loss": 2.2598, "step": 407730 }, { "epoch": 0.71, "learning_rate": 1.4447521423564003e-05, "loss": 2.3568, "step": 407740 }, { "epoch": 0.71, "learning_rate": 1.4446649483637175e-05, "loss": 2.1986, "step": 407750 }, { "epoch": 0.71, "learning_rate": 1.4445777543710347e-05, "loss": 2.2994, "step": 407760 }, { "epoch": 0.71, "learning_rate": 1.4444905603783523e-05, "loss": 2.2179, "step": 407770 }, { "epoch": 0.71, "learning_rate": 1.4444033663856697e-05, "loss": 2.2459, "step": 407780 }, { "epoch": 0.71, "learning_rate": 1.4443161723929869e-05, "loss": 2.2763, "step": 407790 }, { "epoch": 0.71, "learning_rate": 1.444228978400304e-05, "loss": 2.2773, "step": 407800 }, { "epoch": 0.71, "learning_rate": 1.4441417844076216e-05, "loss": 2.4279, "step": 407810 }, { "epoch": 0.71, "learning_rate": 1.4440545904149388e-05, "loss": 2.3567, "step": 407820 }, { "epoch": 0.71, "learning_rate": 1.443967396422256e-05, "loss": 2.4124, "step": 407830 }, { "epoch": 0.71, "learning_rate": 1.4438802024295736e-05, "loss": 2.2866, "step": 407840 }, { "epoch": 0.71, "learning_rate": 1.4437930084368908e-05, "loss": 2.2348, "step": 407850 }, { "epoch": 0.71, "learning_rate": 1.4437058144442082e-05, "loss": 2.495, "step": 407860 }, { "epoch": 0.71, "learning_rate": 1.4436186204515254e-05, "loss": 2.2972, "step": 407870 }, { "epoch": 0.71, "learning_rate": 1.443531426458843e-05, "loss": 2.3601, "step": 407880 }, { "epoch": 0.71, "learning_rate": 1.4434442324661601e-05, "loss": 2.4092, "step": 407890 }, { "epoch": 0.71, "learning_rate": 1.4433570384734773e-05, "loss": 2.3152, "step": 407900 }, { "epoch": 0.71, "learning_rate": 1.4432698444807946e-05, "loss": 2.2764, "step": 407910 }, { "epoch": 0.71, "learning_rate": 1.4431826504881121e-05, "loss": 2.2799, "step": 407920 }, { "epoch": 0.71, "learning_rate": 1.4430954564954293e-05, "loss": 2.2807, "step": 407930 }, { "epoch": 0.71, "learning_rate": 1.4430082625027467e-05, "loss": 2.3516, "step": 407940 }, { "epoch": 0.71, "learning_rate": 1.4429210685100639e-05, "loss": 2.249, "step": 407950 }, { "epoch": 0.71, "learning_rate": 1.4428338745173814e-05, "loss": 2.4031, "step": 407960 }, { "epoch": 0.71, "learning_rate": 1.4427466805246986e-05, "loss": 2.2901, "step": 407970 }, { "epoch": 0.71, "learning_rate": 1.4426594865320159e-05, "loss": 2.2195, "step": 407980 }, { "epoch": 0.71, "learning_rate": 1.4425722925393334e-05, "loss": 2.3116, "step": 407990 }, { "epoch": 0.71, "learning_rate": 1.4424850985466506e-05, "loss": 2.2136, "step": 408000 }, { "epoch": 0.71, "learning_rate": 1.4423979045539678e-05, "loss": 2.2927, "step": 408010 }, { "epoch": 0.71, "learning_rate": 1.4423107105612852e-05, "loss": 2.3139, "step": 408020 }, { "epoch": 0.71, "learning_rate": 1.4422235165686027e-05, "loss": 2.425, "step": 408030 }, { "epoch": 0.71, "learning_rate": 1.44213632257592e-05, "loss": 2.3279, "step": 408040 }, { "epoch": 0.71, "learning_rate": 1.4420491285832372e-05, "loss": 2.3102, "step": 408050 }, { "epoch": 0.71, "learning_rate": 1.4419619345905544e-05, "loss": 2.3882, "step": 408060 }, { "epoch": 0.71, "learning_rate": 1.4418747405978719e-05, "loss": 2.2339, "step": 408070 }, { "epoch": 0.71, "learning_rate": 1.4417875466051891e-05, "loss": 2.2357, "step": 408080 }, { "epoch": 0.71, "learning_rate": 1.4417003526125065e-05, "loss": 2.3939, "step": 408090 }, { "epoch": 0.71, "learning_rate": 1.4416131586198239e-05, "loss": 2.3245, "step": 408100 }, { "epoch": 0.71, "learning_rate": 1.4415259646271412e-05, "loss": 2.2751, "step": 408110 }, { "epoch": 0.71, "learning_rate": 1.4414387706344585e-05, "loss": 2.3206, "step": 408120 }, { "epoch": 0.71, "learning_rate": 1.4413515766417757e-05, "loss": 2.2985, "step": 408130 }, { "epoch": 0.71, "learning_rate": 1.4412643826490932e-05, "loss": 2.3406, "step": 408140 }, { "epoch": 0.71, "learning_rate": 1.4411771886564104e-05, "loss": 2.3532, "step": 408150 }, { "epoch": 0.71, "learning_rate": 1.4410899946637276e-05, "loss": 2.2949, "step": 408160 }, { "epoch": 0.71, "learning_rate": 1.441002800671045e-05, "loss": 2.3744, "step": 408170 }, { "epoch": 0.71, "learning_rate": 1.4409156066783624e-05, "loss": 2.3075, "step": 408180 }, { "epoch": 0.71, "learning_rate": 1.4408284126856798e-05, "loss": 2.3565, "step": 408190 }, { "epoch": 0.71, "learning_rate": 1.440741218692997e-05, "loss": 2.3428, "step": 408200 }, { "epoch": 0.71, "learning_rate": 1.4406540247003142e-05, "loss": 2.2797, "step": 408210 }, { "epoch": 0.71, "learning_rate": 1.4405668307076317e-05, "loss": 2.2953, "step": 408220 }, { "epoch": 0.71, "learning_rate": 1.440479636714949e-05, "loss": 2.2863, "step": 408230 }, { "epoch": 0.71, "learning_rate": 1.4403924427222661e-05, "loss": 2.2384, "step": 408240 }, { "epoch": 0.71, "learning_rate": 1.4403052487295837e-05, "loss": 2.4241, "step": 408250 }, { "epoch": 0.71, "learning_rate": 1.4402180547369009e-05, "loss": 2.3176, "step": 408260 }, { "epoch": 0.71, "learning_rate": 1.4401308607442183e-05, "loss": 2.3128, "step": 408270 }, { "epoch": 0.71, "learning_rate": 1.4400436667515355e-05, "loss": 2.3669, "step": 408280 }, { "epoch": 0.71, "learning_rate": 1.439956472758853e-05, "loss": 2.3838, "step": 408290 }, { "epoch": 0.71, "learning_rate": 1.4398692787661702e-05, "loss": 2.2707, "step": 408300 }, { "epoch": 0.71, "learning_rate": 1.4397820847734874e-05, "loss": 2.3564, "step": 408310 }, { "epoch": 0.71, "learning_rate": 1.4396948907808046e-05, "loss": 2.3043, "step": 408320 }, { "epoch": 0.71, "learning_rate": 1.4396076967881222e-05, "loss": 2.3112, "step": 408330 }, { "epoch": 0.71, "learning_rate": 1.4395205027954396e-05, "loss": 2.2781, "step": 408340 }, { "epoch": 0.71, "learning_rate": 1.4394333088027568e-05, "loss": 2.4628, "step": 408350 }, { "epoch": 0.71, "learning_rate": 1.439346114810074e-05, "loss": 2.264, "step": 408360 }, { "epoch": 0.71, "learning_rate": 1.4392589208173915e-05, "loss": 2.2842, "step": 408370 }, { "epoch": 0.71, "learning_rate": 1.4391717268247087e-05, "loss": 2.2841, "step": 408380 }, { "epoch": 0.71, "learning_rate": 1.439084532832026e-05, "loss": 2.2837, "step": 408390 }, { "epoch": 0.71, "learning_rate": 1.4389973388393435e-05, "loss": 2.3412, "step": 408400 }, { "epoch": 0.71, "learning_rate": 1.4389101448466607e-05, "loss": 2.2453, "step": 408410 }, { "epoch": 0.71, "learning_rate": 1.438822950853978e-05, "loss": 2.4157, "step": 408420 }, { "epoch": 0.71, "learning_rate": 1.4387357568612953e-05, "loss": 2.3599, "step": 408430 }, { "epoch": 0.71, "learning_rate": 1.4386485628686128e-05, "loss": 2.3135, "step": 408440 }, { "epoch": 0.71, "learning_rate": 1.43856136887593e-05, "loss": 2.3133, "step": 408450 }, { "epoch": 0.71, "learning_rate": 1.4384741748832472e-05, "loss": 2.2692, "step": 408460 }, { "epoch": 0.71, "learning_rate": 1.4383869808905644e-05, "loss": 2.318, "step": 408470 }, { "epoch": 0.71, "learning_rate": 1.438299786897882e-05, "loss": 2.324, "step": 408480 }, { "epoch": 0.71, "learning_rate": 1.4382125929051992e-05, "loss": 2.4057, "step": 408490 }, { "epoch": 0.71, "learning_rate": 1.4381253989125166e-05, "loss": 2.3576, "step": 408500 }, { "epoch": 0.71, "learning_rate": 1.4380382049198341e-05, "loss": 2.1252, "step": 408510 }, { "epoch": 0.71, "learning_rate": 1.4379510109271513e-05, "loss": 2.2164, "step": 408520 }, { "epoch": 0.71, "learning_rate": 1.4378638169344685e-05, "loss": 2.3065, "step": 408530 }, { "epoch": 0.71, "learning_rate": 1.4377766229417857e-05, "loss": 2.2948, "step": 408540 }, { "epoch": 0.71, "learning_rate": 1.4376894289491033e-05, "loss": 2.3043, "step": 408550 }, { "epoch": 0.71, "learning_rate": 1.4376022349564205e-05, "loss": 2.2799, "step": 408560 }, { "epoch": 0.71, "learning_rate": 1.4375150409637377e-05, "loss": 2.2938, "step": 408570 }, { "epoch": 0.71, "learning_rate": 1.437427846971055e-05, "loss": 2.3348, "step": 408580 }, { "epoch": 0.71, "learning_rate": 1.4373406529783726e-05, "loss": 2.2504, "step": 408590 }, { "epoch": 0.71, "learning_rate": 1.4372534589856898e-05, "loss": 2.2351, "step": 408600 }, { "epoch": 0.71, "learning_rate": 1.437166264993007e-05, "loss": 2.2892, "step": 408610 }, { "epoch": 0.71, "learning_rate": 1.4370790710003243e-05, "loss": 2.2084, "step": 408620 }, { "epoch": 0.71, "learning_rate": 1.4369918770076418e-05, "loss": 2.1785, "step": 408630 }, { "epoch": 0.71, "learning_rate": 1.436904683014959e-05, "loss": 2.2998, "step": 408640 }, { "epoch": 0.71, "learning_rate": 1.4368174890222764e-05, "loss": 2.3574, "step": 408650 }, { "epoch": 0.71, "learning_rate": 1.4367302950295938e-05, "loss": 2.1762, "step": 408660 }, { "epoch": 0.71, "learning_rate": 1.4366431010369111e-05, "loss": 2.2407, "step": 408670 }, { "epoch": 0.71, "learning_rate": 1.4365559070442283e-05, "loss": 2.4483, "step": 408680 }, { "epoch": 0.71, "learning_rate": 1.4364687130515456e-05, "loss": 2.2409, "step": 408690 }, { "epoch": 0.71, "learning_rate": 1.4363815190588631e-05, "loss": 2.2121, "step": 408700 }, { "epoch": 0.71, "learning_rate": 1.4362943250661803e-05, "loss": 2.2524, "step": 408710 }, { "epoch": 0.71, "learning_rate": 1.4362071310734975e-05, "loss": 2.3783, "step": 408720 }, { "epoch": 0.71, "learning_rate": 1.4361199370808149e-05, "loss": 2.2969, "step": 408730 }, { "epoch": 0.71, "learning_rate": 1.4360327430881323e-05, "loss": 2.2141, "step": 408740 }, { "epoch": 0.71, "learning_rate": 1.4359455490954496e-05, "loss": 2.1993, "step": 408750 }, { "epoch": 0.71, "learning_rate": 1.4358583551027669e-05, "loss": 2.3092, "step": 408760 }, { "epoch": 0.71, "learning_rate": 1.4357711611100844e-05, "loss": 2.3733, "step": 408770 }, { "epoch": 0.71, "learning_rate": 1.4356839671174016e-05, "loss": 2.3076, "step": 408780 }, { "epoch": 0.71, "learning_rate": 1.4355967731247188e-05, "loss": 2.3512, "step": 408790 }, { "epoch": 0.71, "learning_rate": 1.435509579132036e-05, "loss": 2.2937, "step": 408800 }, { "epoch": 0.71, "learning_rate": 1.4354223851393536e-05, "loss": 2.348, "step": 408810 }, { "epoch": 0.71, "learning_rate": 1.435335191146671e-05, "loss": 2.2995, "step": 408820 }, { "epoch": 0.71, "learning_rate": 1.4352479971539882e-05, "loss": 2.2485, "step": 408830 }, { "epoch": 0.71, "learning_rate": 1.4351608031613054e-05, "loss": 2.2533, "step": 408840 }, { "epoch": 0.71, "learning_rate": 1.4350736091686229e-05, "loss": 2.2013, "step": 408850 }, { "epoch": 0.71, "learning_rate": 1.4349864151759401e-05, "loss": 2.324, "step": 408860 }, { "epoch": 0.71, "learning_rate": 1.4348992211832573e-05, "loss": 2.3637, "step": 408870 }, { "epoch": 0.71, "learning_rate": 1.4348120271905745e-05, "loss": 2.3654, "step": 408880 }, { "epoch": 0.71, "learning_rate": 1.434724833197892e-05, "loss": 2.2479, "step": 408890 }, { "epoch": 0.71, "learning_rate": 1.4346376392052095e-05, "loss": 2.3415, "step": 408900 }, { "epoch": 0.71, "learning_rate": 1.4345504452125267e-05, "loss": 2.3552, "step": 408910 }, { "epoch": 0.71, "learning_rate": 1.4344632512198442e-05, "loss": 2.4181, "step": 408920 }, { "epoch": 0.71, "learning_rate": 1.4343760572271614e-05, "loss": 2.372, "step": 408930 }, { "epoch": 0.71, "learning_rate": 1.4342888632344786e-05, "loss": 2.3413, "step": 408940 }, { "epoch": 0.71, "learning_rate": 1.4342016692417958e-05, "loss": 2.2577, "step": 408950 }, { "epoch": 0.71, "learning_rate": 1.4341144752491134e-05, "loss": 2.3983, "step": 408960 }, { "epoch": 0.71, "learning_rate": 1.4340272812564306e-05, "loss": 2.3052, "step": 408970 }, { "epoch": 0.71, "learning_rate": 1.433940087263748e-05, "loss": 2.2906, "step": 408980 }, { "epoch": 0.71, "learning_rate": 1.4338528932710652e-05, "loss": 2.2871, "step": 408990 }, { "epoch": 0.71, "learning_rate": 1.4337656992783827e-05, "loss": 2.1225, "step": 409000 }, { "epoch": 0.71, "learning_rate": 1.4336785052857e-05, "loss": 2.3252, "step": 409010 }, { "epoch": 0.71, "learning_rate": 1.4335913112930171e-05, "loss": 2.2685, "step": 409020 }, { "epoch": 0.71, "learning_rate": 1.4335041173003347e-05, "loss": 2.2406, "step": 409030 }, { "epoch": 0.71, "learning_rate": 1.4334169233076519e-05, "loss": 2.2536, "step": 409040 }, { "epoch": 0.71, "learning_rate": 1.4333297293149691e-05, "loss": 2.3156, "step": 409050 }, { "epoch": 0.71, "learning_rate": 1.4332425353222865e-05, "loss": 2.2555, "step": 409060 }, { "epoch": 0.71, "learning_rate": 1.433155341329604e-05, "loss": 2.2265, "step": 409070 }, { "epoch": 0.71, "learning_rate": 1.4330681473369212e-05, "loss": 2.2522, "step": 409080 }, { "epoch": 0.71, "learning_rate": 1.4329809533442384e-05, "loss": 2.2378, "step": 409090 }, { "epoch": 0.71, "learning_rate": 1.4328937593515556e-05, "loss": 2.2536, "step": 409100 }, { "epoch": 0.71, "learning_rate": 1.4328065653588732e-05, "loss": 2.1252, "step": 409110 }, { "epoch": 0.71, "learning_rate": 1.4327193713661904e-05, "loss": 2.3894, "step": 409120 }, { "epoch": 0.71, "learning_rate": 1.4326321773735078e-05, "loss": 2.4247, "step": 409130 }, { "epoch": 0.71, "learning_rate": 1.432544983380825e-05, "loss": 2.3062, "step": 409140 }, { "epoch": 0.71, "learning_rate": 1.4324577893881425e-05, "loss": 2.2832, "step": 409150 }, { "epoch": 0.71, "learning_rate": 1.4323705953954597e-05, "loss": 2.1436, "step": 409160 }, { "epoch": 0.71, "learning_rate": 1.432283401402777e-05, "loss": 2.3635, "step": 409170 }, { "epoch": 0.71, "learning_rate": 1.4321962074100945e-05, "loss": 2.2255, "step": 409180 }, { "epoch": 0.71, "learning_rate": 1.4321090134174117e-05, "loss": 2.3225, "step": 409190 }, { "epoch": 0.71, "learning_rate": 1.4320218194247289e-05, "loss": 2.2516, "step": 409200 }, { "epoch": 0.71, "learning_rate": 1.4319346254320463e-05, "loss": 2.2993, "step": 409210 }, { "epoch": 0.71, "learning_rate": 1.4318474314393637e-05, "loss": 2.2694, "step": 409220 }, { "epoch": 0.71, "learning_rate": 1.431760237446681e-05, "loss": 2.4361, "step": 409230 }, { "epoch": 0.71, "learning_rate": 1.4316730434539982e-05, "loss": 2.3495, "step": 409240 }, { "epoch": 0.71, "learning_rate": 1.4315858494613154e-05, "loss": 2.2524, "step": 409250 }, { "epoch": 0.71, "learning_rate": 1.431498655468633e-05, "loss": 2.2208, "step": 409260 }, { "epoch": 0.71, "learning_rate": 1.4314114614759502e-05, "loss": 2.3427, "step": 409270 }, { "epoch": 0.71, "learning_rate": 1.4313242674832674e-05, "loss": 2.345, "step": 409280 }, { "epoch": 0.71, "learning_rate": 1.4312370734905848e-05, "loss": 2.3288, "step": 409290 }, { "epoch": 0.71, "learning_rate": 1.4311498794979022e-05, "loss": 2.2919, "step": 409300 }, { "epoch": 0.71, "learning_rate": 1.4310626855052195e-05, "loss": 2.3329, "step": 409310 }, { "epoch": 0.71, "learning_rate": 1.4309754915125367e-05, "loss": 2.2208, "step": 409320 }, { "epoch": 0.71, "learning_rate": 1.4308882975198543e-05, "loss": 2.3314, "step": 409330 }, { "epoch": 0.71, "learning_rate": 1.4308011035271715e-05, "loss": 2.3461, "step": 409340 }, { "epoch": 0.71, "learning_rate": 1.4307139095344887e-05, "loss": 2.2917, "step": 409350 }, { "epoch": 0.71, "learning_rate": 1.430626715541806e-05, "loss": 2.2453, "step": 409360 }, { "epoch": 0.71, "learning_rate": 1.4305395215491235e-05, "loss": 2.3483, "step": 409370 }, { "epoch": 0.71, "learning_rate": 1.4304523275564408e-05, "loss": 2.2584, "step": 409380 }, { "epoch": 0.71, "learning_rate": 1.430365133563758e-05, "loss": 2.2354, "step": 409390 }, { "epoch": 0.71, "learning_rate": 1.4302779395710753e-05, "loss": 2.3285, "step": 409400 }, { "epoch": 0.71, "learning_rate": 1.4301907455783928e-05, "loss": 2.3826, "step": 409410 }, { "epoch": 0.71, "learning_rate": 1.43010355158571e-05, "loss": 2.1855, "step": 409420 }, { "epoch": 0.71, "learning_rate": 1.4300163575930272e-05, "loss": 2.3253, "step": 409430 }, { "epoch": 0.71, "learning_rate": 1.4299291636003448e-05, "loss": 2.3005, "step": 409440 }, { "epoch": 0.71, "learning_rate": 1.429841969607662e-05, "loss": 2.2126, "step": 409450 }, { "epoch": 0.71, "learning_rate": 1.4297547756149793e-05, "loss": 2.2641, "step": 409460 }, { "epoch": 0.71, "learning_rate": 1.4296675816222966e-05, "loss": 2.2584, "step": 409470 }, { "epoch": 0.71, "learning_rate": 1.4295803876296141e-05, "loss": 2.3062, "step": 409480 }, { "epoch": 0.71, "learning_rate": 1.4294931936369313e-05, "loss": 2.2829, "step": 409490 }, { "epoch": 0.71, "learning_rate": 1.4294059996442485e-05, "loss": 2.2646, "step": 409500 }, { "epoch": 0.71, "learning_rate": 1.4293188056515657e-05, "loss": 2.3772, "step": 409510 }, { "epoch": 0.71, "learning_rate": 1.4292316116588833e-05, "loss": 2.2987, "step": 409520 }, { "epoch": 0.71, "learning_rate": 1.4291444176662005e-05, "loss": 2.259, "step": 409530 }, { "epoch": 0.71, "learning_rate": 1.4290572236735179e-05, "loss": 2.353, "step": 409540 }, { "epoch": 0.71, "learning_rate": 1.428970029680835e-05, "loss": 2.2897, "step": 409550 }, { "epoch": 0.71, "learning_rate": 1.4288828356881526e-05, "loss": 2.2648, "step": 409560 }, { "epoch": 0.71, "learning_rate": 1.4287956416954698e-05, "loss": 2.2268, "step": 409570 }, { "epoch": 0.71, "learning_rate": 1.428708447702787e-05, "loss": 2.3063, "step": 409580 }, { "epoch": 0.71, "learning_rate": 1.4286212537101046e-05, "loss": 2.1523, "step": 409590 }, { "epoch": 0.71, "learning_rate": 1.4285340597174218e-05, "loss": 2.1455, "step": 409600 }, { "epoch": 0.71, "learning_rate": 1.4284468657247392e-05, "loss": 2.3609, "step": 409610 }, { "epoch": 0.71, "learning_rate": 1.4283596717320564e-05, "loss": 2.3014, "step": 409620 }, { "epoch": 0.71, "learning_rate": 1.4282724777393739e-05, "loss": 2.3922, "step": 409630 }, { "epoch": 0.71, "learning_rate": 1.4281852837466911e-05, "loss": 2.3175, "step": 409640 }, { "epoch": 0.71, "learning_rate": 1.4280980897540083e-05, "loss": 2.3396, "step": 409650 }, { "epoch": 0.71, "learning_rate": 1.4280108957613255e-05, "loss": 2.2448, "step": 409660 }, { "epoch": 0.71, "learning_rate": 1.427923701768643e-05, "loss": 2.3112, "step": 409670 }, { "epoch": 0.71, "learning_rate": 1.4278365077759603e-05, "loss": 2.2698, "step": 409680 }, { "epoch": 0.71, "learning_rate": 1.4277493137832777e-05, "loss": 2.3672, "step": 409690 }, { "epoch": 0.71, "learning_rate": 1.427662119790595e-05, "loss": 2.2177, "step": 409700 }, { "epoch": 0.71, "learning_rate": 1.4275749257979124e-05, "loss": 2.3918, "step": 409710 }, { "epoch": 0.71, "learning_rate": 1.4274877318052296e-05, "loss": 2.3946, "step": 409720 }, { "epoch": 0.71, "learning_rate": 1.4274005378125468e-05, "loss": 2.3199, "step": 409730 }, { "epoch": 0.71, "learning_rate": 1.4273133438198644e-05, "loss": 2.3151, "step": 409740 }, { "epoch": 0.71, "learning_rate": 1.4272261498271816e-05, "loss": 2.3199, "step": 409750 }, { "epoch": 0.71, "learning_rate": 1.4271389558344988e-05, "loss": 2.3063, "step": 409760 }, { "epoch": 0.71, "learning_rate": 1.4270517618418162e-05, "loss": 2.2657, "step": 409770 }, { "epoch": 0.71, "learning_rate": 1.4269645678491335e-05, "loss": 2.2742, "step": 409780 }, { "epoch": 0.71, "learning_rate": 1.426877373856451e-05, "loss": 2.2852, "step": 409790 }, { "epoch": 0.71, "learning_rate": 1.4267901798637681e-05, "loss": 2.3933, "step": 409800 }, { "epoch": 0.71, "learning_rate": 1.4267029858710853e-05, "loss": 2.3493, "step": 409810 }, { "epoch": 0.71, "learning_rate": 1.4266157918784029e-05, "loss": 2.2732, "step": 409820 }, { "epoch": 0.71, "learning_rate": 1.4265285978857201e-05, "loss": 2.2529, "step": 409830 }, { "epoch": 0.71, "learning_rate": 1.4264414038930373e-05, "loss": 2.41, "step": 409840 }, { "epoch": 0.71, "learning_rate": 1.4263542099003548e-05, "loss": 2.3889, "step": 409850 }, { "epoch": 0.71, "learning_rate": 1.4262670159076722e-05, "loss": 2.3161, "step": 409860 }, { "epoch": 0.71, "learning_rate": 1.4261798219149894e-05, "loss": 2.268, "step": 409870 }, { "epoch": 0.71, "learning_rate": 1.4260926279223066e-05, "loss": 2.2463, "step": 409880 }, { "epoch": 0.71, "learning_rate": 1.4260054339296242e-05, "loss": 2.4281, "step": 409890 }, { "epoch": 0.71, "learning_rate": 1.4259182399369414e-05, "loss": 2.3234, "step": 409900 }, { "epoch": 0.71, "learning_rate": 1.4258310459442586e-05, "loss": 2.2609, "step": 409910 }, { "epoch": 0.71, "learning_rate": 1.425743851951576e-05, "loss": 2.2702, "step": 409920 }, { "epoch": 0.71, "learning_rate": 1.4256566579588934e-05, "loss": 2.1751, "step": 409930 }, { "epoch": 0.71, "learning_rate": 1.4255694639662107e-05, "loss": 2.3381, "step": 409940 }, { "epoch": 0.71, "learning_rate": 1.425482269973528e-05, "loss": 2.3776, "step": 409950 }, { "epoch": 0.71, "learning_rate": 1.4253950759808455e-05, "loss": 2.2819, "step": 409960 }, { "epoch": 0.71, "learning_rate": 1.4253078819881627e-05, "loss": 2.225, "step": 409970 }, { "epoch": 0.71, "learning_rate": 1.4252206879954799e-05, "loss": 2.4418, "step": 409980 }, { "epoch": 0.71, "learning_rate": 1.4251334940027971e-05, "loss": 2.2392, "step": 409990 }, { "epoch": 0.71, "learning_rate": 1.4250463000101147e-05, "loss": 2.3815, "step": 410000 }, { "epoch": 0.72, "learning_rate": 1.4249591060174319e-05, "loss": 2.3014, "step": 410010 }, { "epoch": 0.72, "learning_rate": 1.4248719120247492e-05, "loss": 2.3152, "step": 410020 }, { "epoch": 0.72, "learning_rate": 1.4247847180320664e-05, "loss": 2.4168, "step": 410030 }, { "epoch": 0.72, "learning_rate": 1.424697524039384e-05, "loss": 2.2639, "step": 410040 }, { "epoch": 0.72, "learning_rate": 1.4246103300467012e-05, "loss": 2.2753, "step": 410050 }, { "epoch": 0.72, "learning_rate": 1.4245231360540184e-05, "loss": 2.2441, "step": 410060 }, { "epoch": 0.72, "learning_rate": 1.4244359420613356e-05, "loss": 2.2051, "step": 410070 }, { "epoch": 0.72, "learning_rate": 1.4243487480686532e-05, "loss": 2.2733, "step": 410080 }, { "epoch": 0.72, "learning_rate": 1.4242615540759704e-05, "loss": 2.3304, "step": 410090 }, { "epoch": 0.72, "learning_rate": 1.4241743600832877e-05, "loss": 2.357, "step": 410100 }, { "epoch": 0.72, "learning_rate": 1.4240871660906053e-05, "loss": 2.2929, "step": 410110 }, { "epoch": 0.72, "learning_rate": 1.4239999720979225e-05, "loss": 2.2572, "step": 410120 }, { "epoch": 0.72, "learning_rate": 1.4239127781052397e-05, "loss": 2.3366, "step": 410130 }, { "epoch": 0.72, "learning_rate": 1.423825584112557e-05, "loss": 2.4477, "step": 410140 }, { "epoch": 0.72, "learning_rate": 1.4237383901198745e-05, "loss": 2.1976, "step": 410150 }, { "epoch": 0.72, "learning_rate": 1.4236511961271917e-05, "loss": 2.3262, "step": 410160 }, { "epoch": 0.72, "learning_rate": 1.423564002134509e-05, "loss": 2.2981, "step": 410170 }, { "epoch": 0.72, "learning_rate": 1.4234768081418263e-05, "loss": 2.1583, "step": 410180 }, { "epoch": 0.72, "learning_rate": 1.4233896141491438e-05, "loss": 2.3859, "step": 410190 }, { "epoch": 0.72, "learning_rate": 1.423302420156461e-05, "loss": 2.1584, "step": 410200 }, { "epoch": 0.72, "learning_rate": 1.4232152261637782e-05, "loss": 2.3434, "step": 410210 }, { "epoch": 0.72, "learning_rate": 1.4231280321710954e-05, "loss": 2.3099, "step": 410220 }, { "epoch": 0.72, "learning_rate": 1.423040838178413e-05, "loss": 2.3484, "step": 410230 }, { "epoch": 0.72, "learning_rate": 1.4229536441857302e-05, "loss": 2.2554, "step": 410240 }, { "epoch": 0.72, "learning_rate": 1.4228664501930476e-05, "loss": 2.2434, "step": 410250 }, { "epoch": 0.72, "learning_rate": 1.422779256200365e-05, "loss": 2.3826, "step": 410260 }, { "epoch": 0.72, "learning_rate": 1.4226920622076823e-05, "loss": 2.3317, "step": 410270 }, { "epoch": 0.72, "learning_rate": 1.4226048682149995e-05, "loss": 2.2783, "step": 410280 }, { "epoch": 0.72, "learning_rate": 1.4225176742223167e-05, "loss": 2.3188, "step": 410290 }, { "epoch": 0.72, "learning_rate": 1.4224304802296343e-05, "loss": 2.3342, "step": 410300 }, { "epoch": 0.72, "learning_rate": 1.4223432862369515e-05, "loss": 2.3644, "step": 410310 }, { "epoch": 0.72, "learning_rate": 1.4222560922442687e-05, "loss": 2.3331, "step": 410320 }, { "epoch": 0.72, "learning_rate": 1.422168898251586e-05, "loss": 2.3564, "step": 410330 }, { "epoch": 0.72, "learning_rate": 1.4220817042589036e-05, "loss": 2.2653, "step": 410340 }, { "epoch": 0.72, "learning_rate": 1.4219945102662208e-05, "loss": 2.3658, "step": 410350 }, { "epoch": 0.72, "learning_rate": 1.421907316273538e-05, "loss": 2.252, "step": 410360 }, { "epoch": 0.72, "learning_rate": 1.4218201222808556e-05, "loss": 2.3111, "step": 410370 }, { "epoch": 0.72, "learning_rate": 1.4217329282881728e-05, "loss": 2.2692, "step": 410380 }, { "epoch": 0.72, "learning_rate": 1.42164573429549e-05, "loss": 2.2606, "step": 410390 }, { "epoch": 0.72, "learning_rate": 1.4215585403028072e-05, "loss": 2.3221, "step": 410400 }, { "epoch": 0.72, "learning_rate": 1.4214713463101247e-05, "loss": 2.4038, "step": 410410 }, { "epoch": 0.72, "learning_rate": 1.4213841523174421e-05, "loss": 2.3396, "step": 410420 }, { "epoch": 0.72, "learning_rate": 1.4212969583247593e-05, "loss": 2.3541, "step": 410430 }, { "epoch": 0.72, "learning_rate": 1.4212097643320765e-05, "loss": 2.3612, "step": 410440 }, { "epoch": 0.72, "learning_rate": 1.421122570339394e-05, "loss": 2.2785, "step": 410450 }, { "epoch": 0.72, "learning_rate": 1.4210353763467113e-05, "loss": 2.2564, "step": 410460 }, { "epoch": 0.72, "learning_rate": 1.4209481823540285e-05, "loss": 2.313, "step": 410470 }, { "epoch": 0.72, "learning_rate": 1.4208609883613459e-05, "loss": 2.3403, "step": 410480 }, { "epoch": 0.72, "learning_rate": 1.4207737943686632e-05, "loss": 2.2731, "step": 410490 }, { "epoch": 0.72, "learning_rate": 1.4206866003759806e-05, "loss": 2.3236, "step": 410500 }, { "epoch": 0.72, "learning_rate": 1.4205994063832978e-05, "loss": 2.395, "step": 410510 }, { "epoch": 0.72, "learning_rate": 1.4205122123906154e-05, "loss": 2.3283, "step": 410520 }, { "epoch": 0.72, "learning_rate": 1.4204250183979326e-05, "loss": 2.3497, "step": 410530 }, { "epoch": 0.72, "learning_rate": 1.4203378244052498e-05, "loss": 2.3239, "step": 410540 }, { "epoch": 0.72, "learning_rate": 1.420250630412567e-05, "loss": 2.2123, "step": 410550 }, { "epoch": 0.72, "learning_rate": 1.4201634364198845e-05, "loss": 2.2706, "step": 410560 }, { "epoch": 0.72, "learning_rate": 1.4200762424272018e-05, "loss": 2.3515, "step": 410570 }, { "epoch": 0.72, "learning_rate": 1.4199890484345191e-05, "loss": 2.326, "step": 410580 }, { "epoch": 0.72, "learning_rate": 1.4199018544418363e-05, "loss": 2.3037, "step": 410590 }, { "epoch": 0.72, "learning_rate": 1.4198146604491539e-05, "loss": 2.397, "step": 410600 }, { "epoch": 0.72, "learning_rate": 1.4197274664564711e-05, "loss": 2.3575, "step": 410610 }, { "epoch": 0.72, "learning_rate": 1.4196402724637883e-05, "loss": 2.1267, "step": 410620 }, { "epoch": 0.72, "learning_rate": 1.4195530784711058e-05, "loss": 2.2598, "step": 410630 }, { "epoch": 0.72, "learning_rate": 1.419465884478423e-05, "loss": 2.3186, "step": 410640 }, { "epoch": 0.72, "learning_rate": 1.4193786904857404e-05, "loss": 2.2474, "step": 410650 }, { "epoch": 0.72, "learning_rate": 1.4192914964930576e-05, "loss": 2.2446, "step": 410660 }, { "epoch": 0.72, "learning_rate": 1.4192043025003752e-05, "loss": 2.4465, "step": 410670 }, { "epoch": 0.72, "learning_rate": 1.4191171085076924e-05, "loss": 2.337, "step": 410680 }, { "epoch": 0.72, "learning_rate": 1.4190299145150096e-05, "loss": 2.3668, "step": 410690 }, { "epoch": 0.72, "learning_rate": 1.4189427205223268e-05, "loss": 2.303, "step": 410700 }, { "epoch": 0.72, "learning_rate": 1.4188555265296444e-05, "loss": 2.2933, "step": 410710 }, { "epoch": 0.72, "learning_rate": 1.4187683325369616e-05, "loss": 2.2902, "step": 410720 }, { "epoch": 0.72, "learning_rate": 1.418681138544279e-05, "loss": 2.2665, "step": 410730 }, { "epoch": 0.72, "learning_rate": 1.4185939445515961e-05, "loss": 2.1693, "step": 410740 }, { "epoch": 0.72, "learning_rate": 1.4185067505589137e-05, "loss": 2.3445, "step": 410750 }, { "epoch": 0.72, "learning_rate": 1.4184195565662309e-05, "loss": 2.1984, "step": 410760 }, { "epoch": 0.72, "learning_rate": 1.4183323625735481e-05, "loss": 2.2971, "step": 410770 }, { "epoch": 0.72, "learning_rate": 1.4182451685808657e-05, "loss": 2.3154, "step": 410780 }, { "epoch": 0.72, "learning_rate": 1.4181579745881829e-05, "loss": 2.3419, "step": 410790 }, { "epoch": 0.72, "learning_rate": 1.4180707805955e-05, "loss": 2.2443, "step": 410800 }, { "epoch": 0.72, "learning_rate": 1.4179835866028174e-05, "loss": 2.368, "step": 410810 }, { "epoch": 0.72, "learning_rate": 1.4178963926101348e-05, "loss": 2.3034, "step": 410820 }, { "epoch": 0.72, "learning_rate": 1.4178091986174522e-05, "loss": 2.3355, "step": 410830 }, { "epoch": 0.72, "learning_rate": 1.4177220046247694e-05, "loss": 2.2877, "step": 410840 }, { "epoch": 0.72, "learning_rate": 1.4176348106320866e-05, "loss": 2.2348, "step": 410850 }, { "epoch": 0.72, "learning_rate": 1.4175476166394042e-05, "loss": 2.3338, "step": 410860 }, { "epoch": 0.72, "learning_rate": 1.4174604226467214e-05, "loss": 2.2395, "step": 410870 }, { "epoch": 0.72, "learning_rate": 1.4173732286540386e-05, "loss": 2.1864, "step": 410880 }, { "epoch": 0.72, "learning_rate": 1.4172860346613561e-05, "loss": 2.2465, "step": 410890 }, { "epoch": 0.72, "learning_rate": 1.4171988406686735e-05, "loss": 2.2038, "step": 410900 }, { "epoch": 0.72, "learning_rate": 1.4171116466759907e-05, "loss": 2.3138, "step": 410910 }, { "epoch": 0.72, "learning_rate": 1.417024452683308e-05, "loss": 2.1939, "step": 410920 }, { "epoch": 0.72, "learning_rate": 1.4169372586906255e-05, "loss": 2.2879, "step": 410930 }, { "epoch": 0.72, "learning_rate": 1.4168500646979427e-05, "loss": 2.1923, "step": 410940 }, { "epoch": 0.72, "learning_rate": 1.4167628707052599e-05, "loss": 2.3466, "step": 410950 }, { "epoch": 0.72, "learning_rate": 1.4166756767125773e-05, "loss": 2.2715, "step": 410960 }, { "epoch": 0.72, "learning_rate": 1.4165884827198946e-05, "loss": 2.2879, "step": 410970 }, { "epoch": 0.72, "learning_rate": 1.416501288727212e-05, "loss": 2.2736, "step": 410980 }, { "epoch": 0.72, "learning_rate": 1.4164140947345292e-05, "loss": 2.2953, "step": 410990 }, { "epoch": 0.72, "learning_rate": 1.4163269007418464e-05, "loss": 2.3679, "step": 411000 }, { "epoch": 0.72, "learning_rate": 1.416239706749164e-05, "loss": 2.37, "step": 411010 }, { "epoch": 0.72, "learning_rate": 1.4161525127564812e-05, "loss": 2.2003, "step": 411020 }, { "epoch": 0.72, "learning_rate": 1.4160653187637984e-05, "loss": 2.2488, "step": 411030 }, { "epoch": 0.72, "learning_rate": 1.415978124771116e-05, "loss": 2.3053, "step": 411040 }, { "epoch": 0.72, "learning_rate": 1.4158909307784331e-05, "loss": 2.2106, "step": 411050 }, { "epoch": 0.72, "learning_rate": 1.4158037367857505e-05, "loss": 2.2077, "step": 411060 }, { "epoch": 0.72, "learning_rate": 1.4157165427930677e-05, "loss": 2.2859, "step": 411070 }, { "epoch": 0.72, "learning_rate": 1.4156293488003853e-05, "loss": 2.2369, "step": 411080 }, { "epoch": 0.72, "learning_rate": 1.4155421548077025e-05, "loss": 2.2612, "step": 411090 }, { "epoch": 0.72, "learning_rate": 1.4154549608150197e-05, "loss": 2.3571, "step": 411100 }, { "epoch": 0.72, "learning_rate": 1.4153677668223369e-05, "loss": 2.3135, "step": 411110 }, { "epoch": 0.72, "learning_rate": 1.4152805728296544e-05, "loss": 2.2471, "step": 411120 }, { "epoch": 0.72, "learning_rate": 1.4151933788369716e-05, "loss": 2.2927, "step": 411130 }, { "epoch": 0.72, "learning_rate": 1.415106184844289e-05, "loss": 2.2429, "step": 411140 }, { "epoch": 0.72, "learning_rate": 1.4150189908516062e-05, "loss": 2.2638, "step": 411150 }, { "epoch": 0.72, "learning_rate": 1.4149317968589238e-05, "loss": 2.2694, "step": 411160 }, { "epoch": 0.72, "learning_rate": 1.414844602866241e-05, "loss": 2.2855, "step": 411170 }, { "epoch": 0.72, "learning_rate": 1.4147574088735582e-05, "loss": 2.1992, "step": 411180 }, { "epoch": 0.72, "learning_rate": 1.4146702148808757e-05, "loss": 2.3424, "step": 411190 }, { "epoch": 0.72, "learning_rate": 1.414583020888193e-05, "loss": 2.3068, "step": 411200 }, { "epoch": 0.72, "learning_rate": 1.4144958268955103e-05, "loss": 2.3015, "step": 411210 }, { "epoch": 0.72, "learning_rate": 1.4144086329028275e-05, "loss": 2.3471, "step": 411220 }, { "epoch": 0.72, "learning_rate": 1.414321438910145e-05, "loss": 2.3288, "step": 411230 }, { "epoch": 0.72, "learning_rate": 1.4142342449174623e-05, "loss": 2.2587, "step": 411240 }, { "epoch": 0.72, "learning_rate": 1.4141470509247795e-05, "loss": 2.2313, "step": 411250 }, { "epoch": 0.72, "learning_rate": 1.4140598569320967e-05, "loss": 2.3767, "step": 411260 }, { "epoch": 0.72, "learning_rate": 1.4139726629394142e-05, "loss": 2.4077, "step": 411270 }, { "epoch": 0.72, "learning_rate": 1.4138854689467315e-05, "loss": 2.3059, "step": 411280 }, { "epoch": 0.72, "learning_rate": 1.4137982749540488e-05, "loss": 2.1935, "step": 411290 }, { "epoch": 0.72, "learning_rate": 1.4137110809613662e-05, "loss": 2.1945, "step": 411300 }, { "epoch": 0.72, "learning_rate": 1.4136238869686836e-05, "loss": 2.2649, "step": 411310 }, { "epoch": 0.72, "learning_rate": 1.4135366929760008e-05, "loss": 2.3038, "step": 411320 }, { "epoch": 0.72, "learning_rate": 1.413449498983318e-05, "loss": 2.283, "step": 411330 }, { "epoch": 0.72, "learning_rate": 1.4133623049906355e-05, "loss": 2.2982, "step": 411340 }, { "epoch": 0.72, "learning_rate": 1.4132751109979528e-05, "loss": 2.2654, "step": 411350 }, { "epoch": 0.72, "learning_rate": 1.41318791700527e-05, "loss": 2.3029, "step": 411360 }, { "epoch": 0.72, "learning_rate": 1.4131007230125873e-05, "loss": 2.3711, "step": 411370 }, { "epoch": 0.72, "learning_rate": 1.4130135290199049e-05, "loss": 2.2894, "step": 411380 }, { "epoch": 0.72, "learning_rate": 1.4129263350272221e-05, "loss": 2.2583, "step": 411390 }, { "epoch": 0.72, "learning_rate": 1.4128391410345393e-05, "loss": 2.2525, "step": 411400 }, { "epoch": 0.72, "learning_rate": 1.4127519470418565e-05, "loss": 2.2661, "step": 411410 }, { "epoch": 0.72, "learning_rate": 1.412664753049174e-05, "loss": 2.3401, "step": 411420 }, { "epoch": 0.72, "learning_rate": 1.4125775590564913e-05, "loss": 2.3056, "step": 411430 }, { "epoch": 0.72, "learning_rate": 1.4124903650638085e-05, "loss": 2.2859, "step": 411440 }, { "epoch": 0.72, "learning_rate": 1.412403171071126e-05, "loss": 2.427, "step": 411450 }, { "epoch": 0.72, "learning_rate": 1.4123159770784434e-05, "loss": 2.2951, "step": 411460 }, { "epoch": 0.72, "learning_rate": 1.4122287830857606e-05, "loss": 2.2207, "step": 411470 }, { "epoch": 0.72, "learning_rate": 1.4121415890930778e-05, "loss": 2.2846, "step": 411480 }, { "epoch": 0.72, "learning_rate": 1.4120543951003954e-05, "loss": 2.4013, "step": 411490 }, { "epoch": 0.72, "learning_rate": 1.4119672011077126e-05, "loss": 2.2701, "step": 411500 }, { "epoch": 0.72, "learning_rate": 1.4118800071150298e-05, "loss": 2.4111, "step": 411510 }, { "epoch": 0.72, "learning_rate": 1.4117928131223471e-05, "loss": 2.2296, "step": 411520 }, { "epoch": 0.72, "learning_rate": 1.4117056191296645e-05, "loss": 2.3165, "step": 411530 }, { "epoch": 0.72, "learning_rate": 1.4116184251369819e-05, "loss": 2.2996, "step": 411540 }, { "epoch": 0.72, "learning_rate": 1.4115312311442991e-05, "loss": 2.2728, "step": 411550 }, { "epoch": 0.72, "learning_rate": 1.4114440371516167e-05, "loss": 2.345, "step": 411560 }, { "epoch": 0.72, "learning_rate": 1.4113568431589339e-05, "loss": 2.2952, "step": 411570 }, { "epoch": 0.72, "learning_rate": 1.411269649166251e-05, "loss": 2.3407, "step": 411580 }, { "epoch": 0.72, "learning_rate": 1.4111824551735683e-05, "loss": 2.3325, "step": 411590 }, { "epoch": 0.72, "learning_rate": 1.4110952611808858e-05, "loss": 2.3098, "step": 411600 }, { "epoch": 0.72, "learning_rate": 1.411008067188203e-05, "loss": 2.2148, "step": 411610 }, { "epoch": 0.72, "learning_rate": 1.4109208731955204e-05, "loss": 2.3238, "step": 411620 }, { "epoch": 0.72, "learning_rate": 1.4108336792028376e-05, "loss": 2.4254, "step": 411630 }, { "epoch": 0.72, "learning_rate": 1.4107464852101552e-05, "loss": 2.2651, "step": 411640 }, { "epoch": 0.72, "learning_rate": 1.4106592912174724e-05, "loss": 2.283, "step": 411650 }, { "epoch": 0.72, "learning_rate": 1.4105720972247896e-05, "loss": 2.3913, "step": 411660 }, { "epoch": 0.72, "learning_rate": 1.4104849032321068e-05, "loss": 2.1865, "step": 411670 }, { "epoch": 0.72, "learning_rate": 1.4103977092394243e-05, "loss": 2.309, "step": 411680 }, { "epoch": 0.72, "learning_rate": 1.4103105152467417e-05, "loss": 2.2547, "step": 411690 }, { "epoch": 0.72, "learning_rate": 1.410223321254059e-05, "loss": 2.3469, "step": 411700 }, { "epoch": 0.72, "learning_rate": 1.4101361272613765e-05, "loss": 2.3642, "step": 411710 }, { "epoch": 0.72, "learning_rate": 1.4100489332686937e-05, "loss": 2.215, "step": 411720 }, { "epoch": 0.72, "learning_rate": 1.4099617392760109e-05, "loss": 2.2612, "step": 411730 }, { "epoch": 0.72, "learning_rate": 1.4098745452833281e-05, "loss": 2.1988, "step": 411740 }, { "epoch": 0.72, "learning_rate": 1.4097873512906456e-05, "loss": 2.2863, "step": 411750 }, { "epoch": 0.72, "learning_rate": 1.4097001572979628e-05, "loss": 2.2704, "step": 411760 }, { "epoch": 0.72, "learning_rate": 1.4096129633052802e-05, "loss": 2.3557, "step": 411770 }, { "epoch": 0.72, "learning_rate": 1.4095257693125974e-05, "loss": 2.2288, "step": 411780 }, { "epoch": 0.72, "learning_rate": 1.409438575319915e-05, "loss": 2.2656, "step": 411790 }, { "epoch": 0.72, "learning_rate": 1.4093513813272322e-05, "loss": 2.3459, "step": 411800 }, { "epoch": 0.72, "learning_rate": 1.4092641873345494e-05, "loss": 2.1948, "step": 411810 }, { "epoch": 0.72, "learning_rate": 1.409176993341867e-05, "loss": 2.3969, "step": 411820 }, { "epoch": 0.72, "learning_rate": 1.4090897993491841e-05, "loss": 2.2622, "step": 411830 }, { "epoch": 0.72, "learning_rate": 1.4090026053565013e-05, "loss": 2.3233, "step": 411840 }, { "epoch": 0.72, "learning_rate": 1.4089154113638187e-05, "loss": 2.2456, "step": 411850 }, { "epoch": 0.72, "learning_rate": 1.4088282173711361e-05, "loss": 2.3021, "step": 411860 }, { "epoch": 0.72, "learning_rate": 1.4087410233784535e-05, "loss": 2.2741, "step": 411870 }, { "epoch": 0.72, "learning_rate": 1.4086538293857707e-05, "loss": 2.1965, "step": 411880 }, { "epoch": 0.72, "learning_rate": 1.4085666353930879e-05, "loss": 2.3674, "step": 411890 }, { "epoch": 0.72, "learning_rate": 1.4084794414004054e-05, "loss": 2.2483, "step": 411900 }, { "epoch": 0.72, "learning_rate": 1.4083922474077226e-05, "loss": 2.219, "step": 411910 }, { "epoch": 0.72, "learning_rate": 1.4083050534150399e-05, "loss": 2.313, "step": 411920 }, { "epoch": 0.72, "learning_rate": 1.4082178594223572e-05, "loss": 2.2417, "step": 411930 }, { "epoch": 0.72, "learning_rate": 1.4081306654296748e-05, "loss": 2.3373, "step": 411940 }, { "epoch": 0.72, "learning_rate": 1.408043471436992e-05, "loss": 2.365, "step": 411950 }, { "epoch": 0.72, "learning_rate": 1.4079562774443092e-05, "loss": 2.3641, "step": 411960 }, { "epoch": 0.72, "learning_rate": 1.4078690834516267e-05, "loss": 2.2961, "step": 411970 }, { "epoch": 0.72, "learning_rate": 1.407781889458944e-05, "loss": 2.3343, "step": 411980 }, { "epoch": 0.72, "learning_rate": 1.4076946954662612e-05, "loss": 2.267, "step": 411990 }, { "epoch": 0.72, "learning_rate": 1.4076075014735785e-05, "loss": 2.1972, "step": 412000 }, { "epoch": 0.72, "learning_rate": 1.4075203074808959e-05, "loss": 2.2664, "step": 412010 }, { "epoch": 0.72, "learning_rate": 1.4074331134882133e-05, "loss": 2.3482, "step": 412020 }, { "epoch": 0.72, "learning_rate": 1.4073459194955305e-05, "loss": 2.2937, "step": 412030 }, { "epoch": 0.72, "learning_rate": 1.4072587255028477e-05, "loss": 2.4094, "step": 412040 }, { "epoch": 0.72, "learning_rate": 1.4071715315101652e-05, "loss": 2.279, "step": 412050 }, { "epoch": 0.72, "learning_rate": 1.4070843375174825e-05, "loss": 2.3856, "step": 412060 }, { "epoch": 0.72, "learning_rate": 1.4069971435247997e-05, "loss": 2.2145, "step": 412070 }, { "epoch": 0.72, "learning_rate": 1.406909949532117e-05, "loss": 2.2984, "step": 412080 }, { "epoch": 0.72, "learning_rate": 1.4068227555394344e-05, "loss": 2.3559, "step": 412090 }, { "epoch": 0.72, "learning_rate": 1.4067355615467518e-05, "loss": 2.4158, "step": 412100 }, { "epoch": 0.72, "learning_rate": 1.406648367554069e-05, "loss": 2.3435, "step": 412110 }, { "epoch": 0.72, "learning_rate": 1.4065611735613865e-05, "loss": 2.2828, "step": 412120 }, { "epoch": 0.72, "learning_rate": 1.4064739795687038e-05, "loss": 2.3059, "step": 412130 }, { "epoch": 0.72, "learning_rate": 1.406386785576021e-05, "loss": 2.3188, "step": 412140 }, { "epoch": 0.72, "learning_rate": 1.4062995915833382e-05, "loss": 2.42, "step": 412150 }, { "epoch": 0.72, "learning_rate": 1.4062123975906557e-05, "loss": 2.364, "step": 412160 }, { "epoch": 0.72, "learning_rate": 1.406125203597973e-05, "loss": 2.3518, "step": 412170 }, { "epoch": 0.72, "learning_rate": 1.4060380096052903e-05, "loss": 2.2879, "step": 412180 }, { "epoch": 0.72, "learning_rate": 1.4059508156126075e-05, "loss": 2.3535, "step": 412190 }, { "epoch": 0.72, "learning_rate": 1.405863621619925e-05, "loss": 2.3537, "step": 412200 }, { "epoch": 0.72, "learning_rate": 1.4057764276272423e-05, "loss": 2.3015, "step": 412210 }, { "epoch": 0.72, "learning_rate": 1.4056892336345595e-05, "loss": 2.3915, "step": 412220 }, { "epoch": 0.72, "learning_rate": 1.405602039641877e-05, "loss": 2.1822, "step": 412230 }, { "epoch": 0.72, "learning_rate": 1.4055148456491942e-05, "loss": 2.277, "step": 412240 }, { "epoch": 0.72, "learning_rate": 1.4054276516565116e-05, "loss": 2.2915, "step": 412250 }, { "epoch": 0.72, "learning_rate": 1.4053404576638288e-05, "loss": 2.1519, "step": 412260 }, { "epoch": 0.72, "learning_rate": 1.4052532636711464e-05, "loss": 2.3618, "step": 412270 }, { "epoch": 0.72, "learning_rate": 1.4051660696784636e-05, "loss": 2.2291, "step": 412280 }, { "epoch": 0.72, "learning_rate": 1.4050788756857808e-05, "loss": 2.2488, "step": 412290 }, { "epoch": 0.72, "learning_rate": 1.404991681693098e-05, "loss": 2.2491, "step": 412300 }, { "epoch": 0.72, "learning_rate": 1.4049044877004155e-05, "loss": 2.3874, "step": 412310 }, { "epoch": 0.72, "learning_rate": 1.4048172937077327e-05, "loss": 2.3904, "step": 412320 }, { "epoch": 0.72, "learning_rate": 1.4047300997150501e-05, "loss": 2.3105, "step": 412330 }, { "epoch": 0.72, "learning_rate": 1.4046429057223673e-05, "loss": 2.2731, "step": 412340 }, { "epoch": 0.72, "learning_rate": 1.4045557117296849e-05, "loss": 2.3477, "step": 412350 }, { "epoch": 0.72, "learning_rate": 1.404468517737002e-05, "loss": 2.3943, "step": 412360 }, { "epoch": 0.72, "learning_rate": 1.4043813237443193e-05, "loss": 2.223, "step": 412370 }, { "epoch": 0.72, "learning_rate": 1.4042941297516368e-05, "loss": 2.25, "step": 412380 }, { "epoch": 0.72, "learning_rate": 1.404206935758954e-05, "loss": 2.3839, "step": 412390 }, { "epoch": 0.72, "learning_rate": 1.4041197417662712e-05, "loss": 2.4107, "step": 412400 }, { "epoch": 0.72, "learning_rate": 1.4040325477735886e-05, "loss": 2.2539, "step": 412410 }, { "epoch": 0.72, "learning_rate": 1.4039453537809062e-05, "loss": 2.3523, "step": 412420 }, { "epoch": 0.72, "learning_rate": 1.4038581597882234e-05, "loss": 2.3442, "step": 412430 }, { "epoch": 0.72, "learning_rate": 1.4037709657955406e-05, "loss": 2.3334, "step": 412440 }, { "epoch": 0.72, "learning_rate": 1.4036837718028578e-05, "loss": 2.2176, "step": 412450 }, { "epoch": 0.72, "learning_rate": 1.4035965778101753e-05, "loss": 2.2637, "step": 412460 }, { "epoch": 0.72, "learning_rate": 1.4035093838174925e-05, "loss": 2.2419, "step": 412470 }, { "epoch": 0.72, "learning_rate": 1.4034221898248097e-05, "loss": 2.2325, "step": 412480 }, { "epoch": 0.72, "learning_rate": 1.4033349958321273e-05, "loss": 2.3481, "step": 412490 }, { "epoch": 0.72, "learning_rate": 1.4032478018394447e-05, "loss": 2.3503, "step": 412500 }, { "epoch": 0.72, "learning_rate": 1.4031606078467619e-05, "loss": 2.2608, "step": 412510 }, { "epoch": 0.72, "learning_rate": 1.4030734138540791e-05, "loss": 2.2371, "step": 412520 }, { "epoch": 0.72, "learning_rate": 1.4029862198613966e-05, "loss": 2.2422, "step": 412530 }, { "epoch": 0.72, "learning_rate": 1.4028990258687138e-05, "loss": 2.1695, "step": 412540 }, { "epoch": 0.72, "learning_rate": 1.402811831876031e-05, "loss": 2.3628, "step": 412550 }, { "epoch": 0.72, "learning_rate": 1.4027246378833484e-05, "loss": 2.2547, "step": 412560 }, { "epoch": 0.72, "learning_rate": 1.4026374438906658e-05, "loss": 2.2338, "step": 412570 }, { "epoch": 0.72, "learning_rate": 1.4025502498979832e-05, "loss": 2.3372, "step": 412580 }, { "epoch": 0.72, "learning_rate": 1.4024630559053004e-05, "loss": 2.3338, "step": 412590 }, { "epoch": 0.72, "learning_rate": 1.4023758619126176e-05, "loss": 2.292, "step": 412600 }, { "epoch": 0.72, "learning_rate": 1.4022886679199351e-05, "loss": 2.1934, "step": 412610 }, { "epoch": 0.72, "learning_rate": 1.4022014739272523e-05, "loss": 2.3415, "step": 412620 }, { "epoch": 0.72, "learning_rate": 1.4021142799345696e-05, "loss": 2.4619, "step": 412630 }, { "epoch": 0.72, "learning_rate": 1.4020270859418871e-05, "loss": 2.2732, "step": 412640 }, { "epoch": 0.72, "learning_rate": 1.4019398919492043e-05, "loss": 2.3118, "step": 412650 }, { "epoch": 0.72, "learning_rate": 1.4018526979565217e-05, "loss": 2.3868, "step": 412660 }, { "epoch": 0.72, "learning_rate": 1.4017655039638389e-05, "loss": 2.3708, "step": 412670 }, { "epoch": 0.72, "learning_rate": 1.4016783099711564e-05, "loss": 2.2847, "step": 412680 }, { "epoch": 0.72, "learning_rate": 1.4015911159784736e-05, "loss": 2.1828, "step": 412690 }, { "epoch": 0.72, "learning_rate": 1.4015039219857909e-05, "loss": 2.4773, "step": 412700 }, { "epoch": 0.72, "learning_rate": 1.401416727993108e-05, "loss": 2.3921, "step": 412710 }, { "epoch": 0.72, "learning_rate": 1.4013295340004256e-05, "loss": 2.1711, "step": 412720 }, { "epoch": 0.72, "learning_rate": 1.401242340007743e-05, "loss": 2.2785, "step": 412730 }, { "epoch": 0.72, "learning_rate": 1.4011551460150602e-05, "loss": 2.3721, "step": 412740 }, { "epoch": 0.72, "learning_rate": 1.4010679520223774e-05, "loss": 2.2685, "step": 412750 }, { "epoch": 0.72, "learning_rate": 1.400980758029695e-05, "loss": 2.36, "step": 412760 }, { "epoch": 0.72, "learning_rate": 1.4008935640370122e-05, "loss": 2.3122, "step": 412770 }, { "epoch": 0.72, "learning_rate": 1.4008063700443294e-05, "loss": 2.2705, "step": 412780 }, { "epoch": 0.72, "learning_rate": 1.4007191760516469e-05, "loss": 2.3748, "step": 412790 }, { "epoch": 0.72, "learning_rate": 1.4006319820589641e-05, "loss": 2.4002, "step": 412800 }, { "epoch": 0.72, "learning_rate": 1.4005447880662815e-05, "loss": 2.2831, "step": 412810 }, { "epoch": 0.72, "learning_rate": 1.4004575940735987e-05, "loss": 2.2681, "step": 412820 }, { "epoch": 0.72, "learning_rate": 1.4003704000809162e-05, "loss": 2.3096, "step": 412830 }, { "epoch": 0.72, "learning_rate": 1.4002832060882335e-05, "loss": 2.2949, "step": 412840 }, { "epoch": 0.72, "learning_rate": 1.4001960120955507e-05, "loss": 2.2591, "step": 412850 }, { "epoch": 0.72, "learning_rate": 1.4001088181028679e-05, "loss": 2.278, "step": 412860 }, { "epoch": 0.72, "learning_rate": 1.4000216241101854e-05, "loss": 2.2874, "step": 412870 }, { "epoch": 0.72, "learning_rate": 1.3999344301175026e-05, "loss": 2.3639, "step": 412880 }, { "epoch": 0.72, "learning_rate": 1.39984723612482e-05, "loss": 2.327, "step": 412890 }, { "epoch": 0.72, "learning_rate": 1.3997600421321374e-05, "loss": 2.2791, "step": 412900 }, { "epoch": 0.72, "learning_rate": 1.3996728481394548e-05, "loss": 2.3977, "step": 412910 }, { "epoch": 0.72, "learning_rate": 1.399585654146772e-05, "loss": 2.2388, "step": 412920 }, { "epoch": 0.72, "learning_rate": 1.3994984601540892e-05, "loss": 2.3345, "step": 412930 }, { "epoch": 0.72, "learning_rate": 1.3994112661614067e-05, "loss": 2.315, "step": 412940 }, { "epoch": 0.72, "learning_rate": 1.399324072168724e-05, "loss": 2.2887, "step": 412950 }, { "epoch": 0.72, "learning_rate": 1.3992368781760411e-05, "loss": 2.3151, "step": 412960 }, { "epoch": 0.72, "learning_rate": 1.3991496841833585e-05, "loss": 2.4646, "step": 412970 }, { "epoch": 0.72, "learning_rate": 1.399062490190676e-05, "loss": 2.2717, "step": 412980 }, { "epoch": 0.72, "learning_rate": 1.3989752961979933e-05, "loss": 2.3367, "step": 412990 }, { "epoch": 0.72, "learning_rate": 1.3988881022053105e-05, "loss": 2.3176, "step": 413000 }, { "epoch": 0.72, "learning_rate": 1.3988009082126277e-05, "loss": 2.3394, "step": 413010 }, { "epoch": 0.72, "learning_rate": 1.3987137142199452e-05, "loss": 2.3453, "step": 413020 }, { "epoch": 0.72, "learning_rate": 1.3986265202272624e-05, "loss": 2.2606, "step": 413030 }, { "epoch": 0.72, "learning_rate": 1.3985393262345798e-05, "loss": 2.2967, "step": 413040 }, { "epoch": 0.72, "learning_rate": 1.3984521322418972e-05, "loss": 2.3233, "step": 413050 }, { "epoch": 0.72, "learning_rate": 1.3983649382492146e-05, "loss": 2.3533, "step": 413060 }, { "epoch": 0.72, "learning_rate": 1.3982777442565318e-05, "loss": 2.2431, "step": 413070 }, { "epoch": 0.72, "learning_rate": 1.398190550263849e-05, "loss": 2.4271, "step": 413080 }, { "epoch": 0.72, "learning_rate": 1.3981033562711665e-05, "loss": 2.3302, "step": 413090 }, { "epoch": 0.72, "learning_rate": 1.3980161622784837e-05, "loss": 2.2829, "step": 413100 }, { "epoch": 0.72, "learning_rate": 1.397928968285801e-05, "loss": 2.2974, "step": 413110 }, { "epoch": 0.72, "learning_rate": 1.3978417742931183e-05, "loss": 2.2764, "step": 413120 }, { "epoch": 0.72, "learning_rate": 1.3977545803004357e-05, "loss": 2.3293, "step": 413130 }, { "epoch": 0.72, "learning_rate": 1.397667386307753e-05, "loss": 2.3089, "step": 413140 }, { "epoch": 0.72, "learning_rate": 1.3975801923150703e-05, "loss": 2.3142, "step": 413150 }, { "epoch": 0.72, "learning_rate": 1.3974929983223878e-05, "loss": 2.3383, "step": 413160 }, { "epoch": 0.72, "learning_rate": 1.397405804329705e-05, "loss": 2.3274, "step": 413170 }, { "epoch": 0.72, "learning_rate": 1.3973186103370222e-05, "loss": 2.371, "step": 413180 }, { "epoch": 0.72, "learning_rate": 1.3972314163443394e-05, "loss": 2.2662, "step": 413190 }, { "epoch": 0.72, "learning_rate": 1.397144222351657e-05, "loss": 2.3364, "step": 413200 }, { "epoch": 0.72, "learning_rate": 1.3970570283589742e-05, "loss": 2.3185, "step": 413210 }, { "epoch": 0.72, "learning_rate": 1.3969698343662916e-05, "loss": 2.2819, "step": 413220 }, { "epoch": 0.72, "learning_rate": 1.3968826403736088e-05, "loss": 2.2856, "step": 413230 }, { "epoch": 0.72, "learning_rate": 1.3967954463809263e-05, "loss": 2.3645, "step": 413240 }, { "epoch": 0.72, "learning_rate": 1.3967082523882435e-05, "loss": 2.3464, "step": 413250 }, { "epoch": 0.72, "learning_rate": 1.3966210583955607e-05, "loss": 2.3727, "step": 413260 }, { "epoch": 0.72, "learning_rate": 1.396533864402878e-05, "loss": 2.2689, "step": 413270 }, { "epoch": 0.72, "learning_rate": 1.3964466704101955e-05, "loss": 2.4352, "step": 413280 }, { "epoch": 0.72, "learning_rate": 1.3963594764175129e-05, "loss": 2.3032, "step": 413290 }, { "epoch": 0.72, "learning_rate": 1.3962722824248301e-05, "loss": 2.2381, "step": 413300 }, { "epoch": 0.72, "learning_rate": 1.3961850884321476e-05, "loss": 2.3282, "step": 413310 }, { "epoch": 0.72, "learning_rate": 1.3960978944394648e-05, "loss": 2.2147, "step": 413320 }, { "epoch": 0.72, "learning_rate": 1.396010700446782e-05, "loss": 2.4243, "step": 413330 }, { "epoch": 0.72, "learning_rate": 1.3959235064540993e-05, "loss": 2.206, "step": 413340 }, { "epoch": 0.72, "learning_rate": 1.3958363124614168e-05, "loss": 2.2412, "step": 413350 }, { "epoch": 0.72, "learning_rate": 1.395749118468734e-05, "loss": 2.4255, "step": 413360 }, { "epoch": 0.72, "learning_rate": 1.3956619244760514e-05, "loss": 2.2955, "step": 413370 }, { "epoch": 0.72, "learning_rate": 1.3955747304833686e-05, "loss": 2.3742, "step": 413380 }, { "epoch": 0.72, "learning_rate": 1.3954875364906861e-05, "loss": 2.3123, "step": 413390 }, { "epoch": 0.72, "learning_rate": 1.3954003424980033e-05, "loss": 2.3239, "step": 413400 }, { "epoch": 0.72, "learning_rate": 1.3953131485053206e-05, "loss": 2.2314, "step": 413410 }, { "epoch": 0.72, "learning_rate": 1.3952259545126381e-05, "loss": 2.335, "step": 413420 }, { "epoch": 0.72, "learning_rate": 1.3951387605199553e-05, "loss": 2.2558, "step": 413430 }, { "epoch": 0.72, "learning_rate": 1.3950515665272725e-05, "loss": 2.3397, "step": 413440 }, { "epoch": 0.72, "learning_rate": 1.3949643725345899e-05, "loss": 2.3072, "step": 413450 }, { "epoch": 0.72, "learning_rate": 1.3948771785419074e-05, "loss": 2.1826, "step": 413460 }, { "epoch": 0.72, "learning_rate": 1.3947899845492246e-05, "loss": 2.435, "step": 413470 }, { "epoch": 0.72, "learning_rate": 1.3947027905565419e-05, "loss": 2.3543, "step": 413480 }, { "epoch": 0.72, "learning_rate": 1.394615596563859e-05, "loss": 2.3236, "step": 413490 }, { "epoch": 0.72, "learning_rate": 1.3945284025711766e-05, "loss": 2.347, "step": 413500 }, { "epoch": 0.72, "learning_rate": 1.3944412085784938e-05, "loss": 2.2568, "step": 413510 }, { "epoch": 0.72, "learning_rate": 1.394354014585811e-05, "loss": 2.3404, "step": 413520 }, { "epoch": 0.72, "learning_rate": 1.3942668205931284e-05, "loss": 2.3346, "step": 413530 }, { "epoch": 0.72, "learning_rate": 1.394179626600446e-05, "loss": 2.2398, "step": 413540 }, { "epoch": 0.72, "learning_rate": 1.3940924326077632e-05, "loss": 2.2857, "step": 413550 }, { "epoch": 0.72, "learning_rate": 1.3940052386150804e-05, "loss": 2.1688, "step": 413560 }, { "epoch": 0.72, "learning_rate": 1.3939180446223979e-05, "loss": 2.3378, "step": 413570 }, { "epoch": 0.72, "learning_rate": 1.3938308506297151e-05, "loss": 2.2542, "step": 413580 }, { "epoch": 0.72, "learning_rate": 1.3937436566370323e-05, "loss": 2.2833, "step": 413590 }, { "epoch": 0.72, "learning_rate": 1.3936564626443497e-05, "loss": 2.3578, "step": 413600 }, { "epoch": 0.72, "learning_rate": 1.393569268651667e-05, "loss": 2.3295, "step": 413610 }, { "epoch": 0.72, "learning_rate": 1.3934820746589845e-05, "loss": 2.2849, "step": 413620 }, { "epoch": 0.72, "learning_rate": 1.3933948806663017e-05, "loss": 2.3786, "step": 413630 }, { "epoch": 0.72, "learning_rate": 1.3933076866736189e-05, "loss": 2.3338, "step": 413640 }, { "epoch": 0.72, "learning_rate": 1.3932204926809364e-05, "loss": 2.3075, "step": 413650 }, { "epoch": 0.72, "learning_rate": 1.3931332986882536e-05, "loss": 2.2543, "step": 413660 }, { "epoch": 0.72, "learning_rate": 1.3930461046955708e-05, "loss": 2.3831, "step": 413670 }, { "epoch": 0.72, "learning_rate": 1.3929589107028882e-05, "loss": 2.3333, "step": 413680 }, { "epoch": 0.72, "learning_rate": 1.3928717167102056e-05, "loss": 2.2634, "step": 413690 }, { "epoch": 0.72, "learning_rate": 1.392784522717523e-05, "loss": 2.2454, "step": 413700 }, { "epoch": 0.72, "learning_rate": 1.3926973287248402e-05, "loss": 2.2685, "step": 413710 }, { "epoch": 0.72, "learning_rate": 1.3926101347321577e-05, "loss": 2.2409, "step": 413720 }, { "epoch": 0.72, "learning_rate": 1.392522940739475e-05, "loss": 2.4206, "step": 413730 }, { "epoch": 0.72, "learning_rate": 1.3924357467467921e-05, "loss": 2.3922, "step": 413740 }, { "epoch": 0.72, "learning_rate": 1.3923485527541093e-05, "loss": 2.1995, "step": 413750 }, { "epoch": 0.72, "learning_rate": 1.3922613587614269e-05, "loss": 2.2769, "step": 413760 }, { "epoch": 0.72, "learning_rate": 1.3921741647687443e-05, "loss": 2.4169, "step": 413770 }, { "epoch": 0.72, "learning_rate": 1.3920869707760615e-05, "loss": 2.267, "step": 413780 }, { "epoch": 0.72, "learning_rate": 1.3919997767833787e-05, "loss": 2.2818, "step": 413790 }, { "epoch": 0.72, "learning_rate": 1.3919125827906962e-05, "loss": 2.1798, "step": 413800 }, { "epoch": 0.72, "learning_rate": 1.3918253887980134e-05, "loss": 2.3588, "step": 413810 }, { "epoch": 0.72, "learning_rate": 1.3917381948053306e-05, "loss": 2.1618, "step": 413820 }, { "epoch": 0.72, "learning_rate": 1.3916510008126482e-05, "loss": 2.4103, "step": 413830 }, { "epoch": 0.72, "learning_rate": 1.3915638068199654e-05, "loss": 2.3578, "step": 413840 }, { "epoch": 0.72, "learning_rate": 1.3914766128272828e-05, "loss": 2.306, "step": 413850 }, { "epoch": 0.72, "learning_rate": 1.3913894188346e-05, "loss": 2.324, "step": 413860 }, { "epoch": 0.72, "learning_rate": 1.3913022248419175e-05, "loss": 2.2739, "step": 413870 }, { "epoch": 0.72, "learning_rate": 1.3912150308492347e-05, "loss": 2.4021, "step": 413880 }, { "epoch": 0.72, "learning_rate": 1.391127836856552e-05, "loss": 2.3038, "step": 413890 }, { "epoch": 0.72, "learning_rate": 1.3910406428638692e-05, "loss": 2.2743, "step": 413900 }, { "epoch": 0.72, "learning_rate": 1.3909534488711867e-05, "loss": 2.37, "step": 413910 }, { "epoch": 0.72, "learning_rate": 1.3908662548785039e-05, "loss": 2.2735, "step": 413920 }, { "epoch": 0.72, "learning_rate": 1.3907790608858213e-05, "loss": 2.2985, "step": 413930 }, { "epoch": 0.72, "learning_rate": 1.3906918668931385e-05, "loss": 2.2921, "step": 413940 }, { "epoch": 0.72, "learning_rate": 1.390604672900456e-05, "loss": 2.2775, "step": 413950 }, { "epoch": 0.72, "learning_rate": 1.3905174789077732e-05, "loss": 2.1681, "step": 413960 }, { "epoch": 0.72, "learning_rate": 1.3904302849150905e-05, "loss": 2.423, "step": 413970 }, { "epoch": 0.72, "learning_rate": 1.390343090922408e-05, "loss": 2.186, "step": 413980 }, { "epoch": 0.72, "learning_rate": 1.3902558969297252e-05, "loss": 2.2277, "step": 413990 }, { "epoch": 0.72, "learning_rate": 1.3901687029370424e-05, "loss": 2.1995, "step": 414000 }, { "epoch": 0.72, "learning_rate": 1.3900815089443598e-05, "loss": 2.3167, "step": 414010 }, { "epoch": 0.72, "learning_rate": 1.3899943149516773e-05, "loss": 2.3119, "step": 414020 }, { "epoch": 0.72, "learning_rate": 1.3899071209589945e-05, "loss": 2.3705, "step": 414030 }, { "epoch": 0.72, "learning_rate": 1.3898199269663118e-05, "loss": 2.3055, "step": 414040 }, { "epoch": 0.72, "learning_rate": 1.389732732973629e-05, "loss": 2.3548, "step": 414050 }, { "epoch": 0.72, "learning_rate": 1.3896455389809465e-05, "loss": 2.2253, "step": 414060 }, { "epoch": 0.72, "learning_rate": 1.3895583449882637e-05, "loss": 2.419, "step": 414070 }, { "epoch": 0.72, "learning_rate": 1.3894711509955811e-05, "loss": 2.4399, "step": 414080 }, { "epoch": 0.72, "learning_rate": 1.3893839570028985e-05, "loss": 2.2303, "step": 414090 }, { "epoch": 0.72, "learning_rate": 1.3892967630102158e-05, "loss": 2.3062, "step": 414100 }, { "epoch": 0.72, "learning_rate": 1.389209569017533e-05, "loss": 2.3316, "step": 414110 }, { "epoch": 0.72, "learning_rate": 1.3891223750248503e-05, "loss": 2.3971, "step": 414120 }, { "epoch": 0.72, "learning_rate": 1.3890351810321678e-05, "loss": 2.2045, "step": 414130 }, { "epoch": 0.72, "learning_rate": 1.388947987039485e-05, "loss": 2.2341, "step": 414140 }, { "epoch": 0.72, "learning_rate": 1.3888607930468022e-05, "loss": 2.3123, "step": 414150 }, { "epoch": 0.72, "learning_rate": 1.3887735990541196e-05, "loss": 2.3413, "step": 414160 }, { "epoch": 0.72, "learning_rate": 1.388686405061437e-05, "loss": 2.4197, "step": 414170 }, { "epoch": 0.72, "learning_rate": 1.3885992110687544e-05, "loss": 2.2643, "step": 414180 }, { "epoch": 0.72, "learning_rate": 1.3885120170760716e-05, "loss": 2.339, "step": 414190 }, { "epoch": 0.72, "learning_rate": 1.3884248230833888e-05, "loss": 2.3222, "step": 414200 }, { "epoch": 0.72, "learning_rate": 1.3883376290907063e-05, "loss": 2.2482, "step": 414210 }, { "epoch": 0.72, "learning_rate": 1.3882504350980235e-05, "loss": 2.2677, "step": 414220 }, { "epoch": 0.72, "learning_rate": 1.3881632411053407e-05, "loss": 2.387, "step": 414230 }, { "epoch": 0.72, "learning_rate": 1.3880760471126583e-05, "loss": 2.1745, "step": 414240 }, { "epoch": 0.72, "learning_rate": 1.3879888531199755e-05, "loss": 2.2621, "step": 414250 }, { "epoch": 0.72, "learning_rate": 1.3879016591272929e-05, "loss": 2.3648, "step": 414260 }, { "epoch": 0.72, "learning_rate": 1.38781446513461e-05, "loss": 2.2902, "step": 414270 }, { "epoch": 0.72, "learning_rate": 1.3877272711419276e-05, "loss": 2.326, "step": 414280 }, { "epoch": 0.72, "learning_rate": 1.3876400771492448e-05, "loss": 2.2604, "step": 414290 }, { "epoch": 0.72, "learning_rate": 1.387552883156562e-05, "loss": 2.3448, "step": 414300 }, { "epoch": 0.72, "learning_rate": 1.3874656891638792e-05, "loss": 2.313, "step": 414310 }, { "epoch": 0.72, "learning_rate": 1.3873784951711968e-05, "loss": 2.241, "step": 414320 }, { "epoch": 0.72, "learning_rate": 1.3872913011785142e-05, "loss": 2.2767, "step": 414330 }, { "epoch": 0.72, "learning_rate": 1.3872041071858314e-05, "loss": 2.2855, "step": 414340 }, { "epoch": 0.72, "learning_rate": 1.3871169131931489e-05, "loss": 2.3112, "step": 414350 }, { "epoch": 0.72, "learning_rate": 1.3870297192004661e-05, "loss": 2.2428, "step": 414360 }, { "epoch": 0.72, "learning_rate": 1.3869425252077833e-05, "loss": 2.3461, "step": 414370 }, { "epoch": 0.72, "learning_rate": 1.3868553312151005e-05, "loss": 2.2923, "step": 414380 }, { "epoch": 0.72, "learning_rate": 1.386768137222418e-05, "loss": 2.4235, "step": 414390 }, { "epoch": 0.72, "learning_rate": 1.3866809432297353e-05, "loss": 2.367, "step": 414400 }, { "epoch": 0.72, "learning_rate": 1.3865937492370527e-05, "loss": 2.3201, "step": 414410 }, { "epoch": 0.72, "learning_rate": 1.3865065552443699e-05, "loss": 2.3549, "step": 414420 }, { "epoch": 0.72, "learning_rate": 1.3864193612516874e-05, "loss": 2.3569, "step": 414430 }, { "epoch": 0.72, "learning_rate": 1.3863321672590046e-05, "loss": 2.2674, "step": 414440 }, { "epoch": 0.72, "learning_rate": 1.3862449732663218e-05, "loss": 2.3099, "step": 414450 }, { "epoch": 0.72, "learning_rate": 1.386157779273639e-05, "loss": 2.2065, "step": 414460 }, { "epoch": 0.72, "learning_rate": 1.3860705852809566e-05, "loss": 2.3429, "step": 414470 }, { "epoch": 0.72, "learning_rate": 1.3859833912882738e-05, "loss": 2.3444, "step": 414480 }, { "epoch": 0.72, "learning_rate": 1.3858961972955912e-05, "loss": 2.2147, "step": 414490 }, { "epoch": 0.72, "learning_rate": 1.3858090033029087e-05, "loss": 2.1707, "step": 414500 }, { "epoch": 0.72, "learning_rate": 1.385721809310226e-05, "loss": 2.2482, "step": 414510 }, { "epoch": 0.72, "learning_rate": 1.3856346153175431e-05, "loss": 2.3438, "step": 414520 }, { "epoch": 0.72, "learning_rate": 1.3855474213248603e-05, "loss": 2.2063, "step": 414530 }, { "epoch": 0.72, "learning_rate": 1.3854602273321779e-05, "loss": 2.3334, "step": 414540 }, { "epoch": 0.72, "learning_rate": 1.3853730333394951e-05, "loss": 2.2479, "step": 414550 }, { "epoch": 0.72, "learning_rate": 1.3852858393468123e-05, "loss": 2.2696, "step": 414560 }, { "epoch": 0.72, "learning_rate": 1.3851986453541297e-05, "loss": 2.2955, "step": 414570 }, { "epoch": 0.72, "learning_rate": 1.3851114513614472e-05, "loss": 2.3569, "step": 414580 }, { "epoch": 0.72, "learning_rate": 1.3850242573687644e-05, "loss": 2.3954, "step": 414590 }, { "epoch": 0.72, "learning_rate": 1.3849370633760816e-05, "loss": 2.2585, "step": 414600 }, { "epoch": 0.72, "learning_rate": 1.3848498693833989e-05, "loss": 2.2515, "step": 414610 }, { "epoch": 0.72, "learning_rate": 1.3847626753907164e-05, "loss": 2.1645, "step": 414620 }, { "epoch": 0.72, "learning_rate": 1.3846754813980336e-05, "loss": 2.4385, "step": 414630 }, { "epoch": 0.72, "learning_rate": 1.384588287405351e-05, "loss": 2.2504, "step": 414640 }, { "epoch": 0.72, "learning_rate": 1.3845010934126684e-05, "loss": 2.2776, "step": 414650 }, { "epoch": 0.72, "learning_rate": 1.3844138994199857e-05, "loss": 2.3911, "step": 414660 }, { "epoch": 0.72, "learning_rate": 1.384326705427303e-05, "loss": 2.3224, "step": 414670 }, { "epoch": 0.72, "learning_rate": 1.3842395114346202e-05, "loss": 2.2692, "step": 414680 }, { "epoch": 0.72, "learning_rate": 1.3841523174419377e-05, "loss": 2.3327, "step": 414690 }, { "epoch": 0.72, "learning_rate": 1.3840651234492549e-05, "loss": 2.3016, "step": 414700 }, { "epoch": 0.72, "learning_rate": 1.3839779294565721e-05, "loss": 2.3463, "step": 414710 }, { "epoch": 0.72, "learning_rate": 1.3838907354638895e-05, "loss": 2.4561, "step": 414720 }, { "epoch": 0.72, "learning_rate": 1.3838035414712069e-05, "loss": 2.4446, "step": 414730 }, { "epoch": 0.72, "learning_rate": 1.3837163474785242e-05, "loss": 2.2725, "step": 414740 }, { "epoch": 0.72, "learning_rate": 1.3836291534858415e-05, "loss": 2.2771, "step": 414750 }, { "epoch": 0.72, "learning_rate": 1.383541959493159e-05, "loss": 2.2986, "step": 414760 }, { "epoch": 0.72, "learning_rate": 1.3834547655004762e-05, "loss": 2.3167, "step": 414770 }, { "epoch": 0.72, "learning_rate": 1.3833675715077934e-05, "loss": 2.2509, "step": 414780 }, { "epoch": 0.72, "learning_rate": 1.3832803775151106e-05, "loss": 2.3449, "step": 414790 }, { "epoch": 0.72, "learning_rate": 1.3831931835224282e-05, "loss": 2.4386, "step": 414800 }, { "epoch": 0.72, "learning_rate": 1.3831059895297455e-05, "loss": 2.3438, "step": 414810 }, { "epoch": 0.72, "learning_rate": 1.3830187955370628e-05, "loss": 2.2938, "step": 414820 }, { "epoch": 0.72, "learning_rate": 1.38293160154438e-05, "loss": 2.2716, "step": 414830 }, { "epoch": 0.72, "learning_rate": 1.3828444075516975e-05, "loss": 2.2715, "step": 414840 }, { "epoch": 0.72, "learning_rate": 1.3827572135590147e-05, "loss": 2.2669, "step": 414850 }, { "epoch": 0.72, "learning_rate": 1.382670019566332e-05, "loss": 2.3747, "step": 414860 }, { "epoch": 0.72, "learning_rate": 1.3825828255736491e-05, "loss": 2.2399, "step": 414870 }, { "epoch": 0.72, "learning_rate": 1.3824956315809667e-05, "loss": 2.3042, "step": 414880 }, { "epoch": 0.72, "learning_rate": 1.382408437588284e-05, "loss": 2.3847, "step": 414890 }, { "epoch": 0.72, "learning_rate": 1.3823212435956013e-05, "loss": 2.2952, "step": 414900 }, { "epoch": 0.72, "learning_rate": 1.3822340496029188e-05, "loss": 2.2372, "step": 414910 }, { "epoch": 0.72, "learning_rate": 1.382146855610236e-05, "loss": 2.3008, "step": 414920 }, { "epoch": 0.72, "learning_rate": 1.3820596616175532e-05, "loss": 2.3054, "step": 414930 }, { "epoch": 0.72, "learning_rate": 1.3819724676248704e-05, "loss": 2.2928, "step": 414940 }, { "epoch": 0.72, "learning_rate": 1.381885273632188e-05, "loss": 2.3654, "step": 414950 }, { "epoch": 0.72, "learning_rate": 1.3817980796395052e-05, "loss": 2.3344, "step": 414960 }, { "epoch": 0.72, "learning_rate": 1.3817108856468226e-05, "loss": 2.2504, "step": 414970 }, { "epoch": 0.72, "learning_rate": 1.3816236916541398e-05, "loss": 2.2951, "step": 414980 }, { "epoch": 0.72, "learning_rate": 1.3815364976614573e-05, "loss": 2.2982, "step": 414990 }, { "epoch": 0.72, "learning_rate": 1.3814493036687745e-05, "loss": 2.3187, "step": 415000 }, { "epoch": 0.72, "learning_rate": 1.3813621096760917e-05, "loss": 2.1673, "step": 415010 }, { "epoch": 0.72, "learning_rate": 1.3812749156834093e-05, "loss": 2.2943, "step": 415020 }, { "epoch": 0.72, "learning_rate": 1.3811877216907265e-05, "loss": 2.2697, "step": 415030 }, { "epoch": 0.72, "learning_rate": 1.3811005276980437e-05, "loss": 2.2958, "step": 415040 }, { "epoch": 0.72, "learning_rate": 1.381013333705361e-05, "loss": 2.3928, "step": 415050 }, { "epoch": 0.72, "learning_rate": 1.3809261397126786e-05, "loss": 2.3803, "step": 415060 }, { "epoch": 0.72, "learning_rate": 1.3808389457199958e-05, "loss": 2.2644, "step": 415070 }, { "epoch": 0.72, "learning_rate": 1.380751751727313e-05, "loss": 2.3381, "step": 415080 }, { "epoch": 0.72, "learning_rate": 1.3806645577346302e-05, "loss": 2.2467, "step": 415090 }, { "epoch": 0.72, "learning_rate": 1.3805773637419478e-05, "loss": 2.3133, "step": 415100 }, { "epoch": 0.72, "learning_rate": 1.380490169749265e-05, "loss": 2.3648, "step": 415110 }, { "epoch": 0.72, "learning_rate": 1.3804029757565824e-05, "loss": 2.3277, "step": 415120 }, { "epoch": 0.72, "learning_rate": 1.3803157817638996e-05, "loss": 2.4418, "step": 415130 }, { "epoch": 0.72, "learning_rate": 1.3802285877712171e-05, "loss": 2.281, "step": 415140 }, { "epoch": 0.72, "learning_rate": 1.3801413937785343e-05, "loss": 2.3323, "step": 415150 }, { "epoch": 0.72, "learning_rate": 1.3800541997858515e-05, "loss": 2.396, "step": 415160 }, { "epoch": 0.72, "learning_rate": 1.379967005793169e-05, "loss": 2.3894, "step": 415170 }, { "epoch": 0.72, "learning_rate": 1.3798798118004863e-05, "loss": 2.3257, "step": 415180 }, { "epoch": 0.72, "learning_rate": 1.3797926178078035e-05, "loss": 2.4242, "step": 415190 }, { "epoch": 0.72, "learning_rate": 1.3797054238151209e-05, "loss": 2.3415, "step": 415200 }, { "epoch": 0.72, "learning_rate": 1.3796182298224383e-05, "loss": 2.363, "step": 415210 }, { "epoch": 0.72, "learning_rate": 1.3795310358297556e-05, "loss": 2.1792, "step": 415220 }, { "epoch": 0.72, "learning_rate": 1.3794438418370728e-05, "loss": 2.4018, "step": 415230 }, { "epoch": 0.72, "learning_rate": 1.37935664784439e-05, "loss": 2.3227, "step": 415240 }, { "epoch": 0.72, "learning_rate": 1.3792694538517076e-05, "loss": 2.2331, "step": 415250 }, { "epoch": 0.72, "learning_rate": 1.3791822598590248e-05, "loss": 2.2625, "step": 415260 }, { "epoch": 0.72, "learning_rate": 1.379095065866342e-05, "loss": 2.3046, "step": 415270 }, { "epoch": 0.72, "learning_rate": 1.3790078718736596e-05, "loss": 2.2263, "step": 415280 }, { "epoch": 0.72, "learning_rate": 1.3789206778809768e-05, "loss": 2.3363, "step": 415290 }, { "epoch": 0.72, "learning_rate": 1.3788334838882941e-05, "loss": 2.2121, "step": 415300 }, { "epoch": 0.72, "learning_rate": 1.3787462898956113e-05, "loss": 2.2303, "step": 415310 }, { "epoch": 0.72, "learning_rate": 1.3786590959029289e-05, "loss": 2.2469, "step": 415320 }, { "epoch": 0.72, "learning_rate": 1.3785719019102461e-05, "loss": 2.346, "step": 415330 }, { "epoch": 0.72, "learning_rate": 1.3784847079175633e-05, "loss": 2.3428, "step": 415340 }, { "epoch": 0.72, "learning_rate": 1.3783975139248805e-05, "loss": 2.2102, "step": 415350 }, { "epoch": 0.72, "learning_rate": 1.378310319932198e-05, "loss": 2.2586, "step": 415360 }, { "epoch": 0.72, "learning_rate": 1.3782231259395154e-05, "loss": 2.3218, "step": 415370 }, { "epoch": 0.72, "learning_rate": 1.3781359319468326e-05, "loss": 2.3062, "step": 415380 }, { "epoch": 0.72, "learning_rate": 1.3780487379541499e-05, "loss": 2.2311, "step": 415390 }, { "epoch": 0.72, "learning_rate": 1.3779615439614674e-05, "loss": 2.2892, "step": 415400 }, { "epoch": 0.72, "learning_rate": 1.3778743499687846e-05, "loss": 2.3313, "step": 415410 }, { "epoch": 0.72, "learning_rate": 1.3777871559761018e-05, "loss": 2.3319, "step": 415420 }, { "epoch": 0.72, "learning_rate": 1.3776999619834194e-05, "loss": 2.3042, "step": 415430 }, { "epoch": 0.72, "learning_rate": 1.3776127679907366e-05, "loss": 2.2327, "step": 415440 }, { "epoch": 0.72, "learning_rate": 1.377525573998054e-05, "loss": 2.2598, "step": 415450 }, { "epoch": 0.72, "learning_rate": 1.3774383800053712e-05, "loss": 2.3284, "step": 415460 }, { "epoch": 0.72, "learning_rate": 1.3773511860126887e-05, "loss": 2.3569, "step": 415470 }, { "epoch": 0.72, "learning_rate": 1.3772639920200059e-05, "loss": 2.4733, "step": 415480 }, { "epoch": 0.72, "learning_rate": 1.3771767980273231e-05, "loss": 2.2941, "step": 415490 }, { "epoch": 0.72, "learning_rate": 1.3770896040346403e-05, "loss": 2.3917, "step": 415500 }, { "epoch": 0.72, "learning_rate": 1.3770024100419579e-05, "loss": 2.313, "step": 415510 }, { "epoch": 0.72, "learning_rate": 1.376915216049275e-05, "loss": 2.3749, "step": 415520 }, { "epoch": 0.72, "learning_rate": 1.3768280220565925e-05, "loss": 2.2921, "step": 415530 }, { "epoch": 0.72, "learning_rate": 1.3767408280639097e-05, "loss": 2.4631, "step": 415540 }, { "epoch": 0.72, "learning_rate": 1.3766536340712272e-05, "loss": 2.4096, "step": 415550 }, { "epoch": 0.72, "learning_rate": 1.3765664400785444e-05, "loss": 2.2456, "step": 415560 }, { "epoch": 0.72, "learning_rate": 1.3764792460858616e-05, "loss": 2.3864, "step": 415570 }, { "epoch": 0.72, "learning_rate": 1.3763920520931792e-05, "loss": 2.3681, "step": 415580 }, { "epoch": 0.72, "learning_rate": 1.3763048581004964e-05, "loss": 2.352, "step": 415590 }, { "epoch": 0.72, "learning_rate": 1.3762176641078136e-05, "loss": 2.2698, "step": 415600 }, { "epoch": 0.72, "learning_rate": 1.376130470115131e-05, "loss": 2.2555, "step": 415610 }, { "epoch": 0.72, "learning_rate": 1.3760432761224485e-05, "loss": 2.3244, "step": 415620 }, { "epoch": 0.72, "learning_rate": 1.3759560821297657e-05, "loss": 2.3977, "step": 415630 }, { "epoch": 0.72, "learning_rate": 1.375868888137083e-05, "loss": 2.2446, "step": 415640 }, { "epoch": 0.72, "learning_rate": 1.3757816941444001e-05, "loss": 2.2767, "step": 415650 }, { "epoch": 0.72, "learning_rate": 1.3756945001517177e-05, "loss": 2.2732, "step": 415660 }, { "epoch": 0.72, "learning_rate": 1.3756073061590349e-05, "loss": 2.1919, "step": 415670 }, { "epoch": 0.72, "learning_rate": 1.3755201121663523e-05, "loss": 2.2464, "step": 415680 }, { "epoch": 0.72, "learning_rate": 1.3754329181736696e-05, "loss": 2.3936, "step": 415690 }, { "epoch": 0.72, "learning_rate": 1.375345724180987e-05, "loss": 2.3093, "step": 415700 }, { "epoch": 0.72, "learning_rate": 1.3752585301883042e-05, "loss": 2.2678, "step": 415710 }, { "epoch": 0.72, "learning_rate": 1.3751713361956214e-05, "loss": 2.2637, "step": 415720 }, { "epoch": 0.72, "learning_rate": 1.375084142202939e-05, "loss": 2.3827, "step": 415730 }, { "epoch": 0.73, "learning_rate": 1.3749969482102562e-05, "loss": 2.2377, "step": 415740 }, { "epoch": 0.73, "learning_rate": 1.3749097542175734e-05, "loss": 2.212, "step": 415750 }, { "epoch": 0.73, "learning_rate": 1.3748225602248908e-05, "loss": 2.3252, "step": 415760 }, { "epoch": 0.73, "learning_rate": 1.3747353662322081e-05, "loss": 2.4124, "step": 415770 }, { "epoch": 0.73, "learning_rate": 1.3746481722395255e-05, "loss": 2.4405, "step": 415780 }, { "epoch": 0.73, "learning_rate": 1.3745609782468427e-05, "loss": 2.2972, "step": 415790 }, { "epoch": 0.73, "learning_rate": 1.37447378425416e-05, "loss": 2.2554, "step": 415800 }, { "epoch": 0.73, "learning_rate": 1.3743865902614775e-05, "loss": 2.3053, "step": 415810 }, { "epoch": 0.73, "learning_rate": 1.3742993962687947e-05, "loss": 2.2841, "step": 415820 }, { "epoch": 0.73, "learning_rate": 1.3742122022761119e-05, "loss": 2.2694, "step": 415830 }, { "epoch": 0.73, "learning_rate": 1.3741250082834294e-05, "loss": 2.2948, "step": 415840 }, { "epoch": 0.73, "learning_rate": 1.3740378142907468e-05, "loss": 2.3977, "step": 415850 }, { "epoch": 0.73, "learning_rate": 1.373950620298064e-05, "loss": 2.3165, "step": 415860 }, { "epoch": 0.73, "learning_rate": 1.3738634263053812e-05, "loss": 2.348, "step": 415870 }, { "epoch": 0.73, "learning_rate": 1.3737762323126988e-05, "loss": 2.3273, "step": 415880 }, { "epoch": 0.73, "learning_rate": 1.373689038320016e-05, "loss": 2.3053, "step": 415890 }, { "epoch": 0.73, "learning_rate": 1.3736018443273332e-05, "loss": 2.2154, "step": 415900 }, { "epoch": 0.73, "learning_rate": 1.3735146503346504e-05, "loss": 2.3529, "step": 415910 }, { "epoch": 0.73, "learning_rate": 1.373427456341968e-05, "loss": 2.3012, "step": 415920 }, { "epoch": 0.73, "learning_rate": 1.3733402623492853e-05, "loss": 2.204, "step": 415930 }, { "epoch": 0.73, "learning_rate": 1.3732530683566025e-05, "loss": 2.4152, "step": 415940 }, { "epoch": 0.73, "learning_rate": 1.37316587436392e-05, "loss": 2.4046, "step": 415950 }, { "epoch": 0.73, "learning_rate": 1.3730786803712373e-05, "loss": 2.251, "step": 415960 }, { "epoch": 0.73, "learning_rate": 1.3729914863785545e-05, "loss": 2.2198, "step": 415970 }, { "epoch": 0.73, "learning_rate": 1.3729042923858717e-05, "loss": 2.2971, "step": 415980 }, { "epoch": 0.73, "learning_rate": 1.3728170983931893e-05, "loss": 2.242, "step": 415990 }, { "epoch": 0.73, "learning_rate": 1.3727299044005065e-05, "loss": 2.3331, "step": 416000 }, { "epoch": 0.73, "learning_rate": 1.3726427104078238e-05, "loss": 2.2637, "step": 416010 }, { "epoch": 0.73, "learning_rate": 1.372555516415141e-05, "loss": 2.3179, "step": 416020 }, { "epoch": 0.73, "learning_rate": 1.3724683224224586e-05, "loss": 2.2886, "step": 416030 }, { "epoch": 0.73, "learning_rate": 1.3723811284297758e-05, "loss": 2.3137, "step": 416040 }, { "epoch": 0.73, "learning_rate": 1.372293934437093e-05, "loss": 2.2073, "step": 416050 }, { "epoch": 0.73, "learning_rate": 1.3722067404444102e-05, "loss": 2.323, "step": 416060 }, { "epoch": 0.73, "learning_rate": 1.3721195464517278e-05, "loss": 2.3172, "step": 416070 }, { "epoch": 0.73, "learning_rate": 1.372032352459045e-05, "loss": 2.3427, "step": 416080 }, { "epoch": 0.73, "learning_rate": 1.3719451584663623e-05, "loss": 2.38, "step": 416090 }, { "epoch": 0.73, "learning_rate": 1.3718579644736799e-05, "loss": 2.2764, "step": 416100 }, { "epoch": 0.73, "learning_rate": 1.3717707704809971e-05, "loss": 2.2975, "step": 416110 }, { "epoch": 0.73, "learning_rate": 1.3716835764883143e-05, "loss": 2.2867, "step": 416120 }, { "epoch": 0.73, "learning_rate": 1.3715963824956315e-05, "loss": 2.2478, "step": 416130 }, { "epoch": 0.73, "learning_rate": 1.371509188502949e-05, "loss": 2.2668, "step": 416140 }, { "epoch": 0.73, "learning_rate": 1.3714219945102663e-05, "loss": 2.3715, "step": 416150 }, { "epoch": 0.73, "learning_rate": 1.3713348005175836e-05, "loss": 2.4052, "step": 416160 }, { "epoch": 0.73, "learning_rate": 1.3712476065249009e-05, "loss": 2.4084, "step": 416170 }, { "epoch": 0.73, "learning_rate": 1.3711604125322184e-05, "loss": 2.2185, "step": 416180 }, { "epoch": 0.73, "learning_rate": 1.3710732185395356e-05, "loss": 2.2235, "step": 416190 }, { "epoch": 0.73, "learning_rate": 1.3709860245468528e-05, "loss": 2.2532, "step": 416200 }, { "epoch": 0.73, "learning_rate": 1.3708988305541704e-05, "loss": 2.2648, "step": 416210 }, { "epoch": 0.73, "learning_rate": 1.3708116365614876e-05, "loss": 2.3271, "step": 416220 }, { "epoch": 0.73, "learning_rate": 1.3707244425688048e-05, "loss": 2.3384, "step": 416230 }, { "epoch": 0.73, "learning_rate": 1.3706372485761222e-05, "loss": 2.2476, "step": 416240 }, { "epoch": 0.73, "learning_rate": 1.3705500545834395e-05, "loss": 2.3799, "step": 416250 }, { "epoch": 0.73, "learning_rate": 1.3704628605907569e-05, "loss": 2.3403, "step": 416260 }, { "epoch": 0.73, "learning_rate": 1.3703756665980741e-05, "loss": 2.2183, "step": 416270 }, { "epoch": 0.73, "learning_rate": 1.3702884726053913e-05, "loss": 2.3017, "step": 416280 }, { "epoch": 0.73, "learning_rate": 1.3702012786127089e-05, "loss": 2.2375, "step": 416290 }, { "epoch": 0.73, "learning_rate": 1.370114084620026e-05, "loss": 2.3493, "step": 416300 }, { "epoch": 0.73, "learning_rate": 1.3700268906273433e-05, "loss": 2.1701, "step": 416310 }, { "epoch": 0.73, "learning_rate": 1.3699396966346607e-05, "loss": 2.2827, "step": 416320 }, { "epoch": 0.73, "learning_rate": 1.369852502641978e-05, "loss": 2.3042, "step": 416330 }, { "epoch": 0.73, "learning_rate": 1.3697653086492954e-05, "loss": 2.2023, "step": 416340 }, { "epoch": 0.73, "learning_rate": 1.3696781146566126e-05, "loss": 2.2578, "step": 416350 }, { "epoch": 0.73, "learning_rate": 1.3695909206639302e-05, "loss": 2.3252, "step": 416360 }, { "epoch": 0.73, "learning_rate": 1.3695037266712474e-05, "loss": 2.39, "step": 416370 }, { "epoch": 0.73, "learning_rate": 1.3694165326785646e-05, "loss": 2.3404, "step": 416380 }, { "epoch": 0.73, "learning_rate": 1.3693293386858818e-05, "loss": 2.242, "step": 416390 }, { "epoch": 0.73, "learning_rate": 1.3692421446931993e-05, "loss": 2.2445, "step": 416400 }, { "epoch": 0.73, "learning_rate": 1.3691549507005167e-05, "loss": 2.3567, "step": 416410 }, { "epoch": 0.73, "learning_rate": 1.369067756707834e-05, "loss": 2.2374, "step": 416420 }, { "epoch": 0.73, "learning_rate": 1.3689805627151511e-05, "loss": 2.312, "step": 416430 }, { "epoch": 0.73, "learning_rate": 1.3688933687224687e-05, "loss": 2.2894, "step": 416440 }, { "epoch": 0.73, "learning_rate": 1.3688061747297859e-05, "loss": 2.2745, "step": 416450 }, { "epoch": 0.73, "learning_rate": 1.3687189807371031e-05, "loss": 2.1889, "step": 416460 }, { "epoch": 0.73, "learning_rate": 1.3686317867444205e-05, "loss": 2.3292, "step": 416470 }, { "epoch": 0.73, "learning_rate": 1.3685445927517378e-05, "loss": 2.2992, "step": 416480 }, { "epoch": 0.73, "learning_rate": 1.3684573987590552e-05, "loss": 2.3431, "step": 416490 }, { "epoch": 0.73, "learning_rate": 1.3683702047663724e-05, "loss": 2.2276, "step": 416500 }, { "epoch": 0.73, "learning_rate": 1.36828301077369e-05, "loss": 2.3711, "step": 416510 }, { "epoch": 0.73, "learning_rate": 1.3681958167810072e-05, "loss": 2.3049, "step": 416520 }, { "epoch": 0.73, "learning_rate": 1.3681086227883244e-05, "loss": 2.3162, "step": 416530 }, { "epoch": 0.73, "learning_rate": 1.3680214287956416e-05, "loss": 2.2607, "step": 416540 }, { "epoch": 0.73, "learning_rate": 1.3679342348029591e-05, "loss": 2.2634, "step": 416550 }, { "epoch": 0.73, "learning_rate": 1.3678470408102764e-05, "loss": 2.183, "step": 416560 }, { "epoch": 0.73, "learning_rate": 1.3677598468175937e-05, "loss": 2.249, "step": 416570 }, { "epoch": 0.73, "learning_rate": 1.367672652824911e-05, "loss": 2.2464, "step": 416580 }, { "epoch": 0.73, "learning_rate": 1.3675854588322285e-05, "loss": 2.2819, "step": 416590 }, { "epoch": 0.73, "learning_rate": 1.3674982648395457e-05, "loss": 2.3333, "step": 416600 }, { "epoch": 0.73, "learning_rate": 1.3674110708468629e-05, "loss": 2.4057, "step": 416610 }, { "epoch": 0.73, "learning_rate": 1.3673238768541804e-05, "loss": 2.2897, "step": 416620 }, { "epoch": 0.73, "learning_rate": 1.3672366828614977e-05, "loss": 2.5331, "step": 416630 }, { "epoch": 0.73, "learning_rate": 1.3671494888688149e-05, "loss": 2.1556, "step": 416640 }, { "epoch": 0.73, "learning_rate": 1.3670622948761322e-05, "loss": 2.2206, "step": 416650 }, { "epoch": 0.73, "learning_rate": 1.3669751008834498e-05, "loss": 2.2526, "step": 416660 }, { "epoch": 0.73, "learning_rate": 1.366887906890767e-05, "loss": 2.1602, "step": 416670 }, { "epoch": 0.73, "learning_rate": 1.3668007128980842e-05, "loss": 2.3447, "step": 416680 }, { "epoch": 0.73, "learning_rate": 1.3667135189054014e-05, "loss": 2.2904, "step": 416690 }, { "epoch": 0.73, "learning_rate": 1.366626324912719e-05, "loss": 2.3485, "step": 416700 }, { "epoch": 0.73, "learning_rate": 1.3665391309200362e-05, "loss": 2.3504, "step": 416710 }, { "epoch": 0.73, "learning_rate": 1.3664519369273535e-05, "loss": 2.2875, "step": 416720 }, { "epoch": 0.73, "learning_rate": 1.3663647429346707e-05, "loss": 2.3026, "step": 416730 }, { "epoch": 0.73, "learning_rate": 1.3662775489419883e-05, "loss": 2.284, "step": 416740 }, { "epoch": 0.73, "learning_rate": 1.3661903549493055e-05, "loss": 2.1687, "step": 416750 }, { "epoch": 0.73, "learning_rate": 1.3661031609566227e-05, "loss": 2.3942, "step": 416760 }, { "epoch": 0.73, "learning_rate": 1.3660159669639403e-05, "loss": 2.2521, "step": 416770 }, { "epoch": 0.73, "learning_rate": 1.3659287729712575e-05, "loss": 2.2618, "step": 416780 }, { "epoch": 0.73, "learning_rate": 1.3658415789785747e-05, "loss": 2.2331, "step": 416790 }, { "epoch": 0.73, "learning_rate": 1.365754384985892e-05, "loss": 2.4094, "step": 416800 }, { "epoch": 0.73, "learning_rate": 1.3656671909932094e-05, "loss": 2.2192, "step": 416810 }, { "epoch": 0.73, "learning_rate": 1.3655799970005268e-05, "loss": 2.2283, "step": 416820 }, { "epoch": 0.73, "learning_rate": 1.365492803007844e-05, "loss": 2.2816, "step": 416830 }, { "epoch": 0.73, "learning_rate": 1.3654056090151612e-05, "loss": 2.3655, "step": 416840 }, { "epoch": 0.73, "learning_rate": 1.3653184150224788e-05, "loss": 2.4086, "step": 416850 }, { "epoch": 0.73, "learning_rate": 1.365231221029796e-05, "loss": 2.3266, "step": 416860 }, { "epoch": 0.73, "learning_rate": 1.3651440270371132e-05, "loss": 2.2237, "step": 416870 }, { "epoch": 0.73, "learning_rate": 1.3650568330444307e-05, "loss": 2.3258, "step": 416880 }, { "epoch": 0.73, "learning_rate": 1.3649696390517481e-05, "loss": 2.2466, "step": 416890 }, { "epoch": 0.73, "learning_rate": 1.3648824450590653e-05, "loss": 2.3124, "step": 416900 }, { "epoch": 0.73, "learning_rate": 1.3647952510663825e-05, "loss": 2.3215, "step": 416910 }, { "epoch": 0.73, "learning_rate": 1.3647080570737e-05, "loss": 2.2597, "step": 416920 }, { "epoch": 0.73, "learning_rate": 1.3646208630810173e-05, "loss": 2.2232, "step": 416930 }, { "epoch": 0.73, "learning_rate": 1.3645336690883345e-05, "loss": 2.2931, "step": 416940 }, { "epoch": 0.73, "learning_rate": 1.3644464750956517e-05, "loss": 2.2262, "step": 416950 }, { "epoch": 0.73, "learning_rate": 1.3643592811029692e-05, "loss": 2.3286, "step": 416960 }, { "epoch": 0.73, "learning_rate": 1.3642720871102866e-05, "loss": 2.2995, "step": 416970 }, { "epoch": 0.73, "learning_rate": 1.3641848931176038e-05, "loss": 2.3532, "step": 416980 }, { "epoch": 0.73, "learning_rate": 1.364097699124921e-05, "loss": 2.3452, "step": 416990 }, { "epoch": 0.73, "learning_rate": 1.3640105051322386e-05, "loss": 2.3576, "step": 417000 }, { "epoch": 0.73, "learning_rate": 1.3639233111395558e-05, "loss": 2.2491, "step": 417010 }, { "epoch": 0.73, "learning_rate": 1.363836117146873e-05, "loss": 2.2604, "step": 417020 }, { "epoch": 0.73, "learning_rate": 1.3637489231541905e-05, "loss": 2.3354, "step": 417030 }, { "epoch": 0.73, "learning_rate": 1.3636617291615077e-05, "loss": 2.4027, "step": 417040 }, { "epoch": 0.73, "learning_rate": 1.3635745351688251e-05, "loss": 2.347, "step": 417050 }, { "epoch": 0.73, "learning_rate": 1.3634873411761423e-05, "loss": 2.2956, "step": 417060 }, { "epoch": 0.73, "learning_rate": 1.3634001471834599e-05, "loss": 2.2713, "step": 417070 }, { "epoch": 0.73, "learning_rate": 1.363312953190777e-05, "loss": 2.4122, "step": 417080 }, { "epoch": 0.73, "learning_rate": 1.3632257591980943e-05, "loss": 2.2683, "step": 417090 }, { "epoch": 0.73, "learning_rate": 1.3631385652054115e-05, "loss": 2.3061, "step": 417100 }, { "epoch": 0.73, "learning_rate": 1.363051371212729e-05, "loss": 2.3531, "step": 417110 }, { "epoch": 0.73, "learning_rate": 1.3629641772200462e-05, "loss": 2.2371, "step": 417120 }, { "epoch": 0.73, "learning_rate": 1.3628769832273636e-05, "loss": 2.2433, "step": 417130 }, { "epoch": 0.73, "learning_rate": 1.3627897892346812e-05, "loss": 2.3503, "step": 417140 }, { "epoch": 0.73, "learning_rate": 1.3627025952419984e-05, "loss": 2.3751, "step": 417150 }, { "epoch": 0.73, "learning_rate": 1.3626154012493156e-05, "loss": 2.4177, "step": 417160 }, { "epoch": 0.73, "learning_rate": 1.3625282072566328e-05, "loss": 2.2331, "step": 417170 }, { "epoch": 0.73, "learning_rate": 1.3624410132639503e-05, "loss": 2.3158, "step": 417180 }, { "epoch": 0.73, "learning_rate": 1.3623538192712675e-05, "loss": 2.2693, "step": 417190 }, { "epoch": 0.73, "learning_rate": 1.362266625278585e-05, "loss": 2.2509, "step": 417200 }, { "epoch": 0.73, "learning_rate": 1.3621794312859021e-05, "loss": 2.3535, "step": 417210 }, { "epoch": 0.73, "learning_rate": 1.3620922372932197e-05, "loss": 2.1126, "step": 417220 }, { "epoch": 0.73, "learning_rate": 1.3620050433005369e-05, "loss": 2.2329, "step": 417230 }, { "epoch": 0.73, "learning_rate": 1.3619178493078541e-05, "loss": 2.3545, "step": 417240 }, { "epoch": 0.73, "learning_rate": 1.3618306553151713e-05, "loss": 2.3174, "step": 417250 }, { "epoch": 0.73, "learning_rate": 1.3617434613224888e-05, "loss": 2.398, "step": 417260 }, { "epoch": 0.73, "learning_rate": 1.361656267329806e-05, "loss": 2.2931, "step": 417270 }, { "epoch": 0.73, "learning_rate": 1.3615690733371234e-05, "loss": 2.3376, "step": 417280 }, { "epoch": 0.73, "learning_rate": 1.3614818793444408e-05, "loss": 2.3066, "step": 417290 }, { "epoch": 0.73, "learning_rate": 1.3613946853517582e-05, "loss": 2.272, "step": 417300 }, { "epoch": 0.73, "learning_rate": 1.3613074913590754e-05, "loss": 2.2418, "step": 417310 }, { "epoch": 0.73, "learning_rate": 1.3612202973663926e-05, "loss": 2.2475, "step": 417320 }, { "epoch": 0.73, "learning_rate": 1.3611331033737101e-05, "loss": 2.3597, "step": 417330 }, { "epoch": 0.73, "learning_rate": 1.3610459093810274e-05, "loss": 2.3456, "step": 417340 }, { "epoch": 0.73, "learning_rate": 1.3609587153883446e-05, "loss": 2.3253, "step": 417350 }, { "epoch": 0.73, "learning_rate": 1.360871521395662e-05, "loss": 2.2684, "step": 417360 }, { "epoch": 0.73, "learning_rate": 1.3607843274029793e-05, "loss": 2.1416, "step": 417370 }, { "epoch": 0.73, "learning_rate": 1.3606971334102967e-05, "loss": 2.2806, "step": 417380 }, { "epoch": 0.73, "learning_rate": 1.3606099394176139e-05, "loss": 2.2749, "step": 417390 }, { "epoch": 0.73, "learning_rate": 1.3605227454249311e-05, "loss": 2.1783, "step": 417400 }, { "epoch": 0.73, "learning_rate": 1.3604355514322487e-05, "loss": 2.2531, "step": 417410 }, { "epoch": 0.73, "learning_rate": 1.3603483574395659e-05, "loss": 2.2885, "step": 417420 }, { "epoch": 0.73, "learning_rate": 1.360261163446883e-05, "loss": 2.35, "step": 417430 }, { "epoch": 0.73, "learning_rate": 1.3601739694542006e-05, "loss": 2.3246, "step": 417440 }, { "epoch": 0.73, "learning_rate": 1.360086775461518e-05, "loss": 2.2607, "step": 417450 }, { "epoch": 0.73, "learning_rate": 1.3599995814688352e-05, "loss": 2.2877, "step": 417460 }, { "epoch": 0.73, "learning_rate": 1.3599123874761524e-05, "loss": 2.3139, "step": 417470 }, { "epoch": 0.73, "learning_rate": 1.35982519348347e-05, "loss": 2.3194, "step": 417480 }, { "epoch": 0.73, "learning_rate": 1.3597379994907872e-05, "loss": 2.3143, "step": 417490 }, { "epoch": 0.73, "learning_rate": 1.3596508054981044e-05, "loss": 2.2805, "step": 417500 }, { "epoch": 0.73, "learning_rate": 1.3595636115054217e-05, "loss": 2.3386, "step": 417510 }, { "epoch": 0.73, "learning_rate": 1.3594764175127391e-05, "loss": 2.3469, "step": 417520 }, { "epoch": 0.73, "learning_rate": 1.3593892235200565e-05, "loss": 2.2471, "step": 417530 }, { "epoch": 0.73, "learning_rate": 1.3593020295273737e-05, "loss": 2.2355, "step": 417540 }, { "epoch": 0.73, "learning_rate": 1.3592148355346913e-05, "loss": 2.3021, "step": 417550 }, { "epoch": 0.73, "learning_rate": 1.3591276415420085e-05, "loss": 2.2892, "step": 417560 }, { "epoch": 0.73, "learning_rate": 1.3590404475493257e-05, "loss": 2.345, "step": 417570 }, { "epoch": 0.73, "learning_rate": 1.3589532535566429e-05, "loss": 2.3835, "step": 417580 }, { "epoch": 0.73, "learning_rate": 1.3588660595639604e-05, "loss": 2.2152, "step": 417590 }, { "epoch": 0.73, "learning_rate": 1.3587788655712776e-05, "loss": 2.3859, "step": 417600 }, { "epoch": 0.73, "learning_rate": 1.358691671578595e-05, "loss": 2.209, "step": 417610 }, { "epoch": 0.73, "learning_rate": 1.3586044775859122e-05, "loss": 2.3836, "step": 417620 }, { "epoch": 0.73, "learning_rate": 1.3585172835932298e-05, "loss": 2.1868, "step": 417630 }, { "epoch": 0.73, "learning_rate": 1.358430089600547e-05, "loss": 2.2373, "step": 417640 }, { "epoch": 0.73, "learning_rate": 1.3583428956078642e-05, "loss": 2.2997, "step": 417650 }, { "epoch": 0.73, "learning_rate": 1.3582557016151814e-05, "loss": 2.2485, "step": 417660 }, { "epoch": 0.73, "learning_rate": 1.358168507622499e-05, "loss": 2.3846, "step": 417670 }, { "epoch": 0.73, "learning_rate": 1.3580813136298161e-05, "loss": 2.2668, "step": 417680 }, { "epoch": 0.73, "learning_rate": 1.3579941196371335e-05, "loss": 2.2747, "step": 417690 }, { "epoch": 0.73, "learning_rate": 1.357906925644451e-05, "loss": 2.3108, "step": 417700 }, { "epoch": 0.73, "learning_rate": 1.3578197316517683e-05, "loss": 2.3239, "step": 417710 }, { "epoch": 0.73, "learning_rate": 1.3577325376590855e-05, "loss": 2.2243, "step": 417720 }, { "epoch": 0.73, "learning_rate": 1.3576453436664027e-05, "loss": 2.3318, "step": 417730 }, { "epoch": 0.73, "learning_rate": 1.3575581496737202e-05, "loss": 2.2744, "step": 417740 }, { "epoch": 0.73, "learning_rate": 1.3574709556810374e-05, "loss": 2.3492, "step": 417750 }, { "epoch": 0.73, "learning_rate": 1.3573837616883548e-05, "loss": 2.2395, "step": 417760 }, { "epoch": 0.73, "learning_rate": 1.357296567695672e-05, "loss": 2.2008, "step": 417770 }, { "epoch": 0.73, "learning_rate": 1.3572093737029896e-05, "loss": 2.318, "step": 417780 }, { "epoch": 0.73, "learning_rate": 1.3571221797103068e-05, "loss": 2.2754, "step": 417790 }, { "epoch": 0.73, "learning_rate": 1.357034985717624e-05, "loss": 2.2343, "step": 417800 }, { "epoch": 0.73, "learning_rate": 1.3569477917249415e-05, "loss": 2.4031, "step": 417810 }, { "epoch": 0.73, "learning_rate": 1.3568605977322587e-05, "loss": 2.2712, "step": 417820 }, { "epoch": 0.73, "learning_rate": 1.356773403739576e-05, "loss": 2.342, "step": 417830 }, { "epoch": 0.73, "learning_rate": 1.3566862097468933e-05, "loss": 2.1214, "step": 417840 }, { "epoch": 0.73, "learning_rate": 1.3565990157542107e-05, "loss": 2.42, "step": 417850 }, { "epoch": 0.73, "learning_rate": 1.356511821761528e-05, "loss": 2.3674, "step": 417860 }, { "epoch": 0.73, "learning_rate": 1.3564246277688453e-05, "loss": 2.3021, "step": 417870 }, { "epoch": 0.73, "learning_rate": 1.3563374337761625e-05, "loss": 2.2857, "step": 417880 }, { "epoch": 0.73, "learning_rate": 1.35625023978348e-05, "loss": 2.2938, "step": 417890 }, { "epoch": 0.73, "learning_rate": 1.3561630457907972e-05, "loss": 2.372, "step": 417900 }, { "epoch": 0.73, "learning_rate": 1.3560758517981145e-05, "loss": 2.3559, "step": 417910 }, { "epoch": 0.73, "learning_rate": 1.3559886578054318e-05, "loss": 2.2885, "step": 417920 }, { "epoch": 0.73, "learning_rate": 1.3559014638127494e-05, "loss": 2.3257, "step": 417930 }, { "epoch": 0.73, "learning_rate": 1.3558142698200666e-05, "loss": 2.4316, "step": 417940 }, { "epoch": 0.73, "learning_rate": 1.3557270758273838e-05, "loss": 2.2101, "step": 417950 }, { "epoch": 0.73, "learning_rate": 1.3556398818347013e-05, "loss": 2.267, "step": 417960 }, { "epoch": 0.73, "learning_rate": 1.3555526878420185e-05, "loss": 2.2868, "step": 417970 }, { "epoch": 0.73, "learning_rate": 1.3554654938493358e-05, "loss": 2.2608, "step": 417980 }, { "epoch": 0.73, "learning_rate": 1.355378299856653e-05, "loss": 2.3093, "step": 417990 }, { "epoch": 0.73, "learning_rate": 1.3552911058639705e-05, "loss": 2.385, "step": 418000 }, { "epoch": 0.73, "learning_rate": 1.3552039118712879e-05, "loss": 2.1781, "step": 418010 }, { "epoch": 0.73, "learning_rate": 1.3551167178786051e-05, "loss": 2.3077, "step": 418020 }, { "epoch": 0.73, "learning_rate": 1.3550295238859223e-05, "loss": 2.2559, "step": 418030 }, { "epoch": 0.73, "learning_rate": 1.3549423298932398e-05, "loss": 2.2391, "step": 418040 }, { "epoch": 0.73, "learning_rate": 1.354855135900557e-05, "loss": 2.3124, "step": 418050 }, { "epoch": 0.73, "learning_rate": 1.3547679419078743e-05, "loss": 2.2327, "step": 418060 }, { "epoch": 0.73, "learning_rate": 1.3546807479151916e-05, "loss": 2.2829, "step": 418070 }, { "epoch": 0.73, "learning_rate": 1.354593553922509e-05, "loss": 2.304, "step": 418080 }, { "epoch": 0.73, "learning_rate": 1.3545063599298264e-05, "loss": 2.1539, "step": 418090 }, { "epoch": 0.73, "learning_rate": 1.3544191659371436e-05, "loss": 2.3014, "step": 418100 }, { "epoch": 0.73, "learning_rate": 1.3543319719444611e-05, "loss": 2.2661, "step": 418110 }, { "epoch": 0.73, "learning_rate": 1.3542447779517784e-05, "loss": 2.3855, "step": 418120 }, { "epoch": 0.73, "learning_rate": 1.3541575839590956e-05, "loss": 2.1942, "step": 418130 }, { "epoch": 0.73, "learning_rate": 1.3540703899664128e-05, "loss": 2.2382, "step": 418140 }, { "epoch": 0.73, "learning_rate": 1.3539831959737303e-05, "loss": 2.3085, "step": 418150 }, { "epoch": 0.73, "learning_rate": 1.3538960019810475e-05, "loss": 2.2115, "step": 418160 }, { "epoch": 0.73, "learning_rate": 1.3538088079883649e-05, "loss": 2.25, "step": 418170 }, { "epoch": 0.73, "learning_rate": 1.3537216139956821e-05, "loss": 2.3442, "step": 418180 }, { "epoch": 0.73, "learning_rate": 1.3536344200029997e-05, "loss": 2.3919, "step": 418190 }, { "epoch": 0.73, "learning_rate": 1.3535472260103169e-05, "loss": 2.286, "step": 418200 }, { "epoch": 0.73, "learning_rate": 1.353460032017634e-05, "loss": 2.2831, "step": 418210 }, { "epoch": 0.73, "learning_rate": 1.3533728380249516e-05, "loss": 2.3463, "step": 418220 }, { "epoch": 0.73, "learning_rate": 1.3532856440322688e-05, "loss": 2.2816, "step": 418230 }, { "epoch": 0.73, "learning_rate": 1.3531984500395862e-05, "loss": 2.3523, "step": 418240 }, { "epoch": 0.73, "learning_rate": 1.3531112560469034e-05, "loss": 2.3225, "step": 418250 }, { "epoch": 0.73, "learning_rate": 1.353024062054221e-05, "loss": 2.3031, "step": 418260 }, { "epoch": 0.73, "learning_rate": 1.3529368680615382e-05, "loss": 2.3694, "step": 418270 }, { "epoch": 0.73, "learning_rate": 1.3528496740688554e-05, "loss": 2.2337, "step": 418280 }, { "epoch": 0.73, "learning_rate": 1.3527624800761726e-05, "loss": 2.3211, "step": 418290 }, { "epoch": 0.73, "learning_rate": 1.3526752860834901e-05, "loss": 2.2969, "step": 418300 }, { "epoch": 0.73, "learning_rate": 1.3525880920908073e-05, "loss": 2.2001, "step": 418310 }, { "epoch": 0.73, "learning_rate": 1.3525008980981247e-05, "loss": 2.3489, "step": 418320 }, { "epoch": 0.73, "learning_rate": 1.352413704105442e-05, "loss": 2.2031, "step": 418330 }, { "epoch": 0.73, "learning_rate": 1.3523265101127595e-05, "loss": 2.2642, "step": 418340 }, { "epoch": 0.73, "learning_rate": 1.3522393161200767e-05, "loss": 2.3519, "step": 418350 }, { "epoch": 0.73, "learning_rate": 1.3521521221273939e-05, "loss": 2.3785, "step": 418360 }, { "epoch": 0.73, "learning_rate": 1.3520649281347114e-05, "loss": 2.2885, "step": 418370 }, { "epoch": 0.73, "learning_rate": 1.3519777341420286e-05, "loss": 2.3186, "step": 418380 }, { "epoch": 0.73, "learning_rate": 1.3518905401493458e-05, "loss": 2.317, "step": 418390 }, { "epoch": 0.73, "learning_rate": 1.3518033461566632e-05, "loss": 2.3424, "step": 418400 }, { "epoch": 0.73, "learning_rate": 1.3517161521639806e-05, "loss": 2.2718, "step": 418410 }, { "epoch": 0.73, "learning_rate": 1.351628958171298e-05, "loss": 2.3517, "step": 418420 }, { "epoch": 0.73, "learning_rate": 1.3515417641786152e-05, "loss": 2.3412, "step": 418430 }, { "epoch": 0.73, "learning_rate": 1.3514545701859324e-05, "loss": 2.2488, "step": 418440 }, { "epoch": 0.73, "learning_rate": 1.35136737619325e-05, "loss": 2.2626, "step": 418450 }, { "epoch": 0.73, "learning_rate": 1.3512801822005671e-05, "loss": 2.3271, "step": 418460 }, { "epoch": 0.73, "learning_rate": 1.3511929882078843e-05, "loss": 2.3205, "step": 418470 }, { "epoch": 0.73, "learning_rate": 1.3511057942152019e-05, "loss": 2.2643, "step": 418480 }, { "epoch": 0.73, "learning_rate": 1.3510186002225193e-05, "loss": 2.4347, "step": 418490 }, { "epoch": 0.73, "learning_rate": 1.3509314062298365e-05, "loss": 2.3743, "step": 418500 }, { "epoch": 0.73, "learning_rate": 1.3508442122371537e-05, "loss": 2.3112, "step": 418510 }, { "epoch": 0.73, "learning_rate": 1.3507570182444712e-05, "loss": 2.3003, "step": 418520 }, { "epoch": 0.73, "learning_rate": 1.3506698242517884e-05, "loss": 2.2942, "step": 418530 }, { "epoch": 0.73, "learning_rate": 1.3505826302591056e-05, "loss": 2.1884, "step": 418540 }, { "epoch": 0.73, "learning_rate": 1.350495436266423e-05, "loss": 2.3018, "step": 418550 }, { "epoch": 0.73, "learning_rate": 1.3504082422737404e-05, "loss": 2.3428, "step": 418560 }, { "epoch": 0.73, "learning_rate": 1.3503210482810578e-05, "loss": 2.2792, "step": 418570 }, { "epoch": 0.73, "learning_rate": 1.350233854288375e-05, "loss": 2.2512, "step": 418580 }, { "epoch": 0.73, "learning_rate": 1.3501466602956922e-05, "loss": 2.3593, "step": 418590 }, { "epoch": 0.73, "learning_rate": 1.3500594663030097e-05, "loss": 2.3193, "step": 418600 }, { "epoch": 0.73, "learning_rate": 1.349972272310327e-05, "loss": 2.2961, "step": 418610 }, { "epoch": 0.73, "learning_rate": 1.3498850783176442e-05, "loss": 2.3159, "step": 418620 }, { "epoch": 0.73, "learning_rate": 1.3497978843249617e-05, "loss": 2.301, "step": 418630 }, { "epoch": 0.73, "learning_rate": 1.3497106903322789e-05, "loss": 2.2751, "step": 418640 }, { "epoch": 0.73, "learning_rate": 1.3496234963395963e-05, "loss": 2.3962, "step": 418650 }, { "epoch": 0.73, "learning_rate": 1.3495363023469135e-05, "loss": 2.1987, "step": 418660 }, { "epoch": 0.73, "learning_rate": 1.349449108354231e-05, "loss": 2.3869, "step": 418670 }, { "epoch": 0.73, "learning_rate": 1.3493619143615482e-05, "loss": 2.5269, "step": 418680 }, { "epoch": 0.73, "learning_rate": 1.3492747203688655e-05, "loss": 2.2525, "step": 418690 }, { "epoch": 0.73, "learning_rate": 1.3491875263761827e-05, "loss": 2.3175, "step": 418700 }, { "epoch": 0.73, "learning_rate": 1.3491003323835002e-05, "loss": 2.2034, "step": 418710 }, { "epoch": 0.73, "learning_rate": 1.3490131383908174e-05, "loss": 2.2852, "step": 418720 }, { "epoch": 0.73, "learning_rate": 1.3489259443981348e-05, "loss": 2.3553, "step": 418730 }, { "epoch": 0.73, "learning_rate": 1.3488387504054523e-05, "loss": 2.2309, "step": 418740 }, { "epoch": 0.73, "learning_rate": 1.3487515564127695e-05, "loss": 2.3706, "step": 418750 }, { "epoch": 0.73, "learning_rate": 1.3486643624200868e-05, "loss": 2.238, "step": 418760 }, { "epoch": 0.73, "learning_rate": 1.348577168427404e-05, "loss": 2.298, "step": 418770 }, { "epoch": 0.73, "learning_rate": 1.3484899744347215e-05, "loss": 2.1199, "step": 418780 }, { "epoch": 0.73, "learning_rate": 1.3484027804420387e-05, "loss": 2.2998, "step": 418790 }, { "epoch": 0.73, "learning_rate": 1.3483155864493561e-05, "loss": 2.3394, "step": 418800 }, { "epoch": 0.73, "learning_rate": 1.3482283924566733e-05, "loss": 2.1951, "step": 418810 }, { "epoch": 0.73, "learning_rate": 1.3481411984639908e-05, "loss": 2.277, "step": 418820 }, { "epoch": 0.73, "learning_rate": 1.348054004471308e-05, "loss": 2.3071, "step": 418830 }, { "epoch": 0.73, "learning_rate": 1.3479668104786253e-05, "loss": 2.3567, "step": 418840 }, { "epoch": 0.73, "learning_rate": 1.3478796164859425e-05, "loss": 2.3295, "step": 418850 }, { "epoch": 0.73, "learning_rate": 1.34779242249326e-05, "loss": 2.3164, "step": 418860 }, { "epoch": 0.73, "learning_rate": 1.3477052285005772e-05, "loss": 2.314, "step": 418870 }, { "epoch": 0.73, "learning_rate": 1.3476180345078946e-05, "loss": 2.3359, "step": 418880 }, { "epoch": 0.73, "learning_rate": 1.347530840515212e-05, "loss": 2.2242, "step": 418890 }, { "epoch": 0.73, "learning_rate": 1.3474436465225294e-05, "loss": 2.4067, "step": 418900 }, { "epoch": 0.73, "learning_rate": 1.3473564525298466e-05, "loss": 2.2243, "step": 418910 }, { "epoch": 0.73, "learning_rate": 1.3472692585371638e-05, "loss": 2.3696, "step": 418920 }, { "epoch": 0.73, "learning_rate": 1.3471820645444813e-05, "loss": 2.2341, "step": 418930 }, { "epoch": 0.73, "learning_rate": 1.3470948705517985e-05, "loss": 2.2334, "step": 418940 }, { "epoch": 0.73, "learning_rate": 1.3470076765591157e-05, "loss": 2.3161, "step": 418950 }, { "epoch": 0.73, "learning_rate": 1.3469204825664331e-05, "loss": 2.2967, "step": 418960 }, { "epoch": 0.73, "learning_rate": 1.3468332885737507e-05, "loss": 2.2895, "step": 418970 }, { "epoch": 0.73, "learning_rate": 1.3467460945810679e-05, "loss": 2.2899, "step": 418980 }, { "epoch": 0.73, "learning_rate": 1.346658900588385e-05, "loss": 2.4693, "step": 418990 }, { "epoch": 0.73, "learning_rate": 1.3465717065957023e-05, "loss": 2.2732, "step": 419000 }, { "epoch": 0.73, "learning_rate": 1.3464845126030198e-05, "loss": 2.3354, "step": 419010 }, { "epoch": 0.73, "learning_rate": 1.346397318610337e-05, "loss": 2.2988, "step": 419020 }, { "epoch": 0.73, "learning_rate": 1.3463101246176542e-05, "loss": 2.2794, "step": 419030 }, { "epoch": 0.73, "learning_rate": 1.3462229306249718e-05, "loss": 2.2539, "step": 419040 }, { "epoch": 0.73, "learning_rate": 1.3461357366322892e-05, "loss": 2.2423, "step": 419050 }, { "epoch": 0.73, "learning_rate": 1.3460485426396064e-05, "loss": 2.4104, "step": 419060 }, { "epoch": 0.73, "learning_rate": 1.3459613486469236e-05, "loss": 2.4023, "step": 419070 }, { "epoch": 0.73, "learning_rate": 1.3458741546542411e-05, "loss": 2.2893, "step": 419080 }, { "epoch": 0.73, "learning_rate": 1.3457869606615583e-05, "loss": 2.2153, "step": 419090 }, { "epoch": 0.73, "learning_rate": 1.3456997666688755e-05, "loss": 2.3248, "step": 419100 }, { "epoch": 0.73, "learning_rate": 1.345612572676193e-05, "loss": 2.2657, "step": 419110 }, { "epoch": 0.73, "learning_rate": 1.3455253786835103e-05, "loss": 2.3943, "step": 419120 }, { "epoch": 0.73, "learning_rate": 1.3454381846908277e-05, "loss": 2.2825, "step": 419130 }, { "epoch": 0.73, "learning_rate": 1.3453509906981449e-05, "loss": 2.2875, "step": 419140 }, { "epoch": 0.73, "learning_rate": 1.3452637967054624e-05, "loss": 2.2919, "step": 419150 }, { "epoch": 0.73, "learning_rate": 1.3451766027127796e-05, "loss": 2.3901, "step": 419160 }, { "epoch": 0.73, "learning_rate": 1.3450894087200968e-05, "loss": 2.4297, "step": 419170 }, { "epoch": 0.73, "learning_rate": 1.345002214727414e-05, "loss": 2.3257, "step": 419180 }, { "epoch": 0.73, "learning_rate": 1.3449150207347316e-05, "loss": 2.2771, "step": 419190 }, { "epoch": 0.73, "learning_rate": 1.3448278267420488e-05, "loss": 2.2397, "step": 419200 }, { "epoch": 0.73, "learning_rate": 1.3447406327493662e-05, "loss": 2.318, "step": 419210 }, { "epoch": 0.73, "learning_rate": 1.3446534387566834e-05, "loss": 2.3274, "step": 419220 }, { "epoch": 0.73, "learning_rate": 1.344566244764001e-05, "loss": 2.3646, "step": 419230 }, { "epoch": 0.73, "learning_rate": 1.3444790507713181e-05, "loss": 2.2777, "step": 419240 }, { "epoch": 0.73, "learning_rate": 1.3443918567786353e-05, "loss": 2.216, "step": 419250 }, { "epoch": 0.73, "learning_rate": 1.3443046627859526e-05, "loss": 2.2637, "step": 419260 }, { "epoch": 0.73, "learning_rate": 1.3442174687932701e-05, "loss": 2.312, "step": 419270 }, { "epoch": 0.73, "learning_rate": 1.3441302748005875e-05, "loss": 2.2541, "step": 419280 }, { "epoch": 0.73, "learning_rate": 1.3440430808079047e-05, "loss": 2.2653, "step": 419290 }, { "epoch": 0.73, "learning_rate": 1.3439558868152222e-05, "loss": 2.3765, "step": 419300 }, { "epoch": 0.73, "learning_rate": 1.3438686928225394e-05, "loss": 2.3301, "step": 419310 }, { "epoch": 0.73, "learning_rate": 1.3437814988298566e-05, "loss": 2.3232, "step": 419320 }, { "epoch": 0.73, "learning_rate": 1.3436943048371739e-05, "loss": 2.2866, "step": 419330 }, { "epoch": 0.73, "learning_rate": 1.3436071108444914e-05, "loss": 2.2342, "step": 419340 }, { "epoch": 0.73, "learning_rate": 1.3435199168518086e-05, "loss": 2.2373, "step": 419350 }, { "epoch": 0.73, "learning_rate": 1.343432722859126e-05, "loss": 2.1894, "step": 419360 }, { "epoch": 0.73, "learning_rate": 1.3433455288664432e-05, "loss": 2.304, "step": 419370 }, { "epoch": 0.73, "learning_rate": 1.3432583348737607e-05, "loss": 2.2607, "step": 419380 }, { "epoch": 0.73, "learning_rate": 1.343171140881078e-05, "loss": 2.4156, "step": 419390 }, { "epoch": 0.73, "learning_rate": 1.3430839468883952e-05, "loss": 2.3406, "step": 419400 }, { "epoch": 0.73, "learning_rate": 1.3429967528957127e-05, "loss": 2.1864, "step": 419410 }, { "epoch": 0.73, "learning_rate": 1.3429095589030299e-05, "loss": 2.32, "step": 419420 }, { "epoch": 0.73, "learning_rate": 1.3428223649103471e-05, "loss": 2.3745, "step": 419430 }, { "epoch": 0.73, "learning_rate": 1.3427351709176645e-05, "loss": 2.4009, "step": 419440 }, { "epoch": 0.73, "learning_rate": 1.3426479769249819e-05, "loss": 2.3478, "step": 419450 }, { "epoch": 0.73, "learning_rate": 1.3425607829322992e-05, "loss": 2.4416, "step": 419460 }, { "epoch": 0.73, "learning_rate": 1.3424735889396165e-05, "loss": 2.2345, "step": 419470 }, { "epoch": 0.73, "learning_rate": 1.3423863949469337e-05, "loss": 2.2333, "step": 419480 }, { "epoch": 0.73, "learning_rate": 1.3422992009542512e-05, "loss": 2.2059, "step": 419490 }, { "epoch": 0.73, "learning_rate": 1.3422120069615684e-05, "loss": 2.3351, "step": 419500 }, { "epoch": 0.73, "learning_rate": 1.3421248129688856e-05, "loss": 2.3632, "step": 419510 }, { "epoch": 0.73, "learning_rate": 1.342037618976203e-05, "loss": 2.4774, "step": 419520 }, { "epoch": 0.73, "learning_rate": 1.3419504249835205e-05, "loss": 2.3384, "step": 419530 }, { "epoch": 0.73, "learning_rate": 1.3418632309908378e-05, "loss": 2.3412, "step": 419540 }, { "epoch": 0.73, "learning_rate": 1.341776036998155e-05, "loss": 2.3627, "step": 419550 }, { "epoch": 0.73, "learning_rate": 1.3416888430054725e-05, "loss": 2.2951, "step": 419560 }, { "epoch": 0.73, "learning_rate": 1.3416016490127897e-05, "loss": 2.3522, "step": 419570 }, { "epoch": 0.73, "learning_rate": 1.341514455020107e-05, "loss": 2.318, "step": 419580 }, { "epoch": 0.73, "learning_rate": 1.3414272610274243e-05, "loss": 2.341, "step": 419590 }, { "epoch": 0.73, "learning_rate": 1.3413400670347417e-05, "loss": 2.3369, "step": 419600 }, { "epoch": 0.73, "learning_rate": 1.341252873042059e-05, "loss": 2.3403, "step": 419610 }, { "epoch": 0.73, "learning_rate": 1.3411656790493763e-05, "loss": 2.2692, "step": 419620 }, { "epoch": 0.73, "learning_rate": 1.3410784850566935e-05, "loss": 2.3267, "step": 419630 }, { "epoch": 0.73, "learning_rate": 1.340991291064011e-05, "loss": 2.3309, "step": 419640 }, { "epoch": 0.73, "learning_rate": 1.3409040970713282e-05, "loss": 2.2546, "step": 419650 }, { "epoch": 0.73, "learning_rate": 1.3408169030786454e-05, "loss": 2.4044, "step": 419660 }, { "epoch": 0.73, "learning_rate": 1.340729709085963e-05, "loss": 2.3011, "step": 419670 }, { "epoch": 0.73, "learning_rate": 1.3406425150932802e-05, "loss": 2.2142, "step": 419680 }, { "epoch": 0.73, "learning_rate": 1.3405553211005976e-05, "loss": 2.3042, "step": 419690 }, { "epoch": 0.73, "learning_rate": 1.3404681271079148e-05, "loss": 2.2825, "step": 419700 }, { "epoch": 0.73, "learning_rate": 1.3403809331152323e-05, "loss": 2.2919, "step": 419710 }, { "epoch": 0.73, "learning_rate": 1.3402937391225495e-05, "loss": 2.2368, "step": 419720 }, { "epoch": 0.73, "learning_rate": 1.3402065451298667e-05, "loss": 2.2282, "step": 419730 }, { "epoch": 0.73, "learning_rate": 1.340119351137184e-05, "loss": 2.1846, "step": 419740 }, { "epoch": 0.73, "learning_rate": 1.3400321571445015e-05, "loss": 2.3716, "step": 419750 }, { "epoch": 0.73, "learning_rate": 1.3399449631518187e-05, "loss": 2.419, "step": 419760 }, { "epoch": 0.73, "learning_rate": 1.339857769159136e-05, "loss": 2.327, "step": 419770 }, { "epoch": 0.73, "learning_rate": 1.3397705751664533e-05, "loss": 2.257, "step": 419780 }, { "epoch": 0.73, "learning_rate": 1.3396833811737708e-05, "loss": 2.3252, "step": 419790 }, { "epoch": 0.73, "learning_rate": 1.339596187181088e-05, "loss": 2.3032, "step": 419800 }, { "epoch": 0.73, "learning_rate": 1.3395089931884052e-05, "loss": 2.3351, "step": 419810 }, { "epoch": 0.73, "learning_rate": 1.3394217991957228e-05, "loss": 2.2626, "step": 419820 }, { "epoch": 0.73, "learning_rate": 1.33933460520304e-05, "loss": 2.3233, "step": 419830 }, { "epoch": 0.73, "learning_rate": 1.3392474112103574e-05, "loss": 2.3005, "step": 419840 }, { "epoch": 0.73, "learning_rate": 1.3391602172176746e-05, "loss": 2.2732, "step": 419850 }, { "epoch": 0.73, "learning_rate": 1.3390730232249921e-05, "loss": 2.3799, "step": 419860 }, { "epoch": 0.73, "learning_rate": 1.3389858292323093e-05, "loss": 2.302, "step": 419870 }, { "epoch": 0.73, "learning_rate": 1.3388986352396265e-05, "loss": 2.2836, "step": 419880 }, { "epoch": 0.73, "learning_rate": 1.3388114412469437e-05, "loss": 2.3709, "step": 419890 }, { "epoch": 0.73, "learning_rate": 1.3387242472542613e-05, "loss": 2.2988, "step": 419900 }, { "epoch": 0.73, "learning_rate": 1.3386370532615785e-05, "loss": 2.3428, "step": 419910 }, { "epoch": 0.73, "learning_rate": 1.3385498592688959e-05, "loss": 2.2796, "step": 419920 }, { "epoch": 0.73, "learning_rate": 1.3384626652762131e-05, "loss": 2.2488, "step": 419930 }, { "epoch": 0.73, "learning_rate": 1.3383754712835306e-05, "loss": 2.369, "step": 419940 }, { "epoch": 0.73, "learning_rate": 1.3382882772908478e-05, "loss": 2.3355, "step": 419950 }, { "epoch": 0.73, "learning_rate": 1.338201083298165e-05, "loss": 2.3078, "step": 419960 }, { "epoch": 0.73, "learning_rate": 1.3381138893054826e-05, "loss": 2.3567, "step": 419970 }, { "epoch": 0.73, "learning_rate": 1.3380266953127998e-05, "loss": 2.3313, "step": 419980 }, { "epoch": 0.73, "learning_rate": 1.337939501320117e-05, "loss": 2.2741, "step": 419990 }, { "epoch": 0.73, "learning_rate": 1.3378523073274344e-05, "loss": 2.1983, "step": 420000 }, { "epoch": 0.73, "learning_rate": 1.337765113334752e-05, "loss": 2.3719, "step": 420010 }, { "epoch": 0.73, "learning_rate": 1.3376779193420691e-05, "loss": 2.2092, "step": 420020 }, { "epoch": 0.73, "learning_rate": 1.3375907253493863e-05, "loss": 2.3106, "step": 420030 }, { "epoch": 0.73, "learning_rate": 1.3375035313567036e-05, "loss": 2.209, "step": 420040 }, { "epoch": 0.73, "learning_rate": 1.3374163373640211e-05, "loss": 2.2517, "step": 420050 }, { "epoch": 0.73, "learning_rate": 1.3373291433713383e-05, "loss": 2.3326, "step": 420060 }, { "epoch": 0.73, "learning_rate": 1.3372419493786555e-05, "loss": 2.3495, "step": 420070 }, { "epoch": 0.73, "learning_rate": 1.337154755385973e-05, "loss": 2.3323, "step": 420080 }, { "epoch": 0.73, "learning_rate": 1.3370675613932904e-05, "loss": 2.3206, "step": 420090 }, { "epoch": 0.73, "learning_rate": 1.3369803674006076e-05, "loss": 2.3255, "step": 420100 }, { "epoch": 0.73, "learning_rate": 1.3368931734079249e-05, "loss": 2.3134, "step": 420110 }, { "epoch": 0.73, "learning_rate": 1.3368059794152424e-05, "loss": 2.2942, "step": 420120 }, { "epoch": 0.73, "learning_rate": 1.3367187854225596e-05, "loss": 2.2401, "step": 420130 }, { "epoch": 0.73, "learning_rate": 1.3366315914298768e-05, "loss": 2.1778, "step": 420140 }, { "epoch": 0.73, "learning_rate": 1.3365443974371942e-05, "loss": 2.3361, "step": 420150 }, { "epoch": 0.73, "learning_rate": 1.3364572034445116e-05, "loss": 2.2803, "step": 420160 }, { "epoch": 0.73, "learning_rate": 1.336370009451829e-05, "loss": 2.3977, "step": 420170 }, { "epoch": 0.73, "learning_rate": 1.3362828154591462e-05, "loss": 2.3316, "step": 420180 }, { "epoch": 0.73, "learning_rate": 1.3361956214664634e-05, "loss": 2.269, "step": 420190 }, { "epoch": 0.73, "learning_rate": 1.3361084274737809e-05, "loss": 2.258, "step": 420200 }, { "epoch": 0.73, "learning_rate": 1.3360212334810981e-05, "loss": 2.2815, "step": 420210 }, { "epoch": 0.73, "learning_rate": 1.3359340394884153e-05, "loss": 2.2818, "step": 420220 }, { "epoch": 0.73, "learning_rate": 1.3358468454957329e-05, "loss": 2.354, "step": 420230 }, { "epoch": 0.73, "learning_rate": 1.33575965150305e-05, "loss": 2.3283, "step": 420240 }, { "epoch": 0.73, "learning_rate": 1.3356724575103675e-05, "loss": 2.334, "step": 420250 }, { "epoch": 0.73, "learning_rate": 1.3355852635176847e-05, "loss": 2.2664, "step": 420260 }, { "epoch": 0.73, "learning_rate": 1.3354980695250022e-05, "loss": 2.3265, "step": 420270 }, { "epoch": 0.73, "learning_rate": 1.3354108755323194e-05, "loss": 2.292, "step": 420280 }, { "epoch": 0.73, "learning_rate": 1.3353236815396366e-05, "loss": 2.2486, "step": 420290 }, { "epoch": 0.73, "learning_rate": 1.3352364875469538e-05, "loss": 2.2262, "step": 420300 }, { "epoch": 0.73, "learning_rate": 1.3351492935542714e-05, "loss": 2.2857, "step": 420310 }, { "epoch": 0.73, "learning_rate": 1.3350620995615888e-05, "loss": 2.2857, "step": 420320 }, { "epoch": 0.73, "learning_rate": 1.334974905568906e-05, "loss": 2.2519, "step": 420330 }, { "epoch": 0.73, "learning_rate": 1.3348877115762235e-05, "loss": 2.3539, "step": 420340 }, { "epoch": 0.73, "learning_rate": 1.3348005175835407e-05, "loss": 2.3118, "step": 420350 }, { "epoch": 0.73, "learning_rate": 1.334713323590858e-05, "loss": 2.3123, "step": 420360 }, { "epoch": 0.73, "learning_rate": 1.3346261295981751e-05, "loss": 2.294, "step": 420370 }, { "epoch": 0.73, "learning_rate": 1.3345389356054927e-05, "loss": 2.3204, "step": 420380 }, { "epoch": 0.73, "learning_rate": 1.3344517416128099e-05, "loss": 2.3168, "step": 420390 }, { "epoch": 0.73, "learning_rate": 1.3343645476201273e-05, "loss": 2.3578, "step": 420400 }, { "epoch": 0.73, "learning_rate": 1.3342773536274445e-05, "loss": 2.2471, "step": 420410 }, { "epoch": 0.73, "learning_rate": 1.334190159634762e-05, "loss": 2.2203, "step": 420420 }, { "epoch": 0.73, "learning_rate": 1.3341029656420792e-05, "loss": 2.3289, "step": 420430 }, { "epoch": 0.73, "learning_rate": 1.3340157716493964e-05, "loss": 2.408, "step": 420440 }, { "epoch": 0.73, "learning_rate": 1.3339285776567136e-05, "loss": 2.2996, "step": 420450 }, { "epoch": 0.73, "learning_rate": 1.3338413836640312e-05, "loss": 2.19, "step": 420460 }, { "epoch": 0.73, "learning_rate": 1.3337541896713484e-05, "loss": 2.2586, "step": 420470 }, { "epoch": 0.73, "learning_rate": 1.3336669956786658e-05, "loss": 2.2825, "step": 420480 }, { "epoch": 0.73, "learning_rate": 1.3335798016859831e-05, "loss": 2.2668, "step": 420490 }, { "epoch": 0.73, "learning_rate": 1.3334926076933005e-05, "loss": 2.1933, "step": 420500 }, { "epoch": 0.73, "learning_rate": 1.3334054137006177e-05, "loss": 2.2524, "step": 420510 }, { "epoch": 0.73, "learning_rate": 1.333318219707935e-05, "loss": 2.3034, "step": 420520 }, { "epoch": 0.73, "learning_rate": 1.3332310257152525e-05, "loss": 2.3051, "step": 420530 }, { "epoch": 0.73, "learning_rate": 1.3331438317225697e-05, "loss": 2.3938, "step": 420540 }, { "epoch": 0.73, "learning_rate": 1.3330566377298869e-05, "loss": 2.3587, "step": 420550 }, { "epoch": 0.73, "learning_rate": 1.3329694437372043e-05, "loss": 2.2774, "step": 420560 }, { "epoch": 0.73, "learning_rate": 1.3328822497445218e-05, "loss": 2.3643, "step": 420570 }, { "epoch": 0.73, "learning_rate": 1.332795055751839e-05, "loss": 2.4041, "step": 420580 }, { "epoch": 0.73, "learning_rate": 1.3327078617591562e-05, "loss": 2.2453, "step": 420590 }, { "epoch": 0.73, "learning_rate": 1.3326206677664738e-05, "loss": 2.3723, "step": 420600 }, { "epoch": 0.73, "learning_rate": 1.332533473773791e-05, "loss": 2.2709, "step": 420610 }, { "epoch": 0.73, "learning_rate": 1.3324462797811082e-05, "loss": 2.2045, "step": 420620 }, { "epoch": 0.73, "learning_rate": 1.3323590857884256e-05, "loss": 2.3138, "step": 420630 }, { "epoch": 0.73, "learning_rate": 1.332271891795743e-05, "loss": 2.2719, "step": 420640 }, { "epoch": 0.73, "learning_rate": 1.3321846978030603e-05, "loss": 2.2564, "step": 420650 }, { "epoch": 0.73, "learning_rate": 1.3320975038103775e-05, "loss": 2.2643, "step": 420660 }, { "epoch": 0.73, "learning_rate": 1.3320103098176947e-05, "loss": 2.3099, "step": 420670 }, { "epoch": 0.73, "learning_rate": 1.3319231158250123e-05, "loss": 2.3017, "step": 420680 }, { "epoch": 0.73, "learning_rate": 1.3318359218323295e-05, "loss": 2.2662, "step": 420690 }, { "epoch": 0.73, "learning_rate": 1.3317487278396467e-05, "loss": 2.3207, "step": 420700 }, { "epoch": 0.73, "learning_rate": 1.3316615338469641e-05, "loss": 2.3639, "step": 420710 }, { "epoch": 0.73, "learning_rate": 1.3315743398542815e-05, "loss": 2.274, "step": 420720 }, { "epoch": 0.73, "learning_rate": 1.3314871458615988e-05, "loss": 2.3666, "step": 420730 }, { "epoch": 0.73, "learning_rate": 1.331399951868916e-05, "loss": 2.3078, "step": 420740 }, { "epoch": 0.73, "learning_rate": 1.3313127578762336e-05, "loss": 2.2575, "step": 420750 }, { "epoch": 0.73, "learning_rate": 1.3312255638835508e-05, "loss": 2.3083, "step": 420760 }, { "epoch": 0.73, "learning_rate": 1.331138369890868e-05, "loss": 2.3179, "step": 420770 }, { "epoch": 0.73, "learning_rate": 1.3310511758981852e-05, "loss": 2.2606, "step": 420780 }, { "epoch": 0.73, "learning_rate": 1.3309639819055028e-05, "loss": 2.2789, "step": 420790 }, { "epoch": 0.73, "learning_rate": 1.33087678791282e-05, "loss": 2.3664, "step": 420800 }, { "epoch": 0.73, "learning_rate": 1.3307895939201373e-05, "loss": 2.3067, "step": 420810 }, { "epoch": 0.73, "learning_rate": 1.3307023999274546e-05, "loss": 2.3043, "step": 420820 }, { "epoch": 0.73, "learning_rate": 1.3306152059347721e-05, "loss": 2.4116, "step": 420830 }, { "epoch": 0.73, "learning_rate": 1.3305280119420893e-05, "loss": 2.424, "step": 420840 }, { "epoch": 0.73, "learning_rate": 1.3304408179494065e-05, "loss": 2.2678, "step": 420850 }, { "epoch": 0.73, "learning_rate": 1.3303536239567237e-05, "loss": 2.3222, "step": 420860 }, { "epoch": 0.73, "learning_rate": 1.3302664299640413e-05, "loss": 2.3846, "step": 420870 }, { "epoch": 0.73, "learning_rate": 1.3301792359713586e-05, "loss": 2.2511, "step": 420880 }, { "epoch": 0.73, "learning_rate": 1.3300920419786759e-05, "loss": 2.3339, "step": 420890 }, { "epoch": 0.73, "learning_rate": 1.3300048479859934e-05, "loss": 2.3908, "step": 420900 }, { "epoch": 0.73, "learning_rate": 1.3299176539933106e-05, "loss": 2.2713, "step": 420910 }, { "epoch": 0.73, "learning_rate": 1.3298304600006278e-05, "loss": 2.1764, "step": 420920 }, { "epoch": 0.73, "learning_rate": 1.329743266007945e-05, "loss": 2.3631, "step": 420930 }, { "epoch": 0.73, "learning_rate": 1.3296560720152626e-05, "loss": 2.1162, "step": 420940 }, { "epoch": 0.73, "learning_rate": 1.3295688780225798e-05, "loss": 2.2668, "step": 420950 }, { "epoch": 0.73, "learning_rate": 1.3294816840298972e-05, "loss": 2.1941, "step": 420960 }, { "epoch": 0.73, "learning_rate": 1.3293944900372144e-05, "loss": 2.2673, "step": 420970 }, { "epoch": 0.73, "learning_rate": 1.3293072960445319e-05, "loss": 2.3067, "step": 420980 }, { "epoch": 0.73, "learning_rate": 1.3292201020518491e-05, "loss": 2.1884, "step": 420990 }, { "epoch": 0.73, "learning_rate": 1.3291329080591663e-05, "loss": 2.364, "step": 421000 }, { "epoch": 0.73, "learning_rate": 1.3290457140664839e-05, "loss": 2.2583, "step": 421010 }, { "epoch": 0.73, "learning_rate": 1.328958520073801e-05, "loss": 2.3157, "step": 421020 }, { "epoch": 0.73, "learning_rate": 1.3288713260811183e-05, "loss": 2.2997, "step": 421030 }, { "epoch": 0.73, "learning_rate": 1.3287841320884357e-05, "loss": 2.1537, "step": 421040 }, { "epoch": 0.73, "learning_rate": 1.3286969380957532e-05, "loss": 2.3772, "step": 421050 }, { "epoch": 0.73, "learning_rate": 1.3286097441030704e-05, "loss": 2.4154, "step": 421060 }, { "epoch": 0.73, "learning_rate": 1.3285225501103876e-05, "loss": 2.2937, "step": 421070 }, { "epoch": 0.73, "learning_rate": 1.3284353561177048e-05, "loss": 2.2822, "step": 421080 }, { "epoch": 0.73, "learning_rate": 1.3283481621250224e-05, "loss": 2.3942, "step": 421090 }, { "epoch": 0.73, "learning_rate": 1.3282609681323396e-05, "loss": 2.2964, "step": 421100 }, { "epoch": 0.73, "learning_rate": 1.3281737741396568e-05, "loss": 2.2444, "step": 421110 }, { "epoch": 0.73, "learning_rate": 1.3280865801469742e-05, "loss": 2.2997, "step": 421120 }, { "epoch": 0.73, "learning_rate": 1.3279993861542917e-05, "loss": 2.308, "step": 421130 }, { "epoch": 0.73, "learning_rate": 1.327912192161609e-05, "loss": 2.2362, "step": 421140 }, { "epoch": 0.73, "learning_rate": 1.3278249981689261e-05, "loss": 2.2838, "step": 421150 }, { "epoch": 0.73, "learning_rate": 1.3277378041762437e-05, "loss": 2.2861, "step": 421160 }, { "epoch": 0.73, "learning_rate": 1.3276506101835609e-05, "loss": 2.295, "step": 421170 }, { "epoch": 0.73, "learning_rate": 1.3275634161908781e-05, "loss": 2.3885, "step": 421180 }, { "epoch": 0.73, "learning_rate": 1.3274762221981955e-05, "loss": 2.3695, "step": 421190 }, { "epoch": 0.73, "learning_rate": 1.3273890282055128e-05, "loss": 2.1641, "step": 421200 }, { "epoch": 0.73, "learning_rate": 1.3273018342128302e-05, "loss": 2.255, "step": 421210 }, { "epoch": 0.73, "learning_rate": 1.3272146402201474e-05, "loss": 2.2954, "step": 421220 }, { "epoch": 0.73, "learning_rate": 1.3271274462274646e-05, "loss": 2.3818, "step": 421230 }, { "epoch": 0.73, "learning_rate": 1.3270402522347822e-05, "loss": 2.3168, "step": 421240 }, { "epoch": 0.73, "learning_rate": 1.3269530582420994e-05, "loss": 2.3023, "step": 421250 }, { "epoch": 0.73, "learning_rate": 1.3268658642494166e-05, "loss": 2.3412, "step": 421260 }, { "epoch": 0.73, "learning_rate": 1.3267786702567341e-05, "loss": 2.2924, "step": 421270 }, { "epoch": 0.73, "learning_rate": 1.3266914762640514e-05, "loss": 2.2213, "step": 421280 }, { "epoch": 0.73, "learning_rate": 1.3266042822713687e-05, "loss": 2.3757, "step": 421290 }, { "epoch": 0.73, "learning_rate": 1.326517088278686e-05, "loss": 2.348, "step": 421300 }, { "epoch": 0.73, "learning_rate": 1.3264298942860035e-05, "loss": 2.3966, "step": 421310 }, { "epoch": 0.73, "learning_rate": 1.3263427002933207e-05, "loss": 2.3589, "step": 421320 }, { "epoch": 0.73, "learning_rate": 1.3262555063006379e-05, "loss": 2.2015, "step": 421330 }, { "epoch": 0.73, "learning_rate": 1.3261683123079551e-05, "loss": 2.392, "step": 421340 }, { "epoch": 0.73, "learning_rate": 1.3260811183152727e-05, "loss": 2.2767, "step": 421350 }, { "epoch": 0.73, "learning_rate": 1.32599392432259e-05, "loss": 2.2801, "step": 421360 }, { "epoch": 0.73, "learning_rate": 1.3259067303299072e-05, "loss": 2.3068, "step": 421370 }, { "epoch": 0.73, "learning_rate": 1.3258195363372244e-05, "loss": 2.2075, "step": 421380 }, { "epoch": 0.73, "learning_rate": 1.325732342344542e-05, "loss": 2.1862, "step": 421390 }, { "epoch": 0.73, "learning_rate": 1.3256451483518592e-05, "loss": 2.316, "step": 421400 }, { "epoch": 0.73, "learning_rate": 1.3255579543591764e-05, "loss": 2.1855, "step": 421410 }, { "epoch": 0.73, "learning_rate": 1.325470760366494e-05, "loss": 2.2711, "step": 421420 }, { "epoch": 0.73, "learning_rate": 1.3253835663738112e-05, "loss": 2.3044, "step": 421430 }, { "epoch": 0.73, "learning_rate": 1.3252963723811285e-05, "loss": 2.3692, "step": 421440 }, { "epoch": 0.73, "learning_rate": 1.3252091783884457e-05, "loss": 2.4838, "step": 421450 }, { "epoch": 0.73, "learning_rate": 1.3251219843957633e-05, "loss": 2.2339, "step": 421460 }, { "epoch": 0.73, "learning_rate": 1.3250347904030805e-05, "loss": 2.3488, "step": 421470 }, { "epoch": 0.74, "learning_rate": 1.3249475964103977e-05, "loss": 2.2971, "step": 421480 }, { "epoch": 0.74, "learning_rate": 1.324860402417715e-05, "loss": 2.4036, "step": 421490 }, { "epoch": 0.74, "learning_rate": 1.3247732084250325e-05, "loss": 2.3149, "step": 421500 }, { "epoch": 0.74, "learning_rate": 1.3246860144323497e-05, "loss": 2.3874, "step": 421510 }, { "epoch": 0.74, "learning_rate": 1.324598820439667e-05, "loss": 2.4423, "step": 421520 }, { "epoch": 0.74, "learning_rate": 1.3245116264469844e-05, "loss": 2.1739, "step": 421530 }, { "epoch": 0.74, "learning_rate": 1.3244244324543018e-05, "loss": 2.2703, "step": 421540 }, { "epoch": 0.74, "learning_rate": 1.324337238461619e-05, "loss": 2.375, "step": 421550 }, { "epoch": 0.74, "learning_rate": 1.3242500444689362e-05, "loss": 2.4143, "step": 421560 }, { "epoch": 0.74, "learning_rate": 1.3241628504762538e-05, "loss": 2.2857, "step": 421570 }, { "epoch": 0.74, "learning_rate": 1.324075656483571e-05, "loss": 2.3682, "step": 421580 }, { "epoch": 0.74, "learning_rate": 1.3239884624908882e-05, "loss": 2.2951, "step": 421590 }, { "epoch": 0.74, "learning_rate": 1.3239012684982056e-05, "loss": 2.4426, "step": 421600 }, { "epoch": 0.74, "learning_rate": 1.3238140745055231e-05, "loss": 2.3634, "step": 421610 }, { "epoch": 0.74, "learning_rate": 1.3237268805128403e-05, "loss": 2.3668, "step": 421620 }, { "epoch": 0.74, "learning_rate": 1.3236396865201575e-05, "loss": 2.298, "step": 421630 }, { "epoch": 0.74, "learning_rate": 1.3235524925274747e-05, "loss": 2.357, "step": 421640 }, { "epoch": 0.74, "learning_rate": 1.3234652985347923e-05, "loss": 2.3762, "step": 421650 }, { "epoch": 0.74, "learning_rate": 1.3233781045421095e-05, "loss": 2.2381, "step": 421660 }, { "epoch": 0.74, "learning_rate": 1.3232909105494269e-05, "loss": 2.3573, "step": 421670 }, { "epoch": 0.74, "learning_rate": 1.3232037165567442e-05, "loss": 2.3007, "step": 421680 }, { "epoch": 0.74, "learning_rate": 1.3231165225640616e-05, "loss": 2.3537, "step": 421690 }, { "epoch": 0.74, "learning_rate": 1.3230293285713788e-05, "loss": 2.199, "step": 421700 }, { "epoch": 0.74, "learning_rate": 1.322942134578696e-05, "loss": 2.2983, "step": 421710 }, { "epoch": 0.74, "learning_rate": 1.3228549405860136e-05, "loss": 2.2604, "step": 421720 }, { "epoch": 0.74, "learning_rate": 1.3227677465933308e-05, "loss": 2.3329, "step": 421730 }, { "epoch": 0.74, "learning_rate": 1.322680552600648e-05, "loss": 2.3127, "step": 421740 }, { "epoch": 0.74, "learning_rate": 1.3225933586079654e-05, "loss": 2.2861, "step": 421750 }, { "epoch": 0.74, "learning_rate": 1.3225061646152827e-05, "loss": 2.2756, "step": 421760 }, { "epoch": 0.74, "learning_rate": 1.3224189706226001e-05, "loss": 2.2775, "step": 421770 }, { "epoch": 0.74, "learning_rate": 1.3223317766299173e-05, "loss": 2.4184, "step": 421780 }, { "epoch": 0.74, "learning_rate": 1.3222445826372345e-05, "loss": 2.1973, "step": 421790 }, { "epoch": 0.74, "learning_rate": 1.322157388644552e-05, "loss": 2.3695, "step": 421800 }, { "epoch": 0.74, "learning_rate": 1.3220701946518693e-05, "loss": 2.2757, "step": 421810 }, { "epoch": 0.74, "learning_rate": 1.3219830006591865e-05, "loss": 2.2944, "step": 421820 }, { "epoch": 0.74, "learning_rate": 1.321895806666504e-05, "loss": 2.2724, "step": 421830 }, { "epoch": 0.74, "learning_rate": 1.3218086126738212e-05, "loss": 2.2973, "step": 421840 }, { "epoch": 0.74, "learning_rate": 1.3217214186811386e-05, "loss": 2.2987, "step": 421850 }, { "epoch": 0.74, "learning_rate": 1.3216342246884558e-05, "loss": 2.3569, "step": 421860 }, { "epoch": 0.74, "learning_rate": 1.3215470306957734e-05, "loss": 2.3422, "step": 421870 }, { "epoch": 0.74, "learning_rate": 1.3214598367030906e-05, "loss": 2.2916, "step": 421880 }, { "epoch": 0.74, "learning_rate": 1.3213726427104078e-05, "loss": 2.25, "step": 421890 }, { "epoch": 0.74, "learning_rate": 1.321285448717725e-05, "loss": 2.3152, "step": 421900 }, { "epoch": 0.74, "learning_rate": 1.3211982547250425e-05, "loss": 2.3392, "step": 421910 }, { "epoch": 0.74, "learning_rate": 1.32111106073236e-05, "loss": 2.3393, "step": 421920 }, { "epoch": 0.74, "learning_rate": 1.3210238667396771e-05, "loss": 2.3616, "step": 421930 }, { "epoch": 0.74, "learning_rate": 1.3209366727469947e-05, "loss": 2.4351, "step": 421940 }, { "epoch": 0.74, "learning_rate": 1.3208494787543119e-05, "loss": 2.2922, "step": 421950 }, { "epoch": 0.74, "learning_rate": 1.3207622847616291e-05, "loss": 2.2986, "step": 421960 }, { "epoch": 0.74, "learning_rate": 1.3206750907689463e-05, "loss": 2.3535, "step": 421970 }, { "epoch": 0.74, "learning_rate": 1.3205878967762638e-05, "loss": 2.2853, "step": 421980 }, { "epoch": 0.74, "learning_rate": 1.320500702783581e-05, "loss": 2.2718, "step": 421990 }, { "epoch": 0.74, "learning_rate": 1.3204135087908984e-05, "loss": 2.3634, "step": 422000 }, { "epoch": 0.74, "learning_rate": 1.3203263147982156e-05, "loss": 2.2764, "step": 422010 }, { "epoch": 0.74, "learning_rate": 1.3202391208055332e-05, "loss": 2.3229, "step": 422020 }, { "epoch": 0.74, "learning_rate": 1.3201519268128504e-05, "loss": 2.2125, "step": 422030 }, { "epoch": 0.74, "learning_rate": 1.3200647328201676e-05, "loss": 2.3127, "step": 422040 }, { "epoch": 0.74, "learning_rate": 1.3199775388274848e-05, "loss": 2.2561, "step": 422050 }, { "epoch": 0.74, "learning_rate": 1.3198903448348024e-05, "loss": 2.301, "step": 422060 }, { "epoch": 0.74, "learning_rate": 1.3198031508421196e-05, "loss": 2.2302, "step": 422070 }, { "epoch": 0.74, "learning_rate": 1.319715956849437e-05, "loss": 2.2025, "step": 422080 }, { "epoch": 0.74, "learning_rate": 1.3196287628567545e-05, "loss": 2.3185, "step": 422090 }, { "epoch": 0.74, "learning_rate": 1.3195415688640717e-05, "loss": 2.3748, "step": 422100 }, { "epoch": 0.74, "learning_rate": 1.3194543748713889e-05, "loss": 2.3925, "step": 422110 }, { "epoch": 0.74, "learning_rate": 1.3193671808787061e-05, "loss": 2.2504, "step": 422120 }, { "epoch": 0.74, "learning_rate": 1.3192799868860237e-05, "loss": 2.4084, "step": 422130 }, { "epoch": 0.74, "learning_rate": 1.3191927928933409e-05, "loss": 2.3568, "step": 422140 }, { "epoch": 0.74, "learning_rate": 1.319105598900658e-05, "loss": 2.2569, "step": 422150 }, { "epoch": 0.74, "learning_rate": 1.3190184049079754e-05, "loss": 2.4299, "step": 422160 }, { "epoch": 0.74, "learning_rate": 1.318931210915293e-05, "loss": 2.2504, "step": 422170 }, { "epoch": 0.74, "learning_rate": 1.3188440169226102e-05, "loss": 2.3937, "step": 422180 }, { "epoch": 0.74, "learning_rate": 1.3187568229299274e-05, "loss": 2.4045, "step": 422190 }, { "epoch": 0.74, "learning_rate": 1.318669628937245e-05, "loss": 2.2578, "step": 422200 }, { "epoch": 0.74, "learning_rate": 1.3185824349445622e-05, "loss": 2.2869, "step": 422210 }, { "epoch": 0.74, "learning_rate": 1.3184952409518794e-05, "loss": 2.2881, "step": 422220 }, { "epoch": 0.74, "learning_rate": 1.3184080469591967e-05, "loss": 2.275, "step": 422230 }, { "epoch": 0.74, "learning_rate": 1.3183208529665141e-05, "loss": 2.3379, "step": 422240 }, { "epoch": 0.74, "learning_rate": 1.3182336589738315e-05, "loss": 2.2107, "step": 422250 }, { "epoch": 0.74, "learning_rate": 1.3181464649811487e-05, "loss": 2.3251, "step": 422260 }, { "epoch": 0.74, "learning_rate": 1.318059270988466e-05, "loss": 2.3077, "step": 422270 }, { "epoch": 0.74, "learning_rate": 1.3179720769957835e-05, "loss": 2.1784, "step": 422280 }, { "epoch": 0.74, "learning_rate": 1.3178848830031007e-05, "loss": 2.3484, "step": 422290 }, { "epoch": 0.74, "learning_rate": 1.3177976890104179e-05, "loss": 2.2851, "step": 422300 }, { "epoch": 0.74, "learning_rate": 1.3177104950177353e-05, "loss": 2.3913, "step": 422310 }, { "epoch": 0.74, "learning_rate": 1.3176233010250526e-05, "loss": 2.3338, "step": 422320 }, { "epoch": 0.74, "learning_rate": 1.31753610703237e-05, "loss": 2.3193, "step": 422330 }, { "epoch": 0.74, "learning_rate": 1.3174489130396872e-05, "loss": 2.3092, "step": 422340 }, { "epoch": 0.74, "learning_rate": 1.3173617190470048e-05, "loss": 2.4006, "step": 422350 }, { "epoch": 0.74, "learning_rate": 1.317274525054322e-05, "loss": 2.3484, "step": 422360 }, { "epoch": 0.74, "learning_rate": 1.3171873310616392e-05, "loss": 2.4023, "step": 422370 }, { "epoch": 0.74, "learning_rate": 1.3171001370689564e-05, "loss": 2.2273, "step": 422380 }, { "epoch": 0.74, "learning_rate": 1.317012943076274e-05, "loss": 2.1958, "step": 422390 }, { "epoch": 0.74, "learning_rate": 1.3169257490835913e-05, "loss": 2.3093, "step": 422400 }, { "epoch": 0.74, "learning_rate": 1.3168385550909085e-05, "loss": 2.3737, "step": 422410 }, { "epoch": 0.74, "learning_rate": 1.3167513610982257e-05, "loss": 2.1521, "step": 422420 }, { "epoch": 0.74, "learning_rate": 1.3166641671055433e-05, "loss": 2.1514, "step": 422430 }, { "epoch": 0.74, "learning_rate": 1.3165769731128605e-05, "loss": 2.3051, "step": 422440 }, { "epoch": 0.74, "learning_rate": 1.3164897791201777e-05, "loss": 2.4599, "step": 422450 }, { "epoch": 0.74, "learning_rate": 1.316402585127495e-05, "loss": 2.3126, "step": 422460 }, { "epoch": 0.74, "learning_rate": 1.3163153911348124e-05, "loss": 2.3017, "step": 422470 }, { "epoch": 0.74, "learning_rate": 1.3162281971421298e-05, "loss": 2.2048, "step": 422480 }, { "epoch": 0.74, "learning_rate": 1.316141003149447e-05, "loss": 2.4562, "step": 422490 }, { "epoch": 0.74, "learning_rate": 1.3160538091567646e-05, "loss": 2.2126, "step": 422500 }, { "epoch": 0.74, "learning_rate": 1.3159666151640818e-05, "loss": 2.1914, "step": 422510 }, { "epoch": 0.74, "learning_rate": 1.315879421171399e-05, "loss": 2.2986, "step": 422520 }, { "epoch": 0.74, "learning_rate": 1.3157922271787162e-05, "loss": 2.3506, "step": 422530 }, { "epoch": 0.74, "learning_rate": 1.3157050331860337e-05, "loss": 2.4304, "step": 422540 }, { "epoch": 0.74, "learning_rate": 1.315617839193351e-05, "loss": 2.2895, "step": 422550 }, { "epoch": 0.74, "learning_rate": 1.3155306452006683e-05, "loss": 2.3035, "step": 422560 }, { "epoch": 0.74, "learning_rate": 1.3154434512079855e-05, "loss": 2.2396, "step": 422570 }, { "epoch": 0.74, "learning_rate": 1.315356257215303e-05, "loss": 2.3022, "step": 422580 }, { "epoch": 0.74, "learning_rate": 1.3152690632226203e-05, "loss": 2.1777, "step": 422590 }, { "epoch": 0.74, "learning_rate": 1.3151818692299375e-05, "loss": 2.1674, "step": 422600 }, { "epoch": 0.74, "learning_rate": 1.315094675237255e-05, "loss": 2.2545, "step": 422610 }, { "epoch": 0.74, "learning_rate": 1.3150074812445723e-05, "loss": 2.2442, "step": 422620 }, { "epoch": 0.74, "learning_rate": 1.3149202872518895e-05, "loss": 2.3141, "step": 422630 }, { "epoch": 0.74, "learning_rate": 1.3148330932592068e-05, "loss": 2.3717, "step": 422640 }, { "epoch": 0.74, "learning_rate": 1.3147458992665244e-05, "loss": 2.2798, "step": 422650 }, { "epoch": 0.74, "learning_rate": 1.3146587052738416e-05, "loss": 2.2973, "step": 422660 }, { "epoch": 0.74, "learning_rate": 1.3145715112811588e-05, "loss": 2.3426, "step": 422670 }, { "epoch": 0.74, "learning_rate": 1.314484317288476e-05, "loss": 2.3374, "step": 422680 }, { "epoch": 0.74, "learning_rate": 1.3143971232957936e-05, "loss": 2.2601, "step": 422690 }, { "epoch": 0.74, "learning_rate": 1.3143099293031108e-05, "loss": 2.3095, "step": 422700 }, { "epoch": 0.74, "learning_rate": 1.3142227353104281e-05, "loss": 2.2143, "step": 422710 }, { "epoch": 0.74, "learning_rate": 1.3141355413177453e-05, "loss": 2.2194, "step": 422720 }, { "epoch": 0.74, "learning_rate": 1.3140483473250629e-05, "loss": 2.3312, "step": 422730 }, { "epoch": 0.74, "learning_rate": 1.3139611533323801e-05, "loss": 2.242, "step": 422740 }, { "epoch": 0.74, "learning_rate": 1.3138739593396973e-05, "loss": 2.3138, "step": 422750 }, { "epoch": 0.74, "learning_rate": 1.3137867653470149e-05, "loss": 2.3001, "step": 422760 }, { "epoch": 0.74, "learning_rate": 1.313699571354332e-05, "loss": 2.3024, "step": 422770 }, { "epoch": 0.74, "learning_rate": 1.3136123773616493e-05, "loss": 2.2874, "step": 422780 }, { "epoch": 0.74, "learning_rate": 1.3135251833689666e-05, "loss": 2.3442, "step": 422790 }, { "epoch": 0.74, "learning_rate": 1.313437989376284e-05, "loss": 2.2803, "step": 422800 }, { "epoch": 0.74, "learning_rate": 1.3133507953836014e-05, "loss": 2.2651, "step": 422810 }, { "epoch": 0.74, "learning_rate": 1.3132636013909186e-05, "loss": 2.4126, "step": 422820 }, { "epoch": 0.74, "learning_rate": 1.3131764073982358e-05, "loss": 2.415, "step": 422830 }, { "epoch": 0.74, "learning_rate": 1.3130892134055534e-05, "loss": 2.1327, "step": 422840 }, { "epoch": 0.74, "learning_rate": 1.3130020194128706e-05, "loss": 2.3068, "step": 422850 }, { "epoch": 0.74, "learning_rate": 1.3129148254201878e-05, "loss": 2.246, "step": 422860 }, { "epoch": 0.74, "learning_rate": 1.3128276314275053e-05, "loss": 2.3617, "step": 422870 }, { "epoch": 0.74, "learning_rate": 1.3127404374348227e-05, "loss": 2.3211, "step": 422880 }, { "epoch": 0.74, "learning_rate": 1.3126532434421399e-05, "loss": 2.4197, "step": 422890 }, { "epoch": 0.74, "learning_rate": 1.3125660494494571e-05, "loss": 2.1742, "step": 422900 }, { "epoch": 0.74, "learning_rate": 1.3124788554567747e-05, "loss": 2.3276, "step": 422910 }, { "epoch": 0.74, "learning_rate": 1.3123916614640919e-05, "loss": 2.2675, "step": 422920 }, { "epoch": 0.74, "learning_rate": 1.312304467471409e-05, "loss": 2.2098, "step": 422930 }, { "epoch": 0.74, "learning_rate": 1.3122172734787263e-05, "loss": 2.3089, "step": 422940 }, { "epoch": 0.74, "learning_rate": 1.3121300794860438e-05, "loss": 2.4355, "step": 422950 }, { "epoch": 0.74, "learning_rate": 1.3120428854933612e-05, "loss": 2.396, "step": 422960 }, { "epoch": 0.74, "learning_rate": 1.3119556915006784e-05, "loss": 2.3966, "step": 422970 }, { "epoch": 0.74, "learning_rate": 1.3118684975079956e-05, "loss": 2.2654, "step": 422980 }, { "epoch": 0.74, "learning_rate": 1.3117813035153132e-05, "loss": 2.3095, "step": 422990 }, { "epoch": 0.74, "learning_rate": 1.3116941095226304e-05, "loss": 2.2646, "step": 423000 }, { "epoch": 0.74, "learning_rate": 1.3116069155299476e-05, "loss": 2.2137, "step": 423010 }, { "epoch": 0.74, "learning_rate": 1.3115197215372651e-05, "loss": 2.4599, "step": 423020 }, { "epoch": 0.74, "learning_rate": 1.3114325275445823e-05, "loss": 2.2618, "step": 423030 }, { "epoch": 0.74, "learning_rate": 1.3113453335518997e-05, "loss": 2.3388, "step": 423040 }, { "epoch": 0.74, "learning_rate": 1.311258139559217e-05, "loss": 2.339, "step": 423050 }, { "epoch": 0.74, "learning_rate": 1.3111709455665345e-05, "loss": 2.2821, "step": 423060 }, { "epoch": 0.74, "learning_rate": 1.3110837515738517e-05, "loss": 2.3103, "step": 423070 }, { "epoch": 0.74, "learning_rate": 1.3109965575811689e-05, "loss": 2.2327, "step": 423080 }, { "epoch": 0.74, "learning_rate": 1.3109093635884861e-05, "loss": 2.3603, "step": 423090 }, { "epoch": 0.74, "learning_rate": 1.3108221695958036e-05, "loss": 2.2072, "step": 423100 }, { "epoch": 0.74, "learning_rate": 1.3107349756031208e-05, "loss": 2.4111, "step": 423110 }, { "epoch": 0.74, "learning_rate": 1.3106477816104382e-05, "loss": 2.2768, "step": 423120 }, { "epoch": 0.74, "learning_rate": 1.3105605876177558e-05, "loss": 2.1458, "step": 423130 }, { "epoch": 0.74, "learning_rate": 1.310473393625073e-05, "loss": 2.3063, "step": 423140 }, { "epoch": 0.74, "learning_rate": 1.3103861996323902e-05, "loss": 2.321, "step": 423150 }, { "epoch": 0.74, "learning_rate": 1.3102990056397074e-05, "loss": 2.2542, "step": 423160 }, { "epoch": 0.74, "learning_rate": 1.310211811647025e-05, "loss": 2.2871, "step": 423170 }, { "epoch": 0.74, "learning_rate": 1.3101246176543421e-05, "loss": 2.2685, "step": 423180 }, { "epoch": 0.74, "learning_rate": 1.3100374236616595e-05, "loss": 2.3032, "step": 423190 }, { "epoch": 0.74, "learning_rate": 1.3099502296689767e-05, "loss": 2.4071, "step": 423200 }, { "epoch": 0.74, "learning_rate": 1.3098630356762943e-05, "loss": 2.283, "step": 423210 }, { "epoch": 0.74, "learning_rate": 1.3097758416836115e-05, "loss": 2.273, "step": 423220 }, { "epoch": 0.74, "learning_rate": 1.3096886476909287e-05, "loss": 2.2937, "step": 423230 }, { "epoch": 0.74, "learning_rate": 1.3096014536982459e-05, "loss": 2.28, "step": 423240 }, { "epoch": 0.74, "learning_rate": 1.3095142597055634e-05, "loss": 2.2466, "step": 423250 }, { "epoch": 0.74, "learning_rate": 1.3094270657128807e-05, "loss": 2.1375, "step": 423260 }, { "epoch": 0.74, "learning_rate": 1.309339871720198e-05, "loss": 2.1914, "step": 423270 }, { "epoch": 0.74, "learning_rate": 1.3092526777275154e-05, "loss": 2.3435, "step": 423280 }, { "epoch": 0.74, "learning_rate": 1.3091654837348328e-05, "loss": 2.299, "step": 423290 }, { "epoch": 0.74, "learning_rate": 1.30907828974215e-05, "loss": 2.2157, "step": 423300 }, { "epoch": 0.74, "learning_rate": 1.3089910957494672e-05, "loss": 2.2674, "step": 423310 }, { "epoch": 0.74, "learning_rate": 1.3089039017567847e-05, "loss": 2.3856, "step": 423320 }, { "epoch": 0.74, "learning_rate": 1.308816707764102e-05, "loss": 2.3597, "step": 423330 }, { "epoch": 0.74, "learning_rate": 1.3087295137714192e-05, "loss": 2.3412, "step": 423340 }, { "epoch": 0.74, "learning_rate": 1.3086423197787365e-05, "loss": 2.2645, "step": 423350 }, { "epoch": 0.74, "learning_rate": 1.3085551257860539e-05, "loss": 2.2724, "step": 423360 }, { "epoch": 0.74, "learning_rate": 1.3084679317933713e-05, "loss": 2.2903, "step": 423370 }, { "epoch": 0.74, "learning_rate": 1.3083807378006885e-05, "loss": 2.2896, "step": 423380 }, { "epoch": 0.74, "learning_rate": 1.3082935438080057e-05, "loss": 2.444, "step": 423390 }, { "epoch": 0.74, "learning_rate": 1.3082063498153233e-05, "loss": 2.2987, "step": 423400 }, { "epoch": 0.74, "learning_rate": 1.3081191558226405e-05, "loss": 2.3328, "step": 423410 }, { "epoch": 0.74, "learning_rate": 1.3080319618299577e-05, "loss": 2.218, "step": 423420 }, { "epoch": 0.74, "learning_rate": 1.3079447678372752e-05, "loss": 2.2922, "step": 423430 }, { "epoch": 0.74, "learning_rate": 1.3078575738445926e-05, "loss": 2.2677, "step": 423440 }, { "epoch": 0.74, "learning_rate": 1.3077703798519098e-05, "loss": 2.2752, "step": 423450 }, { "epoch": 0.74, "learning_rate": 1.307683185859227e-05, "loss": 2.2689, "step": 423460 }, { "epoch": 0.74, "learning_rate": 1.3075959918665446e-05, "loss": 2.4626, "step": 423470 }, { "epoch": 0.74, "learning_rate": 1.3075087978738618e-05, "loss": 2.4144, "step": 423480 }, { "epoch": 0.74, "learning_rate": 1.307421603881179e-05, "loss": 2.2629, "step": 423490 }, { "epoch": 0.74, "learning_rate": 1.3073344098884963e-05, "loss": 2.3403, "step": 423500 }, { "epoch": 0.74, "learning_rate": 1.3072472158958137e-05, "loss": 2.3025, "step": 423510 }, { "epoch": 0.74, "learning_rate": 1.3071600219031311e-05, "loss": 2.3532, "step": 423520 }, { "epoch": 0.74, "learning_rate": 1.3070728279104483e-05, "loss": 2.3511, "step": 423530 }, { "epoch": 0.74, "learning_rate": 1.3069856339177659e-05, "loss": 2.3071, "step": 423540 }, { "epoch": 0.74, "learning_rate": 1.306898439925083e-05, "loss": 2.3016, "step": 423550 }, { "epoch": 0.74, "learning_rate": 1.3068112459324003e-05, "loss": 2.34, "step": 423560 }, { "epoch": 0.74, "learning_rate": 1.3067240519397175e-05, "loss": 2.3066, "step": 423570 }, { "epoch": 0.74, "learning_rate": 1.306636857947035e-05, "loss": 2.2354, "step": 423580 }, { "epoch": 0.74, "learning_rate": 1.3065496639543522e-05, "loss": 2.3129, "step": 423590 }, { "epoch": 0.74, "learning_rate": 1.3064624699616696e-05, "loss": 2.2307, "step": 423600 }, { "epoch": 0.74, "learning_rate": 1.3063752759689868e-05, "loss": 2.2669, "step": 423610 }, { "epoch": 0.74, "learning_rate": 1.3062880819763044e-05, "loss": 2.2807, "step": 423620 }, { "epoch": 0.74, "learning_rate": 1.3062008879836216e-05, "loss": 2.378, "step": 423630 }, { "epoch": 0.74, "learning_rate": 1.3061136939909388e-05, "loss": 2.406, "step": 423640 }, { "epoch": 0.74, "learning_rate": 1.306026499998256e-05, "loss": 2.2688, "step": 423650 }, { "epoch": 0.74, "learning_rate": 1.3059393060055735e-05, "loss": 2.2208, "step": 423660 }, { "epoch": 0.74, "learning_rate": 1.3058521120128907e-05, "loss": 2.2605, "step": 423670 }, { "epoch": 0.74, "learning_rate": 1.3057649180202081e-05, "loss": 2.2844, "step": 423680 }, { "epoch": 0.74, "learning_rate": 1.3056777240275257e-05, "loss": 2.2764, "step": 423690 }, { "epoch": 0.74, "learning_rate": 1.3055905300348429e-05, "loss": 2.3216, "step": 423700 }, { "epoch": 0.74, "learning_rate": 1.30550333604216e-05, "loss": 2.2684, "step": 423710 }, { "epoch": 0.74, "learning_rate": 1.3054161420494773e-05, "loss": 2.258, "step": 423720 }, { "epoch": 0.74, "learning_rate": 1.3053289480567948e-05, "loss": 2.2599, "step": 423730 }, { "epoch": 0.74, "learning_rate": 1.305241754064112e-05, "loss": 2.3126, "step": 423740 }, { "epoch": 0.74, "learning_rate": 1.3051545600714294e-05, "loss": 2.313, "step": 423750 }, { "epoch": 0.74, "learning_rate": 1.3050673660787466e-05, "loss": 2.292, "step": 423760 }, { "epoch": 0.74, "learning_rate": 1.3049801720860642e-05, "loss": 2.233, "step": 423770 }, { "epoch": 0.74, "learning_rate": 1.3048929780933814e-05, "loss": 2.3019, "step": 423780 }, { "epoch": 0.74, "learning_rate": 1.3048057841006986e-05, "loss": 2.3358, "step": 423790 }, { "epoch": 0.74, "learning_rate": 1.3047185901080161e-05, "loss": 2.3216, "step": 423800 }, { "epoch": 0.74, "learning_rate": 1.3046313961153333e-05, "loss": 2.413, "step": 423810 }, { "epoch": 0.74, "learning_rate": 1.3045442021226505e-05, "loss": 2.3645, "step": 423820 }, { "epoch": 0.74, "learning_rate": 1.304457008129968e-05, "loss": 2.2903, "step": 423830 }, { "epoch": 0.74, "learning_rate": 1.3043698141372853e-05, "loss": 2.4125, "step": 423840 }, { "epoch": 0.74, "learning_rate": 1.3042826201446027e-05, "loss": 2.3314, "step": 423850 }, { "epoch": 0.74, "learning_rate": 1.3041954261519199e-05, "loss": 2.3749, "step": 423860 }, { "epoch": 0.74, "learning_rate": 1.3041082321592371e-05, "loss": 2.1941, "step": 423870 }, { "epoch": 0.74, "learning_rate": 1.3040210381665546e-05, "loss": 2.287, "step": 423880 }, { "epoch": 0.74, "learning_rate": 1.3039338441738718e-05, "loss": 2.3887, "step": 423890 }, { "epoch": 0.74, "learning_rate": 1.303846650181189e-05, "loss": 2.311, "step": 423900 }, { "epoch": 0.74, "learning_rate": 1.3037594561885064e-05, "loss": 2.3866, "step": 423910 }, { "epoch": 0.74, "learning_rate": 1.303672262195824e-05, "loss": 2.4264, "step": 423920 }, { "epoch": 0.74, "learning_rate": 1.3035850682031412e-05, "loss": 2.3246, "step": 423930 }, { "epoch": 0.74, "learning_rate": 1.3034978742104584e-05, "loss": 2.3345, "step": 423940 }, { "epoch": 0.74, "learning_rate": 1.303410680217776e-05, "loss": 2.3408, "step": 423950 }, { "epoch": 0.74, "learning_rate": 1.3033234862250931e-05, "loss": 2.3533, "step": 423960 }, { "epoch": 0.74, "learning_rate": 1.3032362922324104e-05, "loss": 2.398, "step": 423970 }, { "epoch": 0.74, "learning_rate": 1.3031490982397276e-05, "loss": 2.2287, "step": 423980 }, { "epoch": 0.74, "learning_rate": 1.3030619042470451e-05, "loss": 2.3555, "step": 423990 }, { "epoch": 0.74, "learning_rate": 1.3029747102543625e-05, "loss": 2.2868, "step": 424000 }, { "epoch": 0.74, "learning_rate": 1.3028875162616797e-05, "loss": 2.3162, "step": 424010 }, { "epoch": 0.74, "learning_rate": 1.3028003222689969e-05, "loss": 2.2895, "step": 424020 }, { "epoch": 0.74, "learning_rate": 1.3027131282763144e-05, "loss": 2.2424, "step": 424030 }, { "epoch": 0.74, "learning_rate": 1.3026259342836317e-05, "loss": 2.2555, "step": 424040 }, { "epoch": 0.74, "learning_rate": 1.3025387402909489e-05, "loss": 2.2236, "step": 424050 }, { "epoch": 0.74, "learning_rate": 1.3024515462982664e-05, "loss": 2.3055, "step": 424060 }, { "epoch": 0.74, "learning_rate": 1.3023643523055836e-05, "loss": 2.242, "step": 424070 }, { "epoch": 0.74, "learning_rate": 1.302277158312901e-05, "loss": 2.2157, "step": 424080 }, { "epoch": 0.74, "learning_rate": 1.3021899643202182e-05, "loss": 2.3133, "step": 424090 }, { "epoch": 0.74, "learning_rate": 1.3021027703275357e-05, "loss": 2.2935, "step": 424100 }, { "epoch": 0.74, "learning_rate": 1.302015576334853e-05, "loss": 2.3229, "step": 424110 }, { "epoch": 0.74, "learning_rate": 1.3019283823421702e-05, "loss": 2.2146, "step": 424120 }, { "epoch": 0.74, "learning_rate": 1.3018411883494874e-05, "loss": 2.2858, "step": 424130 }, { "epoch": 0.74, "learning_rate": 1.3017539943568049e-05, "loss": 2.2677, "step": 424140 }, { "epoch": 0.74, "learning_rate": 1.3016668003641221e-05, "loss": 2.2931, "step": 424150 }, { "epoch": 0.74, "learning_rate": 1.3015796063714395e-05, "loss": 2.2373, "step": 424160 }, { "epoch": 0.74, "learning_rate": 1.3014924123787567e-05, "loss": 2.2684, "step": 424170 }, { "epoch": 0.74, "learning_rate": 1.3014052183860743e-05, "loss": 2.2891, "step": 424180 }, { "epoch": 0.74, "learning_rate": 1.3013180243933915e-05, "loss": 2.2579, "step": 424190 }, { "epoch": 0.74, "learning_rate": 1.3012308304007087e-05, "loss": 2.2638, "step": 424200 }, { "epoch": 0.74, "learning_rate": 1.3011436364080262e-05, "loss": 2.4067, "step": 424210 }, { "epoch": 0.74, "learning_rate": 1.3010564424153434e-05, "loss": 2.3492, "step": 424220 }, { "epoch": 0.74, "learning_rate": 1.3009692484226608e-05, "loss": 2.2458, "step": 424230 }, { "epoch": 0.74, "learning_rate": 1.300882054429978e-05, "loss": 2.345, "step": 424240 }, { "epoch": 0.74, "learning_rate": 1.3007948604372956e-05, "loss": 2.308, "step": 424250 }, { "epoch": 0.74, "learning_rate": 1.3007076664446128e-05, "loss": 2.2263, "step": 424260 }, { "epoch": 0.74, "learning_rate": 1.30062047245193e-05, "loss": 2.2953, "step": 424270 }, { "epoch": 0.74, "learning_rate": 1.3005332784592472e-05, "loss": 2.3069, "step": 424280 }, { "epoch": 0.74, "learning_rate": 1.3004460844665647e-05, "loss": 2.2515, "step": 424290 }, { "epoch": 0.74, "learning_rate": 1.300358890473882e-05, "loss": 2.346, "step": 424300 }, { "epoch": 0.74, "learning_rate": 1.3002716964811993e-05, "loss": 2.3555, "step": 424310 }, { "epoch": 0.74, "learning_rate": 1.3001845024885165e-05, "loss": 2.1906, "step": 424320 }, { "epoch": 0.74, "learning_rate": 1.300097308495834e-05, "loss": 2.2148, "step": 424330 }, { "epoch": 0.74, "learning_rate": 1.3000101145031513e-05, "loss": 2.255, "step": 424340 }, { "epoch": 0.74, "learning_rate": 1.2999229205104685e-05, "loss": 2.2056, "step": 424350 }, { "epoch": 0.74, "learning_rate": 1.299835726517786e-05, "loss": 2.3169, "step": 424360 }, { "epoch": 0.74, "learning_rate": 1.2997485325251032e-05, "loss": 2.3075, "step": 424370 }, { "epoch": 0.74, "learning_rate": 1.2996613385324204e-05, "loss": 2.3292, "step": 424380 }, { "epoch": 0.74, "learning_rate": 1.2995741445397378e-05, "loss": 2.4528, "step": 424390 }, { "epoch": 0.74, "learning_rate": 1.2994869505470552e-05, "loss": 2.279, "step": 424400 }, { "epoch": 0.74, "learning_rate": 1.2993997565543726e-05, "loss": 2.3482, "step": 424410 }, { "epoch": 0.74, "learning_rate": 1.2993125625616898e-05, "loss": 2.1972, "step": 424420 }, { "epoch": 0.74, "learning_rate": 1.299225368569007e-05, "loss": 2.3324, "step": 424430 }, { "epoch": 0.74, "learning_rate": 1.2991381745763245e-05, "loss": 2.1826, "step": 424440 }, { "epoch": 0.74, "learning_rate": 1.2990509805836417e-05, "loss": 2.3573, "step": 424450 }, { "epoch": 0.74, "learning_rate": 1.298963786590959e-05, "loss": 2.3239, "step": 424460 }, { "epoch": 0.74, "learning_rate": 1.2988765925982765e-05, "loss": 2.2044, "step": 424470 }, { "epoch": 0.74, "learning_rate": 1.2987893986055939e-05, "loss": 2.3965, "step": 424480 }, { "epoch": 0.74, "learning_rate": 1.298702204612911e-05, "loss": 2.3034, "step": 424490 }, { "epoch": 0.74, "learning_rate": 1.2986150106202283e-05, "loss": 2.3175, "step": 424500 }, { "epoch": 0.74, "learning_rate": 1.2985278166275458e-05, "loss": 2.2037, "step": 424510 }, { "epoch": 0.74, "learning_rate": 1.298440622634863e-05, "loss": 2.4287, "step": 424520 }, { "epoch": 0.74, "learning_rate": 1.2983534286421802e-05, "loss": 2.2594, "step": 424530 }, { "epoch": 0.74, "learning_rate": 1.2982662346494976e-05, "loss": 2.193, "step": 424540 }, { "epoch": 0.74, "learning_rate": 1.298179040656815e-05, "loss": 2.3404, "step": 424550 }, { "epoch": 0.74, "learning_rate": 1.2980918466641324e-05, "loss": 2.3511, "step": 424560 }, { "epoch": 0.74, "learning_rate": 1.2980046526714496e-05, "loss": 2.2279, "step": 424570 }, { "epoch": 0.74, "learning_rate": 1.2979174586787668e-05, "loss": 2.3629, "step": 424580 }, { "epoch": 0.74, "learning_rate": 1.2978302646860843e-05, "loss": 2.3818, "step": 424590 }, { "epoch": 0.74, "learning_rate": 1.2977430706934015e-05, "loss": 2.4654, "step": 424600 }, { "epoch": 0.74, "learning_rate": 1.2976558767007188e-05, "loss": 2.2323, "step": 424610 }, { "epoch": 0.74, "learning_rate": 1.2975686827080363e-05, "loss": 2.3387, "step": 424620 }, { "epoch": 0.74, "learning_rate": 1.2974814887153535e-05, "loss": 2.2153, "step": 424630 }, { "epoch": 0.74, "learning_rate": 1.2973942947226709e-05, "loss": 2.3062, "step": 424640 }, { "epoch": 0.74, "learning_rate": 1.2973071007299881e-05, "loss": 2.2875, "step": 424650 }, { "epoch": 0.74, "learning_rate": 1.2972199067373056e-05, "loss": 2.3532, "step": 424660 }, { "epoch": 0.74, "learning_rate": 1.2971327127446228e-05, "loss": 2.277, "step": 424670 }, { "epoch": 0.74, "learning_rate": 1.29704551875194e-05, "loss": 2.2467, "step": 424680 }, { "epoch": 0.74, "learning_rate": 1.2969583247592573e-05, "loss": 2.258, "step": 424690 }, { "epoch": 0.74, "learning_rate": 1.2968711307665748e-05, "loss": 2.3057, "step": 424700 }, { "epoch": 0.74, "learning_rate": 1.296783936773892e-05, "loss": 2.3182, "step": 424710 }, { "epoch": 0.74, "learning_rate": 1.2966967427812094e-05, "loss": 2.2796, "step": 424720 }, { "epoch": 0.74, "learning_rate": 1.296609548788527e-05, "loss": 2.2052, "step": 424730 }, { "epoch": 0.74, "learning_rate": 1.2965223547958441e-05, "loss": 2.2478, "step": 424740 }, { "epoch": 0.74, "learning_rate": 1.2964351608031614e-05, "loss": 2.3472, "step": 424750 }, { "epoch": 0.74, "learning_rate": 1.2963479668104786e-05, "loss": 2.351, "step": 424760 }, { "epoch": 0.74, "learning_rate": 1.2962607728177961e-05, "loss": 2.2938, "step": 424770 }, { "epoch": 0.74, "learning_rate": 1.2961735788251133e-05, "loss": 2.3623, "step": 424780 }, { "epoch": 0.74, "learning_rate": 1.2960863848324307e-05, "loss": 2.3099, "step": 424790 }, { "epoch": 0.74, "learning_rate": 1.2959991908397479e-05, "loss": 2.3868, "step": 424800 }, { "epoch": 0.74, "learning_rate": 1.2959119968470654e-05, "loss": 2.2602, "step": 424810 }, { "epoch": 0.74, "learning_rate": 1.2958248028543827e-05, "loss": 2.3175, "step": 424820 }, { "epoch": 0.74, "learning_rate": 1.2957376088616999e-05, "loss": 2.2707, "step": 424830 }, { "epoch": 0.74, "learning_rate": 1.295650414869017e-05, "loss": 2.4049, "step": 424840 }, { "epoch": 0.74, "learning_rate": 1.2955632208763346e-05, "loss": 2.2962, "step": 424850 }, { "epoch": 0.74, "learning_rate": 1.2954760268836518e-05, "loss": 2.3117, "step": 424860 }, { "epoch": 0.74, "learning_rate": 1.2953888328909692e-05, "loss": 2.2402, "step": 424870 }, { "epoch": 0.74, "learning_rate": 1.2953016388982866e-05, "loss": 2.2246, "step": 424880 }, { "epoch": 0.74, "learning_rate": 1.295214444905604e-05, "loss": 2.232, "step": 424890 }, { "epoch": 0.74, "learning_rate": 1.2951272509129212e-05, "loss": 2.298, "step": 424900 }, { "epoch": 0.74, "learning_rate": 1.2950400569202384e-05, "loss": 2.2286, "step": 424910 }, { "epoch": 0.74, "learning_rate": 1.2949528629275559e-05, "loss": 2.2773, "step": 424920 }, { "epoch": 0.74, "learning_rate": 1.2948656689348731e-05, "loss": 2.2504, "step": 424930 }, { "epoch": 0.74, "learning_rate": 1.2947784749421903e-05, "loss": 2.202, "step": 424940 }, { "epoch": 0.74, "learning_rate": 1.2946912809495077e-05, "loss": 2.2346, "step": 424950 }, { "epoch": 0.74, "learning_rate": 1.2946040869568253e-05, "loss": 2.315, "step": 424960 }, { "epoch": 0.74, "learning_rate": 1.2945168929641425e-05, "loss": 2.3666, "step": 424970 }, { "epoch": 0.74, "learning_rate": 1.2944296989714597e-05, "loss": 2.4372, "step": 424980 }, { "epoch": 0.74, "learning_rate": 1.2943425049787772e-05, "loss": 2.296, "step": 424990 }, { "epoch": 0.74, "learning_rate": 1.2942553109860944e-05, "loss": 2.3503, "step": 425000 }, { "epoch": 0.74, "learning_rate": 1.2941681169934116e-05, "loss": 2.3558, "step": 425010 }, { "epoch": 0.74, "learning_rate": 1.2940809230007288e-05, "loss": 2.3423, "step": 425020 }, { "epoch": 0.74, "learning_rate": 1.2939937290080464e-05, "loss": 2.3436, "step": 425030 }, { "epoch": 0.74, "learning_rate": 1.2939065350153638e-05, "loss": 2.3237, "step": 425040 }, { "epoch": 0.74, "learning_rate": 1.293819341022681e-05, "loss": 2.3037, "step": 425050 }, { "epoch": 0.74, "learning_rate": 1.2937321470299982e-05, "loss": 2.2948, "step": 425060 }, { "epoch": 0.74, "learning_rate": 1.2936449530373157e-05, "loss": 2.266, "step": 425070 }, { "epoch": 0.74, "learning_rate": 1.293557759044633e-05, "loss": 2.3544, "step": 425080 }, { "epoch": 0.74, "learning_rate": 1.2934705650519501e-05, "loss": 2.2751, "step": 425090 }, { "epoch": 0.74, "learning_rate": 1.2933833710592675e-05, "loss": 2.2929, "step": 425100 }, { "epoch": 0.74, "learning_rate": 1.2932961770665849e-05, "loss": 2.3326, "step": 425110 }, { "epoch": 0.74, "learning_rate": 1.2932089830739023e-05, "loss": 2.314, "step": 425120 }, { "epoch": 0.74, "learning_rate": 1.2931217890812195e-05, "loss": 2.3144, "step": 425130 }, { "epoch": 0.74, "learning_rate": 1.293034595088537e-05, "loss": 2.2934, "step": 425140 }, { "epoch": 0.74, "learning_rate": 1.2929474010958542e-05, "loss": 2.3552, "step": 425150 }, { "epoch": 0.74, "learning_rate": 1.2928602071031714e-05, "loss": 2.37, "step": 425160 }, { "epoch": 0.74, "learning_rate": 1.2927730131104886e-05, "loss": 2.3498, "step": 425170 }, { "epoch": 0.74, "learning_rate": 1.2926858191178062e-05, "loss": 2.3065, "step": 425180 }, { "epoch": 0.74, "learning_rate": 1.2925986251251234e-05, "loss": 2.3282, "step": 425190 }, { "epoch": 0.74, "learning_rate": 1.2925114311324408e-05, "loss": 2.2815, "step": 425200 }, { "epoch": 0.74, "learning_rate": 1.292424237139758e-05, "loss": 2.385, "step": 425210 }, { "epoch": 0.74, "learning_rate": 1.2923370431470755e-05, "loss": 2.3553, "step": 425220 }, { "epoch": 0.74, "learning_rate": 1.2922498491543927e-05, "loss": 2.2366, "step": 425230 }, { "epoch": 0.74, "learning_rate": 1.29216265516171e-05, "loss": 2.187, "step": 425240 }, { "epoch": 0.74, "learning_rate": 1.2920754611690272e-05, "loss": 2.1891, "step": 425250 }, { "epoch": 0.74, "learning_rate": 1.2919882671763447e-05, "loss": 2.2118, "step": 425260 }, { "epoch": 0.74, "learning_rate": 1.291901073183662e-05, "loss": 2.1524, "step": 425270 }, { "epoch": 0.74, "learning_rate": 1.2918138791909793e-05, "loss": 2.2495, "step": 425280 }, { "epoch": 0.74, "learning_rate": 1.2917266851982968e-05, "loss": 2.3346, "step": 425290 }, { "epoch": 0.74, "learning_rate": 1.291639491205614e-05, "loss": 2.2317, "step": 425300 }, { "epoch": 0.74, "learning_rate": 1.2915522972129312e-05, "loss": 2.3541, "step": 425310 }, { "epoch": 0.74, "learning_rate": 1.2914651032202485e-05, "loss": 2.1646, "step": 425320 }, { "epoch": 0.74, "learning_rate": 1.291377909227566e-05, "loss": 2.3818, "step": 425330 }, { "epoch": 0.74, "learning_rate": 1.2912907152348832e-05, "loss": 2.3045, "step": 425340 }, { "epoch": 0.74, "learning_rate": 1.2912035212422006e-05, "loss": 2.2115, "step": 425350 }, { "epoch": 0.74, "learning_rate": 1.2911163272495178e-05, "loss": 2.2539, "step": 425360 }, { "epoch": 0.74, "learning_rate": 1.2910291332568353e-05, "loss": 2.3765, "step": 425370 }, { "epoch": 0.74, "learning_rate": 1.2909419392641525e-05, "loss": 2.1783, "step": 425380 }, { "epoch": 0.74, "learning_rate": 1.2908547452714698e-05, "loss": 2.3033, "step": 425390 }, { "epoch": 0.74, "learning_rate": 1.2907675512787873e-05, "loss": 2.314, "step": 425400 }, { "epoch": 0.74, "learning_rate": 1.2906803572861045e-05, "loss": 2.3091, "step": 425410 }, { "epoch": 0.74, "learning_rate": 1.2905931632934217e-05, "loss": 2.2542, "step": 425420 }, { "epoch": 0.74, "learning_rate": 1.2905059693007391e-05, "loss": 2.2323, "step": 425430 }, { "epoch": 0.74, "learning_rate": 1.2904187753080565e-05, "loss": 2.265, "step": 425440 }, { "epoch": 0.74, "learning_rate": 1.2903315813153738e-05, "loss": 2.288, "step": 425450 }, { "epoch": 0.74, "learning_rate": 1.290244387322691e-05, "loss": 2.4525, "step": 425460 }, { "epoch": 0.74, "learning_rate": 1.2901571933300083e-05, "loss": 2.2632, "step": 425470 }, { "epoch": 0.74, "learning_rate": 1.2900699993373258e-05, "loss": 2.2992, "step": 425480 }, { "epoch": 0.74, "learning_rate": 1.289982805344643e-05, "loss": 2.3668, "step": 425490 }, { "epoch": 0.74, "learning_rate": 1.2898956113519602e-05, "loss": 2.3134, "step": 425500 }, { "epoch": 0.74, "learning_rate": 1.2898084173592776e-05, "loss": 2.3688, "step": 425510 }, { "epoch": 0.74, "learning_rate": 1.2897212233665951e-05, "loss": 2.3327, "step": 425520 }, { "epoch": 0.74, "learning_rate": 1.2896340293739124e-05, "loss": 2.3018, "step": 425530 }, { "epoch": 0.74, "learning_rate": 1.2895468353812296e-05, "loss": 2.3049, "step": 425540 }, { "epoch": 0.74, "learning_rate": 1.2894596413885471e-05, "loss": 2.3639, "step": 425550 }, { "epoch": 0.74, "learning_rate": 1.2893724473958643e-05, "loss": 2.3315, "step": 425560 }, { "epoch": 0.74, "learning_rate": 1.2892852534031815e-05, "loss": 2.1887, "step": 425570 }, { "epoch": 0.74, "learning_rate": 1.2891980594104989e-05, "loss": 2.2305, "step": 425580 }, { "epoch": 0.74, "learning_rate": 1.2891108654178163e-05, "loss": 2.3333, "step": 425590 }, { "epoch": 0.74, "learning_rate": 1.2890236714251337e-05, "loss": 2.2267, "step": 425600 }, { "epoch": 0.74, "learning_rate": 1.2889364774324509e-05, "loss": 2.2995, "step": 425610 }, { "epoch": 0.74, "learning_rate": 1.288849283439768e-05, "loss": 2.3094, "step": 425620 }, { "epoch": 0.74, "learning_rate": 1.2887620894470856e-05, "loss": 2.4354, "step": 425630 }, { "epoch": 0.74, "learning_rate": 1.2886748954544028e-05, "loss": 2.4238, "step": 425640 }, { "epoch": 0.74, "learning_rate": 1.28858770146172e-05, "loss": 2.3473, "step": 425650 }, { "epoch": 0.74, "learning_rate": 1.2885005074690376e-05, "loss": 2.1976, "step": 425660 }, { "epoch": 0.74, "learning_rate": 1.2884133134763548e-05, "loss": 2.4744, "step": 425670 }, { "epoch": 0.74, "learning_rate": 1.2883261194836722e-05, "loss": 2.2807, "step": 425680 }, { "epoch": 0.74, "learning_rate": 1.2882389254909894e-05, "loss": 2.2764, "step": 425690 }, { "epoch": 0.74, "learning_rate": 1.2881517314983069e-05, "loss": 2.3103, "step": 425700 }, { "epoch": 0.74, "learning_rate": 1.2880645375056241e-05, "loss": 2.2309, "step": 425710 }, { "epoch": 0.74, "learning_rate": 1.2879773435129413e-05, "loss": 2.2823, "step": 425720 }, { "epoch": 0.74, "learning_rate": 1.2878901495202585e-05, "loss": 2.2578, "step": 425730 }, { "epoch": 0.74, "learning_rate": 1.287802955527576e-05, "loss": 2.2483, "step": 425740 }, { "epoch": 0.74, "learning_rate": 1.2877157615348933e-05, "loss": 2.3581, "step": 425750 }, { "epoch": 0.74, "learning_rate": 1.2876285675422107e-05, "loss": 2.3155, "step": 425760 }, { "epoch": 0.74, "learning_rate": 1.2875413735495279e-05, "loss": 2.3715, "step": 425770 }, { "epoch": 0.74, "learning_rate": 1.2874541795568454e-05, "loss": 2.2605, "step": 425780 }, { "epoch": 0.74, "learning_rate": 1.2873669855641626e-05, "loss": 2.2693, "step": 425790 }, { "epoch": 0.74, "learning_rate": 1.2872797915714798e-05, "loss": 2.2966, "step": 425800 }, { "epoch": 0.74, "learning_rate": 1.2871925975787974e-05, "loss": 2.393, "step": 425810 }, { "epoch": 0.74, "learning_rate": 1.2871054035861146e-05, "loss": 2.2953, "step": 425820 }, { "epoch": 0.74, "learning_rate": 1.287018209593432e-05, "loss": 2.2692, "step": 425830 }, { "epoch": 0.74, "learning_rate": 1.2869310156007492e-05, "loss": 2.3418, "step": 425840 }, { "epoch": 0.74, "learning_rate": 1.2868438216080667e-05, "loss": 2.4206, "step": 425850 }, { "epoch": 0.74, "learning_rate": 1.286756627615384e-05, "loss": 2.2242, "step": 425860 }, { "epoch": 0.74, "learning_rate": 1.2866694336227011e-05, "loss": 2.4132, "step": 425870 }, { "epoch": 0.74, "learning_rate": 1.2865822396300183e-05, "loss": 2.275, "step": 425880 }, { "epoch": 0.74, "learning_rate": 1.2864950456373359e-05, "loss": 2.2273, "step": 425890 }, { "epoch": 0.74, "learning_rate": 1.2864078516446531e-05, "loss": 2.2501, "step": 425900 }, { "epoch": 0.74, "learning_rate": 1.2863206576519705e-05, "loss": 2.3736, "step": 425910 }, { "epoch": 0.74, "learning_rate": 1.2862334636592879e-05, "loss": 2.2369, "step": 425920 }, { "epoch": 0.74, "learning_rate": 1.2861462696666052e-05, "loss": 2.3492, "step": 425930 }, { "epoch": 0.74, "learning_rate": 1.2860590756739224e-05, "loss": 2.2936, "step": 425940 }, { "epoch": 0.74, "learning_rate": 1.2859718816812396e-05, "loss": 2.3347, "step": 425950 }, { "epoch": 0.74, "learning_rate": 1.2858846876885572e-05, "loss": 2.3164, "step": 425960 }, { "epoch": 0.74, "learning_rate": 1.2857974936958744e-05, "loss": 2.2924, "step": 425970 }, { "epoch": 0.74, "learning_rate": 1.2857102997031916e-05, "loss": 2.2932, "step": 425980 }, { "epoch": 0.74, "learning_rate": 1.285623105710509e-05, "loss": 2.2052, "step": 425990 }, { "epoch": 0.74, "learning_rate": 1.2855359117178265e-05, "loss": 2.2564, "step": 426000 }, { "epoch": 0.74, "learning_rate": 1.2854487177251437e-05, "loss": 2.2621, "step": 426010 }, { "epoch": 0.74, "learning_rate": 1.285361523732461e-05, "loss": 2.3652, "step": 426020 }, { "epoch": 0.74, "learning_rate": 1.2852743297397782e-05, "loss": 2.2714, "step": 426030 }, { "epoch": 0.74, "learning_rate": 1.2851871357470957e-05, "loss": 2.2578, "step": 426040 }, { "epoch": 0.74, "learning_rate": 1.2850999417544129e-05, "loss": 2.2461, "step": 426050 }, { "epoch": 0.74, "learning_rate": 1.2850127477617301e-05, "loss": 2.1916, "step": 426060 }, { "epoch": 0.74, "learning_rate": 1.2849255537690477e-05, "loss": 2.2427, "step": 426070 }, { "epoch": 0.74, "learning_rate": 1.284838359776365e-05, "loss": 2.1682, "step": 426080 }, { "epoch": 0.74, "learning_rate": 1.2847511657836822e-05, "loss": 2.3149, "step": 426090 }, { "epoch": 0.74, "learning_rate": 1.2846639717909995e-05, "loss": 2.3221, "step": 426100 }, { "epoch": 0.74, "learning_rate": 1.284576777798317e-05, "loss": 2.2231, "step": 426110 }, { "epoch": 0.74, "learning_rate": 1.2844895838056342e-05, "loss": 2.3239, "step": 426120 }, { "epoch": 0.74, "learning_rate": 1.2844023898129514e-05, "loss": 2.2734, "step": 426130 }, { "epoch": 0.74, "learning_rate": 1.2843151958202688e-05, "loss": 2.3867, "step": 426140 }, { "epoch": 0.74, "learning_rate": 1.2842280018275862e-05, "loss": 2.3155, "step": 426150 }, { "epoch": 0.74, "learning_rate": 1.2841408078349035e-05, "loss": 2.3511, "step": 426160 }, { "epoch": 0.74, "learning_rate": 1.2840536138422208e-05, "loss": 2.2868, "step": 426170 }, { "epoch": 0.74, "learning_rate": 1.283966419849538e-05, "loss": 2.4232, "step": 426180 }, { "epoch": 0.74, "learning_rate": 1.2838792258568555e-05, "loss": 2.2564, "step": 426190 }, { "epoch": 0.74, "learning_rate": 1.2837920318641727e-05, "loss": 2.251, "step": 426200 }, { "epoch": 0.74, "learning_rate": 1.28370483787149e-05, "loss": 2.3695, "step": 426210 }, { "epoch": 0.74, "learning_rate": 1.2836176438788075e-05, "loss": 2.1671, "step": 426220 }, { "epoch": 0.74, "learning_rate": 1.2835304498861247e-05, "loss": 2.2722, "step": 426230 }, { "epoch": 0.74, "learning_rate": 1.283443255893442e-05, "loss": 2.381, "step": 426240 }, { "epoch": 0.74, "learning_rate": 1.2833560619007593e-05, "loss": 2.1946, "step": 426250 }, { "epoch": 0.74, "learning_rate": 1.2832688679080768e-05, "loss": 2.2892, "step": 426260 }, { "epoch": 0.74, "learning_rate": 1.283181673915394e-05, "loss": 2.2314, "step": 426270 }, { "epoch": 0.74, "learning_rate": 1.2830944799227112e-05, "loss": 2.2315, "step": 426280 }, { "epoch": 0.74, "learning_rate": 1.2830072859300284e-05, "loss": 2.2994, "step": 426290 }, { "epoch": 0.74, "learning_rate": 1.282920091937346e-05, "loss": 2.2716, "step": 426300 }, { "epoch": 0.74, "learning_rate": 1.2828328979446634e-05, "loss": 2.3445, "step": 426310 }, { "epoch": 0.74, "learning_rate": 1.2827457039519806e-05, "loss": 2.26, "step": 426320 }, { "epoch": 0.74, "learning_rate": 1.2826585099592981e-05, "loss": 2.2979, "step": 426330 }, { "epoch": 0.74, "learning_rate": 1.2825713159666153e-05, "loss": 2.3045, "step": 426340 }, { "epoch": 0.74, "learning_rate": 1.2824841219739325e-05, "loss": 2.3063, "step": 426350 }, { "epoch": 0.74, "learning_rate": 1.2823969279812497e-05, "loss": 2.2174, "step": 426360 }, { "epoch": 0.74, "learning_rate": 1.2823097339885673e-05, "loss": 2.3775, "step": 426370 }, { "epoch": 0.74, "learning_rate": 1.2822225399958845e-05, "loss": 2.3425, "step": 426380 }, { "epoch": 0.74, "learning_rate": 1.2821353460032019e-05, "loss": 2.2955, "step": 426390 }, { "epoch": 0.74, "learning_rate": 1.282048152010519e-05, "loss": 2.3067, "step": 426400 }, { "epoch": 0.74, "learning_rate": 1.2819609580178366e-05, "loss": 2.328, "step": 426410 }, { "epoch": 0.74, "learning_rate": 1.2818737640251538e-05, "loss": 2.4774, "step": 426420 }, { "epoch": 0.74, "learning_rate": 1.281786570032471e-05, "loss": 2.3169, "step": 426430 }, { "epoch": 0.74, "learning_rate": 1.2816993760397882e-05, "loss": 2.2383, "step": 426440 }, { "epoch": 0.74, "learning_rate": 1.2816121820471058e-05, "loss": 2.3168, "step": 426450 }, { "epoch": 0.74, "learning_rate": 1.281524988054423e-05, "loss": 2.3179, "step": 426460 }, { "epoch": 0.74, "learning_rate": 1.2814377940617404e-05, "loss": 2.4369, "step": 426470 }, { "epoch": 0.74, "learning_rate": 1.2813506000690577e-05, "loss": 2.3934, "step": 426480 }, { "epoch": 0.74, "learning_rate": 1.2812634060763751e-05, "loss": 2.2677, "step": 426490 }, { "epoch": 0.74, "learning_rate": 1.2811762120836923e-05, "loss": 2.2514, "step": 426500 }, { "epoch": 0.74, "learning_rate": 1.2810890180910095e-05, "loss": 2.3554, "step": 426510 }, { "epoch": 0.74, "learning_rate": 1.281001824098327e-05, "loss": 2.2198, "step": 426520 }, { "epoch": 0.74, "learning_rate": 1.2809146301056443e-05, "loss": 2.2334, "step": 426530 }, { "epoch": 0.74, "learning_rate": 1.2808274361129615e-05, "loss": 2.3271, "step": 426540 }, { "epoch": 0.74, "learning_rate": 1.2807402421202789e-05, "loss": 2.396, "step": 426550 }, { "epoch": 0.74, "learning_rate": 1.2806530481275964e-05, "loss": 2.1531, "step": 426560 }, { "epoch": 0.74, "learning_rate": 1.2805658541349136e-05, "loss": 2.3516, "step": 426570 }, { "epoch": 0.74, "learning_rate": 1.2804786601422308e-05, "loss": 2.3483, "step": 426580 }, { "epoch": 0.74, "learning_rate": 1.2803914661495484e-05, "loss": 2.4123, "step": 426590 }, { "epoch": 0.74, "learning_rate": 1.2803042721568656e-05, "loss": 2.2762, "step": 426600 }, { "epoch": 0.74, "learning_rate": 1.2802170781641828e-05, "loss": 2.3533, "step": 426610 }, { "epoch": 0.74, "learning_rate": 1.2801298841715002e-05, "loss": 2.3854, "step": 426620 }, { "epoch": 0.74, "learning_rate": 1.2800426901788176e-05, "loss": 2.245, "step": 426630 }, { "epoch": 0.74, "learning_rate": 1.279955496186135e-05, "loss": 2.2645, "step": 426640 }, { "epoch": 0.74, "learning_rate": 1.2798683021934521e-05, "loss": 2.3054, "step": 426650 }, { "epoch": 0.74, "learning_rate": 1.2797811082007693e-05, "loss": 2.3399, "step": 426660 }, { "epoch": 0.74, "learning_rate": 1.2796939142080869e-05, "loss": 2.2052, "step": 426670 }, { "epoch": 0.74, "learning_rate": 1.2796067202154041e-05, "loss": 2.2664, "step": 426680 }, { "epoch": 0.74, "learning_rate": 1.2795195262227213e-05, "loss": 2.2544, "step": 426690 }, { "epoch": 0.74, "learning_rate": 1.2794323322300387e-05, "loss": 2.2523, "step": 426700 }, { "epoch": 0.74, "learning_rate": 1.279345138237356e-05, "loss": 2.2167, "step": 426710 }, { "epoch": 0.74, "learning_rate": 1.2792579442446734e-05, "loss": 2.3599, "step": 426720 }, { "epoch": 0.74, "learning_rate": 1.2791707502519906e-05, "loss": 2.3374, "step": 426730 }, { "epoch": 0.74, "learning_rate": 1.2790835562593082e-05, "loss": 2.2787, "step": 426740 }, { "epoch": 0.74, "learning_rate": 1.2789963622666254e-05, "loss": 2.297, "step": 426750 }, { "epoch": 0.74, "learning_rate": 1.2789091682739426e-05, "loss": 2.2318, "step": 426760 }, { "epoch": 0.74, "learning_rate": 1.2788219742812598e-05, "loss": 2.1947, "step": 426770 }, { "epoch": 0.74, "learning_rate": 1.2787347802885774e-05, "loss": 2.2497, "step": 426780 }, { "epoch": 0.74, "learning_rate": 1.2786475862958946e-05, "loss": 2.3655, "step": 426790 }, { "epoch": 0.74, "learning_rate": 1.278560392303212e-05, "loss": 2.3224, "step": 426800 }, { "epoch": 0.74, "learning_rate": 1.2784731983105292e-05, "loss": 2.3529, "step": 426810 }, { "epoch": 0.74, "learning_rate": 1.2783860043178467e-05, "loss": 2.3054, "step": 426820 }, { "epoch": 0.74, "learning_rate": 1.2782988103251639e-05, "loss": 2.1812, "step": 426830 }, { "epoch": 0.74, "learning_rate": 1.2782116163324811e-05, "loss": 2.1832, "step": 426840 }, { "epoch": 0.74, "learning_rate": 1.2781244223397987e-05, "loss": 2.2471, "step": 426850 }, { "epoch": 0.74, "learning_rate": 1.2780372283471159e-05, "loss": 2.2926, "step": 426860 }, { "epoch": 0.74, "learning_rate": 1.2779500343544332e-05, "loss": 2.2486, "step": 426870 }, { "epoch": 0.74, "learning_rate": 1.2778628403617505e-05, "loss": 2.382, "step": 426880 }, { "epoch": 0.74, "learning_rate": 1.277775646369068e-05, "loss": 2.3627, "step": 426890 }, { "epoch": 0.74, "learning_rate": 1.2776884523763852e-05, "loss": 2.3608, "step": 426900 }, { "epoch": 0.74, "learning_rate": 1.2776012583837024e-05, "loss": 2.2485, "step": 426910 }, { "epoch": 0.74, "learning_rate": 1.2775140643910196e-05, "loss": 2.3219, "step": 426920 }, { "epoch": 0.74, "learning_rate": 1.2774268703983372e-05, "loss": 2.2409, "step": 426930 }, { "epoch": 0.74, "learning_rate": 1.2773396764056544e-05, "loss": 2.3138, "step": 426940 }, { "epoch": 0.74, "learning_rate": 1.2772524824129718e-05, "loss": 2.2372, "step": 426950 }, { "epoch": 0.74, "learning_rate": 1.277165288420289e-05, "loss": 2.3694, "step": 426960 }, { "epoch": 0.74, "learning_rate": 1.2770780944276065e-05, "loss": 2.3195, "step": 426970 }, { "epoch": 0.74, "learning_rate": 1.2769909004349237e-05, "loss": 2.299, "step": 426980 }, { "epoch": 0.74, "learning_rate": 1.276903706442241e-05, "loss": 2.2719, "step": 426990 }, { "epoch": 0.74, "learning_rate": 1.2768165124495585e-05, "loss": 2.3227, "step": 427000 }, { "epoch": 0.74, "learning_rate": 1.2767293184568757e-05, "loss": 2.3344, "step": 427010 }, { "epoch": 0.74, "learning_rate": 1.2766421244641929e-05, "loss": 2.3043, "step": 427020 }, { "epoch": 0.74, "learning_rate": 1.2765549304715103e-05, "loss": 2.2727, "step": 427030 }, { "epoch": 0.74, "learning_rate": 1.2764677364788278e-05, "loss": 2.2267, "step": 427040 }, { "epoch": 0.74, "learning_rate": 1.276380542486145e-05, "loss": 2.292, "step": 427050 }, { "epoch": 0.74, "learning_rate": 1.2762933484934622e-05, "loss": 2.2526, "step": 427060 }, { "epoch": 0.74, "learning_rate": 1.2762061545007794e-05, "loss": 2.32, "step": 427070 }, { "epoch": 0.74, "learning_rate": 1.276118960508097e-05, "loss": 2.3542, "step": 427080 }, { "epoch": 0.74, "learning_rate": 1.2760317665154142e-05, "loss": 2.2609, "step": 427090 }, { "epoch": 0.74, "learning_rate": 1.2759445725227314e-05, "loss": 2.2753, "step": 427100 }, { "epoch": 0.74, "learning_rate": 1.2758573785300488e-05, "loss": 2.2078, "step": 427110 }, { "epoch": 0.74, "learning_rate": 1.2757701845373663e-05, "loss": 2.353, "step": 427120 }, { "epoch": 0.74, "learning_rate": 1.2756829905446835e-05, "loss": 2.3686, "step": 427130 }, { "epoch": 0.74, "learning_rate": 1.2755957965520007e-05, "loss": 2.3508, "step": 427140 }, { "epoch": 0.74, "learning_rate": 1.2755086025593183e-05, "loss": 2.3317, "step": 427150 }, { "epoch": 0.74, "learning_rate": 1.2754214085666355e-05, "loss": 2.2903, "step": 427160 }, { "epoch": 0.74, "learning_rate": 1.2753342145739527e-05, "loss": 2.344, "step": 427170 }, { "epoch": 0.74, "learning_rate": 1.27524702058127e-05, "loss": 2.2762, "step": 427180 }, { "epoch": 0.74, "learning_rate": 1.2751598265885874e-05, "loss": 2.3019, "step": 427190 }, { "epoch": 0.74, "learning_rate": 1.2750726325959048e-05, "loss": 2.3484, "step": 427200 }, { "epoch": 0.75, "learning_rate": 1.274985438603222e-05, "loss": 2.2539, "step": 427210 }, { "epoch": 0.75, "learning_rate": 1.2748982446105392e-05, "loss": 2.2996, "step": 427220 }, { "epoch": 0.75, "learning_rate": 1.2748110506178568e-05, "loss": 2.3495, "step": 427230 }, { "epoch": 0.75, "learning_rate": 1.274723856625174e-05, "loss": 2.3103, "step": 427240 }, { "epoch": 0.75, "learning_rate": 1.2746366626324912e-05, "loss": 2.3337, "step": 427250 }, { "epoch": 0.75, "learning_rate": 1.2745494686398087e-05, "loss": 2.3735, "step": 427260 }, { "epoch": 0.75, "learning_rate": 1.274462274647126e-05, "loss": 2.3138, "step": 427270 }, { "epoch": 0.75, "learning_rate": 1.2743750806544433e-05, "loss": 2.3854, "step": 427280 }, { "epoch": 0.75, "learning_rate": 1.2742878866617605e-05, "loss": 2.2414, "step": 427290 }, { "epoch": 0.75, "learning_rate": 1.2742006926690781e-05, "loss": 2.2411, "step": 427300 }, { "epoch": 0.75, "learning_rate": 1.2741134986763953e-05, "loss": 2.328, "step": 427310 }, { "epoch": 0.75, "learning_rate": 1.2740263046837125e-05, "loss": 2.3118, "step": 427320 }, { "epoch": 0.75, "learning_rate": 1.2739391106910297e-05, "loss": 2.2028, "step": 427330 }, { "epoch": 0.75, "learning_rate": 1.2738519166983473e-05, "loss": 2.2871, "step": 427340 }, { "epoch": 0.75, "learning_rate": 1.2737647227056646e-05, "loss": 2.2957, "step": 427350 }, { "epoch": 0.75, "learning_rate": 1.2736775287129818e-05, "loss": 2.3161, "step": 427360 }, { "epoch": 0.75, "learning_rate": 1.273590334720299e-05, "loss": 2.3104, "step": 427370 }, { "epoch": 0.75, "learning_rate": 1.2735031407276166e-05, "loss": 2.1806, "step": 427380 }, { "epoch": 0.75, "learning_rate": 1.2734159467349338e-05, "loss": 2.1583, "step": 427390 }, { "epoch": 0.75, "learning_rate": 1.273328752742251e-05, "loss": 2.2891, "step": 427400 }, { "epoch": 0.75, "learning_rate": 1.2732415587495686e-05, "loss": 2.2192, "step": 427410 }, { "epoch": 0.75, "learning_rate": 1.2731543647568858e-05, "loss": 2.198, "step": 427420 }, { "epoch": 0.75, "learning_rate": 1.2730671707642031e-05, "loss": 2.2498, "step": 427430 }, { "epoch": 0.75, "learning_rate": 1.2729799767715203e-05, "loss": 2.3343, "step": 427440 }, { "epoch": 0.75, "learning_rate": 1.2728927827788379e-05, "loss": 2.2685, "step": 427450 }, { "epoch": 0.75, "learning_rate": 1.2728055887861551e-05, "loss": 2.3365, "step": 427460 }, { "epoch": 0.75, "learning_rate": 1.2727183947934723e-05, "loss": 2.2553, "step": 427470 }, { "epoch": 0.75, "learning_rate": 1.2726312008007895e-05, "loss": 2.3586, "step": 427480 }, { "epoch": 0.75, "learning_rate": 1.272544006808107e-05, "loss": 2.3864, "step": 427490 }, { "epoch": 0.75, "learning_rate": 1.2724568128154243e-05, "loss": 2.3961, "step": 427500 }, { "epoch": 0.75, "learning_rate": 1.2723696188227416e-05, "loss": 2.3577, "step": 427510 }, { "epoch": 0.75, "learning_rate": 1.272282424830059e-05, "loss": 2.4164, "step": 427520 }, { "epoch": 0.75, "learning_rate": 1.2721952308373764e-05, "loss": 2.2949, "step": 427530 }, { "epoch": 0.75, "learning_rate": 1.2721080368446936e-05, "loss": 2.3114, "step": 427540 }, { "epoch": 0.75, "learning_rate": 1.2720208428520108e-05, "loss": 2.2914, "step": 427550 }, { "epoch": 0.75, "learning_rate": 1.2719336488593284e-05, "loss": 2.3349, "step": 427560 }, { "epoch": 0.75, "learning_rate": 1.2718464548666456e-05, "loss": 2.1842, "step": 427570 }, { "epoch": 0.75, "learning_rate": 1.2717592608739628e-05, "loss": 2.3024, "step": 427580 }, { "epoch": 0.75, "learning_rate": 1.2716720668812802e-05, "loss": 2.3439, "step": 427590 }, { "epoch": 0.75, "learning_rate": 1.2715848728885977e-05, "loss": 2.4224, "step": 427600 }, { "epoch": 0.75, "learning_rate": 1.2714976788959149e-05, "loss": 2.2835, "step": 427610 }, { "epoch": 0.75, "learning_rate": 1.2714104849032321e-05, "loss": 2.4283, "step": 427620 }, { "epoch": 0.75, "learning_rate": 1.2713232909105493e-05, "loss": 2.3624, "step": 427630 }, { "epoch": 0.75, "learning_rate": 1.2712360969178669e-05, "loss": 2.291, "step": 427640 }, { "epoch": 0.75, "learning_rate": 1.271148902925184e-05, "loss": 2.338, "step": 427650 }, { "epoch": 0.75, "learning_rate": 1.2710617089325015e-05, "loss": 2.137, "step": 427660 }, { "epoch": 0.75, "learning_rate": 1.2709745149398188e-05, "loss": 2.3319, "step": 427670 }, { "epoch": 0.75, "learning_rate": 1.2708873209471362e-05, "loss": 2.358, "step": 427680 }, { "epoch": 0.75, "learning_rate": 1.2708001269544534e-05, "loss": 2.1922, "step": 427690 }, { "epoch": 0.75, "learning_rate": 1.2707129329617706e-05, "loss": 2.3485, "step": 427700 }, { "epoch": 0.75, "learning_rate": 1.2706257389690882e-05, "loss": 2.3436, "step": 427710 }, { "epoch": 0.75, "learning_rate": 1.2705385449764054e-05, "loss": 2.2881, "step": 427720 }, { "epoch": 0.75, "learning_rate": 1.2704513509837226e-05, "loss": 2.2323, "step": 427730 }, { "epoch": 0.75, "learning_rate": 1.27036415699104e-05, "loss": 2.2931, "step": 427740 }, { "epoch": 0.75, "learning_rate": 1.2702769629983573e-05, "loss": 2.3473, "step": 427750 }, { "epoch": 0.75, "learning_rate": 1.2701897690056747e-05, "loss": 2.238, "step": 427760 }, { "epoch": 0.75, "learning_rate": 1.270102575012992e-05, "loss": 2.3562, "step": 427770 }, { "epoch": 0.75, "learning_rate": 1.2700153810203091e-05, "loss": 2.2953, "step": 427780 }, { "epoch": 0.75, "learning_rate": 1.2699281870276267e-05, "loss": 2.3623, "step": 427790 }, { "epoch": 0.75, "learning_rate": 1.2698409930349439e-05, "loss": 2.4194, "step": 427800 }, { "epoch": 0.75, "learning_rate": 1.2697537990422611e-05, "loss": 2.2922, "step": 427810 }, { "epoch": 0.75, "learning_rate": 1.2696666050495786e-05, "loss": 2.3996, "step": 427820 }, { "epoch": 0.75, "learning_rate": 1.2695794110568958e-05, "loss": 2.3309, "step": 427830 }, { "epoch": 0.75, "learning_rate": 1.2694922170642132e-05, "loss": 2.2257, "step": 427840 }, { "epoch": 0.75, "learning_rate": 1.2694050230715304e-05, "loss": 2.3211, "step": 427850 }, { "epoch": 0.75, "learning_rate": 1.269317829078848e-05, "loss": 2.3007, "step": 427860 }, { "epoch": 0.75, "learning_rate": 1.2692306350861652e-05, "loss": 2.2854, "step": 427870 }, { "epoch": 0.75, "learning_rate": 1.2691434410934824e-05, "loss": 2.3506, "step": 427880 }, { "epoch": 0.75, "learning_rate": 1.2690562471007996e-05, "loss": 2.3264, "step": 427890 }, { "epoch": 0.75, "learning_rate": 1.2689690531081171e-05, "loss": 2.2475, "step": 427900 }, { "epoch": 0.75, "learning_rate": 1.2688818591154345e-05, "loss": 2.3421, "step": 427910 }, { "epoch": 0.75, "learning_rate": 1.2687946651227517e-05, "loss": 2.2825, "step": 427920 }, { "epoch": 0.75, "learning_rate": 1.2687074711300693e-05, "loss": 2.3102, "step": 427930 }, { "epoch": 0.75, "learning_rate": 1.2686202771373865e-05, "loss": 2.2546, "step": 427940 }, { "epoch": 0.75, "learning_rate": 1.2685330831447037e-05, "loss": 2.2659, "step": 427950 }, { "epoch": 0.75, "learning_rate": 1.2684458891520209e-05, "loss": 2.2774, "step": 427960 }, { "epoch": 0.75, "learning_rate": 1.2683586951593384e-05, "loss": 2.2001, "step": 427970 }, { "epoch": 0.75, "learning_rate": 1.2682715011666557e-05, "loss": 2.2541, "step": 427980 }, { "epoch": 0.75, "learning_rate": 1.268184307173973e-05, "loss": 2.3907, "step": 427990 }, { "epoch": 0.75, "learning_rate": 1.2680971131812902e-05, "loss": 2.3241, "step": 428000 }, { "epoch": 0.75, "learning_rate": 1.2680099191886078e-05, "loss": 2.3213, "step": 428010 }, { "epoch": 0.75, "learning_rate": 1.267922725195925e-05, "loss": 2.3483, "step": 428020 }, { "epoch": 0.75, "learning_rate": 1.2678355312032422e-05, "loss": 2.3835, "step": 428030 }, { "epoch": 0.75, "learning_rate": 1.2677483372105594e-05, "loss": 2.3446, "step": 428040 }, { "epoch": 0.75, "learning_rate": 1.267661143217877e-05, "loss": 2.3246, "step": 428050 }, { "epoch": 0.75, "learning_rate": 1.2675739492251942e-05, "loss": 2.2427, "step": 428060 }, { "epoch": 0.75, "learning_rate": 1.2674867552325115e-05, "loss": 2.2901, "step": 428070 }, { "epoch": 0.75, "learning_rate": 1.2673995612398291e-05, "loss": 2.0889, "step": 428080 }, { "epoch": 0.75, "learning_rate": 1.2673123672471463e-05, "loss": 2.2811, "step": 428090 }, { "epoch": 0.75, "learning_rate": 1.2672251732544635e-05, "loss": 2.3438, "step": 428100 }, { "epoch": 0.75, "learning_rate": 1.2671379792617807e-05, "loss": 2.2951, "step": 428110 }, { "epoch": 0.75, "learning_rate": 1.2670507852690983e-05, "loss": 2.2885, "step": 428120 }, { "epoch": 0.75, "learning_rate": 1.2669635912764155e-05, "loss": 2.3522, "step": 428130 }, { "epoch": 0.75, "learning_rate": 1.2668763972837327e-05, "loss": 2.3224, "step": 428140 }, { "epoch": 0.75, "learning_rate": 1.26678920329105e-05, "loss": 2.3119, "step": 428150 }, { "epoch": 0.75, "learning_rate": 1.2667020092983676e-05, "loss": 2.2574, "step": 428160 }, { "epoch": 0.75, "learning_rate": 1.2666148153056848e-05, "loss": 2.2948, "step": 428170 }, { "epoch": 0.75, "learning_rate": 1.266527621313002e-05, "loss": 2.4124, "step": 428180 }, { "epoch": 0.75, "learning_rate": 1.2664404273203196e-05, "loss": 2.2785, "step": 428190 }, { "epoch": 0.75, "learning_rate": 1.2663532333276368e-05, "loss": 2.2787, "step": 428200 }, { "epoch": 0.75, "learning_rate": 1.266266039334954e-05, "loss": 2.336, "step": 428210 }, { "epoch": 0.75, "learning_rate": 1.2661788453422713e-05, "loss": 2.2911, "step": 428220 }, { "epoch": 0.75, "learning_rate": 1.2660916513495887e-05, "loss": 2.3358, "step": 428230 }, { "epoch": 0.75, "learning_rate": 1.2660044573569061e-05, "loss": 2.3435, "step": 428240 }, { "epoch": 0.75, "learning_rate": 1.2659172633642233e-05, "loss": 2.3094, "step": 428250 }, { "epoch": 0.75, "learning_rate": 1.2658300693715405e-05, "loss": 2.2371, "step": 428260 }, { "epoch": 0.75, "learning_rate": 1.265742875378858e-05, "loss": 2.149, "step": 428270 }, { "epoch": 0.75, "learning_rate": 1.2656556813861753e-05, "loss": 2.3117, "step": 428280 }, { "epoch": 0.75, "learning_rate": 1.2655684873934925e-05, "loss": 2.3452, "step": 428290 }, { "epoch": 0.75, "learning_rate": 1.2654812934008099e-05, "loss": 2.4521, "step": 428300 }, { "epoch": 0.75, "learning_rate": 1.2653940994081272e-05, "loss": 2.3157, "step": 428310 }, { "epoch": 0.75, "learning_rate": 1.2653069054154446e-05, "loss": 2.3468, "step": 428320 }, { "epoch": 0.75, "learning_rate": 1.2652197114227618e-05, "loss": 2.2541, "step": 428330 }, { "epoch": 0.75, "learning_rate": 1.2651325174300794e-05, "loss": 2.3085, "step": 428340 }, { "epoch": 0.75, "learning_rate": 1.2650453234373966e-05, "loss": 2.3485, "step": 428350 }, { "epoch": 0.75, "learning_rate": 1.2649581294447138e-05, "loss": 2.3203, "step": 428360 }, { "epoch": 0.75, "learning_rate": 1.264870935452031e-05, "loss": 2.2292, "step": 428370 }, { "epoch": 0.75, "learning_rate": 1.2647837414593485e-05, "loss": 2.3703, "step": 428380 }, { "epoch": 0.75, "learning_rate": 1.2646965474666659e-05, "loss": 2.3596, "step": 428390 }, { "epoch": 0.75, "learning_rate": 1.2646093534739831e-05, "loss": 2.2557, "step": 428400 }, { "epoch": 0.75, "learning_rate": 1.2645221594813003e-05, "loss": 2.2273, "step": 428410 }, { "epoch": 0.75, "learning_rate": 1.2644349654886179e-05, "loss": 2.2813, "step": 428420 }, { "epoch": 0.75, "learning_rate": 1.264347771495935e-05, "loss": 2.3938, "step": 428430 }, { "epoch": 0.75, "learning_rate": 1.2642605775032523e-05, "loss": 2.2174, "step": 428440 }, { "epoch": 0.75, "learning_rate": 1.2641733835105698e-05, "loss": 2.3638, "step": 428450 }, { "epoch": 0.75, "learning_rate": 1.264086189517887e-05, "loss": 2.2816, "step": 428460 }, { "epoch": 0.75, "learning_rate": 1.2639989955252044e-05, "loss": 2.2666, "step": 428470 }, { "epoch": 0.75, "learning_rate": 1.2639118015325216e-05, "loss": 2.424, "step": 428480 }, { "epoch": 0.75, "learning_rate": 1.2638246075398392e-05, "loss": 2.2251, "step": 428490 }, { "epoch": 0.75, "learning_rate": 1.2637374135471564e-05, "loss": 2.2485, "step": 428500 }, { "epoch": 0.75, "learning_rate": 1.2636502195544736e-05, "loss": 2.2797, "step": 428510 }, { "epoch": 0.75, "learning_rate": 1.2635630255617908e-05, "loss": 2.2738, "step": 428520 }, { "epoch": 0.75, "learning_rate": 1.2634758315691083e-05, "loss": 2.2671, "step": 428530 }, { "epoch": 0.75, "learning_rate": 1.2633886375764255e-05, "loss": 2.2411, "step": 428540 }, { "epoch": 0.75, "learning_rate": 1.263301443583743e-05, "loss": 2.3489, "step": 428550 }, { "epoch": 0.75, "learning_rate": 1.2632142495910601e-05, "loss": 2.3603, "step": 428560 }, { "epoch": 0.75, "learning_rate": 1.2631270555983777e-05, "loss": 2.2538, "step": 428570 }, { "epoch": 0.75, "learning_rate": 1.2630398616056949e-05, "loss": 2.2398, "step": 428580 }, { "epoch": 0.75, "learning_rate": 1.2629526676130121e-05, "loss": 2.3871, "step": 428590 }, { "epoch": 0.75, "learning_rate": 1.2628654736203296e-05, "loss": 2.3093, "step": 428600 }, { "epoch": 0.75, "learning_rate": 1.2627782796276468e-05, "loss": 2.3077, "step": 428610 }, { "epoch": 0.75, "learning_rate": 1.262691085634964e-05, "loss": 2.3587, "step": 428620 }, { "epoch": 0.75, "learning_rate": 1.2626038916422814e-05, "loss": 2.2906, "step": 428630 }, { "epoch": 0.75, "learning_rate": 1.262516697649599e-05, "loss": 2.2076, "step": 428640 }, { "epoch": 0.75, "learning_rate": 1.2624295036569162e-05, "loss": 2.1888, "step": 428650 }, { "epoch": 0.75, "learning_rate": 1.2623423096642334e-05, "loss": 2.299, "step": 428660 }, { "epoch": 0.75, "learning_rate": 1.2622551156715506e-05, "loss": 2.3576, "step": 428670 }, { "epoch": 0.75, "learning_rate": 1.2621679216788681e-05, "loss": 2.1995, "step": 428680 }, { "epoch": 0.75, "learning_rate": 1.2620807276861854e-05, "loss": 2.3016, "step": 428690 }, { "epoch": 0.75, "learning_rate": 1.2619935336935027e-05, "loss": 2.1625, "step": 428700 }, { "epoch": 0.75, "learning_rate": 1.26190633970082e-05, "loss": 2.3626, "step": 428710 }, { "epoch": 0.75, "learning_rate": 1.2618191457081375e-05, "loss": 2.3414, "step": 428720 }, { "epoch": 0.75, "learning_rate": 1.2617319517154547e-05, "loss": 2.3943, "step": 428730 }, { "epoch": 0.75, "learning_rate": 1.2616447577227719e-05, "loss": 2.2171, "step": 428740 }, { "epoch": 0.75, "learning_rate": 1.2615575637300894e-05, "loss": 2.2017, "step": 428750 }, { "epoch": 0.75, "learning_rate": 1.2614703697374067e-05, "loss": 2.2874, "step": 428760 }, { "epoch": 0.75, "learning_rate": 1.2613831757447239e-05, "loss": 2.3699, "step": 428770 }, { "epoch": 0.75, "learning_rate": 1.2612959817520412e-05, "loss": 2.3567, "step": 428780 }, { "epoch": 0.75, "learning_rate": 1.2612087877593586e-05, "loss": 2.3365, "step": 428790 }, { "epoch": 0.75, "learning_rate": 1.261121593766676e-05, "loss": 2.2256, "step": 428800 }, { "epoch": 0.75, "learning_rate": 1.2610343997739932e-05, "loss": 2.263, "step": 428810 }, { "epoch": 0.75, "learning_rate": 1.2609472057813104e-05, "loss": 2.1801, "step": 428820 }, { "epoch": 0.75, "learning_rate": 1.260860011788628e-05, "loss": 2.3598, "step": 428830 }, { "epoch": 0.75, "learning_rate": 1.2607728177959452e-05, "loss": 2.18, "step": 428840 }, { "epoch": 0.75, "learning_rate": 1.2606856238032624e-05, "loss": 2.2425, "step": 428850 }, { "epoch": 0.75, "learning_rate": 1.26059842981058e-05, "loss": 2.2818, "step": 428860 }, { "epoch": 0.75, "learning_rate": 1.2605112358178971e-05, "loss": 2.2217, "step": 428870 }, { "epoch": 0.75, "learning_rate": 1.2604240418252145e-05, "loss": 2.3881, "step": 428880 }, { "epoch": 0.75, "learning_rate": 1.2603368478325317e-05, "loss": 2.3546, "step": 428890 }, { "epoch": 0.75, "learning_rate": 1.2602496538398493e-05, "loss": 2.38, "step": 428900 }, { "epoch": 0.75, "learning_rate": 1.2601624598471665e-05, "loss": 2.2649, "step": 428910 }, { "epoch": 0.75, "learning_rate": 1.2600752658544837e-05, "loss": 2.2933, "step": 428920 }, { "epoch": 0.75, "learning_rate": 1.2599880718618009e-05, "loss": 2.2862, "step": 428930 }, { "epoch": 0.75, "learning_rate": 1.2599008778691184e-05, "loss": 2.207, "step": 428940 }, { "epoch": 0.75, "learning_rate": 1.2598136838764358e-05, "loss": 2.1495, "step": 428950 }, { "epoch": 0.75, "learning_rate": 1.259726489883753e-05, "loss": 2.2837, "step": 428960 }, { "epoch": 0.75, "learning_rate": 1.2596392958910702e-05, "loss": 2.1271, "step": 428970 }, { "epoch": 0.75, "learning_rate": 1.2595521018983878e-05, "loss": 2.3183, "step": 428980 }, { "epoch": 0.75, "learning_rate": 1.259464907905705e-05, "loss": 2.2, "step": 428990 }, { "epoch": 0.75, "learning_rate": 1.2593777139130222e-05, "loss": 2.2845, "step": 429000 }, { "epoch": 0.75, "learning_rate": 1.2592905199203397e-05, "loss": 2.255, "step": 429010 }, { "epoch": 0.75, "learning_rate": 1.259203325927657e-05, "loss": 2.2112, "step": 429020 }, { "epoch": 0.75, "learning_rate": 1.2591161319349743e-05, "loss": 2.3706, "step": 429030 }, { "epoch": 0.75, "learning_rate": 1.2590289379422915e-05, "loss": 2.3109, "step": 429040 }, { "epoch": 0.75, "learning_rate": 1.258941743949609e-05, "loss": 2.3016, "step": 429050 }, { "epoch": 0.75, "learning_rate": 1.2588545499569263e-05, "loss": 2.2403, "step": 429060 }, { "epoch": 0.75, "learning_rate": 1.2587673559642435e-05, "loss": 2.3567, "step": 429070 }, { "epoch": 0.75, "learning_rate": 1.2586801619715607e-05, "loss": 2.2794, "step": 429080 }, { "epoch": 0.75, "learning_rate": 1.2585929679788782e-05, "loss": 2.2749, "step": 429090 }, { "epoch": 0.75, "learning_rate": 1.2585057739861954e-05, "loss": 2.3986, "step": 429100 }, { "epoch": 0.75, "learning_rate": 1.2584185799935128e-05, "loss": 2.3954, "step": 429110 }, { "epoch": 0.75, "learning_rate": 1.2583313860008304e-05, "loss": 2.3538, "step": 429120 }, { "epoch": 0.75, "learning_rate": 1.2582441920081476e-05, "loss": 2.2754, "step": 429130 }, { "epoch": 0.75, "learning_rate": 1.2581569980154648e-05, "loss": 2.2697, "step": 429140 }, { "epoch": 0.75, "learning_rate": 1.258069804022782e-05, "loss": 2.3046, "step": 429150 }, { "epoch": 0.75, "learning_rate": 1.2579826100300995e-05, "loss": 2.2519, "step": 429160 }, { "epoch": 0.75, "learning_rate": 1.2578954160374167e-05, "loss": 2.2765, "step": 429170 }, { "epoch": 0.75, "learning_rate": 1.257808222044734e-05, "loss": 2.2253, "step": 429180 }, { "epoch": 0.75, "learning_rate": 1.2577210280520513e-05, "loss": 2.3191, "step": 429190 }, { "epoch": 0.75, "learning_rate": 1.2576338340593689e-05, "loss": 2.1579, "step": 429200 }, { "epoch": 0.75, "learning_rate": 1.257546640066686e-05, "loss": 2.2884, "step": 429210 }, { "epoch": 0.75, "learning_rate": 1.2574594460740033e-05, "loss": 2.3666, "step": 429220 }, { "epoch": 0.75, "learning_rate": 1.2573722520813205e-05, "loss": 2.3003, "step": 429230 }, { "epoch": 0.75, "learning_rate": 1.257285058088638e-05, "loss": 2.3723, "step": 429240 }, { "epoch": 0.75, "learning_rate": 1.2571978640959552e-05, "loss": 2.3006, "step": 429250 }, { "epoch": 0.75, "learning_rate": 1.2571106701032726e-05, "loss": 2.3629, "step": 429260 }, { "epoch": 0.75, "learning_rate": 1.25702347611059e-05, "loss": 2.2096, "step": 429270 }, { "epoch": 0.75, "learning_rate": 1.2569362821179074e-05, "loss": 2.3598, "step": 429280 }, { "epoch": 0.75, "learning_rate": 1.2568490881252246e-05, "loss": 2.3131, "step": 429290 }, { "epoch": 0.75, "learning_rate": 1.2567618941325418e-05, "loss": 2.2707, "step": 429300 }, { "epoch": 0.75, "learning_rate": 1.2566747001398593e-05, "loss": 2.2118, "step": 429310 }, { "epoch": 0.75, "learning_rate": 1.2565875061471765e-05, "loss": 2.2013, "step": 429320 }, { "epoch": 0.75, "learning_rate": 1.2565003121544938e-05, "loss": 2.3399, "step": 429330 }, { "epoch": 0.75, "learning_rate": 1.2564131181618111e-05, "loss": 2.3324, "step": 429340 }, { "epoch": 0.75, "learning_rate": 1.2563259241691285e-05, "loss": 2.3219, "step": 429350 }, { "epoch": 0.75, "learning_rate": 1.2562387301764459e-05, "loss": 2.338, "step": 429360 }, { "epoch": 0.75, "learning_rate": 1.2561515361837631e-05, "loss": 2.2719, "step": 429370 }, { "epoch": 0.75, "learning_rate": 1.2560643421910806e-05, "loss": 2.3537, "step": 429380 }, { "epoch": 0.75, "learning_rate": 1.2559771481983978e-05, "loss": 2.344, "step": 429390 }, { "epoch": 0.75, "learning_rate": 1.255889954205715e-05, "loss": 2.3254, "step": 429400 }, { "epoch": 0.75, "learning_rate": 1.2558027602130323e-05, "loss": 2.2969, "step": 429410 }, { "epoch": 0.75, "learning_rate": 1.2557155662203498e-05, "loss": 2.3201, "step": 429420 }, { "epoch": 0.75, "learning_rate": 1.2556283722276672e-05, "loss": 2.2946, "step": 429430 }, { "epoch": 0.75, "learning_rate": 1.2555411782349844e-05, "loss": 2.311, "step": 429440 }, { "epoch": 0.75, "learning_rate": 1.2554539842423016e-05, "loss": 2.3764, "step": 429450 }, { "epoch": 0.75, "learning_rate": 1.2553667902496191e-05, "loss": 2.2321, "step": 429460 }, { "epoch": 0.75, "learning_rate": 1.2552795962569364e-05, "loss": 2.2953, "step": 429470 }, { "epoch": 0.75, "learning_rate": 1.2551924022642536e-05, "loss": 2.2417, "step": 429480 }, { "epoch": 0.75, "learning_rate": 1.2551052082715708e-05, "loss": 2.2974, "step": 429490 }, { "epoch": 0.75, "learning_rate": 1.2550180142788883e-05, "loss": 2.3408, "step": 429500 }, { "epoch": 0.75, "learning_rate": 1.2549308202862057e-05, "loss": 2.221, "step": 429510 }, { "epoch": 0.75, "learning_rate": 1.2548436262935229e-05, "loss": 2.3572, "step": 429520 }, { "epoch": 0.75, "learning_rate": 1.2547564323008404e-05, "loss": 2.4, "step": 429530 }, { "epoch": 0.75, "learning_rate": 1.2546692383081577e-05, "loss": 2.1124, "step": 429540 }, { "epoch": 0.75, "learning_rate": 1.2545820443154749e-05, "loss": 2.321, "step": 429550 }, { "epoch": 0.75, "learning_rate": 1.254494850322792e-05, "loss": 2.3177, "step": 429560 }, { "epoch": 0.75, "learning_rate": 1.2544076563301096e-05, "loss": 2.4005, "step": 429570 }, { "epoch": 0.75, "learning_rate": 1.2543204623374268e-05, "loss": 2.32, "step": 429580 }, { "epoch": 0.75, "learning_rate": 1.2542332683447442e-05, "loss": 2.2283, "step": 429590 }, { "epoch": 0.75, "learning_rate": 1.2541460743520614e-05, "loss": 2.4201, "step": 429600 }, { "epoch": 0.75, "learning_rate": 1.254058880359379e-05, "loss": 2.3056, "step": 429610 }, { "epoch": 0.75, "learning_rate": 1.2539716863666962e-05, "loss": 2.2576, "step": 429620 }, { "epoch": 0.75, "learning_rate": 1.2538844923740134e-05, "loss": 2.4192, "step": 429630 }, { "epoch": 0.75, "learning_rate": 1.2537972983813306e-05, "loss": 2.3112, "step": 429640 }, { "epoch": 0.75, "learning_rate": 1.2537101043886481e-05, "loss": 2.2509, "step": 429650 }, { "epoch": 0.75, "learning_rate": 1.2536229103959653e-05, "loss": 2.2446, "step": 429660 }, { "epoch": 0.75, "learning_rate": 1.2535357164032827e-05, "loss": 2.2774, "step": 429670 }, { "epoch": 0.75, "learning_rate": 1.2534485224106003e-05, "loss": 2.2675, "step": 429680 }, { "epoch": 0.75, "learning_rate": 1.2533613284179175e-05, "loss": 2.2531, "step": 429690 }, { "epoch": 0.75, "learning_rate": 1.2532741344252347e-05, "loss": 2.3141, "step": 429700 }, { "epoch": 0.75, "learning_rate": 1.2531869404325519e-05, "loss": 2.3724, "step": 429710 }, { "epoch": 0.75, "learning_rate": 1.2530997464398694e-05, "loss": 2.4073, "step": 429720 }, { "epoch": 0.75, "learning_rate": 1.2530125524471866e-05, "loss": 2.2659, "step": 429730 }, { "epoch": 0.75, "learning_rate": 1.252925358454504e-05, "loss": 2.335, "step": 429740 }, { "epoch": 0.75, "learning_rate": 1.2528381644618212e-05, "loss": 2.3803, "step": 429750 }, { "epoch": 0.75, "learning_rate": 1.2527509704691388e-05, "loss": 2.3049, "step": 429760 }, { "epoch": 0.75, "learning_rate": 1.252663776476456e-05, "loss": 2.44, "step": 429770 }, { "epoch": 0.75, "learning_rate": 1.2525765824837732e-05, "loss": 2.3378, "step": 429780 }, { "epoch": 0.75, "learning_rate": 1.2524893884910907e-05, "loss": 2.3233, "step": 429790 }, { "epoch": 0.75, "learning_rate": 1.252402194498408e-05, "loss": 2.2883, "step": 429800 }, { "epoch": 0.75, "learning_rate": 1.2523150005057251e-05, "loss": 2.2993, "step": 429810 }, { "epoch": 0.75, "learning_rate": 1.2522278065130425e-05, "loss": 2.286, "step": 429820 }, { "epoch": 0.75, "learning_rate": 1.2521406125203599e-05, "loss": 2.3248, "step": 429830 }, { "epoch": 0.75, "learning_rate": 1.2520534185276773e-05, "loss": 2.3474, "step": 429840 }, { "epoch": 0.75, "learning_rate": 1.2519662245349945e-05, "loss": 2.353, "step": 429850 }, { "epoch": 0.75, "learning_rate": 1.2518790305423117e-05, "loss": 2.2929, "step": 429860 }, { "epoch": 0.75, "learning_rate": 1.2517918365496292e-05, "loss": 2.2918, "step": 429870 }, { "epoch": 0.75, "learning_rate": 1.2517046425569464e-05, "loss": 2.1749, "step": 429880 }, { "epoch": 0.75, "learning_rate": 1.2516174485642636e-05, "loss": 2.3313, "step": 429890 }, { "epoch": 0.75, "learning_rate": 1.251530254571581e-05, "loss": 2.3798, "step": 429900 }, { "epoch": 0.75, "learning_rate": 1.2514430605788984e-05, "loss": 2.3129, "step": 429910 }, { "epoch": 0.75, "learning_rate": 1.2513558665862158e-05, "loss": 2.3621, "step": 429920 }, { "epoch": 0.75, "learning_rate": 1.251268672593533e-05, "loss": 2.3206, "step": 429930 }, { "epoch": 0.75, "learning_rate": 1.2511814786008505e-05, "loss": 2.3201, "step": 429940 }, { "epoch": 0.75, "learning_rate": 1.2510942846081677e-05, "loss": 2.2501, "step": 429950 }, { "epoch": 0.75, "learning_rate": 1.251007090615485e-05, "loss": 2.3295, "step": 429960 }, { "epoch": 0.75, "learning_rate": 1.2509198966228022e-05, "loss": 2.2833, "step": 429970 }, { "epoch": 0.75, "learning_rate": 1.2508327026301197e-05, "loss": 2.307, "step": 429980 }, { "epoch": 0.75, "learning_rate": 1.250745508637437e-05, "loss": 2.1906, "step": 429990 }, { "epoch": 0.75, "learning_rate": 1.2506583146447543e-05, "loss": 2.3406, "step": 430000 }, { "epoch": 0.75, "learning_rate": 1.2505711206520715e-05, "loss": 2.2772, "step": 430010 }, { "epoch": 0.75, "learning_rate": 1.250483926659389e-05, "loss": 2.2328, "step": 430020 }, { "epoch": 0.75, "learning_rate": 1.2503967326667062e-05, "loss": 2.3465, "step": 430030 }, { "epoch": 0.75, "learning_rate": 1.2503095386740235e-05, "loss": 2.204, "step": 430040 }, { "epoch": 0.75, "learning_rate": 1.250222344681341e-05, "loss": 2.2941, "step": 430050 }, { "epoch": 0.75, "learning_rate": 1.2501351506886582e-05, "loss": 2.291, "step": 430060 }, { "epoch": 0.75, "learning_rate": 1.2500479566959756e-05, "loss": 2.302, "step": 430070 }, { "epoch": 0.75, "learning_rate": 1.249960762703293e-05, "loss": 2.3651, "step": 430080 }, { "epoch": 0.75, "learning_rate": 1.2498735687106102e-05, "loss": 2.2469, "step": 430090 }, { "epoch": 0.75, "learning_rate": 1.2497863747179275e-05, "loss": 2.2324, "step": 430100 }, { "epoch": 0.75, "learning_rate": 1.2496991807252448e-05, "loss": 2.3362, "step": 430110 }, { "epoch": 0.75, "learning_rate": 1.2496119867325621e-05, "loss": 2.1829, "step": 430120 }, { "epoch": 0.75, "learning_rate": 1.2495247927398793e-05, "loss": 2.338, "step": 430130 }, { "epoch": 0.75, "learning_rate": 1.2494375987471967e-05, "loss": 2.1362, "step": 430140 }, { "epoch": 0.75, "learning_rate": 1.2493504047545141e-05, "loss": 2.1693, "step": 430150 }, { "epoch": 0.75, "learning_rate": 1.2492632107618315e-05, "loss": 2.3345, "step": 430160 }, { "epoch": 0.75, "learning_rate": 1.2491760167691487e-05, "loss": 2.31, "step": 430170 }, { "epoch": 0.75, "learning_rate": 1.249088822776466e-05, "loss": 2.1956, "step": 430180 }, { "epoch": 0.75, "learning_rate": 1.2490016287837834e-05, "loss": 2.2792, "step": 430190 }, { "epoch": 0.75, "learning_rate": 1.2489144347911006e-05, "loss": 2.277, "step": 430200 }, { "epoch": 0.75, "learning_rate": 1.248827240798418e-05, "loss": 2.2261, "step": 430210 }, { "epoch": 0.75, "learning_rate": 1.2487400468057352e-05, "loss": 2.3165, "step": 430220 }, { "epoch": 0.75, "learning_rate": 1.2486528528130528e-05, "loss": 2.2603, "step": 430230 }, { "epoch": 0.75, "learning_rate": 1.24856565882037e-05, "loss": 2.2627, "step": 430240 }, { "epoch": 0.75, "learning_rate": 1.2484784648276874e-05, "loss": 2.2724, "step": 430250 }, { "epoch": 0.75, "learning_rate": 1.2483912708350046e-05, "loss": 2.326, "step": 430260 }, { "epoch": 0.75, "learning_rate": 1.248304076842322e-05, "loss": 2.3078, "step": 430270 }, { "epoch": 0.75, "learning_rate": 1.2482168828496391e-05, "loss": 2.2616, "step": 430280 }, { "epoch": 0.75, "learning_rate": 1.2481296888569565e-05, "loss": 2.3336, "step": 430290 }, { "epoch": 0.75, "learning_rate": 1.2480424948642739e-05, "loss": 2.2896, "step": 430300 }, { "epoch": 0.75, "learning_rate": 1.2479553008715913e-05, "loss": 2.2755, "step": 430310 }, { "epoch": 0.75, "learning_rate": 1.2478681068789087e-05, "loss": 2.3078, "step": 430320 }, { "epoch": 0.75, "learning_rate": 1.2477809128862259e-05, "loss": 2.4001, "step": 430330 }, { "epoch": 0.75, "learning_rate": 1.2476937188935432e-05, "loss": 2.3428, "step": 430340 }, { "epoch": 0.75, "learning_rate": 1.2476065249008604e-05, "loss": 2.4513, "step": 430350 }, { "epoch": 0.75, "learning_rate": 1.2475193309081778e-05, "loss": 2.2398, "step": 430360 }, { "epoch": 0.75, "learning_rate": 1.247432136915495e-05, "loss": 2.3023, "step": 430370 }, { "epoch": 0.75, "learning_rate": 1.2473449429228124e-05, "loss": 2.2842, "step": 430380 }, { "epoch": 0.75, "learning_rate": 1.2472577489301298e-05, "loss": 2.3243, "step": 430390 }, { "epoch": 0.75, "learning_rate": 1.2471705549374472e-05, "loss": 2.1835, "step": 430400 }, { "epoch": 0.75, "learning_rate": 1.2470833609447644e-05, "loss": 2.2384, "step": 430410 }, { "epoch": 0.75, "learning_rate": 1.2469961669520817e-05, "loss": 2.2934, "step": 430420 }, { "epoch": 0.75, "learning_rate": 1.246908972959399e-05, "loss": 2.2791, "step": 430430 }, { "epoch": 0.75, "learning_rate": 1.2468217789667163e-05, "loss": 2.3289, "step": 430440 }, { "epoch": 0.75, "learning_rate": 1.2467345849740337e-05, "loss": 2.2266, "step": 430450 }, { "epoch": 0.75, "learning_rate": 1.246647390981351e-05, "loss": 2.283, "step": 430460 }, { "epoch": 0.75, "learning_rate": 1.2465601969886685e-05, "loss": 2.2633, "step": 430470 }, { "epoch": 0.75, "learning_rate": 1.2464730029959857e-05, "loss": 2.2677, "step": 430480 }, { "epoch": 0.75, "learning_rate": 1.246385809003303e-05, "loss": 2.35, "step": 430490 }, { "epoch": 0.75, "learning_rate": 1.2462986150106203e-05, "loss": 2.2852, "step": 430500 }, { "epoch": 0.75, "learning_rate": 1.2462114210179376e-05, "loss": 2.2767, "step": 430510 }, { "epoch": 0.75, "learning_rate": 1.2461242270252548e-05, "loss": 2.1912, "step": 430520 }, { "epoch": 0.75, "learning_rate": 1.2460370330325722e-05, "loss": 2.23, "step": 430530 }, { "epoch": 0.75, "learning_rate": 1.2459498390398896e-05, "loss": 2.3149, "step": 430540 }, { "epoch": 0.75, "learning_rate": 1.245862645047207e-05, "loss": 2.3125, "step": 430550 }, { "epoch": 0.75, "learning_rate": 1.2457754510545242e-05, "loss": 2.2934, "step": 430560 }, { "epoch": 0.75, "learning_rate": 1.2456882570618416e-05, "loss": 2.3053, "step": 430570 }, { "epoch": 0.75, "learning_rate": 1.245601063069159e-05, "loss": 2.3255, "step": 430580 }, { "epoch": 0.75, "learning_rate": 1.2455138690764761e-05, "loss": 2.2165, "step": 430590 }, { "epoch": 0.75, "learning_rate": 1.2454266750837935e-05, "loss": 2.3666, "step": 430600 }, { "epoch": 0.75, "learning_rate": 1.2453394810911107e-05, "loss": 2.2977, "step": 430610 }, { "epoch": 0.75, "learning_rate": 1.2452522870984281e-05, "loss": 2.2188, "step": 430620 }, { "epoch": 0.75, "learning_rate": 1.2451650931057455e-05, "loss": 2.2685, "step": 430630 }, { "epoch": 0.75, "learning_rate": 1.2450778991130629e-05, "loss": 2.2936, "step": 430640 }, { "epoch": 0.75, "learning_rate": 1.24499070512038e-05, "loss": 2.3253, "step": 430650 }, { "epoch": 0.75, "learning_rate": 1.2449035111276974e-05, "loss": 2.2544, "step": 430660 }, { "epoch": 0.75, "learning_rate": 1.2448163171350146e-05, "loss": 2.213, "step": 430670 }, { "epoch": 0.75, "learning_rate": 1.244729123142332e-05, "loss": 2.2439, "step": 430680 }, { "epoch": 0.75, "learning_rate": 1.2446419291496492e-05, "loss": 2.2306, "step": 430690 }, { "epoch": 0.75, "learning_rate": 1.2445547351569666e-05, "loss": 2.3207, "step": 430700 }, { "epoch": 0.75, "learning_rate": 1.2444675411642842e-05, "loss": 2.1876, "step": 430710 }, { "epoch": 0.75, "learning_rate": 1.2443803471716014e-05, "loss": 2.3452, "step": 430720 }, { "epoch": 0.75, "learning_rate": 1.2442931531789187e-05, "loss": 2.2607, "step": 430730 }, { "epoch": 0.75, "learning_rate": 1.244205959186236e-05, "loss": 2.3531, "step": 430740 }, { "epoch": 0.75, "learning_rate": 1.2441187651935533e-05, "loss": 2.253, "step": 430750 }, { "epoch": 0.75, "learning_rate": 1.2440315712008705e-05, "loss": 2.2587, "step": 430760 }, { "epoch": 0.75, "learning_rate": 1.2439443772081879e-05, "loss": 2.3564, "step": 430770 }, { "epoch": 0.75, "learning_rate": 1.2438571832155053e-05, "loss": 2.26, "step": 430780 }, { "epoch": 0.75, "learning_rate": 1.2437699892228227e-05, "loss": 2.3151, "step": 430790 }, { "epoch": 0.75, "learning_rate": 1.2436827952301399e-05, "loss": 2.3336, "step": 430800 }, { "epoch": 0.75, "learning_rate": 1.2435956012374572e-05, "loss": 2.4097, "step": 430810 }, { "epoch": 0.75, "learning_rate": 1.2435084072447745e-05, "loss": 2.3263, "step": 430820 }, { "epoch": 0.75, "learning_rate": 1.2434212132520918e-05, "loss": 2.2847, "step": 430830 }, { "epoch": 0.75, "learning_rate": 1.243334019259409e-05, "loss": 2.2821, "step": 430840 }, { "epoch": 0.75, "learning_rate": 1.2432468252667264e-05, "loss": 2.2294, "step": 430850 }, { "epoch": 0.75, "learning_rate": 1.2431596312740438e-05, "loss": 2.2835, "step": 430860 }, { "epoch": 0.75, "learning_rate": 1.2430724372813612e-05, "loss": 2.3482, "step": 430870 }, { "epoch": 0.75, "learning_rate": 1.2429852432886785e-05, "loss": 2.2268, "step": 430880 }, { "epoch": 0.75, "learning_rate": 1.2428980492959958e-05, "loss": 2.3767, "step": 430890 }, { "epoch": 0.75, "learning_rate": 1.2428108553033131e-05, "loss": 2.3723, "step": 430900 }, { "epoch": 0.75, "learning_rate": 1.2427236613106303e-05, "loss": 2.2646, "step": 430910 }, { "epoch": 0.75, "learning_rate": 1.2426364673179477e-05, "loss": 2.1816, "step": 430920 }, { "epoch": 0.75, "learning_rate": 1.242549273325265e-05, "loss": 2.2341, "step": 430930 }, { "epoch": 0.75, "learning_rate": 1.2424620793325823e-05, "loss": 2.4105, "step": 430940 }, { "epoch": 0.75, "learning_rate": 1.2423748853398997e-05, "loss": 2.3706, "step": 430950 }, { "epoch": 0.75, "learning_rate": 1.242287691347217e-05, "loss": 2.2288, "step": 430960 }, { "epoch": 0.75, "learning_rate": 1.2422004973545343e-05, "loss": 2.1493, "step": 430970 }, { "epoch": 0.75, "learning_rate": 1.2421133033618516e-05, "loss": 2.3942, "step": 430980 }, { "epoch": 0.75, "learning_rate": 1.242026109369169e-05, "loss": 2.3133, "step": 430990 }, { "epoch": 0.75, "learning_rate": 1.2419389153764862e-05, "loss": 2.3313, "step": 431000 }, { "epoch": 0.75, "learning_rate": 1.2418517213838036e-05, "loss": 2.2344, "step": 431010 }, { "epoch": 0.75, "learning_rate": 1.241764527391121e-05, "loss": 2.2585, "step": 431020 }, { "epoch": 0.75, "learning_rate": 1.2416773333984384e-05, "loss": 2.3969, "step": 431030 }, { "epoch": 0.75, "learning_rate": 1.2415901394057556e-05, "loss": 2.3141, "step": 431040 }, { "epoch": 0.75, "learning_rate": 1.241502945413073e-05, "loss": 2.1783, "step": 431050 }, { "epoch": 0.75, "learning_rate": 1.2414157514203901e-05, "loss": 2.337, "step": 431060 }, { "epoch": 0.75, "learning_rate": 1.2413285574277075e-05, "loss": 2.1364, "step": 431070 }, { "epoch": 0.75, "learning_rate": 1.2412413634350247e-05, "loss": 2.3021, "step": 431080 }, { "epoch": 0.75, "learning_rate": 1.2411541694423421e-05, "loss": 2.3385, "step": 431090 }, { "epoch": 0.75, "learning_rate": 1.2410669754496595e-05, "loss": 2.218, "step": 431100 }, { "epoch": 0.75, "learning_rate": 1.2409797814569769e-05, "loss": 2.1744, "step": 431110 }, { "epoch": 0.75, "learning_rate": 1.2408925874642942e-05, "loss": 2.1865, "step": 431120 }, { "epoch": 0.75, "learning_rate": 1.2408053934716114e-05, "loss": 2.2268, "step": 431130 }, { "epoch": 0.75, "learning_rate": 1.2407181994789288e-05, "loss": 2.3231, "step": 431140 }, { "epoch": 0.75, "learning_rate": 1.240631005486246e-05, "loss": 2.3173, "step": 431150 }, { "epoch": 0.75, "learning_rate": 1.2405438114935634e-05, "loss": 2.3424, "step": 431160 }, { "epoch": 0.75, "learning_rate": 1.2404566175008806e-05, "loss": 2.3555, "step": 431170 }, { "epoch": 0.75, "learning_rate": 1.240369423508198e-05, "loss": 2.3902, "step": 431180 }, { "epoch": 0.75, "learning_rate": 1.2402822295155154e-05, "loss": 2.2431, "step": 431190 }, { "epoch": 0.75, "learning_rate": 1.2401950355228327e-05, "loss": 2.2839, "step": 431200 }, { "epoch": 0.75, "learning_rate": 1.24010784153015e-05, "loss": 2.4037, "step": 431210 }, { "epoch": 0.75, "learning_rate": 1.2400206475374673e-05, "loss": 2.2102, "step": 431220 }, { "epoch": 0.75, "learning_rate": 1.2399334535447845e-05, "loss": 2.2618, "step": 431230 }, { "epoch": 0.75, "learning_rate": 1.239846259552102e-05, "loss": 2.3489, "step": 431240 }, { "epoch": 0.75, "learning_rate": 1.2397590655594193e-05, "loss": 2.3412, "step": 431250 }, { "epoch": 0.75, "learning_rate": 1.2396718715667365e-05, "loss": 2.3083, "step": 431260 }, { "epoch": 0.75, "learning_rate": 1.239584677574054e-05, "loss": 2.325, "step": 431270 }, { "epoch": 0.75, "learning_rate": 1.2394974835813713e-05, "loss": 2.2436, "step": 431280 }, { "epoch": 0.75, "learning_rate": 1.2394102895886886e-05, "loss": 2.2675, "step": 431290 }, { "epoch": 0.75, "learning_rate": 1.2393230955960058e-05, "loss": 2.2711, "step": 431300 }, { "epoch": 0.75, "learning_rate": 1.2392359016033232e-05, "loss": 2.2689, "step": 431310 }, { "epoch": 0.75, "learning_rate": 1.2391487076106404e-05, "loss": 2.2739, "step": 431320 }, { "epoch": 0.75, "learning_rate": 1.2390615136179578e-05, "loss": 2.2429, "step": 431330 }, { "epoch": 0.75, "learning_rate": 1.2389743196252752e-05, "loss": 2.1971, "step": 431340 }, { "epoch": 0.75, "learning_rate": 1.2388871256325926e-05, "loss": 2.2773, "step": 431350 }, { "epoch": 0.75, "learning_rate": 1.2387999316399098e-05, "loss": 2.2624, "step": 431360 }, { "epoch": 0.75, "learning_rate": 1.2387127376472271e-05, "loss": 2.3473, "step": 431370 }, { "epoch": 0.75, "learning_rate": 1.2386255436545445e-05, "loss": 2.3948, "step": 431380 }, { "epoch": 0.75, "learning_rate": 1.2385383496618617e-05, "loss": 2.2383, "step": 431390 }, { "epoch": 0.75, "learning_rate": 1.2384511556691791e-05, "loss": 2.1901, "step": 431400 }, { "epoch": 0.75, "learning_rate": 1.2383639616764963e-05, "loss": 2.2535, "step": 431410 }, { "epoch": 0.75, "learning_rate": 1.2382767676838137e-05, "loss": 2.4933, "step": 431420 }, { "epoch": 0.75, "learning_rate": 1.238189573691131e-05, "loss": 2.2502, "step": 431430 }, { "epoch": 0.75, "learning_rate": 1.2381023796984484e-05, "loss": 2.2589, "step": 431440 }, { "epoch": 0.75, "learning_rate": 1.2380151857057656e-05, "loss": 2.2068, "step": 431450 }, { "epoch": 0.75, "learning_rate": 1.237927991713083e-05, "loss": 2.347, "step": 431460 }, { "epoch": 0.75, "learning_rate": 1.2378407977204002e-05, "loss": 2.2005, "step": 431470 }, { "epoch": 0.75, "learning_rate": 1.2377536037277176e-05, "loss": 2.3444, "step": 431480 }, { "epoch": 0.75, "learning_rate": 1.2376664097350348e-05, "loss": 2.4076, "step": 431490 }, { "epoch": 0.75, "learning_rate": 1.2375792157423522e-05, "loss": 2.2486, "step": 431500 }, { "epoch": 0.75, "learning_rate": 1.2374920217496697e-05, "loss": 2.3379, "step": 431510 }, { "epoch": 0.75, "learning_rate": 1.237404827756987e-05, "loss": 2.3295, "step": 431520 }, { "epoch": 0.75, "learning_rate": 1.2373176337643043e-05, "loss": 2.3363, "step": 431530 }, { "epoch": 0.75, "learning_rate": 1.2372304397716215e-05, "loss": 2.327, "step": 431540 }, { "epoch": 0.75, "learning_rate": 1.2371432457789389e-05, "loss": 2.2871, "step": 431550 }, { "epoch": 0.75, "learning_rate": 1.2370560517862561e-05, "loss": 2.3273, "step": 431560 }, { "epoch": 0.75, "learning_rate": 1.2369688577935735e-05, "loss": 2.3299, "step": 431570 }, { "epoch": 0.75, "learning_rate": 1.2368816638008909e-05, "loss": 2.2492, "step": 431580 }, { "epoch": 0.75, "learning_rate": 1.2367944698082083e-05, "loss": 2.2303, "step": 431590 }, { "epoch": 0.75, "learning_rate": 1.2367072758155255e-05, "loss": 2.1952, "step": 431600 }, { "epoch": 0.75, "learning_rate": 1.2366200818228428e-05, "loss": 2.2524, "step": 431610 }, { "epoch": 0.75, "learning_rate": 1.23653288783016e-05, "loss": 2.253, "step": 431620 }, { "epoch": 0.75, "learning_rate": 1.2364456938374774e-05, "loss": 2.1553, "step": 431630 }, { "epoch": 0.75, "learning_rate": 1.2363584998447948e-05, "loss": 2.2896, "step": 431640 }, { "epoch": 0.75, "learning_rate": 1.236271305852112e-05, "loss": 2.362, "step": 431650 }, { "epoch": 0.75, "learning_rate": 1.2361841118594294e-05, "loss": 2.2717, "step": 431660 }, { "epoch": 0.75, "learning_rate": 1.2360969178667468e-05, "loss": 2.2061, "step": 431670 }, { "epoch": 0.75, "learning_rate": 1.2360097238740641e-05, "loss": 2.2638, "step": 431680 }, { "epoch": 0.75, "learning_rate": 1.2359225298813813e-05, "loss": 2.3124, "step": 431690 }, { "epoch": 0.75, "learning_rate": 1.2358353358886987e-05, "loss": 2.2623, "step": 431700 }, { "epoch": 0.75, "learning_rate": 1.235748141896016e-05, "loss": 2.257, "step": 431710 }, { "epoch": 0.75, "learning_rate": 1.2356609479033333e-05, "loss": 2.2747, "step": 431720 }, { "epoch": 0.75, "learning_rate": 1.2355737539106505e-05, "loss": 2.3743, "step": 431730 }, { "epoch": 0.75, "learning_rate": 1.2354865599179679e-05, "loss": 2.2992, "step": 431740 }, { "epoch": 0.75, "learning_rate": 1.2353993659252853e-05, "loss": 2.3413, "step": 431750 }, { "epoch": 0.75, "learning_rate": 1.2353121719326026e-05, "loss": 2.2194, "step": 431760 }, { "epoch": 0.75, "learning_rate": 1.2352249779399199e-05, "loss": 2.445, "step": 431770 }, { "epoch": 0.75, "learning_rate": 1.2351377839472372e-05, "loss": 2.3065, "step": 431780 }, { "epoch": 0.75, "learning_rate": 1.2350505899545546e-05, "loss": 2.3713, "step": 431790 }, { "epoch": 0.75, "learning_rate": 1.2349633959618718e-05, "loss": 2.3308, "step": 431800 }, { "epoch": 0.75, "learning_rate": 1.2348762019691892e-05, "loss": 2.1941, "step": 431810 }, { "epoch": 0.75, "learning_rate": 1.2347890079765066e-05, "loss": 2.439, "step": 431820 }, { "epoch": 0.75, "learning_rate": 1.234701813983824e-05, "loss": 2.1827, "step": 431830 }, { "epoch": 0.75, "learning_rate": 1.2346146199911412e-05, "loss": 2.1707, "step": 431840 }, { "epoch": 0.75, "learning_rate": 1.2345274259984585e-05, "loss": 2.2451, "step": 431850 }, { "epoch": 0.75, "learning_rate": 1.2344402320057757e-05, "loss": 2.3095, "step": 431860 }, { "epoch": 0.75, "learning_rate": 1.2343530380130931e-05, "loss": 2.4196, "step": 431870 }, { "epoch": 0.75, "learning_rate": 1.2342658440204103e-05, "loss": 2.3124, "step": 431880 }, { "epoch": 0.75, "learning_rate": 1.2341786500277277e-05, "loss": 2.1628, "step": 431890 }, { "epoch": 0.75, "learning_rate": 1.234091456035045e-05, "loss": 2.2246, "step": 431900 }, { "epoch": 0.75, "learning_rate": 1.2340042620423625e-05, "loss": 2.3087, "step": 431910 }, { "epoch": 0.75, "learning_rate": 1.2339170680496798e-05, "loss": 2.2268, "step": 431920 }, { "epoch": 0.75, "learning_rate": 1.233829874056997e-05, "loss": 2.2193, "step": 431930 }, { "epoch": 0.75, "learning_rate": 1.2337426800643144e-05, "loss": 2.2155, "step": 431940 }, { "epoch": 0.75, "learning_rate": 1.2336554860716316e-05, "loss": 2.2813, "step": 431950 }, { "epoch": 0.75, "learning_rate": 1.233568292078949e-05, "loss": 2.217, "step": 431960 }, { "epoch": 0.75, "learning_rate": 1.2334810980862662e-05, "loss": 2.3602, "step": 431970 }, { "epoch": 0.75, "learning_rate": 1.2333939040935836e-05, "loss": 2.3269, "step": 431980 }, { "epoch": 0.75, "learning_rate": 1.233306710100901e-05, "loss": 2.3882, "step": 431990 }, { "epoch": 0.75, "learning_rate": 1.2332195161082183e-05, "loss": 2.1942, "step": 432000 }, { "epoch": 0.75, "learning_rate": 1.2331323221155355e-05, "loss": 2.2282, "step": 432010 }, { "epoch": 0.75, "learning_rate": 1.233045128122853e-05, "loss": 2.2575, "step": 432020 }, { "epoch": 0.75, "learning_rate": 1.2329579341301701e-05, "loss": 2.1454, "step": 432030 }, { "epoch": 0.75, "learning_rate": 1.2328707401374875e-05, "loss": 2.3605, "step": 432040 }, { "epoch": 0.75, "learning_rate": 1.2327835461448049e-05, "loss": 2.339, "step": 432050 }, { "epoch": 0.75, "learning_rate": 1.2326963521521223e-05, "loss": 2.2501, "step": 432060 }, { "epoch": 0.75, "learning_rate": 1.2326091581594396e-05, "loss": 2.3426, "step": 432070 }, { "epoch": 0.75, "learning_rate": 1.2325219641667568e-05, "loss": 2.2078, "step": 432080 }, { "epoch": 0.75, "learning_rate": 1.2324347701740742e-05, "loss": 2.2359, "step": 432090 }, { "epoch": 0.75, "learning_rate": 1.2323475761813914e-05, "loss": 2.316, "step": 432100 }, { "epoch": 0.75, "learning_rate": 1.2322603821887088e-05, "loss": 2.3265, "step": 432110 }, { "epoch": 0.75, "learning_rate": 1.232173188196026e-05, "loss": 2.3798, "step": 432120 }, { "epoch": 0.75, "learning_rate": 1.2320859942033434e-05, "loss": 2.2483, "step": 432130 }, { "epoch": 0.75, "learning_rate": 1.2319988002106608e-05, "loss": 2.2666, "step": 432140 }, { "epoch": 0.75, "learning_rate": 1.2319116062179781e-05, "loss": 2.268, "step": 432150 }, { "epoch": 0.75, "learning_rate": 1.2318244122252954e-05, "loss": 2.3563, "step": 432160 }, { "epoch": 0.75, "learning_rate": 1.2317372182326127e-05, "loss": 2.3811, "step": 432170 }, { "epoch": 0.75, "learning_rate": 1.2316500242399301e-05, "loss": 2.3372, "step": 432180 }, { "epoch": 0.75, "learning_rate": 1.2315628302472473e-05, "loss": 2.2457, "step": 432190 }, { "epoch": 0.75, "learning_rate": 1.2314756362545647e-05, "loss": 2.3501, "step": 432200 }, { "epoch": 0.75, "learning_rate": 1.2313884422618819e-05, "loss": 2.2886, "step": 432210 }, { "epoch": 0.75, "learning_rate": 1.2313012482691993e-05, "loss": 2.3366, "step": 432220 }, { "epoch": 0.75, "learning_rate": 1.2312140542765167e-05, "loss": 2.3237, "step": 432230 }, { "epoch": 0.75, "learning_rate": 1.231126860283834e-05, "loss": 2.2527, "step": 432240 }, { "epoch": 0.75, "learning_rate": 1.2310396662911512e-05, "loss": 2.1979, "step": 432250 }, { "epoch": 0.75, "learning_rate": 1.2309524722984686e-05, "loss": 2.3028, "step": 432260 }, { "epoch": 0.75, "learning_rate": 1.2308652783057858e-05, "loss": 2.3212, "step": 432270 }, { "epoch": 0.75, "learning_rate": 1.2307780843131032e-05, "loss": 2.277, "step": 432280 }, { "epoch": 0.75, "learning_rate": 1.2306908903204204e-05, "loss": 2.2678, "step": 432290 }, { "epoch": 0.75, "learning_rate": 1.2306036963277378e-05, "loss": 2.172, "step": 432300 }, { "epoch": 0.75, "learning_rate": 1.2305165023350553e-05, "loss": 2.1756, "step": 432310 }, { "epoch": 0.75, "learning_rate": 1.2304293083423725e-05, "loss": 2.2474, "step": 432320 }, { "epoch": 0.75, "learning_rate": 1.2303421143496899e-05, "loss": 2.2323, "step": 432330 }, { "epoch": 0.75, "learning_rate": 1.2302549203570071e-05, "loss": 2.3816, "step": 432340 }, { "epoch": 0.75, "learning_rate": 1.2301677263643245e-05, "loss": 2.2799, "step": 432350 }, { "epoch": 0.75, "learning_rate": 1.2300805323716417e-05, "loss": 2.2751, "step": 432360 }, { "epoch": 0.75, "learning_rate": 1.229993338378959e-05, "loss": 2.2545, "step": 432370 }, { "epoch": 0.75, "learning_rate": 1.2299061443862765e-05, "loss": 2.3215, "step": 432380 }, { "epoch": 0.75, "learning_rate": 1.2298189503935938e-05, "loss": 2.2608, "step": 432390 }, { "epoch": 0.75, "learning_rate": 1.229731756400911e-05, "loss": 2.2394, "step": 432400 }, { "epoch": 0.75, "learning_rate": 1.2296445624082284e-05, "loss": 2.3429, "step": 432410 }, { "epoch": 0.75, "learning_rate": 1.2295573684155456e-05, "loss": 2.3905, "step": 432420 }, { "epoch": 0.75, "learning_rate": 1.229470174422863e-05, "loss": 2.309, "step": 432430 }, { "epoch": 0.75, "learning_rate": 1.2293829804301804e-05, "loss": 2.2944, "step": 432440 }, { "epoch": 0.75, "learning_rate": 1.2292957864374976e-05, "loss": 2.217, "step": 432450 }, { "epoch": 0.75, "learning_rate": 1.229208592444815e-05, "loss": 2.3549, "step": 432460 }, { "epoch": 0.75, "learning_rate": 1.2291213984521323e-05, "loss": 2.2179, "step": 432470 }, { "epoch": 0.75, "learning_rate": 1.2290342044594497e-05, "loss": 2.2638, "step": 432480 }, { "epoch": 0.75, "learning_rate": 1.228947010466767e-05, "loss": 2.2747, "step": 432490 }, { "epoch": 0.75, "learning_rate": 1.2288598164740843e-05, "loss": 2.2716, "step": 432500 }, { "epoch": 0.75, "learning_rate": 1.2287726224814015e-05, "loss": 2.2474, "step": 432510 }, { "epoch": 0.75, "learning_rate": 1.2286854284887189e-05, "loss": 2.2574, "step": 432520 }, { "epoch": 0.75, "learning_rate": 1.2285982344960361e-05, "loss": 2.2848, "step": 432530 }, { "epoch": 0.75, "learning_rate": 1.2285110405033535e-05, "loss": 2.3045, "step": 432540 }, { "epoch": 0.75, "learning_rate": 1.2284238465106709e-05, "loss": 2.2349, "step": 432550 }, { "epoch": 0.75, "learning_rate": 1.2283366525179882e-05, "loss": 2.2166, "step": 432560 }, { "epoch": 0.75, "learning_rate": 1.2282494585253056e-05, "loss": 2.3255, "step": 432570 }, { "epoch": 0.75, "learning_rate": 1.2281622645326228e-05, "loss": 2.2917, "step": 432580 }, { "epoch": 0.75, "learning_rate": 1.2280750705399402e-05, "loss": 2.1825, "step": 432590 }, { "epoch": 0.75, "learning_rate": 1.2279878765472574e-05, "loss": 2.4541, "step": 432600 }, { "epoch": 0.75, "learning_rate": 1.2279006825545748e-05, "loss": 2.4021, "step": 432610 }, { "epoch": 0.75, "learning_rate": 1.2278134885618922e-05, "loss": 2.2482, "step": 432620 }, { "epoch": 0.75, "learning_rate": 1.2277262945692095e-05, "loss": 2.3189, "step": 432630 }, { "epoch": 0.75, "learning_rate": 1.2276391005765267e-05, "loss": 2.2188, "step": 432640 }, { "epoch": 0.75, "learning_rate": 1.2275519065838441e-05, "loss": 2.382, "step": 432650 }, { "epoch": 0.75, "learning_rate": 1.2274647125911613e-05, "loss": 2.2912, "step": 432660 }, { "epoch": 0.75, "learning_rate": 1.2273775185984787e-05, "loss": 2.1922, "step": 432670 }, { "epoch": 0.75, "learning_rate": 1.2272903246057959e-05, "loss": 2.3746, "step": 432680 }, { "epoch": 0.75, "learning_rate": 1.2272031306131133e-05, "loss": 2.2201, "step": 432690 }, { "epoch": 0.75, "learning_rate": 1.2271159366204307e-05, "loss": 2.2845, "step": 432700 }, { "epoch": 0.75, "learning_rate": 1.227028742627748e-05, "loss": 2.3539, "step": 432710 }, { "epoch": 0.75, "learning_rate": 1.2269415486350654e-05, "loss": 2.3064, "step": 432720 }, { "epoch": 0.75, "learning_rate": 1.2268543546423826e-05, "loss": 2.29, "step": 432730 }, { "epoch": 0.75, "learning_rate": 1.2267671606497e-05, "loss": 2.2329, "step": 432740 }, { "epoch": 0.75, "learning_rate": 1.2266799666570172e-05, "loss": 2.3186, "step": 432750 }, { "epoch": 0.75, "learning_rate": 1.2265927726643346e-05, "loss": 2.3822, "step": 432760 }, { "epoch": 0.75, "learning_rate": 1.2265055786716518e-05, "loss": 2.2437, "step": 432770 }, { "epoch": 0.75, "learning_rate": 1.2264183846789692e-05, "loss": 2.1741, "step": 432780 }, { "epoch": 0.75, "learning_rate": 1.2263311906862865e-05, "loss": 2.3217, "step": 432790 }, { "epoch": 0.75, "learning_rate": 1.226243996693604e-05, "loss": 2.3937, "step": 432800 }, { "epoch": 0.75, "learning_rate": 1.2261568027009211e-05, "loss": 2.2544, "step": 432810 }, { "epoch": 0.75, "learning_rate": 1.2260696087082385e-05, "loss": 2.1612, "step": 432820 }, { "epoch": 0.75, "learning_rate": 1.2259824147155557e-05, "loss": 2.2168, "step": 432830 }, { "epoch": 0.75, "learning_rate": 1.2258952207228731e-05, "loss": 2.3348, "step": 432840 }, { "epoch": 0.75, "learning_rate": 1.2258080267301905e-05, "loss": 2.3217, "step": 432850 }, { "epoch": 0.75, "learning_rate": 1.2257208327375078e-05, "loss": 2.2607, "step": 432860 }, { "epoch": 0.75, "learning_rate": 1.2256336387448252e-05, "loss": 2.2428, "step": 432870 }, { "epoch": 0.75, "learning_rate": 1.2255464447521424e-05, "loss": 2.2038, "step": 432880 }, { "epoch": 0.75, "learning_rate": 1.2254592507594598e-05, "loss": 2.276, "step": 432890 }, { "epoch": 0.75, "learning_rate": 1.225372056766777e-05, "loss": 2.3743, "step": 432900 }, { "epoch": 0.75, "learning_rate": 1.2252848627740944e-05, "loss": 2.3315, "step": 432910 }, { "epoch": 0.75, "learning_rate": 1.2251976687814116e-05, "loss": 2.2787, "step": 432920 }, { "epoch": 0.75, "learning_rate": 1.225110474788729e-05, "loss": 2.2751, "step": 432930 }, { "epoch": 0.75, "learning_rate": 1.2250232807960464e-05, "loss": 2.3161, "step": 432940 }, { "epoch": 0.76, "learning_rate": 1.2249360868033637e-05, "loss": 2.2476, "step": 432950 }, { "epoch": 0.76, "learning_rate": 1.224848892810681e-05, "loss": 2.3039, "step": 432960 }, { "epoch": 0.76, "learning_rate": 1.2247616988179983e-05, "loss": 2.2871, "step": 432970 }, { "epoch": 0.76, "learning_rate": 1.2246745048253157e-05, "loss": 2.3461, "step": 432980 }, { "epoch": 0.76, "learning_rate": 1.2245873108326329e-05, "loss": 2.1529, "step": 432990 }, { "epoch": 0.76, "learning_rate": 1.2245001168399503e-05, "loss": 2.3567, "step": 433000 }, { "epoch": 0.76, "learning_rate": 1.2244129228472675e-05, "loss": 2.3715, "step": 433010 }, { "epoch": 0.76, "learning_rate": 1.2243257288545849e-05, "loss": 2.2445, "step": 433020 }, { "epoch": 0.76, "learning_rate": 1.2242385348619022e-05, "loss": 2.301, "step": 433030 }, { "epoch": 0.76, "learning_rate": 1.2241513408692196e-05, "loss": 2.2616, "step": 433040 }, { "epoch": 0.76, "learning_rate": 1.2240641468765368e-05, "loss": 2.2741, "step": 433050 }, { "epoch": 0.76, "learning_rate": 1.2239769528838542e-05, "loss": 2.3001, "step": 433060 }, { "epoch": 0.76, "learning_rate": 1.2238897588911714e-05, "loss": 2.288, "step": 433070 }, { "epoch": 0.76, "learning_rate": 1.2238025648984888e-05, "loss": 2.1951, "step": 433080 }, { "epoch": 0.76, "learning_rate": 1.223715370905806e-05, "loss": 2.3228, "step": 433090 }, { "epoch": 0.76, "learning_rate": 1.2236281769131235e-05, "loss": 2.3128, "step": 433100 }, { "epoch": 0.76, "learning_rate": 1.2235409829204409e-05, "loss": 2.2805, "step": 433110 }, { "epoch": 0.76, "learning_rate": 1.2234537889277581e-05, "loss": 2.2675, "step": 433120 }, { "epoch": 0.76, "learning_rate": 1.2233665949350755e-05, "loss": 2.3546, "step": 433130 }, { "epoch": 0.76, "learning_rate": 1.2232794009423927e-05, "loss": 2.2527, "step": 433140 }, { "epoch": 0.76, "learning_rate": 1.22319220694971e-05, "loss": 2.3533, "step": 433150 }, { "epoch": 0.76, "learning_rate": 1.2231050129570273e-05, "loss": 2.2791, "step": 433160 }, { "epoch": 0.76, "learning_rate": 1.2230178189643447e-05, "loss": 2.3351, "step": 433170 }, { "epoch": 0.76, "learning_rate": 1.222930624971662e-05, "loss": 2.323, "step": 433180 }, { "epoch": 0.76, "learning_rate": 1.2228434309789794e-05, "loss": 2.3258, "step": 433190 }, { "epoch": 0.76, "learning_rate": 1.2227562369862966e-05, "loss": 2.3105, "step": 433200 }, { "epoch": 0.76, "learning_rate": 1.222669042993614e-05, "loss": 2.2381, "step": 433210 }, { "epoch": 0.76, "learning_rate": 1.2225818490009312e-05, "loss": 2.2836, "step": 433220 }, { "epoch": 0.76, "learning_rate": 1.2224946550082486e-05, "loss": 2.2295, "step": 433230 }, { "epoch": 0.76, "learning_rate": 1.222407461015566e-05, "loss": 2.394, "step": 433240 }, { "epoch": 0.76, "learning_rate": 1.2223202670228832e-05, "loss": 2.3541, "step": 433250 }, { "epoch": 0.76, "learning_rate": 1.2222330730302006e-05, "loss": 2.3361, "step": 433260 }, { "epoch": 0.76, "learning_rate": 1.222145879037518e-05, "loss": 2.3056, "step": 433270 }, { "epoch": 0.76, "learning_rate": 1.2220586850448353e-05, "loss": 2.3278, "step": 433280 }, { "epoch": 0.76, "learning_rate": 1.2219714910521525e-05, "loss": 2.3015, "step": 433290 }, { "epoch": 0.76, "learning_rate": 1.2218842970594699e-05, "loss": 2.3064, "step": 433300 }, { "epoch": 0.76, "learning_rate": 1.2217971030667871e-05, "loss": 2.337, "step": 433310 }, { "epoch": 0.76, "learning_rate": 1.2217099090741045e-05, "loss": 2.2979, "step": 433320 }, { "epoch": 0.76, "learning_rate": 1.2216227150814217e-05, "loss": 2.3166, "step": 433330 }, { "epoch": 0.76, "learning_rate": 1.221535521088739e-05, "loss": 2.2371, "step": 433340 }, { "epoch": 0.76, "learning_rate": 1.2214483270960564e-05, "loss": 2.2954, "step": 433350 }, { "epoch": 0.76, "learning_rate": 1.2213611331033738e-05, "loss": 2.2702, "step": 433360 }, { "epoch": 0.76, "learning_rate": 1.2212739391106912e-05, "loss": 2.3288, "step": 433370 }, { "epoch": 0.76, "learning_rate": 1.2211867451180084e-05, "loss": 2.1678, "step": 433380 }, { "epoch": 0.76, "learning_rate": 1.2210995511253258e-05, "loss": 2.4486, "step": 433390 }, { "epoch": 0.76, "learning_rate": 1.221012357132643e-05, "loss": 2.391, "step": 433400 }, { "epoch": 0.76, "learning_rate": 1.2209251631399604e-05, "loss": 2.2991, "step": 433410 }, { "epoch": 0.76, "learning_rate": 1.2208379691472777e-05, "loss": 2.3054, "step": 433420 }, { "epoch": 0.76, "learning_rate": 1.2207507751545951e-05, "loss": 2.2189, "step": 433430 }, { "epoch": 0.76, "learning_rate": 1.2206635811619123e-05, "loss": 2.1663, "step": 433440 }, { "epoch": 0.76, "learning_rate": 1.2205763871692297e-05, "loss": 2.3414, "step": 433450 }, { "epoch": 0.76, "learning_rate": 1.2204891931765469e-05, "loss": 2.1358, "step": 433460 }, { "epoch": 0.76, "learning_rate": 1.2204019991838643e-05, "loss": 2.3007, "step": 433470 }, { "epoch": 0.76, "learning_rate": 1.2203148051911815e-05, "loss": 2.3154, "step": 433480 }, { "epoch": 0.76, "learning_rate": 1.2202276111984989e-05, "loss": 2.2839, "step": 433490 }, { "epoch": 0.76, "learning_rate": 1.2201404172058162e-05, "loss": 2.3322, "step": 433500 }, { "epoch": 0.76, "learning_rate": 1.2200532232131336e-05, "loss": 2.4088, "step": 433510 }, { "epoch": 0.76, "learning_rate": 1.219966029220451e-05, "loss": 2.1762, "step": 433520 }, { "epoch": 0.76, "learning_rate": 1.2198788352277682e-05, "loss": 2.2413, "step": 433530 }, { "epoch": 0.76, "learning_rate": 1.2197916412350856e-05, "loss": 2.3604, "step": 433540 }, { "epoch": 0.76, "learning_rate": 1.2197044472424028e-05, "loss": 2.2466, "step": 433550 }, { "epoch": 0.76, "learning_rate": 1.2196172532497202e-05, "loss": 2.3996, "step": 433560 }, { "epoch": 0.76, "learning_rate": 1.2195300592570374e-05, "loss": 2.2444, "step": 433570 }, { "epoch": 0.76, "learning_rate": 1.2194428652643548e-05, "loss": 2.303, "step": 433580 }, { "epoch": 0.76, "learning_rate": 1.2193556712716721e-05, "loss": 2.2899, "step": 433590 }, { "epoch": 0.76, "learning_rate": 1.2192684772789895e-05, "loss": 2.2272, "step": 433600 }, { "epoch": 0.76, "learning_rate": 1.2191812832863067e-05, "loss": 2.1924, "step": 433610 }, { "epoch": 0.76, "learning_rate": 1.2190940892936241e-05, "loss": 2.3394, "step": 433620 }, { "epoch": 0.76, "learning_rate": 1.2190068953009413e-05, "loss": 2.2221, "step": 433630 }, { "epoch": 0.76, "learning_rate": 1.2189197013082587e-05, "loss": 2.2687, "step": 433640 }, { "epoch": 0.76, "learning_rate": 1.218832507315576e-05, "loss": 2.3711, "step": 433650 }, { "epoch": 0.76, "learning_rate": 1.2187453133228934e-05, "loss": 2.3461, "step": 433660 }, { "epoch": 0.76, "learning_rate": 1.2186581193302108e-05, "loss": 2.2049, "step": 433670 }, { "epoch": 0.76, "learning_rate": 1.218570925337528e-05, "loss": 2.2887, "step": 433680 }, { "epoch": 0.76, "learning_rate": 1.2184837313448454e-05, "loss": 2.29, "step": 433690 }, { "epoch": 0.76, "learning_rate": 1.2183965373521626e-05, "loss": 2.3307, "step": 433700 }, { "epoch": 0.76, "learning_rate": 1.21830934335948e-05, "loss": 2.2696, "step": 433710 }, { "epoch": 0.76, "learning_rate": 1.2182221493667972e-05, "loss": 2.223, "step": 433720 }, { "epoch": 0.76, "learning_rate": 1.2181349553741146e-05, "loss": 2.2038, "step": 433730 }, { "epoch": 0.76, "learning_rate": 1.218047761381432e-05, "loss": 2.3218, "step": 433740 }, { "epoch": 0.76, "learning_rate": 1.2179605673887493e-05, "loss": 2.2946, "step": 433750 }, { "epoch": 0.76, "learning_rate": 1.2178733733960665e-05, "loss": 2.3072, "step": 433760 }, { "epoch": 0.76, "learning_rate": 1.2177861794033839e-05, "loss": 2.2707, "step": 433770 }, { "epoch": 0.76, "learning_rate": 1.2176989854107013e-05, "loss": 2.2303, "step": 433780 }, { "epoch": 0.76, "learning_rate": 1.2176117914180185e-05, "loss": 2.3097, "step": 433790 }, { "epoch": 0.76, "learning_rate": 1.2175245974253359e-05, "loss": 2.1335, "step": 433800 }, { "epoch": 0.76, "learning_rate": 1.217437403432653e-05, "loss": 2.2695, "step": 433810 }, { "epoch": 0.76, "learning_rate": 1.2173502094399704e-05, "loss": 2.3014, "step": 433820 }, { "epoch": 0.76, "learning_rate": 1.2172630154472878e-05, "loss": 2.2408, "step": 433830 }, { "epoch": 0.76, "learning_rate": 1.2171758214546052e-05, "loss": 2.2663, "step": 433840 }, { "epoch": 0.76, "learning_rate": 1.2170886274619224e-05, "loss": 2.2492, "step": 433850 }, { "epoch": 0.76, "learning_rate": 1.2170014334692398e-05, "loss": 2.3336, "step": 433860 }, { "epoch": 0.76, "learning_rate": 1.216914239476557e-05, "loss": 2.3229, "step": 433870 }, { "epoch": 0.76, "learning_rate": 1.2168270454838744e-05, "loss": 2.3273, "step": 433880 }, { "epoch": 0.76, "learning_rate": 1.2167398514911916e-05, "loss": 2.3287, "step": 433890 }, { "epoch": 0.76, "learning_rate": 1.2166526574985091e-05, "loss": 2.1744, "step": 433900 }, { "epoch": 0.76, "learning_rate": 1.2165654635058265e-05, "loss": 2.2443, "step": 433910 }, { "epoch": 0.76, "learning_rate": 1.2164782695131437e-05, "loss": 2.3509, "step": 433920 }, { "epoch": 0.76, "learning_rate": 1.216391075520461e-05, "loss": 2.1948, "step": 433930 }, { "epoch": 0.76, "learning_rate": 1.2163038815277783e-05, "loss": 2.2224, "step": 433940 }, { "epoch": 0.76, "learning_rate": 1.2162166875350957e-05, "loss": 2.2941, "step": 433950 }, { "epoch": 0.76, "learning_rate": 1.2161294935424129e-05, "loss": 2.3805, "step": 433960 }, { "epoch": 0.76, "learning_rate": 1.2160422995497303e-05, "loss": 2.3235, "step": 433970 }, { "epoch": 0.76, "learning_rate": 1.2159551055570476e-05, "loss": 2.3223, "step": 433980 }, { "epoch": 0.76, "learning_rate": 1.215867911564365e-05, "loss": 2.2689, "step": 433990 }, { "epoch": 0.76, "learning_rate": 1.2157807175716822e-05, "loss": 2.2087, "step": 434000 }, { "epoch": 0.76, "learning_rate": 1.2156935235789996e-05, "loss": 2.3336, "step": 434010 }, { "epoch": 0.76, "learning_rate": 1.2156063295863168e-05, "loss": 2.3619, "step": 434020 }, { "epoch": 0.76, "learning_rate": 1.2155191355936342e-05, "loss": 2.2452, "step": 434030 }, { "epoch": 0.76, "learning_rate": 1.2154319416009516e-05, "loss": 2.3374, "step": 434040 }, { "epoch": 0.76, "learning_rate": 1.2153447476082688e-05, "loss": 2.2307, "step": 434050 }, { "epoch": 0.76, "learning_rate": 1.2152575536155861e-05, "loss": 2.258, "step": 434060 }, { "epoch": 0.76, "learning_rate": 1.2151703596229035e-05, "loss": 2.2428, "step": 434070 }, { "epoch": 0.76, "learning_rate": 1.2150831656302209e-05, "loss": 2.2406, "step": 434080 }, { "epoch": 0.76, "learning_rate": 1.2149959716375381e-05, "loss": 2.1973, "step": 434090 }, { "epoch": 0.76, "learning_rate": 1.2149087776448555e-05, "loss": 2.2102, "step": 434100 }, { "epoch": 0.76, "learning_rate": 1.2148215836521727e-05, "loss": 2.2985, "step": 434110 }, { "epoch": 0.76, "learning_rate": 1.21473438965949e-05, "loss": 2.2877, "step": 434120 }, { "epoch": 0.76, "learning_rate": 1.2146471956668073e-05, "loss": 2.3153, "step": 434130 }, { "epoch": 0.76, "learning_rate": 1.2145600016741248e-05, "loss": 2.3168, "step": 434140 }, { "epoch": 0.76, "learning_rate": 1.214472807681442e-05, "loss": 2.3024, "step": 434150 }, { "epoch": 0.76, "learning_rate": 1.2143856136887594e-05, "loss": 2.3861, "step": 434160 }, { "epoch": 0.76, "learning_rate": 1.2142984196960768e-05, "loss": 2.2474, "step": 434170 }, { "epoch": 0.76, "learning_rate": 1.214211225703394e-05, "loss": 2.3182, "step": 434180 }, { "epoch": 0.76, "learning_rate": 1.2141240317107114e-05, "loss": 2.2311, "step": 434190 }, { "epoch": 0.76, "learning_rate": 1.2140368377180286e-05, "loss": 2.1735, "step": 434200 }, { "epoch": 0.76, "learning_rate": 1.213949643725346e-05, "loss": 2.3278, "step": 434210 }, { "epoch": 0.76, "learning_rate": 1.2138624497326633e-05, "loss": 2.2257, "step": 434220 }, { "epoch": 0.76, "learning_rate": 1.2137752557399807e-05, "loss": 2.2758, "step": 434230 }, { "epoch": 0.76, "learning_rate": 1.2136880617472979e-05, "loss": 2.2629, "step": 434240 }, { "epoch": 0.76, "learning_rate": 1.2136008677546153e-05, "loss": 2.3442, "step": 434250 }, { "epoch": 0.76, "learning_rate": 1.2135136737619325e-05, "loss": 2.3744, "step": 434260 }, { "epoch": 0.76, "learning_rate": 1.2134264797692499e-05, "loss": 2.2936, "step": 434270 }, { "epoch": 0.76, "learning_rate": 1.213339285776567e-05, "loss": 2.2281, "step": 434280 }, { "epoch": 0.76, "learning_rate": 1.2132520917838845e-05, "loss": 2.3654, "step": 434290 }, { "epoch": 0.76, "learning_rate": 1.2131648977912018e-05, "loss": 2.2773, "step": 434300 }, { "epoch": 0.76, "learning_rate": 1.2130777037985192e-05, "loss": 2.3002, "step": 434310 }, { "epoch": 0.76, "learning_rate": 1.2129905098058366e-05, "loss": 2.1493, "step": 434320 }, { "epoch": 0.76, "learning_rate": 1.2129033158131538e-05, "loss": 2.2955, "step": 434330 }, { "epoch": 0.76, "learning_rate": 1.2128161218204712e-05, "loss": 2.3985, "step": 434340 }, { "epoch": 0.76, "learning_rate": 1.2127289278277884e-05, "loss": 2.2304, "step": 434350 }, { "epoch": 0.76, "learning_rate": 1.2126417338351058e-05, "loss": 2.3558, "step": 434360 }, { "epoch": 0.76, "learning_rate": 1.212554539842423e-05, "loss": 2.2084, "step": 434370 }, { "epoch": 0.76, "learning_rate": 1.2124673458497403e-05, "loss": 2.4218, "step": 434380 }, { "epoch": 0.76, "learning_rate": 1.2123801518570577e-05, "loss": 2.2544, "step": 434390 }, { "epoch": 0.76, "learning_rate": 1.2122929578643751e-05, "loss": 2.3, "step": 434400 }, { "epoch": 0.76, "learning_rate": 1.2122057638716923e-05, "loss": 2.2691, "step": 434410 }, { "epoch": 0.76, "learning_rate": 1.2121185698790097e-05, "loss": 2.2578, "step": 434420 }, { "epoch": 0.76, "learning_rate": 1.2120313758863269e-05, "loss": 2.3645, "step": 434430 }, { "epoch": 0.76, "learning_rate": 1.2119441818936443e-05, "loss": 2.2347, "step": 434440 }, { "epoch": 0.76, "learning_rate": 1.2118569879009616e-05, "loss": 2.27, "step": 434450 }, { "epoch": 0.76, "learning_rate": 1.211769793908279e-05, "loss": 2.2927, "step": 434460 }, { "epoch": 0.76, "learning_rate": 1.2116825999155964e-05, "loss": 2.2392, "step": 434470 }, { "epoch": 0.76, "learning_rate": 1.2115954059229136e-05, "loss": 2.2985, "step": 434480 }, { "epoch": 0.76, "learning_rate": 1.211508211930231e-05, "loss": 2.3113, "step": 434490 }, { "epoch": 0.76, "learning_rate": 1.2114210179375482e-05, "loss": 2.4351, "step": 434500 }, { "epoch": 0.76, "learning_rate": 1.2113338239448656e-05, "loss": 2.2837, "step": 434510 }, { "epoch": 0.76, "learning_rate": 1.2112466299521828e-05, "loss": 2.3278, "step": 434520 }, { "epoch": 0.76, "learning_rate": 1.2111594359595001e-05, "loss": 2.3032, "step": 434530 }, { "epoch": 0.76, "learning_rate": 1.2110722419668175e-05, "loss": 2.3435, "step": 434540 }, { "epoch": 0.76, "learning_rate": 1.2109850479741349e-05, "loss": 2.4171, "step": 434550 }, { "epoch": 0.76, "learning_rate": 1.2108978539814521e-05, "loss": 2.1678, "step": 434560 }, { "epoch": 0.76, "learning_rate": 1.2108106599887695e-05, "loss": 2.2568, "step": 434570 }, { "epoch": 0.76, "learning_rate": 1.2107234659960869e-05, "loss": 2.3171, "step": 434580 }, { "epoch": 0.76, "learning_rate": 1.210636272003404e-05, "loss": 2.3063, "step": 434590 }, { "epoch": 0.76, "learning_rate": 1.2105490780107214e-05, "loss": 2.2913, "step": 434600 }, { "epoch": 0.76, "learning_rate": 1.2104618840180387e-05, "loss": 2.2838, "step": 434610 }, { "epoch": 0.76, "learning_rate": 1.210374690025356e-05, "loss": 2.2443, "step": 434620 }, { "epoch": 0.76, "learning_rate": 1.2102874960326734e-05, "loss": 2.314, "step": 434630 }, { "epoch": 0.76, "learning_rate": 1.2102003020399908e-05, "loss": 2.292, "step": 434640 }, { "epoch": 0.76, "learning_rate": 1.210113108047308e-05, "loss": 2.2669, "step": 434650 }, { "epoch": 0.76, "learning_rate": 1.2100259140546254e-05, "loss": 2.2929, "step": 434660 }, { "epoch": 0.76, "learning_rate": 1.2099387200619426e-05, "loss": 2.1524, "step": 434670 }, { "epoch": 0.76, "learning_rate": 1.20985152606926e-05, "loss": 2.2483, "step": 434680 }, { "epoch": 0.76, "learning_rate": 1.2097643320765772e-05, "loss": 2.349, "step": 434690 }, { "epoch": 0.76, "learning_rate": 1.2096771380838947e-05, "loss": 2.3567, "step": 434700 }, { "epoch": 0.76, "learning_rate": 1.209589944091212e-05, "loss": 2.1778, "step": 434710 }, { "epoch": 0.76, "learning_rate": 1.2095027500985293e-05, "loss": 2.3361, "step": 434720 }, { "epoch": 0.76, "learning_rate": 1.2094155561058467e-05, "loss": 2.2951, "step": 434730 }, { "epoch": 0.76, "learning_rate": 1.2093283621131639e-05, "loss": 2.3174, "step": 434740 }, { "epoch": 0.76, "learning_rate": 1.2092411681204813e-05, "loss": 2.2889, "step": 434750 }, { "epoch": 0.76, "learning_rate": 1.2091539741277985e-05, "loss": 2.4059, "step": 434760 }, { "epoch": 0.76, "learning_rate": 1.2090667801351158e-05, "loss": 2.2874, "step": 434770 }, { "epoch": 0.76, "learning_rate": 1.2089795861424332e-05, "loss": 2.2742, "step": 434780 }, { "epoch": 0.76, "learning_rate": 1.2088923921497506e-05, "loss": 2.2326, "step": 434790 }, { "epoch": 0.76, "learning_rate": 1.2088051981570678e-05, "loss": 2.2288, "step": 434800 }, { "epoch": 0.76, "learning_rate": 1.2087180041643852e-05, "loss": 2.2833, "step": 434810 }, { "epoch": 0.76, "learning_rate": 1.2086308101717024e-05, "loss": 2.3285, "step": 434820 }, { "epoch": 0.76, "learning_rate": 1.2085436161790198e-05, "loss": 2.2895, "step": 434830 }, { "epoch": 0.76, "learning_rate": 1.2084564221863371e-05, "loss": 2.273, "step": 434840 }, { "epoch": 0.76, "learning_rate": 1.2083692281936543e-05, "loss": 2.2998, "step": 434850 }, { "epoch": 0.76, "learning_rate": 1.2082820342009717e-05, "loss": 2.3696, "step": 434860 }, { "epoch": 0.76, "learning_rate": 1.2081948402082891e-05, "loss": 2.2377, "step": 434870 }, { "epoch": 0.76, "learning_rate": 1.2081076462156065e-05, "loss": 2.2346, "step": 434880 }, { "epoch": 0.76, "learning_rate": 1.2080204522229237e-05, "loss": 2.2638, "step": 434890 }, { "epoch": 0.76, "learning_rate": 1.207933258230241e-05, "loss": 2.2955, "step": 434900 }, { "epoch": 0.76, "learning_rate": 1.2078460642375583e-05, "loss": 2.3776, "step": 434910 }, { "epoch": 0.76, "learning_rate": 1.2077588702448756e-05, "loss": 2.3274, "step": 434920 }, { "epoch": 0.76, "learning_rate": 1.2076716762521929e-05, "loss": 2.2582, "step": 434930 }, { "epoch": 0.76, "learning_rate": 1.2075844822595104e-05, "loss": 2.3308, "step": 434940 }, { "epoch": 0.76, "learning_rate": 1.2074972882668276e-05, "loss": 2.3247, "step": 434950 }, { "epoch": 0.76, "learning_rate": 1.207410094274145e-05, "loss": 2.2948, "step": 434960 }, { "epoch": 0.76, "learning_rate": 1.2073229002814624e-05, "loss": 2.3518, "step": 434970 }, { "epoch": 0.76, "learning_rate": 1.2072357062887796e-05, "loss": 2.3521, "step": 434980 }, { "epoch": 0.76, "learning_rate": 1.207148512296097e-05, "loss": 2.2491, "step": 434990 }, { "epoch": 0.76, "learning_rate": 1.2070613183034142e-05, "loss": 2.143, "step": 435000 }, { "epoch": 0.76, "learning_rate": 1.2069741243107315e-05, "loss": 2.3631, "step": 435010 }, { "epoch": 0.76, "learning_rate": 1.2068869303180489e-05, "loss": 2.2669, "step": 435020 }, { "epoch": 0.76, "learning_rate": 1.2067997363253663e-05, "loss": 2.3158, "step": 435030 }, { "epoch": 0.76, "learning_rate": 1.2067125423326835e-05, "loss": 2.2045, "step": 435040 }, { "epoch": 0.76, "learning_rate": 1.2066253483400009e-05, "loss": 2.1861, "step": 435050 }, { "epoch": 0.76, "learning_rate": 1.206538154347318e-05, "loss": 2.3619, "step": 435060 }, { "epoch": 0.76, "learning_rate": 1.2064509603546355e-05, "loss": 2.3582, "step": 435070 }, { "epoch": 0.76, "learning_rate": 1.2063637663619527e-05, "loss": 2.2134, "step": 435080 }, { "epoch": 0.76, "learning_rate": 1.20627657236927e-05, "loss": 2.2489, "step": 435090 }, { "epoch": 0.76, "learning_rate": 1.2061893783765874e-05, "loss": 2.2232, "step": 435100 }, { "epoch": 0.76, "learning_rate": 1.2061021843839048e-05, "loss": 2.3629, "step": 435110 }, { "epoch": 0.76, "learning_rate": 1.2060149903912222e-05, "loss": 2.2823, "step": 435120 }, { "epoch": 0.76, "learning_rate": 1.2059277963985394e-05, "loss": 2.1805, "step": 435130 }, { "epoch": 0.76, "learning_rate": 1.2058406024058568e-05, "loss": 2.1763, "step": 435140 }, { "epoch": 0.76, "learning_rate": 1.205753408413174e-05, "loss": 2.2928, "step": 435150 }, { "epoch": 0.76, "learning_rate": 1.2056662144204913e-05, "loss": 2.206, "step": 435160 }, { "epoch": 0.76, "learning_rate": 1.2055790204278085e-05, "loss": 2.2718, "step": 435170 }, { "epoch": 0.76, "learning_rate": 1.2054918264351261e-05, "loss": 2.3268, "step": 435180 }, { "epoch": 0.76, "learning_rate": 1.2054046324424433e-05, "loss": 2.3362, "step": 435190 }, { "epoch": 0.76, "learning_rate": 1.2053174384497607e-05, "loss": 2.1401, "step": 435200 }, { "epoch": 0.76, "learning_rate": 1.2052302444570779e-05, "loss": 2.3287, "step": 435210 }, { "epoch": 0.76, "learning_rate": 1.2051430504643953e-05, "loss": 2.2279, "step": 435220 }, { "epoch": 0.76, "learning_rate": 1.2050558564717126e-05, "loss": 2.2728, "step": 435230 }, { "epoch": 0.76, "learning_rate": 1.2049686624790298e-05, "loss": 2.327, "step": 435240 }, { "epoch": 0.76, "learning_rate": 1.2048814684863472e-05, "loss": 2.2526, "step": 435250 }, { "epoch": 0.76, "learning_rate": 1.2047942744936646e-05, "loss": 2.2893, "step": 435260 }, { "epoch": 0.76, "learning_rate": 1.204707080500982e-05, "loss": 2.2525, "step": 435270 }, { "epoch": 0.76, "learning_rate": 1.2046198865082992e-05, "loss": 2.2365, "step": 435280 }, { "epoch": 0.76, "learning_rate": 1.2045326925156166e-05, "loss": 2.3474, "step": 435290 }, { "epoch": 0.76, "learning_rate": 1.2044454985229338e-05, "loss": 2.3316, "step": 435300 }, { "epoch": 0.76, "learning_rate": 1.2043583045302511e-05, "loss": 2.3184, "step": 435310 }, { "epoch": 0.76, "learning_rate": 1.2042711105375684e-05, "loss": 2.3553, "step": 435320 }, { "epoch": 0.76, "learning_rate": 1.2041839165448857e-05, "loss": 2.2137, "step": 435330 }, { "epoch": 0.76, "learning_rate": 1.2040967225522031e-05, "loss": 2.2568, "step": 435340 }, { "epoch": 0.76, "learning_rate": 1.2040095285595205e-05, "loss": 2.4449, "step": 435350 }, { "epoch": 0.76, "learning_rate": 1.2039223345668377e-05, "loss": 2.1973, "step": 435360 }, { "epoch": 0.76, "learning_rate": 1.203835140574155e-05, "loss": 2.2499, "step": 435370 }, { "epoch": 0.76, "learning_rate": 1.2037479465814724e-05, "loss": 2.1725, "step": 435380 }, { "epoch": 0.76, "learning_rate": 1.2036607525887897e-05, "loss": 2.3479, "step": 435390 }, { "epoch": 0.76, "learning_rate": 1.203573558596107e-05, "loss": 2.2611, "step": 435400 }, { "epoch": 0.76, "learning_rate": 1.2034863646034242e-05, "loss": 2.3087, "step": 435410 }, { "epoch": 0.76, "learning_rate": 1.2033991706107418e-05, "loss": 2.2493, "step": 435420 }, { "epoch": 0.76, "learning_rate": 1.203311976618059e-05, "loss": 2.2386, "step": 435430 }, { "epoch": 0.76, "learning_rate": 1.2032247826253764e-05, "loss": 2.3229, "step": 435440 }, { "epoch": 0.76, "learning_rate": 1.2031375886326936e-05, "loss": 2.2988, "step": 435450 }, { "epoch": 0.76, "learning_rate": 1.203050394640011e-05, "loss": 2.3215, "step": 435460 }, { "epoch": 0.76, "learning_rate": 1.2029632006473282e-05, "loss": 2.3625, "step": 435470 }, { "epoch": 0.76, "learning_rate": 1.2028760066546455e-05, "loss": 2.2332, "step": 435480 }, { "epoch": 0.76, "learning_rate": 1.2027888126619629e-05, "loss": 2.2513, "step": 435490 }, { "epoch": 0.76, "learning_rate": 1.2027016186692803e-05, "loss": 2.2617, "step": 435500 }, { "epoch": 0.76, "learning_rate": 1.2026144246765977e-05, "loss": 2.3146, "step": 435510 }, { "epoch": 0.76, "learning_rate": 1.2025272306839149e-05, "loss": 2.195, "step": 435520 }, { "epoch": 0.76, "learning_rate": 1.2024400366912323e-05, "loss": 2.2957, "step": 435530 }, { "epoch": 0.76, "learning_rate": 1.2023528426985495e-05, "loss": 2.2153, "step": 435540 }, { "epoch": 0.76, "learning_rate": 1.2022656487058668e-05, "loss": 2.2859, "step": 435550 }, { "epoch": 0.76, "learning_rate": 1.202178454713184e-05, "loss": 2.3039, "step": 435560 }, { "epoch": 0.76, "learning_rate": 1.2020912607205014e-05, "loss": 2.4033, "step": 435570 }, { "epoch": 0.76, "learning_rate": 1.2020040667278188e-05, "loss": 2.2287, "step": 435580 }, { "epoch": 0.76, "learning_rate": 1.2019168727351362e-05, "loss": 2.3503, "step": 435590 }, { "epoch": 0.76, "learning_rate": 1.2018296787424534e-05, "loss": 2.4052, "step": 435600 }, { "epoch": 0.76, "learning_rate": 1.2017424847497708e-05, "loss": 2.3102, "step": 435610 }, { "epoch": 0.76, "learning_rate": 1.201655290757088e-05, "loss": 2.3511, "step": 435620 }, { "epoch": 0.76, "learning_rate": 1.2015680967644053e-05, "loss": 2.3118, "step": 435630 }, { "epoch": 0.76, "learning_rate": 1.2014809027717227e-05, "loss": 2.3303, "step": 435640 }, { "epoch": 0.76, "learning_rate": 1.20139370877904e-05, "loss": 2.249, "step": 435650 }, { "epoch": 0.76, "learning_rate": 1.2013065147863573e-05, "loss": 2.3284, "step": 435660 }, { "epoch": 0.76, "learning_rate": 1.2012193207936747e-05, "loss": 2.2634, "step": 435670 }, { "epoch": 0.76, "learning_rate": 1.201132126800992e-05, "loss": 2.3045, "step": 435680 }, { "epoch": 0.76, "learning_rate": 1.2010449328083093e-05, "loss": 2.2956, "step": 435690 }, { "epoch": 0.76, "learning_rate": 1.2009577388156266e-05, "loss": 2.3301, "step": 435700 }, { "epoch": 0.76, "learning_rate": 1.2008705448229439e-05, "loss": 2.277, "step": 435710 }, { "epoch": 0.76, "learning_rate": 1.2007833508302612e-05, "loss": 2.2494, "step": 435720 }, { "epoch": 0.76, "learning_rate": 1.2006961568375786e-05, "loss": 2.3249, "step": 435730 }, { "epoch": 0.76, "learning_rate": 1.200608962844896e-05, "loss": 2.2809, "step": 435740 }, { "epoch": 0.76, "learning_rate": 1.2005217688522132e-05, "loss": 2.1963, "step": 435750 }, { "epoch": 0.76, "learning_rate": 1.2004345748595306e-05, "loss": 2.2939, "step": 435760 }, { "epoch": 0.76, "learning_rate": 1.200347380866848e-05, "loss": 2.3309, "step": 435770 }, { "epoch": 0.76, "learning_rate": 1.2002601868741652e-05, "loss": 2.2723, "step": 435780 }, { "epoch": 0.76, "learning_rate": 1.2001729928814825e-05, "loss": 2.2678, "step": 435790 }, { "epoch": 0.76, "learning_rate": 1.2000857988887997e-05, "loss": 2.2241, "step": 435800 }, { "epoch": 0.76, "learning_rate": 1.1999986048961171e-05, "loss": 2.2807, "step": 435810 }, { "epoch": 0.76, "learning_rate": 1.1999114109034345e-05, "loss": 2.2729, "step": 435820 }, { "epoch": 0.76, "learning_rate": 1.1998242169107519e-05, "loss": 2.2196, "step": 435830 }, { "epoch": 0.76, "learning_rate": 1.199737022918069e-05, "loss": 2.3225, "step": 435840 }, { "epoch": 0.76, "learning_rate": 1.1996498289253865e-05, "loss": 2.3192, "step": 435850 }, { "epoch": 0.76, "learning_rate": 1.1995626349327037e-05, "loss": 2.2917, "step": 435860 }, { "epoch": 0.76, "learning_rate": 1.199475440940021e-05, "loss": 2.263, "step": 435870 }, { "epoch": 0.76, "learning_rate": 1.1993882469473382e-05, "loss": 2.2684, "step": 435880 }, { "epoch": 0.76, "learning_rate": 1.1993010529546556e-05, "loss": 2.3755, "step": 435890 }, { "epoch": 0.76, "learning_rate": 1.199213858961973e-05, "loss": 2.2566, "step": 435900 }, { "epoch": 0.76, "learning_rate": 1.1991266649692904e-05, "loss": 2.2614, "step": 435910 }, { "epoch": 0.76, "learning_rate": 1.1990394709766078e-05, "loss": 2.3387, "step": 435920 }, { "epoch": 0.76, "learning_rate": 1.198952276983925e-05, "loss": 2.343, "step": 435930 }, { "epoch": 0.76, "learning_rate": 1.1988650829912423e-05, "loss": 2.277, "step": 435940 }, { "epoch": 0.76, "learning_rate": 1.1987778889985595e-05, "loss": 2.2908, "step": 435950 }, { "epoch": 0.76, "learning_rate": 1.198690695005877e-05, "loss": 2.2535, "step": 435960 }, { "epoch": 0.76, "learning_rate": 1.1986035010131941e-05, "loss": 2.2077, "step": 435970 }, { "epoch": 0.76, "learning_rate": 1.1985163070205117e-05, "loss": 2.3141, "step": 435980 }, { "epoch": 0.76, "learning_rate": 1.1984291130278289e-05, "loss": 2.3001, "step": 435990 }, { "epoch": 0.76, "learning_rate": 1.1983419190351463e-05, "loss": 2.3169, "step": 436000 }, { "epoch": 0.76, "learning_rate": 1.1982547250424635e-05, "loss": 2.3274, "step": 436010 }, { "epoch": 0.76, "learning_rate": 1.1981675310497808e-05, "loss": 2.2395, "step": 436020 }, { "epoch": 0.76, "learning_rate": 1.1980803370570982e-05, "loss": 2.263, "step": 436030 }, { "epoch": 0.76, "learning_rate": 1.1979931430644154e-05, "loss": 2.2891, "step": 436040 }, { "epoch": 0.76, "learning_rate": 1.1979059490717328e-05, "loss": 2.1914, "step": 436050 }, { "epoch": 0.76, "learning_rate": 1.1978187550790502e-05, "loss": 2.2523, "step": 436060 }, { "epoch": 0.76, "learning_rate": 1.1977315610863676e-05, "loss": 2.3598, "step": 436070 }, { "epoch": 0.76, "learning_rate": 1.1976443670936848e-05, "loss": 2.1507, "step": 436080 }, { "epoch": 0.76, "learning_rate": 1.1975571731010021e-05, "loss": 2.2127, "step": 436090 }, { "epoch": 0.76, "learning_rate": 1.1974699791083194e-05, "loss": 2.3488, "step": 436100 }, { "epoch": 0.76, "learning_rate": 1.1973827851156367e-05, "loss": 2.4749, "step": 436110 }, { "epoch": 0.76, "learning_rate": 1.197295591122954e-05, "loss": 2.4008, "step": 436120 }, { "epoch": 0.76, "learning_rate": 1.1972083971302713e-05, "loss": 2.3095, "step": 436130 }, { "epoch": 0.76, "learning_rate": 1.1971212031375887e-05, "loss": 2.2396, "step": 436140 }, { "epoch": 0.76, "learning_rate": 1.197034009144906e-05, "loss": 2.3284, "step": 436150 }, { "epoch": 0.76, "learning_rate": 1.1969468151522233e-05, "loss": 2.2921, "step": 436160 }, { "epoch": 0.76, "learning_rate": 1.1968596211595407e-05, "loss": 2.1272, "step": 436170 }, { "epoch": 0.76, "learning_rate": 1.196772427166858e-05, "loss": 2.2505, "step": 436180 }, { "epoch": 0.76, "learning_rate": 1.1966852331741752e-05, "loss": 2.4698, "step": 436190 }, { "epoch": 0.76, "learning_rate": 1.1965980391814926e-05, "loss": 2.2598, "step": 436200 }, { "epoch": 0.76, "learning_rate": 1.1965108451888098e-05, "loss": 2.2108, "step": 436210 }, { "epoch": 0.76, "learning_rate": 1.1964236511961274e-05, "loss": 2.2687, "step": 436220 }, { "epoch": 0.76, "learning_rate": 1.1963364572034446e-05, "loss": 2.3736, "step": 436230 }, { "epoch": 0.76, "learning_rate": 1.196249263210762e-05, "loss": 2.2154, "step": 436240 }, { "epoch": 0.76, "learning_rate": 1.1961620692180792e-05, "loss": 2.3473, "step": 436250 }, { "epoch": 0.76, "learning_rate": 1.1960748752253965e-05, "loss": 2.3345, "step": 436260 }, { "epoch": 0.76, "learning_rate": 1.1959876812327137e-05, "loss": 2.3999, "step": 436270 }, { "epoch": 0.76, "learning_rate": 1.1959004872400311e-05, "loss": 2.3477, "step": 436280 }, { "epoch": 0.76, "learning_rate": 1.1958132932473485e-05, "loss": 2.2641, "step": 436290 }, { "epoch": 0.76, "learning_rate": 1.1957260992546659e-05, "loss": 2.2217, "step": 436300 }, { "epoch": 0.76, "learning_rate": 1.1956389052619833e-05, "loss": 2.279, "step": 436310 }, { "epoch": 0.76, "learning_rate": 1.1955517112693005e-05, "loss": 2.2767, "step": 436320 }, { "epoch": 0.76, "learning_rate": 1.1954645172766178e-05, "loss": 2.3269, "step": 436330 }, { "epoch": 0.76, "learning_rate": 1.195377323283935e-05, "loss": 2.329, "step": 436340 }, { "epoch": 0.76, "learning_rate": 1.1952901292912524e-05, "loss": 2.35, "step": 436350 }, { "epoch": 0.76, "learning_rate": 1.1952029352985696e-05, "loss": 2.3343, "step": 436360 }, { "epoch": 0.76, "learning_rate": 1.195115741305887e-05, "loss": 2.305, "step": 436370 }, { "epoch": 0.76, "learning_rate": 1.1950285473132044e-05, "loss": 2.3208, "step": 436380 }, { "epoch": 0.76, "learning_rate": 1.1949413533205218e-05, "loss": 2.1747, "step": 436390 }, { "epoch": 0.76, "learning_rate": 1.194854159327839e-05, "loss": 2.2471, "step": 436400 }, { "epoch": 0.76, "learning_rate": 1.1947669653351563e-05, "loss": 2.2062, "step": 436410 }, { "epoch": 0.76, "learning_rate": 1.1946797713424736e-05, "loss": 2.293, "step": 436420 }, { "epoch": 0.76, "learning_rate": 1.194592577349791e-05, "loss": 2.3584, "step": 436430 }, { "epoch": 0.76, "learning_rate": 1.1945053833571083e-05, "loss": 2.2629, "step": 436440 }, { "epoch": 0.76, "learning_rate": 1.1944181893644255e-05, "loss": 2.2457, "step": 436450 }, { "epoch": 0.76, "learning_rate": 1.194330995371743e-05, "loss": 2.233, "step": 436460 }, { "epoch": 0.76, "learning_rate": 1.1942438013790603e-05, "loss": 2.2983, "step": 436470 }, { "epoch": 0.76, "learning_rate": 1.1941566073863776e-05, "loss": 2.2692, "step": 436480 }, { "epoch": 0.76, "learning_rate": 1.1940694133936949e-05, "loss": 2.3063, "step": 436490 }, { "epoch": 0.76, "learning_rate": 1.1939822194010122e-05, "loss": 2.2382, "step": 436500 }, { "epoch": 0.76, "learning_rate": 1.1938950254083294e-05, "loss": 2.1981, "step": 436510 }, { "epoch": 0.76, "learning_rate": 1.1938078314156468e-05, "loss": 2.3661, "step": 436520 }, { "epoch": 0.76, "learning_rate": 1.1937206374229642e-05, "loss": 2.2696, "step": 436530 }, { "epoch": 0.76, "learning_rate": 1.1936334434302816e-05, "loss": 2.1254, "step": 436540 }, { "epoch": 0.76, "learning_rate": 1.1935462494375988e-05, "loss": 2.3049, "step": 436550 }, { "epoch": 0.76, "learning_rate": 1.1934590554449162e-05, "loss": 2.2027, "step": 436560 }, { "epoch": 0.76, "learning_rate": 1.1933718614522335e-05, "loss": 2.2369, "step": 436570 }, { "epoch": 0.76, "learning_rate": 1.1932846674595507e-05, "loss": 2.288, "step": 436580 }, { "epoch": 0.76, "learning_rate": 1.1931974734668681e-05, "loss": 2.2328, "step": 436590 }, { "epoch": 0.76, "learning_rate": 1.1931102794741853e-05, "loss": 2.2589, "step": 436600 }, { "epoch": 0.76, "learning_rate": 1.1930230854815027e-05, "loss": 2.2404, "step": 436610 }, { "epoch": 0.76, "learning_rate": 1.19293589148882e-05, "loss": 2.3324, "step": 436620 }, { "epoch": 0.76, "learning_rate": 1.1928486974961375e-05, "loss": 2.3032, "step": 436630 }, { "epoch": 0.76, "learning_rate": 1.1927615035034547e-05, "loss": 2.264, "step": 436640 }, { "epoch": 0.76, "learning_rate": 1.192674309510772e-05, "loss": 2.2035, "step": 436650 }, { "epoch": 0.76, "learning_rate": 1.1925871155180892e-05, "loss": 2.3162, "step": 436660 }, { "epoch": 0.76, "learning_rate": 1.1924999215254066e-05, "loss": 2.3383, "step": 436670 }, { "epoch": 0.76, "learning_rate": 1.1924127275327238e-05, "loss": 2.14, "step": 436680 }, { "epoch": 0.76, "learning_rate": 1.1923255335400412e-05, "loss": 2.3076, "step": 436690 }, { "epoch": 0.76, "learning_rate": 1.1922383395473586e-05, "loss": 2.3565, "step": 436700 }, { "epoch": 0.76, "learning_rate": 1.192151145554676e-05, "loss": 2.2616, "step": 436710 }, { "epoch": 0.76, "learning_rate": 1.1920639515619933e-05, "loss": 2.1697, "step": 436720 }, { "epoch": 0.76, "learning_rate": 1.1919767575693105e-05, "loss": 2.2209, "step": 436730 }, { "epoch": 0.76, "learning_rate": 1.191889563576628e-05, "loss": 2.3401, "step": 436740 }, { "epoch": 0.76, "learning_rate": 1.1918023695839451e-05, "loss": 2.2343, "step": 436750 }, { "epoch": 0.76, "learning_rate": 1.1917151755912625e-05, "loss": 2.2252, "step": 436760 }, { "epoch": 0.76, "learning_rate": 1.1916279815985799e-05, "loss": 2.3167, "step": 436770 }, { "epoch": 0.76, "learning_rate": 1.1915407876058973e-05, "loss": 2.3346, "step": 436780 }, { "epoch": 0.76, "learning_rate": 1.1914535936132145e-05, "loss": 2.305, "step": 436790 }, { "epoch": 0.76, "learning_rate": 1.1913663996205318e-05, "loss": 2.385, "step": 436800 }, { "epoch": 0.76, "learning_rate": 1.191279205627849e-05, "loss": 2.4493, "step": 436810 }, { "epoch": 0.76, "learning_rate": 1.1911920116351664e-05, "loss": 2.2704, "step": 436820 }, { "epoch": 0.76, "learning_rate": 1.1911048176424838e-05, "loss": 2.4191, "step": 436830 }, { "epoch": 0.76, "learning_rate": 1.191017623649801e-05, "loss": 2.2549, "step": 436840 }, { "epoch": 0.76, "learning_rate": 1.1909304296571184e-05, "loss": 2.3122, "step": 436850 }, { "epoch": 0.76, "learning_rate": 1.1908432356644358e-05, "loss": 2.49, "step": 436860 }, { "epoch": 0.76, "learning_rate": 1.1907560416717531e-05, "loss": 2.3083, "step": 436870 }, { "epoch": 0.76, "learning_rate": 1.1906688476790704e-05, "loss": 2.2988, "step": 436880 }, { "epoch": 0.76, "learning_rate": 1.1905816536863877e-05, "loss": 2.2913, "step": 436890 }, { "epoch": 0.76, "learning_rate": 1.190494459693705e-05, "loss": 2.3435, "step": 436900 }, { "epoch": 0.76, "learning_rate": 1.1904072657010223e-05, "loss": 2.1962, "step": 436910 }, { "epoch": 0.76, "learning_rate": 1.1903200717083395e-05, "loss": 2.2966, "step": 436920 }, { "epoch": 0.76, "learning_rate": 1.1902328777156569e-05, "loss": 2.266, "step": 436930 }, { "epoch": 0.76, "learning_rate": 1.1901456837229743e-05, "loss": 2.1955, "step": 436940 }, { "epoch": 0.76, "learning_rate": 1.1900584897302917e-05, "loss": 2.289, "step": 436950 }, { "epoch": 0.76, "learning_rate": 1.189971295737609e-05, "loss": 2.1969, "step": 436960 }, { "epoch": 0.76, "learning_rate": 1.1898841017449262e-05, "loss": 2.2713, "step": 436970 }, { "epoch": 0.76, "learning_rate": 1.1897969077522436e-05, "loss": 2.2985, "step": 436980 }, { "epoch": 0.76, "learning_rate": 1.1897097137595608e-05, "loss": 2.4081, "step": 436990 }, { "epoch": 0.76, "learning_rate": 1.1896225197668782e-05, "loss": 2.2888, "step": 437000 }, { "epoch": 0.76, "learning_rate": 1.1895353257741954e-05, "loss": 2.2729, "step": 437010 }, { "epoch": 0.76, "learning_rate": 1.189448131781513e-05, "loss": 2.2797, "step": 437020 }, { "epoch": 0.76, "learning_rate": 1.1893609377888302e-05, "loss": 2.3011, "step": 437030 }, { "epoch": 0.76, "learning_rate": 1.1892737437961475e-05, "loss": 2.2451, "step": 437040 }, { "epoch": 0.76, "learning_rate": 1.1891865498034647e-05, "loss": 2.1881, "step": 437050 }, { "epoch": 0.76, "learning_rate": 1.1890993558107821e-05, "loss": 2.0864, "step": 437060 }, { "epoch": 0.76, "learning_rate": 1.1890121618180993e-05, "loss": 2.2867, "step": 437070 }, { "epoch": 0.76, "learning_rate": 1.1889249678254167e-05, "loss": 2.3077, "step": 437080 }, { "epoch": 0.76, "learning_rate": 1.1888377738327341e-05, "loss": 2.2078, "step": 437090 }, { "epoch": 0.76, "learning_rate": 1.1887505798400515e-05, "loss": 2.3033, "step": 437100 }, { "epoch": 0.76, "learning_rate": 1.1886633858473688e-05, "loss": 2.453, "step": 437110 }, { "epoch": 0.76, "learning_rate": 1.188576191854686e-05, "loss": 2.2234, "step": 437120 }, { "epoch": 0.76, "learning_rate": 1.1884889978620034e-05, "loss": 2.2932, "step": 437130 }, { "epoch": 0.76, "learning_rate": 1.1884018038693206e-05, "loss": 2.1201, "step": 437140 }, { "epoch": 0.76, "learning_rate": 1.188314609876638e-05, "loss": 2.259, "step": 437150 }, { "epoch": 0.76, "learning_rate": 1.1882274158839552e-05, "loss": 2.2026, "step": 437160 }, { "epoch": 0.76, "learning_rate": 1.1881402218912726e-05, "loss": 2.3185, "step": 437170 }, { "epoch": 0.76, "learning_rate": 1.18805302789859e-05, "loss": 2.3925, "step": 437180 }, { "epoch": 0.76, "learning_rate": 1.1879658339059073e-05, "loss": 2.3445, "step": 437190 }, { "epoch": 0.76, "learning_rate": 1.1878786399132246e-05, "loss": 2.3259, "step": 437200 }, { "epoch": 0.76, "learning_rate": 1.187791445920542e-05, "loss": 2.2819, "step": 437210 }, { "epoch": 0.76, "learning_rate": 1.1877042519278591e-05, "loss": 2.3233, "step": 437220 }, { "epoch": 0.76, "learning_rate": 1.1876170579351765e-05, "loss": 2.325, "step": 437230 }, { "epoch": 0.76, "learning_rate": 1.1875298639424939e-05, "loss": 2.3831, "step": 437240 }, { "epoch": 0.76, "learning_rate": 1.1874426699498111e-05, "loss": 2.2647, "step": 437250 }, { "epoch": 0.76, "learning_rate": 1.1873554759571286e-05, "loss": 2.2267, "step": 437260 }, { "epoch": 0.76, "learning_rate": 1.1872682819644459e-05, "loss": 2.2798, "step": 437270 }, { "epoch": 0.76, "learning_rate": 1.1871810879717632e-05, "loss": 2.2716, "step": 437280 }, { "epoch": 0.76, "learning_rate": 1.1870938939790804e-05, "loss": 2.3968, "step": 437290 }, { "epoch": 0.76, "learning_rate": 1.1870066999863978e-05, "loss": 2.2871, "step": 437300 }, { "epoch": 0.76, "learning_rate": 1.186919505993715e-05, "loss": 2.2939, "step": 437310 }, { "epoch": 0.76, "learning_rate": 1.1868323120010324e-05, "loss": 2.1815, "step": 437320 }, { "epoch": 0.76, "learning_rate": 1.1867451180083498e-05, "loss": 2.336, "step": 437330 }, { "epoch": 0.76, "learning_rate": 1.1866579240156672e-05, "loss": 2.2191, "step": 437340 }, { "epoch": 0.76, "learning_rate": 1.1865707300229844e-05, "loss": 2.3454, "step": 437350 }, { "epoch": 0.76, "learning_rate": 1.1864835360303017e-05, "loss": 2.4072, "step": 437360 }, { "epoch": 0.76, "learning_rate": 1.1863963420376191e-05, "loss": 2.2659, "step": 437370 }, { "epoch": 0.76, "learning_rate": 1.1863091480449363e-05, "loss": 2.2704, "step": 437380 }, { "epoch": 0.76, "learning_rate": 1.1862219540522537e-05, "loss": 2.1928, "step": 437390 }, { "epoch": 0.76, "learning_rate": 1.1861347600595709e-05, "loss": 2.3157, "step": 437400 }, { "epoch": 0.76, "learning_rate": 1.1860475660668883e-05, "loss": 2.1856, "step": 437410 }, { "epoch": 0.76, "learning_rate": 1.1859603720742057e-05, "loss": 2.3807, "step": 437420 }, { "epoch": 0.76, "learning_rate": 1.185873178081523e-05, "loss": 2.3126, "step": 437430 }, { "epoch": 0.76, "learning_rate": 1.1857859840888402e-05, "loss": 2.2362, "step": 437440 }, { "epoch": 0.76, "learning_rate": 1.1856987900961576e-05, "loss": 2.3099, "step": 437450 }, { "epoch": 0.76, "learning_rate": 1.1856115961034748e-05, "loss": 2.2985, "step": 437460 }, { "epoch": 0.76, "learning_rate": 1.1855244021107922e-05, "loss": 2.3315, "step": 437470 }, { "epoch": 0.76, "learning_rate": 1.1854372081181094e-05, "loss": 2.2503, "step": 437480 }, { "epoch": 0.76, "learning_rate": 1.1853500141254268e-05, "loss": 2.3502, "step": 437490 }, { "epoch": 0.76, "learning_rate": 1.1852628201327443e-05, "loss": 2.2484, "step": 437500 }, { "epoch": 0.76, "learning_rate": 1.1851756261400615e-05, "loss": 2.3198, "step": 437510 }, { "epoch": 0.76, "learning_rate": 1.185088432147379e-05, "loss": 2.3559, "step": 437520 }, { "epoch": 0.76, "learning_rate": 1.1850012381546961e-05, "loss": 2.2279, "step": 437530 }, { "epoch": 0.76, "learning_rate": 1.1849140441620135e-05, "loss": 2.2293, "step": 437540 }, { "epoch": 0.76, "learning_rate": 1.1848268501693307e-05, "loss": 2.3317, "step": 437550 }, { "epoch": 0.76, "learning_rate": 1.1847396561766481e-05, "loss": 2.3056, "step": 437560 }, { "epoch": 0.76, "learning_rate": 1.1846524621839655e-05, "loss": 2.3609, "step": 437570 }, { "epoch": 0.76, "learning_rate": 1.1845652681912828e-05, "loss": 2.2955, "step": 437580 }, { "epoch": 0.76, "learning_rate": 1.1844780741986e-05, "loss": 2.2439, "step": 437590 }, { "epoch": 0.76, "learning_rate": 1.1843908802059174e-05, "loss": 2.2649, "step": 437600 }, { "epoch": 0.76, "learning_rate": 1.1843036862132346e-05, "loss": 2.2604, "step": 437610 }, { "epoch": 0.76, "learning_rate": 1.184216492220552e-05, "loss": 2.2809, "step": 437620 }, { "epoch": 0.76, "learning_rate": 1.1841292982278694e-05, "loss": 2.2751, "step": 437630 }, { "epoch": 0.76, "learning_rate": 1.1840421042351866e-05, "loss": 2.3787, "step": 437640 }, { "epoch": 0.76, "learning_rate": 1.183954910242504e-05, "loss": 2.368, "step": 437650 }, { "epoch": 0.76, "learning_rate": 1.1838677162498214e-05, "loss": 2.2282, "step": 437660 }, { "epoch": 0.76, "learning_rate": 1.1837805222571387e-05, "loss": 2.2739, "step": 437670 }, { "epoch": 0.76, "learning_rate": 1.183693328264456e-05, "loss": 2.3552, "step": 437680 }, { "epoch": 0.76, "learning_rate": 1.1836061342717733e-05, "loss": 2.0246, "step": 437690 }, { "epoch": 0.76, "learning_rate": 1.1835189402790905e-05, "loss": 2.241, "step": 437700 }, { "epoch": 0.76, "learning_rate": 1.1834317462864079e-05, "loss": 2.3704, "step": 437710 }, { "epoch": 0.76, "learning_rate": 1.1833445522937251e-05, "loss": 2.1794, "step": 437720 }, { "epoch": 0.76, "learning_rate": 1.1832573583010425e-05, "loss": 2.1826, "step": 437730 }, { "epoch": 0.76, "learning_rate": 1.1831701643083599e-05, "loss": 2.3267, "step": 437740 }, { "epoch": 0.76, "learning_rate": 1.1830829703156772e-05, "loss": 2.2485, "step": 437750 }, { "epoch": 0.76, "learning_rate": 1.1829957763229946e-05, "loss": 2.3579, "step": 437760 }, { "epoch": 0.76, "learning_rate": 1.1829085823303118e-05, "loss": 2.1757, "step": 437770 }, { "epoch": 0.76, "learning_rate": 1.1828213883376292e-05, "loss": 2.3029, "step": 437780 }, { "epoch": 0.76, "learning_rate": 1.1827341943449464e-05, "loss": 2.2348, "step": 437790 }, { "epoch": 0.76, "learning_rate": 1.1826470003522638e-05, "loss": 2.3018, "step": 437800 }, { "epoch": 0.76, "learning_rate": 1.1825598063595812e-05, "loss": 2.2963, "step": 437810 }, { "epoch": 0.76, "learning_rate": 1.1824726123668985e-05, "loss": 2.3649, "step": 437820 }, { "epoch": 0.76, "learning_rate": 1.1823854183742157e-05, "loss": 2.2898, "step": 437830 }, { "epoch": 0.76, "learning_rate": 1.1822982243815331e-05, "loss": 2.2651, "step": 437840 }, { "epoch": 0.76, "learning_rate": 1.1822110303888503e-05, "loss": 2.2584, "step": 437850 }, { "epoch": 0.76, "learning_rate": 1.1821238363961677e-05, "loss": 2.328, "step": 437860 }, { "epoch": 0.76, "learning_rate": 1.182036642403485e-05, "loss": 2.2122, "step": 437870 }, { "epoch": 0.76, "learning_rate": 1.1819494484108023e-05, "loss": 2.1238, "step": 437880 }, { "epoch": 0.76, "learning_rate": 1.1818622544181197e-05, "loss": 2.2369, "step": 437890 }, { "epoch": 0.76, "learning_rate": 1.181775060425437e-05, "loss": 2.2601, "step": 437900 }, { "epoch": 0.76, "learning_rate": 1.1816878664327544e-05, "loss": 2.3041, "step": 437910 }, { "epoch": 0.76, "learning_rate": 1.1816006724400716e-05, "loss": 2.2176, "step": 437920 }, { "epoch": 0.76, "learning_rate": 1.181513478447389e-05, "loss": 2.2778, "step": 437930 }, { "epoch": 0.76, "learning_rate": 1.1814262844547062e-05, "loss": 2.2285, "step": 437940 }, { "epoch": 0.76, "learning_rate": 1.1813390904620236e-05, "loss": 2.267, "step": 437950 }, { "epoch": 0.76, "learning_rate": 1.1812518964693408e-05, "loss": 2.2607, "step": 437960 }, { "epoch": 0.76, "learning_rate": 1.1811647024766582e-05, "loss": 2.3241, "step": 437970 }, { "epoch": 0.76, "learning_rate": 1.1810775084839756e-05, "loss": 2.2849, "step": 437980 }, { "epoch": 0.76, "learning_rate": 1.180990314491293e-05, "loss": 2.3362, "step": 437990 }, { "epoch": 0.76, "learning_rate": 1.1809031204986101e-05, "loss": 2.3062, "step": 438000 }, { "epoch": 0.76, "learning_rate": 1.1808159265059275e-05, "loss": 2.195, "step": 438010 }, { "epoch": 0.76, "learning_rate": 1.1807287325132447e-05, "loss": 2.3272, "step": 438020 }, { "epoch": 0.76, "learning_rate": 1.1806415385205621e-05, "loss": 2.3001, "step": 438030 }, { "epoch": 0.76, "learning_rate": 1.1805543445278795e-05, "loss": 2.315, "step": 438040 }, { "epoch": 0.76, "learning_rate": 1.1804671505351967e-05, "loss": 2.1472, "step": 438050 }, { "epoch": 0.76, "learning_rate": 1.1803799565425142e-05, "loss": 2.2429, "step": 438060 }, { "epoch": 0.76, "learning_rate": 1.1802927625498314e-05, "loss": 2.2475, "step": 438070 }, { "epoch": 0.76, "learning_rate": 1.1802055685571488e-05, "loss": 2.2943, "step": 438080 }, { "epoch": 0.76, "learning_rate": 1.180118374564466e-05, "loss": 2.3692, "step": 438090 }, { "epoch": 0.76, "learning_rate": 1.1800311805717834e-05, "loss": 2.327, "step": 438100 }, { "epoch": 0.76, "learning_rate": 1.1799439865791006e-05, "loss": 2.2793, "step": 438110 }, { "epoch": 0.76, "learning_rate": 1.179856792586418e-05, "loss": 2.1828, "step": 438120 }, { "epoch": 0.76, "learning_rate": 1.1797695985937354e-05, "loss": 2.4025, "step": 438130 }, { "epoch": 0.76, "learning_rate": 1.1796824046010527e-05, "loss": 2.3, "step": 438140 }, { "epoch": 0.76, "learning_rate": 1.17959521060837e-05, "loss": 2.2573, "step": 438150 }, { "epoch": 0.76, "learning_rate": 1.1795080166156873e-05, "loss": 2.19, "step": 438160 }, { "epoch": 0.76, "learning_rate": 1.1794208226230047e-05, "loss": 2.274, "step": 438170 }, { "epoch": 0.76, "learning_rate": 1.1793336286303219e-05, "loss": 2.3055, "step": 438180 }, { "epoch": 0.76, "learning_rate": 1.1792464346376393e-05, "loss": 2.3269, "step": 438190 }, { "epoch": 0.76, "learning_rate": 1.1791592406449565e-05, "loss": 2.268, "step": 438200 }, { "epoch": 0.76, "learning_rate": 1.1790720466522739e-05, "loss": 2.2477, "step": 438210 }, { "epoch": 0.76, "learning_rate": 1.1789848526595912e-05, "loss": 2.2705, "step": 438220 }, { "epoch": 0.76, "learning_rate": 1.1788976586669086e-05, "loss": 2.2868, "step": 438230 }, { "epoch": 0.76, "learning_rate": 1.1788104646742258e-05, "loss": 2.2267, "step": 438240 }, { "epoch": 0.76, "learning_rate": 1.1787232706815432e-05, "loss": 2.264, "step": 438250 }, { "epoch": 0.76, "learning_rate": 1.1786360766888604e-05, "loss": 2.2902, "step": 438260 }, { "epoch": 0.76, "learning_rate": 1.1785488826961778e-05, "loss": 2.3549, "step": 438270 }, { "epoch": 0.76, "learning_rate": 1.178461688703495e-05, "loss": 2.2446, "step": 438280 }, { "epoch": 0.76, "learning_rate": 1.1783744947108124e-05, "loss": 2.3461, "step": 438290 }, { "epoch": 0.76, "learning_rate": 1.17828730071813e-05, "loss": 2.4054, "step": 438300 }, { "epoch": 0.76, "learning_rate": 1.1782001067254471e-05, "loss": 2.3446, "step": 438310 }, { "epoch": 0.76, "learning_rate": 1.1781129127327645e-05, "loss": 2.1767, "step": 438320 }, { "epoch": 0.76, "learning_rate": 1.1780257187400817e-05, "loss": 2.1974, "step": 438330 }, { "epoch": 0.76, "learning_rate": 1.1779385247473991e-05, "loss": 2.3541, "step": 438340 }, { "epoch": 0.76, "learning_rate": 1.1778513307547163e-05, "loss": 2.4266, "step": 438350 }, { "epoch": 0.76, "learning_rate": 1.1777641367620337e-05, "loss": 2.3797, "step": 438360 }, { "epoch": 0.76, "learning_rate": 1.177676942769351e-05, "loss": 2.3331, "step": 438370 }, { "epoch": 0.76, "learning_rate": 1.1775897487766684e-05, "loss": 2.3934, "step": 438380 }, { "epoch": 0.76, "learning_rate": 1.1775025547839856e-05, "loss": 2.2746, "step": 438390 }, { "epoch": 0.76, "learning_rate": 1.177415360791303e-05, "loss": 2.4004, "step": 438400 }, { "epoch": 0.76, "learning_rate": 1.1773281667986202e-05, "loss": 2.3522, "step": 438410 }, { "epoch": 0.76, "learning_rate": 1.1772409728059376e-05, "loss": 2.2364, "step": 438420 }, { "epoch": 0.76, "learning_rate": 1.177153778813255e-05, "loss": 2.1708, "step": 438430 }, { "epoch": 0.76, "learning_rate": 1.1770665848205722e-05, "loss": 2.2358, "step": 438440 }, { "epoch": 0.76, "learning_rate": 1.1769793908278896e-05, "loss": 2.2252, "step": 438450 }, { "epoch": 0.76, "learning_rate": 1.176892196835207e-05, "loss": 2.4012, "step": 438460 }, { "epoch": 0.76, "learning_rate": 1.1768050028425243e-05, "loss": 2.317, "step": 438470 }, { "epoch": 0.76, "learning_rate": 1.1767178088498415e-05, "loss": 2.3128, "step": 438480 }, { "epoch": 0.76, "learning_rate": 1.1766306148571589e-05, "loss": 2.415, "step": 438490 }, { "epoch": 0.76, "learning_rate": 1.1765434208644761e-05, "loss": 2.2636, "step": 438500 }, { "epoch": 0.76, "learning_rate": 1.1764562268717935e-05, "loss": 2.3215, "step": 438510 }, { "epoch": 0.76, "learning_rate": 1.1763690328791107e-05, "loss": 2.2097, "step": 438520 }, { "epoch": 0.76, "learning_rate": 1.176281838886428e-05, "loss": 2.1438, "step": 438530 }, { "epoch": 0.76, "learning_rate": 1.1761946448937454e-05, "loss": 2.265, "step": 438540 }, { "epoch": 0.76, "learning_rate": 1.1761074509010628e-05, "loss": 2.2696, "step": 438550 }, { "epoch": 0.76, "learning_rate": 1.1760202569083802e-05, "loss": 2.4999, "step": 438560 }, { "epoch": 0.76, "learning_rate": 1.1759330629156974e-05, "loss": 2.371, "step": 438570 }, { "epoch": 0.76, "learning_rate": 1.1758458689230148e-05, "loss": 2.2285, "step": 438580 }, { "epoch": 0.76, "learning_rate": 1.175758674930332e-05, "loss": 2.2791, "step": 438590 }, { "epoch": 0.76, "learning_rate": 1.1756714809376494e-05, "loss": 2.3049, "step": 438600 }, { "epoch": 0.76, "learning_rate": 1.1755842869449667e-05, "loss": 2.2164, "step": 438610 }, { "epoch": 0.76, "learning_rate": 1.1754970929522841e-05, "loss": 2.2926, "step": 438620 }, { "epoch": 0.76, "learning_rate": 1.1754098989596013e-05, "loss": 2.2853, "step": 438630 }, { "epoch": 0.76, "learning_rate": 1.1753227049669187e-05, "loss": 2.3771, "step": 438640 }, { "epoch": 0.76, "learning_rate": 1.175235510974236e-05, "loss": 2.3758, "step": 438650 }, { "epoch": 0.76, "learning_rate": 1.1751483169815533e-05, "loss": 2.3044, "step": 438660 }, { "epoch": 0.76, "learning_rate": 1.1750611229888705e-05, "loss": 2.1976, "step": 438670 }, { "epoch": 0.77, "learning_rate": 1.1749739289961879e-05, "loss": 2.2946, "step": 438680 }, { "epoch": 0.77, "learning_rate": 1.1748867350035053e-05, "loss": 2.1538, "step": 438690 }, { "epoch": 0.77, "learning_rate": 1.1747995410108226e-05, "loss": 2.2845, "step": 438700 }, { "epoch": 0.77, "learning_rate": 1.17471234701814e-05, "loss": 2.2547, "step": 438710 }, { "epoch": 0.77, "learning_rate": 1.1746251530254572e-05, "loss": 2.3169, "step": 438720 }, { "epoch": 0.77, "learning_rate": 1.1745379590327746e-05, "loss": 2.2718, "step": 438730 }, { "epoch": 0.77, "learning_rate": 1.1744507650400918e-05, "loss": 2.2979, "step": 438740 }, { "epoch": 0.77, "learning_rate": 1.1743635710474092e-05, "loss": 2.1868, "step": 438750 }, { "epoch": 0.77, "learning_rate": 1.1742763770547264e-05, "loss": 2.2695, "step": 438760 }, { "epoch": 0.77, "learning_rate": 1.1741891830620438e-05, "loss": 2.2908, "step": 438770 }, { "epoch": 0.77, "learning_rate": 1.1741019890693611e-05, "loss": 2.2445, "step": 438780 }, { "epoch": 0.77, "learning_rate": 1.1740147950766785e-05, "loss": 2.4076, "step": 438790 }, { "epoch": 0.77, "learning_rate": 1.1739276010839957e-05, "loss": 2.3065, "step": 438800 }, { "epoch": 0.77, "learning_rate": 1.1738404070913131e-05, "loss": 2.3337, "step": 438810 }, { "epoch": 0.77, "learning_rate": 1.1737532130986303e-05, "loss": 2.2239, "step": 438820 }, { "epoch": 0.77, "learning_rate": 1.1736660191059477e-05, "loss": 2.3039, "step": 438830 }, { "epoch": 0.77, "learning_rate": 1.173578825113265e-05, "loss": 2.3793, "step": 438840 }, { "epoch": 0.77, "learning_rate": 1.1734916311205824e-05, "loss": 2.239, "step": 438850 }, { "epoch": 0.77, "learning_rate": 1.1734044371278998e-05, "loss": 2.2663, "step": 438860 }, { "epoch": 0.77, "learning_rate": 1.173317243135217e-05, "loss": 2.1068, "step": 438870 }, { "epoch": 0.77, "learning_rate": 1.1732300491425344e-05, "loss": 2.1901, "step": 438880 }, { "epoch": 0.77, "learning_rate": 1.1731428551498516e-05, "loss": 2.229, "step": 438890 }, { "epoch": 0.77, "learning_rate": 1.173055661157169e-05, "loss": 2.2318, "step": 438900 }, { "epoch": 0.77, "learning_rate": 1.1729684671644862e-05, "loss": 2.1943, "step": 438910 }, { "epoch": 0.77, "learning_rate": 1.1728812731718036e-05, "loss": 2.2803, "step": 438920 }, { "epoch": 0.77, "learning_rate": 1.172794079179121e-05, "loss": 2.2416, "step": 438930 }, { "epoch": 0.77, "learning_rate": 1.1727068851864383e-05, "loss": 2.2278, "step": 438940 }, { "epoch": 0.77, "learning_rate": 1.1726196911937555e-05, "loss": 2.2074, "step": 438950 }, { "epoch": 0.77, "learning_rate": 1.1725324972010729e-05, "loss": 2.182, "step": 438960 }, { "epoch": 0.77, "learning_rate": 1.1724453032083903e-05, "loss": 2.2698, "step": 438970 }, { "epoch": 0.77, "learning_rate": 1.1723581092157075e-05, "loss": 2.2911, "step": 438980 }, { "epoch": 0.77, "learning_rate": 1.1722709152230249e-05, "loss": 2.3819, "step": 438990 }, { "epoch": 0.77, "learning_rate": 1.172183721230342e-05, "loss": 2.2482, "step": 439000 }, { "epoch": 0.77, "learning_rate": 1.1720965272376595e-05, "loss": 2.1293, "step": 439010 }, { "epoch": 0.77, "learning_rate": 1.1720093332449768e-05, "loss": 2.2876, "step": 439020 }, { "epoch": 0.77, "learning_rate": 1.1719221392522942e-05, "loss": 2.2393, "step": 439030 }, { "epoch": 0.77, "learning_rate": 1.1718349452596114e-05, "loss": 2.2584, "step": 439040 }, { "epoch": 0.77, "learning_rate": 1.1717477512669288e-05, "loss": 2.3677, "step": 439050 }, { "epoch": 0.77, "learning_rate": 1.171660557274246e-05, "loss": 2.2718, "step": 439060 }, { "epoch": 0.77, "learning_rate": 1.1715733632815634e-05, "loss": 2.2359, "step": 439070 }, { "epoch": 0.77, "learning_rate": 1.1714861692888806e-05, "loss": 2.2136, "step": 439080 }, { "epoch": 0.77, "learning_rate": 1.171398975296198e-05, "loss": 2.2367, "step": 439090 }, { "epoch": 0.77, "learning_rate": 1.1713117813035155e-05, "loss": 2.3731, "step": 439100 }, { "epoch": 0.77, "learning_rate": 1.1712245873108327e-05, "loss": 2.2727, "step": 439110 }, { "epoch": 0.77, "learning_rate": 1.1711373933181501e-05, "loss": 2.2035, "step": 439120 }, { "epoch": 0.77, "learning_rate": 1.1710501993254673e-05, "loss": 2.3439, "step": 439130 }, { "epoch": 0.77, "learning_rate": 1.1709630053327847e-05, "loss": 2.3064, "step": 439140 }, { "epoch": 0.77, "learning_rate": 1.1708758113401019e-05, "loss": 2.3385, "step": 439150 }, { "epoch": 0.77, "learning_rate": 1.1707886173474193e-05, "loss": 2.2957, "step": 439160 }, { "epoch": 0.77, "learning_rate": 1.1707014233547366e-05, "loss": 2.3467, "step": 439170 }, { "epoch": 0.77, "learning_rate": 1.170614229362054e-05, "loss": 2.3405, "step": 439180 }, { "epoch": 0.77, "learning_rate": 1.1705270353693712e-05, "loss": 2.3456, "step": 439190 }, { "epoch": 0.77, "learning_rate": 1.1704398413766886e-05, "loss": 2.3471, "step": 439200 }, { "epoch": 0.77, "learning_rate": 1.1703526473840058e-05, "loss": 2.3141, "step": 439210 }, { "epoch": 0.77, "learning_rate": 1.1702654533913232e-05, "loss": 2.3868, "step": 439220 }, { "epoch": 0.77, "learning_rate": 1.1701782593986406e-05, "loss": 2.2235, "step": 439230 }, { "epoch": 0.77, "learning_rate": 1.1700910654059578e-05, "loss": 2.189, "step": 439240 }, { "epoch": 0.77, "learning_rate": 1.1700038714132751e-05, "loss": 2.2305, "step": 439250 }, { "epoch": 0.77, "learning_rate": 1.1699166774205925e-05, "loss": 2.3076, "step": 439260 }, { "epoch": 0.77, "learning_rate": 1.1698294834279099e-05, "loss": 2.365, "step": 439270 }, { "epoch": 0.77, "learning_rate": 1.1697422894352271e-05, "loss": 2.3477, "step": 439280 }, { "epoch": 0.77, "learning_rate": 1.1696550954425445e-05, "loss": 2.3484, "step": 439290 }, { "epoch": 0.77, "learning_rate": 1.1695679014498617e-05, "loss": 2.2972, "step": 439300 }, { "epoch": 0.77, "learning_rate": 1.169480707457179e-05, "loss": 2.2838, "step": 439310 }, { "epoch": 0.77, "learning_rate": 1.1693935134644963e-05, "loss": 2.2388, "step": 439320 }, { "epoch": 0.77, "learning_rate": 1.1693063194718137e-05, "loss": 2.3089, "step": 439330 }, { "epoch": 0.77, "learning_rate": 1.169219125479131e-05, "loss": 2.2813, "step": 439340 }, { "epoch": 0.77, "learning_rate": 1.1691319314864484e-05, "loss": 2.4205, "step": 439350 }, { "epoch": 0.77, "learning_rate": 1.1690447374937658e-05, "loss": 2.3515, "step": 439360 }, { "epoch": 0.77, "learning_rate": 1.168957543501083e-05, "loss": 2.3287, "step": 439370 }, { "epoch": 0.77, "learning_rate": 1.1688703495084004e-05, "loss": 2.3202, "step": 439380 }, { "epoch": 0.77, "learning_rate": 1.1687831555157176e-05, "loss": 2.3228, "step": 439390 }, { "epoch": 0.77, "learning_rate": 1.168695961523035e-05, "loss": 2.265, "step": 439400 }, { "epoch": 0.77, "learning_rate": 1.1686087675303523e-05, "loss": 2.2284, "step": 439410 }, { "epoch": 0.77, "learning_rate": 1.1685215735376697e-05, "loss": 2.4191, "step": 439420 }, { "epoch": 0.77, "learning_rate": 1.168434379544987e-05, "loss": 2.3629, "step": 439430 }, { "epoch": 0.77, "learning_rate": 1.1683471855523043e-05, "loss": 2.3072, "step": 439440 }, { "epoch": 0.77, "learning_rate": 1.1682599915596215e-05, "loss": 2.2466, "step": 439450 }, { "epoch": 0.77, "learning_rate": 1.1681727975669389e-05, "loss": 2.3138, "step": 439460 }, { "epoch": 0.77, "learning_rate": 1.1680856035742561e-05, "loss": 2.285, "step": 439470 }, { "epoch": 0.77, "learning_rate": 1.1679984095815735e-05, "loss": 2.3356, "step": 439480 }, { "epoch": 0.77, "learning_rate": 1.1679112155888908e-05, "loss": 2.2668, "step": 439490 }, { "epoch": 0.77, "learning_rate": 1.1678240215962082e-05, "loss": 2.3318, "step": 439500 }, { "epoch": 0.77, "learning_rate": 1.1677368276035256e-05, "loss": 2.276, "step": 439510 }, { "epoch": 0.77, "learning_rate": 1.1676496336108428e-05, "loss": 2.2518, "step": 439520 }, { "epoch": 0.77, "learning_rate": 1.1675624396181602e-05, "loss": 2.3168, "step": 439530 }, { "epoch": 0.77, "learning_rate": 1.1674752456254774e-05, "loss": 2.3134, "step": 439540 }, { "epoch": 0.77, "learning_rate": 1.1673880516327948e-05, "loss": 2.3527, "step": 439550 }, { "epoch": 0.77, "learning_rate": 1.167300857640112e-05, "loss": 2.4295, "step": 439560 }, { "epoch": 0.77, "learning_rate": 1.1672136636474293e-05, "loss": 2.3475, "step": 439570 }, { "epoch": 0.77, "learning_rate": 1.1671264696547467e-05, "loss": 2.1997, "step": 439580 }, { "epoch": 0.77, "learning_rate": 1.1670392756620641e-05, "loss": 2.2278, "step": 439590 }, { "epoch": 0.77, "learning_rate": 1.1669520816693813e-05, "loss": 2.204, "step": 439600 }, { "epoch": 0.77, "learning_rate": 1.1668648876766987e-05, "loss": 2.3062, "step": 439610 }, { "epoch": 0.77, "learning_rate": 1.166777693684016e-05, "loss": 2.2507, "step": 439620 }, { "epoch": 0.77, "learning_rate": 1.1666904996913333e-05, "loss": 2.3325, "step": 439630 }, { "epoch": 0.77, "learning_rate": 1.1666033056986506e-05, "loss": 2.2483, "step": 439640 }, { "epoch": 0.77, "learning_rate": 1.166516111705968e-05, "loss": 2.3445, "step": 439650 }, { "epoch": 0.77, "learning_rate": 1.1664289177132854e-05, "loss": 2.1863, "step": 439660 }, { "epoch": 0.77, "learning_rate": 1.1663417237206026e-05, "loss": 2.283, "step": 439670 }, { "epoch": 0.77, "learning_rate": 1.16625452972792e-05, "loss": 2.2978, "step": 439680 }, { "epoch": 0.77, "learning_rate": 1.1661673357352372e-05, "loss": 2.2829, "step": 439690 }, { "epoch": 0.77, "learning_rate": 1.1660801417425546e-05, "loss": 2.3124, "step": 439700 }, { "epoch": 0.77, "learning_rate": 1.1659929477498718e-05, "loss": 2.3278, "step": 439710 }, { "epoch": 0.77, "learning_rate": 1.1659057537571892e-05, "loss": 2.2392, "step": 439720 }, { "epoch": 0.77, "learning_rate": 1.1658185597645065e-05, "loss": 2.344, "step": 439730 }, { "epoch": 0.77, "learning_rate": 1.1657313657718239e-05, "loss": 2.165, "step": 439740 }, { "epoch": 0.77, "learning_rate": 1.1656441717791411e-05, "loss": 2.3424, "step": 439750 }, { "epoch": 0.77, "learning_rate": 1.1655569777864585e-05, "loss": 2.3458, "step": 439760 }, { "epoch": 0.77, "learning_rate": 1.1654697837937759e-05, "loss": 2.3166, "step": 439770 }, { "epoch": 0.77, "learning_rate": 1.165382589801093e-05, "loss": 2.256, "step": 439780 }, { "epoch": 0.77, "learning_rate": 1.1652953958084105e-05, "loss": 2.2272, "step": 439790 }, { "epoch": 0.77, "learning_rate": 1.1652082018157277e-05, "loss": 2.322, "step": 439800 }, { "epoch": 0.77, "learning_rate": 1.165121007823045e-05, "loss": 2.2766, "step": 439810 }, { "epoch": 0.77, "learning_rate": 1.1650338138303624e-05, "loss": 2.3352, "step": 439820 }, { "epoch": 0.77, "learning_rate": 1.1649466198376798e-05, "loss": 2.4012, "step": 439830 }, { "epoch": 0.77, "learning_rate": 1.164859425844997e-05, "loss": 2.3911, "step": 439840 }, { "epoch": 0.77, "learning_rate": 1.1647722318523144e-05, "loss": 2.3384, "step": 439850 }, { "epoch": 0.77, "learning_rate": 1.1646850378596316e-05, "loss": 2.2549, "step": 439860 }, { "epoch": 0.77, "learning_rate": 1.164597843866949e-05, "loss": 2.3206, "step": 439870 }, { "epoch": 0.77, "learning_rate": 1.1645106498742662e-05, "loss": 2.353, "step": 439880 }, { "epoch": 0.77, "learning_rate": 1.1644234558815837e-05, "loss": 2.2649, "step": 439890 }, { "epoch": 0.77, "learning_rate": 1.1643362618889011e-05, "loss": 2.239, "step": 439900 }, { "epoch": 0.77, "learning_rate": 1.1642490678962183e-05, "loss": 2.1971, "step": 439910 }, { "epoch": 0.77, "learning_rate": 1.1641618739035357e-05, "loss": 2.3096, "step": 439920 }, { "epoch": 0.77, "learning_rate": 1.1640746799108529e-05, "loss": 2.3334, "step": 439930 }, { "epoch": 0.77, "learning_rate": 1.1639874859181703e-05, "loss": 2.374, "step": 439940 }, { "epoch": 0.77, "learning_rate": 1.1639002919254875e-05, "loss": 2.3248, "step": 439950 }, { "epoch": 0.77, "learning_rate": 1.1638130979328048e-05, "loss": 2.3077, "step": 439960 }, { "epoch": 0.77, "learning_rate": 1.1637259039401222e-05, "loss": 2.3445, "step": 439970 }, { "epoch": 0.77, "learning_rate": 1.1636387099474396e-05, "loss": 2.2927, "step": 439980 }, { "epoch": 0.77, "learning_rate": 1.1635515159547568e-05, "loss": 2.2255, "step": 439990 }, { "epoch": 0.77, "learning_rate": 1.1634643219620742e-05, "loss": 2.344, "step": 440000 }, { "epoch": 0.77, "learning_rate": 1.1633771279693914e-05, "loss": 2.2819, "step": 440010 }, { "epoch": 0.77, "learning_rate": 1.1632899339767088e-05, "loss": 2.2565, "step": 440020 }, { "epoch": 0.77, "learning_rate": 1.1632027399840261e-05, "loss": 2.2535, "step": 440030 }, { "epoch": 0.77, "learning_rate": 1.1631155459913434e-05, "loss": 2.3199, "step": 440040 }, { "epoch": 0.77, "learning_rate": 1.1630283519986607e-05, "loss": 2.2195, "step": 440050 }, { "epoch": 0.77, "learning_rate": 1.1629411580059781e-05, "loss": 2.2199, "step": 440060 }, { "epoch": 0.77, "learning_rate": 1.1628539640132955e-05, "loss": 2.2482, "step": 440070 }, { "epoch": 0.77, "learning_rate": 1.1627667700206127e-05, "loss": 2.2641, "step": 440080 }, { "epoch": 0.77, "learning_rate": 1.16267957602793e-05, "loss": 2.2342, "step": 440090 }, { "epoch": 0.77, "learning_rate": 1.1625923820352473e-05, "loss": 2.3322, "step": 440100 }, { "epoch": 0.77, "learning_rate": 1.1625051880425647e-05, "loss": 2.3296, "step": 440110 }, { "epoch": 0.77, "learning_rate": 1.1624179940498819e-05, "loss": 2.3057, "step": 440120 }, { "epoch": 0.77, "learning_rate": 1.1623308000571992e-05, "loss": 2.3281, "step": 440130 }, { "epoch": 0.77, "learning_rate": 1.1622436060645166e-05, "loss": 2.2251, "step": 440140 }, { "epoch": 0.77, "learning_rate": 1.162156412071834e-05, "loss": 2.138, "step": 440150 }, { "epoch": 0.77, "learning_rate": 1.1620692180791514e-05, "loss": 2.2566, "step": 440160 }, { "epoch": 0.77, "learning_rate": 1.1619820240864686e-05, "loss": 2.3324, "step": 440170 }, { "epoch": 0.77, "learning_rate": 1.161894830093786e-05, "loss": 2.3647, "step": 440180 }, { "epoch": 0.77, "learning_rate": 1.1618076361011032e-05, "loss": 2.2662, "step": 440190 }, { "epoch": 0.77, "learning_rate": 1.1617204421084205e-05, "loss": 2.3397, "step": 440200 }, { "epoch": 0.77, "learning_rate": 1.161633248115738e-05, "loss": 2.1374, "step": 440210 }, { "epoch": 0.77, "learning_rate": 1.1615460541230553e-05, "loss": 2.3566, "step": 440220 }, { "epoch": 0.77, "learning_rate": 1.1614588601303725e-05, "loss": 2.3496, "step": 440230 }, { "epoch": 0.77, "learning_rate": 1.1613716661376899e-05, "loss": 2.3534, "step": 440240 }, { "epoch": 0.77, "learning_rate": 1.1612844721450071e-05, "loss": 2.2905, "step": 440250 }, { "epoch": 0.77, "learning_rate": 1.1611972781523245e-05, "loss": 2.2326, "step": 440260 }, { "epoch": 0.77, "learning_rate": 1.1611100841596417e-05, "loss": 2.3108, "step": 440270 }, { "epoch": 0.77, "learning_rate": 1.161022890166959e-05, "loss": 2.2599, "step": 440280 }, { "epoch": 0.77, "learning_rate": 1.1609356961742764e-05, "loss": 2.3368, "step": 440290 }, { "epoch": 0.77, "learning_rate": 1.1608485021815938e-05, "loss": 2.372, "step": 440300 }, { "epoch": 0.77, "learning_rate": 1.1607613081889112e-05, "loss": 2.3474, "step": 440310 }, { "epoch": 0.77, "learning_rate": 1.1606741141962284e-05, "loss": 2.2903, "step": 440320 }, { "epoch": 0.77, "learning_rate": 1.1605869202035458e-05, "loss": 2.3847, "step": 440330 }, { "epoch": 0.77, "learning_rate": 1.160499726210863e-05, "loss": 2.3456, "step": 440340 }, { "epoch": 0.77, "learning_rate": 1.1604125322181803e-05, "loss": 2.1777, "step": 440350 }, { "epoch": 0.77, "learning_rate": 1.1603253382254976e-05, "loss": 2.3557, "step": 440360 }, { "epoch": 0.77, "learning_rate": 1.160238144232815e-05, "loss": 2.3247, "step": 440370 }, { "epoch": 0.77, "learning_rate": 1.1601509502401323e-05, "loss": 2.3388, "step": 440380 }, { "epoch": 0.77, "learning_rate": 1.1600637562474497e-05, "loss": 2.2179, "step": 440390 }, { "epoch": 0.77, "learning_rate": 1.1599765622547669e-05, "loss": 2.2306, "step": 440400 }, { "epoch": 0.77, "learning_rate": 1.1598893682620843e-05, "loss": 2.277, "step": 440410 }, { "epoch": 0.77, "learning_rate": 1.1598021742694017e-05, "loss": 2.2958, "step": 440420 }, { "epoch": 0.77, "learning_rate": 1.1597149802767189e-05, "loss": 2.2306, "step": 440430 }, { "epoch": 0.77, "learning_rate": 1.1596277862840362e-05, "loss": 2.1943, "step": 440440 }, { "epoch": 0.77, "learning_rate": 1.1595405922913536e-05, "loss": 2.3639, "step": 440450 }, { "epoch": 0.77, "learning_rate": 1.159453398298671e-05, "loss": 2.2936, "step": 440460 }, { "epoch": 0.77, "learning_rate": 1.1593662043059882e-05, "loss": 2.176, "step": 440470 }, { "epoch": 0.77, "learning_rate": 1.1592790103133056e-05, "loss": 2.1451, "step": 440480 }, { "epoch": 0.77, "learning_rate": 1.1591918163206228e-05, "loss": 2.3523, "step": 440490 }, { "epoch": 0.77, "learning_rate": 1.1591046223279402e-05, "loss": 2.3878, "step": 440500 }, { "epoch": 0.77, "learning_rate": 1.1590174283352574e-05, "loss": 2.3117, "step": 440510 }, { "epoch": 0.77, "learning_rate": 1.1589302343425747e-05, "loss": 2.4163, "step": 440520 }, { "epoch": 0.77, "learning_rate": 1.1588430403498921e-05, "loss": 2.3461, "step": 440530 }, { "epoch": 0.77, "learning_rate": 1.1587558463572095e-05, "loss": 2.2792, "step": 440540 }, { "epoch": 0.77, "learning_rate": 1.1586686523645267e-05, "loss": 2.3513, "step": 440550 }, { "epoch": 0.77, "learning_rate": 1.158581458371844e-05, "loss": 2.3076, "step": 440560 }, { "epoch": 0.77, "learning_rate": 1.1584942643791615e-05, "loss": 2.1899, "step": 440570 }, { "epoch": 0.77, "learning_rate": 1.1584070703864787e-05, "loss": 2.1465, "step": 440580 }, { "epoch": 0.77, "learning_rate": 1.158319876393796e-05, "loss": 2.2403, "step": 440590 }, { "epoch": 0.77, "learning_rate": 1.1582326824011133e-05, "loss": 2.2381, "step": 440600 }, { "epoch": 0.77, "learning_rate": 1.1581454884084306e-05, "loss": 2.2999, "step": 440610 }, { "epoch": 0.77, "learning_rate": 1.158058294415748e-05, "loss": 2.3578, "step": 440620 }, { "epoch": 0.77, "learning_rate": 1.1579711004230654e-05, "loss": 2.3703, "step": 440630 }, { "epoch": 0.77, "learning_rate": 1.1578839064303826e-05, "loss": 2.2819, "step": 440640 }, { "epoch": 0.77, "learning_rate": 1.1577967124377e-05, "loss": 2.3156, "step": 440650 }, { "epoch": 0.77, "learning_rate": 1.1577095184450172e-05, "loss": 2.3167, "step": 440660 }, { "epoch": 0.77, "learning_rate": 1.1576223244523346e-05, "loss": 2.2281, "step": 440670 }, { "epoch": 0.77, "learning_rate": 1.1575351304596518e-05, "loss": 2.2529, "step": 440680 }, { "epoch": 0.77, "learning_rate": 1.1574479364669693e-05, "loss": 2.3718, "step": 440690 }, { "epoch": 0.77, "learning_rate": 1.1573607424742867e-05, "loss": 2.3906, "step": 440700 }, { "epoch": 0.77, "learning_rate": 1.1572735484816039e-05, "loss": 2.3601, "step": 440710 }, { "epoch": 0.77, "learning_rate": 1.1571863544889213e-05, "loss": 2.2727, "step": 440720 }, { "epoch": 0.77, "learning_rate": 1.1570991604962385e-05, "loss": 2.2464, "step": 440730 }, { "epoch": 0.77, "learning_rate": 1.1570119665035559e-05, "loss": 2.2479, "step": 440740 }, { "epoch": 0.77, "learning_rate": 1.156924772510873e-05, "loss": 2.1991, "step": 440750 }, { "epoch": 0.77, "learning_rate": 1.1568375785181904e-05, "loss": 2.2424, "step": 440760 }, { "epoch": 0.77, "learning_rate": 1.1567503845255078e-05, "loss": 2.2998, "step": 440770 }, { "epoch": 0.77, "learning_rate": 1.1566631905328252e-05, "loss": 2.2732, "step": 440780 }, { "epoch": 0.77, "learning_rate": 1.1565759965401424e-05, "loss": 2.2798, "step": 440790 }, { "epoch": 0.77, "learning_rate": 1.1564888025474598e-05, "loss": 2.3549, "step": 440800 }, { "epoch": 0.77, "learning_rate": 1.156401608554777e-05, "loss": 2.385, "step": 440810 }, { "epoch": 0.77, "learning_rate": 1.1563144145620944e-05, "loss": 2.23, "step": 440820 }, { "epoch": 0.77, "learning_rate": 1.1562272205694117e-05, "loss": 2.2472, "step": 440830 }, { "epoch": 0.77, "learning_rate": 1.156140026576729e-05, "loss": 2.3045, "step": 440840 }, { "epoch": 0.77, "learning_rate": 1.1560528325840463e-05, "loss": 2.2812, "step": 440850 }, { "epoch": 0.77, "learning_rate": 1.1559656385913637e-05, "loss": 2.3309, "step": 440860 }, { "epoch": 0.77, "learning_rate": 1.155878444598681e-05, "loss": 2.3459, "step": 440870 }, { "epoch": 0.77, "learning_rate": 1.1557912506059983e-05, "loss": 2.3818, "step": 440880 }, { "epoch": 0.77, "learning_rate": 1.1557040566133157e-05, "loss": 2.3476, "step": 440890 }, { "epoch": 0.77, "learning_rate": 1.1556168626206329e-05, "loss": 2.2308, "step": 440900 }, { "epoch": 0.77, "learning_rate": 1.1555296686279502e-05, "loss": 2.2354, "step": 440910 }, { "epoch": 0.77, "learning_rate": 1.1554424746352675e-05, "loss": 2.2878, "step": 440920 }, { "epoch": 0.77, "learning_rate": 1.155355280642585e-05, "loss": 2.291, "step": 440930 }, { "epoch": 0.77, "learning_rate": 1.1552680866499022e-05, "loss": 2.2726, "step": 440940 }, { "epoch": 0.77, "learning_rate": 1.1551808926572196e-05, "loss": 2.3957, "step": 440950 }, { "epoch": 0.77, "learning_rate": 1.155093698664537e-05, "loss": 2.3692, "step": 440960 }, { "epoch": 0.77, "learning_rate": 1.1550065046718542e-05, "loss": 2.252, "step": 440970 }, { "epoch": 0.77, "learning_rate": 1.1549193106791715e-05, "loss": 2.4021, "step": 440980 }, { "epoch": 0.77, "learning_rate": 1.1548321166864888e-05, "loss": 2.2444, "step": 440990 }, { "epoch": 0.77, "learning_rate": 1.1547449226938061e-05, "loss": 2.2714, "step": 441000 }, { "epoch": 0.77, "learning_rate": 1.1546577287011235e-05, "loss": 2.2246, "step": 441010 }, { "epoch": 0.77, "learning_rate": 1.1545705347084409e-05, "loss": 2.3502, "step": 441020 }, { "epoch": 0.77, "learning_rate": 1.1544833407157581e-05, "loss": 2.3964, "step": 441030 }, { "epoch": 0.77, "learning_rate": 1.1543961467230755e-05, "loss": 2.2211, "step": 441040 }, { "epoch": 0.77, "learning_rate": 1.1543089527303927e-05, "loss": 2.3345, "step": 441050 }, { "epoch": 0.77, "learning_rate": 1.15422175873771e-05, "loss": 2.23, "step": 441060 }, { "epoch": 0.77, "learning_rate": 1.1541345647450273e-05, "loss": 2.3012, "step": 441070 }, { "epoch": 0.77, "learning_rate": 1.1540473707523446e-05, "loss": 2.3837, "step": 441080 }, { "epoch": 0.77, "learning_rate": 1.153960176759662e-05, "loss": 2.2867, "step": 441090 }, { "epoch": 0.77, "learning_rate": 1.1538729827669794e-05, "loss": 2.3403, "step": 441100 }, { "epoch": 0.77, "learning_rate": 1.1537857887742968e-05, "loss": 2.4245, "step": 441110 }, { "epoch": 0.77, "learning_rate": 1.153698594781614e-05, "loss": 2.2826, "step": 441120 }, { "epoch": 0.77, "learning_rate": 1.1536114007889314e-05, "loss": 2.1886, "step": 441130 }, { "epoch": 0.77, "learning_rate": 1.1535242067962486e-05, "loss": 2.1808, "step": 441140 }, { "epoch": 0.77, "learning_rate": 1.153437012803566e-05, "loss": 2.2924, "step": 441150 }, { "epoch": 0.77, "learning_rate": 1.1533498188108831e-05, "loss": 2.2438, "step": 441160 }, { "epoch": 0.77, "learning_rate": 1.1532626248182005e-05, "loss": 2.275, "step": 441170 }, { "epoch": 0.77, "learning_rate": 1.1531754308255179e-05, "loss": 2.333, "step": 441180 }, { "epoch": 0.77, "learning_rate": 1.1530882368328353e-05, "loss": 2.3186, "step": 441190 }, { "epoch": 0.77, "learning_rate": 1.1530010428401525e-05, "loss": 2.3236, "step": 441200 }, { "epoch": 0.77, "learning_rate": 1.1529138488474699e-05, "loss": 2.2094, "step": 441210 }, { "epoch": 0.77, "learning_rate": 1.1528266548547872e-05, "loss": 2.3318, "step": 441220 }, { "epoch": 0.77, "learning_rate": 1.1527394608621044e-05, "loss": 2.2167, "step": 441230 }, { "epoch": 0.77, "learning_rate": 1.1526522668694218e-05, "loss": 2.2774, "step": 441240 }, { "epoch": 0.77, "learning_rate": 1.1525650728767392e-05, "loss": 2.2971, "step": 441250 }, { "epoch": 0.77, "learning_rate": 1.1524778788840566e-05, "loss": 2.4035, "step": 441260 }, { "epoch": 0.77, "learning_rate": 1.1523906848913738e-05, "loss": 2.3331, "step": 441270 }, { "epoch": 0.77, "learning_rate": 1.1523034908986912e-05, "loss": 2.3294, "step": 441280 }, { "epoch": 0.77, "learning_rate": 1.1522162969060084e-05, "loss": 2.3198, "step": 441290 }, { "epoch": 0.77, "learning_rate": 1.1521291029133257e-05, "loss": 2.3225, "step": 441300 }, { "epoch": 0.77, "learning_rate": 1.152041908920643e-05, "loss": 2.1802, "step": 441310 }, { "epoch": 0.77, "learning_rate": 1.1519547149279603e-05, "loss": 2.3921, "step": 441320 }, { "epoch": 0.77, "learning_rate": 1.1518675209352777e-05, "loss": 2.3137, "step": 441330 }, { "epoch": 0.77, "learning_rate": 1.151780326942595e-05, "loss": 2.4577, "step": 441340 }, { "epoch": 0.77, "learning_rate": 1.1516931329499125e-05, "loss": 2.2941, "step": 441350 }, { "epoch": 0.77, "learning_rate": 1.1516059389572297e-05, "loss": 2.3541, "step": 441360 }, { "epoch": 0.77, "learning_rate": 1.151518744964547e-05, "loss": 2.2608, "step": 441370 }, { "epoch": 0.77, "learning_rate": 1.1514315509718643e-05, "loss": 2.2543, "step": 441380 }, { "epoch": 0.77, "learning_rate": 1.1513443569791816e-05, "loss": 2.2413, "step": 441390 }, { "epoch": 0.77, "learning_rate": 1.1512571629864988e-05, "loss": 2.2585, "step": 441400 }, { "epoch": 0.77, "learning_rate": 1.1511699689938162e-05, "loss": 2.2774, "step": 441410 }, { "epoch": 0.77, "learning_rate": 1.1510827750011336e-05, "loss": 2.3072, "step": 441420 }, { "epoch": 0.77, "learning_rate": 1.150995581008451e-05, "loss": 2.202, "step": 441430 }, { "epoch": 0.77, "learning_rate": 1.1509083870157682e-05, "loss": 2.2669, "step": 441440 }, { "epoch": 0.77, "learning_rate": 1.1508211930230856e-05, "loss": 2.2946, "step": 441450 }, { "epoch": 0.77, "learning_rate": 1.1507339990304028e-05, "loss": 2.2571, "step": 441460 }, { "epoch": 0.77, "learning_rate": 1.1506468050377201e-05, "loss": 2.2855, "step": 441470 }, { "epoch": 0.77, "learning_rate": 1.1505596110450373e-05, "loss": 2.1909, "step": 441480 }, { "epoch": 0.77, "learning_rate": 1.1504724170523549e-05, "loss": 2.1876, "step": 441490 }, { "epoch": 0.77, "learning_rate": 1.1503852230596723e-05, "loss": 2.3172, "step": 441500 }, { "epoch": 0.77, "learning_rate": 1.1502980290669895e-05, "loss": 2.2001, "step": 441510 }, { "epoch": 0.77, "learning_rate": 1.1502108350743069e-05, "loss": 2.3835, "step": 441520 }, { "epoch": 0.77, "learning_rate": 1.150123641081624e-05, "loss": 2.2911, "step": 441530 }, { "epoch": 0.77, "learning_rate": 1.1500364470889414e-05, "loss": 2.3556, "step": 441540 }, { "epoch": 0.77, "learning_rate": 1.1499492530962586e-05, "loss": 2.202, "step": 441550 }, { "epoch": 0.77, "learning_rate": 1.149862059103576e-05, "loss": 2.3068, "step": 441560 }, { "epoch": 0.77, "learning_rate": 1.1497748651108934e-05, "loss": 2.2696, "step": 441570 }, { "epoch": 0.77, "learning_rate": 1.1496876711182108e-05, "loss": 2.3124, "step": 441580 }, { "epoch": 0.77, "learning_rate": 1.149600477125528e-05, "loss": 2.3974, "step": 441590 }, { "epoch": 0.77, "learning_rate": 1.1495132831328454e-05, "loss": 2.2354, "step": 441600 }, { "epoch": 0.77, "learning_rate": 1.1494260891401626e-05, "loss": 2.3868, "step": 441610 }, { "epoch": 0.77, "learning_rate": 1.14933889514748e-05, "loss": 2.4555, "step": 441620 }, { "epoch": 0.77, "learning_rate": 1.1492517011547973e-05, "loss": 2.3575, "step": 441630 }, { "epoch": 0.77, "learning_rate": 1.1491645071621145e-05, "loss": 2.2476, "step": 441640 }, { "epoch": 0.77, "learning_rate": 1.1490773131694319e-05, "loss": 2.3353, "step": 441650 }, { "epoch": 0.77, "learning_rate": 1.1489901191767493e-05, "loss": 2.3245, "step": 441660 }, { "epoch": 0.77, "learning_rate": 1.1489029251840667e-05, "loss": 2.3207, "step": 441670 }, { "epoch": 0.77, "learning_rate": 1.1488157311913839e-05, "loss": 2.1932, "step": 441680 }, { "epoch": 0.77, "learning_rate": 1.1487285371987012e-05, "loss": 2.2192, "step": 441690 }, { "epoch": 0.77, "learning_rate": 1.1486413432060185e-05, "loss": 2.3155, "step": 441700 }, { "epoch": 0.77, "learning_rate": 1.1485541492133358e-05, "loss": 2.352, "step": 441710 }, { "epoch": 0.77, "learning_rate": 1.148466955220653e-05, "loss": 2.3711, "step": 441720 }, { "epoch": 0.77, "learning_rate": 1.1483797612279706e-05, "loss": 2.2626, "step": 441730 }, { "epoch": 0.77, "learning_rate": 1.1482925672352878e-05, "loss": 2.1487, "step": 441740 }, { "epoch": 0.77, "learning_rate": 1.1482053732426052e-05, "loss": 2.2826, "step": 441750 }, { "epoch": 0.77, "learning_rate": 1.1481181792499225e-05, "loss": 2.2136, "step": 441760 }, { "epoch": 0.77, "learning_rate": 1.1480309852572398e-05, "loss": 2.3015, "step": 441770 }, { "epoch": 0.77, "learning_rate": 1.1479437912645571e-05, "loss": 2.1912, "step": 441780 }, { "epoch": 0.77, "learning_rate": 1.1478565972718743e-05, "loss": 2.2176, "step": 441790 }, { "epoch": 0.77, "learning_rate": 1.1477694032791917e-05, "loss": 2.3106, "step": 441800 }, { "epoch": 0.77, "learning_rate": 1.1476822092865091e-05, "loss": 2.2558, "step": 441810 }, { "epoch": 0.77, "learning_rate": 1.1475950152938265e-05, "loss": 2.2964, "step": 441820 }, { "epoch": 0.77, "learning_rate": 1.1475078213011437e-05, "loss": 2.2797, "step": 441830 }, { "epoch": 0.77, "learning_rate": 1.147420627308461e-05, "loss": 2.2214, "step": 441840 }, { "epoch": 0.77, "learning_rate": 1.1473334333157783e-05, "loss": 2.4091, "step": 441850 }, { "epoch": 0.77, "learning_rate": 1.1472462393230956e-05, "loss": 2.2337, "step": 441860 }, { "epoch": 0.77, "learning_rate": 1.1471590453304128e-05, "loss": 2.3971, "step": 441870 }, { "epoch": 0.77, "learning_rate": 1.1470718513377302e-05, "loss": 2.359, "step": 441880 }, { "epoch": 0.77, "learning_rate": 1.1469846573450476e-05, "loss": 2.3386, "step": 441890 }, { "epoch": 0.77, "learning_rate": 1.146897463352365e-05, "loss": 2.3293, "step": 441900 }, { "epoch": 0.77, "learning_rate": 1.1468102693596824e-05, "loss": 2.2993, "step": 441910 }, { "epoch": 0.77, "learning_rate": 1.1467230753669996e-05, "loss": 2.2495, "step": 441920 }, { "epoch": 0.77, "learning_rate": 1.146635881374317e-05, "loss": 2.2235, "step": 441930 }, { "epoch": 0.77, "learning_rate": 1.1465486873816341e-05, "loss": 2.2756, "step": 441940 }, { "epoch": 0.77, "learning_rate": 1.1464614933889515e-05, "loss": 2.361, "step": 441950 }, { "epoch": 0.77, "learning_rate": 1.1463742993962687e-05, "loss": 2.2701, "step": 441960 }, { "epoch": 0.77, "learning_rate": 1.1462871054035863e-05, "loss": 2.3264, "step": 441970 }, { "epoch": 0.77, "learning_rate": 1.1461999114109035e-05, "loss": 2.3145, "step": 441980 }, { "epoch": 0.77, "learning_rate": 1.1461127174182209e-05, "loss": 2.2411, "step": 441990 }, { "epoch": 0.77, "learning_rate": 1.146025523425538e-05, "loss": 2.3803, "step": 442000 }, { "epoch": 0.77, "learning_rate": 1.1459383294328554e-05, "loss": 2.3105, "step": 442010 }, { "epoch": 0.77, "learning_rate": 1.1458511354401728e-05, "loss": 2.2808, "step": 442020 }, { "epoch": 0.77, "learning_rate": 1.14576394144749e-05, "loss": 2.3209, "step": 442030 }, { "epoch": 0.77, "learning_rate": 1.1456767474548074e-05, "loss": 2.2561, "step": 442040 }, { "epoch": 0.77, "learning_rate": 1.1455895534621248e-05, "loss": 2.4107, "step": 442050 }, { "epoch": 0.77, "learning_rate": 1.1455023594694422e-05, "loss": 2.215, "step": 442060 }, { "epoch": 0.77, "learning_rate": 1.1454151654767594e-05, "loss": 2.3042, "step": 442070 }, { "epoch": 0.77, "learning_rate": 1.1453279714840767e-05, "loss": 2.3641, "step": 442080 }, { "epoch": 0.77, "learning_rate": 1.145240777491394e-05, "loss": 2.2658, "step": 442090 }, { "epoch": 0.77, "learning_rate": 1.1451535834987113e-05, "loss": 2.3063, "step": 442100 }, { "epoch": 0.77, "learning_rate": 1.1450663895060285e-05, "loss": 2.2094, "step": 442110 }, { "epoch": 0.77, "learning_rate": 1.1449791955133459e-05, "loss": 2.3612, "step": 442120 }, { "epoch": 0.77, "learning_rate": 1.1448920015206633e-05, "loss": 2.2046, "step": 442130 }, { "epoch": 0.77, "learning_rate": 1.1448048075279807e-05, "loss": 2.2141, "step": 442140 }, { "epoch": 0.77, "learning_rate": 1.144717613535298e-05, "loss": 2.2333, "step": 442150 }, { "epoch": 0.77, "learning_rate": 1.1446304195426153e-05, "loss": 2.178, "step": 442160 }, { "epoch": 0.77, "learning_rate": 1.1445432255499326e-05, "loss": 2.283, "step": 442170 }, { "epoch": 0.77, "learning_rate": 1.1444560315572498e-05, "loss": 2.2878, "step": 442180 }, { "epoch": 0.77, "learning_rate": 1.1443688375645672e-05, "loss": 2.302, "step": 442190 }, { "epoch": 0.77, "learning_rate": 1.1442816435718844e-05, "loss": 2.372, "step": 442200 }, { "epoch": 0.77, "learning_rate": 1.144194449579202e-05, "loss": 2.2427, "step": 442210 }, { "epoch": 0.77, "learning_rate": 1.1441072555865192e-05, "loss": 2.2689, "step": 442220 }, { "epoch": 0.77, "learning_rate": 1.1440200615938366e-05, "loss": 2.297, "step": 442230 }, { "epoch": 0.77, "learning_rate": 1.1439328676011538e-05, "loss": 2.1606, "step": 442240 }, { "epoch": 0.77, "learning_rate": 1.1438456736084711e-05, "loss": 2.2629, "step": 442250 }, { "epoch": 0.77, "learning_rate": 1.1437584796157883e-05, "loss": 2.2376, "step": 442260 }, { "epoch": 0.77, "learning_rate": 1.1436712856231057e-05, "loss": 2.3667, "step": 442270 }, { "epoch": 0.77, "learning_rate": 1.1435840916304231e-05, "loss": 2.2862, "step": 442280 }, { "epoch": 0.77, "learning_rate": 1.1434968976377405e-05, "loss": 2.2437, "step": 442290 }, { "epoch": 0.77, "learning_rate": 1.1434097036450579e-05, "loss": 2.4049, "step": 442300 }, { "epoch": 0.77, "learning_rate": 1.143322509652375e-05, "loss": 2.1968, "step": 442310 }, { "epoch": 0.77, "learning_rate": 1.1432353156596924e-05, "loss": 2.324, "step": 442320 }, { "epoch": 0.77, "learning_rate": 1.1431481216670096e-05, "loss": 2.2881, "step": 442330 }, { "epoch": 0.77, "learning_rate": 1.143060927674327e-05, "loss": 2.2988, "step": 442340 }, { "epoch": 0.77, "learning_rate": 1.1429737336816442e-05, "loss": 2.3386, "step": 442350 }, { "epoch": 0.77, "learning_rate": 1.1428865396889616e-05, "loss": 2.2011, "step": 442360 }, { "epoch": 0.77, "learning_rate": 1.142799345696279e-05, "loss": 2.402, "step": 442370 }, { "epoch": 0.77, "learning_rate": 1.1427121517035964e-05, "loss": 2.181, "step": 442380 }, { "epoch": 0.77, "learning_rate": 1.1426249577109136e-05, "loss": 2.1969, "step": 442390 }, { "epoch": 0.77, "learning_rate": 1.142537763718231e-05, "loss": 2.3544, "step": 442400 }, { "epoch": 0.77, "learning_rate": 1.1424505697255482e-05, "loss": 2.3886, "step": 442410 }, { "epoch": 0.77, "learning_rate": 1.1423633757328655e-05, "loss": 2.3261, "step": 442420 }, { "epoch": 0.77, "learning_rate": 1.1422761817401829e-05, "loss": 2.3483, "step": 442430 }, { "epoch": 0.77, "learning_rate": 1.1421889877475001e-05, "loss": 2.3505, "step": 442440 }, { "epoch": 0.77, "learning_rate": 1.1421017937548175e-05, "loss": 2.2604, "step": 442450 }, { "epoch": 0.77, "learning_rate": 1.1420145997621349e-05, "loss": 2.3345, "step": 442460 }, { "epoch": 0.77, "learning_rate": 1.1419274057694522e-05, "loss": 2.3471, "step": 442470 }, { "epoch": 0.77, "learning_rate": 1.1418402117767695e-05, "loss": 2.3064, "step": 442480 }, { "epoch": 0.77, "learning_rate": 1.1417530177840868e-05, "loss": 2.3729, "step": 442490 }, { "epoch": 0.77, "learning_rate": 1.141665823791404e-05, "loss": 2.3103, "step": 442500 }, { "epoch": 0.77, "learning_rate": 1.1415786297987214e-05, "loss": 2.1957, "step": 442510 }, { "epoch": 0.77, "learning_rate": 1.1414914358060388e-05, "loss": 2.3828, "step": 442520 }, { "epoch": 0.77, "learning_rate": 1.1414042418133562e-05, "loss": 2.3158, "step": 442530 }, { "epoch": 0.77, "learning_rate": 1.1413170478206734e-05, "loss": 2.3615, "step": 442540 }, { "epoch": 0.77, "learning_rate": 1.1412298538279908e-05, "loss": 2.3379, "step": 442550 }, { "epoch": 0.77, "learning_rate": 1.1411426598353081e-05, "loss": 2.2441, "step": 442560 }, { "epoch": 0.77, "learning_rate": 1.1410554658426253e-05, "loss": 2.2827, "step": 442570 }, { "epoch": 0.77, "learning_rate": 1.1409682718499427e-05, "loss": 2.2765, "step": 442580 }, { "epoch": 0.77, "learning_rate": 1.14088107785726e-05, "loss": 2.3964, "step": 442590 }, { "epoch": 0.77, "learning_rate": 1.1407938838645773e-05, "loss": 2.3709, "step": 442600 }, { "epoch": 0.77, "learning_rate": 1.1407066898718947e-05, "loss": 2.2688, "step": 442610 }, { "epoch": 0.77, "learning_rate": 1.140619495879212e-05, "loss": 2.3644, "step": 442620 }, { "epoch": 0.77, "learning_rate": 1.1405323018865293e-05, "loss": 2.3784, "step": 442630 }, { "epoch": 0.77, "learning_rate": 1.1404451078938466e-05, "loss": 2.3041, "step": 442640 }, { "epoch": 0.77, "learning_rate": 1.1403579139011638e-05, "loss": 2.3006, "step": 442650 }, { "epoch": 0.77, "learning_rate": 1.1402707199084812e-05, "loss": 2.3316, "step": 442660 }, { "epoch": 0.77, "learning_rate": 1.1401835259157984e-05, "loss": 2.2732, "step": 442670 }, { "epoch": 0.77, "learning_rate": 1.1400963319231158e-05, "loss": 2.2693, "step": 442680 }, { "epoch": 0.77, "learning_rate": 1.1400091379304332e-05, "loss": 2.3554, "step": 442690 }, { "epoch": 0.77, "learning_rate": 1.1399219439377506e-05, "loss": 2.3022, "step": 442700 }, { "epoch": 0.77, "learning_rate": 1.139834749945068e-05, "loss": 2.2779, "step": 442710 }, { "epoch": 0.77, "learning_rate": 1.1397475559523851e-05, "loss": 2.1976, "step": 442720 }, { "epoch": 0.77, "learning_rate": 1.1396603619597025e-05, "loss": 2.2241, "step": 442730 }, { "epoch": 0.77, "learning_rate": 1.1395731679670197e-05, "loss": 2.1747, "step": 442740 }, { "epoch": 0.77, "learning_rate": 1.1394859739743371e-05, "loss": 2.2242, "step": 442750 }, { "epoch": 0.77, "learning_rate": 1.1393987799816543e-05, "loss": 2.2127, "step": 442760 }, { "epoch": 0.77, "learning_rate": 1.1393115859889719e-05, "loss": 2.25, "step": 442770 }, { "epoch": 0.77, "learning_rate": 1.139224391996289e-05, "loss": 2.304, "step": 442780 }, { "epoch": 0.77, "learning_rate": 1.1391371980036064e-05, "loss": 2.3174, "step": 442790 }, { "epoch": 0.77, "learning_rate": 1.1390500040109237e-05, "loss": 2.3089, "step": 442800 }, { "epoch": 0.77, "learning_rate": 1.138962810018241e-05, "loss": 2.2301, "step": 442810 }, { "epoch": 0.77, "learning_rate": 1.1388756160255584e-05, "loss": 2.1689, "step": 442820 }, { "epoch": 0.77, "learning_rate": 1.1387884220328756e-05, "loss": 2.1705, "step": 442830 }, { "epoch": 0.77, "learning_rate": 1.138701228040193e-05, "loss": 2.3199, "step": 442840 }, { "epoch": 0.77, "learning_rate": 1.1386140340475104e-05, "loss": 2.2517, "step": 442850 }, { "epoch": 0.77, "learning_rate": 1.1385268400548277e-05, "loss": 2.2468, "step": 442860 }, { "epoch": 0.77, "learning_rate": 1.138439646062145e-05, "loss": 2.1731, "step": 442870 }, { "epoch": 0.77, "learning_rate": 1.1383524520694623e-05, "loss": 2.3136, "step": 442880 }, { "epoch": 0.77, "learning_rate": 1.1382652580767795e-05, "loss": 2.36, "step": 442890 }, { "epoch": 0.77, "learning_rate": 1.1381780640840969e-05, "loss": 2.2493, "step": 442900 }, { "epoch": 0.77, "learning_rate": 1.1380908700914141e-05, "loss": 2.2718, "step": 442910 }, { "epoch": 0.77, "learning_rate": 1.1380036760987315e-05, "loss": 2.3636, "step": 442920 }, { "epoch": 0.77, "learning_rate": 1.1379164821060489e-05, "loss": 2.2011, "step": 442930 }, { "epoch": 0.77, "learning_rate": 1.1378292881133663e-05, "loss": 2.2611, "step": 442940 }, { "epoch": 0.77, "learning_rate": 1.1377420941206836e-05, "loss": 2.2703, "step": 442950 }, { "epoch": 0.77, "learning_rate": 1.1376549001280008e-05, "loss": 2.2762, "step": 442960 }, { "epoch": 0.77, "learning_rate": 1.1375677061353182e-05, "loss": 2.2718, "step": 442970 }, { "epoch": 0.77, "learning_rate": 1.1374805121426354e-05, "loss": 2.2008, "step": 442980 }, { "epoch": 0.77, "learning_rate": 1.1373933181499528e-05, "loss": 2.2625, "step": 442990 }, { "epoch": 0.77, "learning_rate": 1.13730612415727e-05, "loss": 2.2905, "step": 443000 }, { "epoch": 0.77, "learning_rate": 1.1372189301645876e-05, "loss": 2.2955, "step": 443010 }, { "epoch": 0.77, "learning_rate": 1.1371317361719048e-05, "loss": 2.4221, "step": 443020 }, { "epoch": 0.77, "learning_rate": 1.1370445421792221e-05, "loss": 2.2002, "step": 443030 }, { "epoch": 0.77, "learning_rate": 1.1369573481865393e-05, "loss": 2.2964, "step": 443040 }, { "epoch": 0.77, "learning_rate": 1.1368701541938567e-05, "loss": 2.2398, "step": 443050 }, { "epoch": 0.77, "learning_rate": 1.136782960201174e-05, "loss": 2.3681, "step": 443060 }, { "epoch": 0.77, "learning_rate": 1.1366957662084913e-05, "loss": 2.3536, "step": 443070 }, { "epoch": 0.77, "learning_rate": 1.1366085722158087e-05, "loss": 2.3502, "step": 443080 }, { "epoch": 0.77, "learning_rate": 1.136521378223126e-05, "loss": 2.2787, "step": 443090 }, { "epoch": 0.77, "learning_rate": 1.1364341842304434e-05, "loss": 2.1749, "step": 443100 }, { "epoch": 0.77, "learning_rate": 1.1363469902377606e-05, "loss": 2.2683, "step": 443110 }, { "epoch": 0.77, "learning_rate": 1.136259796245078e-05, "loss": 2.3503, "step": 443120 }, { "epoch": 0.77, "learning_rate": 1.1361726022523952e-05, "loss": 2.2559, "step": 443130 }, { "epoch": 0.77, "learning_rate": 1.1360854082597126e-05, "loss": 2.3696, "step": 443140 }, { "epoch": 0.77, "learning_rate": 1.1359982142670298e-05, "loss": 2.3032, "step": 443150 }, { "epoch": 0.77, "learning_rate": 1.1359110202743472e-05, "loss": 2.331, "step": 443160 }, { "epoch": 0.77, "learning_rate": 1.1358238262816646e-05, "loss": 2.1705, "step": 443170 }, { "epoch": 0.77, "learning_rate": 1.135736632288982e-05, "loss": 2.3288, "step": 443180 }, { "epoch": 0.77, "learning_rate": 1.1356494382962992e-05, "loss": 2.3141, "step": 443190 }, { "epoch": 0.77, "learning_rate": 1.1355622443036165e-05, "loss": 2.2466, "step": 443200 }, { "epoch": 0.77, "learning_rate": 1.1354750503109337e-05, "loss": 2.3888, "step": 443210 }, { "epoch": 0.77, "learning_rate": 1.1353878563182511e-05, "loss": 2.3667, "step": 443220 }, { "epoch": 0.77, "learning_rate": 1.1353006623255685e-05, "loss": 2.2648, "step": 443230 }, { "epoch": 0.77, "learning_rate": 1.1352134683328857e-05, "loss": 2.2556, "step": 443240 }, { "epoch": 0.77, "learning_rate": 1.1351262743402032e-05, "loss": 2.3124, "step": 443250 }, { "epoch": 0.77, "learning_rate": 1.1350390803475205e-05, "loss": 2.2525, "step": 443260 }, { "epoch": 0.77, "learning_rate": 1.1349518863548378e-05, "loss": 2.1357, "step": 443270 }, { "epoch": 0.77, "learning_rate": 1.134864692362155e-05, "loss": 2.3506, "step": 443280 }, { "epoch": 0.77, "learning_rate": 1.1347774983694724e-05, "loss": 2.2727, "step": 443290 }, { "epoch": 0.77, "learning_rate": 1.1346903043767896e-05, "loss": 2.3041, "step": 443300 }, { "epoch": 0.77, "learning_rate": 1.134603110384107e-05, "loss": 2.2606, "step": 443310 }, { "epoch": 0.77, "learning_rate": 1.1345159163914244e-05, "loss": 2.2527, "step": 443320 }, { "epoch": 0.77, "learning_rate": 1.1344287223987418e-05, "loss": 2.2761, "step": 443330 }, { "epoch": 0.77, "learning_rate": 1.134341528406059e-05, "loss": 2.207, "step": 443340 }, { "epoch": 0.77, "learning_rate": 1.1342543344133763e-05, "loss": 2.2462, "step": 443350 }, { "epoch": 0.77, "learning_rate": 1.1341671404206937e-05, "loss": 2.2754, "step": 443360 }, { "epoch": 0.77, "learning_rate": 1.134079946428011e-05, "loss": 2.2876, "step": 443370 }, { "epoch": 0.77, "learning_rate": 1.1339927524353283e-05, "loss": 2.2097, "step": 443380 }, { "epoch": 0.77, "learning_rate": 1.1339055584426455e-05, "loss": 2.2854, "step": 443390 }, { "epoch": 0.77, "learning_rate": 1.1338183644499629e-05, "loss": 2.3233, "step": 443400 }, { "epoch": 0.77, "learning_rate": 1.1337311704572803e-05, "loss": 2.2621, "step": 443410 }, { "epoch": 0.77, "learning_rate": 1.1336439764645976e-05, "loss": 2.2674, "step": 443420 }, { "epoch": 0.77, "learning_rate": 1.1335567824719148e-05, "loss": 2.2612, "step": 443430 }, { "epoch": 0.77, "learning_rate": 1.1334695884792322e-05, "loss": 2.3003, "step": 443440 }, { "epoch": 0.77, "learning_rate": 1.1333823944865494e-05, "loss": 2.3331, "step": 443450 }, { "epoch": 0.77, "learning_rate": 1.1332952004938668e-05, "loss": 2.3157, "step": 443460 }, { "epoch": 0.77, "learning_rate": 1.133208006501184e-05, "loss": 2.3107, "step": 443470 }, { "epoch": 0.77, "learning_rate": 1.1331208125085014e-05, "loss": 2.2727, "step": 443480 }, { "epoch": 0.77, "learning_rate": 1.1330336185158188e-05, "loss": 2.1937, "step": 443490 }, { "epoch": 0.77, "learning_rate": 1.1329464245231361e-05, "loss": 2.2603, "step": 443500 }, { "epoch": 0.77, "learning_rate": 1.1328592305304535e-05, "loss": 2.3079, "step": 443510 }, { "epoch": 0.77, "learning_rate": 1.1327720365377707e-05, "loss": 2.2434, "step": 443520 }, { "epoch": 0.77, "learning_rate": 1.1326848425450881e-05, "loss": 2.4682, "step": 443530 }, { "epoch": 0.77, "learning_rate": 1.1325976485524053e-05, "loss": 2.3533, "step": 443540 }, { "epoch": 0.77, "learning_rate": 1.1325104545597227e-05, "loss": 2.3551, "step": 443550 }, { "epoch": 0.77, "learning_rate": 1.13242326056704e-05, "loss": 2.2796, "step": 443560 }, { "epoch": 0.77, "learning_rate": 1.1323360665743574e-05, "loss": 2.3481, "step": 443570 }, { "epoch": 0.77, "learning_rate": 1.1322488725816747e-05, "loss": 2.3078, "step": 443580 }, { "epoch": 0.77, "learning_rate": 1.132161678588992e-05, "loss": 2.3236, "step": 443590 }, { "epoch": 0.77, "learning_rate": 1.1320744845963092e-05, "loss": 2.2767, "step": 443600 }, { "epoch": 0.77, "learning_rate": 1.1319872906036266e-05, "loss": 2.2666, "step": 443610 }, { "epoch": 0.77, "learning_rate": 1.131900096610944e-05, "loss": 2.1927, "step": 443620 }, { "epoch": 0.77, "learning_rate": 1.1318129026182612e-05, "loss": 2.4212, "step": 443630 }, { "epoch": 0.77, "learning_rate": 1.1317257086255786e-05, "loss": 2.2373, "step": 443640 }, { "epoch": 0.77, "learning_rate": 1.131638514632896e-05, "loss": 2.3863, "step": 443650 }, { "epoch": 0.77, "learning_rate": 1.1315513206402133e-05, "loss": 2.3001, "step": 443660 }, { "epoch": 0.77, "learning_rate": 1.1314641266475305e-05, "loss": 2.4255, "step": 443670 }, { "epoch": 0.77, "learning_rate": 1.1313769326548479e-05, "loss": 2.2708, "step": 443680 }, { "epoch": 0.77, "learning_rate": 1.1312897386621651e-05, "loss": 2.3324, "step": 443690 }, { "epoch": 0.77, "learning_rate": 1.1312025446694825e-05, "loss": 2.264, "step": 443700 }, { "epoch": 0.77, "learning_rate": 1.1311153506767997e-05, "loss": 2.3868, "step": 443710 }, { "epoch": 0.77, "learning_rate": 1.131028156684117e-05, "loss": 2.3644, "step": 443720 }, { "epoch": 0.77, "learning_rate": 1.1309409626914345e-05, "loss": 2.274, "step": 443730 }, { "epoch": 0.77, "learning_rate": 1.1308537686987518e-05, "loss": 2.3552, "step": 443740 }, { "epoch": 0.77, "learning_rate": 1.1307665747060692e-05, "loss": 2.3022, "step": 443750 }, { "epoch": 0.77, "learning_rate": 1.1306793807133864e-05, "loss": 2.2444, "step": 443760 }, { "epoch": 0.77, "learning_rate": 1.1305921867207038e-05, "loss": 2.2508, "step": 443770 }, { "epoch": 0.77, "learning_rate": 1.130504992728021e-05, "loss": 2.321, "step": 443780 }, { "epoch": 0.77, "learning_rate": 1.1304177987353384e-05, "loss": 2.3016, "step": 443790 }, { "epoch": 0.77, "learning_rate": 1.1303306047426556e-05, "loss": 2.3187, "step": 443800 }, { "epoch": 0.77, "learning_rate": 1.1302434107499731e-05, "loss": 2.0915, "step": 443810 }, { "epoch": 0.77, "learning_rate": 1.1301562167572903e-05, "loss": 2.2583, "step": 443820 }, { "epoch": 0.77, "learning_rate": 1.1300690227646077e-05, "loss": 2.099, "step": 443830 }, { "epoch": 0.77, "learning_rate": 1.129981828771925e-05, "loss": 2.2144, "step": 443840 }, { "epoch": 0.77, "learning_rate": 1.1298946347792423e-05, "loss": 2.2657, "step": 443850 }, { "epoch": 0.77, "learning_rate": 1.1298074407865595e-05, "loss": 2.2708, "step": 443860 }, { "epoch": 0.77, "learning_rate": 1.1297202467938769e-05, "loss": 2.2895, "step": 443870 }, { "epoch": 0.77, "learning_rate": 1.1296330528011943e-05, "loss": 2.2475, "step": 443880 }, { "epoch": 0.77, "learning_rate": 1.1295458588085116e-05, "loss": 2.362, "step": 443890 }, { "epoch": 0.77, "learning_rate": 1.129458664815829e-05, "loss": 2.2924, "step": 443900 }, { "epoch": 0.77, "learning_rate": 1.1293714708231462e-05, "loss": 2.2876, "step": 443910 }, { "epoch": 0.77, "learning_rate": 1.1292842768304636e-05, "loss": 2.2846, "step": 443920 }, { "epoch": 0.77, "learning_rate": 1.1291970828377808e-05, "loss": 2.281, "step": 443930 }, { "epoch": 0.77, "learning_rate": 1.1291098888450982e-05, "loss": 2.2607, "step": 443940 }, { "epoch": 0.77, "learning_rate": 1.1290226948524154e-05, "loss": 2.2328, "step": 443950 }, { "epoch": 0.77, "learning_rate": 1.1289355008597328e-05, "loss": 2.3527, "step": 443960 }, { "epoch": 0.77, "learning_rate": 1.1288483068670502e-05, "loss": 2.2653, "step": 443970 }, { "epoch": 0.77, "learning_rate": 1.1287611128743675e-05, "loss": 2.2704, "step": 443980 }, { "epoch": 0.77, "learning_rate": 1.1286739188816847e-05, "loss": 2.2154, "step": 443990 }, { "epoch": 0.77, "learning_rate": 1.1285867248890021e-05, "loss": 2.4098, "step": 444000 }, { "epoch": 0.77, "learning_rate": 1.1284995308963195e-05, "loss": 2.1601, "step": 444010 }, { "epoch": 0.77, "learning_rate": 1.1284123369036367e-05, "loss": 2.2257, "step": 444020 }, { "epoch": 0.77, "learning_rate": 1.128325142910954e-05, "loss": 2.3907, "step": 444030 }, { "epoch": 0.77, "learning_rate": 1.1282379489182713e-05, "loss": 2.3331, "step": 444040 }, { "epoch": 0.77, "learning_rate": 1.1281507549255888e-05, "loss": 2.2241, "step": 444050 }, { "epoch": 0.77, "learning_rate": 1.128063560932906e-05, "loss": 2.2878, "step": 444060 }, { "epoch": 0.77, "learning_rate": 1.1279763669402234e-05, "loss": 2.1922, "step": 444070 }, { "epoch": 0.77, "learning_rate": 1.1278891729475406e-05, "loss": 2.1935, "step": 444080 }, { "epoch": 0.77, "learning_rate": 1.127801978954858e-05, "loss": 2.257, "step": 444090 }, { "epoch": 0.77, "learning_rate": 1.1277147849621752e-05, "loss": 2.2388, "step": 444100 }, { "epoch": 0.77, "learning_rate": 1.1276275909694926e-05, "loss": 2.3457, "step": 444110 }, { "epoch": 0.77, "learning_rate": 1.12754039697681e-05, "loss": 2.3185, "step": 444120 }, { "epoch": 0.77, "learning_rate": 1.1274532029841273e-05, "loss": 2.2908, "step": 444130 }, { "epoch": 0.77, "learning_rate": 1.1273660089914445e-05, "loss": 2.3729, "step": 444140 }, { "epoch": 0.77, "learning_rate": 1.127278814998762e-05, "loss": 2.295, "step": 444150 }, { "epoch": 0.77, "learning_rate": 1.1271916210060793e-05, "loss": 2.3062, "step": 444160 }, { "epoch": 0.77, "learning_rate": 1.1271044270133965e-05, "loss": 2.3516, "step": 444170 }, { "epoch": 0.77, "learning_rate": 1.1270172330207139e-05, "loss": 2.1769, "step": 444180 }, { "epoch": 0.77, "learning_rate": 1.1269300390280311e-05, "loss": 2.2359, "step": 444190 }, { "epoch": 0.77, "learning_rate": 1.1268428450353485e-05, "loss": 2.3965, "step": 444200 }, { "epoch": 0.77, "learning_rate": 1.1267556510426658e-05, "loss": 2.2488, "step": 444210 }, { "epoch": 0.77, "learning_rate": 1.1266684570499832e-05, "loss": 2.2517, "step": 444220 }, { "epoch": 0.77, "learning_rate": 1.1265812630573004e-05, "loss": 2.1965, "step": 444230 }, { "epoch": 0.77, "learning_rate": 1.1264940690646178e-05, "loss": 2.2403, "step": 444240 }, { "epoch": 0.77, "learning_rate": 1.126406875071935e-05, "loss": 2.2833, "step": 444250 }, { "epoch": 0.77, "learning_rate": 1.1263196810792524e-05, "loss": 2.2581, "step": 444260 }, { "epoch": 0.77, "learning_rate": 1.1262324870865696e-05, "loss": 2.291, "step": 444270 }, { "epoch": 0.77, "learning_rate": 1.126145293093887e-05, "loss": 2.2796, "step": 444280 }, { "epoch": 0.77, "learning_rate": 1.1260580991012045e-05, "loss": 2.2586, "step": 444290 }, { "epoch": 0.77, "learning_rate": 1.1259709051085217e-05, "loss": 2.325, "step": 444300 }, { "epoch": 0.77, "learning_rate": 1.1258837111158391e-05, "loss": 2.3854, "step": 444310 }, { "epoch": 0.77, "learning_rate": 1.1257965171231563e-05, "loss": 2.5011, "step": 444320 }, { "epoch": 0.77, "learning_rate": 1.1257093231304737e-05, "loss": 2.2575, "step": 444330 }, { "epoch": 0.77, "learning_rate": 1.1256221291377909e-05, "loss": 2.1858, "step": 444340 }, { "epoch": 0.77, "learning_rate": 1.1255349351451083e-05, "loss": 2.329, "step": 444350 }, { "epoch": 0.77, "learning_rate": 1.1254477411524257e-05, "loss": 2.3247, "step": 444360 }, { "epoch": 0.77, "learning_rate": 1.125360547159743e-05, "loss": 2.1808, "step": 444370 }, { "epoch": 0.77, "learning_rate": 1.1252733531670602e-05, "loss": 2.2999, "step": 444380 }, { "epoch": 0.77, "learning_rate": 1.1251861591743776e-05, "loss": 2.3184, "step": 444390 }, { "epoch": 0.77, "learning_rate": 1.1250989651816948e-05, "loss": 2.0871, "step": 444400 }, { "epoch": 0.77, "learning_rate": 1.1250117711890122e-05, "loss": 2.3079, "step": 444410 }, { "epoch": 0.78, "learning_rate": 1.1249245771963296e-05, "loss": 2.218, "step": 444420 }, { "epoch": 0.78, "learning_rate": 1.1248373832036468e-05, "loss": 2.2505, "step": 444430 }, { "epoch": 0.78, "learning_rate": 1.1247501892109642e-05, "loss": 2.2965, "step": 444440 }, { "epoch": 0.78, "learning_rate": 1.1246629952182815e-05, "loss": 2.2786, "step": 444450 }, { "epoch": 0.78, "learning_rate": 1.1245758012255989e-05, "loss": 2.2333, "step": 444460 }, { "epoch": 0.78, "learning_rate": 1.1244886072329161e-05, "loss": 2.2494, "step": 444470 }, { "epoch": 0.78, "learning_rate": 1.1244014132402335e-05, "loss": 2.3123, "step": 444480 }, { "epoch": 0.78, "learning_rate": 1.1243142192475507e-05, "loss": 2.1919, "step": 444490 }, { "epoch": 0.78, "learning_rate": 1.124227025254868e-05, "loss": 2.3422, "step": 444500 }, { "epoch": 0.78, "learning_rate": 1.1241398312621853e-05, "loss": 2.1733, "step": 444510 }, { "epoch": 0.78, "learning_rate": 1.1240526372695027e-05, "loss": 2.2518, "step": 444520 }, { "epoch": 0.78, "learning_rate": 1.12396544327682e-05, "loss": 2.3716, "step": 444530 }, { "epoch": 0.78, "learning_rate": 1.1238782492841374e-05, "loss": 2.2074, "step": 444540 }, { "epoch": 0.78, "learning_rate": 1.1237910552914548e-05, "loss": 2.2585, "step": 444550 }, { "epoch": 0.78, "learning_rate": 1.123703861298772e-05, "loss": 2.3049, "step": 444560 }, { "epoch": 0.78, "learning_rate": 1.1236166673060894e-05, "loss": 2.2581, "step": 444570 }, { "epoch": 0.78, "learning_rate": 1.1235294733134066e-05, "loss": 2.379, "step": 444580 }, { "epoch": 0.78, "learning_rate": 1.123442279320724e-05, "loss": 2.3974, "step": 444590 }, { "epoch": 0.78, "learning_rate": 1.1233550853280413e-05, "loss": 2.3748, "step": 444600 }, { "epoch": 0.78, "learning_rate": 1.1232678913353587e-05, "loss": 2.4447, "step": 444610 }, { "epoch": 0.78, "learning_rate": 1.123180697342676e-05, "loss": 2.4431, "step": 444620 }, { "epoch": 0.78, "learning_rate": 1.1230935033499933e-05, "loss": 2.4242, "step": 444630 }, { "epoch": 0.78, "learning_rate": 1.1230063093573105e-05, "loss": 2.2831, "step": 444640 }, { "epoch": 0.78, "learning_rate": 1.1229191153646279e-05, "loss": 2.2753, "step": 444650 }, { "epoch": 0.78, "learning_rate": 1.1228319213719451e-05, "loss": 2.2655, "step": 444660 }, { "epoch": 0.78, "learning_rate": 1.1227447273792625e-05, "loss": 2.2909, "step": 444670 }, { "epoch": 0.78, "learning_rate": 1.1226575333865799e-05, "loss": 2.2935, "step": 444680 }, { "epoch": 0.78, "learning_rate": 1.1225703393938972e-05, "loss": 2.2303, "step": 444690 }, { "epoch": 0.78, "learning_rate": 1.1224831454012146e-05, "loss": 2.2456, "step": 444700 }, { "epoch": 0.78, "learning_rate": 1.1223959514085318e-05, "loss": 2.2644, "step": 444710 }, { "epoch": 0.78, "learning_rate": 1.1223087574158492e-05, "loss": 2.2878, "step": 444720 }, { "epoch": 0.78, "learning_rate": 1.1222215634231664e-05, "loss": 2.3468, "step": 444730 }, { "epoch": 0.78, "learning_rate": 1.1221343694304838e-05, "loss": 2.3988, "step": 444740 }, { "epoch": 0.78, "learning_rate": 1.122047175437801e-05, "loss": 2.2817, "step": 444750 }, { "epoch": 0.78, "learning_rate": 1.1219599814451184e-05, "loss": 2.2633, "step": 444760 }, { "epoch": 0.78, "learning_rate": 1.1218727874524357e-05, "loss": 2.3469, "step": 444770 }, { "epoch": 0.78, "learning_rate": 1.1217855934597531e-05, "loss": 2.2329, "step": 444780 }, { "epoch": 0.78, "learning_rate": 1.1216983994670703e-05, "loss": 2.311, "step": 444790 }, { "epoch": 0.78, "learning_rate": 1.1216112054743877e-05, "loss": 2.2568, "step": 444800 }, { "epoch": 0.78, "learning_rate": 1.121524011481705e-05, "loss": 2.2154, "step": 444810 }, { "epoch": 0.78, "learning_rate": 1.1214368174890223e-05, "loss": 2.2415, "step": 444820 }, { "epoch": 0.78, "learning_rate": 1.1213496234963397e-05, "loss": 2.3039, "step": 444830 }, { "epoch": 0.78, "learning_rate": 1.1212624295036569e-05, "loss": 2.3384, "step": 444840 }, { "epoch": 0.78, "learning_rate": 1.1211752355109744e-05, "loss": 2.3308, "step": 444850 }, { "epoch": 0.78, "learning_rate": 1.1210880415182916e-05, "loss": 2.3205, "step": 444860 }, { "epoch": 0.78, "learning_rate": 1.121000847525609e-05, "loss": 2.2237, "step": 444870 }, { "epoch": 0.78, "learning_rate": 1.1209136535329262e-05, "loss": 2.2971, "step": 444880 }, { "epoch": 0.78, "learning_rate": 1.1208264595402436e-05, "loss": 2.3601, "step": 444890 }, { "epoch": 0.78, "learning_rate": 1.1207392655475608e-05, "loss": 2.2509, "step": 444900 }, { "epoch": 0.78, "learning_rate": 1.1206520715548782e-05, "loss": 2.2498, "step": 444910 }, { "epoch": 0.78, "learning_rate": 1.1205648775621955e-05, "loss": 2.2865, "step": 444920 }, { "epoch": 0.78, "learning_rate": 1.120477683569513e-05, "loss": 2.3177, "step": 444930 }, { "epoch": 0.78, "learning_rate": 1.1203904895768301e-05, "loss": 2.322, "step": 444940 }, { "epoch": 0.78, "learning_rate": 1.1203032955841475e-05, "loss": 2.3145, "step": 444950 }, { "epoch": 0.78, "learning_rate": 1.1202161015914649e-05, "loss": 2.0987, "step": 444960 }, { "epoch": 0.78, "learning_rate": 1.1201289075987821e-05, "loss": 2.2856, "step": 444970 }, { "epoch": 0.78, "learning_rate": 1.1200417136060995e-05, "loss": 2.237, "step": 444980 }, { "epoch": 0.78, "learning_rate": 1.1199545196134167e-05, "loss": 2.2878, "step": 444990 }, { "epoch": 0.78, "learning_rate": 1.119867325620734e-05, "loss": 2.323, "step": 445000 }, { "epoch": 0.78, "learning_rate": 1.1197801316280514e-05, "loss": 2.4189, "step": 445010 }, { "epoch": 0.78, "learning_rate": 1.1196929376353688e-05, "loss": 2.3263, "step": 445020 }, { "epoch": 0.78, "learning_rate": 1.119605743642686e-05, "loss": 2.2098, "step": 445030 }, { "epoch": 0.78, "learning_rate": 1.1195185496500034e-05, "loss": 2.2601, "step": 445040 }, { "epoch": 0.78, "learning_rate": 1.1194313556573206e-05, "loss": 2.2623, "step": 445050 }, { "epoch": 0.78, "learning_rate": 1.119344161664638e-05, "loss": 2.2819, "step": 445060 }, { "epoch": 0.78, "learning_rate": 1.1192569676719552e-05, "loss": 2.3501, "step": 445070 }, { "epoch": 0.78, "learning_rate": 1.1191697736792726e-05, "loss": 2.2116, "step": 445080 }, { "epoch": 0.78, "learning_rate": 1.1190825796865901e-05, "loss": 2.403, "step": 445090 }, { "epoch": 0.78, "learning_rate": 1.1189953856939073e-05, "loss": 2.2098, "step": 445100 }, { "epoch": 0.78, "learning_rate": 1.1189081917012247e-05, "loss": 2.1387, "step": 445110 }, { "epoch": 0.78, "learning_rate": 1.1188209977085419e-05, "loss": 2.2139, "step": 445120 }, { "epoch": 0.78, "learning_rate": 1.1187338037158593e-05, "loss": 2.2802, "step": 445130 }, { "epoch": 0.78, "learning_rate": 1.1186466097231765e-05, "loss": 2.3202, "step": 445140 }, { "epoch": 0.78, "learning_rate": 1.1185594157304939e-05, "loss": 2.2726, "step": 445150 }, { "epoch": 0.78, "learning_rate": 1.1184722217378112e-05, "loss": 2.2588, "step": 445160 }, { "epoch": 0.78, "learning_rate": 1.1183850277451286e-05, "loss": 2.3647, "step": 445170 }, { "epoch": 0.78, "learning_rate": 1.1182978337524458e-05, "loss": 2.4024, "step": 445180 }, { "epoch": 0.78, "learning_rate": 1.1182106397597632e-05, "loss": 2.1812, "step": 445190 }, { "epoch": 0.78, "learning_rate": 1.1181234457670804e-05, "loss": 2.4287, "step": 445200 }, { "epoch": 0.78, "learning_rate": 1.1180362517743978e-05, "loss": 2.2527, "step": 445210 }, { "epoch": 0.78, "learning_rate": 1.1179490577817152e-05, "loss": 2.2525, "step": 445220 }, { "epoch": 0.78, "learning_rate": 1.1178618637890324e-05, "loss": 2.345, "step": 445230 }, { "epoch": 0.78, "learning_rate": 1.1177746697963497e-05, "loss": 2.3535, "step": 445240 }, { "epoch": 0.78, "learning_rate": 1.1176874758036671e-05, "loss": 2.2037, "step": 445250 }, { "epoch": 0.78, "learning_rate": 1.1176002818109845e-05, "loss": 2.2121, "step": 445260 }, { "epoch": 0.78, "learning_rate": 1.1175130878183017e-05, "loss": 2.2654, "step": 445270 }, { "epoch": 0.78, "learning_rate": 1.1174258938256191e-05, "loss": 2.2105, "step": 445280 }, { "epoch": 0.78, "learning_rate": 1.1173386998329363e-05, "loss": 2.2731, "step": 445290 }, { "epoch": 0.78, "learning_rate": 1.1172515058402537e-05, "loss": 2.3115, "step": 445300 }, { "epoch": 0.78, "learning_rate": 1.1171643118475709e-05, "loss": 2.2629, "step": 445310 }, { "epoch": 0.78, "learning_rate": 1.1170771178548883e-05, "loss": 2.2872, "step": 445320 }, { "epoch": 0.78, "learning_rate": 1.1169899238622056e-05, "loss": 2.3385, "step": 445330 }, { "epoch": 0.78, "learning_rate": 1.116902729869523e-05, "loss": 2.1549, "step": 445340 }, { "epoch": 0.78, "learning_rate": 1.1168155358768404e-05, "loss": 2.2786, "step": 445350 }, { "epoch": 0.78, "learning_rate": 1.1167283418841576e-05, "loss": 2.3616, "step": 445360 }, { "epoch": 0.78, "learning_rate": 1.116641147891475e-05, "loss": 2.3212, "step": 445370 }, { "epoch": 0.78, "learning_rate": 1.1165539538987922e-05, "loss": 2.2334, "step": 445380 }, { "epoch": 0.78, "learning_rate": 1.1164667599061096e-05, "loss": 2.2739, "step": 445390 }, { "epoch": 0.78, "learning_rate": 1.116379565913427e-05, "loss": 2.176, "step": 445400 }, { "epoch": 0.78, "learning_rate": 1.1162923719207443e-05, "loss": 2.3715, "step": 445410 }, { "epoch": 0.78, "learning_rate": 1.1162051779280615e-05, "loss": 2.3533, "step": 445420 }, { "epoch": 0.78, "learning_rate": 1.1161179839353789e-05, "loss": 2.3252, "step": 445430 }, { "epoch": 0.78, "learning_rate": 1.1160307899426961e-05, "loss": 2.3687, "step": 445440 }, { "epoch": 0.78, "learning_rate": 1.1159435959500135e-05, "loss": 2.1664, "step": 445450 }, { "epoch": 0.78, "learning_rate": 1.1158564019573307e-05, "loss": 2.3211, "step": 445460 }, { "epoch": 0.78, "learning_rate": 1.115769207964648e-05, "loss": 2.3419, "step": 445470 }, { "epoch": 0.78, "learning_rate": 1.1156820139719654e-05, "loss": 2.1386, "step": 445480 }, { "epoch": 0.78, "learning_rate": 1.1155948199792828e-05, "loss": 2.2662, "step": 445490 }, { "epoch": 0.78, "learning_rate": 1.1155076259866002e-05, "loss": 2.2983, "step": 445500 }, { "epoch": 0.78, "learning_rate": 1.1154204319939174e-05, "loss": 2.3353, "step": 445510 }, { "epoch": 0.78, "learning_rate": 1.1153332380012348e-05, "loss": 2.2877, "step": 445520 }, { "epoch": 0.78, "learning_rate": 1.115246044008552e-05, "loss": 2.2556, "step": 445530 }, { "epoch": 0.78, "learning_rate": 1.1151588500158694e-05, "loss": 2.3652, "step": 445540 }, { "epoch": 0.78, "learning_rate": 1.1150716560231866e-05, "loss": 2.2252, "step": 445550 }, { "epoch": 0.78, "learning_rate": 1.114984462030504e-05, "loss": 2.2733, "step": 445560 }, { "epoch": 0.78, "learning_rate": 1.1148972680378213e-05, "loss": 2.2063, "step": 445570 }, { "epoch": 0.78, "learning_rate": 1.1148100740451387e-05, "loss": 2.3213, "step": 445580 }, { "epoch": 0.78, "learning_rate": 1.1147228800524559e-05, "loss": 2.31, "step": 445590 }, { "epoch": 0.78, "learning_rate": 1.1146356860597733e-05, "loss": 2.238, "step": 445600 }, { "epoch": 0.78, "learning_rate": 1.1145484920670907e-05, "loss": 2.3359, "step": 445610 }, { "epoch": 0.78, "learning_rate": 1.1144612980744079e-05, "loss": 2.2639, "step": 445620 }, { "epoch": 0.78, "learning_rate": 1.1143741040817252e-05, "loss": 2.3284, "step": 445630 }, { "epoch": 0.78, "learning_rate": 1.1142869100890426e-05, "loss": 2.2822, "step": 445640 }, { "epoch": 0.78, "learning_rate": 1.11419971609636e-05, "loss": 2.2232, "step": 445650 }, { "epoch": 0.78, "learning_rate": 1.1141125221036772e-05, "loss": 2.244, "step": 445660 }, { "epoch": 0.78, "learning_rate": 1.1140253281109946e-05, "loss": 2.2085, "step": 445670 }, { "epoch": 0.78, "learning_rate": 1.1139381341183118e-05, "loss": 2.2299, "step": 445680 }, { "epoch": 0.78, "learning_rate": 1.1138509401256292e-05, "loss": 2.339, "step": 445690 }, { "epoch": 0.78, "learning_rate": 1.1137637461329464e-05, "loss": 2.3712, "step": 445700 }, { "epoch": 0.78, "learning_rate": 1.1136765521402638e-05, "loss": 2.35, "step": 445710 }, { "epoch": 0.78, "learning_rate": 1.1135893581475811e-05, "loss": 2.3036, "step": 445720 }, { "epoch": 0.78, "learning_rate": 1.1135021641548985e-05, "loss": 2.2134, "step": 445730 }, { "epoch": 0.78, "learning_rate": 1.1134149701622159e-05, "loss": 2.3258, "step": 445740 }, { "epoch": 0.78, "learning_rate": 1.1133277761695331e-05, "loss": 2.3676, "step": 445750 }, { "epoch": 0.78, "learning_rate": 1.1132405821768505e-05, "loss": 2.3372, "step": 445760 }, { "epoch": 0.78, "learning_rate": 1.1131533881841677e-05, "loss": 2.2774, "step": 445770 }, { "epoch": 0.78, "learning_rate": 1.113066194191485e-05, "loss": 2.2449, "step": 445780 }, { "epoch": 0.78, "learning_rate": 1.1129790001988023e-05, "loss": 2.334, "step": 445790 }, { "epoch": 0.78, "learning_rate": 1.1128918062061196e-05, "loss": 2.355, "step": 445800 }, { "epoch": 0.78, "learning_rate": 1.112804612213437e-05, "loss": 2.3197, "step": 445810 }, { "epoch": 0.78, "learning_rate": 1.1127174182207544e-05, "loss": 2.2316, "step": 445820 }, { "epoch": 0.78, "learning_rate": 1.1126302242280716e-05, "loss": 2.4049, "step": 445830 }, { "epoch": 0.78, "learning_rate": 1.112543030235389e-05, "loss": 2.2272, "step": 445840 }, { "epoch": 0.78, "learning_rate": 1.1124558362427062e-05, "loss": 2.2697, "step": 445850 }, { "epoch": 0.78, "learning_rate": 1.1123686422500236e-05, "loss": 2.29, "step": 445860 }, { "epoch": 0.78, "learning_rate": 1.1122814482573408e-05, "loss": 2.239, "step": 445870 }, { "epoch": 0.78, "learning_rate": 1.1121942542646581e-05, "loss": 2.403, "step": 445880 }, { "epoch": 0.78, "learning_rate": 1.1121070602719757e-05, "loss": 2.167, "step": 445890 }, { "epoch": 0.78, "learning_rate": 1.1120198662792929e-05, "loss": 2.2898, "step": 445900 }, { "epoch": 0.78, "learning_rate": 1.1119326722866103e-05, "loss": 2.2417, "step": 445910 }, { "epoch": 0.78, "learning_rate": 1.1118454782939275e-05, "loss": 2.3041, "step": 445920 }, { "epoch": 0.78, "learning_rate": 1.1117582843012449e-05, "loss": 2.2393, "step": 445930 }, { "epoch": 0.78, "learning_rate": 1.111671090308562e-05, "loss": 2.1993, "step": 445940 }, { "epoch": 0.78, "learning_rate": 1.1115838963158794e-05, "loss": 2.2735, "step": 445950 }, { "epoch": 0.78, "learning_rate": 1.1114967023231968e-05, "loss": 2.2793, "step": 445960 }, { "epoch": 0.78, "learning_rate": 1.1114095083305142e-05, "loss": 2.2112, "step": 445970 }, { "epoch": 0.78, "learning_rate": 1.1113223143378314e-05, "loss": 2.2422, "step": 445980 }, { "epoch": 0.78, "learning_rate": 1.1112351203451488e-05, "loss": 2.3416, "step": 445990 }, { "epoch": 0.78, "learning_rate": 1.111147926352466e-05, "loss": 2.3276, "step": 446000 }, { "epoch": 0.78, "learning_rate": 1.1110607323597834e-05, "loss": 2.2889, "step": 446010 }, { "epoch": 0.78, "learning_rate": 1.1109735383671007e-05, "loss": 2.3087, "step": 446020 }, { "epoch": 0.78, "learning_rate": 1.110886344374418e-05, "loss": 2.2605, "step": 446030 }, { "epoch": 0.78, "learning_rate": 1.1107991503817353e-05, "loss": 2.1994, "step": 446040 }, { "epoch": 0.78, "learning_rate": 1.1107119563890527e-05, "loss": 2.3569, "step": 446050 }, { "epoch": 0.78, "learning_rate": 1.1106247623963701e-05, "loss": 2.254, "step": 446060 }, { "epoch": 0.78, "learning_rate": 1.1105375684036873e-05, "loss": 2.2616, "step": 446070 }, { "epoch": 0.78, "learning_rate": 1.1104503744110047e-05, "loss": 2.2765, "step": 446080 }, { "epoch": 0.78, "learning_rate": 1.1103631804183219e-05, "loss": 2.2048, "step": 446090 }, { "epoch": 0.78, "learning_rate": 1.1102759864256393e-05, "loss": 2.3075, "step": 446100 }, { "epoch": 0.78, "learning_rate": 1.1101887924329565e-05, "loss": 2.3581, "step": 446110 }, { "epoch": 0.78, "learning_rate": 1.1101015984402738e-05, "loss": 2.3565, "step": 446120 }, { "epoch": 0.78, "learning_rate": 1.1100144044475912e-05, "loss": 2.2526, "step": 446130 }, { "epoch": 0.78, "learning_rate": 1.1099272104549086e-05, "loss": 2.2316, "step": 446140 }, { "epoch": 0.78, "learning_rate": 1.109840016462226e-05, "loss": 2.2508, "step": 446150 }, { "epoch": 0.78, "learning_rate": 1.1097528224695432e-05, "loss": 2.237, "step": 446160 }, { "epoch": 0.78, "learning_rate": 1.1096656284768606e-05, "loss": 2.3562, "step": 446170 }, { "epoch": 0.78, "learning_rate": 1.1095784344841778e-05, "loss": 2.2726, "step": 446180 }, { "epoch": 0.78, "learning_rate": 1.1094912404914951e-05, "loss": 2.2558, "step": 446190 }, { "epoch": 0.78, "learning_rate": 1.1094040464988125e-05, "loss": 2.3041, "step": 446200 }, { "epoch": 0.78, "learning_rate": 1.1093168525061299e-05, "loss": 2.3083, "step": 446210 }, { "epoch": 0.78, "learning_rate": 1.1092296585134471e-05, "loss": 2.2715, "step": 446220 }, { "epoch": 0.78, "learning_rate": 1.1091424645207645e-05, "loss": 2.1642, "step": 446230 }, { "epoch": 0.78, "learning_rate": 1.1090552705280817e-05, "loss": 2.2833, "step": 446240 }, { "epoch": 0.78, "learning_rate": 1.108968076535399e-05, "loss": 2.2689, "step": 446250 }, { "epoch": 0.78, "learning_rate": 1.1088808825427163e-05, "loss": 2.2884, "step": 446260 }, { "epoch": 0.78, "learning_rate": 1.1087936885500336e-05, "loss": 2.2104, "step": 446270 }, { "epoch": 0.78, "learning_rate": 1.108706494557351e-05, "loss": 2.2287, "step": 446280 }, { "epoch": 0.78, "learning_rate": 1.1086193005646684e-05, "loss": 2.3536, "step": 446290 }, { "epoch": 0.78, "learning_rate": 1.1085321065719858e-05, "loss": 2.1844, "step": 446300 }, { "epoch": 0.78, "learning_rate": 1.108444912579303e-05, "loss": 2.3056, "step": 446310 }, { "epoch": 0.78, "learning_rate": 1.1083577185866204e-05, "loss": 2.2632, "step": 446320 }, { "epoch": 0.78, "learning_rate": 1.1082705245939376e-05, "loss": 2.334, "step": 446330 }, { "epoch": 0.78, "learning_rate": 1.108183330601255e-05, "loss": 2.2087, "step": 446340 }, { "epoch": 0.78, "learning_rate": 1.1080961366085722e-05, "loss": 2.2475, "step": 446350 }, { "epoch": 0.78, "learning_rate": 1.1080089426158895e-05, "loss": 2.3455, "step": 446360 }, { "epoch": 0.78, "learning_rate": 1.1079217486232069e-05, "loss": 2.2522, "step": 446370 }, { "epoch": 0.78, "learning_rate": 1.1078345546305243e-05, "loss": 2.2919, "step": 446380 }, { "epoch": 0.78, "learning_rate": 1.1077473606378415e-05, "loss": 2.2653, "step": 446390 }, { "epoch": 0.78, "learning_rate": 1.1076601666451589e-05, "loss": 2.3586, "step": 446400 }, { "epoch": 0.78, "learning_rate": 1.1075729726524762e-05, "loss": 2.1692, "step": 446410 }, { "epoch": 0.78, "learning_rate": 1.1074857786597935e-05, "loss": 2.2088, "step": 446420 }, { "epoch": 0.78, "learning_rate": 1.1073985846671108e-05, "loss": 2.2327, "step": 446430 }, { "epoch": 0.78, "learning_rate": 1.1073113906744282e-05, "loss": 2.3086, "step": 446440 }, { "epoch": 0.78, "learning_rate": 1.1072241966817456e-05, "loss": 2.3474, "step": 446450 }, { "epoch": 0.78, "learning_rate": 1.1071370026890628e-05, "loss": 2.3636, "step": 446460 }, { "epoch": 0.78, "learning_rate": 1.1070498086963802e-05, "loss": 2.2901, "step": 446470 }, { "epoch": 0.78, "learning_rate": 1.1069626147036974e-05, "loss": 2.3037, "step": 446480 }, { "epoch": 0.78, "learning_rate": 1.1068754207110148e-05, "loss": 2.229, "step": 446490 }, { "epoch": 0.78, "learning_rate": 1.106788226718332e-05, "loss": 2.2816, "step": 446500 }, { "epoch": 0.78, "learning_rate": 1.1067010327256493e-05, "loss": 2.1807, "step": 446510 }, { "epoch": 0.78, "learning_rate": 1.1066138387329667e-05, "loss": 2.2818, "step": 446520 }, { "epoch": 0.78, "learning_rate": 1.1065266447402841e-05, "loss": 2.3987, "step": 446530 }, { "epoch": 0.78, "learning_rate": 1.1064394507476015e-05, "loss": 2.2472, "step": 446540 }, { "epoch": 0.78, "learning_rate": 1.1063522567549187e-05, "loss": 2.2862, "step": 446550 }, { "epoch": 0.78, "learning_rate": 1.106265062762236e-05, "loss": 2.3113, "step": 446560 }, { "epoch": 0.78, "learning_rate": 1.1061778687695533e-05, "loss": 2.2414, "step": 446570 }, { "epoch": 0.78, "learning_rate": 1.1060906747768706e-05, "loss": 2.3419, "step": 446580 }, { "epoch": 0.78, "learning_rate": 1.1060034807841878e-05, "loss": 2.1414, "step": 446590 }, { "epoch": 0.78, "learning_rate": 1.1059162867915052e-05, "loss": 2.3085, "step": 446600 }, { "epoch": 0.78, "learning_rate": 1.1058290927988226e-05, "loss": 2.1271, "step": 446610 }, { "epoch": 0.78, "learning_rate": 1.10574189880614e-05, "loss": 2.0722, "step": 446620 }, { "epoch": 0.78, "learning_rate": 1.1056547048134572e-05, "loss": 2.2798, "step": 446630 }, { "epoch": 0.78, "learning_rate": 1.1055675108207746e-05, "loss": 2.2962, "step": 446640 }, { "epoch": 0.78, "learning_rate": 1.1054803168280918e-05, "loss": 2.2891, "step": 446650 }, { "epoch": 0.78, "learning_rate": 1.1053931228354091e-05, "loss": 2.2241, "step": 446660 }, { "epoch": 0.78, "learning_rate": 1.1053059288427265e-05, "loss": 2.191, "step": 446670 }, { "epoch": 0.78, "learning_rate": 1.1052187348500439e-05, "loss": 2.2935, "step": 446680 }, { "epoch": 0.78, "learning_rate": 1.1051315408573613e-05, "loss": 2.4007, "step": 446690 }, { "epoch": 0.78, "learning_rate": 1.1050443468646785e-05, "loss": 2.3889, "step": 446700 }, { "epoch": 0.78, "learning_rate": 1.1049571528719959e-05, "loss": 2.3619, "step": 446710 }, { "epoch": 0.78, "learning_rate": 1.104869958879313e-05, "loss": 2.3061, "step": 446720 }, { "epoch": 0.78, "learning_rate": 1.1047827648866304e-05, "loss": 2.3259, "step": 446730 }, { "epoch": 0.78, "learning_rate": 1.1046955708939477e-05, "loss": 2.3453, "step": 446740 }, { "epoch": 0.78, "learning_rate": 1.104608376901265e-05, "loss": 2.3418, "step": 446750 }, { "epoch": 0.78, "learning_rate": 1.1045211829085824e-05, "loss": 2.2666, "step": 446760 }, { "epoch": 0.78, "learning_rate": 1.1044339889158998e-05, "loss": 2.351, "step": 446770 }, { "epoch": 0.78, "learning_rate": 1.104346794923217e-05, "loss": 2.2604, "step": 446780 }, { "epoch": 0.78, "learning_rate": 1.1042596009305344e-05, "loss": 2.1564, "step": 446790 }, { "epoch": 0.78, "learning_rate": 1.1041724069378516e-05, "loss": 2.3085, "step": 446800 }, { "epoch": 0.78, "learning_rate": 1.104085212945169e-05, "loss": 2.332, "step": 446810 }, { "epoch": 0.78, "learning_rate": 1.1039980189524863e-05, "loss": 2.2855, "step": 446820 }, { "epoch": 0.78, "learning_rate": 1.1039108249598035e-05, "loss": 2.4223, "step": 446830 }, { "epoch": 0.78, "learning_rate": 1.103823630967121e-05, "loss": 2.2385, "step": 446840 }, { "epoch": 0.78, "learning_rate": 1.1037364369744383e-05, "loss": 2.1582, "step": 446850 }, { "epoch": 0.78, "learning_rate": 1.1036492429817557e-05, "loss": 2.3146, "step": 446860 }, { "epoch": 0.78, "learning_rate": 1.1035620489890729e-05, "loss": 2.3067, "step": 446870 }, { "epoch": 0.78, "learning_rate": 1.1034748549963903e-05, "loss": 2.2691, "step": 446880 }, { "epoch": 0.78, "learning_rate": 1.1033876610037075e-05, "loss": 2.349, "step": 446890 }, { "epoch": 0.78, "learning_rate": 1.1033004670110248e-05, "loss": 2.4146, "step": 446900 }, { "epoch": 0.78, "learning_rate": 1.103213273018342e-05, "loss": 2.2405, "step": 446910 }, { "epoch": 0.78, "learning_rate": 1.1031260790256594e-05, "loss": 2.2862, "step": 446920 }, { "epoch": 0.78, "learning_rate": 1.1030388850329768e-05, "loss": 2.3093, "step": 446930 }, { "epoch": 0.78, "learning_rate": 1.1029516910402942e-05, "loss": 2.3189, "step": 446940 }, { "epoch": 0.78, "learning_rate": 1.1028644970476116e-05, "loss": 2.2441, "step": 446950 }, { "epoch": 0.78, "learning_rate": 1.1027773030549288e-05, "loss": 2.2554, "step": 446960 }, { "epoch": 0.78, "learning_rate": 1.1026901090622461e-05, "loss": 2.3194, "step": 446970 }, { "epoch": 0.78, "learning_rate": 1.1026029150695633e-05, "loss": 2.2225, "step": 446980 }, { "epoch": 0.78, "learning_rate": 1.1025157210768807e-05, "loss": 2.214, "step": 446990 }, { "epoch": 0.78, "learning_rate": 1.1024285270841981e-05, "loss": 2.3019, "step": 447000 }, { "epoch": 0.78, "learning_rate": 1.1023413330915155e-05, "loss": 2.3267, "step": 447010 }, { "epoch": 0.78, "learning_rate": 1.1022541390988327e-05, "loss": 2.3323, "step": 447020 }, { "epoch": 0.78, "learning_rate": 1.10216694510615e-05, "loss": 2.433, "step": 447030 }, { "epoch": 0.78, "learning_rate": 1.1020797511134673e-05, "loss": 2.3244, "step": 447040 }, { "epoch": 0.78, "learning_rate": 1.1019925571207846e-05, "loss": 2.3029, "step": 447050 }, { "epoch": 0.78, "learning_rate": 1.1019053631281019e-05, "loss": 2.2674, "step": 447060 }, { "epoch": 0.78, "learning_rate": 1.1018181691354192e-05, "loss": 2.2632, "step": 447070 }, { "epoch": 0.78, "learning_rate": 1.1017309751427366e-05, "loss": 2.2927, "step": 447080 }, { "epoch": 0.78, "learning_rate": 1.101643781150054e-05, "loss": 2.2025, "step": 447090 }, { "epoch": 0.78, "learning_rate": 1.1015565871573714e-05, "loss": 2.1706, "step": 447100 }, { "epoch": 0.78, "learning_rate": 1.1014693931646886e-05, "loss": 2.2141, "step": 447110 }, { "epoch": 0.78, "learning_rate": 1.101382199172006e-05, "loss": 2.3135, "step": 447120 }, { "epoch": 0.78, "learning_rate": 1.1012950051793232e-05, "loss": 2.2779, "step": 447130 }, { "epoch": 0.78, "learning_rate": 1.1012078111866405e-05, "loss": 2.359, "step": 447140 }, { "epoch": 0.78, "learning_rate": 1.1011206171939577e-05, "loss": 2.2618, "step": 447150 }, { "epoch": 0.78, "learning_rate": 1.1010334232012751e-05, "loss": 2.2528, "step": 447160 }, { "epoch": 0.78, "learning_rate": 1.1009462292085925e-05, "loss": 2.36, "step": 447170 }, { "epoch": 0.78, "learning_rate": 1.1008590352159099e-05, "loss": 2.278, "step": 447180 }, { "epoch": 0.78, "learning_rate": 1.100771841223227e-05, "loss": 2.2808, "step": 447190 }, { "epoch": 0.78, "learning_rate": 1.1006846472305445e-05, "loss": 2.4314, "step": 447200 }, { "epoch": 0.78, "learning_rate": 1.1005974532378618e-05, "loss": 2.2784, "step": 447210 }, { "epoch": 0.78, "learning_rate": 1.100510259245179e-05, "loss": 2.2529, "step": 447220 }, { "epoch": 0.78, "learning_rate": 1.1004230652524964e-05, "loss": 2.2777, "step": 447230 }, { "epoch": 0.78, "learning_rate": 1.1003358712598138e-05, "loss": 2.3169, "step": 447240 }, { "epoch": 0.78, "learning_rate": 1.1002486772671312e-05, "loss": 2.2251, "step": 447250 }, { "epoch": 0.78, "learning_rate": 1.1001614832744484e-05, "loss": 2.3217, "step": 447260 }, { "epoch": 0.78, "learning_rate": 1.1000742892817658e-05, "loss": 2.268, "step": 447270 }, { "epoch": 0.78, "learning_rate": 1.099987095289083e-05, "loss": 2.307, "step": 447280 }, { "epoch": 0.78, "learning_rate": 1.0998999012964003e-05, "loss": 2.2134, "step": 447290 }, { "epoch": 0.78, "learning_rate": 1.0998127073037175e-05, "loss": 2.2463, "step": 447300 }, { "epoch": 0.78, "learning_rate": 1.099725513311035e-05, "loss": 2.279, "step": 447310 }, { "epoch": 0.78, "learning_rate": 1.0996383193183523e-05, "loss": 2.3445, "step": 447320 }, { "epoch": 0.78, "learning_rate": 1.0995511253256697e-05, "loss": 2.3498, "step": 447330 }, { "epoch": 0.78, "learning_rate": 1.099463931332987e-05, "loss": 2.2694, "step": 447340 }, { "epoch": 0.78, "learning_rate": 1.0993767373403043e-05, "loss": 2.3334, "step": 447350 }, { "epoch": 0.78, "learning_rate": 1.0992895433476216e-05, "loss": 2.2519, "step": 447360 }, { "epoch": 0.78, "learning_rate": 1.0992023493549388e-05, "loss": 2.3013, "step": 447370 }, { "epoch": 0.78, "learning_rate": 1.0991151553622562e-05, "loss": 2.2051, "step": 447380 }, { "epoch": 0.78, "learning_rate": 1.0990279613695734e-05, "loss": 2.2646, "step": 447390 }, { "epoch": 0.78, "learning_rate": 1.0989407673768908e-05, "loss": 2.1417, "step": 447400 }, { "epoch": 0.78, "learning_rate": 1.0988535733842082e-05, "loss": 2.335, "step": 447410 }, { "epoch": 0.78, "learning_rate": 1.0987663793915256e-05, "loss": 2.2486, "step": 447420 }, { "epoch": 0.78, "learning_rate": 1.0986791853988428e-05, "loss": 2.3027, "step": 447430 }, { "epoch": 0.78, "learning_rate": 1.0985919914061601e-05, "loss": 2.2399, "step": 447440 }, { "epoch": 0.78, "learning_rate": 1.0985047974134774e-05, "loss": 2.3594, "step": 447450 }, { "epoch": 0.78, "learning_rate": 1.0984176034207947e-05, "loss": 2.358, "step": 447460 }, { "epoch": 0.78, "learning_rate": 1.0983304094281121e-05, "loss": 2.2909, "step": 447470 }, { "epoch": 0.78, "learning_rate": 1.0982432154354295e-05, "loss": 2.2096, "step": 447480 }, { "epoch": 0.78, "learning_rate": 1.0981560214427469e-05, "loss": 2.2437, "step": 447490 }, { "epoch": 0.78, "learning_rate": 1.098068827450064e-05, "loss": 2.2955, "step": 447500 }, { "epoch": 0.78, "learning_rate": 1.0979816334573814e-05, "loss": 2.2038, "step": 447510 }, { "epoch": 0.78, "learning_rate": 1.0978944394646987e-05, "loss": 2.3192, "step": 447520 }, { "epoch": 0.78, "learning_rate": 1.097807245472016e-05, "loss": 2.3408, "step": 447530 }, { "epoch": 0.78, "learning_rate": 1.0977200514793332e-05, "loss": 2.2949, "step": 447540 }, { "epoch": 0.78, "learning_rate": 1.0976328574866506e-05, "loss": 2.2573, "step": 447550 }, { "epoch": 0.78, "learning_rate": 1.097545663493968e-05, "loss": 2.2396, "step": 447560 }, { "epoch": 0.78, "learning_rate": 1.0974584695012854e-05, "loss": 2.2342, "step": 447570 }, { "epoch": 0.78, "learning_rate": 1.0973712755086026e-05, "loss": 2.2065, "step": 447580 }, { "epoch": 0.78, "learning_rate": 1.09728408151592e-05, "loss": 2.1327, "step": 447590 }, { "epoch": 0.78, "learning_rate": 1.0971968875232372e-05, "loss": 2.2753, "step": 447600 }, { "epoch": 0.78, "learning_rate": 1.0971096935305545e-05, "loss": 2.4205, "step": 447610 }, { "epoch": 0.78, "learning_rate": 1.097022499537872e-05, "loss": 2.2626, "step": 447620 }, { "epoch": 0.78, "learning_rate": 1.0969353055451891e-05, "loss": 2.2871, "step": 447630 }, { "epoch": 0.78, "learning_rate": 1.0968481115525065e-05, "loss": 2.2328, "step": 447640 }, { "epoch": 0.78, "learning_rate": 1.0967609175598239e-05, "loss": 2.3665, "step": 447650 }, { "epoch": 0.78, "learning_rate": 1.0966737235671413e-05, "loss": 2.3321, "step": 447660 }, { "epoch": 0.78, "learning_rate": 1.0965865295744585e-05, "loss": 2.2465, "step": 447670 }, { "epoch": 0.78, "learning_rate": 1.0964993355817758e-05, "loss": 2.3034, "step": 447680 }, { "epoch": 0.78, "learning_rate": 1.096412141589093e-05, "loss": 2.2495, "step": 447690 }, { "epoch": 0.78, "learning_rate": 1.0963249475964104e-05, "loss": 2.3279, "step": 447700 }, { "epoch": 0.78, "learning_rate": 1.0962377536037276e-05, "loss": 2.153, "step": 447710 }, { "epoch": 0.78, "learning_rate": 1.0961505596110452e-05, "loss": 2.3023, "step": 447720 }, { "epoch": 0.78, "learning_rate": 1.0960633656183624e-05, "loss": 2.4085, "step": 447730 }, { "epoch": 0.78, "learning_rate": 1.0959761716256798e-05, "loss": 2.2664, "step": 447740 }, { "epoch": 0.78, "learning_rate": 1.0958889776329971e-05, "loss": 2.3539, "step": 447750 }, { "epoch": 0.78, "learning_rate": 1.0958017836403143e-05, "loss": 2.2912, "step": 447760 }, { "epoch": 0.78, "learning_rate": 1.0957145896476317e-05, "loss": 2.3172, "step": 447770 }, { "epoch": 0.78, "learning_rate": 1.095627395654949e-05, "loss": 2.1588, "step": 447780 }, { "epoch": 0.78, "learning_rate": 1.0955402016622663e-05, "loss": 2.29, "step": 447790 }, { "epoch": 0.78, "learning_rate": 1.0954530076695837e-05, "loss": 2.2013, "step": 447800 }, { "epoch": 0.78, "learning_rate": 1.095365813676901e-05, "loss": 2.3078, "step": 447810 }, { "epoch": 0.78, "learning_rate": 1.0952786196842183e-05, "loss": 2.3843, "step": 447820 }, { "epoch": 0.78, "learning_rate": 1.0951914256915356e-05, "loss": 2.263, "step": 447830 }, { "epoch": 0.78, "learning_rate": 1.0951042316988529e-05, "loss": 2.3343, "step": 447840 }, { "epoch": 0.78, "learning_rate": 1.0950170377061702e-05, "loss": 2.2634, "step": 447850 }, { "epoch": 0.78, "learning_rate": 1.0949298437134874e-05, "loss": 2.1757, "step": 447860 }, { "epoch": 0.78, "learning_rate": 1.0948426497208048e-05, "loss": 2.2699, "step": 447870 }, { "epoch": 0.78, "learning_rate": 1.0947554557281222e-05, "loss": 2.3486, "step": 447880 }, { "epoch": 0.78, "learning_rate": 1.0946682617354396e-05, "loss": 2.1854, "step": 447890 }, { "epoch": 0.78, "learning_rate": 1.094581067742757e-05, "loss": 2.241, "step": 447900 }, { "epoch": 0.78, "learning_rate": 1.0944938737500742e-05, "loss": 2.1979, "step": 447910 }, { "epoch": 0.78, "learning_rate": 1.0944066797573915e-05, "loss": 2.3076, "step": 447920 }, { "epoch": 0.78, "learning_rate": 1.0943194857647087e-05, "loss": 2.2866, "step": 447930 }, { "epoch": 0.78, "learning_rate": 1.0942322917720261e-05, "loss": 2.3123, "step": 447940 }, { "epoch": 0.78, "learning_rate": 1.0941450977793433e-05, "loss": 2.2125, "step": 447950 }, { "epoch": 0.78, "learning_rate": 1.0940579037866607e-05, "loss": 2.4053, "step": 447960 }, { "epoch": 0.78, "learning_rate": 1.093970709793978e-05, "loss": 2.3394, "step": 447970 }, { "epoch": 0.78, "learning_rate": 1.0938835158012955e-05, "loss": 2.3901, "step": 447980 }, { "epoch": 0.78, "learning_rate": 1.0937963218086127e-05, "loss": 2.312, "step": 447990 }, { "epoch": 0.78, "learning_rate": 1.09370912781593e-05, "loss": 2.3416, "step": 448000 }, { "epoch": 0.78, "learning_rate": 1.0936219338232474e-05, "loss": 2.2258, "step": 448010 }, { "epoch": 0.78, "learning_rate": 1.0935347398305646e-05, "loss": 2.3343, "step": 448020 }, { "epoch": 0.78, "learning_rate": 1.093447545837882e-05, "loss": 2.3504, "step": 448030 }, { "epoch": 0.78, "learning_rate": 1.0933603518451994e-05, "loss": 2.2995, "step": 448040 }, { "epoch": 0.78, "learning_rate": 1.0932731578525168e-05, "loss": 2.3014, "step": 448050 }, { "epoch": 0.78, "learning_rate": 1.093185963859834e-05, "loss": 2.2266, "step": 448060 }, { "epoch": 0.78, "learning_rate": 1.0930987698671513e-05, "loss": 2.3508, "step": 448070 }, { "epoch": 0.78, "learning_rate": 1.0930115758744685e-05, "loss": 2.2831, "step": 448080 }, { "epoch": 0.78, "learning_rate": 1.092924381881786e-05, "loss": 2.2383, "step": 448090 }, { "epoch": 0.78, "learning_rate": 1.0928371878891031e-05, "loss": 2.2214, "step": 448100 }, { "epoch": 0.78, "learning_rate": 1.0927499938964205e-05, "loss": 2.2117, "step": 448110 }, { "epoch": 0.78, "learning_rate": 1.0926627999037379e-05, "loss": 2.1928, "step": 448120 }, { "epoch": 0.78, "learning_rate": 1.0925756059110553e-05, "loss": 2.3885, "step": 448130 }, { "epoch": 0.78, "learning_rate": 1.0924884119183726e-05, "loss": 2.3726, "step": 448140 }, { "epoch": 0.78, "learning_rate": 1.0924012179256898e-05, "loss": 2.2789, "step": 448150 }, { "epoch": 0.78, "learning_rate": 1.0923140239330072e-05, "loss": 2.3413, "step": 448160 }, { "epoch": 0.78, "learning_rate": 1.0922268299403244e-05, "loss": 2.2719, "step": 448170 }, { "epoch": 0.78, "learning_rate": 1.0921396359476418e-05, "loss": 2.254, "step": 448180 }, { "epoch": 0.78, "learning_rate": 1.092052441954959e-05, "loss": 2.3938, "step": 448190 }, { "epoch": 0.78, "learning_rate": 1.0919652479622764e-05, "loss": 2.3804, "step": 448200 }, { "epoch": 0.78, "learning_rate": 1.0918780539695938e-05, "loss": 2.3806, "step": 448210 }, { "epoch": 0.78, "learning_rate": 1.0917908599769111e-05, "loss": 2.3337, "step": 448220 }, { "epoch": 0.78, "learning_rate": 1.0917036659842284e-05, "loss": 2.1988, "step": 448230 }, { "epoch": 0.78, "learning_rate": 1.0916164719915457e-05, "loss": 2.2141, "step": 448240 }, { "epoch": 0.78, "learning_rate": 1.091529277998863e-05, "loss": 2.3316, "step": 448250 }, { "epoch": 0.78, "learning_rate": 1.0914420840061803e-05, "loss": 2.269, "step": 448260 }, { "epoch": 0.78, "learning_rate": 1.0913548900134977e-05, "loss": 2.3499, "step": 448270 }, { "epoch": 0.78, "learning_rate": 1.091267696020815e-05, "loss": 2.333, "step": 448280 }, { "epoch": 0.78, "learning_rate": 1.0911805020281324e-05, "loss": 2.273, "step": 448290 }, { "epoch": 0.78, "learning_rate": 1.0910933080354497e-05, "loss": 2.3449, "step": 448300 }, { "epoch": 0.78, "learning_rate": 1.091006114042767e-05, "loss": 2.2618, "step": 448310 }, { "epoch": 0.78, "learning_rate": 1.0909189200500842e-05, "loss": 2.3276, "step": 448320 }, { "epoch": 0.78, "learning_rate": 1.0908317260574016e-05, "loss": 2.3009, "step": 448330 }, { "epoch": 0.78, "learning_rate": 1.0907445320647188e-05, "loss": 2.4322, "step": 448340 }, { "epoch": 0.78, "learning_rate": 1.0906573380720362e-05, "loss": 2.3093, "step": 448350 }, { "epoch": 0.78, "learning_rate": 1.0905701440793536e-05, "loss": 2.3618, "step": 448360 }, { "epoch": 0.78, "learning_rate": 1.090482950086671e-05, "loss": 2.2381, "step": 448370 }, { "epoch": 0.78, "learning_rate": 1.0903957560939882e-05, "loss": 2.298, "step": 448380 }, { "epoch": 0.78, "learning_rate": 1.0903085621013055e-05, "loss": 2.3223, "step": 448390 }, { "epoch": 0.78, "learning_rate": 1.090221368108623e-05, "loss": 2.2489, "step": 448400 }, { "epoch": 0.78, "learning_rate": 1.0901341741159401e-05, "loss": 2.3532, "step": 448410 }, { "epoch": 0.78, "learning_rate": 1.0900469801232575e-05, "loss": 2.3726, "step": 448420 }, { "epoch": 0.78, "learning_rate": 1.0899597861305747e-05, "loss": 2.3058, "step": 448430 }, { "epoch": 0.78, "learning_rate": 1.0898725921378921e-05, "loss": 2.3509, "step": 448440 }, { "epoch": 0.78, "learning_rate": 1.0897853981452095e-05, "loss": 2.2069, "step": 448450 }, { "epoch": 0.78, "learning_rate": 1.0896982041525268e-05, "loss": 2.3641, "step": 448460 }, { "epoch": 0.78, "learning_rate": 1.089611010159844e-05, "loss": 2.2752, "step": 448470 }, { "epoch": 0.78, "learning_rate": 1.0895238161671614e-05, "loss": 2.283, "step": 448480 }, { "epoch": 0.78, "learning_rate": 1.0894366221744786e-05, "loss": 2.2041, "step": 448490 }, { "epoch": 0.78, "learning_rate": 1.089349428181796e-05, "loss": 2.1738, "step": 448500 }, { "epoch": 0.78, "learning_rate": 1.0892622341891132e-05, "loss": 2.231, "step": 448510 }, { "epoch": 0.78, "learning_rate": 1.0891750401964308e-05, "loss": 2.2712, "step": 448520 }, { "epoch": 0.78, "learning_rate": 1.089087846203748e-05, "loss": 2.301, "step": 448530 }, { "epoch": 0.78, "learning_rate": 1.0890006522110653e-05, "loss": 2.3201, "step": 448540 }, { "epoch": 0.78, "learning_rate": 1.0889134582183827e-05, "loss": 2.3108, "step": 448550 }, { "epoch": 0.78, "learning_rate": 1.0888262642257e-05, "loss": 2.214, "step": 448560 }, { "epoch": 0.78, "learning_rate": 1.0887390702330173e-05, "loss": 2.2519, "step": 448570 }, { "epoch": 0.78, "learning_rate": 1.0886518762403345e-05, "loss": 2.2344, "step": 448580 }, { "epoch": 0.78, "learning_rate": 1.0885646822476519e-05, "loss": 2.2845, "step": 448590 }, { "epoch": 0.78, "learning_rate": 1.0884774882549693e-05, "loss": 2.3209, "step": 448600 }, { "epoch": 0.78, "learning_rate": 1.0883902942622866e-05, "loss": 2.2117, "step": 448610 }, { "epoch": 0.78, "learning_rate": 1.0883031002696039e-05, "loss": 2.332, "step": 448620 }, { "epoch": 0.78, "learning_rate": 1.0882159062769212e-05, "loss": 2.2885, "step": 448630 }, { "epoch": 0.78, "learning_rate": 1.0881287122842384e-05, "loss": 2.4049, "step": 448640 }, { "epoch": 0.78, "learning_rate": 1.0880415182915558e-05, "loss": 2.2754, "step": 448650 }, { "epoch": 0.78, "learning_rate": 1.087954324298873e-05, "loss": 2.2095, "step": 448660 }, { "epoch": 0.78, "learning_rate": 1.0878671303061904e-05, "loss": 2.3389, "step": 448670 }, { "epoch": 0.78, "learning_rate": 1.0877799363135078e-05, "loss": 2.3013, "step": 448680 }, { "epoch": 0.78, "learning_rate": 1.0876927423208252e-05, "loss": 2.3097, "step": 448690 }, { "epoch": 0.78, "learning_rate": 1.0876055483281425e-05, "loss": 2.3084, "step": 448700 }, { "epoch": 0.78, "learning_rate": 1.0875183543354597e-05, "loss": 2.1587, "step": 448710 }, { "epoch": 0.78, "learning_rate": 1.0874311603427771e-05, "loss": 2.2526, "step": 448720 }, { "epoch": 0.78, "learning_rate": 1.0873439663500943e-05, "loss": 2.3235, "step": 448730 }, { "epoch": 0.78, "learning_rate": 1.0872567723574117e-05, "loss": 2.1592, "step": 448740 }, { "epoch": 0.78, "learning_rate": 1.0871695783647289e-05, "loss": 2.265, "step": 448750 }, { "epoch": 0.78, "learning_rate": 1.0870823843720465e-05, "loss": 2.3007, "step": 448760 }, { "epoch": 0.78, "learning_rate": 1.0869951903793637e-05, "loss": 2.2539, "step": 448770 }, { "epoch": 0.78, "learning_rate": 1.086907996386681e-05, "loss": 2.2202, "step": 448780 }, { "epoch": 0.78, "learning_rate": 1.0868208023939982e-05, "loss": 2.3093, "step": 448790 }, { "epoch": 0.78, "learning_rate": 1.0867336084013156e-05, "loss": 2.3515, "step": 448800 }, { "epoch": 0.78, "learning_rate": 1.086646414408633e-05, "loss": 2.2852, "step": 448810 }, { "epoch": 0.78, "learning_rate": 1.0865592204159502e-05, "loss": 2.3158, "step": 448820 }, { "epoch": 0.78, "learning_rate": 1.0864720264232676e-05, "loss": 2.2456, "step": 448830 }, { "epoch": 0.78, "learning_rate": 1.086384832430585e-05, "loss": 2.2556, "step": 448840 }, { "epoch": 0.78, "learning_rate": 1.0862976384379023e-05, "loss": 2.2917, "step": 448850 }, { "epoch": 0.78, "learning_rate": 1.0862104444452195e-05, "loss": 2.1712, "step": 448860 }, { "epoch": 0.78, "learning_rate": 1.086123250452537e-05, "loss": 2.174, "step": 448870 }, { "epoch": 0.78, "learning_rate": 1.0860360564598541e-05, "loss": 2.3618, "step": 448880 }, { "epoch": 0.78, "learning_rate": 1.0859488624671715e-05, "loss": 2.2951, "step": 448890 }, { "epoch": 0.78, "learning_rate": 1.0858616684744887e-05, "loss": 2.1882, "step": 448900 }, { "epoch": 0.78, "learning_rate": 1.0857744744818061e-05, "loss": 2.2281, "step": 448910 }, { "epoch": 0.78, "learning_rate": 1.0856872804891235e-05, "loss": 2.3293, "step": 448920 }, { "epoch": 0.78, "learning_rate": 1.0856000864964408e-05, "loss": 2.3897, "step": 448930 }, { "epoch": 0.78, "learning_rate": 1.0855128925037582e-05, "loss": 2.2934, "step": 448940 }, { "epoch": 0.78, "learning_rate": 1.0854256985110754e-05, "loss": 2.4413, "step": 448950 }, { "epoch": 0.78, "learning_rate": 1.0853385045183928e-05, "loss": 2.2849, "step": 448960 }, { "epoch": 0.78, "learning_rate": 1.08525131052571e-05, "loss": 2.3869, "step": 448970 }, { "epoch": 0.78, "learning_rate": 1.0851641165330274e-05, "loss": 2.3043, "step": 448980 }, { "epoch": 0.78, "learning_rate": 1.0850769225403446e-05, "loss": 2.218, "step": 448990 }, { "epoch": 0.78, "learning_rate": 1.0849897285476621e-05, "loss": 2.2313, "step": 449000 }, { "epoch": 0.78, "learning_rate": 1.0849025345549794e-05, "loss": 2.2683, "step": 449010 }, { "epoch": 0.78, "learning_rate": 1.0848153405622967e-05, "loss": 2.3161, "step": 449020 }, { "epoch": 0.78, "learning_rate": 1.084728146569614e-05, "loss": 2.3097, "step": 449030 }, { "epoch": 0.78, "learning_rate": 1.0846409525769313e-05, "loss": 2.2864, "step": 449040 }, { "epoch": 0.78, "learning_rate": 1.0845537585842485e-05, "loss": 2.2166, "step": 449050 }, { "epoch": 0.78, "learning_rate": 1.0844665645915659e-05, "loss": 2.2431, "step": 449060 }, { "epoch": 0.78, "learning_rate": 1.0843793705988833e-05, "loss": 2.2889, "step": 449070 }, { "epoch": 0.78, "learning_rate": 1.0842921766062007e-05, "loss": 2.2386, "step": 449080 }, { "epoch": 0.78, "learning_rate": 1.084204982613518e-05, "loss": 2.309, "step": 449090 }, { "epoch": 0.78, "learning_rate": 1.0841177886208352e-05, "loss": 2.2211, "step": 449100 }, { "epoch": 0.78, "learning_rate": 1.0840305946281526e-05, "loss": 2.3847, "step": 449110 }, { "epoch": 0.78, "learning_rate": 1.0839434006354698e-05, "loss": 2.368, "step": 449120 }, { "epoch": 0.78, "learning_rate": 1.0838562066427872e-05, "loss": 2.2543, "step": 449130 }, { "epoch": 0.78, "learning_rate": 1.0837690126501044e-05, "loss": 2.1969, "step": 449140 }, { "epoch": 0.78, "learning_rate": 1.0836818186574218e-05, "loss": 2.3512, "step": 449150 }, { "epoch": 0.78, "learning_rate": 1.0835946246647392e-05, "loss": 2.2207, "step": 449160 }, { "epoch": 0.78, "learning_rate": 1.0835074306720565e-05, "loss": 2.2446, "step": 449170 }, { "epoch": 0.78, "learning_rate": 1.0834202366793737e-05, "loss": 2.2618, "step": 449180 }, { "epoch": 0.78, "learning_rate": 1.0833330426866911e-05, "loss": 2.3821, "step": 449190 }, { "epoch": 0.78, "learning_rate": 1.0832458486940085e-05, "loss": 2.2228, "step": 449200 }, { "epoch": 0.78, "learning_rate": 1.0831586547013257e-05, "loss": 2.3172, "step": 449210 }, { "epoch": 0.78, "learning_rate": 1.0830714607086431e-05, "loss": 2.3321, "step": 449220 }, { "epoch": 0.78, "learning_rate": 1.0829842667159603e-05, "loss": 2.3625, "step": 449230 }, { "epoch": 0.78, "learning_rate": 1.0828970727232777e-05, "loss": 2.2753, "step": 449240 }, { "epoch": 0.78, "learning_rate": 1.082809878730595e-05, "loss": 2.2643, "step": 449250 }, { "epoch": 0.78, "learning_rate": 1.0827226847379124e-05, "loss": 2.3571, "step": 449260 }, { "epoch": 0.78, "learning_rate": 1.0826354907452296e-05, "loss": 2.2732, "step": 449270 }, { "epoch": 0.78, "learning_rate": 1.082548296752547e-05, "loss": 2.327, "step": 449280 }, { "epoch": 0.78, "learning_rate": 1.0824611027598642e-05, "loss": 2.2776, "step": 449290 }, { "epoch": 0.78, "learning_rate": 1.0823739087671816e-05, "loss": 2.321, "step": 449300 }, { "epoch": 0.78, "learning_rate": 1.082286714774499e-05, "loss": 2.3378, "step": 449310 }, { "epoch": 0.78, "learning_rate": 1.0821995207818164e-05, "loss": 2.3567, "step": 449320 }, { "epoch": 0.78, "learning_rate": 1.0821123267891337e-05, "loss": 2.258, "step": 449330 }, { "epoch": 0.78, "learning_rate": 1.082025132796451e-05, "loss": 2.3548, "step": 449340 }, { "epoch": 0.78, "learning_rate": 1.0819379388037683e-05, "loss": 2.3303, "step": 449350 }, { "epoch": 0.78, "learning_rate": 1.0818507448110855e-05, "loss": 2.2754, "step": 449360 }, { "epoch": 0.78, "learning_rate": 1.0817635508184029e-05, "loss": 2.2137, "step": 449370 }, { "epoch": 0.78, "learning_rate": 1.0816763568257201e-05, "loss": 2.2348, "step": 449380 }, { "epoch": 0.78, "learning_rate": 1.0815891628330375e-05, "loss": 2.4426, "step": 449390 }, { "epoch": 0.78, "learning_rate": 1.0815019688403549e-05, "loss": 2.2729, "step": 449400 }, { "epoch": 0.78, "learning_rate": 1.0814147748476722e-05, "loss": 2.2749, "step": 449410 }, { "epoch": 0.78, "learning_rate": 1.0813275808549894e-05, "loss": 2.3461, "step": 449420 }, { "epoch": 0.78, "learning_rate": 1.0812403868623068e-05, "loss": 2.3582, "step": 449430 }, { "epoch": 0.78, "learning_rate": 1.081153192869624e-05, "loss": 2.3003, "step": 449440 }, { "epoch": 0.78, "learning_rate": 1.0810659988769414e-05, "loss": 2.3169, "step": 449450 }, { "epoch": 0.78, "learning_rate": 1.0809788048842586e-05, "loss": 2.2189, "step": 449460 }, { "epoch": 0.78, "learning_rate": 1.080891610891576e-05, "loss": 2.3281, "step": 449470 }, { "epoch": 0.78, "learning_rate": 1.0808044168988934e-05, "loss": 2.3016, "step": 449480 }, { "epoch": 0.78, "learning_rate": 1.0807172229062107e-05, "loss": 2.2522, "step": 449490 }, { "epoch": 0.78, "learning_rate": 1.0806300289135281e-05, "loss": 2.1331, "step": 449500 }, { "epoch": 0.78, "learning_rate": 1.0805428349208453e-05, "loss": 2.3617, "step": 449510 }, { "epoch": 0.78, "learning_rate": 1.0804556409281627e-05, "loss": 2.1801, "step": 449520 }, { "epoch": 0.78, "learning_rate": 1.0803684469354799e-05, "loss": 2.3151, "step": 449530 }, { "epoch": 0.78, "learning_rate": 1.0802812529427973e-05, "loss": 2.3262, "step": 449540 }, { "epoch": 0.78, "learning_rate": 1.0801940589501145e-05, "loss": 2.2605, "step": 449550 }, { "epoch": 0.78, "learning_rate": 1.080106864957432e-05, "loss": 2.3488, "step": 449560 }, { "epoch": 0.78, "learning_rate": 1.0800196709647493e-05, "loss": 2.3618, "step": 449570 }, { "epoch": 0.78, "learning_rate": 1.0799324769720666e-05, "loss": 2.2361, "step": 449580 }, { "epoch": 0.78, "learning_rate": 1.0798452829793838e-05, "loss": 2.2158, "step": 449590 }, { "epoch": 0.78, "learning_rate": 1.0797580889867012e-05, "loss": 2.2754, "step": 449600 }, { "epoch": 0.78, "learning_rate": 1.0796708949940186e-05, "loss": 2.1509, "step": 449610 }, { "epoch": 0.78, "learning_rate": 1.0795837010013358e-05, "loss": 2.39, "step": 449620 }, { "epoch": 0.78, "learning_rate": 1.0794965070086532e-05, "loss": 2.3359, "step": 449630 }, { "epoch": 0.78, "learning_rate": 1.0794093130159706e-05, "loss": 2.3593, "step": 449640 }, { "epoch": 0.78, "learning_rate": 1.079322119023288e-05, "loss": 2.3454, "step": 449650 }, { "epoch": 0.78, "learning_rate": 1.0792349250306051e-05, "loss": 2.2673, "step": 449660 }, { "epoch": 0.78, "learning_rate": 1.0791477310379225e-05, "loss": 2.2401, "step": 449670 }, { "epoch": 0.78, "learning_rate": 1.0790605370452397e-05, "loss": 2.2842, "step": 449680 }, { "epoch": 0.78, "learning_rate": 1.0789733430525571e-05, "loss": 2.2947, "step": 449690 }, { "epoch": 0.78, "learning_rate": 1.0788861490598743e-05, "loss": 2.2988, "step": 449700 }, { "epoch": 0.78, "learning_rate": 1.0787989550671917e-05, "loss": 2.3312, "step": 449710 }, { "epoch": 0.78, "learning_rate": 1.078711761074509e-05, "loss": 2.2716, "step": 449720 }, { "epoch": 0.78, "learning_rate": 1.0786245670818264e-05, "loss": 2.3822, "step": 449730 }, { "epoch": 0.78, "learning_rate": 1.0785373730891438e-05, "loss": 2.3064, "step": 449740 }, { "epoch": 0.78, "learning_rate": 1.078450179096461e-05, "loss": 2.2458, "step": 449750 }, { "epoch": 0.78, "learning_rate": 1.0783629851037784e-05, "loss": 2.4669, "step": 449760 }, { "epoch": 0.78, "learning_rate": 1.0782757911110956e-05, "loss": 2.3021, "step": 449770 }, { "epoch": 0.78, "learning_rate": 1.078188597118413e-05, "loss": 2.3231, "step": 449780 }, { "epoch": 0.78, "learning_rate": 1.0781014031257302e-05, "loss": 2.3044, "step": 449790 }, { "epoch": 0.78, "learning_rate": 1.0780142091330477e-05, "loss": 2.2474, "step": 449800 }, { "epoch": 0.78, "learning_rate": 1.077927015140365e-05, "loss": 2.3739, "step": 449810 }, { "epoch": 0.78, "learning_rate": 1.0778398211476823e-05, "loss": 2.3696, "step": 449820 }, { "epoch": 0.78, "learning_rate": 1.0777526271549995e-05, "loss": 2.2697, "step": 449830 }, { "epoch": 0.78, "learning_rate": 1.0776654331623169e-05, "loss": 2.3265, "step": 449840 }, { "epoch": 0.78, "learning_rate": 1.0775782391696341e-05, "loss": 2.2406, "step": 449850 }, { "epoch": 0.78, "learning_rate": 1.0774910451769515e-05, "loss": 2.2847, "step": 449860 }, { "epoch": 0.78, "learning_rate": 1.0774038511842689e-05, "loss": 2.3965, "step": 449870 }, { "epoch": 0.78, "learning_rate": 1.0773166571915862e-05, "loss": 2.3005, "step": 449880 }, { "epoch": 0.78, "learning_rate": 1.0772294631989036e-05, "loss": 2.3411, "step": 449890 }, { "epoch": 0.78, "learning_rate": 1.0771422692062208e-05, "loss": 2.3527, "step": 449900 }, { "epoch": 0.78, "learning_rate": 1.0770550752135382e-05, "loss": 2.371, "step": 449910 }, { "epoch": 0.78, "learning_rate": 1.0769678812208554e-05, "loss": 2.3902, "step": 449920 }, { "epoch": 0.78, "learning_rate": 1.0768806872281728e-05, "loss": 2.3924, "step": 449930 }, { "epoch": 0.78, "learning_rate": 1.07679349323549e-05, "loss": 2.2465, "step": 449940 }, { "epoch": 0.78, "learning_rate": 1.0767062992428074e-05, "loss": 2.4209, "step": 449950 }, { "epoch": 0.78, "learning_rate": 1.0766191052501248e-05, "loss": 2.2868, "step": 449960 }, { "epoch": 0.78, "learning_rate": 1.0765319112574421e-05, "loss": 2.2233, "step": 449970 }, { "epoch": 0.78, "learning_rate": 1.0764447172647593e-05, "loss": 2.294, "step": 449980 }, { "epoch": 0.78, "learning_rate": 1.0763575232720767e-05, "loss": 2.2497, "step": 449990 }, { "epoch": 0.78, "learning_rate": 1.0762703292793941e-05, "loss": 2.2802, "step": 450000 }, { "epoch": 0.78, "learning_rate": 1.0761831352867113e-05, "loss": 2.3855, "step": 450010 }, { "epoch": 0.78, "learning_rate": 1.0760959412940287e-05, "loss": 2.2662, "step": 450020 }, { "epoch": 0.78, "learning_rate": 1.0760087473013459e-05, "loss": 2.3497, "step": 450030 }, { "epoch": 0.78, "learning_rate": 1.0759215533086634e-05, "loss": 2.2592, "step": 450040 }, { "epoch": 0.78, "learning_rate": 1.0758343593159806e-05, "loss": 2.284, "step": 450050 }, { "epoch": 0.78, "learning_rate": 1.075747165323298e-05, "loss": 2.3896, "step": 450060 }, { "epoch": 0.78, "learning_rate": 1.0756599713306152e-05, "loss": 2.2608, "step": 450070 }, { "epoch": 0.78, "learning_rate": 1.0755727773379326e-05, "loss": 2.2361, "step": 450080 }, { "epoch": 0.78, "learning_rate": 1.0754855833452498e-05, "loss": 2.1684, "step": 450090 }, { "epoch": 0.78, "learning_rate": 1.0753983893525672e-05, "loss": 2.2717, "step": 450100 }, { "epoch": 0.78, "learning_rate": 1.0753111953598846e-05, "loss": 2.3537, "step": 450110 }, { "epoch": 0.78, "learning_rate": 1.075224001367202e-05, "loss": 2.2698, "step": 450120 }, { "epoch": 0.78, "learning_rate": 1.0751368073745193e-05, "loss": 2.3842, "step": 450130 }, { "epoch": 0.78, "learning_rate": 1.0750496133818365e-05, "loss": 2.198, "step": 450140 }, { "epoch": 0.79, "learning_rate": 1.0749624193891539e-05, "loss": 2.346, "step": 450150 }, { "epoch": 0.79, "learning_rate": 1.0748752253964711e-05, "loss": 2.3203, "step": 450160 }, { "epoch": 0.79, "learning_rate": 1.0747880314037885e-05, "loss": 2.2108, "step": 450170 }, { "epoch": 0.79, "learning_rate": 1.0747008374111057e-05, "loss": 2.2306, "step": 450180 }, { "epoch": 0.79, "learning_rate": 1.074613643418423e-05, "loss": 2.2754, "step": 450190 }, { "epoch": 0.79, "learning_rate": 1.0745264494257404e-05, "loss": 2.1815, "step": 450200 }, { "epoch": 0.79, "learning_rate": 1.0744392554330578e-05, "loss": 2.2219, "step": 450210 }, { "epoch": 0.79, "learning_rate": 1.074352061440375e-05, "loss": 2.3242, "step": 450220 }, { "epoch": 0.79, "learning_rate": 1.0742648674476924e-05, "loss": 2.2676, "step": 450230 }, { "epoch": 0.79, "learning_rate": 1.0741776734550096e-05, "loss": 2.2477, "step": 450240 }, { "epoch": 0.79, "learning_rate": 1.074090479462327e-05, "loss": 2.3049, "step": 450250 }, { "epoch": 0.79, "learning_rate": 1.0740032854696442e-05, "loss": 2.3957, "step": 450260 }, { "epoch": 0.79, "learning_rate": 1.0739160914769616e-05, "loss": 2.2668, "step": 450270 }, { "epoch": 0.79, "learning_rate": 1.073828897484279e-05, "loss": 2.3204, "step": 450280 }, { "epoch": 0.79, "learning_rate": 1.0737417034915963e-05, "loss": 2.1676, "step": 450290 }, { "epoch": 0.79, "learning_rate": 1.0736545094989137e-05, "loss": 2.1814, "step": 450300 }, { "epoch": 0.79, "learning_rate": 1.0735673155062309e-05, "loss": 2.3295, "step": 450310 }, { "epoch": 0.79, "learning_rate": 1.0734801215135483e-05, "loss": 2.2568, "step": 450320 }, { "epoch": 0.79, "learning_rate": 1.0733929275208655e-05, "loss": 2.2412, "step": 450330 }, { "epoch": 0.79, "learning_rate": 1.0733057335281829e-05, "loss": 2.2534, "step": 450340 }, { "epoch": 0.79, "learning_rate": 1.0732185395355003e-05, "loss": 2.2497, "step": 450350 }, { "epoch": 0.79, "learning_rate": 1.0731313455428176e-05, "loss": 2.2187, "step": 450360 }, { "epoch": 0.79, "learning_rate": 1.0730441515501348e-05, "loss": 2.1791, "step": 450370 }, { "epoch": 0.79, "learning_rate": 1.0729569575574522e-05, "loss": 2.2016, "step": 450380 }, { "epoch": 0.79, "learning_rate": 1.0728697635647694e-05, "loss": 2.2771, "step": 450390 }, { "epoch": 0.79, "learning_rate": 1.0727825695720868e-05, "loss": 2.4166, "step": 450400 }, { "epoch": 0.79, "learning_rate": 1.0726953755794042e-05, "loss": 2.3865, "step": 450410 }, { "epoch": 0.79, "learning_rate": 1.0726081815867214e-05, "loss": 2.2444, "step": 450420 }, { "epoch": 0.79, "learning_rate": 1.0725209875940388e-05, "loss": 2.2878, "step": 450430 }, { "epoch": 0.79, "learning_rate": 1.0724337936013561e-05, "loss": 2.3997, "step": 450440 }, { "epoch": 0.79, "learning_rate": 1.0723465996086735e-05, "loss": 2.2708, "step": 450450 }, { "epoch": 0.79, "learning_rate": 1.0722594056159907e-05, "loss": 2.3768, "step": 450460 }, { "epoch": 0.79, "learning_rate": 1.0721722116233081e-05, "loss": 2.2351, "step": 450470 }, { "epoch": 0.79, "learning_rate": 1.0720850176306253e-05, "loss": 2.3214, "step": 450480 }, { "epoch": 0.79, "learning_rate": 1.0719978236379427e-05, "loss": 2.1862, "step": 450490 }, { "epoch": 0.79, "learning_rate": 1.0719106296452599e-05, "loss": 2.1891, "step": 450500 }, { "epoch": 0.79, "learning_rate": 1.0718234356525773e-05, "loss": 2.3988, "step": 450510 }, { "epoch": 0.79, "learning_rate": 1.0717362416598946e-05, "loss": 2.2365, "step": 450520 }, { "epoch": 0.79, "learning_rate": 1.071649047667212e-05, "loss": 2.3106, "step": 450530 }, { "epoch": 0.79, "learning_rate": 1.0715618536745294e-05, "loss": 2.3045, "step": 450540 }, { "epoch": 0.79, "learning_rate": 1.0714746596818466e-05, "loss": 2.2453, "step": 450550 }, { "epoch": 0.79, "learning_rate": 1.071387465689164e-05, "loss": 2.2847, "step": 450560 }, { "epoch": 0.79, "learning_rate": 1.0713002716964812e-05, "loss": 2.2715, "step": 450570 }, { "epoch": 0.79, "learning_rate": 1.0712130777037986e-05, "loss": 2.2767, "step": 450580 }, { "epoch": 0.79, "learning_rate": 1.0711258837111158e-05, "loss": 2.2663, "step": 450590 }, { "epoch": 0.79, "learning_rate": 1.0710386897184333e-05, "loss": 2.2989, "step": 450600 }, { "epoch": 0.79, "learning_rate": 1.0709514957257505e-05, "loss": 2.331, "step": 450610 }, { "epoch": 0.79, "learning_rate": 1.0708643017330679e-05, "loss": 2.3558, "step": 450620 }, { "epoch": 0.79, "learning_rate": 1.0707771077403851e-05, "loss": 2.1973, "step": 450630 }, { "epoch": 0.79, "learning_rate": 1.0706899137477025e-05, "loss": 2.3248, "step": 450640 }, { "epoch": 0.79, "learning_rate": 1.0706027197550197e-05, "loss": 2.3293, "step": 450650 }, { "epoch": 0.79, "learning_rate": 1.070515525762337e-05, "loss": 2.3976, "step": 450660 }, { "epoch": 0.79, "learning_rate": 1.0704283317696545e-05, "loss": 2.3094, "step": 450670 }, { "epoch": 0.79, "learning_rate": 1.0703411377769718e-05, "loss": 2.3532, "step": 450680 }, { "epoch": 0.79, "learning_rate": 1.0702539437842892e-05, "loss": 2.3697, "step": 450690 }, { "epoch": 0.79, "learning_rate": 1.0701667497916064e-05, "loss": 2.4347, "step": 450700 }, { "epoch": 0.79, "learning_rate": 1.0700795557989238e-05, "loss": 2.3374, "step": 450710 }, { "epoch": 0.79, "learning_rate": 1.069992361806241e-05, "loss": 2.2787, "step": 450720 }, { "epoch": 0.79, "learning_rate": 1.0699051678135584e-05, "loss": 2.323, "step": 450730 }, { "epoch": 0.79, "learning_rate": 1.0698179738208756e-05, "loss": 2.3431, "step": 450740 }, { "epoch": 0.79, "learning_rate": 1.069730779828193e-05, "loss": 2.3029, "step": 450750 }, { "epoch": 0.79, "learning_rate": 1.0696435858355103e-05, "loss": 2.3509, "step": 450760 }, { "epoch": 0.79, "learning_rate": 1.0695563918428277e-05, "loss": 2.4273, "step": 450770 }, { "epoch": 0.79, "learning_rate": 1.069469197850145e-05, "loss": 2.2018, "step": 450780 }, { "epoch": 0.79, "learning_rate": 1.0693820038574623e-05, "loss": 2.1855, "step": 450790 }, { "epoch": 0.79, "learning_rate": 1.0692948098647797e-05, "loss": 2.2757, "step": 450800 }, { "epoch": 0.79, "learning_rate": 1.0692076158720969e-05, "loss": 2.2735, "step": 450810 }, { "epoch": 0.79, "learning_rate": 1.0691204218794143e-05, "loss": 2.4053, "step": 450820 }, { "epoch": 0.79, "learning_rate": 1.0690332278867315e-05, "loss": 2.2096, "step": 450830 }, { "epoch": 0.79, "learning_rate": 1.068946033894049e-05, "loss": 2.3292, "step": 450840 }, { "epoch": 0.79, "learning_rate": 1.0688588399013662e-05, "loss": 2.3046, "step": 450850 }, { "epoch": 0.79, "learning_rate": 1.0687716459086836e-05, "loss": 2.2382, "step": 450860 }, { "epoch": 0.79, "learning_rate": 1.0686844519160008e-05, "loss": 2.2304, "step": 450870 }, { "epoch": 0.79, "learning_rate": 1.0685972579233182e-05, "loss": 2.2396, "step": 450880 }, { "epoch": 0.79, "learning_rate": 1.0685100639306354e-05, "loss": 2.2996, "step": 450890 }, { "epoch": 0.79, "learning_rate": 1.0684228699379528e-05, "loss": 2.233, "step": 450900 }, { "epoch": 0.79, "learning_rate": 1.0683356759452701e-05, "loss": 2.3296, "step": 450910 }, { "epoch": 0.79, "learning_rate": 1.0682484819525875e-05, "loss": 2.3448, "step": 450920 }, { "epoch": 0.79, "learning_rate": 1.0681612879599049e-05, "loss": 2.2208, "step": 450930 }, { "epoch": 0.79, "learning_rate": 1.0680740939672221e-05, "loss": 2.326, "step": 450940 }, { "epoch": 0.79, "learning_rate": 1.0679868999745395e-05, "loss": 2.3926, "step": 450950 }, { "epoch": 0.79, "learning_rate": 1.0678997059818567e-05, "loss": 2.1418, "step": 450960 }, { "epoch": 0.79, "learning_rate": 1.067812511989174e-05, "loss": 2.3779, "step": 450970 }, { "epoch": 0.79, "learning_rate": 1.0677253179964913e-05, "loss": 2.307, "step": 450980 }, { "epoch": 0.79, "learning_rate": 1.0676381240038087e-05, "loss": 2.2993, "step": 450990 }, { "epoch": 0.79, "learning_rate": 1.067550930011126e-05, "loss": 2.2492, "step": 451000 }, { "epoch": 0.79, "learning_rate": 1.0674637360184434e-05, "loss": 2.2619, "step": 451010 }, { "epoch": 0.79, "learning_rate": 1.0673765420257606e-05, "loss": 2.3215, "step": 451020 }, { "epoch": 0.79, "learning_rate": 1.067289348033078e-05, "loss": 2.3279, "step": 451030 }, { "epoch": 0.79, "learning_rate": 1.0672021540403952e-05, "loss": 2.2973, "step": 451040 }, { "epoch": 0.79, "learning_rate": 1.0671149600477126e-05, "loss": 2.3695, "step": 451050 }, { "epoch": 0.79, "learning_rate": 1.06702776605503e-05, "loss": 2.367, "step": 451060 }, { "epoch": 0.79, "learning_rate": 1.0669405720623472e-05, "loss": 2.282, "step": 451070 }, { "epoch": 0.79, "learning_rate": 1.0668533780696647e-05, "loss": 2.4045, "step": 451080 }, { "epoch": 0.79, "learning_rate": 1.0667661840769819e-05, "loss": 2.2837, "step": 451090 }, { "epoch": 0.79, "learning_rate": 1.0666789900842993e-05, "loss": 2.2095, "step": 451100 }, { "epoch": 0.79, "learning_rate": 1.0665917960916165e-05, "loss": 2.3161, "step": 451110 }, { "epoch": 0.79, "learning_rate": 1.0665046020989339e-05, "loss": 2.2393, "step": 451120 }, { "epoch": 0.79, "learning_rate": 1.066417408106251e-05, "loss": 2.3892, "step": 451130 }, { "epoch": 0.79, "learning_rate": 1.0663302141135685e-05, "loss": 2.3358, "step": 451140 }, { "epoch": 0.79, "learning_rate": 1.0662430201208858e-05, "loss": 2.2544, "step": 451150 }, { "epoch": 0.79, "learning_rate": 1.0661558261282032e-05, "loss": 2.2247, "step": 451160 }, { "epoch": 0.79, "learning_rate": 1.0660686321355204e-05, "loss": 2.2466, "step": 451170 }, { "epoch": 0.79, "learning_rate": 1.0659814381428378e-05, "loss": 2.199, "step": 451180 }, { "epoch": 0.79, "learning_rate": 1.065894244150155e-05, "loss": 2.2166, "step": 451190 }, { "epoch": 0.79, "learning_rate": 1.0658070501574724e-05, "loss": 2.2486, "step": 451200 }, { "epoch": 0.79, "learning_rate": 1.0657198561647898e-05, "loss": 2.3837, "step": 451210 }, { "epoch": 0.79, "learning_rate": 1.065632662172107e-05, "loss": 2.2161, "step": 451220 }, { "epoch": 0.79, "learning_rate": 1.0655454681794243e-05, "loss": 2.1949, "step": 451230 }, { "epoch": 0.79, "learning_rate": 1.0654582741867417e-05, "loss": 2.3243, "step": 451240 }, { "epoch": 0.79, "learning_rate": 1.0653710801940591e-05, "loss": 2.2487, "step": 451250 }, { "epoch": 0.79, "learning_rate": 1.0652838862013763e-05, "loss": 2.3385, "step": 451260 }, { "epoch": 0.79, "learning_rate": 1.0651966922086937e-05, "loss": 2.2253, "step": 451270 }, { "epoch": 0.79, "learning_rate": 1.0651094982160109e-05, "loss": 2.1901, "step": 451280 }, { "epoch": 0.79, "learning_rate": 1.0650223042233283e-05, "loss": 2.3437, "step": 451290 }, { "epoch": 0.79, "learning_rate": 1.0649351102306455e-05, "loss": 2.4116, "step": 451300 }, { "epoch": 0.79, "learning_rate": 1.0648479162379629e-05, "loss": 2.3056, "step": 451310 }, { "epoch": 0.79, "learning_rate": 1.0647607222452802e-05, "loss": 2.3883, "step": 451320 }, { "epoch": 0.79, "learning_rate": 1.0646735282525976e-05, "loss": 2.2487, "step": 451330 }, { "epoch": 0.79, "learning_rate": 1.064586334259915e-05, "loss": 2.2987, "step": 451340 }, { "epoch": 0.79, "learning_rate": 1.0644991402672322e-05, "loss": 2.4565, "step": 451350 }, { "epoch": 0.79, "learning_rate": 1.0644119462745496e-05, "loss": 2.2087, "step": 451360 }, { "epoch": 0.79, "learning_rate": 1.0643247522818668e-05, "loss": 2.3303, "step": 451370 }, { "epoch": 0.79, "learning_rate": 1.0642375582891842e-05, "loss": 2.2096, "step": 451380 }, { "epoch": 0.79, "learning_rate": 1.0641503642965015e-05, "loss": 2.2762, "step": 451390 }, { "epoch": 0.79, "learning_rate": 1.0640631703038189e-05, "loss": 2.2706, "step": 451400 }, { "epoch": 0.79, "learning_rate": 1.0639759763111361e-05, "loss": 2.0764, "step": 451410 }, { "epoch": 0.79, "learning_rate": 1.0638887823184535e-05, "loss": 2.1351, "step": 451420 }, { "epoch": 0.79, "learning_rate": 1.0638015883257707e-05, "loss": 2.2237, "step": 451430 }, { "epoch": 0.79, "learning_rate": 1.063714394333088e-05, "loss": 2.2377, "step": 451440 }, { "epoch": 0.79, "learning_rate": 1.0636272003404053e-05, "loss": 2.3044, "step": 451450 }, { "epoch": 0.79, "learning_rate": 1.0635400063477227e-05, "loss": 2.3862, "step": 451460 }, { "epoch": 0.79, "learning_rate": 1.06345281235504e-05, "loss": 2.2312, "step": 451470 }, { "epoch": 0.79, "learning_rate": 1.0633656183623574e-05, "loss": 2.3081, "step": 451480 }, { "epoch": 0.79, "learning_rate": 1.0632784243696748e-05, "loss": 2.2366, "step": 451490 }, { "epoch": 0.79, "learning_rate": 1.063191230376992e-05, "loss": 2.2242, "step": 451500 }, { "epoch": 0.79, "learning_rate": 1.0631040363843094e-05, "loss": 2.2917, "step": 451510 }, { "epoch": 0.79, "learning_rate": 1.0630168423916266e-05, "loss": 2.3697, "step": 451520 }, { "epoch": 0.79, "learning_rate": 1.062929648398944e-05, "loss": 2.2877, "step": 451530 }, { "epoch": 0.79, "learning_rate": 1.0628424544062612e-05, "loss": 2.3335, "step": 451540 }, { "epoch": 0.79, "learning_rate": 1.0627552604135785e-05, "loss": 2.2675, "step": 451550 }, { "epoch": 0.79, "learning_rate": 1.062668066420896e-05, "loss": 2.3623, "step": 451560 }, { "epoch": 0.79, "learning_rate": 1.0625808724282133e-05, "loss": 2.2991, "step": 451570 }, { "epoch": 0.79, "learning_rate": 1.0624936784355305e-05, "loss": 2.286, "step": 451580 }, { "epoch": 0.79, "learning_rate": 1.0624064844428479e-05, "loss": 2.2107, "step": 451590 }, { "epoch": 0.79, "learning_rate": 1.0623192904501653e-05, "loss": 2.3226, "step": 451600 }, { "epoch": 0.79, "learning_rate": 1.0622320964574825e-05, "loss": 2.2885, "step": 451610 }, { "epoch": 0.79, "learning_rate": 1.0621449024647998e-05, "loss": 2.2379, "step": 451620 }, { "epoch": 0.79, "learning_rate": 1.062057708472117e-05, "loss": 2.3277, "step": 451630 }, { "epoch": 0.79, "learning_rate": 1.0619705144794346e-05, "loss": 2.3705, "step": 451640 }, { "epoch": 0.79, "learning_rate": 1.0618833204867518e-05, "loss": 2.3136, "step": 451650 }, { "epoch": 0.79, "learning_rate": 1.0617961264940692e-05, "loss": 2.1707, "step": 451660 }, { "epoch": 0.79, "learning_rate": 1.0617089325013864e-05, "loss": 2.2198, "step": 451670 }, { "epoch": 0.79, "learning_rate": 1.0616217385087038e-05, "loss": 2.3085, "step": 451680 }, { "epoch": 0.79, "learning_rate": 1.061534544516021e-05, "loss": 2.2149, "step": 451690 }, { "epoch": 0.79, "learning_rate": 1.0614473505233384e-05, "loss": 2.242, "step": 451700 }, { "epoch": 0.79, "learning_rate": 1.0613601565306557e-05, "loss": 2.3309, "step": 451710 }, { "epoch": 0.79, "learning_rate": 1.0612729625379731e-05, "loss": 2.223, "step": 451720 }, { "epoch": 0.79, "learning_rate": 1.0611857685452905e-05, "loss": 2.2953, "step": 451730 }, { "epoch": 0.79, "learning_rate": 1.0610985745526077e-05, "loss": 2.3243, "step": 451740 }, { "epoch": 0.79, "learning_rate": 1.061011380559925e-05, "loss": 2.3607, "step": 451750 }, { "epoch": 0.79, "learning_rate": 1.0609241865672423e-05, "loss": 2.3449, "step": 451760 }, { "epoch": 0.79, "learning_rate": 1.0608369925745597e-05, "loss": 2.2988, "step": 451770 }, { "epoch": 0.79, "learning_rate": 1.0607497985818769e-05, "loss": 2.2436, "step": 451780 }, { "epoch": 0.79, "learning_rate": 1.0606626045891942e-05, "loss": 2.35, "step": 451790 }, { "epoch": 0.79, "learning_rate": 1.0605754105965116e-05, "loss": 2.2338, "step": 451800 }, { "epoch": 0.79, "learning_rate": 1.060488216603829e-05, "loss": 2.2637, "step": 451810 }, { "epoch": 0.79, "learning_rate": 1.0604010226111462e-05, "loss": 2.247, "step": 451820 }, { "epoch": 0.79, "learning_rate": 1.0603138286184636e-05, "loss": 2.2722, "step": 451830 }, { "epoch": 0.79, "learning_rate": 1.0602266346257808e-05, "loss": 2.2879, "step": 451840 }, { "epoch": 0.79, "learning_rate": 1.0601394406330982e-05, "loss": 2.3636, "step": 451850 }, { "epoch": 0.79, "learning_rate": 1.0600522466404155e-05, "loss": 2.2544, "step": 451860 }, { "epoch": 0.79, "learning_rate": 1.0599650526477327e-05, "loss": 2.3306, "step": 451870 }, { "epoch": 0.79, "learning_rate": 1.0598778586550503e-05, "loss": 2.3093, "step": 451880 }, { "epoch": 0.79, "learning_rate": 1.0597906646623675e-05, "loss": 2.2767, "step": 451890 }, { "epoch": 0.79, "learning_rate": 1.0597034706696849e-05, "loss": 2.3309, "step": 451900 }, { "epoch": 0.79, "learning_rate": 1.059616276677002e-05, "loss": 2.3273, "step": 451910 }, { "epoch": 0.79, "learning_rate": 1.0595290826843195e-05, "loss": 2.4102, "step": 451920 }, { "epoch": 0.79, "learning_rate": 1.0594418886916367e-05, "loss": 2.1329, "step": 451930 }, { "epoch": 0.79, "learning_rate": 1.059354694698954e-05, "loss": 2.2046, "step": 451940 }, { "epoch": 0.79, "learning_rate": 1.0592675007062714e-05, "loss": 2.2472, "step": 451950 }, { "epoch": 0.79, "learning_rate": 1.0591803067135888e-05, "loss": 2.3142, "step": 451960 }, { "epoch": 0.79, "learning_rate": 1.059093112720906e-05, "loss": 2.3181, "step": 451970 }, { "epoch": 0.79, "learning_rate": 1.0590059187282234e-05, "loss": 2.2984, "step": 451980 }, { "epoch": 0.79, "learning_rate": 1.0589187247355408e-05, "loss": 2.2173, "step": 451990 }, { "epoch": 0.79, "learning_rate": 1.058831530742858e-05, "loss": 2.1415, "step": 452000 }, { "epoch": 0.79, "learning_rate": 1.0587443367501753e-05, "loss": 2.2295, "step": 452010 }, { "epoch": 0.79, "learning_rate": 1.0586571427574926e-05, "loss": 2.2254, "step": 452020 }, { "epoch": 0.79, "learning_rate": 1.05856994876481e-05, "loss": 2.2645, "step": 452030 }, { "epoch": 0.79, "learning_rate": 1.0584827547721273e-05, "loss": 2.2519, "step": 452040 }, { "epoch": 0.79, "learning_rate": 1.0583955607794447e-05, "loss": 2.1762, "step": 452050 }, { "epoch": 0.79, "learning_rate": 1.0583083667867619e-05, "loss": 2.1513, "step": 452060 }, { "epoch": 0.79, "learning_rate": 1.0582211727940793e-05, "loss": 2.4179, "step": 452070 }, { "epoch": 0.79, "learning_rate": 1.0581339788013965e-05, "loss": 2.2772, "step": 452080 }, { "epoch": 0.79, "learning_rate": 1.0580467848087139e-05, "loss": 2.2102, "step": 452090 }, { "epoch": 0.79, "learning_rate": 1.057959590816031e-05, "loss": 2.3593, "step": 452100 }, { "epoch": 0.79, "learning_rate": 1.0578723968233484e-05, "loss": 2.3284, "step": 452110 }, { "epoch": 0.79, "learning_rate": 1.0577852028306658e-05, "loss": 2.2732, "step": 452120 }, { "epoch": 0.79, "learning_rate": 1.0576980088379832e-05, "loss": 2.282, "step": 452130 }, { "epoch": 0.79, "learning_rate": 1.0576108148453006e-05, "loss": 2.2818, "step": 452140 }, { "epoch": 0.79, "learning_rate": 1.0575236208526178e-05, "loss": 2.2902, "step": 452150 }, { "epoch": 0.79, "learning_rate": 1.0574364268599352e-05, "loss": 2.2469, "step": 452160 }, { "epoch": 0.79, "learning_rate": 1.0573492328672524e-05, "loss": 2.2644, "step": 452170 }, { "epoch": 0.79, "learning_rate": 1.0572620388745697e-05, "loss": 2.309, "step": 452180 }, { "epoch": 0.79, "learning_rate": 1.0571748448818871e-05, "loss": 2.2679, "step": 452190 }, { "epoch": 0.79, "learning_rate": 1.0570876508892045e-05, "loss": 2.3388, "step": 452200 }, { "epoch": 0.79, "learning_rate": 1.0570004568965217e-05, "loss": 2.2145, "step": 452210 }, { "epoch": 0.79, "learning_rate": 1.056913262903839e-05, "loss": 2.2889, "step": 452220 }, { "epoch": 0.79, "learning_rate": 1.0568260689111563e-05, "loss": 2.3089, "step": 452230 }, { "epoch": 0.79, "learning_rate": 1.0567388749184737e-05, "loss": 2.3108, "step": 452240 }, { "epoch": 0.79, "learning_rate": 1.0566516809257909e-05, "loss": 2.3201, "step": 452250 }, { "epoch": 0.79, "learning_rate": 1.0565644869331082e-05, "loss": 2.1881, "step": 452260 }, { "epoch": 0.79, "learning_rate": 1.0564772929404256e-05, "loss": 2.3154, "step": 452270 }, { "epoch": 0.79, "learning_rate": 1.056390098947743e-05, "loss": 2.1353, "step": 452280 }, { "epoch": 0.79, "learning_rate": 1.0563029049550604e-05, "loss": 2.3708, "step": 452290 }, { "epoch": 0.79, "learning_rate": 1.0562157109623776e-05, "loss": 2.2985, "step": 452300 }, { "epoch": 0.79, "learning_rate": 1.056128516969695e-05, "loss": 2.3198, "step": 452310 }, { "epoch": 0.79, "learning_rate": 1.0560413229770122e-05, "loss": 2.2688, "step": 452320 }, { "epoch": 0.79, "learning_rate": 1.0559541289843295e-05, "loss": 2.4053, "step": 452330 }, { "epoch": 0.79, "learning_rate": 1.0558669349916468e-05, "loss": 2.245, "step": 452340 }, { "epoch": 0.79, "learning_rate": 1.0557797409989641e-05, "loss": 2.2403, "step": 452350 }, { "epoch": 0.79, "learning_rate": 1.0556925470062815e-05, "loss": 2.3639, "step": 452360 }, { "epoch": 0.79, "learning_rate": 1.0556053530135989e-05, "loss": 2.3416, "step": 452370 }, { "epoch": 0.79, "learning_rate": 1.0555181590209161e-05, "loss": 2.1843, "step": 452380 }, { "epoch": 0.79, "learning_rate": 1.0554309650282335e-05, "loss": 2.3293, "step": 452390 }, { "epoch": 0.79, "learning_rate": 1.0553437710355508e-05, "loss": 2.2337, "step": 452400 }, { "epoch": 0.79, "learning_rate": 1.055256577042868e-05, "loss": 2.2505, "step": 452410 }, { "epoch": 0.79, "learning_rate": 1.0551693830501854e-05, "loss": 2.335, "step": 452420 }, { "epoch": 0.79, "learning_rate": 1.0550821890575028e-05, "loss": 2.3186, "step": 452430 }, { "epoch": 0.79, "learning_rate": 1.0549949950648202e-05, "loss": 2.3046, "step": 452440 }, { "epoch": 0.79, "learning_rate": 1.0549078010721374e-05, "loss": 2.1998, "step": 452450 }, { "epoch": 0.79, "learning_rate": 1.0548206070794548e-05, "loss": 2.3185, "step": 452460 }, { "epoch": 0.79, "learning_rate": 1.054733413086772e-05, "loss": 2.3074, "step": 452470 }, { "epoch": 0.79, "learning_rate": 1.0546462190940894e-05, "loss": 2.2568, "step": 452480 }, { "epoch": 0.79, "learning_rate": 1.0545590251014066e-05, "loss": 2.2233, "step": 452490 }, { "epoch": 0.79, "learning_rate": 1.054471831108724e-05, "loss": 2.343, "step": 452500 }, { "epoch": 0.79, "learning_rate": 1.0543846371160413e-05, "loss": 2.3096, "step": 452510 }, { "epoch": 0.79, "learning_rate": 1.0542974431233587e-05, "loss": 2.3047, "step": 452520 }, { "epoch": 0.79, "learning_rate": 1.054210249130676e-05, "loss": 2.3072, "step": 452530 }, { "epoch": 0.79, "learning_rate": 1.0541230551379933e-05, "loss": 2.3619, "step": 452540 }, { "epoch": 0.79, "learning_rate": 1.0540358611453107e-05, "loss": 2.3085, "step": 452550 }, { "epoch": 0.79, "learning_rate": 1.0539486671526279e-05, "loss": 2.3789, "step": 452560 }, { "epoch": 0.79, "learning_rate": 1.0538614731599452e-05, "loss": 2.1945, "step": 452570 }, { "epoch": 0.79, "learning_rate": 1.0537742791672624e-05, "loss": 2.3497, "step": 452580 }, { "epoch": 0.79, "learning_rate": 1.0536870851745798e-05, "loss": 2.298, "step": 452590 }, { "epoch": 0.79, "learning_rate": 1.0535998911818972e-05, "loss": 2.4094, "step": 452600 }, { "epoch": 0.79, "learning_rate": 1.0535126971892146e-05, "loss": 2.3332, "step": 452610 }, { "epoch": 0.79, "learning_rate": 1.0534255031965318e-05, "loss": 2.2849, "step": 452620 }, { "epoch": 0.79, "learning_rate": 1.0533383092038492e-05, "loss": 2.2324, "step": 452630 }, { "epoch": 0.79, "learning_rate": 1.0532511152111664e-05, "loss": 2.1565, "step": 452640 }, { "epoch": 0.79, "learning_rate": 1.0531639212184837e-05, "loss": 2.276, "step": 452650 }, { "epoch": 0.79, "learning_rate": 1.0530767272258011e-05, "loss": 2.1321, "step": 452660 }, { "epoch": 0.79, "learning_rate": 1.0529895332331183e-05, "loss": 2.2902, "step": 452670 }, { "epoch": 0.79, "learning_rate": 1.0529023392404359e-05, "loss": 2.4007, "step": 452680 }, { "epoch": 0.79, "learning_rate": 1.052815145247753e-05, "loss": 2.2385, "step": 452690 }, { "epoch": 0.79, "learning_rate": 1.0527279512550705e-05, "loss": 2.1755, "step": 452700 }, { "epoch": 0.79, "learning_rate": 1.0526407572623877e-05, "loss": 2.3412, "step": 452710 }, { "epoch": 0.79, "learning_rate": 1.052553563269705e-05, "loss": 2.3553, "step": 452720 }, { "epoch": 0.79, "learning_rate": 1.0524663692770223e-05, "loss": 2.3552, "step": 452730 }, { "epoch": 0.79, "learning_rate": 1.0523791752843396e-05, "loss": 2.3038, "step": 452740 }, { "epoch": 0.79, "learning_rate": 1.052291981291657e-05, "loss": 2.2834, "step": 452750 }, { "epoch": 0.79, "learning_rate": 1.0522047872989744e-05, "loss": 2.3163, "step": 452760 }, { "epoch": 0.79, "learning_rate": 1.0521175933062916e-05, "loss": 2.4166, "step": 452770 }, { "epoch": 0.79, "learning_rate": 1.052030399313609e-05, "loss": 2.1991, "step": 452780 }, { "epoch": 0.79, "learning_rate": 1.0519432053209263e-05, "loss": 2.2902, "step": 452790 }, { "epoch": 0.79, "learning_rate": 1.0518560113282436e-05, "loss": 2.2797, "step": 452800 }, { "epoch": 0.79, "learning_rate": 1.051768817335561e-05, "loss": 2.3774, "step": 452810 }, { "epoch": 0.79, "learning_rate": 1.0516816233428781e-05, "loss": 2.2566, "step": 452820 }, { "epoch": 0.79, "learning_rate": 1.0515944293501955e-05, "loss": 2.2583, "step": 452830 }, { "epoch": 0.79, "learning_rate": 1.0515072353575129e-05, "loss": 2.4059, "step": 452840 }, { "epoch": 0.79, "learning_rate": 1.0514200413648303e-05, "loss": 2.3052, "step": 452850 }, { "epoch": 0.79, "learning_rate": 1.0513328473721475e-05, "loss": 2.2644, "step": 452860 }, { "epoch": 0.79, "learning_rate": 1.0512456533794649e-05, "loss": 2.3236, "step": 452870 }, { "epoch": 0.79, "learning_rate": 1.051158459386782e-05, "loss": 2.2617, "step": 452880 }, { "epoch": 0.79, "learning_rate": 1.0510712653940994e-05, "loss": 2.2539, "step": 452890 }, { "epoch": 0.79, "learning_rate": 1.0509840714014166e-05, "loss": 2.292, "step": 452900 }, { "epoch": 0.79, "learning_rate": 1.050896877408734e-05, "loss": 2.2064, "step": 452910 }, { "epoch": 0.79, "learning_rate": 1.0508096834160514e-05, "loss": 2.308, "step": 452920 }, { "epoch": 0.79, "learning_rate": 1.0507224894233688e-05, "loss": 2.2915, "step": 452930 }, { "epoch": 0.79, "learning_rate": 1.0506352954306862e-05, "loss": 2.2012, "step": 452940 }, { "epoch": 0.79, "learning_rate": 1.0505481014380034e-05, "loss": 2.3145, "step": 452950 }, { "epoch": 0.79, "learning_rate": 1.0504609074453207e-05, "loss": 2.3252, "step": 452960 }, { "epoch": 0.79, "learning_rate": 1.050373713452638e-05, "loss": 2.235, "step": 452970 }, { "epoch": 0.79, "learning_rate": 1.0502865194599553e-05, "loss": 2.2096, "step": 452980 }, { "epoch": 0.79, "learning_rate": 1.0501993254672727e-05, "loss": 2.2575, "step": 452990 }, { "epoch": 0.79, "learning_rate": 1.05011213147459e-05, "loss": 2.3625, "step": 453000 }, { "epoch": 0.79, "learning_rate": 1.0500249374819073e-05, "loss": 2.2595, "step": 453010 }, { "epoch": 0.79, "learning_rate": 1.0499377434892247e-05, "loss": 2.3905, "step": 453020 }, { "epoch": 0.79, "learning_rate": 1.0498505494965419e-05, "loss": 2.3253, "step": 453030 }, { "epoch": 0.79, "learning_rate": 1.0497633555038592e-05, "loss": 2.3007, "step": 453040 }, { "epoch": 0.79, "learning_rate": 1.0496761615111765e-05, "loss": 2.3192, "step": 453050 }, { "epoch": 0.79, "learning_rate": 1.0495889675184938e-05, "loss": 2.1549, "step": 453060 }, { "epoch": 0.79, "learning_rate": 1.0495017735258112e-05, "loss": 2.2492, "step": 453070 }, { "epoch": 0.79, "learning_rate": 1.0494145795331286e-05, "loss": 2.1885, "step": 453080 }, { "epoch": 0.79, "learning_rate": 1.049327385540446e-05, "loss": 2.2944, "step": 453090 }, { "epoch": 0.79, "learning_rate": 1.0492401915477632e-05, "loss": 2.2835, "step": 453100 }, { "epoch": 0.79, "learning_rate": 1.0491529975550805e-05, "loss": 2.3707, "step": 453110 }, { "epoch": 0.79, "learning_rate": 1.0490658035623978e-05, "loss": 2.224, "step": 453120 }, { "epoch": 0.79, "learning_rate": 1.0489786095697151e-05, "loss": 2.3236, "step": 453130 }, { "epoch": 0.79, "learning_rate": 1.0488914155770323e-05, "loss": 2.1553, "step": 453140 }, { "epoch": 0.79, "learning_rate": 1.0488042215843497e-05, "loss": 2.2136, "step": 453150 }, { "epoch": 0.79, "learning_rate": 1.0487170275916671e-05, "loss": 2.2753, "step": 453160 }, { "epoch": 0.79, "learning_rate": 1.0486298335989845e-05, "loss": 2.2864, "step": 453170 }, { "epoch": 0.79, "learning_rate": 1.0485426396063017e-05, "loss": 2.2853, "step": 453180 }, { "epoch": 0.79, "learning_rate": 1.048455445613619e-05, "loss": 2.3571, "step": 453190 }, { "epoch": 0.79, "learning_rate": 1.0483682516209364e-05, "loss": 2.2903, "step": 453200 }, { "epoch": 0.79, "learning_rate": 1.0482810576282536e-05, "loss": 2.2756, "step": 453210 }, { "epoch": 0.79, "learning_rate": 1.048193863635571e-05, "loss": 2.2264, "step": 453220 }, { "epoch": 0.79, "learning_rate": 1.0481066696428884e-05, "loss": 2.2601, "step": 453230 }, { "epoch": 0.79, "learning_rate": 1.0480194756502058e-05, "loss": 2.2023, "step": 453240 }, { "epoch": 0.79, "learning_rate": 1.047932281657523e-05, "loss": 2.4168, "step": 453250 }, { "epoch": 0.79, "learning_rate": 1.0478450876648404e-05, "loss": 2.3077, "step": 453260 }, { "epoch": 0.79, "learning_rate": 1.0477578936721576e-05, "loss": 2.3765, "step": 453270 }, { "epoch": 0.79, "learning_rate": 1.047670699679475e-05, "loss": 2.2408, "step": 453280 }, { "epoch": 0.79, "learning_rate": 1.0475835056867921e-05, "loss": 2.2858, "step": 453290 }, { "epoch": 0.79, "learning_rate": 1.0474963116941095e-05, "loss": 2.2378, "step": 453300 }, { "epoch": 0.79, "learning_rate": 1.0474091177014269e-05, "loss": 2.1564, "step": 453310 }, { "epoch": 0.79, "learning_rate": 1.0473219237087443e-05, "loss": 2.3288, "step": 453320 }, { "epoch": 0.79, "learning_rate": 1.0472347297160617e-05, "loss": 2.2816, "step": 453330 }, { "epoch": 0.79, "learning_rate": 1.0471475357233789e-05, "loss": 2.3118, "step": 453340 }, { "epoch": 0.79, "learning_rate": 1.0470603417306962e-05, "loss": 2.3097, "step": 453350 }, { "epoch": 0.79, "learning_rate": 1.0469731477380134e-05, "loss": 2.3308, "step": 453360 }, { "epoch": 0.79, "learning_rate": 1.0468859537453308e-05, "loss": 2.3783, "step": 453370 }, { "epoch": 0.79, "learning_rate": 1.046798759752648e-05, "loss": 2.2155, "step": 453380 }, { "epoch": 0.79, "learning_rate": 1.0467115657599654e-05, "loss": 2.3847, "step": 453390 }, { "epoch": 0.79, "learning_rate": 1.0466243717672828e-05, "loss": 2.2966, "step": 453400 }, { "epoch": 0.79, "learning_rate": 1.0465371777746002e-05, "loss": 2.2489, "step": 453410 }, { "epoch": 0.79, "learning_rate": 1.0464499837819174e-05, "loss": 2.3314, "step": 453420 }, { "epoch": 0.79, "learning_rate": 1.0463627897892347e-05, "loss": 2.3311, "step": 453430 }, { "epoch": 0.79, "learning_rate": 1.046275595796552e-05, "loss": 2.2792, "step": 453440 }, { "epoch": 0.79, "learning_rate": 1.0461884018038693e-05, "loss": 2.271, "step": 453450 }, { "epoch": 0.79, "learning_rate": 1.0461012078111867e-05, "loss": 2.3909, "step": 453460 }, { "epoch": 0.79, "learning_rate": 1.046014013818504e-05, "loss": 2.2059, "step": 453470 }, { "epoch": 0.79, "learning_rate": 1.0459268198258215e-05, "loss": 2.3837, "step": 453480 }, { "epoch": 0.79, "learning_rate": 1.0458396258331387e-05, "loss": 2.3049, "step": 453490 }, { "epoch": 0.79, "learning_rate": 1.045752431840456e-05, "loss": 2.1819, "step": 453500 }, { "epoch": 0.79, "learning_rate": 1.0456652378477733e-05, "loss": 2.315, "step": 453510 }, { "epoch": 0.79, "learning_rate": 1.0455780438550906e-05, "loss": 2.3159, "step": 453520 }, { "epoch": 0.79, "learning_rate": 1.0454908498624078e-05, "loss": 2.3121, "step": 453530 }, { "epoch": 0.79, "learning_rate": 1.0454036558697252e-05, "loss": 2.2927, "step": 453540 }, { "epoch": 0.79, "learning_rate": 1.0453164618770426e-05, "loss": 2.3073, "step": 453550 }, { "epoch": 0.79, "learning_rate": 1.04522926788436e-05, "loss": 2.2488, "step": 453560 }, { "epoch": 0.79, "learning_rate": 1.0451420738916772e-05, "loss": 2.2603, "step": 453570 }, { "epoch": 0.79, "learning_rate": 1.0450548798989946e-05, "loss": 2.2571, "step": 453580 }, { "epoch": 0.79, "learning_rate": 1.044967685906312e-05, "loss": 2.2432, "step": 453590 }, { "epoch": 0.79, "learning_rate": 1.0448804919136291e-05, "loss": 2.2681, "step": 453600 }, { "epoch": 0.79, "learning_rate": 1.0447932979209465e-05, "loss": 2.2863, "step": 453610 }, { "epoch": 0.79, "learning_rate": 1.0447061039282637e-05, "loss": 2.2252, "step": 453620 }, { "epoch": 0.79, "learning_rate": 1.0446189099355811e-05, "loss": 2.304, "step": 453630 }, { "epoch": 0.79, "learning_rate": 1.0445317159428985e-05, "loss": 2.2744, "step": 453640 }, { "epoch": 0.79, "learning_rate": 1.0444445219502159e-05, "loss": 2.3194, "step": 453650 }, { "epoch": 0.79, "learning_rate": 1.044357327957533e-05, "loss": 2.3457, "step": 453660 }, { "epoch": 0.79, "learning_rate": 1.0442701339648504e-05, "loss": 2.2564, "step": 453670 }, { "epoch": 0.79, "learning_rate": 1.0441829399721676e-05, "loss": 2.3639, "step": 453680 }, { "epoch": 0.79, "learning_rate": 1.044095745979485e-05, "loss": 2.229, "step": 453690 }, { "epoch": 0.79, "learning_rate": 1.0440085519868022e-05, "loss": 2.3204, "step": 453700 }, { "epoch": 0.79, "learning_rate": 1.0439213579941196e-05, "loss": 2.2176, "step": 453710 }, { "epoch": 0.79, "learning_rate": 1.0438341640014372e-05, "loss": 2.2916, "step": 453720 }, { "epoch": 0.79, "learning_rate": 1.0437469700087544e-05, "loss": 2.3048, "step": 453730 }, { "epoch": 0.79, "learning_rate": 1.0436597760160717e-05, "loss": 2.2944, "step": 453740 }, { "epoch": 0.79, "learning_rate": 1.043572582023389e-05, "loss": 2.2797, "step": 453750 }, { "epoch": 0.79, "learning_rate": 1.0434853880307063e-05, "loss": 2.3289, "step": 453760 }, { "epoch": 0.79, "learning_rate": 1.0433981940380235e-05, "loss": 2.2244, "step": 453770 }, { "epoch": 0.79, "learning_rate": 1.0433110000453409e-05, "loss": 2.2719, "step": 453780 }, { "epoch": 0.79, "learning_rate": 1.0432238060526583e-05, "loss": 2.3097, "step": 453790 }, { "epoch": 0.79, "learning_rate": 1.0431366120599757e-05, "loss": 2.2685, "step": 453800 }, { "epoch": 0.79, "learning_rate": 1.0430494180672929e-05, "loss": 2.2846, "step": 453810 }, { "epoch": 0.79, "learning_rate": 1.0429622240746102e-05, "loss": 2.2304, "step": 453820 }, { "epoch": 0.79, "learning_rate": 1.0428750300819275e-05, "loss": 2.3654, "step": 453830 }, { "epoch": 0.79, "learning_rate": 1.0427878360892448e-05, "loss": 2.4001, "step": 453840 }, { "epoch": 0.79, "learning_rate": 1.042700642096562e-05, "loss": 2.2937, "step": 453850 }, { "epoch": 0.79, "learning_rate": 1.0426134481038794e-05, "loss": 2.1865, "step": 453860 }, { "epoch": 0.79, "learning_rate": 1.0425262541111968e-05, "loss": 2.2469, "step": 453870 }, { "epoch": 0.79, "learning_rate": 1.0424390601185142e-05, "loss": 2.2711, "step": 453880 }, { "epoch": 0.79, "learning_rate": 1.0423518661258315e-05, "loss": 2.2986, "step": 453890 }, { "epoch": 0.79, "learning_rate": 1.0422646721331488e-05, "loss": 2.203, "step": 453900 }, { "epoch": 0.79, "learning_rate": 1.0421774781404661e-05, "loss": 2.3036, "step": 453910 }, { "epoch": 0.79, "learning_rate": 1.0420902841477833e-05, "loss": 2.4139, "step": 453920 }, { "epoch": 0.79, "learning_rate": 1.0420030901551007e-05, "loss": 2.2616, "step": 453930 }, { "epoch": 0.79, "learning_rate": 1.041915896162418e-05, "loss": 2.3448, "step": 453940 }, { "epoch": 0.79, "learning_rate": 1.0418287021697353e-05, "loss": 2.3987, "step": 453950 }, { "epoch": 0.79, "learning_rate": 1.0417415081770527e-05, "loss": 2.3411, "step": 453960 }, { "epoch": 0.79, "learning_rate": 1.04165431418437e-05, "loss": 2.1596, "step": 453970 }, { "epoch": 0.79, "learning_rate": 1.0415671201916873e-05, "loss": 2.2911, "step": 453980 }, { "epoch": 0.79, "learning_rate": 1.0414799261990046e-05, "loss": 2.27, "step": 453990 }, { "epoch": 0.79, "learning_rate": 1.041392732206322e-05, "loss": 2.3854, "step": 454000 }, { "epoch": 0.79, "learning_rate": 1.0413055382136392e-05, "loss": 2.3329, "step": 454010 }, { "epoch": 0.79, "learning_rate": 1.0412183442209566e-05, "loss": 2.2325, "step": 454020 }, { "epoch": 0.79, "learning_rate": 1.041131150228274e-05, "loss": 2.2671, "step": 454030 }, { "epoch": 0.79, "learning_rate": 1.0410439562355914e-05, "loss": 2.392, "step": 454040 }, { "epoch": 0.79, "learning_rate": 1.0409567622429086e-05, "loss": 2.0128, "step": 454050 }, { "epoch": 0.79, "learning_rate": 1.040869568250226e-05, "loss": 2.2458, "step": 454060 }, { "epoch": 0.79, "learning_rate": 1.0407823742575431e-05, "loss": 2.3026, "step": 454070 }, { "epoch": 0.79, "learning_rate": 1.0406951802648605e-05, "loss": 2.3298, "step": 454080 }, { "epoch": 0.79, "learning_rate": 1.0406079862721777e-05, "loss": 2.2624, "step": 454090 }, { "epoch": 0.79, "learning_rate": 1.0405207922794951e-05, "loss": 2.2841, "step": 454100 }, { "epoch": 0.79, "learning_rate": 1.0404335982868125e-05, "loss": 2.3559, "step": 454110 }, { "epoch": 0.79, "learning_rate": 1.0403464042941299e-05, "loss": 2.2938, "step": 454120 }, { "epoch": 0.79, "learning_rate": 1.0402592103014472e-05, "loss": 2.2563, "step": 454130 }, { "epoch": 0.79, "learning_rate": 1.0401720163087644e-05, "loss": 2.2391, "step": 454140 }, { "epoch": 0.79, "learning_rate": 1.0400848223160818e-05, "loss": 2.3401, "step": 454150 }, { "epoch": 0.79, "learning_rate": 1.039997628323399e-05, "loss": 2.2908, "step": 454160 }, { "epoch": 0.79, "learning_rate": 1.0399104343307164e-05, "loss": 2.1049, "step": 454170 }, { "epoch": 0.79, "learning_rate": 1.0398232403380336e-05, "loss": 2.2316, "step": 454180 }, { "epoch": 0.79, "learning_rate": 1.039736046345351e-05, "loss": 2.2138, "step": 454190 }, { "epoch": 0.79, "learning_rate": 1.0396488523526684e-05, "loss": 2.3647, "step": 454200 }, { "epoch": 0.79, "learning_rate": 1.0395616583599857e-05, "loss": 2.3238, "step": 454210 }, { "epoch": 0.79, "learning_rate": 1.039474464367303e-05, "loss": 2.2706, "step": 454220 }, { "epoch": 0.79, "learning_rate": 1.0393872703746203e-05, "loss": 2.3839, "step": 454230 }, { "epoch": 0.79, "learning_rate": 1.0393000763819375e-05, "loss": 2.2937, "step": 454240 }, { "epoch": 0.79, "learning_rate": 1.039212882389255e-05, "loss": 2.2041, "step": 454250 }, { "epoch": 0.79, "learning_rate": 1.0391256883965723e-05, "loss": 2.317, "step": 454260 }, { "epoch": 0.79, "learning_rate": 1.0390384944038897e-05, "loss": 2.2637, "step": 454270 }, { "epoch": 0.79, "learning_rate": 1.038951300411207e-05, "loss": 2.2196, "step": 454280 }, { "epoch": 0.79, "learning_rate": 1.0388641064185243e-05, "loss": 2.239, "step": 454290 }, { "epoch": 0.79, "learning_rate": 1.0387769124258416e-05, "loss": 2.2925, "step": 454300 }, { "epoch": 0.79, "learning_rate": 1.0386897184331588e-05, "loss": 2.1006, "step": 454310 }, { "epoch": 0.79, "learning_rate": 1.0386025244404762e-05, "loss": 2.4033, "step": 454320 }, { "epoch": 0.79, "learning_rate": 1.0385153304477934e-05, "loss": 2.307, "step": 454330 }, { "epoch": 0.79, "learning_rate": 1.0384281364551108e-05, "loss": 2.2598, "step": 454340 }, { "epoch": 0.79, "learning_rate": 1.0383409424624282e-05, "loss": 2.1797, "step": 454350 }, { "epoch": 0.79, "learning_rate": 1.0382537484697456e-05, "loss": 2.4317, "step": 454360 }, { "epoch": 0.79, "learning_rate": 1.0381665544770628e-05, "loss": 2.2899, "step": 454370 }, { "epoch": 0.79, "learning_rate": 1.0380793604843801e-05, "loss": 2.2194, "step": 454380 }, { "epoch": 0.79, "learning_rate": 1.0379921664916975e-05, "loss": 2.3406, "step": 454390 }, { "epoch": 0.79, "learning_rate": 1.0379049724990147e-05, "loss": 2.279, "step": 454400 }, { "epoch": 0.79, "learning_rate": 1.0378177785063321e-05, "loss": 2.1529, "step": 454410 }, { "epoch": 0.79, "learning_rate": 1.0377305845136493e-05, "loss": 2.267, "step": 454420 }, { "epoch": 0.79, "learning_rate": 1.0376433905209667e-05, "loss": 2.3338, "step": 454430 }, { "epoch": 0.79, "learning_rate": 1.037556196528284e-05, "loss": 2.296, "step": 454440 }, { "epoch": 0.79, "learning_rate": 1.0374690025356014e-05, "loss": 2.2688, "step": 454450 }, { "epoch": 0.79, "learning_rate": 1.0373818085429186e-05, "loss": 2.3013, "step": 454460 }, { "epoch": 0.79, "learning_rate": 1.037294614550236e-05, "loss": 2.2531, "step": 454470 }, { "epoch": 0.79, "learning_rate": 1.0372074205575532e-05, "loss": 2.2577, "step": 454480 }, { "epoch": 0.79, "learning_rate": 1.0371202265648706e-05, "loss": 2.255, "step": 454490 }, { "epoch": 0.79, "learning_rate": 1.0370330325721878e-05, "loss": 2.3246, "step": 454500 }, { "epoch": 0.79, "learning_rate": 1.0369458385795054e-05, "loss": 2.3504, "step": 454510 }, { "epoch": 0.79, "learning_rate": 1.0368586445868227e-05, "loss": 2.2741, "step": 454520 }, { "epoch": 0.79, "learning_rate": 1.03677145059414e-05, "loss": 2.3379, "step": 454530 }, { "epoch": 0.79, "learning_rate": 1.0366842566014573e-05, "loss": 2.2637, "step": 454540 }, { "epoch": 0.79, "learning_rate": 1.0365970626087745e-05, "loss": 2.3252, "step": 454550 }, { "epoch": 0.79, "learning_rate": 1.0365098686160919e-05, "loss": 2.2663, "step": 454560 }, { "epoch": 0.79, "learning_rate": 1.0364226746234091e-05, "loss": 2.2904, "step": 454570 }, { "epoch": 0.79, "learning_rate": 1.0363354806307265e-05, "loss": 2.1167, "step": 454580 }, { "epoch": 0.79, "learning_rate": 1.0362482866380439e-05, "loss": 2.1991, "step": 454590 }, { "epoch": 0.79, "learning_rate": 1.0361610926453612e-05, "loss": 2.3079, "step": 454600 }, { "epoch": 0.79, "learning_rate": 1.0360738986526785e-05, "loss": 2.2726, "step": 454610 }, { "epoch": 0.79, "learning_rate": 1.0359867046599958e-05, "loss": 2.2643, "step": 454620 }, { "epoch": 0.79, "learning_rate": 1.035899510667313e-05, "loss": 2.2773, "step": 454630 }, { "epoch": 0.79, "learning_rate": 1.0358123166746304e-05, "loss": 2.3584, "step": 454640 }, { "epoch": 0.79, "learning_rate": 1.0357251226819476e-05, "loss": 2.1178, "step": 454650 }, { "epoch": 0.79, "learning_rate": 1.035637928689265e-05, "loss": 2.3628, "step": 454660 }, { "epoch": 0.79, "learning_rate": 1.0355507346965824e-05, "loss": 2.2896, "step": 454670 }, { "epoch": 0.79, "learning_rate": 1.0354635407038998e-05, "loss": 2.2954, "step": 454680 }, { "epoch": 0.79, "learning_rate": 1.0353763467112171e-05, "loss": 2.427, "step": 454690 }, { "epoch": 0.79, "learning_rate": 1.0352891527185343e-05, "loss": 2.2731, "step": 454700 }, { "epoch": 0.79, "learning_rate": 1.0352019587258517e-05, "loss": 2.3983, "step": 454710 }, { "epoch": 0.79, "learning_rate": 1.035114764733169e-05, "loss": 2.2936, "step": 454720 }, { "epoch": 0.79, "learning_rate": 1.0350275707404863e-05, "loss": 2.385, "step": 454730 }, { "epoch": 0.79, "learning_rate": 1.0349403767478035e-05, "loss": 2.2529, "step": 454740 }, { "epoch": 0.79, "learning_rate": 1.034853182755121e-05, "loss": 2.3041, "step": 454750 }, { "epoch": 0.79, "learning_rate": 1.0347659887624383e-05, "loss": 2.1404, "step": 454760 }, { "epoch": 0.79, "learning_rate": 1.0346787947697556e-05, "loss": 2.3379, "step": 454770 }, { "epoch": 0.79, "learning_rate": 1.0345916007770728e-05, "loss": 2.439, "step": 454780 }, { "epoch": 0.79, "learning_rate": 1.0345044067843902e-05, "loss": 2.2303, "step": 454790 }, { "epoch": 0.79, "learning_rate": 1.0344172127917076e-05, "loss": 2.3086, "step": 454800 }, { "epoch": 0.79, "learning_rate": 1.0343300187990248e-05, "loss": 2.2801, "step": 454810 }, { "epoch": 0.79, "learning_rate": 1.0342428248063422e-05, "loss": 2.1555, "step": 454820 }, { "epoch": 0.79, "learning_rate": 1.0341556308136596e-05, "loss": 2.198, "step": 454830 }, { "epoch": 0.79, "learning_rate": 1.034068436820977e-05, "loss": 2.328, "step": 454840 }, { "epoch": 0.79, "learning_rate": 1.0339812428282941e-05, "loss": 2.1695, "step": 454850 }, { "epoch": 0.79, "learning_rate": 1.0338940488356115e-05, "loss": 2.2677, "step": 454860 }, { "epoch": 0.79, "learning_rate": 1.0338068548429287e-05, "loss": 2.2012, "step": 454870 }, { "epoch": 0.79, "learning_rate": 1.0337196608502461e-05, "loss": 2.1827, "step": 454880 }, { "epoch": 0.79, "learning_rate": 1.0336324668575633e-05, "loss": 2.2224, "step": 454890 }, { "epoch": 0.79, "learning_rate": 1.0335452728648807e-05, "loss": 2.148, "step": 454900 }, { "epoch": 0.79, "learning_rate": 1.033458078872198e-05, "loss": 2.3284, "step": 454910 }, { "epoch": 0.79, "learning_rate": 1.0333708848795154e-05, "loss": 2.1774, "step": 454920 }, { "epoch": 0.79, "learning_rate": 1.0332836908868328e-05, "loss": 2.149, "step": 454930 }, { "epoch": 0.79, "learning_rate": 1.03319649689415e-05, "loss": 2.2078, "step": 454940 }, { "epoch": 0.79, "learning_rate": 1.0331093029014674e-05, "loss": 2.2306, "step": 454950 }, { "epoch": 0.79, "learning_rate": 1.0330221089087846e-05, "loss": 2.2018, "step": 454960 }, { "epoch": 0.79, "learning_rate": 1.032934914916102e-05, "loss": 2.3288, "step": 454970 }, { "epoch": 0.79, "learning_rate": 1.0328477209234192e-05, "loss": 2.2547, "step": 454980 }, { "epoch": 0.79, "learning_rate": 1.0327605269307366e-05, "loss": 2.3211, "step": 454990 }, { "epoch": 0.79, "learning_rate": 1.032673332938054e-05, "loss": 2.2887, "step": 455000 }, { "epoch": 0.79, "learning_rate": 1.0325861389453713e-05, "loss": 2.3162, "step": 455010 }, { "epoch": 0.79, "learning_rate": 1.0324989449526885e-05, "loss": 2.2333, "step": 455020 }, { "epoch": 0.79, "learning_rate": 1.032411750960006e-05, "loss": 2.247, "step": 455030 }, { "epoch": 0.79, "learning_rate": 1.0323245569673231e-05, "loss": 2.2089, "step": 455040 }, { "epoch": 0.79, "learning_rate": 1.0322373629746405e-05, "loss": 2.2909, "step": 455050 }, { "epoch": 0.79, "learning_rate": 1.0321501689819579e-05, "loss": 2.3872, "step": 455060 }, { "epoch": 0.79, "learning_rate": 1.0320629749892753e-05, "loss": 2.197, "step": 455070 }, { "epoch": 0.79, "learning_rate": 1.0319757809965926e-05, "loss": 2.2202, "step": 455080 }, { "epoch": 0.79, "learning_rate": 1.0318885870039098e-05, "loss": 2.3442, "step": 455090 }, { "epoch": 0.79, "learning_rate": 1.0318013930112272e-05, "loss": 2.2652, "step": 455100 }, { "epoch": 0.79, "learning_rate": 1.0317141990185444e-05, "loss": 2.3097, "step": 455110 }, { "epoch": 0.79, "learning_rate": 1.0316270050258618e-05, "loss": 2.2533, "step": 455120 }, { "epoch": 0.79, "learning_rate": 1.031539811033179e-05, "loss": 2.2632, "step": 455130 }, { "epoch": 0.79, "learning_rate": 1.0314526170404964e-05, "loss": 2.2452, "step": 455140 }, { "epoch": 0.79, "learning_rate": 1.0313654230478138e-05, "loss": 2.3086, "step": 455150 }, { "epoch": 0.79, "learning_rate": 1.0312782290551311e-05, "loss": 2.1754, "step": 455160 }, { "epoch": 0.79, "learning_rate": 1.0311910350624483e-05, "loss": 2.3588, "step": 455170 }, { "epoch": 0.79, "learning_rate": 1.0311038410697657e-05, "loss": 2.2809, "step": 455180 }, { "epoch": 0.79, "learning_rate": 1.0310166470770831e-05, "loss": 2.453, "step": 455190 }, { "epoch": 0.79, "learning_rate": 1.0309294530844003e-05, "loss": 2.2489, "step": 455200 }, { "epoch": 0.79, "learning_rate": 1.0308422590917177e-05, "loss": 2.1281, "step": 455210 }, { "epoch": 0.79, "learning_rate": 1.0307550650990349e-05, "loss": 2.3183, "step": 455220 }, { "epoch": 0.79, "learning_rate": 1.0306678711063523e-05, "loss": 2.2488, "step": 455230 }, { "epoch": 0.79, "learning_rate": 1.0305806771136696e-05, "loss": 2.2858, "step": 455240 }, { "epoch": 0.79, "learning_rate": 1.030493483120987e-05, "loss": 2.2097, "step": 455250 }, { "epoch": 0.79, "learning_rate": 1.0304062891283042e-05, "loss": 2.2607, "step": 455260 }, { "epoch": 0.79, "learning_rate": 1.0303190951356216e-05, "loss": 2.2811, "step": 455270 }, { "epoch": 0.79, "learning_rate": 1.0302319011429388e-05, "loss": 2.3136, "step": 455280 }, { "epoch": 0.79, "learning_rate": 1.0301447071502562e-05, "loss": 2.2547, "step": 455290 }, { "epoch": 0.79, "learning_rate": 1.0300575131575734e-05, "loss": 2.332, "step": 455300 }, { "epoch": 0.79, "learning_rate": 1.029970319164891e-05, "loss": 2.3722, "step": 455310 }, { "epoch": 0.79, "learning_rate": 1.0298831251722083e-05, "loss": 2.365, "step": 455320 }, { "epoch": 0.79, "learning_rate": 1.0297959311795255e-05, "loss": 2.1628, "step": 455330 }, { "epoch": 0.79, "learning_rate": 1.0297087371868429e-05, "loss": 2.3057, "step": 455340 }, { "epoch": 0.79, "learning_rate": 1.0296215431941601e-05, "loss": 2.3358, "step": 455350 }, { "epoch": 0.79, "learning_rate": 1.0295343492014775e-05, "loss": 2.2987, "step": 455360 }, { "epoch": 0.79, "learning_rate": 1.0294471552087947e-05, "loss": 2.2985, "step": 455370 }, { "epoch": 0.79, "learning_rate": 1.029359961216112e-05, "loss": 2.3233, "step": 455380 }, { "epoch": 0.79, "learning_rate": 1.0292727672234295e-05, "loss": 2.2621, "step": 455390 }, { "epoch": 0.79, "learning_rate": 1.0291855732307468e-05, "loss": 2.2854, "step": 455400 }, { "epoch": 0.79, "learning_rate": 1.029098379238064e-05, "loss": 2.2423, "step": 455410 }, { "epoch": 0.79, "learning_rate": 1.0290111852453814e-05, "loss": 2.2162, "step": 455420 }, { "epoch": 0.79, "learning_rate": 1.0289239912526986e-05, "loss": 2.2645, "step": 455430 }, { "epoch": 0.79, "learning_rate": 1.028836797260016e-05, "loss": 2.2314, "step": 455440 }, { "epoch": 0.79, "learning_rate": 1.0287496032673334e-05, "loss": 2.2398, "step": 455450 }, { "epoch": 0.79, "learning_rate": 1.0286624092746506e-05, "loss": 2.3141, "step": 455460 }, { "epoch": 0.79, "learning_rate": 1.028575215281968e-05, "loss": 2.2874, "step": 455470 }, { "epoch": 0.79, "learning_rate": 1.0284880212892853e-05, "loss": 2.2639, "step": 455480 }, { "epoch": 0.79, "learning_rate": 1.0284008272966027e-05, "loss": 2.2938, "step": 455490 }, { "epoch": 0.79, "learning_rate": 1.02831363330392e-05, "loss": 2.2546, "step": 455500 }, { "epoch": 0.79, "learning_rate": 1.0282264393112373e-05, "loss": 2.3014, "step": 455510 }, { "epoch": 0.79, "learning_rate": 1.0281392453185545e-05, "loss": 2.4053, "step": 455520 }, { "epoch": 0.79, "learning_rate": 1.0280520513258719e-05, "loss": 2.2545, "step": 455530 }, { "epoch": 0.79, "learning_rate": 1.0279648573331891e-05, "loss": 2.3766, "step": 455540 }, { "epoch": 0.79, "learning_rate": 1.0278776633405066e-05, "loss": 2.2293, "step": 455550 }, { "epoch": 0.79, "learning_rate": 1.0277904693478238e-05, "loss": 2.2899, "step": 455560 }, { "epoch": 0.79, "learning_rate": 1.0277032753551412e-05, "loss": 2.1769, "step": 455570 }, { "epoch": 0.79, "learning_rate": 1.0276160813624584e-05, "loss": 2.2893, "step": 455580 }, { "epoch": 0.79, "learning_rate": 1.0275288873697758e-05, "loss": 2.2664, "step": 455590 }, { "epoch": 0.79, "learning_rate": 1.0274416933770932e-05, "loss": 2.2969, "step": 455600 }, { "epoch": 0.79, "learning_rate": 1.0273544993844104e-05, "loss": 2.2321, "step": 455610 }, { "epoch": 0.79, "learning_rate": 1.0272673053917278e-05, "loss": 2.2864, "step": 455620 }, { "epoch": 0.79, "learning_rate": 1.0271801113990451e-05, "loss": 2.235, "step": 455630 }, { "epoch": 0.79, "learning_rate": 1.0270929174063625e-05, "loss": 2.2235, "step": 455640 }, { "epoch": 0.79, "learning_rate": 1.0270057234136797e-05, "loss": 2.2072, "step": 455650 }, { "epoch": 0.79, "learning_rate": 1.0269185294209971e-05, "loss": 2.2663, "step": 455660 }, { "epoch": 0.79, "learning_rate": 1.0268313354283143e-05, "loss": 2.3835, "step": 455670 }, { "epoch": 0.79, "learning_rate": 1.0267441414356317e-05, "loss": 2.3211, "step": 455680 }, { "epoch": 0.79, "learning_rate": 1.0266569474429489e-05, "loss": 2.3107, "step": 455690 }, { "epoch": 0.79, "learning_rate": 1.0265697534502663e-05, "loss": 2.1725, "step": 455700 }, { "epoch": 0.79, "learning_rate": 1.0264825594575837e-05, "loss": 2.2997, "step": 455710 }, { "epoch": 0.79, "learning_rate": 1.026395365464901e-05, "loss": 2.2006, "step": 455720 }, { "epoch": 0.79, "learning_rate": 1.0263081714722184e-05, "loss": 2.2786, "step": 455730 }, { "epoch": 0.79, "learning_rate": 1.0262209774795356e-05, "loss": 2.2797, "step": 455740 }, { "epoch": 0.79, "learning_rate": 1.026133783486853e-05, "loss": 2.2773, "step": 455750 }, { "epoch": 0.79, "learning_rate": 1.0260465894941702e-05, "loss": 2.3626, "step": 455760 }, { "epoch": 0.79, "learning_rate": 1.0259593955014876e-05, "loss": 2.4114, "step": 455770 }, { "epoch": 0.79, "learning_rate": 1.0258722015088048e-05, "loss": 2.2432, "step": 455780 }, { "epoch": 0.79, "learning_rate": 1.0257850075161223e-05, "loss": 2.332, "step": 455790 }, { "epoch": 0.79, "learning_rate": 1.0256978135234395e-05, "loss": 2.2243, "step": 455800 }, { "epoch": 0.79, "learning_rate": 1.025610619530757e-05, "loss": 2.2557, "step": 455810 }, { "epoch": 0.79, "learning_rate": 1.0255234255380741e-05, "loss": 2.2338, "step": 455820 }, { "epoch": 0.79, "learning_rate": 1.0254362315453915e-05, "loss": 2.1983, "step": 455830 }, { "epoch": 0.79, "learning_rate": 1.0253490375527087e-05, "loss": 2.3047, "step": 455840 }, { "epoch": 0.79, "learning_rate": 1.0252618435600261e-05, "loss": 2.2354, "step": 455850 }, { "epoch": 0.79, "learning_rate": 1.0251746495673435e-05, "loss": 2.3497, "step": 455860 }, { "epoch": 0.79, "learning_rate": 1.0250874555746608e-05, "loss": 2.2838, "step": 455870 }, { "epoch": 0.79, "learning_rate": 1.0250002615819782e-05, "loss": 2.2829, "step": 455880 }, { "epoch": 0.8, "learning_rate": 1.0249130675892954e-05, "loss": 2.2515, "step": 455890 }, { "epoch": 0.8, "learning_rate": 1.0248258735966128e-05, "loss": 2.3795, "step": 455900 }, { "epoch": 0.8, "learning_rate": 1.02473867960393e-05, "loss": 2.3264, "step": 455910 }, { "epoch": 0.8, "learning_rate": 1.0246514856112474e-05, "loss": 2.3261, "step": 455920 }, { "epoch": 0.8, "learning_rate": 1.0245642916185646e-05, "loss": 2.2902, "step": 455930 }, { "epoch": 0.8, "learning_rate": 1.024477097625882e-05, "loss": 2.3128, "step": 455940 }, { "epoch": 0.8, "learning_rate": 1.0243899036331993e-05, "loss": 2.375, "step": 455950 }, { "epoch": 0.8, "learning_rate": 1.0243027096405167e-05, "loss": 2.3436, "step": 455960 }, { "epoch": 0.8, "learning_rate": 1.024215515647834e-05, "loss": 2.2801, "step": 455970 }, { "epoch": 0.8, "learning_rate": 1.0241283216551513e-05, "loss": 2.2826, "step": 455980 }, { "epoch": 0.8, "learning_rate": 1.0240411276624687e-05, "loss": 2.2964, "step": 455990 }, { "epoch": 0.8, "learning_rate": 1.0239539336697859e-05, "loss": 2.3736, "step": 456000 }, { "epoch": 0.8, "learning_rate": 1.0238667396771033e-05, "loss": 2.271, "step": 456010 }, { "epoch": 0.8, "learning_rate": 1.0237795456844205e-05, "loss": 2.3297, "step": 456020 }, { "epoch": 0.8, "learning_rate": 1.0236923516917379e-05, "loss": 2.404, "step": 456030 }, { "epoch": 0.8, "learning_rate": 1.0236051576990552e-05, "loss": 2.4018, "step": 456040 }, { "epoch": 0.8, "learning_rate": 1.0235179637063726e-05, "loss": 2.2696, "step": 456050 }, { "epoch": 0.8, "learning_rate": 1.0234307697136898e-05, "loss": 2.3234, "step": 456060 }, { "epoch": 0.8, "learning_rate": 1.0233435757210072e-05, "loss": 2.3017, "step": 456070 }, { "epoch": 0.8, "learning_rate": 1.0232563817283244e-05, "loss": 2.2849, "step": 456080 }, { "epoch": 0.8, "learning_rate": 1.0231691877356418e-05, "loss": 2.3493, "step": 456090 }, { "epoch": 0.8, "learning_rate": 1.0230819937429592e-05, "loss": 2.2633, "step": 456100 }, { "epoch": 0.8, "learning_rate": 1.0229947997502765e-05, "loss": 2.32, "step": 456110 }, { "epoch": 0.8, "learning_rate": 1.0229076057575939e-05, "loss": 2.1316, "step": 456120 }, { "epoch": 0.8, "learning_rate": 1.0228204117649111e-05, "loss": 2.3321, "step": 456130 }, { "epoch": 0.8, "learning_rate": 1.0227332177722285e-05, "loss": 2.2818, "step": 456140 }, { "epoch": 0.8, "learning_rate": 1.0226460237795457e-05, "loss": 2.2615, "step": 456150 }, { "epoch": 0.8, "learning_rate": 1.022558829786863e-05, "loss": 2.3526, "step": 456160 }, { "epoch": 0.8, "learning_rate": 1.0224716357941803e-05, "loss": 2.3402, "step": 456170 }, { "epoch": 0.8, "learning_rate": 1.0223844418014977e-05, "loss": 2.2826, "step": 456180 }, { "epoch": 0.8, "learning_rate": 1.022297247808815e-05, "loss": 2.3186, "step": 456190 }, { "epoch": 0.8, "learning_rate": 1.0222100538161324e-05, "loss": 2.2036, "step": 456200 }, { "epoch": 0.8, "learning_rate": 1.0221228598234496e-05, "loss": 2.2488, "step": 456210 }, { "epoch": 0.8, "learning_rate": 1.022035665830767e-05, "loss": 2.3437, "step": 456220 }, { "epoch": 0.8, "learning_rate": 1.0219484718380842e-05, "loss": 2.214, "step": 456230 }, { "epoch": 0.8, "learning_rate": 1.0218612778454016e-05, "loss": 2.2569, "step": 456240 }, { "epoch": 0.8, "learning_rate": 1.021774083852719e-05, "loss": 2.214, "step": 456250 }, { "epoch": 0.8, "learning_rate": 1.0216868898600362e-05, "loss": 2.4505, "step": 456260 }, { "epoch": 0.8, "learning_rate": 1.0215996958673535e-05, "loss": 2.3328, "step": 456270 }, { "epoch": 0.8, "learning_rate": 1.021512501874671e-05, "loss": 2.2238, "step": 456280 }, { "epoch": 0.8, "learning_rate": 1.0214253078819883e-05, "loss": 2.3256, "step": 456290 }, { "epoch": 0.8, "learning_rate": 1.0213381138893055e-05, "loss": 2.2977, "step": 456300 }, { "epoch": 0.8, "learning_rate": 1.0212509198966229e-05, "loss": 2.281, "step": 456310 }, { "epoch": 0.8, "learning_rate": 1.0211637259039401e-05, "loss": 2.2134, "step": 456320 }, { "epoch": 0.8, "learning_rate": 1.0210765319112575e-05, "loss": 2.2763, "step": 456330 }, { "epoch": 0.8, "learning_rate": 1.0209893379185747e-05, "loss": 2.3005, "step": 456340 }, { "epoch": 0.8, "learning_rate": 1.0209021439258922e-05, "loss": 2.321, "step": 456350 }, { "epoch": 0.8, "learning_rate": 1.0208149499332094e-05, "loss": 2.2534, "step": 456360 }, { "epoch": 0.8, "learning_rate": 1.0207277559405268e-05, "loss": 2.2804, "step": 456370 }, { "epoch": 0.8, "learning_rate": 1.0206405619478442e-05, "loss": 2.3103, "step": 456380 }, { "epoch": 0.8, "learning_rate": 1.0205533679551614e-05, "loss": 2.2577, "step": 456390 }, { "epoch": 0.8, "learning_rate": 1.0204661739624788e-05, "loss": 2.3658, "step": 456400 }, { "epoch": 0.8, "learning_rate": 1.020378979969796e-05, "loss": 2.3513, "step": 456410 }, { "epoch": 0.8, "learning_rate": 1.0202917859771134e-05, "loss": 2.3178, "step": 456420 }, { "epoch": 0.8, "learning_rate": 1.0202045919844307e-05, "loss": 2.3019, "step": 456430 }, { "epoch": 0.8, "learning_rate": 1.0201173979917481e-05, "loss": 2.2501, "step": 456440 }, { "epoch": 0.8, "learning_rate": 1.0200302039990653e-05, "loss": 2.2567, "step": 456450 }, { "epoch": 0.8, "learning_rate": 1.0199430100063827e-05, "loss": 2.339, "step": 456460 }, { "epoch": 0.8, "learning_rate": 1.0198558160136999e-05, "loss": 2.3375, "step": 456470 }, { "epoch": 0.8, "learning_rate": 1.0197686220210173e-05, "loss": 2.2499, "step": 456480 }, { "epoch": 0.8, "learning_rate": 1.0196814280283345e-05, "loss": 2.1961, "step": 456490 }, { "epoch": 0.8, "learning_rate": 1.0195942340356519e-05, "loss": 2.2849, "step": 456500 }, { "epoch": 0.8, "learning_rate": 1.0195070400429692e-05, "loss": 2.2554, "step": 456510 }, { "epoch": 0.8, "learning_rate": 1.0194198460502866e-05, "loss": 2.4108, "step": 456520 }, { "epoch": 0.8, "learning_rate": 1.019332652057604e-05, "loss": 2.2612, "step": 456530 }, { "epoch": 0.8, "learning_rate": 1.0192454580649212e-05, "loss": 2.2284, "step": 456540 }, { "epoch": 0.8, "learning_rate": 1.0191582640722386e-05, "loss": 2.3868, "step": 456550 }, { "epoch": 0.8, "learning_rate": 1.0190710700795558e-05, "loss": 2.2374, "step": 456560 }, { "epoch": 0.8, "learning_rate": 1.0189838760868732e-05, "loss": 2.2217, "step": 456570 }, { "epoch": 0.8, "learning_rate": 1.0188966820941904e-05, "loss": 2.3317, "step": 456580 }, { "epoch": 0.8, "learning_rate": 1.018809488101508e-05, "loss": 2.2325, "step": 456590 }, { "epoch": 0.8, "learning_rate": 1.0187222941088251e-05, "loss": 2.4173, "step": 456600 }, { "epoch": 0.8, "learning_rate": 1.0186351001161425e-05, "loss": 2.3532, "step": 456610 }, { "epoch": 0.8, "learning_rate": 1.0185479061234597e-05, "loss": 2.1998, "step": 456620 }, { "epoch": 0.8, "learning_rate": 1.0184607121307771e-05, "loss": 2.1966, "step": 456630 }, { "epoch": 0.8, "learning_rate": 1.0183735181380943e-05, "loss": 2.373, "step": 456640 }, { "epoch": 0.8, "learning_rate": 1.0182863241454117e-05, "loss": 2.2637, "step": 456650 }, { "epoch": 0.8, "learning_rate": 1.018199130152729e-05, "loss": 2.2134, "step": 456660 }, { "epoch": 0.8, "learning_rate": 1.0181119361600464e-05, "loss": 2.3778, "step": 456670 }, { "epoch": 0.8, "learning_rate": 1.0180247421673638e-05, "loss": 2.3773, "step": 456680 }, { "epoch": 0.8, "learning_rate": 1.017937548174681e-05, "loss": 2.2001, "step": 456690 }, { "epoch": 0.8, "learning_rate": 1.0178503541819984e-05, "loss": 2.2764, "step": 456700 }, { "epoch": 0.8, "learning_rate": 1.0177631601893156e-05, "loss": 2.2621, "step": 456710 }, { "epoch": 0.8, "learning_rate": 1.017675966196633e-05, "loss": 2.1777, "step": 456720 }, { "epoch": 0.8, "learning_rate": 1.0175887722039502e-05, "loss": 2.2171, "step": 456730 }, { "epoch": 0.8, "learning_rate": 1.0175015782112676e-05, "loss": 2.2904, "step": 456740 }, { "epoch": 0.8, "learning_rate": 1.017414384218585e-05, "loss": 2.4294, "step": 456750 }, { "epoch": 0.8, "learning_rate": 1.0173271902259023e-05, "loss": 2.3357, "step": 456760 }, { "epoch": 0.8, "learning_rate": 1.0172399962332195e-05, "loss": 2.2069, "step": 456770 }, { "epoch": 0.8, "learning_rate": 1.0171528022405369e-05, "loss": 2.3238, "step": 456780 }, { "epoch": 0.8, "learning_rate": 1.0170656082478543e-05, "loss": 2.2988, "step": 456790 }, { "epoch": 0.8, "learning_rate": 1.0169784142551715e-05, "loss": 2.1942, "step": 456800 }, { "epoch": 0.8, "learning_rate": 1.0168912202624889e-05, "loss": 2.2448, "step": 456810 }, { "epoch": 0.8, "learning_rate": 1.016804026269806e-05, "loss": 2.3814, "step": 456820 }, { "epoch": 0.8, "learning_rate": 1.0167168322771236e-05, "loss": 2.4019, "step": 456830 }, { "epoch": 0.8, "learning_rate": 1.0166296382844408e-05, "loss": 2.2615, "step": 456840 }, { "epoch": 0.8, "learning_rate": 1.0165424442917582e-05, "loss": 2.2266, "step": 456850 }, { "epoch": 0.8, "learning_rate": 1.0164552502990754e-05, "loss": 2.2027, "step": 456860 }, { "epoch": 0.8, "learning_rate": 1.0163680563063928e-05, "loss": 2.3064, "step": 456870 }, { "epoch": 0.8, "learning_rate": 1.01628086231371e-05, "loss": 2.2205, "step": 456880 }, { "epoch": 0.8, "learning_rate": 1.0161936683210274e-05, "loss": 2.1588, "step": 456890 }, { "epoch": 0.8, "learning_rate": 1.0161064743283447e-05, "loss": 2.3081, "step": 456900 }, { "epoch": 0.8, "learning_rate": 1.0160192803356621e-05, "loss": 2.2436, "step": 456910 }, { "epoch": 0.8, "learning_rate": 1.0159320863429795e-05, "loss": 2.2165, "step": 456920 }, { "epoch": 0.8, "learning_rate": 1.0158448923502967e-05, "loss": 2.2916, "step": 456930 }, { "epoch": 0.8, "learning_rate": 1.015757698357614e-05, "loss": 2.1819, "step": 456940 }, { "epoch": 0.8, "learning_rate": 1.0156705043649313e-05, "loss": 2.2934, "step": 456950 }, { "epoch": 0.8, "learning_rate": 1.0155833103722487e-05, "loss": 2.287, "step": 456960 }, { "epoch": 0.8, "learning_rate": 1.0154961163795659e-05, "loss": 2.278, "step": 456970 }, { "epoch": 0.8, "learning_rate": 1.0154089223868832e-05, "loss": 2.1921, "step": 456980 }, { "epoch": 0.8, "learning_rate": 1.0153217283942006e-05, "loss": 2.2831, "step": 456990 }, { "epoch": 0.8, "learning_rate": 1.015234534401518e-05, "loss": 2.1598, "step": 457000 }, { "epoch": 0.8, "learning_rate": 1.0151473404088352e-05, "loss": 2.156, "step": 457010 }, { "epoch": 0.8, "learning_rate": 1.0150601464161526e-05, "loss": 2.2436, "step": 457020 }, { "epoch": 0.8, "learning_rate": 1.0149729524234698e-05, "loss": 2.3272, "step": 457030 }, { "epoch": 0.8, "learning_rate": 1.0148857584307872e-05, "loss": 2.1464, "step": 457040 }, { "epoch": 0.8, "learning_rate": 1.0147985644381045e-05, "loss": 2.4018, "step": 457050 }, { "epoch": 0.8, "learning_rate": 1.0147113704454218e-05, "loss": 2.2389, "step": 457060 }, { "epoch": 0.8, "learning_rate": 1.0146241764527391e-05, "loss": 2.3816, "step": 457070 }, { "epoch": 0.8, "learning_rate": 1.0145369824600565e-05, "loss": 2.3573, "step": 457080 }, { "epoch": 0.8, "learning_rate": 1.0144497884673739e-05, "loss": 2.2781, "step": 457090 }, { "epoch": 0.8, "learning_rate": 1.0143625944746911e-05, "loss": 2.3567, "step": 457100 }, { "epoch": 0.8, "learning_rate": 1.0142754004820085e-05, "loss": 2.2553, "step": 457110 }, { "epoch": 0.8, "learning_rate": 1.0141882064893257e-05, "loss": 2.3246, "step": 457120 }, { "epoch": 0.8, "learning_rate": 1.014101012496643e-05, "loss": 2.3476, "step": 457130 }, { "epoch": 0.8, "learning_rate": 1.0140138185039604e-05, "loss": 2.3082, "step": 457140 }, { "epoch": 0.8, "learning_rate": 1.0139266245112778e-05, "loss": 2.2878, "step": 457150 }, { "epoch": 0.8, "learning_rate": 1.013839430518595e-05, "loss": 2.2959, "step": 457160 }, { "epoch": 0.8, "learning_rate": 1.0137522365259124e-05, "loss": 2.3426, "step": 457170 }, { "epoch": 0.8, "learning_rate": 1.0136650425332298e-05, "loss": 2.3728, "step": 457180 }, { "epoch": 0.8, "learning_rate": 1.013577848540547e-05, "loss": 2.3496, "step": 457190 }, { "epoch": 0.8, "learning_rate": 1.0134906545478644e-05, "loss": 2.3535, "step": 457200 }, { "epoch": 0.8, "learning_rate": 1.0134034605551816e-05, "loss": 2.2799, "step": 457210 }, { "epoch": 0.8, "learning_rate": 1.013316266562499e-05, "loss": 2.2267, "step": 457220 }, { "epoch": 0.8, "learning_rate": 1.0132290725698163e-05, "loss": 2.3898, "step": 457230 }, { "epoch": 0.8, "learning_rate": 1.0131418785771337e-05, "loss": 2.353, "step": 457240 }, { "epoch": 0.8, "learning_rate": 1.0130546845844509e-05, "loss": 2.1921, "step": 457250 }, { "epoch": 0.8, "learning_rate": 1.0129674905917683e-05, "loss": 2.1977, "step": 457260 }, { "epoch": 0.8, "learning_rate": 1.0128802965990855e-05, "loss": 2.2127, "step": 457270 }, { "epoch": 0.8, "learning_rate": 1.0127931026064029e-05, "loss": 2.2541, "step": 457280 }, { "epoch": 0.8, "learning_rate": 1.01270590861372e-05, "loss": 2.3327, "step": 457290 }, { "epoch": 0.8, "learning_rate": 1.0126187146210374e-05, "loss": 2.3581, "step": 457300 }, { "epoch": 0.8, "learning_rate": 1.0125315206283548e-05, "loss": 2.1413, "step": 457310 }, { "epoch": 0.8, "learning_rate": 1.0124443266356722e-05, "loss": 2.1325, "step": 457320 }, { "epoch": 0.8, "learning_rate": 1.0123571326429896e-05, "loss": 2.3, "step": 457330 }, { "epoch": 0.8, "learning_rate": 1.0122699386503068e-05, "loss": 2.3582, "step": 457340 }, { "epoch": 0.8, "learning_rate": 1.0121827446576242e-05, "loss": 2.2801, "step": 457350 }, { "epoch": 0.8, "learning_rate": 1.0120955506649414e-05, "loss": 2.2628, "step": 457360 }, { "epoch": 0.8, "learning_rate": 1.0120083566722587e-05, "loss": 2.2705, "step": 457370 }, { "epoch": 0.8, "learning_rate": 1.011921162679576e-05, "loss": 2.1547, "step": 457380 }, { "epoch": 0.8, "learning_rate": 1.0118339686868935e-05, "loss": 2.4016, "step": 457390 }, { "epoch": 0.8, "learning_rate": 1.0117467746942107e-05, "loss": 2.2526, "step": 457400 }, { "epoch": 0.8, "learning_rate": 1.0116595807015281e-05, "loss": 2.3333, "step": 457410 }, { "epoch": 0.8, "learning_rate": 1.0115723867088453e-05, "loss": 2.2813, "step": 457420 }, { "epoch": 0.8, "learning_rate": 1.0114851927161627e-05, "loss": 2.2581, "step": 457430 }, { "epoch": 0.8, "learning_rate": 1.0113979987234799e-05, "loss": 2.3778, "step": 457440 }, { "epoch": 0.8, "learning_rate": 1.0113108047307973e-05, "loss": 2.3536, "step": 457450 }, { "epoch": 0.8, "learning_rate": 1.0112236107381146e-05, "loss": 2.3413, "step": 457460 }, { "epoch": 0.8, "learning_rate": 1.011136416745432e-05, "loss": 2.2367, "step": 457470 }, { "epoch": 0.8, "learning_rate": 1.0110492227527494e-05, "loss": 2.2759, "step": 457480 }, { "epoch": 0.8, "learning_rate": 1.0109620287600666e-05, "loss": 2.3587, "step": 457490 }, { "epoch": 0.8, "learning_rate": 1.010874834767384e-05, "loss": 2.3707, "step": 457500 }, { "epoch": 0.8, "learning_rate": 1.0107876407747012e-05, "loss": 2.3099, "step": 457510 }, { "epoch": 0.8, "learning_rate": 1.0107004467820186e-05, "loss": 2.3616, "step": 457520 }, { "epoch": 0.8, "learning_rate": 1.0106132527893358e-05, "loss": 2.2816, "step": 457530 }, { "epoch": 0.8, "learning_rate": 1.0105260587966531e-05, "loss": 2.2066, "step": 457540 }, { "epoch": 0.8, "learning_rate": 1.0104388648039705e-05, "loss": 2.3049, "step": 457550 }, { "epoch": 0.8, "learning_rate": 1.0103516708112879e-05, "loss": 2.3138, "step": 457560 }, { "epoch": 0.8, "learning_rate": 1.0102644768186051e-05, "loss": 2.3393, "step": 457570 }, { "epoch": 0.8, "learning_rate": 1.0101772828259225e-05, "loss": 2.3993, "step": 457580 }, { "epoch": 0.8, "learning_rate": 1.0100900888332399e-05, "loss": 2.2408, "step": 457590 }, { "epoch": 0.8, "learning_rate": 1.010002894840557e-05, "loss": 2.2718, "step": 457600 }, { "epoch": 0.8, "learning_rate": 1.0099157008478744e-05, "loss": 2.1689, "step": 457610 }, { "epoch": 0.8, "learning_rate": 1.0098285068551916e-05, "loss": 2.1708, "step": 457620 }, { "epoch": 0.8, "learning_rate": 1.0097413128625092e-05, "loss": 2.3301, "step": 457630 }, { "epoch": 0.8, "learning_rate": 1.0096541188698264e-05, "loss": 2.2453, "step": 457640 }, { "epoch": 0.8, "learning_rate": 1.0095669248771438e-05, "loss": 2.3494, "step": 457650 }, { "epoch": 0.8, "learning_rate": 1.009479730884461e-05, "loss": 2.1454, "step": 457660 }, { "epoch": 0.8, "learning_rate": 1.0093925368917784e-05, "loss": 2.3022, "step": 457670 }, { "epoch": 0.8, "learning_rate": 1.0093053428990956e-05, "loss": 2.3147, "step": 457680 }, { "epoch": 0.8, "learning_rate": 1.009218148906413e-05, "loss": 2.2131, "step": 457690 }, { "epoch": 0.8, "learning_rate": 1.0091309549137303e-05, "loss": 2.2225, "step": 457700 }, { "epoch": 0.8, "learning_rate": 1.0090437609210477e-05, "loss": 2.19, "step": 457710 }, { "epoch": 0.8, "learning_rate": 1.008956566928365e-05, "loss": 2.3567, "step": 457720 }, { "epoch": 0.8, "learning_rate": 1.0088693729356823e-05, "loss": 2.2101, "step": 457730 }, { "epoch": 0.8, "learning_rate": 1.0087821789429997e-05, "loss": 2.3761, "step": 457740 }, { "epoch": 0.8, "learning_rate": 1.0086949849503169e-05, "loss": 2.2063, "step": 457750 }, { "epoch": 0.8, "learning_rate": 1.0086077909576342e-05, "loss": 2.3801, "step": 457760 }, { "epoch": 0.8, "learning_rate": 1.0085205969649515e-05, "loss": 2.3444, "step": 457770 }, { "epoch": 0.8, "learning_rate": 1.0084334029722688e-05, "loss": 2.2795, "step": 457780 }, { "epoch": 0.8, "learning_rate": 1.0083462089795862e-05, "loss": 2.1985, "step": 457790 }, { "epoch": 0.8, "learning_rate": 1.0082590149869036e-05, "loss": 2.2211, "step": 457800 }, { "epoch": 0.8, "learning_rate": 1.0081718209942208e-05, "loss": 2.2929, "step": 457810 }, { "epoch": 0.8, "learning_rate": 1.0080846270015382e-05, "loss": 2.3386, "step": 457820 }, { "epoch": 0.8, "learning_rate": 1.0079974330088554e-05, "loss": 2.2618, "step": 457830 }, { "epoch": 0.8, "learning_rate": 1.0079102390161728e-05, "loss": 2.1884, "step": 457840 }, { "epoch": 0.8, "learning_rate": 1.0078230450234901e-05, "loss": 2.2534, "step": 457850 }, { "epoch": 0.8, "learning_rate": 1.0077358510308073e-05, "loss": 2.3501, "step": 457860 }, { "epoch": 0.8, "learning_rate": 1.0076486570381249e-05, "loss": 2.1807, "step": 457870 }, { "epoch": 0.8, "learning_rate": 1.0075614630454421e-05, "loss": 2.2635, "step": 457880 }, { "epoch": 0.8, "learning_rate": 1.0074742690527595e-05, "loss": 2.3627, "step": 457890 }, { "epoch": 0.8, "learning_rate": 1.0073870750600767e-05, "loss": 2.236, "step": 457900 }, { "epoch": 0.8, "learning_rate": 1.007299881067394e-05, "loss": 2.1729, "step": 457910 }, { "epoch": 0.8, "learning_rate": 1.0072126870747113e-05, "loss": 2.2908, "step": 457920 }, { "epoch": 0.8, "learning_rate": 1.0071254930820286e-05, "loss": 2.3901, "step": 457930 }, { "epoch": 0.8, "learning_rate": 1.007038299089346e-05, "loss": 2.3614, "step": 457940 }, { "epoch": 0.8, "learning_rate": 1.0069511050966634e-05, "loss": 2.2896, "step": 457950 }, { "epoch": 0.8, "learning_rate": 1.0068639111039806e-05, "loss": 2.2317, "step": 457960 }, { "epoch": 0.8, "learning_rate": 1.006776717111298e-05, "loss": 2.4015, "step": 457970 }, { "epoch": 0.8, "learning_rate": 1.0066895231186154e-05, "loss": 2.1717, "step": 457980 }, { "epoch": 0.8, "learning_rate": 1.0066023291259326e-05, "loss": 2.3586, "step": 457990 }, { "epoch": 0.8, "learning_rate": 1.00651513513325e-05, "loss": 2.2567, "step": 458000 }, { "epoch": 0.8, "learning_rate": 1.0064279411405671e-05, "loss": 2.3111, "step": 458010 }, { "epoch": 0.8, "learning_rate": 1.0063407471478845e-05, "loss": 2.2909, "step": 458020 }, { "epoch": 0.8, "learning_rate": 1.0062535531552019e-05, "loss": 2.324, "step": 458030 }, { "epoch": 0.8, "learning_rate": 1.0061663591625193e-05, "loss": 2.2165, "step": 458040 }, { "epoch": 0.8, "learning_rate": 1.0060791651698365e-05, "loss": 2.267, "step": 458050 }, { "epoch": 0.8, "learning_rate": 1.0059919711771539e-05, "loss": 2.4236, "step": 458060 }, { "epoch": 0.8, "learning_rate": 1.005904777184471e-05, "loss": 2.3693, "step": 458070 }, { "epoch": 0.8, "learning_rate": 1.0058175831917884e-05, "loss": 2.2432, "step": 458080 }, { "epoch": 0.8, "learning_rate": 1.0057303891991057e-05, "loss": 2.2693, "step": 458090 }, { "epoch": 0.8, "learning_rate": 1.005643195206423e-05, "loss": 2.3034, "step": 458100 }, { "epoch": 0.8, "learning_rate": 1.0055560012137404e-05, "loss": 2.3461, "step": 458110 }, { "epoch": 0.8, "learning_rate": 1.0054688072210578e-05, "loss": 2.3826, "step": 458120 }, { "epoch": 0.8, "learning_rate": 1.0053816132283752e-05, "loss": 2.2949, "step": 458130 }, { "epoch": 0.8, "learning_rate": 1.0052944192356924e-05, "loss": 2.2529, "step": 458140 }, { "epoch": 0.8, "learning_rate": 1.0052072252430097e-05, "loss": 2.3531, "step": 458150 }, { "epoch": 0.8, "learning_rate": 1.005120031250327e-05, "loss": 2.1888, "step": 458160 }, { "epoch": 0.8, "learning_rate": 1.0050328372576443e-05, "loss": 2.2133, "step": 458170 }, { "epoch": 0.8, "learning_rate": 1.0049456432649617e-05, "loss": 2.2132, "step": 458180 }, { "epoch": 0.8, "learning_rate": 1.0048584492722791e-05, "loss": 2.2863, "step": 458190 }, { "epoch": 0.8, "learning_rate": 1.0047712552795963e-05, "loss": 2.1705, "step": 458200 }, { "epoch": 0.8, "learning_rate": 1.0046840612869137e-05, "loss": 2.3012, "step": 458210 }, { "epoch": 0.8, "learning_rate": 1.0045968672942309e-05, "loss": 2.2875, "step": 458220 }, { "epoch": 0.8, "learning_rate": 1.0045096733015483e-05, "loss": 2.3942, "step": 458230 }, { "epoch": 0.8, "learning_rate": 1.0044224793088655e-05, "loss": 2.2993, "step": 458240 }, { "epoch": 0.8, "learning_rate": 1.0043352853161828e-05, "loss": 2.3151, "step": 458250 }, { "epoch": 0.8, "learning_rate": 1.0042480913235002e-05, "loss": 2.231, "step": 458260 }, { "epoch": 0.8, "learning_rate": 1.0041608973308176e-05, "loss": 2.203, "step": 458270 }, { "epoch": 0.8, "learning_rate": 1.004073703338135e-05, "loss": 2.3102, "step": 458280 }, { "epoch": 0.8, "learning_rate": 1.0039865093454522e-05, "loss": 2.1522, "step": 458290 }, { "epoch": 0.8, "learning_rate": 1.0038993153527696e-05, "loss": 2.3514, "step": 458300 }, { "epoch": 0.8, "learning_rate": 1.0038121213600868e-05, "loss": 2.3091, "step": 458310 }, { "epoch": 0.8, "learning_rate": 1.0037249273674041e-05, "loss": 2.1504, "step": 458320 }, { "epoch": 0.8, "learning_rate": 1.0036377333747213e-05, "loss": 2.3445, "step": 458330 }, { "epoch": 0.8, "learning_rate": 1.0035505393820387e-05, "loss": 2.3288, "step": 458340 }, { "epoch": 0.8, "learning_rate": 1.0034633453893561e-05, "loss": 2.2515, "step": 458350 }, { "epoch": 0.8, "learning_rate": 1.0033761513966735e-05, "loss": 2.327, "step": 458360 }, { "epoch": 0.8, "learning_rate": 1.0032889574039907e-05, "loss": 2.3173, "step": 458370 }, { "epoch": 0.8, "learning_rate": 1.003201763411308e-05, "loss": 2.1925, "step": 458380 }, { "epoch": 0.8, "learning_rate": 1.0031145694186254e-05, "loss": 2.2726, "step": 458390 }, { "epoch": 0.8, "learning_rate": 1.0030273754259427e-05, "loss": 2.2427, "step": 458400 }, { "epoch": 0.8, "learning_rate": 1.00294018143326e-05, "loss": 2.2935, "step": 458410 }, { "epoch": 0.8, "learning_rate": 1.0028529874405772e-05, "loss": 2.2865, "step": 458420 }, { "epoch": 0.8, "learning_rate": 1.0027657934478948e-05, "loss": 2.3111, "step": 458430 }, { "epoch": 0.8, "learning_rate": 1.002678599455212e-05, "loss": 2.2273, "step": 458440 }, { "epoch": 0.8, "learning_rate": 1.0025914054625294e-05, "loss": 2.3415, "step": 458450 }, { "epoch": 0.8, "learning_rate": 1.0025042114698466e-05, "loss": 2.3635, "step": 458460 }, { "epoch": 0.8, "learning_rate": 1.002417017477164e-05, "loss": 2.3311, "step": 458470 }, { "epoch": 0.8, "learning_rate": 1.0023298234844812e-05, "loss": 2.2854, "step": 458480 }, { "epoch": 0.8, "learning_rate": 1.0022426294917985e-05, "loss": 2.3056, "step": 458490 }, { "epoch": 0.8, "learning_rate": 1.0021554354991159e-05, "loss": 2.241, "step": 458500 }, { "epoch": 0.8, "learning_rate": 1.0020682415064333e-05, "loss": 2.3025, "step": 458510 }, { "epoch": 0.8, "learning_rate": 1.0019810475137507e-05, "loss": 2.2092, "step": 458520 }, { "epoch": 0.8, "learning_rate": 1.0018938535210679e-05, "loss": 2.3765, "step": 458530 }, { "epoch": 0.8, "learning_rate": 1.0018066595283853e-05, "loss": 2.1046, "step": 458540 }, { "epoch": 0.8, "learning_rate": 1.0017194655357025e-05, "loss": 2.3204, "step": 458550 }, { "epoch": 0.8, "learning_rate": 1.0016322715430198e-05, "loss": 2.2965, "step": 458560 }, { "epoch": 0.8, "learning_rate": 1.001545077550337e-05, "loss": 2.1909, "step": 458570 }, { "epoch": 0.8, "learning_rate": 1.0014578835576544e-05, "loss": 2.3328, "step": 458580 }, { "epoch": 0.8, "learning_rate": 1.0013706895649718e-05, "loss": 2.3678, "step": 458590 }, { "epoch": 0.8, "learning_rate": 1.0012834955722892e-05, "loss": 2.1684, "step": 458600 }, { "epoch": 0.8, "learning_rate": 1.0011963015796064e-05, "loss": 2.3882, "step": 458610 }, { "epoch": 0.8, "learning_rate": 1.0011091075869238e-05, "loss": 2.3761, "step": 458620 }, { "epoch": 0.8, "learning_rate": 1.001021913594241e-05, "loss": 2.3699, "step": 458630 }, { "epoch": 0.8, "learning_rate": 1.0009347196015583e-05, "loss": 2.2884, "step": 458640 }, { "epoch": 0.8, "learning_rate": 1.0008475256088757e-05, "loss": 2.2661, "step": 458650 }, { "epoch": 0.8, "learning_rate": 1.000760331616193e-05, "loss": 2.2008, "step": 458660 }, { "epoch": 0.8, "learning_rate": 1.0006731376235105e-05, "loss": 2.387, "step": 458670 }, { "epoch": 0.8, "learning_rate": 1.0005859436308277e-05, "loss": 2.1805, "step": 458680 }, { "epoch": 0.8, "learning_rate": 1.000498749638145e-05, "loss": 2.3639, "step": 458690 }, { "epoch": 0.8, "learning_rate": 1.0004115556454623e-05, "loss": 2.3196, "step": 458700 }, { "epoch": 0.8, "learning_rate": 1.0003243616527796e-05, "loss": 2.1667, "step": 458710 }, { "epoch": 0.8, "learning_rate": 1.0002371676600969e-05, "loss": 2.2237, "step": 458720 }, { "epoch": 0.8, "learning_rate": 1.0001499736674142e-05, "loss": 2.3328, "step": 458730 }, { "epoch": 0.8, "learning_rate": 1.0000627796747316e-05, "loss": 2.2116, "step": 458740 }, { "epoch": 0.8, "learning_rate": 9.99975585682049e-06, "loss": 2.3603, "step": 458750 }, { "epoch": 0.8, "learning_rate": 9.998883916893662e-06, "loss": 2.2597, "step": 458760 }, { "epoch": 0.8, "learning_rate": 9.998011976966836e-06, "loss": 2.3841, "step": 458770 }, { "epoch": 0.8, "learning_rate": 9.99714003704001e-06, "loss": 2.3041, "step": 458780 }, { "epoch": 0.8, "learning_rate": 9.996268097113182e-06, "loss": 2.2805, "step": 458790 }, { "epoch": 0.8, "learning_rate": 9.995396157186355e-06, "loss": 2.1132, "step": 458800 }, { "epoch": 0.8, "learning_rate": 9.994524217259527e-06, "loss": 2.3801, "step": 458810 }, { "epoch": 0.8, "learning_rate": 9.993652277332701e-06, "loss": 2.2965, "step": 458820 }, { "epoch": 0.8, "learning_rate": 9.992780337405875e-06, "loss": 2.2712, "step": 458830 }, { "epoch": 0.8, "learning_rate": 9.991908397479049e-06, "loss": 2.2052, "step": 458840 }, { "epoch": 0.8, "learning_rate": 9.99103645755222e-06, "loss": 2.3493, "step": 458850 }, { "epoch": 0.8, "learning_rate": 9.990164517625395e-06, "loss": 2.2523, "step": 458860 }, { "epoch": 0.8, "learning_rate": 9.989292577698567e-06, "loss": 2.1716, "step": 458870 }, { "epoch": 0.8, "learning_rate": 9.98842063777174e-06, "loss": 2.2131, "step": 458880 }, { "epoch": 0.8, "learning_rate": 9.987548697844912e-06, "loss": 2.181, "step": 458890 }, { "epoch": 0.8, "learning_rate": 9.986676757918086e-06, "loss": 2.3255, "step": 458900 }, { "epoch": 0.8, "learning_rate": 9.985804817991262e-06, "loss": 2.2251, "step": 458910 }, { "epoch": 0.8, "learning_rate": 9.984932878064434e-06, "loss": 2.3024, "step": 458920 }, { "epoch": 0.8, "learning_rate": 9.984060938137608e-06, "loss": 2.2322, "step": 458930 }, { "epoch": 0.8, "learning_rate": 9.98318899821078e-06, "loss": 2.2235, "step": 458940 }, { "epoch": 0.8, "learning_rate": 9.982317058283953e-06, "loss": 2.3719, "step": 458950 }, { "epoch": 0.8, "learning_rate": 9.981445118357125e-06, "loss": 2.2881, "step": 458960 }, { "epoch": 0.8, "learning_rate": 9.9805731784303e-06, "loss": 2.223, "step": 458970 }, { "epoch": 0.8, "learning_rate": 9.979701238503473e-06, "loss": 2.2339, "step": 458980 }, { "epoch": 0.8, "learning_rate": 9.978829298576647e-06, "loss": 2.1285, "step": 458990 }, { "epoch": 0.8, "learning_rate": 9.977957358649819e-06, "loss": 2.3414, "step": 459000 }, { "epoch": 0.8, "learning_rate": 9.977085418722993e-06, "loss": 2.2691, "step": 459010 }, { "epoch": 0.8, "learning_rate": 9.976213478796165e-06, "loss": 2.3539, "step": 459020 }, { "epoch": 0.8, "learning_rate": 9.975341538869338e-06, "loss": 2.2187, "step": 459030 }, { "epoch": 0.8, "learning_rate": 9.974469598942512e-06, "loss": 2.2154, "step": 459040 }, { "epoch": 0.8, "learning_rate": 9.973597659015684e-06, "loss": 2.2027, "step": 459050 }, { "epoch": 0.8, "learning_rate": 9.972725719088858e-06, "loss": 2.289, "step": 459060 }, { "epoch": 0.8, "learning_rate": 9.971853779162032e-06, "loss": 2.2903, "step": 459070 }, { "epoch": 0.8, "learning_rate": 9.970981839235206e-06, "loss": 2.2789, "step": 459080 }, { "epoch": 0.8, "learning_rate": 9.970109899308378e-06, "loss": 2.1605, "step": 459090 }, { "epoch": 0.8, "learning_rate": 9.969237959381551e-06, "loss": 2.2421, "step": 459100 }, { "epoch": 0.8, "learning_rate": 9.968366019454724e-06, "loss": 2.2792, "step": 459110 }, { "epoch": 0.8, "learning_rate": 9.967494079527897e-06, "loss": 2.2682, "step": 459120 }, { "epoch": 0.8, "learning_rate": 9.96662213960107e-06, "loss": 2.4117, "step": 459130 }, { "epoch": 0.8, "learning_rate": 9.965750199674243e-06, "loss": 2.3045, "step": 459140 }, { "epoch": 0.8, "learning_rate": 9.964878259747417e-06, "loss": 2.2914, "step": 459150 }, { "epoch": 0.8, "learning_rate": 9.96400631982059e-06, "loss": 2.3532, "step": 459160 }, { "epoch": 0.8, "learning_rate": 9.963134379893763e-06, "loss": 2.2648, "step": 459170 }, { "epoch": 0.8, "learning_rate": 9.962262439966937e-06, "loss": 2.2499, "step": 459180 }, { "epoch": 0.8, "learning_rate": 9.96139050004011e-06, "loss": 2.3808, "step": 459190 }, { "epoch": 0.8, "learning_rate": 9.960518560113282e-06, "loss": 2.2252, "step": 459200 }, { "epoch": 0.8, "learning_rate": 9.959646620186456e-06, "loss": 2.3499, "step": 459210 }, { "epoch": 0.8, "learning_rate": 9.95877468025963e-06, "loss": 2.3076, "step": 459220 }, { "epoch": 0.8, "learning_rate": 9.957902740332804e-06, "loss": 2.2194, "step": 459230 }, { "epoch": 0.8, "learning_rate": 9.957030800405976e-06, "loss": 2.2813, "step": 459240 }, { "epoch": 0.8, "learning_rate": 9.95615886047915e-06, "loss": 2.2945, "step": 459250 }, { "epoch": 0.8, "learning_rate": 9.955286920552322e-06, "loss": 2.3421, "step": 459260 }, { "epoch": 0.8, "learning_rate": 9.954414980625495e-06, "loss": 2.2655, "step": 459270 }, { "epoch": 0.8, "learning_rate": 9.953543040698667e-06, "loss": 2.3175, "step": 459280 }, { "epoch": 0.8, "learning_rate": 9.952671100771841e-06, "loss": 2.3767, "step": 459290 }, { "epoch": 0.8, "learning_rate": 9.951799160845015e-06, "loss": 2.3178, "step": 459300 }, { "epoch": 0.8, "learning_rate": 9.950927220918189e-06, "loss": 2.2262, "step": 459310 }, { "epoch": 0.8, "learning_rate": 9.950055280991363e-06, "loss": 2.337, "step": 459320 }, { "epoch": 0.8, "learning_rate": 9.949183341064535e-06, "loss": 2.3416, "step": 459330 }, { "epoch": 0.8, "learning_rate": 9.948311401137708e-06, "loss": 2.1605, "step": 459340 }, { "epoch": 0.8, "learning_rate": 9.94743946121088e-06, "loss": 2.3179, "step": 459350 }, { "epoch": 0.8, "learning_rate": 9.946567521284054e-06, "loss": 2.3776, "step": 459360 }, { "epoch": 0.8, "learning_rate": 9.945695581357226e-06, "loss": 2.3356, "step": 459370 }, { "epoch": 0.8, "learning_rate": 9.9448236414304e-06, "loss": 2.302, "step": 459380 }, { "epoch": 0.8, "learning_rate": 9.943951701503574e-06, "loss": 2.2167, "step": 459390 }, { "epoch": 0.8, "learning_rate": 9.943079761576748e-06, "loss": 2.3249, "step": 459400 }, { "epoch": 0.8, "learning_rate": 9.94220782164992e-06, "loss": 2.2319, "step": 459410 }, { "epoch": 0.8, "learning_rate": 9.941335881723093e-06, "loss": 2.2735, "step": 459420 }, { "epoch": 0.8, "learning_rate": 9.940463941796266e-06, "loss": 2.369, "step": 459430 }, { "epoch": 0.8, "learning_rate": 9.93959200186944e-06, "loss": 2.2707, "step": 459440 }, { "epoch": 0.8, "learning_rate": 9.938720061942613e-06, "loss": 2.2711, "step": 459450 }, { "epoch": 0.8, "learning_rate": 9.937848122015785e-06, "loss": 2.3094, "step": 459460 }, { "epoch": 0.8, "learning_rate": 9.93697618208896e-06, "loss": 2.2569, "step": 459470 }, { "epoch": 0.8, "learning_rate": 9.936104242162133e-06, "loss": 2.2734, "step": 459480 }, { "epoch": 0.8, "learning_rate": 9.935232302235306e-06, "loss": 2.2205, "step": 459490 }, { "epoch": 0.8, "learning_rate": 9.934360362308479e-06, "loss": 2.2177, "step": 459500 }, { "epoch": 0.8, "learning_rate": 9.933488422381652e-06, "loss": 2.2526, "step": 459510 }, { "epoch": 0.8, "learning_rate": 9.932616482454824e-06, "loss": 2.2605, "step": 459520 }, { "epoch": 0.8, "learning_rate": 9.931744542527998e-06, "loss": 2.278, "step": 459530 }, { "epoch": 0.8, "learning_rate": 9.930872602601172e-06, "loss": 2.2297, "step": 459540 }, { "epoch": 0.8, "learning_rate": 9.930000662674346e-06, "loss": 2.17, "step": 459550 }, { "epoch": 0.8, "learning_rate": 9.929128722747518e-06, "loss": 2.2, "step": 459560 }, { "epoch": 0.8, "learning_rate": 9.928256782820692e-06, "loss": 2.2844, "step": 459570 }, { "epoch": 0.8, "learning_rate": 9.927384842893865e-06, "loss": 2.2453, "step": 459580 }, { "epoch": 0.8, "learning_rate": 9.926512902967037e-06, "loss": 2.3461, "step": 459590 }, { "epoch": 0.8, "learning_rate": 9.925640963040211e-06, "loss": 2.2285, "step": 459600 }, { "epoch": 0.8, "learning_rate": 9.924769023113383e-06, "loss": 2.1742, "step": 459610 }, { "epoch": 0.8, "learning_rate": 9.923897083186557e-06, "loss": 2.3657, "step": 459620 }, { "epoch": 0.8, "learning_rate": 9.92302514325973e-06, "loss": 2.3206, "step": 459630 }, { "epoch": 0.8, "learning_rate": 9.922153203332905e-06, "loss": 2.2691, "step": 459640 }, { "epoch": 0.8, "learning_rate": 9.921281263406077e-06, "loss": 2.2035, "step": 459650 }, { "epoch": 0.8, "learning_rate": 9.92040932347925e-06, "loss": 2.3607, "step": 459660 }, { "epoch": 0.8, "learning_rate": 9.919537383552422e-06, "loss": 2.2331, "step": 459670 }, { "epoch": 0.8, "learning_rate": 9.918665443625596e-06, "loss": 2.1333, "step": 459680 }, { "epoch": 0.8, "learning_rate": 9.917793503698768e-06, "loss": 2.2003, "step": 459690 }, { "epoch": 0.8, "learning_rate": 9.916921563771942e-06, "loss": 2.2191, "step": 459700 }, { "epoch": 0.8, "learning_rate": 9.916049623845118e-06, "loss": 2.4377, "step": 459710 }, { "epoch": 0.8, "learning_rate": 9.91517768391829e-06, "loss": 2.3826, "step": 459720 }, { "epoch": 0.8, "learning_rate": 9.914305743991463e-06, "loss": 2.2306, "step": 459730 }, { "epoch": 0.8, "learning_rate": 9.913433804064635e-06, "loss": 2.3233, "step": 459740 }, { "epoch": 0.8, "learning_rate": 9.91256186413781e-06, "loss": 2.259, "step": 459750 }, { "epoch": 0.8, "learning_rate": 9.911689924210981e-06, "loss": 2.3186, "step": 459760 }, { "epoch": 0.8, "learning_rate": 9.910817984284155e-06, "loss": 2.2173, "step": 459770 }, { "epoch": 0.8, "learning_rate": 9.909946044357329e-06, "loss": 2.2089, "step": 459780 }, { "epoch": 0.8, "learning_rate": 9.909074104430503e-06, "loss": 2.1254, "step": 459790 }, { "epoch": 0.8, "learning_rate": 9.908202164503675e-06, "loss": 2.2899, "step": 459800 }, { "epoch": 0.8, "learning_rate": 9.907330224576848e-06, "loss": 2.3397, "step": 459810 }, { "epoch": 0.8, "learning_rate": 9.90645828465002e-06, "loss": 2.3194, "step": 459820 }, { "epoch": 0.8, "learning_rate": 9.905586344723194e-06, "loss": 2.192, "step": 459830 }, { "epoch": 0.8, "learning_rate": 9.904714404796368e-06, "loss": 2.3501, "step": 459840 }, { "epoch": 0.8, "learning_rate": 9.90384246486954e-06, "loss": 2.2316, "step": 459850 }, { "epoch": 0.8, "learning_rate": 9.902970524942714e-06, "loss": 2.2887, "step": 459860 }, { "epoch": 0.8, "learning_rate": 9.902098585015888e-06, "loss": 2.2893, "step": 459870 }, { "epoch": 0.8, "learning_rate": 9.901226645089061e-06, "loss": 2.2282, "step": 459880 }, { "epoch": 0.8, "learning_rate": 9.900354705162234e-06, "loss": 2.264, "step": 459890 }, { "epoch": 0.8, "learning_rate": 9.899482765235407e-06, "loss": 2.3938, "step": 459900 }, { "epoch": 0.8, "learning_rate": 9.89861082530858e-06, "loss": 2.3484, "step": 459910 }, { "epoch": 0.8, "learning_rate": 9.897738885381753e-06, "loss": 2.2869, "step": 459920 }, { "epoch": 0.8, "learning_rate": 9.896866945454925e-06, "loss": 2.3862, "step": 459930 }, { "epoch": 0.8, "learning_rate": 9.895995005528099e-06, "loss": 2.3129, "step": 459940 }, { "epoch": 0.8, "learning_rate": 9.895123065601273e-06, "loss": 2.3278, "step": 459950 }, { "epoch": 0.8, "learning_rate": 9.894251125674447e-06, "loss": 2.3507, "step": 459960 }, { "epoch": 0.8, "learning_rate": 9.893379185747619e-06, "loss": 2.3797, "step": 459970 }, { "epoch": 0.8, "learning_rate": 9.892507245820792e-06, "loss": 2.316, "step": 459980 }, { "epoch": 0.8, "learning_rate": 9.891635305893966e-06, "loss": 2.2166, "step": 459990 }, { "epoch": 0.8, "learning_rate": 9.890763365967138e-06, "loss": 2.2996, "step": 460000 }, { "epoch": 0.8, "learning_rate": 9.889891426040312e-06, "loss": 2.3254, "step": 460010 }, { "epoch": 0.8, "learning_rate": 9.889019486113486e-06, "loss": 2.2105, "step": 460020 }, { "epoch": 0.8, "learning_rate": 9.88814754618666e-06, "loss": 2.2586, "step": 460030 }, { "epoch": 0.8, "learning_rate": 9.887275606259832e-06, "loss": 2.2783, "step": 460040 }, { "epoch": 0.8, "learning_rate": 9.886403666333005e-06, "loss": 2.3236, "step": 460050 }, { "epoch": 0.8, "learning_rate": 9.885531726406177e-06, "loss": 2.1681, "step": 460060 }, { "epoch": 0.8, "learning_rate": 9.884659786479351e-06, "loss": 2.2079, "step": 460070 }, { "epoch": 0.8, "learning_rate": 9.883787846552523e-06, "loss": 2.2531, "step": 460080 }, { "epoch": 0.8, "learning_rate": 9.882915906625697e-06, "loss": 2.2716, "step": 460090 }, { "epoch": 0.8, "learning_rate": 9.88204396669887e-06, "loss": 2.3136, "step": 460100 }, { "epoch": 0.8, "learning_rate": 9.881172026772045e-06, "loss": 2.3114, "step": 460110 }, { "epoch": 0.8, "learning_rate": 9.880300086845218e-06, "loss": 2.2314, "step": 460120 }, { "epoch": 0.8, "learning_rate": 9.87942814691839e-06, "loss": 2.2421, "step": 460130 }, { "epoch": 0.8, "learning_rate": 9.878556206991564e-06, "loss": 2.27, "step": 460140 }, { "epoch": 0.8, "learning_rate": 9.877684267064736e-06, "loss": 2.331, "step": 460150 }, { "epoch": 0.8, "learning_rate": 9.87681232713791e-06, "loss": 2.2145, "step": 460160 }, { "epoch": 0.8, "learning_rate": 9.875940387211082e-06, "loss": 2.2758, "step": 460170 }, { "epoch": 0.8, "learning_rate": 9.875068447284256e-06, "loss": 2.2945, "step": 460180 }, { "epoch": 0.8, "learning_rate": 9.87419650735743e-06, "loss": 2.33, "step": 460190 }, { "epoch": 0.8, "learning_rate": 9.873324567430603e-06, "loss": 2.1489, "step": 460200 }, { "epoch": 0.8, "learning_rate": 9.872452627503776e-06, "loss": 2.2552, "step": 460210 }, { "epoch": 0.8, "learning_rate": 9.87158068757695e-06, "loss": 2.3222, "step": 460220 }, { "epoch": 0.8, "learning_rate": 9.870708747650121e-06, "loss": 2.3249, "step": 460230 }, { "epoch": 0.8, "learning_rate": 9.869836807723295e-06, "loss": 2.2406, "step": 460240 }, { "epoch": 0.8, "learning_rate": 9.868964867796469e-06, "loss": 2.2769, "step": 460250 }, { "epoch": 0.8, "learning_rate": 9.868092927869643e-06, "loss": 2.2979, "step": 460260 }, { "epoch": 0.8, "learning_rate": 9.867220987942816e-06, "loss": 2.3454, "step": 460270 }, { "epoch": 0.8, "learning_rate": 9.866349048015989e-06, "loss": 2.2307, "step": 460280 }, { "epoch": 0.8, "learning_rate": 9.865477108089162e-06, "loss": 2.2042, "step": 460290 }, { "epoch": 0.8, "learning_rate": 9.864605168162334e-06, "loss": 2.2946, "step": 460300 }, { "epoch": 0.8, "learning_rate": 9.863733228235508e-06, "loss": 2.3304, "step": 460310 }, { "epoch": 0.8, "learning_rate": 9.86286128830868e-06, "loss": 2.3997, "step": 460320 }, { "epoch": 0.8, "learning_rate": 9.861989348381854e-06, "loss": 2.2052, "step": 460330 }, { "epoch": 0.8, "learning_rate": 9.861117408455028e-06, "loss": 2.2112, "step": 460340 }, { "epoch": 0.8, "learning_rate": 9.860245468528202e-06, "loss": 2.2988, "step": 460350 }, { "epoch": 0.8, "learning_rate": 9.859373528601374e-06, "loss": 2.1461, "step": 460360 }, { "epoch": 0.8, "learning_rate": 9.858501588674547e-06, "loss": 2.2437, "step": 460370 }, { "epoch": 0.8, "learning_rate": 9.857629648747721e-06, "loss": 2.2345, "step": 460380 }, { "epoch": 0.8, "learning_rate": 9.856757708820893e-06, "loss": 2.3012, "step": 460390 }, { "epoch": 0.8, "learning_rate": 9.855885768894067e-06, "loss": 2.2173, "step": 460400 }, { "epoch": 0.8, "learning_rate": 9.855013828967239e-06, "loss": 2.259, "step": 460410 }, { "epoch": 0.8, "learning_rate": 9.854141889040413e-06, "loss": 2.2222, "step": 460420 }, { "epoch": 0.8, "learning_rate": 9.853269949113587e-06, "loss": 2.216, "step": 460430 }, { "epoch": 0.8, "learning_rate": 9.85239800918676e-06, "loss": 2.4202, "step": 460440 }, { "epoch": 0.8, "learning_rate": 9.851526069259932e-06, "loss": 2.2899, "step": 460450 }, { "epoch": 0.8, "learning_rate": 9.850654129333106e-06, "loss": 2.2682, "step": 460460 }, { "epoch": 0.8, "learning_rate": 9.849782189406278e-06, "loss": 2.1516, "step": 460470 }, { "epoch": 0.8, "learning_rate": 9.848910249479452e-06, "loss": 2.2997, "step": 460480 }, { "epoch": 0.8, "learning_rate": 9.848038309552624e-06, "loss": 2.3052, "step": 460490 }, { "epoch": 0.8, "learning_rate": 9.847166369625798e-06, "loss": 2.3291, "step": 460500 }, { "epoch": 0.8, "learning_rate": 9.846294429698973e-06, "loss": 2.1916, "step": 460510 }, { "epoch": 0.8, "learning_rate": 9.845422489772145e-06, "loss": 2.1937, "step": 460520 }, { "epoch": 0.8, "learning_rate": 9.84455054984532e-06, "loss": 2.1999, "step": 460530 }, { "epoch": 0.8, "learning_rate": 9.843678609918491e-06, "loss": 2.2219, "step": 460540 }, { "epoch": 0.8, "learning_rate": 9.842806669991665e-06, "loss": 2.3913, "step": 460550 }, { "epoch": 0.8, "learning_rate": 9.841934730064837e-06, "loss": 2.4393, "step": 460560 }, { "epoch": 0.8, "learning_rate": 9.841062790138011e-06, "loss": 2.3071, "step": 460570 }, { "epoch": 0.8, "learning_rate": 9.840190850211185e-06, "loss": 2.3381, "step": 460580 }, { "epoch": 0.8, "learning_rate": 9.839318910284358e-06, "loss": 2.3493, "step": 460590 }, { "epoch": 0.8, "learning_rate": 9.83844697035753e-06, "loss": 2.2347, "step": 460600 }, { "epoch": 0.8, "learning_rate": 9.837575030430704e-06, "loss": 2.3319, "step": 460610 }, { "epoch": 0.8, "learning_rate": 9.836703090503876e-06, "loss": 2.2805, "step": 460620 }, { "epoch": 0.8, "learning_rate": 9.83583115057705e-06, "loss": 2.2221, "step": 460630 }, { "epoch": 0.8, "learning_rate": 9.834959210650224e-06, "loss": 2.3207, "step": 460640 }, { "epoch": 0.8, "learning_rate": 9.834087270723396e-06, "loss": 2.3358, "step": 460650 }, { "epoch": 0.8, "learning_rate": 9.83321533079657e-06, "loss": 2.449, "step": 460660 }, { "epoch": 0.8, "learning_rate": 9.832343390869744e-06, "loss": 2.3289, "step": 460670 }, { "epoch": 0.8, "learning_rate": 9.831471450942917e-06, "loss": 2.1865, "step": 460680 }, { "epoch": 0.8, "learning_rate": 9.83059951101609e-06, "loss": 2.2791, "step": 460690 }, { "epoch": 0.8, "learning_rate": 9.829727571089263e-06, "loss": 2.3125, "step": 460700 }, { "epoch": 0.8, "learning_rate": 9.828855631162435e-06, "loss": 2.2768, "step": 460710 }, { "epoch": 0.8, "learning_rate": 9.827983691235609e-06, "loss": 2.3149, "step": 460720 }, { "epoch": 0.8, "learning_rate": 9.827111751308781e-06, "loss": 2.2623, "step": 460730 }, { "epoch": 0.8, "learning_rate": 9.826239811381955e-06, "loss": 2.2918, "step": 460740 }, { "epoch": 0.8, "learning_rate": 9.825367871455129e-06, "loss": 2.3039, "step": 460750 }, { "epoch": 0.8, "learning_rate": 9.824495931528302e-06, "loss": 2.2642, "step": 460760 }, { "epoch": 0.8, "learning_rate": 9.823623991601476e-06, "loss": 2.3009, "step": 460770 }, { "epoch": 0.8, "learning_rate": 9.822752051674648e-06, "loss": 2.3608, "step": 460780 }, { "epoch": 0.8, "learning_rate": 9.821880111747822e-06, "loss": 2.1848, "step": 460790 }, { "epoch": 0.8, "learning_rate": 9.821008171820994e-06, "loss": 2.2706, "step": 460800 }, { "epoch": 0.8, "learning_rate": 9.820136231894168e-06, "loss": 2.4928, "step": 460810 }, { "epoch": 0.8, "learning_rate": 9.819264291967342e-06, "loss": 2.1858, "step": 460820 }, { "epoch": 0.8, "learning_rate": 9.818392352040515e-06, "loss": 2.3026, "step": 460830 }, { "epoch": 0.8, "learning_rate": 9.817520412113687e-06, "loss": 2.3787, "step": 460840 }, { "epoch": 0.8, "learning_rate": 9.816648472186861e-06, "loss": 2.229, "step": 460850 }, { "epoch": 0.8, "learning_rate": 9.815776532260033e-06, "loss": 2.2501, "step": 460860 }, { "epoch": 0.8, "learning_rate": 9.814904592333207e-06, "loss": 2.3331, "step": 460870 }, { "epoch": 0.8, "learning_rate": 9.814032652406379e-06, "loss": 2.2698, "step": 460880 }, { "epoch": 0.8, "learning_rate": 9.813160712479553e-06, "loss": 2.157, "step": 460890 }, { "epoch": 0.8, "learning_rate": 9.812288772552727e-06, "loss": 2.3676, "step": 460900 }, { "epoch": 0.8, "learning_rate": 9.8114168326259e-06, "loss": 2.3883, "step": 460910 }, { "epoch": 0.8, "learning_rate": 9.810544892699074e-06, "loss": 2.1903, "step": 460920 }, { "epoch": 0.8, "learning_rate": 9.809672952772246e-06, "loss": 2.246, "step": 460930 }, { "epoch": 0.8, "learning_rate": 9.80880101284542e-06, "loss": 2.3466, "step": 460940 }, { "epoch": 0.8, "learning_rate": 9.807929072918592e-06, "loss": 2.3384, "step": 460950 }, { "epoch": 0.8, "learning_rate": 9.807057132991766e-06, "loss": 2.3993, "step": 460960 }, { "epoch": 0.8, "learning_rate": 9.806185193064938e-06, "loss": 2.2644, "step": 460970 }, { "epoch": 0.8, "learning_rate": 9.805313253138112e-06, "loss": 2.2528, "step": 460980 }, { "epoch": 0.8, "learning_rate": 9.804441313211286e-06, "loss": 2.3014, "step": 460990 }, { "epoch": 0.8, "learning_rate": 9.80356937328446e-06, "loss": 2.2652, "step": 461000 }, { "epoch": 0.8, "learning_rate": 9.802697433357631e-06, "loss": 2.3375, "step": 461010 }, { "epoch": 0.8, "learning_rate": 9.801825493430805e-06, "loss": 2.2792, "step": 461020 }, { "epoch": 0.8, "learning_rate": 9.800953553503977e-06, "loss": 2.3274, "step": 461030 }, { "epoch": 0.8, "learning_rate": 9.800081613577151e-06, "loss": 2.2519, "step": 461040 }, { "epoch": 0.8, "learning_rate": 9.799209673650325e-06, "loss": 2.2746, "step": 461050 }, { "epoch": 0.8, "learning_rate": 9.798337733723499e-06, "loss": 2.2612, "step": 461060 }, { "epoch": 0.8, "learning_rate": 9.797465793796672e-06, "loss": 2.2038, "step": 461070 }, { "epoch": 0.8, "learning_rate": 9.796593853869844e-06, "loss": 2.3006, "step": 461080 }, { "epoch": 0.8, "learning_rate": 9.795721913943018e-06, "loss": 2.3086, "step": 461090 }, { "epoch": 0.8, "learning_rate": 9.79484997401619e-06, "loss": 2.2805, "step": 461100 }, { "epoch": 0.8, "learning_rate": 9.793978034089364e-06, "loss": 2.2433, "step": 461110 }, { "epoch": 0.8, "learning_rate": 9.793106094162536e-06, "loss": 2.3381, "step": 461120 }, { "epoch": 0.8, "learning_rate": 9.79223415423571e-06, "loss": 2.1596, "step": 461130 }, { "epoch": 0.8, "learning_rate": 9.791362214308884e-06, "loss": 2.164, "step": 461140 }, { "epoch": 0.8, "learning_rate": 9.790490274382057e-06, "loss": 2.2251, "step": 461150 }, { "epoch": 0.8, "learning_rate": 9.78961833445523e-06, "loss": 2.2668, "step": 461160 }, { "epoch": 0.8, "learning_rate": 9.788746394528403e-06, "loss": 2.243, "step": 461170 }, { "epoch": 0.8, "learning_rate": 9.787874454601577e-06, "loss": 2.2959, "step": 461180 }, { "epoch": 0.8, "learning_rate": 9.787002514674749e-06, "loss": 2.269, "step": 461190 }, { "epoch": 0.8, "learning_rate": 9.786130574747923e-06, "loss": 2.3094, "step": 461200 }, { "epoch": 0.8, "learning_rate": 9.785258634821095e-06, "loss": 2.302, "step": 461210 }, { "epoch": 0.8, "learning_rate": 9.784386694894269e-06, "loss": 2.161, "step": 461220 }, { "epoch": 0.8, "learning_rate": 9.783514754967442e-06, "loss": 2.2233, "step": 461230 }, { "epoch": 0.8, "learning_rate": 9.782642815040616e-06, "loss": 2.2141, "step": 461240 }, { "epoch": 0.8, "learning_rate": 9.781770875113788e-06, "loss": 2.2958, "step": 461250 }, { "epoch": 0.8, "learning_rate": 9.780898935186962e-06, "loss": 2.1967, "step": 461260 }, { "epoch": 0.8, "learning_rate": 9.780026995260134e-06, "loss": 2.3022, "step": 461270 }, { "epoch": 0.8, "learning_rate": 9.779155055333308e-06, "loss": 2.2211, "step": 461280 }, { "epoch": 0.8, "learning_rate": 9.77828311540648e-06, "loss": 2.2893, "step": 461290 }, { "epoch": 0.8, "learning_rate": 9.777411175479655e-06, "loss": 2.3421, "step": 461300 }, { "epoch": 0.8, "learning_rate": 9.77653923555283e-06, "loss": 2.3761, "step": 461310 }, { "epoch": 0.8, "learning_rate": 9.775667295626001e-06, "loss": 2.2286, "step": 461320 }, { "epoch": 0.8, "learning_rate": 9.774795355699175e-06, "loss": 2.2997, "step": 461330 }, { "epoch": 0.8, "learning_rate": 9.773923415772347e-06, "loss": 2.2914, "step": 461340 }, { "epoch": 0.8, "learning_rate": 9.773051475845521e-06, "loss": 2.2417, "step": 461350 }, { "epoch": 0.8, "learning_rate": 9.772179535918693e-06, "loss": 2.2785, "step": 461360 }, { "epoch": 0.8, "learning_rate": 9.771307595991867e-06, "loss": 2.3267, "step": 461370 }, { "epoch": 0.8, "learning_rate": 9.77043565606504e-06, "loss": 2.1927, "step": 461380 }, { "epoch": 0.8, "learning_rate": 9.769563716138214e-06, "loss": 2.1601, "step": 461390 }, { "epoch": 0.8, "learning_rate": 9.768691776211386e-06, "loss": 2.307, "step": 461400 }, { "epoch": 0.8, "learning_rate": 9.76781983628456e-06, "loss": 2.3399, "step": 461410 }, { "epoch": 0.8, "learning_rate": 9.766947896357732e-06, "loss": 2.3713, "step": 461420 }, { "epoch": 0.8, "learning_rate": 9.766075956430906e-06, "loss": 2.2372, "step": 461430 }, { "epoch": 0.8, "learning_rate": 9.76520401650408e-06, "loss": 2.2618, "step": 461440 }, { "epoch": 0.8, "learning_rate": 9.764332076577252e-06, "loss": 2.236, "step": 461450 }, { "epoch": 0.8, "learning_rate": 9.763460136650426e-06, "loss": 2.2066, "step": 461460 }, { "epoch": 0.8, "learning_rate": 9.7625881967236e-06, "loss": 2.263, "step": 461470 }, { "epoch": 0.8, "learning_rate": 9.761716256796773e-06, "loss": 2.2171, "step": 461480 }, { "epoch": 0.8, "learning_rate": 9.760844316869945e-06, "loss": 2.2325, "step": 461490 }, { "epoch": 0.8, "learning_rate": 9.759972376943119e-06, "loss": 2.3289, "step": 461500 }, { "epoch": 0.8, "learning_rate": 9.759100437016291e-06, "loss": 2.1298, "step": 461510 }, { "epoch": 0.8, "learning_rate": 9.758228497089465e-06, "loss": 2.3865, "step": 461520 }, { "epoch": 0.8, "learning_rate": 9.757356557162637e-06, "loss": 2.2719, "step": 461530 }, { "epoch": 0.8, "learning_rate": 9.756484617235812e-06, "loss": 2.1885, "step": 461540 }, { "epoch": 0.8, "learning_rate": 9.755612677308984e-06, "loss": 2.1713, "step": 461550 }, { "epoch": 0.8, "learning_rate": 9.754740737382158e-06, "loss": 2.3244, "step": 461560 }, { "epoch": 0.8, "learning_rate": 9.753868797455332e-06, "loss": 2.1511, "step": 461570 }, { "epoch": 0.8, "learning_rate": 9.752996857528504e-06, "loss": 2.2641, "step": 461580 }, { "epoch": 0.8, "learning_rate": 9.752124917601678e-06, "loss": 2.3371, "step": 461590 }, { "epoch": 0.8, "learning_rate": 9.75125297767485e-06, "loss": 2.3791, "step": 461600 }, { "epoch": 0.8, "learning_rate": 9.750381037748024e-06, "loss": 2.2319, "step": 461610 }, { "epoch": 0.81, "learning_rate": 9.749509097821197e-06, "loss": 2.2948, "step": 461620 }, { "epoch": 0.81, "learning_rate": 9.748637157894371e-06, "loss": 2.2818, "step": 461630 }, { "epoch": 0.81, "learning_rate": 9.747765217967543e-06, "loss": 2.2277, "step": 461640 }, { "epoch": 0.81, "learning_rate": 9.746893278040717e-06, "loss": 2.2864, "step": 461650 }, { "epoch": 0.81, "learning_rate": 9.746021338113889e-06, "loss": 2.2742, "step": 461660 }, { "epoch": 0.81, "learning_rate": 9.745149398187063e-06, "loss": 2.1785, "step": 461670 }, { "epoch": 0.81, "learning_rate": 9.744277458260235e-06, "loss": 2.4142, "step": 461680 }, { "epoch": 0.81, "learning_rate": 9.743405518333409e-06, "loss": 2.2952, "step": 461690 }, { "epoch": 0.81, "learning_rate": 9.742533578406583e-06, "loss": 2.281, "step": 461700 }, { "epoch": 0.81, "learning_rate": 9.741661638479756e-06, "loss": 2.2048, "step": 461710 }, { "epoch": 0.81, "learning_rate": 9.74078969855293e-06, "loss": 2.3189, "step": 461720 }, { "epoch": 0.81, "learning_rate": 9.739917758626102e-06, "loss": 2.3236, "step": 461730 }, { "epoch": 0.81, "learning_rate": 9.739045818699276e-06, "loss": 2.2812, "step": 461740 }, { "epoch": 0.81, "learning_rate": 9.738173878772448e-06, "loss": 2.3552, "step": 461750 }, { "epoch": 0.81, "learning_rate": 9.737301938845622e-06, "loss": 2.322, "step": 461760 }, { "epoch": 0.81, "learning_rate": 9.736429998918794e-06, "loss": 2.3071, "step": 461770 }, { "epoch": 0.81, "learning_rate": 9.735558058991968e-06, "loss": 2.3435, "step": 461780 }, { "epoch": 0.81, "learning_rate": 9.734686119065141e-06, "loss": 2.2909, "step": 461790 }, { "epoch": 0.81, "learning_rate": 9.733814179138315e-06, "loss": 2.3062, "step": 461800 }, { "epoch": 0.81, "learning_rate": 9.732942239211487e-06, "loss": 2.2117, "step": 461810 }, { "epoch": 0.81, "learning_rate": 9.732070299284661e-06, "loss": 2.2615, "step": 461820 }, { "epoch": 0.81, "learning_rate": 9.731198359357833e-06, "loss": 2.3769, "step": 461830 }, { "epoch": 0.81, "learning_rate": 9.730326419431007e-06, "loss": 2.2025, "step": 461840 }, { "epoch": 0.81, "learning_rate": 9.72945447950418e-06, "loss": 2.2856, "step": 461850 }, { "epoch": 0.81, "learning_rate": 9.728582539577354e-06, "loss": 2.2502, "step": 461860 }, { "epoch": 0.81, "learning_rate": 9.727710599650528e-06, "loss": 2.1335, "step": 461870 }, { "epoch": 0.81, "learning_rate": 9.7268386597237e-06, "loss": 2.2497, "step": 461880 }, { "epoch": 0.81, "learning_rate": 9.725966719796874e-06, "loss": 2.1398, "step": 461890 }, { "epoch": 0.81, "learning_rate": 9.725094779870046e-06, "loss": 2.3193, "step": 461900 }, { "epoch": 0.81, "learning_rate": 9.72422283994322e-06, "loss": 2.2169, "step": 461910 }, { "epoch": 0.81, "learning_rate": 9.723350900016392e-06, "loss": 2.2593, "step": 461920 }, { "epoch": 0.81, "learning_rate": 9.722478960089566e-06, "loss": 2.2068, "step": 461930 }, { "epoch": 0.81, "learning_rate": 9.72160702016274e-06, "loss": 2.1866, "step": 461940 }, { "epoch": 0.81, "learning_rate": 9.720735080235913e-06, "loss": 2.315, "step": 461950 }, { "epoch": 0.81, "learning_rate": 9.719863140309085e-06, "loss": 2.2587, "step": 461960 }, { "epoch": 0.81, "learning_rate": 9.718991200382259e-06, "loss": 2.2719, "step": 461970 }, { "epoch": 0.81, "learning_rate": 9.718119260455433e-06, "loss": 2.2694, "step": 461980 }, { "epoch": 0.81, "learning_rate": 9.717247320528605e-06, "loss": 2.0898, "step": 461990 }, { "epoch": 0.81, "learning_rate": 9.716375380601779e-06, "loss": 2.2857, "step": 462000 }, { "epoch": 0.81, "learning_rate": 9.71550344067495e-06, "loss": 2.2594, "step": 462010 }, { "epoch": 0.81, "learning_rate": 9.714631500748125e-06, "loss": 2.2779, "step": 462020 }, { "epoch": 0.81, "learning_rate": 9.713759560821298e-06, "loss": 2.2759, "step": 462030 }, { "epoch": 0.81, "learning_rate": 9.712887620894472e-06, "loss": 2.2726, "step": 462040 }, { "epoch": 0.81, "learning_rate": 9.712015680967644e-06, "loss": 2.3134, "step": 462050 }, { "epoch": 0.81, "learning_rate": 9.711143741040818e-06, "loss": 2.2181, "step": 462060 }, { "epoch": 0.81, "learning_rate": 9.71027180111399e-06, "loss": 2.315, "step": 462070 }, { "epoch": 0.81, "learning_rate": 9.709399861187164e-06, "loss": 2.3029, "step": 462080 }, { "epoch": 0.81, "learning_rate": 9.708527921260336e-06, "loss": 2.302, "step": 462090 }, { "epoch": 0.81, "learning_rate": 9.707655981333511e-06, "loss": 2.2265, "step": 462100 }, { "epoch": 0.81, "learning_rate": 9.706784041406685e-06, "loss": 2.3033, "step": 462110 }, { "epoch": 0.81, "learning_rate": 9.705912101479857e-06, "loss": 2.2984, "step": 462120 }, { "epoch": 0.81, "learning_rate": 9.705040161553031e-06, "loss": 2.2442, "step": 462130 }, { "epoch": 0.81, "learning_rate": 9.704168221626203e-06, "loss": 2.3654, "step": 462140 }, { "epoch": 0.81, "learning_rate": 9.703296281699377e-06, "loss": 2.293, "step": 462150 }, { "epoch": 0.81, "learning_rate": 9.702424341772549e-06, "loss": 2.3781, "step": 462160 }, { "epoch": 0.81, "learning_rate": 9.701552401845723e-06, "loss": 2.3354, "step": 462170 }, { "epoch": 0.81, "learning_rate": 9.700680461918896e-06, "loss": 2.2997, "step": 462180 }, { "epoch": 0.81, "learning_rate": 9.69980852199207e-06, "loss": 2.1891, "step": 462190 }, { "epoch": 0.81, "learning_rate": 9.698936582065242e-06, "loss": 2.1401, "step": 462200 }, { "epoch": 0.81, "learning_rate": 9.698064642138416e-06, "loss": 2.2428, "step": 462210 }, { "epoch": 0.81, "learning_rate": 9.697192702211588e-06, "loss": 2.3894, "step": 462220 }, { "epoch": 0.81, "learning_rate": 9.696320762284762e-06, "loss": 2.138, "step": 462230 }, { "epoch": 0.81, "learning_rate": 9.695448822357936e-06, "loss": 2.3338, "step": 462240 }, { "epoch": 0.81, "learning_rate": 9.694576882431108e-06, "loss": 2.3364, "step": 462250 }, { "epoch": 0.81, "learning_rate": 9.693704942504281e-06, "loss": 2.3063, "step": 462260 }, { "epoch": 0.81, "learning_rate": 9.692833002577455e-06, "loss": 2.3859, "step": 462270 }, { "epoch": 0.81, "learning_rate": 9.691961062650629e-06, "loss": 2.1622, "step": 462280 }, { "epoch": 0.81, "learning_rate": 9.691089122723801e-06, "loss": 2.216, "step": 462290 }, { "epoch": 0.81, "learning_rate": 9.690217182796975e-06, "loss": 2.2386, "step": 462300 }, { "epoch": 0.81, "learning_rate": 9.689345242870147e-06, "loss": 2.4427, "step": 462310 }, { "epoch": 0.81, "learning_rate": 9.68847330294332e-06, "loss": 2.2906, "step": 462320 }, { "epoch": 0.81, "learning_rate": 9.687601363016493e-06, "loss": 2.1312, "step": 462330 }, { "epoch": 0.81, "learning_rate": 9.686729423089668e-06, "loss": 2.3482, "step": 462340 }, { "epoch": 0.81, "learning_rate": 9.68585748316284e-06, "loss": 2.2903, "step": 462350 }, { "epoch": 0.81, "learning_rate": 9.684985543236014e-06, "loss": 2.3512, "step": 462360 }, { "epoch": 0.81, "learning_rate": 9.684113603309188e-06, "loss": 2.1794, "step": 462370 }, { "epoch": 0.81, "learning_rate": 9.68324166338236e-06, "loss": 2.2717, "step": 462380 }, { "epoch": 0.81, "learning_rate": 9.682369723455534e-06, "loss": 2.2021, "step": 462390 }, { "epoch": 0.81, "learning_rate": 9.681497783528706e-06, "loss": 2.2041, "step": 462400 }, { "epoch": 0.81, "learning_rate": 9.68062584360188e-06, "loss": 2.4284, "step": 462410 }, { "epoch": 0.81, "learning_rate": 9.679753903675053e-06, "loss": 2.2501, "step": 462420 }, { "epoch": 0.81, "learning_rate": 9.678881963748227e-06, "loss": 2.2783, "step": 462430 }, { "epoch": 0.81, "learning_rate": 9.678010023821399e-06, "loss": 2.2838, "step": 462440 }, { "epoch": 0.81, "learning_rate": 9.677138083894573e-06, "loss": 2.3623, "step": 462450 }, { "epoch": 0.81, "learning_rate": 9.676266143967745e-06, "loss": 2.1904, "step": 462460 }, { "epoch": 0.81, "learning_rate": 9.675394204040919e-06, "loss": 2.292, "step": 462470 }, { "epoch": 0.81, "learning_rate": 9.67452226411409e-06, "loss": 2.236, "step": 462480 }, { "epoch": 0.81, "learning_rate": 9.673650324187265e-06, "loss": 2.2622, "step": 462490 }, { "epoch": 0.81, "learning_rate": 9.672778384260438e-06, "loss": 2.3332, "step": 462500 }, { "epoch": 0.81, "learning_rate": 9.671906444333612e-06, "loss": 2.1442, "step": 462510 }, { "epoch": 0.81, "learning_rate": 9.671034504406786e-06, "loss": 2.181, "step": 462520 }, { "epoch": 0.81, "learning_rate": 9.670162564479958e-06, "loss": 2.3661, "step": 462530 }, { "epoch": 0.81, "learning_rate": 9.669290624553132e-06, "loss": 2.279, "step": 462540 }, { "epoch": 0.81, "learning_rate": 9.668418684626304e-06, "loss": 2.2246, "step": 462550 }, { "epoch": 0.81, "learning_rate": 9.667546744699478e-06, "loss": 2.197, "step": 462560 }, { "epoch": 0.81, "learning_rate": 9.66667480477265e-06, "loss": 2.2802, "step": 462570 }, { "epoch": 0.81, "learning_rate": 9.665802864845825e-06, "loss": 2.2604, "step": 462580 }, { "epoch": 0.81, "learning_rate": 9.664930924918997e-06, "loss": 2.2238, "step": 462590 }, { "epoch": 0.81, "learning_rate": 9.664058984992171e-06, "loss": 2.3071, "step": 462600 }, { "epoch": 0.81, "learning_rate": 9.663187045065343e-06, "loss": 2.2205, "step": 462610 }, { "epoch": 0.81, "learning_rate": 9.662315105138517e-06, "loss": 2.253, "step": 462620 }, { "epoch": 0.81, "learning_rate": 9.661443165211689e-06, "loss": 2.268, "step": 462630 }, { "epoch": 0.81, "learning_rate": 9.660571225284863e-06, "loss": 2.2242, "step": 462640 }, { "epoch": 0.81, "learning_rate": 9.659699285358036e-06, "loss": 2.3673, "step": 462650 }, { "epoch": 0.81, "learning_rate": 9.65882734543121e-06, "loss": 2.1344, "step": 462660 }, { "epoch": 0.81, "learning_rate": 9.657955405504384e-06, "loss": 2.2998, "step": 462670 }, { "epoch": 0.81, "learning_rate": 9.657083465577556e-06, "loss": 2.2733, "step": 462680 }, { "epoch": 0.81, "learning_rate": 9.65621152565073e-06, "loss": 2.237, "step": 462690 }, { "epoch": 0.81, "learning_rate": 9.655339585723902e-06, "loss": 2.2746, "step": 462700 }, { "epoch": 0.81, "learning_rate": 9.654467645797076e-06, "loss": 2.1696, "step": 462710 }, { "epoch": 0.81, "learning_rate": 9.653595705870248e-06, "loss": 2.3345, "step": 462720 }, { "epoch": 0.81, "learning_rate": 9.652723765943422e-06, "loss": 2.2599, "step": 462730 }, { "epoch": 0.81, "learning_rate": 9.651851826016595e-06, "loss": 2.2071, "step": 462740 }, { "epoch": 0.81, "learning_rate": 9.650979886089769e-06, "loss": 2.3071, "step": 462750 }, { "epoch": 0.81, "learning_rate": 9.650107946162941e-06, "loss": 2.3692, "step": 462760 }, { "epoch": 0.81, "learning_rate": 9.649236006236115e-06, "loss": 2.2608, "step": 462770 }, { "epoch": 0.81, "learning_rate": 9.648364066309289e-06, "loss": 2.2634, "step": 462780 }, { "epoch": 0.81, "learning_rate": 9.64749212638246e-06, "loss": 2.3703, "step": 462790 }, { "epoch": 0.81, "learning_rate": 9.646620186455635e-06, "loss": 2.3405, "step": 462800 }, { "epoch": 0.81, "learning_rate": 9.645748246528807e-06, "loss": 2.3245, "step": 462810 }, { "epoch": 0.81, "learning_rate": 9.64487630660198e-06, "loss": 2.2792, "step": 462820 }, { "epoch": 0.81, "learning_rate": 9.644004366675154e-06, "loss": 2.2008, "step": 462830 }, { "epoch": 0.81, "learning_rate": 9.643132426748328e-06, "loss": 2.2359, "step": 462840 }, { "epoch": 0.81, "learning_rate": 9.6422604868215e-06, "loss": 2.3409, "step": 462850 }, { "epoch": 0.81, "learning_rate": 9.641388546894674e-06, "loss": 2.3073, "step": 462860 }, { "epoch": 0.81, "learning_rate": 9.640516606967846e-06, "loss": 2.2467, "step": 462870 }, { "epoch": 0.81, "learning_rate": 9.63964466704102e-06, "loss": 2.2072, "step": 462880 }, { "epoch": 0.81, "learning_rate": 9.638772727114193e-06, "loss": 2.2951, "step": 462890 }, { "epoch": 0.81, "learning_rate": 9.637900787187367e-06, "loss": 2.206, "step": 462900 }, { "epoch": 0.81, "learning_rate": 9.637028847260541e-06, "loss": 2.2743, "step": 462910 }, { "epoch": 0.81, "learning_rate": 9.636156907333713e-06, "loss": 2.3653, "step": 462920 }, { "epoch": 0.81, "learning_rate": 9.635284967406887e-06, "loss": 2.1935, "step": 462930 }, { "epoch": 0.81, "learning_rate": 9.634413027480059e-06, "loss": 2.2169, "step": 462940 }, { "epoch": 0.81, "learning_rate": 9.633541087553233e-06, "loss": 2.3167, "step": 462950 }, { "epoch": 0.81, "learning_rate": 9.632669147626405e-06, "loss": 2.3238, "step": 462960 }, { "epoch": 0.81, "learning_rate": 9.631797207699578e-06, "loss": 2.3397, "step": 462970 }, { "epoch": 0.81, "learning_rate": 9.630925267772752e-06, "loss": 2.3194, "step": 462980 }, { "epoch": 0.81, "learning_rate": 9.630053327845926e-06, "loss": 2.1578, "step": 462990 }, { "epoch": 0.81, "learning_rate": 9.629181387919098e-06, "loss": 2.2071, "step": 463000 }, { "epoch": 0.81, "learning_rate": 9.628309447992272e-06, "loss": 2.1551, "step": 463010 }, { "epoch": 0.81, "learning_rate": 9.627437508065444e-06, "loss": 2.2401, "step": 463020 }, { "epoch": 0.81, "learning_rate": 9.626565568138618e-06, "loss": 2.4323, "step": 463030 }, { "epoch": 0.81, "learning_rate": 9.625693628211791e-06, "loss": 2.3128, "step": 463040 }, { "epoch": 0.81, "learning_rate": 9.624821688284964e-06, "loss": 2.305, "step": 463050 }, { "epoch": 0.81, "learning_rate": 9.623949748358137e-06, "loss": 2.4229, "step": 463060 }, { "epoch": 0.81, "learning_rate": 9.623077808431311e-06, "loss": 2.303, "step": 463070 }, { "epoch": 0.81, "learning_rate": 9.622205868504485e-06, "loss": 2.2435, "step": 463080 }, { "epoch": 0.81, "learning_rate": 9.621333928577657e-06, "loss": 2.2038, "step": 463090 }, { "epoch": 0.81, "learning_rate": 9.62046198865083e-06, "loss": 2.2867, "step": 463100 }, { "epoch": 0.81, "learning_rate": 9.619590048724003e-06, "loss": 2.2928, "step": 463110 }, { "epoch": 0.81, "learning_rate": 9.618718108797177e-06, "loss": 2.2329, "step": 463120 }, { "epoch": 0.81, "learning_rate": 9.617846168870349e-06, "loss": 2.3219, "step": 463130 }, { "epoch": 0.81, "learning_rate": 9.616974228943524e-06, "loss": 2.3009, "step": 463140 }, { "epoch": 0.81, "learning_rate": 9.616102289016696e-06, "loss": 2.3077, "step": 463150 }, { "epoch": 0.81, "learning_rate": 9.61523034908987e-06, "loss": 2.322, "step": 463160 }, { "epoch": 0.81, "learning_rate": 9.614358409163044e-06, "loss": 2.2151, "step": 463170 }, { "epoch": 0.81, "learning_rate": 9.613486469236216e-06, "loss": 2.3262, "step": 463180 }, { "epoch": 0.81, "learning_rate": 9.61261452930939e-06, "loss": 2.3037, "step": 463190 }, { "epoch": 0.81, "learning_rate": 9.611742589382562e-06, "loss": 2.3272, "step": 463200 }, { "epoch": 0.81, "learning_rate": 9.610870649455735e-06, "loss": 2.2648, "step": 463210 }, { "epoch": 0.81, "learning_rate": 9.60999870952891e-06, "loss": 2.3157, "step": 463220 }, { "epoch": 0.81, "learning_rate": 9.609126769602083e-06, "loss": 2.3418, "step": 463230 }, { "epoch": 0.81, "learning_rate": 9.608254829675255e-06, "loss": 2.2101, "step": 463240 }, { "epoch": 0.81, "learning_rate": 9.607382889748429e-06, "loss": 2.3253, "step": 463250 }, { "epoch": 0.81, "learning_rate": 9.606510949821601e-06, "loss": 2.2491, "step": 463260 }, { "epoch": 0.81, "learning_rate": 9.605639009894775e-06, "loss": 2.1893, "step": 463270 }, { "epoch": 0.81, "learning_rate": 9.604767069967947e-06, "loss": 2.3761, "step": 463280 }, { "epoch": 0.81, "learning_rate": 9.60389513004112e-06, "loss": 2.3148, "step": 463290 }, { "epoch": 0.81, "learning_rate": 9.603023190114294e-06, "loss": 2.253, "step": 463300 }, { "epoch": 0.81, "learning_rate": 9.602151250187468e-06, "loss": 2.3344, "step": 463310 }, { "epoch": 0.81, "learning_rate": 9.601279310260642e-06, "loss": 2.2237, "step": 463320 }, { "epoch": 0.81, "learning_rate": 9.600407370333814e-06, "loss": 2.2966, "step": 463330 }, { "epoch": 0.81, "learning_rate": 9.599535430406988e-06, "loss": 2.3825, "step": 463340 }, { "epoch": 0.81, "learning_rate": 9.59866349048016e-06, "loss": 2.2171, "step": 463350 }, { "epoch": 0.81, "learning_rate": 9.597791550553333e-06, "loss": 2.183, "step": 463360 }, { "epoch": 0.81, "learning_rate": 9.596919610626506e-06, "loss": 2.1944, "step": 463370 }, { "epoch": 0.81, "learning_rate": 9.596047670699681e-06, "loss": 2.2783, "step": 463380 }, { "epoch": 0.81, "learning_rate": 9.595175730772853e-06, "loss": 2.2714, "step": 463390 }, { "epoch": 0.81, "learning_rate": 9.594303790846027e-06, "loss": 2.3665, "step": 463400 }, { "epoch": 0.81, "learning_rate": 9.593431850919199e-06, "loss": 2.2259, "step": 463410 }, { "epoch": 0.81, "learning_rate": 9.592559910992373e-06, "loss": 2.2529, "step": 463420 }, { "epoch": 0.81, "learning_rate": 9.591687971065546e-06, "loss": 2.2926, "step": 463430 }, { "epoch": 0.81, "learning_rate": 9.590816031138719e-06, "loss": 2.3446, "step": 463440 }, { "epoch": 0.81, "learning_rate": 9.589944091211892e-06, "loss": 2.2161, "step": 463450 }, { "epoch": 0.81, "learning_rate": 9.589072151285066e-06, "loss": 2.305, "step": 463460 }, { "epoch": 0.81, "learning_rate": 9.58820021135824e-06, "loss": 2.2171, "step": 463470 }, { "epoch": 0.81, "learning_rate": 9.587328271431412e-06, "loss": 2.2229, "step": 463480 }, { "epoch": 0.81, "learning_rate": 9.586456331504586e-06, "loss": 2.3728, "step": 463490 }, { "epoch": 0.81, "learning_rate": 9.585584391577758e-06, "loss": 2.2915, "step": 463500 }, { "epoch": 0.81, "learning_rate": 9.584712451650932e-06, "loss": 2.2681, "step": 463510 }, { "epoch": 0.81, "learning_rate": 9.583840511724104e-06, "loss": 2.2537, "step": 463520 }, { "epoch": 0.81, "learning_rate": 9.582968571797277e-06, "loss": 2.3889, "step": 463530 }, { "epoch": 0.81, "learning_rate": 9.582096631870451e-06, "loss": 2.2855, "step": 463540 }, { "epoch": 0.81, "learning_rate": 9.581224691943625e-06, "loss": 2.2563, "step": 463550 }, { "epoch": 0.81, "learning_rate": 9.580352752016797e-06, "loss": 2.4538, "step": 463560 }, { "epoch": 0.81, "learning_rate": 9.57948081208997e-06, "loss": 2.2932, "step": 463570 }, { "epoch": 0.81, "learning_rate": 9.578608872163145e-06, "loss": 2.2085, "step": 463580 }, { "epoch": 0.81, "learning_rate": 9.577736932236317e-06, "loss": 2.3606, "step": 463590 }, { "epoch": 0.81, "learning_rate": 9.57686499230949e-06, "loss": 2.2438, "step": 463600 }, { "epoch": 0.81, "learning_rate": 9.575993052382662e-06, "loss": 2.2384, "step": 463610 }, { "epoch": 0.81, "learning_rate": 9.575121112455838e-06, "loss": 2.2093, "step": 463620 }, { "epoch": 0.81, "learning_rate": 9.57424917252901e-06, "loss": 2.3108, "step": 463630 }, { "epoch": 0.81, "learning_rate": 9.573377232602184e-06, "loss": 2.1545, "step": 463640 }, { "epoch": 0.81, "learning_rate": 9.572505292675356e-06, "loss": 2.2412, "step": 463650 }, { "epoch": 0.81, "learning_rate": 9.57163335274853e-06, "loss": 2.3051, "step": 463660 }, { "epoch": 0.81, "learning_rate": 9.570761412821702e-06, "loss": 2.3843, "step": 463670 }, { "epoch": 0.81, "learning_rate": 9.569889472894875e-06, "loss": 2.2068, "step": 463680 }, { "epoch": 0.81, "learning_rate": 9.56901753296805e-06, "loss": 2.2292, "step": 463690 }, { "epoch": 0.81, "learning_rate": 9.568145593041223e-06, "loss": 2.2298, "step": 463700 }, { "epoch": 0.81, "learning_rate": 9.567273653114397e-06, "loss": 2.2597, "step": 463710 }, { "epoch": 0.81, "learning_rate": 9.566401713187569e-06, "loss": 2.1824, "step": 463720 }, { "epoch": 0.81, "learning_rate": 9.565529773260743e-06, "loss": 2.2518, "step": 463730 }, { "epoch": 0.81, "learning_rate": 9.564657833333915e-06, "loss": 2.24, "step": 463740 }, { "epoch": 0.81, "learning_rate": 9.563785893407088e-06, "loss": 2.2089, "step": 463750 }, { "epoch": 0.81, "learning_rate": 9.56291395348026e-06, "loss": 2.2578, "step": 463760 }, { "epoch": 0.81, "learning_rate": 9.562042013553434e-06, "loss": 2.3088, "step": 463770 }, { "epoch": 0.81, "learning_rate": 9.561170073626608e-06, "loss": 2.3787, "step": 463780 }, { "epoch": 0.81, "learning_rate": 9.560298133699782e-06, "loss": 2.3584, "step": 463790 }, { "epoch": 0.81, "learning_rate": 9.559426193772954e-06, "loss": 2.261, "step": 463800 }, { "epoch": 0.81, "learning_rate": 9.558554253846128e-06, "loss": 2.1089, "step": 463810 }, { "epoch": 0.81, "learning_rate": 9.5576823139193e-06, "loss": 2.2588, "step": 463820 }, { "epoch": 0.81, "learning_rate": 9.556810373992474e-06, "loss": 2.2269, "step": 463830 }, { "epoch": 0.81, "learning_rate": 9.555938434065647e-06, "loss": 2.2993, "step": 463840 }, { "epoch": 0.81, "learning_rate": 9.55506649413882e-06, "loss": 2.324, "step": 463850 }, { "epoch": 0.81, "learning_rate": 9.554194554211993e-06, "loss": 2.3146, "step": 463860 }, { "epoch": 0.81, "learning_rate": 9.553322614285167e-06, "loss": 2.2315, "step": 463870 }, { "epoch": 0.81, "learning_rate": 9.55245067435834e-06, "loss": 2.4138, "step": 463880 }, { "epoch": 0.81, "learning_rate": 9.551578734431513e-06, "loss": 2.1568, "step": 463890 }, { "epoch": 0.81, "learning_rate": 9.550706794504687e-06, "loss": 2.2545, "step": 463900 }, { "epoch": 0.81, "learning_rate": 9.549834854577859e-06, "loss": 2.2599, "step": 463910 }, { "epoch": 0.81, "learning_rate": 9.548962914651032e-06, "loss": 2.1734, "step": 463920 }, { "epoch": 0.81, "learning_rate": 9.548090974724206e-06, "loss": 2.2852, "step": 463930 }, { "epoch": 0.81, "learning_rate": 9.54721903479738e-06, "loss": 2.376, "step": 463940 }, { "epoch": 0.81, "learning_rate": 9.546347094870552e-06, "loss": 2.3724, "step": 463950 }, { "epoch": 0.81, "learning_rate": 9.545475154943726e-06, "loss": 2.2832, "step": 463960 }, { "epoch": 0.81, "learning_rate": 9.5446032150169e-06, "loss": 2.2743, "step": 463970 }, { "epoch": 0.81, "learning_rate": 9.543731275090072e-06, "loss": 2.21, "step": 463980 }, { "epoch": 0.81, "learning_rate": 9.542859335163245e-06, "loss": 2.3196, "step": 463990 }, { "epoch": 0.81, "learning_rate": 9.541987395236417e-06, "loss": 2.4368, "step": 464000 }, { "epoch": 0.81, "learning_rate": 9.541115455309591e-06, "loss": 2.2538, "step": 464010 }, { "epoch": 0.81, "learning_rate": 9.540243515382765e-06, "loss": 2.2789, "step": 464020 }, { "epoch": 0.81, "learning_rate": 9.539371575455939e-06, "loss": 2.3362, "step": 464030 }, { "epoch": 0.81, "learning_rate": 9.538499635529111e-06, "loss": 2.1835, "step": 464040 }, { "epoch": 0.81, "learning_rate": 9.537627695602285e-06, "loss": 2.2731, "step": 464050 }, { "epoch": 0.81, "learning_rate": 9.536755755675457e-06, "loss": 2.2904, "step": 464060 }, { "epoch": 0.81, "learning_rate": 9.53588381574863e-06, "loss": 2.2062, "step": 464070 }, { "epoch": 0.81, "learning_rate": 9.535011875821803e-06, "loss": 2.351, "step": 464080 }, { "epoch": 0.81, "learning_rate": 9.534139935894976e-06, "loss": 2.3866, "step": 464090 }, { "epoch": 0.81, "learning_rate": 9.53326799596815e-06, "loss": 2.271, "step": 464100 }, { "epoch": 0.81, "learning_rate": 9.532396056041324e-06, "loss": 2.3362, "step": 464110 }, { "epoch": 0.81, "learning_rate": 9.531524116114498e-06, "loss": 2.3706, "step": 464120 }, { "epoch": 0.81, "learning_rate": 9.53065217618767e-06, "loss": 2.3248, "step": 464130 }, { "epoch": 0.81, "learning_rate": 9.529780236260843e-06, "loss": 2.2477, "step": 464140 }, { "epoch": 0.81, "learning_rate": 9.528908296334016e-06, "loss": 2.4081, "step": 464150 }, { "epoch": 0.81, "learning_rate": 9.52803635640719e-06, "loss": 2.218, "step": 464160 }, { "epoch": 0.81, "learning_rate": 9.527164416480361e-06, "loss": 2.2943, "step": 464170 }, { "epoch": 0.81, "learning_rate": 9.526292476553537e-06, "loss": 2.1861, "step": 464180 }, { "epoch": 0.81, "learning_rate": 9.525420536626709e-06, "loss": 2.1959, "step": 464190 }, { "epoch": 0.81, "learning_rate": 9.524548596699883e-06, "loss": 2.2726, "step": 464200 }, { "epoch": 0.81, "learning_rate": 9.523676656773055e-06, "loss": 2.2803, "step": 464210 }, { "epoch": 0.81, "learning_rate": 9.522804716846229e-06, "loss": 2.2846, "step": 464220 }, { "epoch": 0.81, "learning_rate": 9.521932776919402e-06, "loss": 2.3372, "step": 464230 }, { "epoch": 0.81, "learning_rate": 9.521060836992574e-06, "loss": 2.3138, "step": 464240 }, { "epoch": 0.81, "learning_rate": 9.520188897065748e-06, "loss": 2.3496, "step": 464250 }, { "epoch": 0.81, "learning_rate": 9.519316957138922e-06, "loss": 2.2879, "step": 464260 }, { "epoch": 0.81, "learning_rate": 9.518445017212096e-06, "loss": 2.287, "step": 464270 }, { "epoch": 0.81, "learning_rate": 9.517573077285268e-06, "loss": 2.3332, "step": 464280 }, { "epoch": 0.81, "learning_rate": 9.516701137358442e-06, "loss": 2.3555, "step": 464290 }, { "epoch": 0.81, "learning_rate": 9.515829197431614e-06, "loss": 2.2432, "step": 464300 }, { "epoch": 0.81, "learning_rate": 9.514957257504787e-06, "loss": 2.3096, "step": 464310 }, { "epoch": 0.81, "learning_rate": 9.51408531757796e-06, "loss": 2.2806, "step": 464320 }, { "epoch": 0.81, "learning_rate": 9.513213377651133e-06, "loss": 2.2538, "step": 464330 }, { "epoch": 0.81, "learning_rate": 9.512341437724307e-06, "loss": 2.2277, "step": 464340 }, { "epoch": 0.81, "learning_rate": 9.51146949779748e-06, "loss": 2.3631, "step": 464350 }, { "epoch": 0.81, "learning_rate": 9.510597557870653e-06, "loss": 2.2753, "step": 464360 }, { "epoch": 0.81, "learning_rate": 9.509725617943827e-06, "loss": 2.3703, "step": 464370 }, { "epoch": 0.81, "learning_rate": 9.508853678017e-06, "loss": 2.2804, "step": 464380 }, { "epoch": 0.81, "learning_rate": 9.507981738090172e-06, "loss": 2.3168, "step": 464390 }, { "epoch": 0.81, "learning_rate": 9.507109798163346e-06, "loss": 2.4042, "step": 464400 }, { "epoch": 0.81, "learning_rate": 9.506237858236518e-06, "loss": 2.2548, "step": 464410 }, { "epoch": 0.81, "learning_rate": 9.505365918309694e-06, "loss": 2.2664, "step": 464420 }, { "epoch": 0.81, "learning_rate": 9.504493978382866e-06, "loss": 2.2417, "step": 464430 }, { "epoch": 0.81, "learning_rate": 9.50362203845604e-06, "loss": 2.2806, "step": 464440 }, { "epoch": 0.81, "learning_rate": 9.502750098529212e-06, "loss": 2.3855, "step": 464450 }, { "epoch": 0.81, "learning_rate": 9.501878158602385e-06, "loss": 2.2366, "step": 464460 }, { "epoch": 0.81, "learning_rate": 9.501006218675558e-06, "loss": 2.333, "step": 464470 }, { "epoch": 0.81, "learning_rate": 9.500134278748731e-06, "loss": 2.3019, "step": 464480 }, { "epoch": 0.81, "learning_rate": 9.499262338821905e-06, "loss": 2.2844, "step": 464490 }, { "epoch": 0.81, "learning_rate": 9.498390398895079e-06, "loss": 2.1582, "step": 464500 }, { "epoch": 0.81, "learning_rate": 9.497518458968253e-06, "loss": 2.3401, "step": 464510 }, { "epoch": 0.81, "learning_rate": 9.496646519041425e-06, "loss": 2.3612, "step": 464520 }, { "epoch": 0.81, "learning_rate": 9.495774579114598e-06, "loss": 2.2959, "step": 464530 }, { "epoch": 0.81, "learning_rate": 9.49490263918777e-06, "loss": 2.3885, "step": 464540 }, { "epoch": 0.81, "learning_rate": 9.494030699260944e-06, "loss": 2.3043, "step": 464550 }, { "epoch": 0.81, "learning_rate": 9.493158759334116e-06, "loss": 2.3141, "step": 464560 }, { "epoch": 0.81, "learning_rate": 9.49228681940729e-06, "loss": 2.1647, "step": 464570 }, { "epoch": 0.81, "learning_rate": 9.491414879480464e-06, "loss": 2.3067, "step": 464580 }, { "epoch": 0.81, "learning_rate": 9.490542939553638e-06, "loss": 2.2291, "step": 464590 }, { "epoch": 0.81, "learning_rate": 9.48967099962681e-06, "loss": 2.3075, "step": 464600 }, { "epoch": 0.81, "learning_rate": 9.488799059699984e-06, "loss": 2.4187, "step": 464610 }, { "epoch": 0.81, "learning_rate": 9.487927119773156e-06, "loss": 2.2761, "step": 464620 }, { "epoch": 0.81, "learning_rate": 9.48705517984633e-06, "loss": 2.2026, "step": 464630 }, { "epoch": 0.81, "learning_rate": 9.486183239919503e-06, "loss": 2.2428, "step": 464640 }, { "epoch": 0.81, "learning_rate": 9.485311299992675e-06, "loss": 2.299, "step": 464650 }, { "epoch": 0.81, "learning_rate": 9.48443936006585e-06, "loss": 2.2875, "step": 464660 }, { "epoch": 0.81, "learning_rate": 9.483567420139023e-06, "loss": 2.4015, "step": 464670 }, { "epoch": 0.81, "learning_rate": 9.482695480212197e-06, "loss": 2.1658, "step": 464680 }, { "epoch": 0.81, "learning_rate": 9.481823540285369e-06, "loss": 2.2701, "step": 464690 }, { "epoch": 0.81, "learning_rate": 9.480951600358542e-06, "loss": 2.3384, "step": 464700 }, { "epoch": 0.81, "learning_rate": 9.480079660431714e-06, "loss": 2.2287, "step": 464710 }, { "epoch": 0.81, "learning_rate": 9.479207720504888e-06, "loss": 2.2202, "step": 464720 }, { "epoch": 0.81, "learning_rate": 9.478335780578062e-06, "loss": 2.4132, "step": 464730 }, { "epoch": 0.81, "learning_rate": 9.477463840651236e-06, "loss": 2.1698, "step": 464740 }, { "epoch": 0.81, "learning_rate": 9.476591900724408e-06, "loss": 2.2847, "step": 464750 }, { "epoch": 0.81, "learning_rate": 9.475719960797582e-06, "loss": 2.2116, "step": 464760 }, { "epoch": 0.81, "learning_rate": 9.474848020870755e-06, "loss": 2.3476, "step": 464770 }, { "epoch": 0.81, "learning_rate": 9.473976080943927e-06, "loss": 2.2488, "step": 464780 }, { "epoch": 0.81, "learning_rate": 9.473104141017101e-06, "loss": 2.2156, "step": 464790 }, { "epoch": 0.81, "learning_rate": 9.472232201090273e-06, "loss": 2.4621, "step": 464800 }, { "epoch": 0.81, "learning_rate": 9.471360261163447e-06, "loss": 2.3295, "step": 464810 }, { "epoch": 0.81, "learning_rate": 9.470488321236621e-06, "loss": 2.3023, "step": 464820 }, { "epoch": 0.81, "learning_rate": 9.469616381309795e-06, "loss": 2.2363, "step": 464830 }, { "epoch": 0.81, "learning_rate": 9.468744441382967e-06, "loss": 2.3424, "step": 464840 }, { "epoch": 0.81, "learning_rate": 9.46787250145614e-06, "loss": 2.2067, "step": 464850 }, { "epoch": 0.81, "learning_rate": 9.467000561529313e-06, "loss": 2.2296, "step": 464860 }, { "epoch": 0.81, "learning_rate": 9.466128621602486e-06, "loss": 2.244, "step": 464870 }, { "epoch": 0.81, "learning_rate": 9.465256681675658e-06, "loss": 2.2382, "step": 464880 }, { "epoch": 0.81, "learning_rate": 9.464384741748832e-06, "loss": 2.199, "step": 464890 }, { "epoch": 0.81, "learning_rate": 9.463512801822006e-06, "loss": 2.2164, "step": 464900 }, { "epoch": 0.81, "learning_rate": 9.46264086189518e-06, "loss": 2.3531, "step": 464910 }, { "epoch": 0.81, "learning_rate": 9.461768921968353e-06, "loss": 2.2779, "step": 464920 }, { "epoch": 0.81, "learning_rate": 9.460896982041526e-06, "loss": 2.2544, "step": 464930 }, { "epoch": 0.81, "learning_rate": 9.4600250421147e-06, "loss": 2.2201, "step": 464940 }, { "epoch": 0.81, "learning_rate": 9.459153102187871e-06, "loss": 2.3248, "step": 464950 }, { "epoch": 0.81, "learning_rate": 9.458281162261045e-06, "loss": 2.262, "step": 464960 }, { "epoch": 0.81, "learning_rate": 9.457409222334219e-06, "loss": 2.3265, "step": 464970 }, { "epoch": 0.81, "learning_rate": 9.456537282407393e-06, "loss": 2.1953, "step": 464980 }, { "epoch": 0.81, "learning_rate": 9.455665342480565e-06, "loss": 2.2495, "step": 464990 }, { "epoch": 0.81, "learning_rate": 9.454793402553739e-06, "loss": 2.2498, "step": 465000 }, { "epoch": 0.81, "learning_rate": 9.45392146262691e-06, "loss": 2.193, "step": 465010 }, { "epoch": 0.81, "learning_rate": 9.453049522700084e-06, "loss": 2.2302, "step": 465020 }, { "epoch": 0.81, "learning_rate": 9.452177582773258e-06, "loss": 2.3052, "step": 465030 }, { "epoch": 0.81, "learning_rate": 9.45130564284643e-06, "loss": 2.3187, "step": 465040 }, { "epoch": 0.81, "learning_rate": 9.450433702919604e-06, "loss": 2.2977, "step": 465050 }, { "epoch": 0.81, "learning_rate": 9.449561762992778e-06, "loss": 2.3282, "step": 465060 }, { "epoch": 0.81, "learning_rate": 9.448689823065952e-06, "loss": 2.2754, "step": 465070 }, { "epoch": 0.81, "learning_rate": 9.447817883139124e-06, "loss": 2.2461, "step": 465080 }, { "epoch": 0.81, "learning_rate": 9.446945943212297e-06, "loss": 2.2569, "step": 465090 }, { "epoch": 0.81, "learning_rate": 9.44607400328547e-06, "loss": 2.2876, "step": 465100 }, { "epoch": 0.81, "learning_rate": 9.445202063358643e-06, "loss": 2.3476, "step": 465110 }, { "epoch": 0.81, "learning_rate": 9.444330123431815e-06, "loss": 2.2372, "step": 465120 }, { "epoch": 0.81, "learning_rate": 9.443458183504989e-06, "loss": 2.3945, "step": 465130 }, { "epoch": 0.81, "learning_rate": 9.442586243578163e-06, "loss": 2.2113, "step": 465140 }, { "epoch": 0.81, "learning_rate": 9.441714303651337e-06, "loss": 2.209, "step": 465150 }, { "epoch": 0.81, "learning_rate": 9.44084236372451e-06, "loss": 2.3132, "step": 465160 }, { "epoch": 0.81, "learning_rate": 9.439970423797682e-06, "loss": 2.2412, "step": 465170 }, { "epoch": 0.81, "learning_rate": 9.439098483870856e-06, "loss": 2.3951, "step": 465180 }, { "epoch": 0.81, "learning_rate": 9.438226543944028e-06, "loss": 2.4415, "step": 465190 }, { "epoch": 0.81, "learning_rate": 9.437354604017202e-06, "loss": 2.3874, "step": 465200 }, { "epoch": 0.81, "learning_rate": 9.436482664090374e-06, "loss": 2.3114, "step": 465210 }, { "epoch": 0.81, "learning_rate": 9.43561072416355e-06, "loss": 2.3312, "step": 465220 }, { "epoch": 0.81, "learning_rate": 9.434738784236722e-06, "loss": 2.1296, "step": 465230 }, { "epoch": 0.81, "learning_rate": 9.433866844309895e-06, "loss": 2.218, "step": 465240 }, { "epoch": 0.81, "learning_rate": 9.432994904383068e-06, "loss": 2.3336, "step": 465250 }, { "epoch": 0.81, "learning_rate": 9.432122964456241e-06, "loss": 2.2695, "step": 465260 }, { "epoch": 0.81, "learning_rate": 9.431251024529413e-06, "loss": 2.3797, "step": 465270 }, { "epoch": 0.81, "learning_rate": 9.430379084602587e-06, "loss": 2.3055, "step": 465280 }, { "epoch": 0.81, "learning_rate": 9.429507144675761e-06, "loss": 2.354, "step": 465290 }, { "epoch": 0.81, "learning_rate": 9.428635204748935e-06, "loss": 2.3488, "step": 465300 }, { "epoch": 0.81, "learning_rate": 9.427763264822108e-06, "loss": 2.4137, "step": 465310 }, { "epoch": 0.81, "learning_rate": 9.42689132489528e-06, "loss": 2.1888, "step": 465320 }, { "epoch": 0.81, "learning_rate": 9.426019384968454e-06, "loss": 2.383, "step": 465330 }, { "epoch": 0.81, "learning_rate": 9.425147445041626e-06, "loss": 2.2878, "step": 465340 }, { "epoch": 0.81, "learning_rate": 9.4242755051148e-06, "loss": 2.2034, "step": 465350 }, { "epoch": 0.81, "learning_rate": 9.423403565187972e-06, "loss": 2.2333, "step": 465360 }, { "epoch": 0.81, "learning_rate": 9.422531625261146e-06, "loss": 2.2315, "step": 465370 }, { "epoch": 0.81, "learning_rate": 9.42165968533432e-06, "loss": 2.369, "step": 465380 }, { "epoch": 0.81, "learning_rate": 9.420787745407494e-06, "loss": 2.233, "step": 465390 }, { "epoch": 0.81, "learning_rate": 9.419915805480666e-06, "loss": 2.3456, "step": 465400 }, { "epoch": 0.81, "learning_rate": 9.41904386555384e-06, "loss": 2.164, "step": 465410 }, { "epoch": 0.81, "learning_rate": 9.418171925627011e-06, "loss": 2.3369, "step": 465420 }, { "epoch": 0.81, "learning_rate": 9.417299985700185e-06, "loss": 2.3116, "step": 465430 }, { "epoch": 0.81, "learning_rate": 9.416428045773359e-06, "loss": 2.1963, "step": 465440 }, { "epoch": 0.81, "learning_rate": 9.415556105846531e-06, "loss": 2.2613, "step": 465450 }, { "epoch": 0.81, "learning_rate": 9.414684165919707e-06, "loss": 2.2578, "step": 465460 }, { "epoch": 0.81, "learning_rate": 9.413812225992879e-06, "loss": 2.3095, "step": 465470 }, { "epoch": 0.81, "learning_rate": 9.412940286066052e-06, "loss": 2.3118, "step": 465480 }, { "epoch": 0.81, "learning_rate": 9.412068346139224e-06, "loss": 2.2322, "step": 465490 }, { "epoch": 0.81, "learning_rate": 9.411196406212398e-06, "loss": 2.3372, "step": 465500 }, { "epoch": 0.81, "learning_rate": 9.41032446628557e-06, "loss": 2.254, "step": 465510 }, { "epoch": 0.81, "learning_rate": 9.409452526358744e-06, "loss": 2.3581, "step": 465520 }, { "epoch": 0.81, "learning_rate": 9.408580586431918e-06, "loss": 2.3527, "step": 465530 }, { "epoch": 0.81, "learning_rate": 9.407708646505092e-06, "loss": 2.2541, "step": 465540 }, { "epoch": 0.81, "learning_rate": 9.406836706578264e-06, "loss": 2.3878, "step": 465550 }, { "epoch": 0.81, "learning_rate": 9.405964766651437e-06, "loss": 2.2432, "step": 465560 }, { "epoch": 0.81, "learning_rate": 9.405092826724611e-06, "loss": 2.2939, "step": 465570 }, { "epoch": 0.81, "learning_rate": 9.404220886797783e-06, "loss": 2.3414, "step": 465580 }, { "epoch": 0.81, "learning_rate": 9.403348946870957e-06, "loss": 2.3944, "step": 465590 }, { "epoch": 0.81, "learning_rate": 9.40247700694413e-06, "loss": 2.2318, "step": 465600 }, { "epoch": 0.81, "learning_rate": 9.401605067017303e-06, "loss": 2.1803, "step": 465610 }, { "epoch": 0.81, "learning_rate": 9.400733127090477e-06, "loss": 2.2965, "step": 465620 }, { "epoch": 0.81, "learning_rate": 9.39986118716365e-06, "loss": 2.3262, "step": 465630 }, { "epoch": 0.81, "learning_rate": 9.398989247236823e-06, "loss": 2.3602, "step": 465640 }, { "epoch": 0.81, "learning_rate": 9.398117307309996e-06, "loss": 2.2377, "step": 465650 }, { "epoch": 0.81, "learning_rate": 9.397245367383168e-06, "loss": 2.2079, "step": 465660 }, { "epoch": 0.81, "learning_rate": 9.396373427456342e-06, "loss": 2.2865, "step": 465670 }, { "epoch": 0.81, "learning_rate": 9.395501487529514e-06, "loss": 2.3769, "step": 465680 }, { "epoch": 0.81, "learning_rate": 9.394629547602688e-06, "loss": 2.3081, "step": 465690 }, { "epoch": 0.81, "learning_rate": 9.393757607675863e-06, "loss": 2.3759, "step": 465700 }, { "epoch": 0.81, "learning_rate": 9.392885667749036e-06, "loss": 2.2342, "step": 465710 }, { "epoch": 0.81, "learning_rate": 9.39201372782221e-06, "loss": 2.3388, "step": 465720 }, { "epoch": 0.81, "learning_rate": 9.391141787895381e-06, "loss": 2.4401, "step": 465730 }, { "epoch": 0.81, "learning_rate": 9.390269847968555e-06, "loss": 2.2444, "step": 465740 }, { "epoch": 0.81, "learning_rate": 9.389397908041727e-06, "loss": 2.2846, "step": 465750 }, { "epoch": 0.81, "learning_rate": 9.388525968114901e-06, "loss": 2.2863, "step": 465760 }, { "epoch": 0.81, "learning_rate": 9.387654028188075e-06, "loss": 2.3823, "step": 465770 }, { "epoch": 0.81, "learning_rate": 9.386782088261249e-06, "loss": 2.3122, "step": 465780 }, { "epoch": 0.81, "learning_rate": 9.38591014833442e-06, "loss": 2.2337, "step": 465790 }, { "epoch": 0.81, "learning_rate": 9.385038208407594e-06, "loss": 2.2701, "step": 465800 }, { "epoch": 0.81, "learning_rate": 9.384166268480766e-06, "loss": 2.2521, "step": 465810 }, { "epoch": 0.81, "learning_rate": 9.38329432855394e-06, "loss": 2.2585, "step": 465820 }, { "epoch": 0.81, "learning_rate": 9.382422388627114e-06, "loss": 2.3538, "step": 465830 }, { "epoch": 0.81, "learning_rate": 9.381550448700286e-06, "loss": 2.3531, "step": 465840 }, { "epoch": 0.81, "learning_rate": 9.38067850877346e-06, "loss": 2.3538, "step": 465850 }, { "epoch": 0.81, "learning_rate": 9.379806568846634e-06, "loss": 2.394, "step": 465860 }, { "epoch": 0.81, "learning_rate": 9.378934628919807e-06, "loss": 2.2953, "step": 465870 }, { "epoch": 0.81, "learning_rate": 9.37806268899298e-06, "loss": 2.2795, "step": 465880 }, { "epoch": 0.81, "learning_rate": 9.377190749066153e-06, "loss": 2.2722, "step": 465890 }, { "epoch": 0.81, "learning_rate": 9.376318809139325e-06, "loss": 2.2738, "step": 465900 }, { "epoch": 0.81, "learning_rate": 9.375446869212499e-06, "loss": 2.279, "step": 465910 }, { "epoch": 0.81, "learning_rate": 9.374574929285671e-06, "loss": 2.314, "step": 465920 }, { "epoch": 0.81, "learning_rate": 9.373702989358845e-06, "loss": 2.249, "step": 465930 }, { "epoch": 0.81, "learning_rate": 9.372831049432019e-06, "loss": 2.2731, "step": 465940 }, { "epoch": 0.81, "learning_rate": 9.371959109505192e-06, "loss": 2.31, "step": 465950 }, { "epoch": 0.81, "learning_rate": 9.371087169578366e-06, "loss": 2.2732, "step": 465960 }, { "epoch": 0.81, "learning_rate": 9.370215229651538e-06, "loss": 2.3234, "step": 465970 }, { "epoch": 0.81, "learning_rate": 9.369343289724712e-06, "loss": 2.2397, "step": 465980 }, { "epoch": 0.81, "learning_rate": 9.368471349797884e-06, "loss": 2.3734, "step": 465990 }, { "epoch": 0.81, "learning_rate": 9.367599409871058e-06, "loss": 2.3616, "step": 466000 }, { "epoch": 0.81, "learning_rate": 9.366727469944232e-06, "loss": 2.3552, "step": 466010 }, { "epoch": 0.81, "learning_rate": 9.365855530017405e-06, "loss": 2.3402, "step": 466020 }, { "epoch": 0.81, "learning_rate": 9.364983590090578e-06, "loss": 2.4025, "step": 466030 }, { "epoch": 0.81, "learning_rate": 9.364111650163751e-06, "loss": 2.2366, "step": 466040 }, { "epoch": 0.81, "learning_rate": 9.363239710236923e-06, "loss": 2.2907, "step": 466050 }, { "epoch": 0.81, "learning_rate": 9.362367770310097e-06, "loss": 2.2637, "step": 466060 }, { "epoch": 0.81, "learning_rate": 9.36149583038327e-06, "loss": 2.2147, "step": 466070 }, { "epoch": 0.81, "learning_rate": 9.360623890456443e-06, "loss": 2.2131, "step": 466080 }, { "epoch": 0.81, "learning_rate": 9.359751950529617e-06, "loss": 2.1871, "step": 466090 }, { "epoch": 0.81, "learning_rate": 9.35888001060279e-06, "loss": 2.3621, "step": 466100 }, { "epoch": 0.81, "learning_rate": 9.358008070675964e-06, "loss": 2.2101, "step": 466110 }, { "epoch": 0.81, "learning_rate": 9.357136130749136e-06, "loss": 2.257, "step": 466120 }, { "epoch": 0.81, "learning_rate": 9.35626419082231e-06, "loss": 2.2399, "step": 466130 }, { "epoch": 0.81, "learning_rate": 9.355392250895482e-06, "loss": 2.3785, "step": 466140 }, { "epoch": 0.81, "learning_rate": 9.354520310968656e-06, "loss": 2.2134, "step": 466150 }, { "epoch": 0.81, "learning_rate": 9.353648371041828e-06, "loss": 2.1664, "step": 466160 }, { "epoch": 0.81, "learning_rate": 9.352776431115002e-06, "loss": 2.2, "step": 466170 }, { "epoch": 0.81, "learning_rate": 9.351904491188176e-06, "loss": 2.2571, "step": 466180 }, { "epoch": 0.81, "learning_rate": 9.35103255126135e-06, "loss": 2.2913, "step": 466190 }, { "epoch": 0.81, "learning_rate": 9.350160611334521e-06, "loss": 2.2974, "step": 466200 }, { "epoch": 0.81, "learning_rate": 9.349288671407695e-06, "loss": 2.3152, "step": 466210 }, { "epoch": 0.81, "learning_rate": 9.348416731480867e-06, "loss": 2.2331, "step": 466220 }, { "epoch": 0.81, "learning_rate": 9.347544791554041e-06, "loss": 2.308, "step": 466230 }, { "epoch": 0.81, "learning_rate": 9.346672851627215e-06, "loss": 2.2191, "step": 466240 }, { "epoch": 0.81, "learning_rate": 9.345800911700387e-06, "loss": 2.3775, "step": 466250 }, { "epoch": 0.81, "learning_rate": 9.344928971773562e-06, "loss": 2.261, "step": 466260 }, { "epoch": 0.81, "learning_rate": 9.344057031846734e-06, "loss": 2.2567, "step": 466270 }, { "epoch": 0.81, "learning_rate": 9.343185091919908e-06, "loss": 2.3137, "step": 466280 }, { "epoch": 0.81, "learning_rate": 9.34231315199308e-06, "loss": 2.2645, "step": 466290 }, { "epoch": 0.81, "learning_rate": 9.341441212066254e-06, "loss": 2.3091, "step": 466300 }, { "epoch": 0.81, "learning_rate": 9.340569272139426e-06, "loss": 2.2773, "step": 466310 }, { "epoch": 0.81, "learning_rate": 9.3396973322126e-06, "loss": 2.1607, "step": 466320 }, { "epoch": 0.81, "learning_rate": 9.338825392285774e-06, "loss": 2.2864, "step": 466330 }, { "epoch": 0.81, "learning_rate": 9.337953452358947e-06, "loss": 2.3671, "step": 466340 }, { "epoch": 0.81, "learning_rate": 9.33708151243212e-06, "loss": 2.3358, "step": 466350 }, { "epoch": 0.81, "learning_rate": 9.336209572505293e-06, "loss": 2.1329, "step": 466360 }, { "epoch": 0.81, "learning_rate": 9.335337632578467e-06, "loss": 2.3235, "step": 466370 }, { "epoch": 0.81, "learning_rate": 9.33446569265164e-06, "loss": 2.2316, "step": 466380 }, { "epoch": 0.81, "learning_rate": 9.333593752724813e-06, "loss": 2.2176, "step": 466390 }, { "epoch": 0.81, "learning_rate": 9.332721812797985e-06, "loss": 2.2735, "step": 466400 }, { "epoch": 0.81, "learning_rate": 9.331849872871159e-06, "loss": 2.3764, "step": 466410 }, { "epoch": 0.81, "learning_rate": 9.330977932944333e-06, "loss": 2.2556, "step": 466420 }, { "epoch": 0.81, "learning_rate": 9.330105993017506e-06, "loss": 2.2701, "step": 466430 }, { "epoch": 0.81, "learning_rate": 9.329234053090678e-06, "loss": 2.2671, "step": 466440 }, { "epoch": 0.81, "learning_rate": 9.328362113163852e-06, "loss": 2.2928, "step": 466450 }, { "epoch": 0.81, "learning_rate": 9.327490173237024e-06, "loss": 2.2962, "step": 466460 }, { "epoch": 0.81, "learning_rate": 9.326618233310198e-06, "loss": 2.2354, "step": 466470 }, { "epoch": 0.81, "learning_rate": 9.32574629338337e-06, "loss": 2.1893, "step": 466480 }, { "epoch": 0.81, "learning_rate": 9.324874353456544e-06, "loss": 2.1898, "step": 466490 }, { "epoch": 0.81, "learning_rate": 9.32400241352972e-06, "loss": 2.2342, "step": 466500 }, { "epoch": 0.81, "learning_rate": 9.323130473602891e-06, "loss": 2.3733, "step": 466510 }, { "epoch": 0.81, "learning_rate": 9.322258533676065e-06, "loss": 2.1596, "step": 466520 }, { "epoch": 0.81, "learning_rate": 9.321386593749237e-06, "loss": 2.3527, "step": 466530 }, { "epoch": 0.81, "learning_rate": 9.320514653822411e-06, "loss": 2.2471, "step": 466540 }, { "epoch": 0.81, "learning_rate": 9.319642713895583e-06, "loss": 2.2877, "step": 466550 }, { "epoch": 0.81, "learning_rate": 9.318770773968757e-06, "loss": 2.2479, "step": 466560 }, { "epoch": 0.81, "learning_rate": 9.31789883404193e-06, "loss": 2.2463, "step": 466570 }, { "epoch": 0.81, "learning_rate": 9.317026894115104e-06, "loss": 2.2274, "step": 466580 }, { "epoch": 0.81, "learning_rate": 9.316154954188276e-06, "loss": 2.3215, "step": 466590 }, { "epoch": 0.81, "learning_rate": 9.31528301426145e-06, "loss": 2.1582, "step": 466600 }, { "epoch": 0.81, "learning_rate": 9.314411074334622e-06, "loss": 2.3235, "step": 466610 }, { "epoch": 0.81, "learning_rate": 9.313539134407796e-06, "loss": 2.1922, "step": 466620 }, { "epoch": 0.81, "learning_rate": 9.31266719448097e-06, "loss": 2.2843, "step": 466630 }, { "epoch": 0.81, "learning_rate": 9.311795254554142e-06, "loss": 2.2052, "step": 466640 }, { "epoch": 0.81, "learning_rate": 9.310923314627316e-06, "loss": 2.2298, "step": 466650 }, { "epoch": 0.81, "learning_rate": 9.31005137470049e-06, "loss": 2.1759, "step": 466660 }, { "epoch": 0.81, "learning_rate": 9.309179434773663e-06, "loss": 2.3576, "step": 466670 }, { "epoch": 0.81, "learning_rate": 9.308307494846835e-06, "loss": 2.1529, "step": 466680 }, { "epoch": 0.81, "learning_rate": 9.307435554920009e-06, "loss": 2.3027, "step": 466690 }, { "epoch": 0.81, "learning_rate": 9.306563614993181e-06, "loss": 2.2786, "step": 466700 }, { "epoch": 0.81, "learning_rate": 9.305691675066355e-06, "loss": 2.2102, "step": 466710 }, { "epoch": 0.81, "learning_rate": 9.304819735139527e-06, "loss": 2.1534, "step": 466720 }, { "epoch": 0.81, "learning_rate": 9.3039477952127e-06, "loss": 2.3403, "step": 466730 }, { "epoch": 0.81, "learning_rate": 9.303075855285875e-06, "loss": 2.2204, "step": 466740 }, { "epoch": 0.81, "learning_rate": 9.302203915359048e-06, "loss": 2.3151, "step": 466750 }, { "epoch": 0.81, "learning_rate": 9.301331975432222e-06, "loss": 2.3386, "step": 466760 }, { "epoch": 0.81, "learning_rate": 9.300460035505394e-06, "loss": 2.2802, "step": 466770 }, { "epoch": 0.81, "learning_rate": 9.299588095578568e-06, "loss": 2.296, "step": 466780 }, { "epoch": 0.81, "learning_rate": 9.29871615565174e-06, "loss": 2.2729, "step": 466790 }, { "epoch": 0.81, "learning_rate": 9.297844215724914e-06, "loss": 2.2986, "step": 466800 }, { "epoch": 0.81, "learning_rate": 9.296972275798088e-06, "loss": 2.3128, "step": 466810 }, { "epoch": 0.81, "learning_rate": 9.296100335871261e-06, "loss": 2.2972, "step": 466820 }, { "epoch": 0.81, "learning_rate": 9.295228395944433e-06, "loss": 2.3047, "step": 466830 }, { "epoch": 0.81, "learning_rate": 9.294356456017607e-06, "loss": 2.2326, "step": 466840 }, { "epoch": 0.81, "learning_rate": 9.29348451609078e-06, "loss": 2.3383, "step": 466850 }, { "epoch": 0.81, "learning_rate": 9.292612576163953e-06, "loss": 2.2055, "step": 466860 }, { "epoch": 0.81, "learning_rate": 9.291740636237125e-06, "loss": 2.2484, "step": 466870 }, { "epoch": 0.81, "learning_rate": 9.290868696310299e-06, "loss": 2.297, "step": 466880 }, { "epoch": 0.81, "learning_rate": 9.289996756383473e-06, "loss": 2.3011, "step": 466890 }, { "epoch": 0.81, "learning_rate": 9.289124816456646e-06, "loss": 2.2858, "step": 466900 }, { "epoch": 0.81, "learning_rate": 9.28825287652982e-06, "loss": 2.3175, "step": 466910 }, { "epoch": 0.81, "learning_rate": 9.287380936602992e-06, "loss": 2.277, "step": 466920 }, { "epoch": 0.81, "learning_rate": 9.286508996676166e-06, "loss": 2.1882, "step": 466930 }, { "epoch": 0.81, "learning_rate": 9.285637056749338e-06, "loss": 2.3222, "step": 466940 }, { "epoch": 0.81, "learning_rate": 9.284765116822512e-06, "loss": 2.3349, "step": 466950 }, { "epoch": 0.81, "learning_rate": 9.283893176895684e-06, "loss": 2.3449, "step": 466960 }, { "epoch": 0.81, "learning_rate": 9.283021236968858e-06, "loss": 2.387, "step": 466970 }, { "epoch": 0.81, "learning_rate": 9.282149297042031e-06, "loss": 2.2316, "step": 466980 }, { "epoch": 0.81, "learning_rate": 9.281277357115205e-06, "loss": 2.3111, "step": 466990 }, { "epoch": 0.81, "learning_rate": 9.280405417188377e-06, "loss": 2.2855, "step": 467000 }, { "epoch": 0.81, "learning_rate": 9.279533477261551e-06, "loss": 2.209, "step": 467010 }, { "epoch": 0.81, "learning_rate": 9.278661537334723e-06, "loss": 2.1707, "step": 467020 }, { "epoch": 0.81, "learning_rate": 9.277789597407897e-06, "loss": 2.189, "step": 467030 }, { "epoch": 0.81, "learning_rate": 9.27691765748107e-06, "loss": 2.3714, "step": 467040 }, { "epoch": 0.81, "learning_rate": 9.276045717554244e-06, "loss": 2.1723, "step": 467050 }, { "epoch": 0.81, "learning_rate": 9.275173777627418e-06, "loss": 2.1954, "step": 467060 }, { "epoch": 0.81, "learning_rate": 9.27430183770059e-06, "loss": 2.1512, "step": 467070 }, { "epoch": 0.81, "learning_rate": 9.273429897773764e-06, "loss": 2.2387, "step": 467080 }, { "epoch": 0.81, "learning_rate": 9.272557957846936e-06, "loss": 2.2259, "step": 467090 }, { "epoch": 0.81, "learning_rate": 9.27168601792011e-06, "loss": 2.235, "step": 467100 }, { "epoch": 0.81, "learning_rate": 9.270814077993282e-06, "loss": 2.344, "step": 467110 }, { "epoch": 0.81, "learning_rate": 9.269942138066456e-06, "loss": 2.3667, "step": 467120 }, { "epoch": 0.81, "learning_rate": 9.26907019813963e-06, "loss": 2.3357, "step": 467130 }, { "epoch": 0.81, "learning_rate": 9.268198258212803e-06, "loss": 2.2116, "step": 467140 }, { "epoch": 0.81, "learning_rate": 9.267326318285975e-06, "loss": 2.1586, "step": 467150 }, { "epoch": 0.81, "learning_rate": 9.26645437835915e-06, "loss": 2.2305, "step": 467160 }, { "epoch": 0.81, "learning_rate": 9.265582438432323e-06, "loss": 2.2312, "step": 467170 }, { "epoch": 0.81, "learning_rate": 9.264710498505495e-06, "loss": 2.3675, "step": 467180 }, { "epoch": 0.81, "learning_rate": 9.263838558578669e-06, "loss": 2.4337, "step": 467190 }, { "epoch": 0.81, "learning_rate": 9.262966618651841e-06, "loss": 2.1842, "step": 467200 }, { "epoch": 0.81, "learning_rate": 9.262094678725015e-06, "loss": 2.182, "step": 467210 }, { "epoch": 0.81, "learning_rate": 9.261222738798188e-06, "loss": 2.1124, "step": 467220 }, { "epoch": 0.81, "learning_rate": 9.260350798871362e-06, "loss": 2.0656, "step": 467230 }, { "epoch": 0.81, "learning_rate": 9.259478858944534e-06, "loss": 2.3149, "step": 467240 }, { "epoch": 0.81, "learning_rate": 9.258606919017708e-06, "loss": 2.2024, "step": 467250 }, { "epoch": 0.81, "learning_rate": 9.25773497909088e-06, "loss": 2.2931, "step": 467260 }, { "epoch": 0.81, "learning_rate": 9.256863039164054e-06, "loss": 2.3289, "step": 467270 }, { "epoch": 0.81, "learning_rate": 9.255991099237226e-06, "loss": 2.3462, "step": 467280 }, { "epoch": 0.81, "learning_rate": 9.255119159310401e-06, "loss": 2.1945, "step": 467290 }, { "epoch": 0.81, "learning_rate": 9.254247219383575e-06, "loss": 2.2288, "step": 467300 }, { "epoch": 0.81, "learning_rate": 9.253375279456747e-06, "loss": 2.315, "step": 467310 }, { "epoch": 0.81, "learning_rate": 9.252503339529921e-06, "loss": 2.3146, "step": 467320 }, { "epoch": 0.81, "learning_rate": 9.251631399603093e-06, "loss": 2.3032, "step": 467330 }, { "epoch": 0.81, "learning_rate": 9.250759459676267e-06, "loss": 2.2879, "step": 467340 }, { "epoch": 0.82, "learning_rate": 9.249887519749439e-06, "loss": 2.3432, "step": 467350 }, { "epoch": 0.82, "learning_rate": 9.249015579822613e-06, "loss": 2.2839, "step": 467360 }, { "epoch": 0.82, "learning_rate": 9.248143639895787e-06, "loss": 2.3281, "step": 467370 }, { "epoch": 0.82, "learning_rate": 9.24727169996896e-06, "loss": 2.2762, "step": 467380 }, { "epoch": 0.82, "learning_rate": 9.246399760042132e-06, "loss": 2.2475, "step": 467390 }, { "epoch": 0.82, "learning_rate": 9.245527820115306e-06, "loss": 2.3241, "step": 467400 }, { "epoch": 0.82, "learning_rate": 9.244655880188478e-06, "loss": 2.2361, "step": 467410 }, { "epoch": 0.82, "learning_rate": 9.243783940261652e-06, "loss": 2.3974, "step": 467420 }, { "epoch": 0.82, "learning_rate": 9.242912000334826e-06, "loss": 2.32, "step": 467430 }, { "epoch": 0.82, "learning_rate": 9.242040060407998e-06, "loss": 2.2903, "step": 467440 }, { "epoch": 0.82, "learning_rate": 9.241168120481172e-06, "loss": 2.3442, "step": 467450 }, { "epoch": 0.82, "learning_rate": 9.240296180554345e-06, "loss": 2.2708, "step": 467460 }, { "epoch": 0.82, "learning_rate": 9.239424240627519e-06, "loss": 2.2726, "step": 467470 }, { "epoch": 0.82, "learning_rate": 9.238552300700691e-06, "loss": 2.3186, "step": 467480 }, { "epoch": 0.82, "learning_rate": 9.237680360773865e-06, "loss": 2.2975, "step": 467490 }, { "epoch": 0.82, "learning_rate": 9.236808420847037e-06, "loss": 2.2826, "step": 467500 }, { "epoch": 0.82, "learning_rate": 9.23593648092021e-06, "loss": 2.2842, "step": 467510 }, { "epoch": 0.82, "learning_rate": 9.235064540993383e-06, "loss": 2.3007, "step": 467520 }, { "epoch": 0.82, "learning_rate": 9.234192601066557e-06, "loss": 2.356, "step": 467530 }, { "epoch": 0.82, "learning_rate": 9.23332066113973e-06, "loss": 2.2483, "step": 467540 }, { "epoch": 0.82, "learning_rate": 9.232448721212904e-06, "loss": 2.223, "step": 467550 }, { "epoch": 0.82, "learning_rate": 9.231576781286078e-06, "loss": 2.3014, "step": 467560 }, { "epoch": 0.82, "learning_rate": 9.23070484135925e-06, "loss": 2.3562, "step": 467570 }, { "epoch": 0.82, "learning_rate": 9.229832901432424e-06, "loss": 2.2077, "step": 467580 }, { "epoch": 0.82, "learning_rate": 9.228960961505596e-06, "loss": 2.2583, "step": 467590 }, { "epoch": 0.82, "learning_rate": 9.22808902157877e-06, "loss": 2.1645, "step": 467600 }, { "epoch": 0.82, "learning_rate": 9.227217081651943e-06, "loss": 2.241, "step": 467610 }, { "epoch": 0.82, "learning_rate": 9.226345141725117e-06, "loss": 2.3337, "step": 467620 }, { "epoch": 0.82, "learning_rate": 9.22547320179829e-06, "loss": 2.1825, "step": 467630 }, { "epoch": 0.82, "learning_rate": 9.224601261871463e-06, "loss": 2.233, "step": 467640 }, { "epoch": 0.82, "learning_rate": 9.223729321944635e-06, "loss": 2.2293, "step": 467650 }, { "epoch": 0.82, "learning_rate": 9.222857382017809e-06, "loss": 2.4142, "step": 467660 }, { "epoch": 0.82, "learning_rate": 9.221985442090981e-06, "loss": 2.1829, "step": 467670 }, { "epoch": 0.82, "learning_rate": 9.221113502164155e-06, "loss": 2.2704, "step": 467680 }, { "epoch": 0.82, "learning_rate": 9.220241562237329e-06, "loss": 2.2839, "step": 467690 }, { "epoch": 0.82, "learning_rate": 9.219369622310502e-06, "loss": 2.2508, "step": 467700 }, { "epoch": 0.82, "learning_rate": 9.218497682383676e-06, "loss": 2.2188, "step": 467710 }, { "epoch": 0.82, "learning_rate": 9.217625742456848e-06, "loss": 2.3241, "step": 467720 }, { "epoch": 0.82, "learning_rate": 9.216753802530022e-06, "loss": 2.2856, "step": 467730 }, { "epoch": 0.82, "learning_rate": 9.215881862603194e-06, "loss": 2.3172, "step": 467740 }, { "epoch": 0.82, "learning_rate": 9.215009922676368e-06, "loss": 2.2018, "step": 467750 }, { "epoch": 0.82, "learning_rate": 9.21413798274954e-06, "loss": 2.3564, "step": 467760 }, { "epoch": 0.82, "learning_rate": 9.213266042822714e-06, "loss": 2.3059, "step": 467770 }, { "epoch": 0.82, "learning_rate": 9.212394102895887e-06, "loss": 2.3248, "step": 467780 }, { "epoch": 0.82, "learning_rate": 9.211522162969061e-06, "loss": 2.2524, "step": 467790 }, { "epoch": 0.82, "learning_rate": 9.210650223042233e-06, "loss": 2.3678, "step": 467800 }, { "epoch": 0.82, "learning_rate": 9.209778283115407e-06, "loss": 2.3251, "step": 467810 }, { "epoch": 0.82, "learning_rate": 9.20890634318858e-06, "loss": 2.3311, "step": 467820 }, { "epoch": 0.82, "learning_rate": 9.208034403261753e-06, "loss": 2.2049, "step": 467830 }, { "epoch": 0.82, "learning_rate": 9.207162463334927e-06, "loss": 2.2403, "step": 467840 }, { "epoch": 0.82, "learning_rate": 9.2062905234081e-06, "loss": 2.267, "step": 467850 }, { "epoch": 0.82, "learning_rate": 9.205418583481274e-06, "loss": 2.3447, "step": 467860 }, { "epoch": 0.82, "learning_rate": 9.204546643554446e-06, "loss": 2.3002, "step": 467870 }, { "epoch": 0.82, "learning_rate": 9.20367470362762e-06, "loss": 2.141, "step": 467880 }, { "epoch": 0.82, "learning_rate": 9.202802763700792e-06, "loss": 2.313, "step": 467890 }, { "epoch": 0.82, "learning_rate": 9.201930823773966e-06, "loss": 2.2412, "step": 467900 }, { "epoch": 0.82, "learning_rate": 9.201058883847138e-06, "loss": 2.1512, "step": 467910 }, { "epoch": 0.82, "learning_rate": 9.200186943920312e-06, "loss": 2.1972, "step": 467920 }, { "epoch": 0.82, "learning_rate": 9.199315003993485e-06, "loss": 2.2759, "step": 467930 }, { "epoch": 0.82, "learning_rate": 9.19844306406666e-06, "loss": 2.3298, "step": 467940 }, { "epoch": 0.82, "learning_rate": 9.197571124139831e-06, "loss": 2.2534, "step": 467950 }, { "epoch": 0.82, "learning_rate": 9.196699184213005e-06, "loss": 2.3734, "step": 467960 }, { "epoch": 0.82, "learning_rate": 9.195827244286179e-06, "loss": 2.3367, "step": 467970 }, { "epoch": 0.82, "learning_rate": 9.194955304359351e-06, "loss": 2.3283, "step": 467980 }, { "epoch": 0.82, "learning_rate": 9.194083364432525e-06, "loss": 2.3422, "step": 467990 }, { "epoch": 0.82, "learning_rate": 9.193211424505697e-06, "loss": 2.2276, "step": 468000 }, { "epoch": 0.82, "learning_rate": 9.19233948457887e-06, "loss": 2.2684, "step": 468010 }, { "epoch": 0.82, "learning_rate": 9.191467544652044e-06, "loss": 2.2105, "step": 468020 }, { "epoch": 0.82, "learning_rate": 9.190595604725218e-06, "loss": 2.2653, "step": 468030 }, { "epoch": 0.82, "learning_rate": 9.18972366479839e-06, "loss": 2.1734, "step": 468040 }, { "epoch": 0.82, "learning_rate": 9.188851724871564e-06, "loss": 2.2813, "step": 468050 }, { "epoch": 0.82, "learning_rate": 9.187979784944736e-06, "loss": 2.1684, "step": 468060 }, { "epoch": 0.82, "learning_rate": 9.18710784501791e-06, "loss": 2.3769, "step": 468070 }, { "epoch": 0.82, "learning_rate": 9.186235905091082e-06, "loss": 2.3903, "step": 468080 }, { "epoch": 0.82, "learning_rate": 9.185363965164257e-06, "loss": 2.3361, "step": 468090 }, { "epoch": 0.82, "learning_rate": 9.184492025237431e-06, "loss": 2.1425, "step": 468100 }, { "epoch": 0.82, "learning_rate": 9.183620085310603e-06, "loss": 2.2307, "step": 468110 }, { "epoch": 0.82, "learning_rate": 9.182748145383777e-06, "loss": 2.2734, "step": 468120 }, { "epoch": 0.82, "learning_rate": 9.181876205456949e-06, "loss": 2.1466, "step": 468130 }, { "epoch": 0.82, "learning_rate": 9.181004265530123e-06, "loss": 2.0652, "step": 468140 }, { "epoch": 0.82, "learning_rate": 9.180132325603295e-06, "loss": 2.2047, "step": 468150 }, { "epoch": 0.82, "learning_rate": 9.179260385676469e-06, "loss": 2.271, "step": 468160 }, { "epoch": 0.82, "learning_rate": 9.178388445749642e-06, "loss": 2.2627, "step": 468170 }, { "epoch": 0.82, "learning_rate": 9.177516505822816e-06, "loss": 2.186, "step": 468180 }, { "epoch": 0.82, "learning_rate": 9.176644565895988e-06, "loss": 2.3584, "step": 468190 }, { "epoch": 0.82, "learning_rate": 9.175772625969162e-06, "loss": 2.2742, "step": 468200 }, { "epoch": 0.82, "learning_rate": 9.174900686042334e-06, "loss": 2.3025, "step": 468210 }, { "epoch": 0.82, "learning_rate": 9.174028746115508e-06, "loss": 2.3355, "step": 468220 }, { "epoch": 0.82, "learning_rate": 9.173156806188682e-06, "loss": 2.3216, "step": 468230 }, { "epoch": 0.82, "learning_rate": 9.172284866261854e-06, "loss": 2.2914, "step": 468240 }, { "epoch": 0.82, "learning_rate": 9.171412926335027e-06, "loss": 2.1688, "step": 468250 }, { "epoch": 0.82, "learning_rate": 9.170540986408201e-06, "loss": 2.2208, "step": 468260 }, { "epoch": 0.82, "learning_rate": 9.169669046481375e-06, "loss": 2.3006, "step": 468270 }, { "epoch": 0.82, "learning_rate": 9.168797106554547e-06, "loss": 2.1131, "step": 468280 }, { "epoch": 0.82, "learning_rate": 9.16792516662772e-06, "loss": 2.2219, "step": 468290 }, { "epoch": 0.82, "learning_rate": 9.167053226700893e-06, "loss": 2.2103, "step": 468300 }, { "epoch": 0.82, "learning_rate": 9.166181286774067e-06, "loss": 2.2508, "step": 468310 }, { "epoch": 0.82, "learning_rate": 9.165309346847239e-06, "loss": 2.1679, "step": 468320 }, { "epoch": 0.82, "learning_rate": 9.164437406920414e-06, "loss": 2.2483, "step": 468330 }, { "epoch": 0.82, "learning_rate": 9.163565466993586e-06, "loss": 2.2864, "step": 468340 }, { "epoch": 0.82, "learning_rate": 9.16269352706676e-06, "loss": 2.2955, "step": 468350 }, { "epoch": 0.82, "learning_rate": 9.161821587139934e-06, "loss": 2.1778, "step": 468360 }, { "epoch": 0.82, "learning_rate": 9.160949647213106e-06, "loss": 2.2808, "step": 468370 }, { "epoch": 0.82, "learning_rate": 9.16007770728628e-06, "loss": 2.4207, "step": 468380 }, { "epoch": 0.82, "learning_rate": 9.159205767359452e-06, "loss": 2.331, "step": 468390 }, { "epoch": 0.82, "learning_rate": 9.158333827432626e-06, "loss": 2.2517, "step": 468400 }, { "epoch": 0.82, "learning_rate": 9.1574618875058e-06, "loss": 2.2853, "step": 468410 }, { "epoch": 0.82, "learning_rate": 9.156589947578973e-06, "loss": 2.3439, "step": 468420 }, { "epoch": 0.82, "learning_rate": 9.155718007652145e-06, "loss": 2.1823, "step": 468430 }, { "epoch": 0.82, "learning_rate": 9.154846067725319e-06, "loss": 2.3649, "step": 468440 }, { "epoch": 0.82, "learning_rate": 9.153974127798491e-06, "loss": 2.3817, "step": 468450 }, { "epoch": 0.82, "learning_rate": 9.153102187871665e-06, "loss": 2.2466, "step": 468460 }, { "epoch": 0.82, "learning_rate": 9.152230247944837e-06, "loss": 2.3161, "step": 468470 }, { "epoch": 0.82, "learning_rate": 9.15135830801801e-06, "loss": 2.2858, "step": 468480 }, { "epoch": 0.82, "learning_rate": 9.150486368091184e-06, "loss": 2.3134, "step": 468490 }, { "epoch": 0.82, "learning_rate": 9.149614428164358e-06, "loss": 2.3862, "step": 468500 }, { "epoch": 0.82, "learning_rate": 9.148742488237532e-06, "loss": 2.2782, "step": 468510 }, { "epoch": 0.82, "learning_rate": 9.147870548310704e-06, "loss": 2.2557, "step": 468520 }, { "epoch": 0.82, "learning_rate": 9.146998608383878e-06, "loss": 2.3245, "step": 468530 }, { "epoch": 0.82, "learning_rate": 9.14612666845705e-06, "loss": 2.3153, "step": 468540 }, { "epoch": 0.82, "learning_rate": 9.145254728530224e-06, "loss": 2.3127, "step": 468550 }, { "epoch": 0.82, "learning_rate": 9.144382788603396e-06, "loss": 2.1938, "step": 468560 }, { "epoch": 0.82, "learning_rate": 9.14351084867657e-06, "loss": 2.4423, "step": 468570 }, { "epoch": 0.82, "learning_rate": 9.142638908749743e-06, "loss": 2.2886, "step": 468580 }, { "epoch": 0.82, "learning_rate": 9.141766968822917e-06, "loss": 2.2553, "step": 468590 }, { "epoch": 0.82, "learning_rate": 9.140895028896089e-06, "loss": 2.3233, "step": 468600 }, { "epoch": 0.82, "learning_rate": 9.140023088969263e-06, "loss": 2.1605, "step": 468610 }, { "epoch": 0.82, "learning_rate": 9.139151149042437e-06, "loss": 2.3378, "step": 468620 }, { "epoch": 0.82, "learning_rate": 9.138279209115609e-06, "loss": 2.3131, "step": 468630 }, { "epoch": 0.82, "learning_rate": 9.137407269188782e-06, "loss": 2.3007, "step": 468640 }, { "epoch": 0.82, "learning_rate": 9.136535329261956e-06, "loss": 2.2896, "step": 468650 }, { "epoch": 0.82, "learning_rate": 9.13566338933513e-06, "loss": 2.233, "step": 468660 }, { "epoch": 0.82, "learning_rate": 9.134791449408302e-06, "loss": 2.2624, "step": 468670 }, { "epoch": 0.82, "learning_rate": 9.133919509481476e-06, "loss": 2.262, "step": 468680 }, { "epoch": 0.82, "learning_rate": 9.133047569554648e-06, "loss": 2.1692, "step": 468690 }, { "epoch": 0.82, "learning_rate": 9.132175629627822e-06, "loss": 2.2785, "step": 468700 }, { "epoch": 0.82, "learning_rate": 9.131303689700994e-06, "loss": 2.3209, "step": 468710 }, { "epoch": 0.82, "learning_rate": 9.130431749774168e-06, "loss": 2.2886, "step": 468720 }, { "epoch": 0.82, "learning_rate": 9.129559809847341e-06, "loss": 2.2217, "step": 468730 }, { "epoch": 0.82, "learning_rate": 9.128687869920515e-06, "loss": 2.3472, "step": 468740 }, { "epoch": 0.82, "learning_rate": 9.127815929993687e-06, "loss": 2.3806, "step": 468750 }, { "epoch": 0.82, "learning_rate": 9.126943990066861e-06, "loss": 2.3404, "step": 468760 }, { "epoch": 0.82, "learning_rate": 9.126072050140035e-06, "loss": 2.0481, "step": 468770 }, { "epoch": 0.82, "learning_rate": 9.125200110213207e-06, "loss": 2.2696, "step": 468780 }, { "epoch": 0.82, "learning_rate": 9.12432817028638e-06, "loss": 2.2651, "step": 468790 }, { "epoch": 0.82, "learning_rate": 9.123456230359553e-06, "loss": 2.2784, "step": 468800 }, { "epoch": 0.82, "learning_rate": 9.122584290432726e-06, "loss": 2.1997, "step": 468810 }, { "epoch": 0.82, "learning_rate": 9.1217123505059e-06, "loss": 2.2773, "step": 468820 }, { "epoch": 0.82, "learning_rate": 9.120840410579074e-06, "loss": 2.3827, "step": 468830 }, { "epoch": 0.82, "learning_rate": 9.119968470652246e-06, "loss": 2.2225, "step": 468840 }, { "epoch": 0.82, "learning_rate": 9.11909653072542e-06, "loss": 2.3505, "step": 468850 }, { "epoch": 0.82, "learning_rate": 9.118224590798592e-06, "loss": 2.2118, "step": 468860 }, { "epoch": 0.82, "learning_rate": 9.117352650871766e-06, "loss": 2.2007, "step": 468870 }, { "epoch": 0.82, "learning_rate": 9.116480710944938e-06, "loss": 2.166, "step": 468880 }, { "epoch": 0.82, "learning_rate": 9.115608771018113e-06, "loss": 2.3598, "step": 468890 }, { "epoch": 0.82, "learning_rate": 9.114736831091287e-06, "loss": 2.3382, "step": 468900 }, { "epoch": 0.82, "learning_rate": 9.113864891164459e-06, "loss": 2.3267, "step": 468910 }, { "epoch": 0.82, "learning_rate": 9.112992951237633e-06, "loss": 2.2422, "step": 468920 }, { "epoch": 0.82, "learning_rate": 9.112121011310805e-06, "loss": 2.2278, "step": 468930 }, { "epoch": 0.82, "learning_rate": 9.111249071383979e-06, "loss": 2.2207, "step": 468940 }, { "epoch": 0.82, "learning_rate": 9.11037713145715e-06, "loss": 2.2949, "step": 468950 }, { "epoch": 0.82, "learning_rate": 9.109505191530324e-06, "loss": 2.1944, "step": 468960 }, { "epoch": 0.82, "learning_rate": 9.108633251603498e-06, "loss": 2.3121, "step": 468970 }, { "epoch": 0.82, "learning_rate": 9.107761311676672e-06, "loss": 2.3398, "step": 468980 }, { "epoch": 0.82, "learning_rate": 9.106889371749844e-06, "loss": 2.2927, "step": 468990 }, { "epoch": 0.82, "learning_rate": 9.106017431823018e-06, "loss": 2.2454, "step": 469000 }, { "epoch": 0.82, "learning_rate": 9.10514549189619e-06, "loss": 2.3898, "step": 469010 }, { "epoch": 0.82, "learning_rate": 9.104273551969364e-06, "loss": 2.2775, "step": 469020 }, { "epoch": 0.82, "learning_rate": 9.103401612042537e-06, "loss": 2.2213, "step": 469030 }, { "epoch": 0.82, "learning_rate": 9.10252967211571e-06, "loss": 2.3986, "step": 469040 }, { "epoch": 0.82, "learning_rate": 9.101657732188883e-06, "loss": 2.2416, "step": 469050 }, { "epoch": 0.82, "learning_rate": 9.100785792262057e-06, "loss": 2.2836, "step": 469060 }, { "epoch": 0.82, "learning_rate": 9.09991385233523e-06, "loss": 2.3326, "step": 469070 }, { "epoch": 0.82, "learning_rate": 9.099041912408403e-06, "loss": 2.3263, "step": 469080 }, { "epoch": 0.82, "learning_rate": 9.098169972481577e-06, "loss": 2.2627, "step": 469090 }, { "epoch": 0.82, "learning_rate": 9.097298032554749e-06, "loss": 2.3651, "step": 469100 }, { "epoch": 0.82, "learning_rate": 9.096426092627923e-06, "loss": 2.2397, "step": 469110 }, { "epoch": 0.82, "learning_rate": 9.095554152701095e-06, "loss": 2.2586, "step": 469120 }, { "epoch": 0.82, "learning_rate": 9.09468221277427e-06, "loss": 2.2821, "step": 469130 }, { "epoch": 0.82, "learning_rate": 9.093810272847442e-06, "loss": 2.2996, "step": 469140 }, { "epoch": 0.82, "learning_rate": 9.092938332920616e-06, "loss": 2.2071, "step": 469150 }, { "epoch": 0.82, "learning_rate": 9.09206639299379e-06, "loss": 2.3098, "step": 469160 }, { "epoch": 0.82, "learning_rate": 9.091194453066962e-06, "loss": 2.2811, "step": 469170 }, { "epoch": 0.82, "learning_rate": 9.090322513140136e-06, "loss": 2.2337, "step": 469180 }, { "epoch": 0.82, "learning_rate": 9.089450573213308e-06, "loss": 2.3442, "step": 469190 }, { "epoch": 0.82, "learning_rate": 9.088578633286481e-06, "loss": 2.2529, "step": 469200 }, { "epoch": 0.82, "learning_rate": 9.087706693359655e-06, "loss": 2.2271, "step": 469210 }, { "epoch": 0.82, "learning_rate": 9.086834753432829e-06, "loss": 2.3481, "step": 469220 }, { "epoch": 0.82, "learning_rate": 9.085962813506001e-06, "loss": 2.2435, "step": 469230 }, { "epoch": 0.82, "learning_rate": 9.085090873579175e-06, "loss": 2.2631, "step": 469240 }, { "epoch": 0.82, "learning_rate": 9.084218933652347e-06, "loss": 2.3589, "step": 469250 }, { "epoch": 0.82, "learning_rate": 9.08334699372552e-06, "loss": 2.3235, "step": 469260 }, { "epoch": 0.82, "learning_rate": 9.082475053798693e-06, "loss": 2.2593, "step": 469270 }, { "epoch": 0.82, "learning_rate": 9.081603113871866e-06, "loss": 2.3189, "step": 469280 }, { "epoch": 0.82, "learning_rate": 9.08073117394504e-06, "loss": 2.2881, "step": 469290 }, { "epoch": 0.82, "learning_rate": 9.079859234018214e-06, "loss": 2.2916, "step": 469300 }, { "epoch": 0.82, "learning_rate": 9.078987294091388e-06, "loss": 2.2616, "step": 469310 }, { "epoch": 0.82, "learning_rate": 9.07811535416456e-06, "loss": 2.2874, "step": 469320 }, { "epoch": 0.82, "learning_rate": 9.077243414237734e-06, "loss": 2.3071, "step": 469330 }, { "epoch": 0.82, "learning_rate": 9.076371474310906e-06, "loss": 2.3332, "step": 469340 }, { "epoch": 0.82, "learning_rate": 9.07549953438408e-06, "loss": 2.4219, "step": 469350 }, { "epoch": 0.82, "learning_rate": 9.074627594457252e-06, "loss": 2.3301, "step": 469360 }, { "epoch": 0.82, "learning_rate": 9.073755654530427e-06, "loss": 2.3133, "step": 469370 }, { "epoch": 0.82, "learning_rate": 9.072883714603599e-06, "loss": 2.1245, "step": 469380 }, { "epoch": 0.82, "learning_rate": 9.072011774676773e-06, "loss": 2.24, "step": 469390 }, { "epoch": 0.82, "learning_rate": 9.071139834749945e-06, "loss": 2.2544, "step": 469400 }, { "epoch": 0.82, "learning_rate": 9.070267894823119e-06, "loss": 2.2795, "step": 469410 }, { "epoch": 0.82, "learning_rate": 9.069395954896292e-06, "loss": 2.1665, "step": 469420 }, { "epoch": 0.82, "learning_rate": 9.068524014969465e-06, "loss": 2.3691, "step": 469430 }, { "epoch": 0.82, "learning_rate": 9.067652075042638e-06, "loss": 2.2463, "step": 469440 }, { "epoch": 0.82, "learning_rate": 9.066780135115812e-06, "loss": 2.292, "step": 469450 }, { "epoch": 0.82, "learning_rate": 9.065908195188986e-06, "loss": 2.3023, "step": 469460 }, { "epoch": 0.82, "learning_rate": 9.065036255262158e-06, "loss": 2.3804, "step": 469470 }, { "epoch": 0.82, "learning_rate": 9.064164315335332e-06, "loss": 2.1864, "step": 469480 }, { "epoch": 0.82, "learning_rate": 9.063292375408504e-06, "loss": 2.1579, "step": 469490 }, { "epoch": 0.82, "learning_rate": 9.062420435481678e-06, "loss": 2.309, "step": 469500 }, { "epoch": 0.82, "learning_rate": 9.06154849555485e-06, "loss": 2.3089, "step": 469510 }, { "epoch": 0.82, "learning_rate": 9.060676555628023e-06, "loss": 2.3672, "step": 469520 }, { "epoch": 0.82, "learning_rate": 9.059804615701197e-06, "loss": 2.3495, "step": 469530 }, { "epoch": 0.82, "learning_rate": 9.058932675774371e-06, "loss": 2.2828, "step": 469540 }, { "epoch": 0.82, "learning_rate": 9.058060735847545e-06, "loss": 2.1853, "step": 469550 }, { "epoch": 0.82, "learning_rate": 9.057188795920717e-06, "loss": 2.352, "step": 469560 }, { "epoch": 0.82, "learning_rate": 9.05631685599389e-06, "loss": 2.3477, "step": 469570 }, { "epoch": 0.82, "learning_rate": 9.055444916067063e-06, "loss": 2.233, "step": 469580 }, { "epoch": 0.82, "learning_rate": 9.054572976140236e-06, "loss": 2.2785, "step": 469590 }, { "epoch": 0.82, "learning_rate": 9.053701036213408e-06, "loss": 2.333, "step": 469600 }, { "epoch": 0.82, "learning_rate": 9.052829096286582e-06, "loss": 2.2848, "step": 469610 }, { "epoch": 0.82, "learning_rate": 9.051957156359756e-06, "loss": 2.1815, "step": 469620 }, { "epoch": 0.82, "learning_rate": 9.05108521643293e-06, "loss": 2.2387, "step": 469630 }, { "epoch": 0.82, "learning_rate": 9.050213276506102e-06, "loss": 2.3014, "step": 469640 }, { "epoch": 0.82, "learning_rate": 9.049341336579276e-06, "loss": 2.3718, "step": 469650 }, { "epoch": 0.82, "learning_rate": 9.048469396652448e-06, "loss": 2.1547, "step": 469660 }, { "epoch": 0.82, "learning_rate": 9.047597456725621e-06, "loss": 2.191, "step": 469670 }, { "epoch": 0.82, "learning_rate": 9.046725516798795e-06, "loss": 2.2652, "step": 469680 }, { "epoch": 0.82, "learning_rate": 9.045853576871969e-06, "loss": 2.3063, "step": 469690 }, { "epoch": 0.82, "learning_rate": 9.044981636945143e-06, "loss": 2.2039, "step": 469700 }, { "epoch": 0.82, "learning_rate": 9.044109697018315e-06, "loss": 2.2437, "step": 469710 }, { "epoch": 0.82, "learning_rate": 9.043237757091489e-06, "loss": 2.3204, "step": 469720 }, { "epoch": 0.82, "learning_rate": 9.04236581716466e-06, "loss": 2.2554, "step": 469730 }, { "epoch": 0.82, "learning_rate": 9.041493877237834e-06, "loss": 2.224, "step": 469740 }, { "epoch": 0.82, "learning_rate": 9.040621937311007e-06, "loss": 2.2728, "step": 469750 }, { "epoch": 0.82, "learning_rate": 9.03974999738418e-06, "loss": 2.3063, "step": 469760 }, { "epoch": 0.82, "learning_rate": 9.038878057457354e-06, "loss": 2.2609, "step": 469770 }, { "epoch": 0.82, "learning_rate": 9.038006117530528e-06, "loss": 2.2222, "step": 469780 }, { "epoch": 0.82, "learning_rate": 9.0371341776037e-06, "loss": 2.338, "step": 469790 }, { "epoch": 0.82, "learning_rate": 9.036262237676874e-06, "loss": 2.3101, "step": 469800 }, { "epoch": 0.82, "learning_rate": 9.035390297750046e-06, "loss": 2.2036, "step": 469810 }, { "epoch": 0.82, "learning_rate": 9.03451835782322e-06, "loss": 2.3274, "step": 469820 }, { "epoch": 0.82, "learning_rate": 9.033646417896393e-06, "loss": 2.2299, "step": 469830 }, { "epoch": 0.82, "learning_rate": 9.032774477969565e-06, "loss": 2.2768, "step": 469840 }, { "epoch": 0.82, "learning_rate": 9.031902538042739e-06, "loss": 2.2164, "step": 469850 }, { "epoch": 0.82, "learning_rate": 9.031030598115913e-06, "loss": 2.24, "step": 469860 }, { "epoch": 0.82, "learning_rate": 9.030158658189087e-06, "loss": 2.2611, "step": 469870 }, { "epoch": 0.82, "learning_rate": 9.029286718262259e-06, "loss": 2.3425, "step": 469880 }, { "epoch": 0.82, "learning_rate": 9.028414778335433e-06, "loss": 2.1837, "step": 469890 }, { "epoch": 0.82, "learning_rate": 9.027542838408605e-06, "loss": 2.2721, "step": 469900 }, { "epoch": 0.82, "learning_rate": 9.026670898481778e-06, "loss": 2.2771, "step": 469910 }, { "epoch": 0.82, "learning_rate": 9.02579895855495e-06, "loss": 2.3608, "step": 469920 }, { "epoch": 0.82, "learning_rate": 9.024927018628126e-06, "loss": 2.2734, "step": 469930 }, { "epoch": 0.82, "learning_rate": 9.024055078701298e-06, "loss": 2.1884, "step": 469940 }, { "epoch": 0.82, "learning_rate": 9.023183138774472e-06, "loss": 2.3059, "step": 469950 }, { "epoch": 0.82, "learning_rate": 9.022311198847646e-06, "loss": 2.2906, "step": 469960 }, { "epoch": 0.82, "learning_rate": 9.021439258920818e-06, "loss": 2.3393, "step": 469970 }, { "epoch": 0.82, "learning_rate": 9.020567318993991e-06, "loss": 2.2146, "step": 469980 }, { "epoch": 0.82, "learning_rate": 9.019695379067163e-06, "loss": 2.2807, "step": 469990 }, { "epoch": 0.82, "learning_rate": 9.018823439140337e-06, "loss": 2.1978, "step": 470000 }, { "epoch": 0.82, "learning_rate": 9.017951499213511e-06, "loss": 2.2935, "step": 470010 }, { "epoch": 0.82, "learning_rate": 9.017079559286685e-06, "loss": 2.2789, "step": 470020 }, { "epoch": 0.82, "learning_rate": 9.016207619359857e-06, "loss": 2.2992, "step": 470030 }, { "epoch": 0.82, "learning_rate": 9.01533567943303e-06, "loss": 2.1447, "step": 470040 }, { "epoch": 0.82, "learning_rate": 9.014463739506203e-06, "loss": 2.2367, "step": 470050 }, { "epoch": 0.82, "learning_rate": 9.013591799579376e-06, "loss": 2.307, "step": 470060 }, { "epoch": 0.82, "learning_rate": 9.012719859652549e-06, "loss": 2.3357, "step": 470070 }, { "epoch": 0.82, "learning_rate": 9.011847919725722e-06, "loss": 2.3171, "step": 470080 }, { "epoch": 0.82, "learning_rate": 9.010975979798896e-06, "loss": 2.3004, "step": 470090 }, { "epoch": 0.82, "learning_rate": 9.01010403987207e-06, "loss": 2.3763, "step": 470100 }, { "epoch": 0.82, "learning_rate": 9.009232099945244e-06, "loss": 2.2863, "step": 470110 }, { "epoch": 0.82, "learning_rate": 9.008360160018416e-06, "loss": 2.3619, "step": 470120 }, { "epoch": 0.82, "learning_rate": 9.00748822009159e-06, "loss": 2.2901, "step": 470130 }, { "epoch": 0.82, "learning_rate": 9.006616280164762e-06, "loss": 2.3602, "step": 470140 }, { "epoch": 0.82, "learning_rate": 9.005744340237935e-06, "loss": 2.2646, "step": 470150 }, { "epoch": 0.82, "learning_rate": 9.004872400311107e-06, "loss": 2.2879, "step": 470160 }, { "epoch": 0.82, "learning_rate": 9.004000460384283e-06, "loss": 2.2794, "step": 470170 }, { "epoch": 0.82, "learning_rate": 9.003128520457455e-06, "loss": 2.1933, "step": 470180 }, { "epoch": 0.82, "learning_rate": 9.002256580530629e-06, "loss": 2.3553, "step": 470190 }, { "epoch": 0.82, "learning_rate": 9.0013846406038e-06, "loss": 2.2722, "step": 470200 }, { "epoch": 0.82, "learning_rate": 9.000512700676975e-06, "loss": 2.3319, "step": 470210 }, { "epoch": 0.82, "learning_rate": 8.999640760750148e-06, "loss": 2.362, "step": 470220 }, { "epoch": 0.82, "learning_rate": 8.99876882082332e-06, "loss": 2.2248, "step": 470230 }, { "epoch": 0.82, "learning_rate": 8.997896880896494e-06, "loss": 2.3041, "step": 470240 }, { "epoch": 0.82, "learning_rate": 8.997024940969668e-06, "loss": 2.3115, "step": 470250 }, { "epoch": 0.82, "learning_rate": 8.996153001042842e-06, "loss": 2.2544, "step": 470260 }, { "epoch": 0.82, "learning_rate": 8.995281061116014e-06, "loss": 2.2256, "step": 470270 }, { "epoch": 0.82, "learning_rate": 8.994409121189188e-06, "loss": 2.329, "step": 470280 }, { "epoch": 0.82, "learning_rate": 8.99353718126236e-06, "loss": 2.2246, "step": 470290 }, { "epoch": 0.82, "learning_rate": 8.992665241335533e-06, "loss": 2.1667, "step": 470300 }, { "epoch": 0.82, "learning_rate": 8.991793301408705e-06, "loss": 2.2255, "step": 470310 }, { "epoch": 0.82, "learning_rate": 8.99092136148188e-06, "loss": 2.3512, "step": 470320 }, { "epoch": 0.82, "learning_rate": 8.990049421555053e-06, "loss": 2.3446, "step": 470330 }, { "epoch": 0.82, "learning_rate": 8.989177481628227e-06, "loss": 2.3352, "step": 470340 }, { "epoch": 0.82, "learning_rate": 8.9883055417014e-06, "loss": 2.4277, "step": 470350 }, { "epoch": 0.82, "learning_rate": 8.987433601774573e-06, "loss": 2.2606, "step": 470360 }, { "epoch": 0.82, "learning_rate": 8.986561661847746e-06, "loss": 2.3451, "step": 470370 }, { "epoch": 0.82, "learning_rate": 8.985689721920918e-06, "loss": 2.2084, "step": 470380 }, { "epoch": 0.82, "learning_rate": 8.984817781994092e-06, "loss": 2.4582, "step": 470390 }, { "epoch": 0.82, "learning_rate": 8.983945842067264e-06, "loss": 2.2351, "step": 470400 }, { "epoch": 0.82, "learning_rate": 8.98307390214044e-06, "loss": 2.2755, "step": 470410 }, { "epoch": 0.82, "learning_rate": 8.982201962213612e-06, "loss": 2.2769, "step": 470420 }, { "epoch": 0.82, "learning_rate": 8.981330022286786e-06, "loss": 2.3406, "step": 470430 }, { "epoch": 0.82, "learning_rate": 8.980458082359958e-06, "loss": 2.1775, "step": 470440 }, { "epoch": 0.82, "learning_rate": 8.979586142433131e-06, "loss": 2.2645, "step": 470450 }, { "epoch": 0.82, "learning_rate": 8.978714202506304e-06, "loss": 2.3645, "step": 470460 }, { "epoch": 0.82, "learning_rate": 8.977842262579477e-06, "loss": 2.2887, "step": 470470 }, { "epoch": 0.82, "learning_rate": 8.976970322652651e-06, "loss": 2.3165, "step": 470480 }, { "epoch": 0.82, "learning_rate": 8.976098382725825e-06, "loss": 2.3074, "step": 470490 }, { "epoch": 0.82, "learning_rate": 8.975226442798999e-06, "loss": 2.1606, "step": 470500 }, { "epoch": 0.82, "learning_rate": 8.97435450287217e-06, "loss": 2.3953, "step": 470510 }, { "epoch": 0.82, "learning_rate": 8.973482562945344e-06, "loss": 2.3507, "step": 470520 }, { "epoch": 0.82, "learning_rate": 8.972610623018517e-06, "loss": 2.3354, "step": 470530 }, { "epoch": 0.82, "learning_rate": 8.97173868309169e-06, "loss": 2.347, "step": 470540 }, { "epoch": 0.82, "learning_rate": 8.970866743164862e-06, "loss": 2.3194, "step": 470550 }, { "epoch": 0.82, "learning_rate": 8.969994803238036e-06, "loss": 2.2947, "step": 470560 }, { "epoch": 0.82, "learning_rate": 8.96912286331121e-06, "loss": 2.2447, "step": 470570 }, { "epoch": 0.82, "learning_rate": 8.968250923384384e-06, "loss": 2.2683, "step": 470580 }, { "epoch": 0.82, "learning_rate": 8.967378983457556e-06, "loss": 2.2034, "step": 470590 }, { "epoch": 0.82, "learning_rate": 8.96650704353073e-06, "loss": 2.1965, "step": 470600 }, { "epoch": 0.82, "learning_rate": 8.965635103603902e-06, "loss": 2.3429, "step": 470610 }, { "epoch": 0.82, "learning_rate": 8.964763163677075e-06, "loss": 2.2145, "step": 470620 }, { "epoch": 0.82, "learning_rate": 8.963891223750249e-06, "loss": 2.37, "step": 470630 }, { "epoch": 0.82, "learning_rate": 8.963019283823421e-06, "loss": 2.229, "step": 470640 }, { "epoch": 0.82, "learning_rate": 8.962147343896595e-06, "loss": 2.3708, "step": 470650 }, { "epoch": 0.82, "learning_rate": 8.961275403969769e-06, "loss": 2.3356, "step": 470660 }, { "epoch": 0.82, "learning_rate": 8.960403464042943e-06, "loss": 2.3393, "step": 470670 }, { "epoch": 0.82, "learning_rate": 8.959531524116115e-06, "loss": 2.2832, "step": 470680 }, { "epoch": 0.82, "learning_rate": 8.958659584189288e-06, "loss": 2.2011, "step": 470690 }, { "epoch": 0.82, "learning_rate": 8.95778764426246e-06, "loss": 2.233, "step": 470700 }, { "epoch": 0.82, "learning_rate": 8.956915704335634e-06, "loss": 2.379, "step": 470710 }, { "epoch": 0.82, "learning_rate": 8.956043764408808e-06, "loss": 2.2044, "step": 470720 }, { "epoch": 0.82, "learning_rate": 8.955171824481982e-06, "loss": 2.2273, "step": 470730 }, { "epoch": 0.82, "learning_rate": 8.954299884555154e-06, "loss": 2.245, "step": 470740 }, { "epoch": 0.82, "learning_rate": 8.953427944628328e-06, "loss": 2.3943, "step": 470750 }, { "epoch": 0.82, "learning_rate": 8.952556004701501e-06, "loss": 2.3144, "step": 470760 }, { "epoch": 0.82, "learning_rate": 8.951684064774673e-06, "loss": 2.319, "step": 470770 }, { "epoch": 0.82, "learning_rate": 8.950812124847847e-06, "loss": 2.3146, "step": 470780 }, { "epoch": 0.82, "learning_rate": 8.94994018492102e-06, "loss": 2.178, "step": 470790 }, { "epoch": 0.82, "learning_rate": 8.949068244994193e-06, "loss": 2.236, "step": 470800 }, { "epoch": 0.82, "learning_rate": 8.948196305067367e-06, "loss": 2.2978, "step": 470810 }, { "epoch": 0.82, "learning_rate": 8.94732436514054e-06, "loss": 2.3081, "step": 470820 }, { "epoch": 0.82, "learning_rate": 8.946452425213713e-06, "loss": 2.2409, "step": 470830 }, { "epoch": 0.82, "learning_rate": 8.945580485286886e-06, "loss": 2.2516, "step": 470840 }, { "epoch": 0.82, "learning_rate": 8.944708545360059e-06, "loss": 2.2637, "step": 470850 }, { "epoch": 0.82, "learning_rate": 8.943836605433232e-06, "loss": 2.297, "step": 470860 }, { "epoch": 0.82, "learning_rate": 8.942964665506404e-06, "loss": 2.3507, "step": 470870 }, { "epoch": 0.82, "learning_rate": 8.942092725579578e-06, "loss": 2.2601, "step": 470880 }, { "epoch": 0.82, "learning_rate": 8.941220785652752e-06, "loss": 2.3266, "step": 470890 }, { "epoch": 0.82, "learning_rate": 8.940348845725926e-06, "loss": 2.2527, "step": 470900 }, { "epoch": 0.82, "learning_rate": 8.9394769057991e-06, "loss": 2.3043, "step": 470910 }, { "epoch": 0.82, "learning_rate": 8.938604965872272e-06, "loss": 2.2606, "step": 470920 }, { "epoch": 0.82, "learning_rate": 8.937733025945445e-06, "loss": 2.319, "step": 470930 }, { "epoch": 0.82, "learning_rate": 8.936861086018617e-06, "loss": 2.2566, "step": 470940 }, { "epoch": 0.82, "learning_rate": 8.935989146091791e-06, "loss": 2.3097, "step": 470950 }, { "epoch": 0.82, "learning_rate": 8.935117206164963e-06, "loss": 2.3286, "step": 470960 }, { "epoch": 0.82, "learning_rate": 8.934245266238139e-06, "loss": 2.1769, "step": 470970 }, { "epoch": 0.82, "learning_rate": 8.93337332631131e-06, "loss": 2.3341, "step": 470980 }, { "epoch": 0.82, "learning_rate": 8.932501386384485e-06, "loss": 2.2833, "step": 470990 }, { "epoch": 0.82, "learning_rate": 8.931629446457657e-06, "loss": 2.2434, "step": 471000 }, { "epoch": 0.82, "learning_rate": 8.93075750653083e-06, "loss": 2.2825, "step": 471010 }, { "epoch": 0.82, "learning_rate": 8.929885566604004e-06, "loss": 2.4669, "step": 471020 }, { "epoch": 0.82, "learning_rate": 8.929013626677176e-06, "loss": 2.3058, "step": 471030 }, { "epoch": 0.82, "learning_rate": 8.92814168675035e-06, "loss": 2.335, "step": 471040 }, { "epoch": 0.82, "learning_rate": 8.927269746823524e-06, "loss": 2.2128, "step": 471050 }, { "epoch": 0.82, "learning_rate": 8.926397806896698e-06, "loss": 2.2126, "step": 471060 }, { "epoch": 0.82, "learning_rate": 8.92552586696987e-06, "loss": 2.4059, "step": 471070 }, { "epoch": 0.82, "learning_rate": 8.924653927043043e-06, "loss": 2.2983, "step": 471080 }, { "epoch": 0.82, "learning_rate": 8.923781987116215e-06, "loss": 2.2213, "step": 471090 }, { "epoch": 0.82, "learning_rate": 8.92291004718939e-06, "loss": 2.404, "step": 471100 }, { "epoch": 0.82, "learning_rate": 8.922038107262561e-06, "loss": 2.3648, "step": 471110 }, { "epoch": 0.82, "learning_rate": 8.921166167335735e-06, "loss": 2.4046, "step": 471120 }, { "epoch": 0.82, "learning_rate": 8.920294227408909e-06, "loss": 2.2552, "step": 471130 }, { "epoch": 0.82, "learning_rate": 8.919422287482083e-06, "loss": 2.2658, "step": 471140 }, { "epoch": 0.82, "learning_rate": 8.918550347555256e-06, "loss": 2.3318, "step": 471150 }, { "epoch": 0.82, "learning_rate": 8.917678407628428e-06, "loss": 2.3344, "step": 471160 }, { "epoch": 0.82, "learning_rate": 8.916806467701602e-06, "loss": 2.2483, "step": 471170 }, { "epoch": 0.82, "learning_rate": 8.915934527774774e-06, "loss": 2.2124, "step": 471180 }, { "epoch": 0.82, "learning_rate": 8.915062587847948e-06, "loss": 2.2035, "step": 471190 }, { "epoch": 0.82, "learning_rate": 8.91419064792112e-06, "loss": 2.273, "step": 471200 }, { "epoch": 0.82, "learning_rate": 8.913318707994296e-06, "loss": 2.2498, "step": 471210 }, { "epoch": 0.82, "learning_rate": 8.912446768067468e-06, "loss": 2.2782, "step": 471220 }, { "epoch": 0.82, "learning_rate": 8.911574828140641e-06, "loss": 2.2999, "step": 471230 }, { "epoch": 0.82, "learning_rate": 8.910702888213814e-06, "loss": 2.2641, "step": 471240 }, { "epoch": 0.82, "learning_rate": 8.909830948286987e-06, "loss": 2.2904, "step": 471250 }, { "epoch": 0.82, "learning_rate": 8.90895900836016e-06, "loss": 2.2144, "step": 471260 }, { "epoch": 0.82, "learning_rate": 8.908087068433333e-06, "loss": 2.3191, "step": 471270 }, { "epoch": 0.82, "learning_rate": 8.907215128506507e-06, "loss": 2.2279, "step": 471280 }, { "epoch": 0.82, "learning_rate": 8.90634318857968e-06, "loss": 2.2864, "step": 471290 }, { "epoch": 0.82, "learning_rate": 8.905471248652854e-06, "loss": 2.2683, "step": 471300 }, { "epoch": 0.82, "learning_rate": 8.904599308726027e-06, "loss": 2.3209, "step": 471310 }, { "epoch": 0.82, "learning_rate": 8.9037273687992e-06, "loss": 2.1913, "step": 471320 }, { "epoch": 0.82, "learning_rate": 8.902855428872372e-06, "loss": 2.2909, "step": 471330 }, { "epoch": 0.82, "learning_rate": 8.901983488945546e-06, "loss": 2.3134, "step": 471340 }, { "epoch": 0.82, "learning_rate": 8.901111549018718e-06, "loss": 2.3285, "step": 471350 }, { "epoch": 0.82, "learning_rate": 8.900239609091892e-06, "loss": 2.332, "step": 471360 }, { "epoch": 0.82, "learning_rate": 8.899367669165066e-06, "loss": 2.3341, "step": 471370 }, { "epoch": 0.82, "learning_rate": 8.89849572923824e-06, "loss": 2.3178, "step": 471380 }, { "epoch": 0.82, "learning_rate": 8.897623789311412e-06, "loss": 2.3041, "step": 471390 }, { "epoch": 0.82, "learning_rate": 8.896751849384585e-06, "loss": 2.2676, "step": 471400 }, { "epoch": 0.82, "learning_rate": 8.895879909457757e-06, "loss": 2.1747, "step": 471410 }, { "epoch": 0.82, "learning_rate": 8.895007969530931e-06, "loss": 2.2763, "step": 471420 }, { "epoch": 0.82, "learning_rate": 8.894136029604105e-06, "loss": 2.308, "step": 471430 }, { "epoch": 0.82, "learning_rate": 8.893264089677277e-06, "loss": 2.242, "step": 471440 }, { "epoch": 0.82, "learning_rate": 8.892392149750453e-06, "loss": 2.2644, "step": 471450 }, { "epoch": 0.82, "learning_rate": 8.891520209823625e-06, "loss": 2.2862, "step": 471460 }, { "epoch": 0.82, "learning_rate": 8.890648269896798e-06, "loss": 2.231, "step": 471470 }, { "epoch": 0.82, "learning_rate": 8.88977632996997e-06, "loss": 2.3539, "step": 471480 }, { "epoch": 0.82, "learning_rate": 8.888904390043144e-06, "loss": 2.2294, "step": 471490 }, { "epoch": 0.82, "learning_rate": 8.888032450116316e-06, "loss": 2.2691, "step": 471500 }, { "epoch": 0.82, "learning_rate": 8.88716051018949e-06, "loss": 2.2838, "step": 471510 }, { "epoch": 0.82, "learning_rate": 8.886288570262664e-06, "loss": 2.294, "step": 471520 }, { "epoch": 0.82, "learning_rate": 8.885416630335838e-06, "loss": 2.4322, "step": 471530 }, { "epoch": 0.82, "learning_rate": 8.88454469040901e-06, "loss": 2.2711, "step": 471540 }, { "epoch": 0.82, "learning_rate": 8.883672750482183e-06, "loss": 2.3326, "step": 471550 }, { "epoch": 0.82, "learning_rate": 8.882800810555357e-06, "loss": 2.2436, "step": 471560 }, { "epoch": 0.82, "learning_rate": 8.88192887062853e-06, "loss": 2.2051, "step": 471570 }, { "epoch": 0.82, "learning_rate": 8.881056930701703e-06, "loss": 2.2299, "step": 471580 }, { "epoch": 0.82, "learning_rate": 8.880184990774875e-06, "loss": 2.249, "step": 471590 }, { "epoch": 0.82, "learning_rate": 8.879313050848049e-06, "loss": 2.1782, "step": 471600 }, { "epoch": 0.82, "learning_rate": 8.878441110921223e-06, "loss": 2.2804, "step": 471610 }, { "epoch": 0.82, "learning_rate": 8.877569170994396e-06, "loss": 2.2128, "step": 471620 }, { "epoch": 0.82, "learning_rate": 8.876697231067569e-06, "loss": 2.3252, "step": 471630 }, { "epoch": 0.82, "learning_rate": 8.875825291140742e-06, "loss": 2.1941, "step": 471640 }, { "epoch": 0.82, "learning_rate": 8.874953351213914e-06, "loss": 2.2615, "step": 471650 }, { "epoch": 0.82, "learning_rate": 8.874081411287088e-06, "loss": 2.2403, "step": 471660 }, { "epoch": 0.82, "learning_rate": 8.87320947136026e-06, "loss": 2.3557, "step": 471670 }, { "epoch": 0.82, "learning_rate": 8.872337531433434e-06, "loss": 2.4232, "step": 471680 }, { "epoch": 0.82, "learning_rate": 8.871465591506608e-06, "loss": 2.2799, "step": 471690 }, { "epoch": 0.82, "learning_rate": 8.870593651579782e-06, "loss": 2.3174, "step": 471700 }, { "epoch": 0.82, "learning_rate": 8.869721711652955e-06, "loss": 2.2411, "step": 471710 }, { "epoch": 0.82, "learning_rate": 8.868849771726127e-06, "loss": 2.2739, "step": 471720 }, { "epoch": 0.82, "learning_rate": 8.867977831799301e-06, "loss": 2.3006, "step": 471730 }, { "epoch": 0.82, "learning_rate": 8.867105891872473e-06, "loss": 2.349, "step": 471740 }, { "epoch": 0.82, "learning_rate": 8.866233951945647e-06, "loss": 2.257, "step": 471750 }, { "epoch": 0.82, "learning_rate": 8.86536201201882e-06, "loss": 2.2719, "step": 471760 }, { "epoch": 0.82, "learning_rate": 8.864490072091995e-06, "loss": 2.2428, "step": 471770 }, { "epoch": 0.82, "learning_rate": 8.863618132165167e-06, "loss": 2.2253, "step": 471780 }, { "epoch": 0.82, "learning_rate": 8.86274619223834e-06, "loss": 2.2227, "step": 471790 }, { "epoch": 0.82, "learning_rate": 8.861874252311512e-06, "loss": 2.2898, "step": 471800 }, { "epoch": 0.82, "learning_rate": 8.861002312384686e-06, "loss": 2.282, "step": 471810 }, { "epoch": 0.82, "learning_rate": 8.86013037245786e-06, "loss": 2.2486, "step": 471820 }, { "epoch": 0.82, "learning_rate": 8.859258432531032e-06, "loss": 2.2055, "step": 471830 }, { "epoch": 0.82, "learning_rate": 8.858386492604206e-06, "loss": 2.255, "step": 471840 }, { "epoch": 0.82, "learning_rate": 8.85751455267738e-06, "loss": 2.3003, "step": 471850 }, { "epoch": 0.82, "learning_rate": 8.856642612750553e-06, "loss": 2.2249, "step": 471860 }, { "epoch": 0.82, "learning_rate": 8.855770672823725e-06, "loss": 2.2975, "step": 471870 }, { "epoch": 0.82, "learning_rate": 8.8548987328969e-06, "loss": 2.2491, "step": 471880 }, { "epoch": 0.82, "learning_rate": 8.854026792970071e-06, "loss": 2.2417, "step": 471890 }, { "epoch": 0.82, "learning_rate": 8.853154853043245e-06, "loss": 2.311, "step": 471900 }, { "epoch": 0.82, "learning_rate": 8.852282913116417e-06, "loss": 2.4047, "step": 471910 }, { "epoch": 0.82, "learning_rate": 8.851410973189591e-06, "loss": 2.1646, "step": 471920 }, { "epoch": 0.82, "learning_rate": 8.850539033262765e-06, "loss": 2.2263, "step": 471930 }, { "epoch": 0.82, "learning_rate": 8.849667093335938e-06, "loss": 2.2196, "step": 471940 }, { "epoch": 0.82, "learning_rate": 8.848795153409112e-06, "loss": 2.2458, "step": 471950 }, { "epoch": 0.82, "learning_rate": 8.847923213482284e-06, "loss": 2.2693, "step": 471960 }, { "epoch": 0.82, "learning_rate": 8.847051273555458e-06, "loss": 2.1565, "step": 471970 }, { "epoch": 0.82, "learning_rate": 8.84617933362863e-06, "loss": 2.2372, "step": 471980 }, { "epoch": 0.82, "learning_rate": 8.845307393701804e-06, "loss": 2.2522, "step": 471990 }, { "epoch": 0.82, "learning_rate": 8.844435453774976e-06, "loss": 2.2716, "step": 472000 }, { "epoch": 0.82, "learning_rate": 8.843563513848151e-06, "loss": 2.1835, "step": 472010 }, { "epoch": 0.82, "learning_rate": 8.842691573921324e-06, "loss": 2.3335, "step": 472020 }, { "epoch": 0.82, "learning_rate": 8.841819633994497e-06, "loss": 2.2544, "step": 472030 }, { "epoch": 0.82, "learning_rate": 8.84094769406767e-06, "loss": 2.0631, "step": 472040 }, { "epoch": 0.82, "learning_rate": 8.840075754140843e-06, "loss": 2.2578, "step": 472050 }, { "epoch": 0.82, "learning_rate": 8.839203814214015e-06, "loss": 2.2897, "step": 472060 }, { "epoch": 0.82, "learning_rate": 8.838331874287189e-06, "loss": 2.2173, "step": 472070 }, { "epoch": 0.82, "learning_rate": 8.837459934360363e-06, "loss": 2.3199, "step": 472080 }, { "epoch": 0.82, "learning_rate": 8.836587994433537e-06, "loss": 2.0896, "step": 472090 }, { "epoch": 0.82, "learning_rate": 8.83571605450671e-06, "loss": 2.3811, "step": 472100 }, { "epoch": 0.82, "learning_rate": 8.834844114579882e-06, "loss": 2.3085, "step": 472110 }, { "epoch": 0.82, "learning_rate": 8.833972174653056e-06, "loss": 2.1882, "step": 472120 }, { "epoch": 0.82, "learning_rate": 8.833100234726228e-06, "loss": 2.1766, "step": 472130 }, { "epoch": 0.82, "learning_rate": 8.832228294799402e-06, "loss": 2.282, "step": 472140 }, { "epoch": 0.82, "learning_rate": 8.831356354872574e-06, "loss": 2.2908, "step": 472150 }, { "epoch": 0.82, "learning_rate": 8.830484414945748e-06, "loss": 2.2969, "step": 472160 }, { "epoch": 0.82, "learning_rate": 8.829612475018922e-06, "loss": 2.1593, "step": 472170 }, { "epoch": 0.82, "learning_rate": 8.828740535092095e-06, "loss": 2.3283, "step": 472180 }, { "epoch": 0.82, "learning_rate": 8.827868595165267e-06, "loss": 2.2766, "step": 472190 }, { "epoch": 0.82, "learning_rate": 8.826996655238441e-06, "loss": 2.2491, "step": 472200 }, { "epoch": 0.82, "learning_rate": 8.826124715311615e-06, "loss": 2.1119, "step": 472210 }, { "epoch": 0.82, "learning_rate": 8.825252775384787e-06, "loss": 2.2319, "step": 472220 }, { "epoch": 0.82, "learning_rate": 8.824380835457961e-06, "loss": 2.2156, "step": 472230 }, { "epoch": 0.82, "learning_rate": 8.823508895531133e-06, "loss": 2.2734, "step": 472240 }, { "epoch": 0.82, "learning_rate": 8.822636955604308e-06, "loss": 2.2617, "step": 472250 }, { "epoch": 0.82, "learning_rate": 8.82176501567748e-06, "loss": 2.3756, "step": 472260 }, { "epoch": 0.82, "learning_rate": 8.820893075750654e-06, "loss": 2.2669, "step": 472270 }, { "epoch": 0.82, "learning_rate": 8.820021135823826e-06, "loss": 2.2141, "step": 472280 }, { "epoch": 0.82, "learning_rate": 8.819149195897e-06, "loss": 2.3312, "step": 472290 }, { "epoch": 0.82, "learning_rate": 8.818277255970172e-06, "loss": 2.236, "step": 472300 }, { "epoch": 0.82, "learning_rate": 8.817405316043346e-06, "loss": 2.2862, "step": 472310 }, { "epoch": 0.82, "learning_rate": 8.81653337611652e-06, "loss": 2.2771, "step": 472320 }, { "epoch": 0.82, "learning_rate": 8.815661436189693e-06, "loss": 2.3653, "step": 472330 }, { "epoch": 0.82, "learning_rate": 8.814789496262866e-06, "loss": 2.3246, "step": 472340 }, { "epoch": 0.82, "learning_rate": 8.81391755633604e-06, "loss": 2.2508, "step": 472350 }, { "epoch": 0.82, "learning_rate": 8.813045616409213e-06, "loss": 2.1967, "step": 472360 }, { "epoch": 0.82, "learning_rate": 8.812173676482385e-06, "loss": 2.295, "step": 472370 }, { "epoch": 0.82, "learning_rate": 8.811301736555559e-06, "loss": 2.2281, "step": 472380 }, { "epoch": 0.82, "learning_rate": 8.810429796628731e-06, "loss": 2.4232, "step": 472390 }, { "epoch": 0.82, "learning_rate": 8.809557856701905e-06, "loss": 2.3171, "step": 472400 }, { "epoch": 0.82, "learning_rate": 8.808685916775079e-06, "loss": 2.3097, "step": 472410 }, { "epoch": 0.82, "learning_rate": 8.807813976848252e-06, "loss": 2.2769, "step": 472420 }, { "epoch": 0.82, "learning_rate": 8.806942036921424e-06, "loss": 2.2512, "step": 472430 }, { "epoch": 0.82, "learning_rate": 8.806070096994598e-06, "loss": 2.1086, "step": 472440 }, { "epoch": 0.82, "learning_rate": 8.80519815706777e-06, "loss": 2.2715, "step": 472450 }, { "epoch": 0.82, "learning_rate": 8.804326217140944e-06, "loss": 2.2346, "step": 472460 }, { "epoch": 0.82, "learning_rate": 8.803454277214116e-06, "loss": 2.241, "step": 472470 }, { "epoch": 0.82, "learning_rate": 8.80258233728729e-06, "loss": 2.2152, "step": 472480 }, { "epoch": 0.82, "learning_rate": 8.801710397360465e-06, "loss": 2.3598, "step": 472490 }, { "epoch": 0.82, "learning_rate": 8.800838457433637e-06, "loss": 2.3448, "step": 472500 }, { "epoch": 0.82, "learning_rate": 8.799966517506811e-06, "loss": 2.2179, "step": 472510 }, { "epoch": 0.82, "learning_rate": 8.799094577579983e-06, "loss": 2.2606, "step": 472520 }, { "epoch": 0.82, "learning_rate": 8.798222637653157e-06, "loss": 2.2263, "step": 472530 }, { "epoch": 0.82, "learning_rate": 8.797350697726329e-06, "loss": 2.3012, "step": 472540 }, { "epoch": 0.82, "learning_rate": 8.796478757799503e-06, "loss": 2.3341, "step": 472550 }, { "epoch": 0.82, "learning_rate": 8.795606817872677e-06, "loss": 2.2671, "step": 472560 }, { "epoch": 0.82, "learning_rate": 8.79473487794585e-06, "loss": 2.3169, "step": 472570 }, { "epoch": 0.82, "learning_rate": 8.793862938019022e-06, "loss": 2.209, "step": 472580 }, { "epoch": 0.82, "learning_rate": 8.792990998092196e-06, "loss": 2.2451, "step": 472590 }, { "epoch": 0.82, "learning_rate": 8.792119058165368e-06, "loss": 2.3416, "step": 472600 }, { "epoch": 0.82, "learning_rate": 8.791247118238542e-06, "loss": 2.2436, "step": 472610 }, { "epoch": 0.82, "learning_rate": 8.790375178311716e-06, "loss": 2.2272, "step": 472620 }, { "epoch": 0.82, "learning_rate": 8.789503238384888e-06, "loss": 2.3204, "step": 472630 }, { "epoch": 0.82, "learning_rate": 8.788631298458062e-06, "loss": 2.3277, "step": 472640 }, { "epoch": 0.82, "learning_rate": 8.787759358531235e-06, "loss": 2.3039, "step": 472650 }, { "epoch": 0.82, "learning_rate": 8.78688741860441e-06, "loss": 2.3434, "step": 472660 }, { "epoch": 0.82, "learning_rate": 8.786015478677581e-06, "loss": 2.0666, "step": 472670 }, { "epoch": 0.82, "learning_rate": 8.785143538750755e-06, "loss": 2.2171, "step": 472680 }, { "epoch": 0.82, "learning_rate": 8.784271598823927e-06, "loss": 2.2484, "step": 472690 }, { "epoch": 0.82, "learning_rate": 8.783399658897101e-06, "loss": 2.2546, "step": 472700 }, { "epoch": 0.82, "learning_rate": 8.782527718970273e-06, "loss": 2.2835, "step": 472710 }, { "epoch": 0.82, "learning_rate": 8.781655779043447e-06, "loss": 2.3424, "step": 472720 }, { "epoch": 0.82, "learning_rate": 8.78078383911662e-06, "loss": 2.3057, "step": 472730 }, { "epoch": 0.82, "learning_rate": 8.779911899189794e-06, "loss": 2.3289, "step": 472740 }, { "epoch": 0.82, "learning_rate": 8.779039959262968e-06, "loss": 2.3475, "step": 472750 }, { "epoch": 0.82, "learning_rate": 8.77816801933614e-06, "loss": 2.302, "step": 472760 }, { "epoch": 0.82, "learning_rate": 8.777296079409314e-06, "loss": 2.1842, "step": 472770 }, { "epoch": 0.82, "learning_rate": 8.776424139482486e-06, "loss": 2.3026, "step": 472780 }, { "epoch": 0.82, "learning_rate": 8.77555219955566e-06, "loss": 2.1847, "step": 472790 }, { "epoch": 0.82, "learning_rate": 8.774680259628834e-06, "loss": 2.1981, "step": 472800 }, { "epoch": 0.82, "learning_rate": 8.773808319702007e-06, "loss": 2.2417, "step": 472810 }, { "epoch": 0.82, "learning_rate": 8.77293637977518e-06, "loss": 2.33, "step": 472820 }, { "epoch": 0.82, "learning_rate": 8.772064439848353e-06, "loss": 2.2675, "step": 472830 }, { "epoch": 0.82, "learning_rate": 8.771192499921525e-06, "loss": 2.3211, "step": 472840 }, { "epoch": 0.82, "learning_rate": 8.770320559994699e-06, "loss": 2.3442, "step": 472850 }, { "epoch": 0.82, "learning_rate": 8.769448620067871e-06, "loss": 2.2454, "step": 472860 }, { "epoch": 0.82, "learning_rate": 8.768576680141045e-06, "loss": 2.3064, "step": 472870 }, { "epoch": 0.82, "learning_rate": 8.767704740214219e-06, "loss": 2.2671, "step": 472880 }, { "epoch": 0.82, "learning_rate": 8.766832800287392e-06, "loss": 2.3659, "step": 472890 }, { "epoch": 0.82, "learning_rate": 8.765960860360566e-06, "loss": 2.3167, "step": 472900 }, { "epoch": 0.82, "learning_rate": 8.765088920433738e-06, "loss": 2.3219, "step": 472910 }, { "epoch": 0.82, "learning_rate": 8.764216980506912e-06, "loss": 2.3309, "step": 472920 }, { "epoch": 0.82, "learning_rate": 8.763345040580084e-06, "loss": 2.4069, "step": 472930 }, { "epoch": 0.82, "learning_rate": 8.762473100653258e-06, "loss": 2.2254, "step": 472940 }, { "epoch": 0.82, "learning_rate": 8.76160116072643e-06, "loss": 2.4111, "step": 472950 }, { "epoch": 0.82, "learning_rate": 8.760729220799604e-06, "loss": 2.0802, "step": 472960 }, { "epoch": 0.82, "learning_rate": 8.759857280872777e-06, "loss": 2.2118, "step": 472970 }, { "epoch": 0.82, "learning_rate": 8.758985340945951e-06, "loss": 2.2344, "step": 472980 }, { "epoch": 0.82, "learning_rate": 8.758113401019123e-06, "loss": 2.1901, "step": 472990 }, { "epoch": 0.82, "learning_rate": 8.757241461092297e-06, "loss": 2.348, "step": 473000 }, { "epoch": 0.82, "learning_rate": 8.756369521165471e-06, "loss": 2.3072, "step": 473010 }, { "epoch": 0.82, "learning_rate": 8.755497581238643e-06, "loss": 2.2443, "step": 473020 }, { "epoch": 0.82, "learning_rate": 8.754625641311817e-06, "loss": 2.198, "step": 473030 }, { "epoch": 0.82, "learning_rate": 8.753753701384989e-06, "loss": 2.3734, "step": 473040 }, { "epoch": 0.82, "learning_rate": 8.752881761458164e-06, "loss": 2.1635, "step": 473050 }, { "epoch": 0.82, "learning_rate": 8.752009821531336e-06, "loss": 2.2393, "step": 473060 }, { "epoch": 0.82, "learning_rate": 8.75113788160451e-06, "loss": 2.3384, "step": 473070 }, { "epoch": 0.82, "learning_rate": 8.750265941677682e-06, "loss": 2.3154, "step": 473080 }, { "epoch": 0.83, "learning_rate": 8.749394001750856e-06, "loss": 2.284, "step": 473090 }, { "epoch": 0.83, "learning_rate": 8.748522061824028e-06, "loss": 2.2767, "step": 473100 }, { "epoch": 0.83, "learning_rate": 8.747650121897202e-06, "loss": 2.334, "step": 473110 }, { "epoch": 0.83, "learning_rate": 8.746778181970376e-06, "loss": 2.3093, "step": 473120 }, { "epoch": 0.83, "learning_rate": 8.74590624204355e-06, "loss": 2.2224, "step": 473130 }, { "epoch": 0.83, "learning_rate": 8.745034302116723e-06, "loss": 2.3021, "step": 473140 }, { "epoch": 0.83, "learning_rate": 8.744162362189895e-06, "loss": 2.1875, "step": 473150 }, { "epoch": 0.83, "learning_rate": 8.743290422263069e-06, "loss": 2.4325, "step": 473160 }, { "epoch": 0.83, "learning_rate": 8.742418482336241e-06, "loss": 2.0798, "step": 473170 }, { "epoch": 0.83, "learning_rate": 8.741546542409415e-06, "loss": 2.3246, "step": 473180 }, { "epoch": 0.83, "learning_rate": 8.740674602482587e-06, "loss": 2.2373, "step": 473190 }, { "epoch": 0.83, "learning_rate": 8.73980266255576e-06, "loss": 2.3055, "step": 473200 }, { "epoch": 0.83, "learning_rate": 8.738930722628934e-06, "loss": 2.2463, "step": 473210 }, { "epoch": 0.83, "learning_rate": 8.738058782702108e-06, "loss": 2.2724, "step": 473220 }, { "epoch": 0.83, "learning_rate": 8.73718684277528e-06, "loss": 2.2593, "step": 473230 }, { "epoch": 0.83, "learning_rate": 8.736314902848454e-06, "loss": 2.3198, "step": 473240 }, { "epoch": 0.83, "learning_rate": 8.735442962921626e-06, "loss": 2.4139, "step": 473250 }, { "epoch": 0.83, "learning_rate": 8.7345710229948e-06, "loss": 2.3379, "step": 473260 }, { "epoch": 0.83, "learning_rate": 8.733699083067972e-06, "loss": 2.3872, "step": 473270 }, { "epoch": 0.83, "learning_rate": 8.732827143141146e-06, "loss": 2.3133, "step": 473280 }, { "epoch": 0.83, "learning_rate": 8.731955203214321e-06, "loss": 2.235, "step": 473290 }, { "epoch": 0.83, "learning_rate": 8.731083263287493e-06, "loss": 2.1817, "step": 473300 }, { "epoch": 0.83, "learning_rate": 8.730211323360667e-06, "loss": 2.3015, "step": 473310 }, { "epoch": 0.83, "learning_rate": 8.729339383433839e-06, "loss": 2.2643, "step": 473320 }, { "epoch": 0.83, "learning_rate": 8.728467443507013e-06, "loss": 2.212, "step": 473330 }, { "epoch": 0.83, "learning_rate": 8.727595503580185e-06, "loss": 2.2544, "step": 473340 }, { "epoch": 0.83, "learning_rate": 8.726723563653359e-06, "loss": 2.2347, "step": 473350 }, { "epoch": 0.83, "learning_rate": 8.725851623726532e-06, "loss": 2.2856, "step": 473360 }, { "epoch": 0.83, "learning_rate": 8.724979683799706e-06, "loss": 2.2959, "step": 473370 }, { "epoch": 0.83, "learning_rate": 8.724107743872878e-06, "loss": 2.2593, "step": 473380 }, { "epoch": 0.83, "learning_rate": 8.723235803946052e-06, "loss": 2.3605, "step": 473390 }, { "epoch": 0.83, "learning_rate": 8.722363864019224e-06, "loss": 2.298, "step": 473400 }, { "epoch": 0.83, "learning_rate": 8.721491924092398e-06, "loss": 2.2265, "step": 473410 }, { "epoch": 0.83, "learning_rate": 8.720619984165572e-06, "loss": 2.1581, "step": 473420 }, { "epoch": 0.83, "learning_rate": 8.719748044238744e-06, "loss": 2.2321, "step": 473430 }, { "epoch": 0.83, "learning_rate": 8.718876104311918e-06, "loss": 2.3267, "step": 473440 }, { "epoch": 0.83, "learning_rate": 8.718004164385091e-06, "loss": 2.126, "step": 473450 }, { "epoch": 0.83, "learning_rate": 8.717132224458265e-06, "loss": 2.3792, "step": 473460 }, { "epoch": 0.83, "learning_rate": 8.716260284531437e-06, "loss": 2.23, "step": 473470 }, { "epoch": 0.83, "learning_rate": 8.715388344604611e-06, "loss": 2.2308, "step": 473480 }, { "epoch": 0.83, "learning_rate": 8.714516404677783e-06, "loss": 2.3047, "step": 473490 }, { "epoch": 0.83, "learning_rate": 8.713644464750957e-06, "loss": 2.2308, "step": 473500 }, { "epoch": 0.83, "learning_rate": 8.712772524824129e-06, "loss": 2.2924, "step": 473510 }, { "epoch": 0.83, "learning_rate": 8.711900584897303e-06, "loss": 2.1755, "step": 473520 }, { "epoch": 0.83, "learning_rate": 8.711028644970476e-06, "loss": 2.1875, "step": 473530 }, { "epoch": 0.83, "learning_rate": 8.71015670504365e-06, "loss": 2.3021, "step": 473540 }, { "epoch": 0.83, "learning_rate": 8.709284765116824e-06, "loss": 2.4189, "step": 473550 }, { "epoch": 0.83, "learning_rate": 8.708412825189996e-06, "loss": 2.3308, "step": 473560 }, { "epoch": 0.83, "learning_rate": 8.70754088526317e-06, "loss": 2.265, "step": 473570 }, { "epoch": 0.83, "learning_rate": 8.706668945336342e-06, "loss": 2.341, "step": 473580 }, { "epoch": 0.83, "learning_rate": 8.705797005409516e-06, "loss": 2.3446, "step": 473590 }, { "epoch": 0.83, "learning_rate": 8.70492506548269e-06, "loss": 2.3117, "step": 473600 }, { "epoch": 0.83, "learning_rate": 8.704053125555863e-06, "loss": 2.3387, "step": 473610 }, { "epoch": 0.83, "learning_rate": 8.703181185629035e-06, "loss": 2.3223, "step": 473620 }, { "epoch": 0.83, "learning_rate": 8.702309245702209e-06, "loss": 2.4142, "step": 473630 }, { "epoch": 0.83, "learning_rate": 8.701437305775381e-06, "loss": 2.2522, "step": 473640 }, { "epoch": 0.83, "learning_rate": 8.700565365848555e-06, "loss": 2.3146, "step": 473650 }, { "epoch": 0.83, "learning_rate": 8.699693425921727e-06, "loss": 2.361, "step": 473660 }, { "epoch": 0.83, "learning_rate": 8.6988214859949e-06, "loss": 2.3237, "step": 473670 }, { "epoch": 0.83, "learning_rate": 8.697949546068074e-06, "loss": 2.2429, "step": 473680 }, { "epoch": 0.83, "learning_rate": 8.697077606141248e-06, "loss": 2.3159, "step": 473690 }, { "epoch": 0.83, "learning_rate": 8.696205666214422e-06, "loss": 2.2631, "step": 473700 }, { "epoch": 0.83, "learning_rate": 8.695333726287594e-06, "loss": 2.29, "step": 473710 }, { "epoch": 0.83, "learning_rate": 8.694461786360768e-06, "loss": 2.2799, "step": 473720 }, { "epoch": 0.83, "learning_rate": 8.69358984643394e-06, "loss": 2.2509, "step": 473730 }, { "epoch": 0.83, "learning_rate": 8.692717906507114e-06, "loss": 2.2368, "step": 473740 }, { "epoch": 0.83, "learning_rate": 8.691845966580286e-06, "loss": 2.2955, "step": 473750 }, { "epoch": 0.83, "learning_rate": 8.69097402665346e-06, "loss": 2.2577, "step": 473760 }, { "epoch": 0.83, "learning_rate": 8.690102086726633e-06, "loss": 2.2942, "step": 473770 }, { "epoch": 0.83, "learning_rate": 8.689230146799807e-06, "loss": 2.3312, "step": 473780 }, { "epoch": 0.83, "learning_rate": 8.68835820687298e-06, "loss": 2.3195, "step": 473790 }, { "epoch": 0.83, "learning_rate": 8.687486266946153e-06, "loss": 2.2619, "step": 473800 }, { "epoch": 0.83, "learning_rate": 8.686614327019327e-06, "loss": 2.2416, "step": 473810 }, { "epoch": 0.83, "learning_rate": 8.685742387092499e-06, "loss": 2.2516, "step": 473820 }, { "epoch": 0.83, "learning_rate": 8.684870447165673e-06, "loss": 2.2919, "step": 473830 }, { "epoch": 0.83, "learning_rate": 8.683998507238846e-06, "loss": 2.3816, "step": 473840 }, { "epoch": 0.83, "learning_rate": 8.68312656731202e-06, "loss": 2.289, "step": 473850 }, { "epoch": 0.83, "learning_rate": 8.682254627385192e-06, "loss": 2.0979, "step": 473860 }, { "epoch": 0.83, "learning_rate": 8.681382687458366e-06, "loss": 2.2731, "step": 473870 }, { "epoch": 0.83, "learning_rate": 8.680510747531538e-06, "loss": 2.2459, "step": 473880 }, { "epoch": 0.83, "learning_rate": 8.679638807604712e-06, "loss": 2.4282, "step": 473890 }, { "epoch": 0.83, "learning_rate": 8.678766867677884e-06, "loss": 2.2064, "step": 473900 }, { "epoch": 0.83, "learning_rate": 8.677894927751058e-06, "loss": 2.2929, "step": 473910 }, { "epoch": 0.83, "learning_rate": 8.677022987824231e-06, "loss": 2.2592, "step": 473920 }, { "epoch": 0.83, "learning_rate": 8.676151047897405e-06, "loss": 2.2651, "step": 473930 }, { "epoch": 0.83, "learning_rate": 8.675279107970579e-06, "loss": 2.4204, "step": 473940 }, { "epoch": 0.83, "learning_rate": 8.674407168043751e-06, "loss": 2.3052, "step": 473950 }, { "epoch": 0.83, "learning_rate": 8.673535228116925e-06, "loss": 2.1808, "step": 473960 }, { "epoch": 0.83, "learning_rate": 8.672663288190097e-06, "loss": 2.2218, "step": 473970 }, { "epoch": 0.83, "learning_rate": 8.67179134826327e-06, "loss": 2.2774, "step": 473980 }, { "epoch": 0.83, "learning_rate": 8.670919408336443e-06, "loss": 2.2504, "step": 473990 }, { "epoch": 0.83, "learning_rate": 8.670047468409616e-06, "loss": 2.33, "step": 474000 }, { "epoch": 0.83, "learning_rate": 8.66917552848279e-06, "loss": 2.2848, "step": 474010 }, { "epoch": 0.83, "learning_rate": 8.668303588555964e-06, "loss": 2.4561, "step": 474020 }, { "epoch": 0.83, "learning_rate": 8.667431648629136e-06, "loss": 2.1958, "step": 474030 }, { "epoch": 0.83, "learning_rate": 8.66655970870231e-06, "loss": 2.3182, "step": 474040 }, { "epoch": 0.83, "learning_rate": 8.665687768775482e-06, "loss": 2.2682, "step": 474050 }, { "epoch": 0.83, "learning_rate": 8.664815828848656e-06, "loss": 2.1698, "step": 474060 }, { "epoch": 0.83, "learning_rate": 8.663943888921828e-06, "loss": 2.3929, "step": 474070 }, { "epoch": 0.83, "learning_rate": 8.663071948995003e-06, "loss": 2.325, "step": 474080 }, { "epoch": 0.83, "learning_rate": 8.662200009068177e-06, "loss": 2.3225, "step": 474090 }, { "epoch": 0.83, "learning_rate": 8.661328069141349e-06, "loss": 2.272, "step": 474100 }, { "epoch": 0.83, "learning_rate": 8.660456129214523e-06, "loss": 2.3747, "step": 474110 }, { "epoch": 0.83, "learning_rate": 8.659584189287695e-06, "loss": 2.1435, "step": 474120 }, { "epoch": 0.83, "learning_rate": 8.658712249360869e-06, "loss": 2.2887, "step": 474130 }, { "epoch": 0.83, "learning_rate": 8.65784030943404e-06, "loss": 2.3187, "step": 474140 }, { "epoch": 0.83, "learning_rate": 8.656968369507215e-06, "loss": 2.3637, "step": 474150 }, { "epoch": 0.83, "learning_rate": 8.656096429580388e-06, "loss": 2.345, "step": 474160 }, { "epoch": 0.83, "learning_rate": 8.655224489653562e-06, "loss": 2.2283, "step": 474170 }, { "epoch": 0.83, "learning_rate": 8.654352549726734e-06, "loss": 2.3356, "step": 474180 }, { "epoch": 0.83, "learning_rate": 8.653480609799908e-06, "loss": 2.2574, "step": 474190 }, { "epoch": 0.83, "learning_rate": 8.65260866987308e-06, "loss": 2.2217, "step": 474200 }, { "epoch": 0.83, "learning_rate": 8.651736729946254e-06, "loss": 2.3214, "step": 474210 }, { "epoch": 0.83, "learning_rate": 8.650864790019428e-06, "loss": 2.0708, "step": 474220 }, { "epoch": 0.83, "learning_rate": 8.6499928500926e-06, "loss": 2.3049, "step": 474230 }, { "epoch": 0.83, "learning_rate": 8.649120910165773e-06, "loss": 2.352, "step": 474240 }, { "epoch": 0.83, "learning_rate": 8.648248970238947e-06, "loss": 2.2065, "step": 474250 }, { "epoch": 0.83, "learning_rate": 8.647377030312121e-06, "loss": 2.3317, "step": 474260 }, { "epoch": 0.83, "learning_rate": 8.646505090385293e-06, "loss": 2.3289, "step": 474270 }, { "epoch": 0.83, "learning_rate": 8.645633150458467e-06, "loss": 2.2559, "step": 474280 }, { "epoch": 0.83, "learning_rate": 8.644761210531639e-06, "loss": 2.2624, "step": 474290 }, { "epoch": 0.83, "learning_rate": 8.643889270604813e-06, "loss": 2.2222, "step": 474300 }, { "epoch": 0.83, "learning_rate": 8.643017330677985e-06, "loss": 2.2371, "step": 474310 }, { "epoch": 0.83, "learning_rate": 8.642145390751158e-06, "loss": 2.2456, "step": 474320 }, { "epoch": 0.83, "learning_rate": 8.641273450824332e-06, "loss": 2.3452, "step": 474330 }, { "epoch": 0.83, "learning_rate": 8.640401510897506e-06, "loss": 2.3426, "step": 474340 }, { "epoch": 0.83, "learning_rate": 8.63952957097068e-06, "loss": 2.2748, "step": 474350 }, { "epoch": 0.83, "learning_rate": 8.638657631043852e-06, "loss": 2.2546, "step": 474360 }, { "epoch": 0.83, "learning_rate": 8.637785691117026e-06, "loss": 2.343, "step": 474370 }, { "epoch": 0.83, "learning_rate": 8.636913751190198e-06, "loss": 2.1966, "step": 474380 }, { "epoch": 0.83, "learning_rate": 8.636041811263371e-06, "loss": 2.3095, "step": 474390 }, { "epoch": 0.83, "learning_rate": 8.635169871336545e-06, "loss": 2.3294, "step": 474400 }, { "epoch": 0.83, "learning_rate": 8.634297931409719e-06, "loss": 2.2324, "step": 474410 }, { "epoch": 0.83, "learning_rate": 8.633425991482891e-06, "loss": 2.2627, "step": 474420 }, { "epoch": 0.83, "learning_rate": 8.632554051556065e-06, "loss": 2.313, "step": 474430 }, { "epoch": 0.83, "learning_rate": 8.631682111629237e-06, "loss": 2.3272, "step": 474440 }, { "epoch": 0.83, "learning_rate": 8.63081017170241e-06, "loss": 2.1803, "step": 474450 }, { "epoch": 0.83, "learning_rate": 8.629938231775583e-06, "loss": 2.2687, "step": 474460 }, { "epoch": 0.83, "learning_rate": 8.629066291848757e-06, "loss": 2.4158, "step": 474470 }, { "epoch": 0.83, "learning_rate": 8.62819435192193e-06, "loss": 2.2124, "step": 474480 }, { "epoch": 0.83, "learning_rate": 8.627322411995104e-06, "loss": 2.3736, "step": 474490 }, { "epoch": 0.83, "learning_rate": 8.626450472068278e-06, "loss": 2.3262, "step": 474500 }, { "epoch": 0.83, "learning_rate": 8.62557853214145e-06, "loss": 2.2829, "step": 474510 }, { "epoch": 0.83, "learning_rate": 8.624706592214624e-06, "loss": 2.2813, "step": 474520 }, { "epoch": 0.83, "learning_rate": 8.623834652287796e-06, "loss": 2.2777, "step": 474530 }, { "epoch": 0.83, "learning_rate": 8.62296271236097e-06, "loss": 2.3042, "step": 474540 }, { "epoch": 0.83, "learning_rate": 8.622090772434142e-06, "loss": 2.3596, "step": 474550 }, { "epoch": 0.83, "learning_rate": 8.621218832507315e-06, "loss": 2.2862, "step": 474560 }, { "epoch": 0.83, "learning_rate": 8.62034689258049e-06, "loss": 2.2222, "step": 474570 }, { "epoch": 0.83, "learning_rate": 8.619474952653663e-06, "loss": 2.1906, "step": 474580 }, { "epoch": 0.83, "learning_rate": 8.618603012726835e-06, "loss": 2.2666, "step": 474590 }, { "epoch": 0.83, "learning_rate": 8.617731072800009e-06, "loss": 2.2868, "step": 474600 }, { "epoch": 0.83, "learning_rate": 8.616859132873183e-06, "loss": 2.1968, "step": 474610 }, { "epoch": 0.83, "learning_rate": 8.615987192946355e-06, "loss": 2.3888, "step": 474620 }, { "epoch": 0.83, "learning_rate": 8.615115253019528e-06, "loss": 2.3294, "step": 474630 }, { "epoch": 0.83, "learning_rate": 8.614243313092702e-06, "loss": 2.3118, "step": 474640 }, { "epoch": 0.83, "learning_rate": 8.613371373165876e-06, "loss": 2.3182, "step": 474650 }, { "epoch": 0.83, "learning_rate": 8.612499433239048e-06, "loss": 2.3277, "step": 474660 }, { "epoch": 0.83, "learning_rate": 8.611627493312222e-06, "loss": 2.2815, "step": 474670 }, { "epoch": 0.83, "learning_rate": 8.610755553385394e-06, "loss": 2.3162, "step": 474680 }, { "epoch": 0.83, "learning_rate": 8.609883613458568e-06, "loss": 2.1328, "step": 474690 }, { "epoch": 0.83, "learning_rate": 8.60901167353174e-06, "loss": 2.2592, "step": 474700 }, { "epoch": 0.83, "learning_rate": 8.608139733604913e-06, "loss": 2.2275, "step": 474710 }, { "epoch": 0.83, "learning_rate": 8.607267793678087e-06, "loss": 2.2518, "step": 474720 }, { "epoch": 0.83, "learning_rate": 8.606395853751261e-06, "loss": 2.2649, "step": 474730 }, { "epoch": 0.83, "learning_rate": 8.605523913824435e-06, "loss": 2.2123, "step": 474740 }, { "epoch": 0.83, "learning_rate": 8.604651973897607e-06, "loss": 2.164, "step": 474750 }, { "epoch": 0.83, "learning_rate": 8.60378003397078e-06, "loss": 2.3776, "step": 474760 }, { "epoch": 0.83, "learning_rate": 8.602908094043953e-06, "loss": 2.3796, "step": 474770 }, { "epoch": 0.83, "learning_rate": 8.602036154117126e-06, "loss": 2.298, "step": 474780 }, { "epoch": 0.83, "learning_rate": 8.601164214190299e-06, "loss": 2.2475, "step": 474790 }, { "epoch": 0.83, "learning_rate": 8.600292274263472e-06, "loss": 2.2053, "step": 474800 }, { "epoch": 0.83, "learning_rate": 8.599420334336646e-06, "loss": 2.2316, "step": 474810 }, { "epoch": 0.83, "learning_rate": 8.59854839440982e-06, "loss": 2.2286, "step": 474820 }, { "epoch": 0.83, "learning_rate": 8.597676454482992e-06, "loss": 2.2788, "step": 474830 }, { "epoch": 0.83, "learning_rate": 8.596804514556166e-06, "loss": 2.2521, "step": 474840 }, { "epoch": 0.83, "learning_rate": 8.595932574629338e-06, "loss": 2.2762, "step": 474850 }, { "epoch": 0.83, "learning_rate": 8.595060634702512e-06, "loss": 2.2473, "step": 474860 }, { "epoch": 0.83, "learning_rate": 8.594188694775685e-06, "loss": 2.3532, "step": 474870 }, { "epoch": 0.83, "learning_rate": 8.593316754848859e-06, "loss": 2.3074, "step": 474880 }, { "epoch": 0.83, "learning_rate": 8.592444814922033e-06, "loss": 2.1724, "step": 474890 }, { "epoch": 0.83, "learning_rate": 8.591572874995205e-06, "loss": 2.2228, "step": 474900 }, { "epoch": 0.83, "learning_rate": 8.590700935068379e-06, "loss": 2.3808, "step": 474910 }, { "epoch": 0.83, "learning_rate": 8.58982899514155e-06, "loss": 2.1605, "step": 474920 }, { "epoch": 0.83, "learning_rate": 8.588957055214725e-06, "loss": 2.2464, "step": 474930 }, { "epoch": 0.83, "learning_rate": 8.588085115287897e-06, "loss": 2.2621, "step": 474940 }, { "epoch": 0.83, "learning_rate": 8.58721317536107e-06, "loss": 2.3218, "step": 474950 }, { "epoch": 0.83, "learning_rate": 8.586341235434244e-06, "loss": 2.2278, "step": 474960 }, { "epoch": 0.83, "learning_rate": 8.585469295507418e-06, "loss": 2.1249, "step": 474970 }, { "epoch": 0.83, "learning_rate": 8.58459735558059e-06, "loss": 2.25, "step": 474980 }, { "epoch": 0.83, "learning_rate": 8.583725415653764e-06, "loss": 2.2839, "step": 474990 }, { "epoch": 0.83, "learning_rate": 8.582853475726936e-06, "loss": 2.2192, "step": 475000 }, { "epoch": 0.83, "learning_rate": 8.58198153580011e-06, "loss": 2.2431, "step": 475010 }, { "epoch": 0.83, "learning_rate": 8.581109595873283e-06, "loss": 2.2492, "step": 475020 }, { "epoch": 0.83, "learning_rate": 8.580237655946455e-06, "loss": 2.343, "step": 475030 }, { "epoch": 0.83, "learning_rate": 8.57936571601963e-06, "loss": 2.2648, "step": 475040 }, { "epoch": 0.83, "learning_rate": 8.578493776092803e-06, "loss": 2.2901, "step": 475050 }, { "epoch": 0.83, "learning_rate": 8.577621836165977e-06, "loss": 2.3585, "step": 475060 }, { "epoch": 0.83, "learning_rate": 8.576749896239149e-06, "loss": 2.3025, "step": 475070 }, { "epoch": 0.83, "learning_rate": 8.575877956312323e-06, "loss": 2.3053, "step": 475080 }, { "epoch": 0.83, "learning_rate": 8.575006016385495e-06, "loss": 2.3274, "step": 475090 }, { "epoch": 0.83, "learning_rate": 8.574134076458668e-06, "loss": 2.2843, "step": 475100 }, { "epoch": 0.83, "learning_rate": 8.57326213653184e-06, "loss": 2.3102, "step": 475110 }, { "epoch": 0.83, "learning_rate": 8.572390196605016e-06, "loss": 2.314, "step": 475120 }, { "epoch": 0.83, "learning_rate": 8.571518256678188e-06, "loss": 2.2853, "step": 475130 }, { "epoch": 0.83, "learning_rate": 8.570646316751362e-06, "loss": 2.2918, "step": 475140 }, { "epoch": 0.83, "learning_rate": 8.569774376824536e-06, "loss": 2.3212, "step": 475150 }, { "epoch": 0.83, "learning_rate": 8.568902436897708e-06, "loss": 2.3371, "step": 475160 }, { "epoch": 0.83, "learning_rate": 8.568030496970881e-06, "loss": 2.2821, "step": 475170 }, { "epoch": 0.83, "learning_rate": 8.567158557044054e-06, "loss": 2.3053, "step": 475180 }, { "epoch": 0.83, "learning_rate": 8.566286617117227e-06, "loss": 2.2189, "step": 475190 }, { "epoch": 0.83, "learning_rate": 8.565414677190401e-06, "loss": 2.3146, "step": 475200 }, { "epoch": 0.83, "learning_rate": 8.564542737263575e-06, "loss": 2.2096, "step": 475210 }, { "epoch": 0.83, "learning_rate": 8.563670797336747e-06, "loss": 2.2926, "step": 475220 }, { "epoch": 0.83, "learning_rate": 8.56279885740992e-06, "loss": 2.2773, "step": 475230 }, { "epoch": 0.83, "learning_rate": 8.561926917483093e-06, "loss": 2.2977, "step": 475240 }, { "epoch": 0.83, "learning_rate": 8.561054977556267e-06, "loss": 2.3685, "step": 475250 }, { "epoch": 0.83, "learning_rate": 8.560183037629439e-06, "loss": 2.2174, "step": 475260 }, { "epoch": 0.83, "learning_rate": 8.559311097702612e-06, "loss": 2.2946, "step": 475270 }, { "epoch": 0.83, "learning_rate": 8.558439157775786e-06, "loss": 2.2854, "step": 475280 }, { "epoch": 0.83, "learning_rate": 8.55756721784896e-06, "loss": 2.2573, "step": 475290 }, { "epoch": 0.83, "learning_rate": 8.556695277922134e-06, "loss": 2.2262, "step": 475300 }, { "epoch": 0.83, "learning_rate": 8.555823337995306e-06, "loss": 2.2961, "step": 475310 }, { "epoch": 0.83, "learning_rate": 8.55495139806848e-06, "loss": 2.2903, "step": 475320 }, { "epoch": 0.83, "learning_rate": 8.554079458141652e-06, "loss": 2.2764, "step": 475330 }, { "epoch": 0.83, "learning_rate": 8.553207518214825e-06, "loss": 2.1476, "step": 475340 }, { "epoch": 0.83, "learning_rate": 8.552335578287997e-06, "loss": 2.2114, "step": 475350 }, { "epoch": 0.83, "learning_rate": 8.551463638361171e-06, "loss": 2.1639, "step": 475360 }, { "epoch": 0.83, "learning_rate": 8.550591698434345e-06, "loss": 2.3028, "step": 475370 }, { "epoch": 0.83, "learning_rate": 8.549719758507519e-06, "loss": 2.3741, "step": 475380 }, { "epoch": 0.83, "learning_rate": 8.548847818580691e-06, "loss": 2.329, "step": 475390 }, { "epoch": 0.83, "learning_rate": 8.547975878653865e-06, "loss": 2.4062, "step": 475400 }, { "epoch": 0.83, "learning_rate": 8.547103938727038e-06, "loss": 2.367, "step": 475410 }, { "epoch": 0.83, "learning_rate": 8.54623199880021e-06, "loss": 2.2503, "step": 475420 }, { "epoch": 0.83, "learning_rate": 8.545360058873384e-06, "loss": 2.1635, "step": 475430 }, { "epoch": 0.83, "learning_rate": 8.544488118946558e-06, "loss": 2.183, "step": 475440 }, { "epoch": 0.83, "learning_rate": 8.543616179019732e-06, "loss": 2.2927, "step": 475450 }, { "epoch": 0.83, "learning_rate": 8.542744239092904e-06, "loss": 2.297, "step": 475460 }, { "epoch": 0.83, "learning_rate": 8.541872299166078e-06, "loss": 2.2784, "step": 475470 }, { "epoch": 0.83, "learning_rate": 8.54100035923925e-06, "loss": 2.2832, "step": 475480 }, { "epoch": 0.83, "learning_rate": 8.540128419312423e-06, "loss": 2.2184, "step": 475490 }, { "epoch": 0.83, "learning_rate": 8.539256479385596e-06, "loss": 2.3449, "step": 475500 }, { "epoch": 0.83, "learning_rate": 8.53838453945877e-06, "loss": 2.1972, "step": 475510 }, { "epoch": 0.83, "learning_rate": 8.537512599531943e-06, "loss": 2.2883, "step": 475520 }, { "epoch": 0.83, "learning_rate": 8.536640659605117e-06, "loss": 2.3311, "step": 475530 }, { "epoch": 0.83, "learning_rate": 8.53576871967829e-06, "loss": 2.2036, "step": 475540 }, { "epoch": 0.83, "learning_rate": 8.534896779751463e-06, "loss": 2.3853, "step": 475550 }, { "epoch": 0.83, "learning_rate": 8.534024839824636e-06, "loss": 2.2309, "step": 475560 }, { "epoch": 0.83, "learning_rate": 8.533152899897809e-06, "loss": 2.3253, "step": 475570 }, { "epoch": 0.83, "learning_rate": 8.532280959970982e-06, "loss": 2.2249, "step": 475580 }, { "epoch": 0.83, "learning_rate": 8.531409020044154e-06, "loss": 2.266, "step": 475590 }, { "epoch": 0.83, "learning_rate": 8.530537080117328e-06, "loss": 2.3228, "step": 475600 }, { "epoch": 0.83, "learning_rate": 8.529665140190502e-06, "loss": 2.2028, "step": 475610 }, { "epoch": 0.83, "learning_rate": 8.528793200263676e-06, "loss": 2.3141, "step": 475620 }, { "epoch": 0.83, "learning_rate": 8.527921260336848e-06, "loss": 2.3455, "step": 475630 }, { "epoch": 0.83, "learning_rate": 8.527049320410022e-06, "loss": 2.3824, "step": 475640 }, { "epoch": 0.83, "learning_rate": 8.526177380483194e-06, "loss": 2.235, "step": 475650 }, { "epoch": 0.83, "learning_rate": 8.525305440556367e-06, "loss": 2.2821, "step": 475660 }, { "epoch": 0.83, "learning_rate": 8.524433500629541e-06, "loss": 2.1979, "step": 475670 }, { "epoch": 0.83, "learning_rate": 8.523561560702715e-06, "loss": 2.2468, "step": 475680 }, { "epoch": 0.83, "learning_rate": 8.522689620775889e-06, "loss": 2.1379, "step": 475690 }, { "epoch": 0.83, "learning_rate": 8.52181768084906e-06, "loss": 2.0841, "step": 475700 }, { "epoch": 0.83, "learning_rate": 8.520945740922235e-06, "loss": 2.2132, "step": 475710 }, { "epoch": 0.83, "learning_rate": 8.520073800995407e-06, "loss": 2.3213, "step": 475720 }, { "epoch": 0.83, "learning_rate": 8.51920186106858e-06, "loss": 2.2611, "step": 475730 }, { "epoch": 0.83, "learning_rate": 8.518329921141752e-06, "loss": 2.4095, "step": 475740 }, { "epoch": 0.83, "learning_rate": 8.517457981214926e-06, "loss": 2.2323, "step": 475750 }, { "epoch": 0.83, "learning_rate": 8.5165860412881e-06, "loss": 2.2982, "step": 475760 }, { "epoch": 0.83, "learning_rate": 8.515714101361274e-06, "loss": 2.2656, "step": 475770 }, { "epoch": 0.83, "learning_rate": 8.514842161434446e-06, "loss": 2.367, "step": 475780 }, { "epoch": 0.83, "learning_rate": 8.51397022150762e-06, "loss": 2.2024, "step": 475790 }, { "epoch": 0.83, "learning_rate": 8.513098281580793e-06, "loss": 2.3517, "step": 475800 }, { "epoch": 0.83, "learning_rate": 8.512226341653965e-06, "loss": 2.0865, "step": 475810 }, { "epoch": 0.83, "learning_rate": 8.51135440172714e-06, "loss": 2.3602, "step": 475820 }, { "epoch": 0.83, "learning_rate": 8.510482461800311e-06, "loss": 2.2982, "step": 475830 }, { "epoch": 0.83, "learning_rate": 8.509610521873485e-06, "loss": 2.2435, "step": 475840 }, { "epoch": 0.83, "learning_rate": 8.508738581946659e-06, "loss": 2.3224, "step": 475850 }, { "epoch": 0.83, "learning_rate": 8.507866642019833e-06, "loss": 2.2675, "step": 475860 }, { "epoch": 0.83, "learning_rate": 8.506994702093005e-06, "loss": 2.2746, "step": 475870 }, { "epoch": 0.83, "learning_rate": 8.506122762166178e-06, "loss": 2.3232, "step": 475880 }, { "epoch": 0.83, "learning_rate": 8.50525082223935e-06, "loss": 2.2571, "step": 475890 }, { "epoch": 0.83, "learning_rate": 8.504378882312524e-06, "loss": 2.3584, "step": 475900 }, { "epoch": 0.83, "learning_rate": 8.503506942385696e-06, "loss": 2.3146, "step": 475910 }, { "epoch": 0.83, "learning_rate": 8.502635002458872e-06, "loss": 2.2274, "step": 475920 }, { "epoch": 0.83, "learning_rate": 8.501763062532044e-06, "loss": 2.2637, "step": 475930 }, { "epoch": 0.83, "learning_rate": 8.500891122605218e-06, "loss": 2.3587, "step": 475940 }, { "epoch": 0.83, "learning_rate": 8.500019182678391e-06, "loss": 2.3065, "step": 475950 }, { "epoch": 0.83, "learning_rate": 8.499147242751564e-06, "loss": 2.2198, "step": 475960 }, { "epoch": 0.83, "learning_rate": 8.498275302824737e-06, "loss": 2.3292, "step": 475970 }, { "epoch": 0.83, "learning_rate": 8.49740336289791e-06, "loss": 2.3082, "step": 475980 }, { "epoch": 0.83, "learning_rate": 8.496531422971083e-06, "loss": 2.2775, "step": 475990 }, { "epoch": 0.83, "learning_rate": 8.495659483044257e-06, "loss": 2.1142, "step": 476000 }, { "epoch": 0.83, "learning_rate": 8.49478754311743e-06, "loss": 2.3147, "step": 476010 }, { "epoch": 0.83, "learning_rate": 8.493915603190603e-06, "loss": 2.2804, "step": 476020 }, { "epoch": 0.83, "learning_rate": 8.493043663263777e-06, "loss": 2.3113, "step": 476030 }, { "epoch": 0.83, "learning_rate": 8.492171723336949e-06, "loss": 2.2689, "step": 476040 }, { "epoch": 0.83, "learning_rate": 8.491299783410122e-06, "loss": 2.2099, "step": 476050 }, { "epoch": 0.83, "learning_rate": 8.490427843483294e-06, "loss": 2.2329, "step": 476060 }, { "epoch": 0.83, "learning_rate": 8.489555903556468e-06, "loss": 2.3424, "step": 476070 }, { "epoch": 0.83, "learning_rate": 8.488683963629642e-06, "loss": 2.2372, "step": 476080 }, { "epoch": 0.83, "learning_rate": 8.487812023702816e-06, "loss": 2.2927, "step": 476090 }, { "epoch": 0.83, "learning_rate": 8.48694008377599e-06, "loss": 2.1545, "step": 476100 }, { "epoch": 0.83, "learning_rate": 8.486068143849162e-06, "loss": 2.4383, "step": 476110 }, { "epoch": 0.83, "learning_rate": 8.485196203922335e-06, "loss": 2.2859, "step": 476120 }, { "epoch": 0.83, "learning_rate": 8.484324263995507e-06, "loss": 2.2105, "step": 476130 }, { "epoch": 0.83, "learning_rate": 8.483452324068681e-06, "loss": 2.1884, "step": 476140 }, { "epoch": 0.83, "learning_rate": 8.482580384141853e-06, "loss": 2.2681, "step": 476150 }, { "epoch": 0.83, "learning_rate": 8.481708444215029e-06, "loss": 2.1991, "step": 476160 }, { "epoch": 0.83, "learning_rate": 8.480836504288201e-06, "loss": 2.3411, "step": 476170 }, { "epoch": 0.83, "learning_rate": 8.479964564361375e-06, "loss": 2.1767, "step": 476180 }, { "epoch": 0.83, "learning_rate": 8.479092624434547e-06, "loss": 2.2779, "step": 476190 }, { "epoch": 0.83, "learning_rate": 8.47822068450772e-06, "loss": 2.239, "step": 476200 }, { "epoch": 0.83, "learning_rate": 8.477348744580894e-06, "loss": 2.3679, "step": 476210 }, { "epoch": 0.83, "learning_rate": 8.476476804654066e-06, "loss": 2.3923, "step": 476220 }, { "epoch": 0.83, "learning_rate": 8.47560486472724e-06, "loss": 2.3147, "step": 476230 }, { "epoch": 0.83, "learning_rate": 8.474732924800414e-06, "loss": 2.1106, "step": 476240 }, { "epoch": 0.83, "learning_rate": 8.473860984873588e-06, "loss": 2.4023, "step": 476250 }, { "epoch": 0.83, "learning_rate": 8.47298904494676e-06, "loss": 2.0389, "step": 476260 }, { "epoch": 0.83, "learning_rate": 8.472117105019934e-06, "loss": 2.2389, "step": 476270 }, { "epoch": 0.83, "learning_rate": 8.471245165093106e-06, "loss": 2.3043, "step": 476280 }, { "epoch": 0.83, "learning_rate": 8.47037322516628e-06, "loss": 2.1598, "step": 476290 }, { "epoch": 0.83, "learning_rate": 8.469501285239451e-06, "loss": 2.3241, "step": 476300 }, { "epoch": 0.83, "learning_rate": 8.468629345312625e-06, "loss": 2.1615, "step": 476310 }, { "epoch": 0.83, "learning_rate": 8.467757405385799e-06, "loss": 2.1564, "step": 476320 }, { "epoch": 0.83, "learning_rate": 8.466885465458973e-06, "loss": 2.3667, "step": 476330 }, { "epoch": 0.83, "learning_rate": 8.466013525532147e-06, "loss": 2.2494, "step": 476340 }, { "epoch": 0.83, "learning_rate": 8.465141585605319e-06, "loss": 2.2708, "step": 476350 }, { "epoch": 0.83, "learning_rate": 8.464269645678492e-06, "loss": 2.2011, "step": 476360 }, { "epoch": 0.83, "learning_rate": 8.463397705751664e-06, "loss": 2.3691, "step": 476370 }, { "epoch": 0.83, "learning_rate": 8.462525765824838e-06, "loss": 2.2554, "step": 476380 }, { "epoch": 0.83, "learning_rate": 8.46165382589801e-06, "loss": 2.3102, "step": 476390 }, { "epoch": 0.83, "learning_rate": 8.460781885971184e-06, "loss": 2.3114, "step": 476400 }, { "epoch": 0.83, "learning_rate": 8.459909946044358e-06, "loss": 2.2042, "step": 476410 }, { "epoch": 0.83, "learning_rate": 8.459038006117532e-06, "loss": 2.3707, "step": 476420 }, { "epoch": 0.83, "learning_rate": 8.458166066190704e-06, "loss": 2.2274, "step": 476430 }, { "epoch": 0.83, "learning_rate": 8.457294126263877e-06, "loss": 2.1619, "step": 476440 }, { "epoch": 0.83, "learning_rate": 8.45642218633705e-06, "loss": 2.3429, "step": 476450 }, { "epoch": 0.83, "learning_rate": 8.455550246410223e-06, "loss": 2.2992, "step": 476460 }, { "epoch": 0.83, "learning_rate": 8.454678306483397e-06, "loss": 2.241, "step": 476470 }, { "epoch": 0.83, "learning_rate": 8.45380636655657e-06, "loss": 2.2868, "step": 476480 }, { "epoch": 0.83, "learning_rate": 8.452934426629745e-06, "loss": 2.3155, "step": 476490 }, { "epoch": 0.83, "learning_rate": 8.452062486702917e-06, "loss": 2.3955, "step": 476500 }, { "epoch": 0.83, "learning_rate": 8.45119054677609e-06, "loss": 2.1655, "step": 476510 }, { "epoch": 0.83, "learning_rate": 8.450318606849263e-06, "loss": 2.3297, "step": 476520 }, { "epoch": 0.83, "learning_rate": 8.449446666922436e-06, "loss": 2.329, "step": 476530 }, { "epoch": 0.83, "learning_rate": 8.448574726995608e-06, "loss": 2.3799, "step": 476540 }, { "epoch": 0.83, "learning_rate": 8.447702787068782e-06, "loss": 2.2678, "step": 476550 }, { "epoch": 0.83, "learning_rate": 8.446830847141956e-06, "loss": 2.2957, "step": 476560 }, { "epoch": 0.83, "learning_rate": 8.44595890721513e-06, "loss": 2.3845, "step": 476570 }, { "epoch": 0.83, "learning_rate": 8.445086967288302e-06, "loss": 2.2667, "step": 476580 }, { "epoch": 0.83, "learning_rate": 8.444215027361476e-06, "loss": 2.1405, "step": 476590 }, { "epoch": 0.83, "learning_rate": 8.44334308743465e-06, "loss": 2.2881, "step": 476600 }, { "epoch": 0.83, "learning_rate": 8.442471147507821e-06, "loss": 2.2162, "step": 476610 }, { "epoch": 0.83, "learning_rate": 8.441599207580995e-06, "loss": 2.2943, "step": 476620 }, { "epoch": 0.83, "learning_rate": 8.440727267654167e-06, "loss": 2.315, "step": 476630 }, { "epoch": 0.83, "learning_rate": 8.439855327727341e-06, "loss": 2.3693, "step": 476640 }, { "epoch": 0.83, "learning_rate": 8.438983387800515e-06, "loss": 2.327, "step": 476650 }, { "epoch": 0.83, "learning_rate": 8.438111447873689e-06, "loss": 2.1879, "step": 476660 }, { "epoch": 0.83, "learning_rate": 8.43723950794686e-06, "loss": 2.1753, "step": 476670 }, { "epoch": 0.83, "learning_rate": 8.436367568020034e-06, "loss": 2.2798, "step": 476680 }, { "epoch": 0.83, "learning_rate": 8.435495628093206e-06, "loss": 2.252, "step": 476690 }, { "epoch": 0.83, "learning_rate": 8.43462368816638e-06, "loss": 2.2499, "step": 476700 }, { "epoch": 0.83, "learning_rate": 8.433751748239552e-06, "loss": 2.2868, "step": 476710 }, { "epoch": 0.83, "learning_rate": 8.432879808312728e-06, "loss": 2.3271, "step": 476720 }, { "epoch": 0.83, "learning_rate": 8.4320078683859e-06, "loss": 2.2499, "step": 476730 }, { "epoch": 0.83, "learning_rate": 8.431135928459074e-06, "loss": 2.217, "step": 476740 }, { "epoch": 0.83, "learning_rate": 8.430263988532247e-06, "loss": 2.2256, "step": 476750 }, { "epoch": 0.83, "learning_rate": 8.42939204860542e-06, "loss": 2.3777, "step": 476760 }, { "epoch": 0.83, "learning_rate": 8.428520108678593e-06, "loss": 2.2723, "step": 476770 }, { "epoch": 0.83, "learning_rate": 8.427648168751765e-06, "loss": 2.2823, "step": 476780 }, { "epoch": 0.83, "learning_rate": 8.426776228824939e-06, "loss": 2.2286, "step": 476790 }, { "epoch": 0.83, "learning_rate": 8.425904288898113e-06, "loss": 2.3359, "step": 476800 }, { "epoch": 0.83, "learning_rate": 8.425032348971287e-06, "loss": 2.3407, "step": 476810 }, { "epoch": 0.83, "learning_rate": 8.424160409044459e-06, "loss": 2.3377, "step": 476820 }, { "epoch": 0.83, "learning_rate": 8.423288469117632e-06, "loss": 2.3397, "step": 476830 }, { "epoch": 0.83, "learning_rate": 8.422416529190805e-06, "loss": 2.278, "step": 476840 }, { "epoch": 0.83, "learning_rate": 8.421544589263978e-06, "loss": 2.2304, "step": 476850 }, { "epoch": 0.83, "learning_rate": 8.42067264933715e-06, "loss": 2.1223, "step": 476860 }, { "epoch": 0.83, "learning_rate": 8.419800709410324e-06, "loss": 2.3049, "step": 476870 }, { "epoch": 0.83, "learning_rate": 8.418928769483498e-06, "loss": 2.1612, "step": 476880 }, { "epoch": 0.83, "learning_rate": 8.418056829556672e-06, "loss": 2.2601, "step": 476890 }, { "epoch": 0.83, "learning_rate": 8.417184889629845e-06, "loss": 2.2623, "step": 476900 }, { "epoch": 0.83, "learning_rate": 8.416312949703018e-06, "loss": 2.2977, "step": 476910 }, { "epoch": 0.83, "learning_rate": 8.415441009776191e-06, "loss": 2.3041, "step": 476920 }, { "epoch": 0.83, "learning_rate": 8.414569069849363e-06, "loss": 2.2297, "step": 476930 }, { "epoch": 0.83, "learning_rate": 8.413697129922537e-06, "loss": 2.2483, "step": 476940 }, { "epoch": 0.83, "learning_rate": 8.41282518999571e-06, "loss": 2.244, "step": 476950 }, { "epoch": 0.83, "learning_rate": 8.411953250068885e-06, "loss": 2.2763, "step": 476960 }, { "epoch": 0.83, "learning_rate": 8.411081310142057e-06, "loss": 2.2891, "step": 476970 }, { "epoch": 0.83, "learning_rate": 8.41020937021523e-06, "loss": 2.1821, "step": 476980 }, { "epoch": 0.83, "learning_rate": 8.409337430288403e-06, "loss": 2.3662, "step": 476990 }, { "epoch": 0.83, "learning_rate": 8.408465490361576e-06, "loss": 2.1608, "step": 477000 }, { "epoch": 0.83, "learning_rate": 8.40759355043475e-06, "loss": 2.2978, "step": 477010 }, { "epoch": 0.83, "learning_rate": 8.406721610507922e-06, "loss": 2.3339, "step": 477020 }, { "epoch": 0.83, "learning_rate": 8.405849670581096e-06, "loss": 2.3014, "step": 477030 }, { "epoch": 0.83, "learning_rate": 8.40497773065427e-06, "loss": 2.2962, "step": 477040 }, { "epoch": 0.83, "learning_rate": 8.404105790727444e-06, "loss": 2.2577, "step": 477050 }, { "epoch": 0.83, "learning_rate": 8.403233850800616e-06, "loss": 2.3116, "step": 477060 }, { "epoch": 0.83, "learning_rate": 8.40236191087379e-06, "loss": 2.2159, "step": 477070 }, { "epoch": 0.83, "learning_rate": 8.401489970946961e-06, "loss": 2.227, "step": 477080 }, { "epoch": 0.83, "learning_rate": 8.400618031020135e-06, "loss": 2.2024, "step": 477090 }, { "epoch": 0.83, "learning_rate": 8.399746091093307e-06, "loss": 2.266, "step": 477100 }, { "epoch": 0.83, "learning_rate": 8.398874151166481e-06, "loss": 2.2406, "step": 477110 }, { "epoch": 0.83, "learning_rate": 8.398002211239655e-06, "loss": 2.3288, "step": 477120 }, { "epoch": 0.83, "learning_rate": 8.397130271312829e-06, "loss": 2.2521, "step": 477130 }, { "epoch": 0.83, "learning_rate": 8.396258331386002e-06, "loss": 2.3274, "step": 477140 }, { "epoch": 0.83, "learning_rate": 8.395386391459174e-06, "loss": 2.3312, "step": 477150 }, { "epoch": 0.83, "learning_rate": 8.394514451532348e-06, "loss": 2.2442, "step": 477160 }, { "epoch": 0.83, "learning_rate": 8.39364251160552e-06, "loss": 2.3883, "step": 477170 }, { "epoch": 0.83, "learning_rate": 8.392770571678694e-06, "loss": 2.3247, "step": 477180 }, { "epoch": 0.83, "learning_rate": 8.391898631751866e-06, "loss": 2.1837, "step": 477190 }, { "epoch": 0.83, "learning_rate": 8.391026691825042e-06, "loss": 2.238, "step": 477200 }, { "epoch": 0.83, "learning_rate": 8.390154751898214e-06, "loss": 2.3133, "step": 477210 }, { "epoch": 0.83, "learning_rate": 8.389282811971387e-06, "loss": 2.312, "step": 477220 }, { "epoch": 0.83, "learning_rate": 8.38841087204456e-06, "loss": 2.3578, "step": 477230 }, { "epoch": 0.83, "learning_rate": 8.387538932117733e-06, "loss": 2.2222, "step": 477240 }, { "epoch": 0.83, "learning_rate": 8.386666992190905e-06, "loss": 2.3466, "step": 477250 }, { "epoch": 0.83, "learning_rate": 8.385795052264079e-06, "loss": 2.3018, "step": 477260 }, { "epoch": 0.83, "learning_rate": 8.384923112337253e-06, "loss": 2.3521, "step": 477270 }, { "epoch": 0.83, "learning_rate": 8.384051172410427e-06, "loss": 2.3073, "step": 477280 }, { "epoch": 0.83, "learning_rate": 8.3831792324836e-06, "loss": 2.095, "step": 477290 }, { "epoch": 0.83, "learning_rate": 8.382307292556773e-06, "loss": 2.3211, "step": 477300 }, { "epoch": 0.83, "learning_rate": 8.381435352629946e-06, "loss": 2.2695, "step": 477310 }, { "epoch": 0.83, "learning_rate": 8.380563412703118e-06, "loss": 2.263, "step": 477320 }, { "epoch": 0.83, "learning_rate": 8.379691472776292e-06, "loss": 2.2529, "step": 477330 }, { "epoch": 0.83, "learning_rate": 8.378819532849464e-06, "loss": 2.2209, "step": 477340 }, { "epoch": 0.83, "learning_rate": 8.377947592922638e-06, "loss": 2.3385, "step": 477350 }, { "epoch": 0.83, "learning_rate": 8.377075652995812e-06, "loss": 2.3037, "step": 477360 }, { "epoch": 0.83, "learning_rate": 8.376203713068986e-06, "loss": 2.2043, "step": 477370 }, { "epoch": 0.83, "learning_rate": 8.375331773142158e-06, "loss": 2.1906, "step": 477380 }, { "epoch": 0.83, "learning_rate": 8.374459833215331e-06, "loss": 2.4213, "step": 477390 }, { "epoch": 0.83, "learning_rate": 8.373587893288505e-06, "loss": 2.2054, "step": 477400 }, { "epoch": 0.83, "learning_rate": 8.372715953361677e-06, "loss": 2.2274, "step": 477410 }, { "epoch": 0.83, "learning_rate": 8.371844013434851e-06, "loss": 2.202, "step": 477420 }, { "epoch": 0.83, "learning_rate": 8.370972073508023e-06, "loss": 2.2219, "step": 477430 }, { "epoch": 0.83, "learning_rate": 8.370100133581197e-06, "loss": 2.4246, "step": 477440 }, { "epoch": 0.83, "learning_rate": 8.36922819365437e-06, "loss": 2.282, "step": 477450 }, { "epoch": 0.83, "learning_rate": 8.368356253727544e-06, "loss": 2.269, "step": 477460 }, { "epoch": 0.83, "learning_rate": 8.367484313800716e-06, "loss": 2.3711, "step": 477470 }, { "epoch": 0.83, "learning_rate": 8.36661237387389e-06, "loss": 2.3224, "step": 477480 }, { "epoch": 0.83, "learning_rate": 8.365740433947062e-06, "loss": 2.2139, "step": 477490 }, { "epoch": 0.83, "learning_rate": 8.364868494020236e-06, "loss": 2.3459, "step": 477500 }, { "epoch": 0.83, "learning_rate": 8.36399655409341e-06, "loss": 2.3052, "step": 477510 }, { "epoch": 0.83, "learning_rate": 8.363124614166584e-06, "loss": 2.2571, "step": 477520 }, { "epoch": 0.83, "learning_rate": 8.362252674239757e-06, "loss": 2.2173, "step": 477530 }, { "epoch": 0.83, "learning_rate": 8.36138073431293e-06, "loss": 2.2988, "step": 477540 }, { "epoch": 0.83, "learning_rate": 8.360508794386103e-06, "loss": 2.2934, "step": 477550 }, { "epoch": 0.83, "learning_rate": 8.359636854459275e-06, "loss": 2.3263, "step": 477560 }, { "epoch": 0.83, "learning_rate": 8.358764914532449e-06, "loss": 2.2333, "step": 477570 }, { "epoch": 0.83, "learning_rate": 8.357892974605621e-06, "loss": 2.3021, "step": 477580 }, { "epoch": 0.83, "learning_rate": 8.357021034678795e-06, "loss": 2.2049, "step": 477590 }, { "epoch": 0.83, "learning_rate": 8.356149094751969e-06, "loss": 2.2843, "step": 477600 }, { "epoch": 0.83, "learning_rate": 8.355277154825142e-06, "loss": 2.3238, "step": 477610 }, { "epoch": 0.83, "learning_rate": 8.354405214898315e-06, "loss": 2.2355, "step": 477620 }, { "epoch": 0.83, "learning_rate": 8.353533274971488e-06, "loss": 2.2714, "step": 477630 }, { "epoch": 0.83, "learning_rate": 8.35266133504466e-06, "loss": 2.268, "step": 477640 }, { "epoch": 0.83, "learning_rate": 8.351789395117834e-06, "loss": 2.171, "step": 477650 }, { "epoch": 0.83, "learning_rate": 8.350917455191006e-06, "loss": 2.3452, "step": 477660 }, { "epoch": 0.83, "learning_rate": 8.35004551526418e-06, "loss": 2.2659, "step": 477670 }, { "epoch": 0.83, "learning_rate": 8.349173575337354e-06, "loss": 2.3044, "step": 477680 }, { "epoch": 0.83, "learning_rate": 8.348301635410528e-06, "loss": 2.264, "step": 477690 }, { "epoch": 0.83, "learning_rate": 8.347429695483701e-06, "loss": 2.257, "step": 477700 }, { "epoch": 0.83, "learning_rate": 8.346557755556873e-06, "loss": 2.3204, "step": 477710 }, { "epoch": 0.83, "learning_rate": 8.345685815630047e-06, "loss": 2.1921, "step": 477720 }, { "epoch": 0.83, "learning_rate": 8.34481387570322e-06, "loss": 2.2204, "step": 477730 }, { "epoch": 0.83, "learning_rate": 8.343941935776393e-06, "loss": 2.2447, "step": 477740 }, { "epoch": 0.83, "learning_rate": 8.343069995849565e-06, "loss": 2.2456, "step": 477750 }, { "epoch": 0.83, "learning_rate": 8.34219805592274e-06, "loss": 2.2704, "step": 477760 }, { "epoch": 0.83, "learning_rate": 8.341326115995913e-06, "loss": 2.3506, "step": 477770 }, { "epoch": 0.83, "learning_rate": 8.340454176069086e-06, "loss": 2.2343, "step": 477780 }, { "epoch": 0.83, "learning_rate": 8.339582236142258e-06, "loss": 2.2678, "step": 477790 }, { "epoch": 0.83, "learning_rate": 8.338710296215432e-06, "loss": 2.2978, "step": 477800 }, { "epoch": 0.83, "learning_rate": 8.337838356288606e-06, "loss": 2.3624, "step": 477810 }, { "epoch": 0.83, "learning_rate": 8.336966416361778e-06, "loss": 2.2187, "step": 477820 }, { "epoch": 0.83, "learning_rate": 8.336094476434952e-06, "loss": 2.2323, "step": 477830 }, { "epoch": 0.83, "learning_rate": 8.335222536508126e-06, "loss": 2.3017, "step": 477840 }, { "epoch": 0.83, "learning_rate": 8.3343505965813e-06, "loss": 2.3545, "step": 477850 }, { "epoch": 0.83, "learning_rate": 8.333478656654471e-06, "loss": 2.2586, "step": 477860 }, { "epoch": 0.83, "learning_rate": 8.332606716727645e-06, "loss": 2.2586, "step": 477870 }, { "epoch": 0.83, "learning_rate": 8.331734776800817e-06, "loss": 2.3332, "step": 477880 }, { "epoch": 0.83, "learning_rate": 8.330862836873991e-06, "loss": 2.3111, "step": 477890 }, { "epoch": 0.83, "learning_rate": 8.329990896947163e-06, "loss": 2.3492, "step": 477900 }, { "epoch": 0.83, "learning_rate": 8.329118957020337e-06, "loss": 2.1101, "step": 477910 }, { "epoch": 0.83, "learning_rate": 8.32824701709351e-06, "loss": 2.2629, "step": 477920 }, { "epoch": 0.83, "learning_rate": 8.327375077166684e-06, "loss": 2.2899, "step": 477930 }, { "epoch": 0.83, "learning_rate": 8.326503137239858e-06, "loss": 2.3297, "step": 477940 }, { "epoch": 0.83, "learning_rate": 8.32563119731303e-06, "loss": 2.2774, "step": 477950 }, { "epoch": 0.83, "learning_rate": 8.324759257386204e-06, "loss": 2.2581, "step": 477960 }, { "epoch": 0.83, "learning_rate": 8.323887317459376e-06, "loss": 2.2566, "step": 477970 }, { "epoch": 0.83, "learning_rate": 8.32301537753255e-06, "loss": 2.3819, "step": 477980 }, { "epoch": 0.83, "learning_rate": 8.322143437605722e-06, "loss": 2.368, "step": 477990 }, { "epoch": 0.83, "learning_rate": 8.321271497678897e-06, "loss": 2.2201, "step": 478000 }, { "epoch": 0.83, "learning_rate": 8.32039955775207e-06, "loss": 2.3603, "step": 478010 }, { "epoch": 0.83, "learning_rate": 8.319527617825243e-06, "loss": 2.3095, "step": 478020 }, { "epoch": 0.83, "learning_rate": 8.318655677898415e-06, "loss": 2.2764, "step": 478030 }, { "epoch": 0.83, "learning_rate": 8.317783737971589e-06, "loss": 2.309, "step": 478040 }, { "epoch": 0.83, "learning_rate": 8.316911798044761e-06, "loss": 2.1855, "step": 478050 }, { "epoch": 0.83, "learning_rate": 8.316039858117935e-06, "loss": 2.3295, "step": 478060 }, { "epoch": 0.83, "learning_rate": 8.315167918191109e-06, "loss": 2.3916, "step": 478070 }, { "epoch": 0.83, "learning_rate": 8.314295978264283e-06, "loss": 2.2818, "step": 478080 }, { "epoch": 0.83, "learning_rate": 8.313424038337456e-06, "loss": 2.3059, "step": 478090 }, { "epoch": 0.83, "learning_rate": 8.312552098410628e-06, "loss": 2.3162, "step": 478100 }, { "epoch": 0.83, "learning_rate": 8.311680158483802e-06, "loss": 2.1499, "step": 478110 }, { "epoch": 0.83, "learning_rate": 8.310808218556974e-06, "loss": 2.2111, "step": 478120 }, { "epoch": 0.83, "learning_rate": 8.309936278630148e-06, "loss": 2.1834, "step": 478130 }, { "epoch": 0.83, "learning_rate": 8.30906433870332e-06, "loss": 2.3963, "step": 478140 }, { "epoch": 0.83, "learning_rate": 8.308192398776494e-06, "loss": 2.1821, "step": 478150 }, { "epoch": 0.83, "learning_rate": 8.307320458849668e-06, "loss": 2.3194, "step": 478160 }, { "epoch": 0.83, "learning_rate": 8.306448518922841e-06, "loss": 2.3462, "step": 478170 }, { "epoch": 0.83, "learning_rate": 8.305576578996013e-06, "loss": 2.2558, "step": 478180 }, { "epoch": 0.83, "learning_rate": 8.304704639069187e-06, "loss": 2.2729, "step": 478190 }, { "epoch": 0.83, "learning_rate": 8.303832699142361e-06, "loss": 2.3035, "step": 478200 }, { "epoch": 0.83, "learning_rate": 8.302960759215533e-06, "loss": 2.2249, "step": 478210 }, { "epoch": 0.83, "learning_rate": 8.302088819288707e-06, "loss": 2.1122, "step": 478220 }, { "epoch": 0.83, "learning_rate": 8.301216879361879e-06, "loss": 2.218, "step": 478230 }, { "epoch": 0.83, "learning_rate": 8.300344939435054e-06, "loss": 2.3227, "step": 478240 }, { "epoch": 0.83, "learning_rate": 8.299472999508226e-06, "loss": 2.2238, "step": 478250 }, { "epoch": 0.83, "learning_rate": 8.2986010595814e-06, "loss": 2.2789, "step": 478260 }, { "epoch": 0.83, "learning_rate": 8.297729119654572e-06, "loss": 2.1639, "step": 478270 }, { "epoch": 0.83, "learning_rate": 8.296857179727746e-06, "loss": 2.3395, "step": 478280 }, { "epoch": 0.83, "learning_rate": 8.295985239800918e-06, "loss": 2.334, "step": 478290 }, { "epoch": 0.83, "learning_rate": 8.295113299874092e-06, "loss": 2.3162, "step": 478300 }, { "epoch": 0.83, "learning_rate": 8.294241359947266e-06, "loss": 2.3743, "step": 478310 }, { "epoch": 0.83, "learning_rate": 8.29336942002044e-06, "loss": 2.2686, "step": 478320 }, { "epoch": 0.83, "learning_rate": 8.292497480093613e-06, "loss": 2.3226, "step": 478330 }, { "epoch": 0.83, "learning_rate": 8.291625540166785e-06, "loss": 2.2775, "step": 478340 }, { "epoch": 0.83, "learning_rate": 8.290753600239959e-06, "loss": 2.3007, "step": 478350 }, { "epoch": 0.83, "learning_rate": 8.289881660313131e-06, "loss": 2.2179, "step": 478360 }, { "epoch": 0.83, "learning_rate": 8.289009720386305e-06, "loss": 2.3176, "step": 478370 }, { "epoch": 0.83, "learning_rate": 8.288137780459477e-06, "loss": 2.2457, "step": 478380 }, { "epoch": 0.83, "learning_rate": 8.28726584053265e-06, "loss": 2.2523, "step": 478390 }, { "epoch": 0.83, "learning_rate": 8.286393900605825e-06, "loss": 2.3803, "step": 478400 }, { "epoch": 0.83, "learning_rate": 8.285521960678998e-06, "loss": 2.1909, "step": 478410 }, { "epoch": 0.83, "learning_rate": 8.28465002075217e-06, "loss": 2.3869, "step": 478420 }, { "epoch": 0.83, "learning_rate": 8.283778080825344e-06, "loss": 2.1477, "step": 478430 }, { "epoch": 0.83, "learning_rate": 8.282906140898516e-06, "loss": 2.2568, "step": 478440 }, { "epoch": 0.83, "learning_rate": 8.28203420097169e-06, "loss": 2.1575, "step": 478450 }, { "epoch": 0.83, "learning_rate": 8.281162261044862e-06, "loss": 2.2908, "step": 478460 }, { "epoch": 0.83, "learning_rate": 8.280290321118036e-06, "loss": 2.359, "step": 478470 }, { "epoch": 0.83, "learning_rate": 8.27941838119121e-06, "loss": 2.3087, "step": 478480 }, { "epoch": 0.83, "learning_rate": 8.278546441264383e-06, "loss": 2.255, "step": 478490 }, { "epoch": 0.83, "learning_rate": 8.277674501337557e-06, "loss": 2.2722, "step": 478500 }, { "epoch": 0.83, "learning_rate": 8.27680256141073e-06, "loss": 2.2536, "step": 478510 }, { "epoch": 0.83, "learning_rate": 8.275930621483903e-06, "loss": 2.3924, "step": 478520 }, { "epoch": 0.83, "learning_rate": 8.275058681557075e-06, "loss": 2.2938, "step": 478530 }, { "epoch": 0.83, "learning_rate": 8.274186741630249e-06, "loss": 2.2846, "step": 478540 }, { "epoch": 0.83, "learning_rate": 8.273314801703423e-06, "loss": 2.3374, "step": 478550 }, { "epoch": 0.83, "learning_rate": 8.272442861776596e-06, "loss": 2.2356, "step": 478560 }, { "epoch": 0.83, "learning_rate": 8.271570921849768e-06, "loss": 2.3213, "step": 478570 }, { "epoch": 0.83, "learning_rate": 8.270698981922942e-06, "loss": 2.2232, "step": 478580 }, { "epoch": 0.83, "learning_rate": 8.269827041996114e-06, "loss": 2.3631, "step": 478590 }, { "epoch": 0.83, "learning_rate": 8.268955102069288e-06, "loss": 2.2902, "step": 478600 }, { "epoch": 0.83, "learning_rate": 8.268083162142462e-06, "loss": 2.3103, "step": 478610 }, { "epoch": 0.83, "learning_rate": 8.267211222215634e-06, "loss": 2.3077, "step": 478620 }, { "epoch": 0.83, "learning_rate": 8.266339282288808e-06, "loss": 2.2374, "step": 478630 }, { "epoch": 0.83, "learning_rate": 8.265467342361981e-06, "loss": 2.3171, "step": 478640 }, { "epoch": 0.83, "learning_rate": 8.264595402435155e-06, "loss": 2.2571, "step": 478650 }, { "epoch": 0.83, "learning_rate": 8.263723462508327e-06, "loss": 2.2886, "step": 478660 }, { "epoch": 0.83, "learning_rate": 8.262851522581501e-06, "loss": 2.2503, "step": 478670 }, { "epoch": 0.83, "learning_rate": 8.261979582654673e-06, "loss": 2.2269, "step": 478680 }, { "epoch": 0.83, "learning_rate": 8.261107642727847e-06, "loss": 2.1363, "step": 478690 }, { "epoch": 0.83, "learning_rate": 8.260235702801019e-06, "loss": 2.2591, "step": 478700 }, { "epoch": 0.83, "learning_rate": 8.259363762874193e-06, "loss": 2.2295, "step": 478710 }, { "epoch": 0.83, "learning_rate": 8.258491822947367e-06, "loss": 2.3495, "step": 478720 }, { "epoch": 0.83, "learning_rate": 8.25761988302054e-06, "loss": 2.2862, "step": 478730 }, { "epoch": 0.83, "learning_rate": 8.256747943093714e-06, "loss": 2.1563, "step": 478740 }, { "epoch": 0.83, "learning_rate": 8.255876003166886e-06, "loss": 2.1802, "step": 478750 }, { "epoch": 0.83, "learning_rate": 8.25500406324006e-06, "loss": 2.3687, "step": 478760 }, { "epoch": 0.83, "learning_rate": 8.254132123313232e-06, "loss": 2.2936, "step": 478770 }, { "epoch": 0.83, "learning_rate": 8.253260183386406e-06, "loss": 2.1319, "step": 478780 }, { "epoch": 0.83, "learning_rate": 8.252388243459578e-06, "loss": 2.3441, "step": 478790 }, { "epoch": 0.83, "learning_rate": 8.251516303532753e-06, "loss": 2.3238, "step": 478800 }, { "epoch": 0.83, "learning_rate": 8.250644363605925e-06, "loss": 2.278, "step": 478810 }, { "epoch": 0.84, "learning_rate": 8.249772423679099e-06, "loss": 2.1985, "step": 478820 }, { "epoch": 0.84, "learning_rate": 8.248900483752271e-06, "loss": 2.233, "step": 478830 }, { "epoch": 0.84, "learning_rate": 8.248028543825445e-06, "loss": 2.3235, "step": 478840 }, { "epoch": 0.84, "learning_rate": 8.247156603898617e-06, "loss": 2.1668, "step": 478850 }, { "epoch": 0.84, "learning_rate": 8.24628466397179e-06, "loss": 2.2312, "step": 478860 }, { "epoch": 0.84, "learning_rate": 8.245412724044965e-06, "loss": 2.3197, "step": 478870 }, { "epoch": 0.84, "learning_rate": 8.244540784118138e-06, "loss": 2.2555, "step": 478880 }, { "epoch": 0.84, "learning_rate": 8.243668844191312e-06, "loss": 2.3698, "step": 478890 }, { "epoch": 0.84, "learning_rate": 8.242796904264484e-06, "loss": 2.2259, "step": 478900 }, { "epoch": 0.84, "learning_rate": 8.241924964337658e-06, "loss": 2.2431, "step": 478910 }, { "epoch": 0.84, "learning_rate": 8.24105302441083e-06, "loss": 2.239, "step": 478920 }, { "epoch": 0.84, "learning_rate": 8.240181084484004e-06, "loss": 2.2925, "step": 478930 }, { "epoch": 0.84, "learning_rate": 8.239309144557176e-06, "loss": 2.343, "step": 478940 }, { "epoch": 0.84, "learning_rate": 8.23843720463035e-06, "loss": 2.3523, "step": 478950 }, { "epoch": 0.84, "learning_rate": 8.237565264703523e-06, "loss": 2.3002, "step": 478960 }, { "epoch": 0.84, "learning_rate": 8.236693324776697e-06, "loss": 2.3588, "step": 478970 }, { "epoch": 0.84, "learning_rate": 8.23582138484987e-06, "loss": 2.1823, "step": 478980 }, { "epoch": 0.84, "learning_rate": 8.234949444923043e-06, "loss": 2.2792, "step": 478990 }, { "epoch": 0.84, "learning_rate": 8.234077504996217e-06, "loss": 2.2282, "step": 479000 }, { "epoch": 0.84, "learning_rate": 8.233205565069389e-06, "loss": 2.336, "step": 479010 }, { "epoch": 0.84, "learning_rate": 8.232333625142563e-06, "loss": 2.2917, "step": 479020 }, { "epoch": 0.84, "learning_rate": 8.231461685215735e-06, "loss": 2.2895, "step": 479030 }, { "epoch": 0.84, "learning_rate": 8.23058974528891e-06, "loss": 2.3257, "step": 479040 }, { "epoch": 0.84, "learning_rate": 8.229717805362082e-06, "loss": 2.2136, "step": 479050 }, { "epoch": 0.84, "learning_rate": 8.228845865435256e-06, "loss": 2.2063, "step": 479060 }, { "epoch": 0.84, "learning_rate": 8.227973925508428e-06, "loss": 2.2674, "step": 479070 }, { "epoch": 0.84, "learning_rate": 8.227101985581602e-06, "loss": 2.2509, "step": 479080 }, { "epoch": 0.84, "learning_rate": 8.226230045654774e-06, "loss": 2.2859, "step": 479090 }, { "epoch": 0.84, "learning_rate": 8.225358105727948e-06, "loss": 2.2561, "step": 479100 }, { "epoch": 0.84, "learning_rate": 8.224486165801122e-06, "loss": 2.1093, "step": 479110 }, { "epoch": 0.84, "learning_rate": 8.223614225874295e-06, "loss": 2.357, "step": 479120 }, { "epoch": 0.84, "learning_rate": 8.222742285947469e-06, "loss": 2.2259, "step": 479130 }, { "epoch": 0.84, "learning_rate": 8.221870346020641e-06, "loss": 2.1955, "step": 479140 }, { "epoch": 0.84, "learning_rate": 8.220998406093815e-06, "loss": 2.331, "step": 479150 }, { "epoch": 0.84, "learning_rate": 8.220126466166987e-06, "loss": 2.2185, "step": 479160 }, { "epoch": 0.84, "learning_rate": 8.21925452624016e-06, "loss": 2.1674, "step": 479170 }, { "epoch": 0.84, "learning_rate": 8.218382586313333e-06, "loss": 2.3092, "step": 479180 }, { "epoch": 0.84, "learning_rate": 8.217510646386507e-06, "loss": 2.2708, "step": 479190 }, { "epoch": 0.84, "learning_rate": 8.21663870645968e-06, "loss": 2.1897, "step": 479200 }, { "epoch": 0.84, "learning_rate": 8.215766766532854e-06, "loss": 2.3107, "step": 479210 }, { "epoch": 0.84, "learning_rate": 8.214894826606026e-06, "loss": 2.2706, "step": 479220 }, { "epoch": 0.84, "learning_rate": 8.2140228866792e-06, "loss": 2.2763, "step": 479230 }, { "epoch": 0.84, "learning_rate": 8.213150946752372e-06, "loss": 2.3406, "step": 479240 }, { "epoch": 0.84, "learning_rate": 8.212279006825546e-06, "loss": 2.2266, "step": 479250 }, { "epoch": 0.84, "learning_rate": 8.21140706689872e-06, "loss": 2.3253, "step": 479260 }, { "epoch": 0.84, "learning_rate": 8.210535126971892e-06, "loss": 2.2217, "step": 479270 }, { "epoch": 0.84, "learning_rate": 8.209663187045067e-06, "loss": 2.402, "step": 479280 }, { "epoch": 0.84, "learning_rate": 8.20879124711824e-06, "loss": 2.2318, "step": 479290 }, { "epoch": 0.84, "learning_rate": 8.207919307191413e-06, "loss": 2.3104, "step": 479300 }, { "epoch": 0.84, "learning_rate": 8.207047367264585e-06, "loss": 2.3706, "step": 479310 }, { "epoch": 0.84, "learning_rate": 8.206175427337759e-06, "loss": 2.2574, "step": 479320 }, { "epoch": 0.84, "learning_rate": 8.205303487410931e-06, "loss": 2.314, "step": 479330 }, { "epoch": 0.84, "learning_rate": 8.204431547484105e-06, "loss": 2.3643, "step": 479340 }, { "epoch": 0.84, "learning_rate": 8.203559607557278e-06, "loss": 2.2655, "step": 479350 }, { "epoch": 0.84, "learning_rate": 8.202687667630452e-06, "loss": 2.3429, "step": 479360 }, { "epoch": 0.84, "learning_rate": 8.201815727703624e-06, "loss": 2.2724, "step": 479370 }, { "epoch": 0.84, "learning_rate": 8.200943787776798e-06, "loss": 2.2427, "step": 479380 }, { "epoch": 0.84, "learning_rate": 8.20007184784997e-06, "loss": 2.2363, "step": 479390 }, { "epoch": 0.84, "learning_rate": 8.199199907923144e-06, "loss": 2.2567, "step": 479400 }, { "epoch": 0.84, "learning_rate": 8.198327967996318e-06, "loss": 2.3317, "step": 479410 }, { "epoch": 0.84, "learning_rate": 8.19745602806949e-06, "loss": 2.2863, "step": 479420 }, { "epoch": 0.84, "learning_rate": 8.196584088142664e-06, "loss": 2.2565, "step": 479430 }, { "epoch": 0.84, "learning_rate": 8.195712148215837e-06, "loss": 2.2854, "step": 479440 }, { "epoch": 0.84, "learning_rate": 8.194840208289011e-06, "loss": 2.2641, "step": 479450 }, { "epoch": 0.84, "learning_rate": 8.193968268362183e-06, "loss": 2.1641, "step": 479460 }, { "epoch": 0.84, "learning_rate": 8.193096328435357e-06, "loss": 2.3432, "step": 479470 }, { "epoch": 0.84, "learning_rate": 8.192224388508529e-06, "loss": 2.3654, "step": 479480 }, { "epoch": 0.84, "learning_rate": 8.191352448581703e-06, "loss": 2.3545, "step": 479490 }, { "epoch": 0.84, "learning_rate": 8.190480508654875e-06, "loss": 2.2171, "step": 479500 }, { "epoch": 0.84, "learning_rate": 8.189608568728049e-06, "loss": 2.2121, "step": 479510 }, { "epoch": 0.84, "learning_rate": 8.188736628801222e-06, "loss": 2.252, "step": 479520 }, { "epoch": 0.84, "learning_rate": 8.187864688874396e-06, "loss": 2.2926, "step": 479530 }, { "epoch": 0.84, "learning_rate": 8.18699274894757e-06, "loss": 2.2659, "step": 479540 }, { "epoch": 0.84, "learning_rate": 8.186120809020742e-06, "loss": 2.2368, "step": 479550 }, { "epoch": 0.84, "learning_rate": 8.185248869093916e-06, "loss": 2.1699, "step": 479560 }, { "epoch": 0.84, "learning_rate": 8.184376929167088e-06, "loss": 2.1985, "step": 479570 }, { "epoch": 0.84, "learning_rate": 8.183504989240262e-06, "loss": 2.38, "step": 479580 }, { "epoch": 0.84, "learning_rate": 8.182633049313435e-06, "loss": 2.3618, "step": 479590 }, { "epoch": 0.84, "learning_rate": 8.181761109386609e-06, "loss": 2.1832, "step": 479600 }, { "epoch": 0.84, "learning_rate": 8.180889169459781e-06, "loss": 2.3349, "step": 479610 }, { "epoch": 0.84, "learning_rate": 8.180017229532955e-06, "loss": 2.2448, "step": 479620 }, { "epoch": 0.84, "learning_rate": 8.179145289606127e-06, "loss": 2.3394, "step": 479630 }, { "epoch": 0.84, "learning_rate": 8.1782733496793e-06, "loss": 2.1557, "step": 479640 }, { "epoch": 0.84, "learning_rate": 8.177401409752473e-06, "loss": 2.3075, "step": 479650 }, { "epoch": 0.84, "learning_rate": 8.176529469825647e-06, "loss": 2.3287, "step": 479660 }, { "epoch": 0.84, "learning_rate": 8.17565752989882e-06, "loss": 2.2642, "step": 479670 }, { "epoch": 0.84, "learning_rate": 8.174785589971994e-06, "loss": 2.2515, "step": 479680 }, { "epoch": 0.84, "learning_rate": 8.173913650045168e-06, "loss": 2.207, "step": 479690 }, { "epoch": 0.84, "learning_rate": 8.17304171011834e-06, "loss": 2.1875, "step": 479700 }, { "epoch": 0.84, "learning_rate": 8.172169770191514e-06, "loss": 2.2395, "step": 479710 }, { "epoch": 0.84, "learning_rate": 8.171297830264686e-06, "loss": 2.1905, "step": 479720 }, { "epoch": 0.84, "learning_rate": 8.17042589033786e-06, "loss": 2.1485, "step": 479730 }, { "epoch": 0.84, "learning_rate": 8.169553950411032e-06, "loss": 2.2559, "step": 479740 }, { "epoch": 0.84, "learning_rate": 8.168682010484206e-06, "loss": 2.2627, "step": 479750 }, { "epoch": 0.84, "learning_rate": 8.16781007055738e-06, "loss": 2.2057, "step": 479760 }, { "epoch": 0.84, "learning_rate": 8.166938130630553e-06, "loss": 2.2042, "step": 479770 }, { "epoch": 0.84, "learning_rate": 8.166066190703725e-06, "loss": 2.3729, "step": 479780 }, { "epoch": 0.84, "learning_rate": 8.165194250776899e-06, "loss": 2.2418, "step": 479790 }, { "epoch": 0.84, "learning_rate": 8.164322310850073e-06, "loss": 2.2083, "step": 479800 }, { "epoch": 0.84, "learning_rate": 8.163450370923245e-06, "loss": 2.2266, "step": 479810 }, { "epoch": 0.84, "learning_rate": 8.162578430996419e-06, "loss": 2.2944, "step": 479820 }, { "epoch": 0.84, "learning_rate": 8.16170649106959e-06, "loss": 2.3304, "step": 479830 }, { "epoch": 0.84, "learning_rate": 8.160834551142766e-06, "loss": 2.2266, "step": 479840 }, { "epoch": 0.84, "learning_rate": 8.159962611215938e-06, "loss": 2.2574, "step": 479850 }, { "epoch": 0.84, "learning_rate": 8.159090671289112e-06, "loss": 2.3289, "step": 479860 }, { "epoch": 0.84, "learning_rate": 8.158218731362284e-06, "loss": 2.1495, "step": 479870 }, { "epoch": 0.84, "learning_rate": 8.157346791435458e-06, "loss": 2.2967, "step": 479880 }, { "epoch": 0.84, "learning_rate": 8.15647485150863e-06, "loss": 2.2817, "step": 479890 }, { "epoch": 0.84, "learning_rate": 8.155602911581804e-06, "loss": 2.2873, "step": 479900 }, { "epoch": 0.84, "learning_rate": 8.154730971654977e-06, "loss": 2.3343, "step": 479910 }, { "epoch": 0.84, "learning_rate": 8.153859031728151e-06, "loss": 2.1899, "step": 479920 }, { "epoch": 0.84, "learning_rate": 8.152987091801325e-06, "loss": 2.2454, "step": 479930 }, { "epoch": 0.84, "learning_rate": 8.152115151874497e-06, "loss": 2.1721, "step": 479940 }, { "epoch": 0.84, "learning_rate": 8.15124321194767e-06, "loss": 2.2329, "step": 479950 }, { "epoch": 0.84, "learning_rate": 8.150371272020843e-06, "loss": 2.3818, "step": 479960 }, { "epoch": 0.84, "learning_rate": 8.149499332094017e-06, "loss": 2.2541, "step": 479970 }, { "epoch": 0.84, "learning_rate": 8.148627392167189e-06, "loss": 2.3348, "step": 479980 }, { "epoch": 0.84, "learning_rate": 8.147755452240362e-06, "loss": 2.2227, "step": 479990 }, { "epoch": 0.84, "learning_rate": 8.146883512313536e-06, "loss": 2.1823, "step": 480000 }, { "epoch": 0.84, "learning_rate": 8.14601157238671e-06, "loss": 2.2014, "step": 480010 }, { "epoch": 0.84, "learning_rate": 8.145139632459882e-06, "loss": 2.346, "step": 480020 }, { "epoch": 0.84, "learning_rate": 8.144267692533056e-06, "loss": 2.265, "step": 480030 }, { "epoch": 0.84, "learning_rate": 8.143395752606228e-06, "loss": 2.3703, "step": 480040 }, { "epoch": 0.84, "learning_rate": 8.142523812679402e-06, "loss": 2.1757, "step": 480050 }, { "epoch": 0.84, "learning_rate": 8.141651872752575e-06, "loss": 2.2442, "step": 480060 }, { "epoch": 0.84, "learning_rate": 8.140779932825748e-06, "loss": 2.3107, "step": 480070 }, { "epoch": 0.84, "learning_rate": 8.139907992898923e-06, "loss": 2.1683, "step": 480080 }, { "epoch": 0.84, "learning_rate": 8.139036052972095e-06, "loss": 2.3207, "step": 480090 }, { "epoch": 0.84, "learning_rate": 8.138164113045269e-06, "loss": 2.2354, "step": 480100 }, { "epoch": 0.84, "learning_rate": 8.137292173118441e-06, "loss": 2.2828, "step": 480110 }, { "epoch": 0.84, "learning_rate": 8.136420233191615e-06, "loss": 2.3285, "step": 480120 }, { "epoch": 0.84, "learning_rate": 8.135548293264787e-06, "loss": 2.2609, "step": 480130 }, { "epoch": 0.84, "learning_rate": 8.13467635333796e-06, "loss": 2.2757, "step": 480140 }, { "epoch": 0.84, "learning_rate": 8.133804413411134e-06, "loss": 2.2774, "step": 480150 }, { "epoch": 0.84, "learning_rate": 8.132932473484308e-06, "loss": 2.2263, "step": 480160 }, { "epoch": 0.84, "learning_rate": 8.13206053355748e-06, "loss": 2.2212, "step": 480170 }, { "epoch": 0.84, "learning_rate": 8.131188593630654e-06, "loss": 2.363, "step": 480180 }, { "epoch": 0.84, "learning_rate": 8.130316653703828e-06, "loss": 2.2706, "step": 480190 }, { "epoch": 0.84, "learning_rate": 8.129444713777e-06, "loss": 2.3416, "step": 480200 }, { "epoch": 0.84, "learning_rate": 8.128572773850174e-06, "loss": 2.2542, "step": 480210 }, { "epoch": 0.84, "learning_rate": 8.127700833923346e-06, "loss": 2.3508, "step": 480220 }, { "epoch": 0.84, "learning_rate": 8.12682889399652e-06, "loss": 2.2711, "step": 480230 }, { "epoch": 0.84, "learning_rate": 8.125956954069693e-06, "loss": 2.3115, "step": 480240 }, { "epoch": 0.84, "learning_rate": 8.125085014142867e-06, "loss": 2.2974, "step": 480250 }, { "epoch": 0.84, "learning_rate": 8.124213074216039e-06, "loss": 2.1337, "step": 480260 }, { "epoch": 0.84, "learning_rate": 8.123341134289213e-06, "loss": 2.3016, "step": 480270 }, { "epoch": 0.84, "learning_rate": 8.122469194362385e-06, "loss": 2.1987, "step": 480280 }, { "epoch": 0.84, "learning_rate": 8.121597254435559e-06, "loss": 2.1943, "step": 480290 }, { "epoch": 0.84, "learning_rate": 8.12072531450873e-06, "loss": 2.2346, "step": 480300 }, { "epoch": 0.84, "learning_rate": 8.119853374581904e-06, "loss": 2.2797, "step": 480310 }, { "epoch": 0.84, "learning_rate": 8.118981434655078e-06, "loss": 2.2062, "step": 480320 }, { "epoch": 0.84, "learning_rate": 8.118109494728252e-06, "loss": 2.3208, "step": 480330 }, { "epoch": 0.84, "learning_rate": 8.117237554801426e-06, "loss": 2.2687, "step": 480340 }, { "epoch": 0.84, "learning_rate": 8.116365614874598e-06, "loss": 2.292, "step": 480350 }, { "epoch": 0.84, "learning_rate": 8.115493674947772e-06, "loss": 2.2818, "step": 480360 }, { "epoch": 0.84, "learning_rate": 8.114621735020944e-06, "loss": 2.2127, "step": 480370 }, { "epoch": 0.84, "learning_rate": 8.113749795094117e-06, "loss": 2.329, "step": 480380 }, { "epoch": 0.84, "learning_rate": 8.112877855167291e-06, "loss": 2.2776, "step": 480390 }, { "epoch": 0.84, "learning_rate": 8.112005915240465e-06, "loss": 2.2102, "step": 480400 }, { "epoch": 0.84, "learning_rate": 8.111133975313637e-06, "loss": 2.2094, "step": 480410 }, { "epoch": 0.84, "learning_rate": 8.11026203538681e-06, "loss": 2.3016, "step": 480420 }, { "epoch": 0.84, "learning_rate": 8.109390095459983e-06, "loss": 2.14, "step": 480430 }, { "epoch": 0.84, "learning_rate": 8.108518155533157e-06, "loss": 2.3096, "step": 480440 }, { "epoch": 0.84, "learning_rate": 8.107646215606329e-06, "loss": 2.1247, "step": 480450 }, { "epoch": 0.84, "learning_rate": 8.106774275679503e-06, "loss": 2.2972, "step": 480460 }, { "epoch": 0.84, "learning_rate": 8.105902335752676e-06, "loss": 2.1919, "step": 480470 }, { "epoch": 0.84, "learning_rate": 8.10503039582585e-06, "loss": 2.2875, "step": 480480 }, { "epoch": 0.84, "learning_rate": 8.104158455899024e-06, "loss": 2.2854, "step": 480490 }, { "epoch": 0.84, "learning_rate": 8.103286515972196e-06, "loss": 2.2843, "step": 480500 }, { "epoch": 0.84, "learning_rate": 8.10241457604537e-06, "loss": 2.305, "step": 480510 }, { "epoch": 0.84, "learning_rate": 8.101542636118542e-06, "loss": 2.2146, "step": 480520 }, { "epoch": 0.84, "learning_rate": 8.100670696191716e-06, "loss": 2.3983, "step": 480530 }, { "epoch": 0.84, "learning_rate": 8.099798756264888e-06, "loss": 2.3358, "step": 480540 }, { "epoch": 0.84, "learning_rate": 8.098926816338061e-06, "loss": 2.3233, "step": 480550 }, { "epoch": 0.84, "learning_rate": 8.098054876411235e-06, "loss": 2.3578, "step": 480560 }, { "epoch": 0.84, "learning_rate": 8.097182936484409e-06, "loss": 2.2986, "step": 480570 }, { "epoch": 0.84, "learning_rate": 8.096310996557581e-06, "loss": 2.2543, "step": 480580 }, { "epoch": 0.84, "learning_rate": 8.095439056630755e-06, "loss": 2.3527, "step": 480590 }, { "epoch": 0.84, "learning_rate": 8.094567116703929e-06, "loss": 2.1944, "step": 480600 }, { "epoch": 0.84, "learning_rate": 8.0936951767771e-06, "loss": 2.2564, "step": 480610 }, { "epoch": 0.84, "learning_rate": 8.092823236850274e-06, "loss": 2.3215, "step": 480620 }, { "epoch": 0.84, "learning_rate": 8.091951296923448e-06, "loss": 2.4512, "step": 480630 }, { "epoch": 0.84, "learning_rate": 8.091079356996622e-06, "loss": 2.4279, "step": 480640 }, { "epoch": 0.84, "learning_rate": 8.090207417069794e-06, "loss": 2.212, "step": 480650 }, { "epoch": 0.84, "learning_rate": 8.089335477142968e-06, "loss": 2.2486, "step": 480660 }, { "epoch": 0.84, "learning_rate": 8.08846353721614e-06, "loss": 2.2339, "step": 480670 }, { "epoch": 0.84, "learning_rate": 8.087591597289314e-06, "loss": 2.2987, "step": 480680 }, { "epoch": 0.84, "learning_rate": 8.086719657362486e-06, "loss": 2.1942, "step": 480690 }, { "epoch": 0.84, "learning_rate": 8.08584771743566e-06, "loss": 2.3314, "step": 480700 }, { "epoch": 0.84, "learning_rate": 8.084975777508833e-06, "loss": 2.2799, "step": 480710 }, { "epoch": 0.84, "learning_rate": 8.084103837582007e-06, "loss": 2.2056, "step": 480720 }, { "epoch": 0.84, "learning_rate": 8.08323189765518e-06, "loss": 2.3055, "step": 480730 }, { "epoch": 0.84, "learning_rate": 8.082359957728353e-06, "loss": 2.3243, "step": 480740 }, { "epoch": 0.84, "learning_rate": 8.081488017801527e-06, "loss": 2.2711, "step": 480750 }, { "epoch": 0.84, "learning_rate": 8.080616077874699e-06, "loss": 2.1675, "step": 480760 }, { "epoch": 0.84, "learning_rate": 8.079744137947872e-06, "loss": 2.3482, "step": 480770 }, { "epoch": 0.84, "learning_rate": 8.078872198021045e-06, "loss": 2.3446, "step": 480780 }, { "epoch": 0.84, "learning_rate": 8.078000258094218e-06, "loss": 2.3303, "step": 480790 }, { "epoch": 0.84, "learning_rate": 8.077128318167392e-06, "loss": 1.9281, "step": 480800 }, { "epoch": 0.84, "learning_rate": 8.076256378240566e-06, "loss": 2.3201, "step": 480810 }, { "epoch": 0.84, "learning_rate": 8.075384438313738e-06, "loss": 2.2839, "step": 480820 }, { "epoch": 0.84, "learning_rate": 8.074512498386912e-06, "loss": 2.2934, "step": 480830 }, { "epoch": 0.84, "learning_rate": 8.073640558460084e-06, "loss": 2.193, "step": 480840 }, { "epoch": 0.84, "learning_rate": 8.072768618533258e-06, "loss": 2.3585, "step": 480850 }, { "epoch": 0.84, "learning_rate": 8.071896678606431e-06, "loss": 2.2978, "step": 480860 }, { "epoch": 0.84, "learning_rate": 8.071024738679605e-06, "loss": 2.1496, "step": 480870 }, { "epoch": 0.84, "learning_rate": 8.070152798752779e-06, "loss": 2.2767, "step": 480880 }, { "epoch": 0.84, "learning_rate": 8.069280858825951e-06, "loss": 2.2877, "step": 480890 }, { "epoch": 0.84, "learning_rate": 8.068408918899125e-06, "loss": 2.3053, "step": 480900 }, { "epoch": 0.84, "learning_rate": 8.067536978972297e-06, "loss": 2.3108, "step": 480910 }, { "epoch": 0.84, "learning_rate": 8.06666503904547e-06, "loss": 2.2701, "step": 480920 }, { "epoch": 0.84, "learning_rate": 8.065793099118643e-06, "loss": 2.311, "step": 480930 }, { "epoch": 0.84, "learning_rate": 8.064921159191816e-06, "loss": 2.3655, "step": 480940 }, { "epoch": 0.84, "learning_rate": 8.06404921926499e-06, "loss": 2.2268, "step": 480950 }, { "epoch": 0.84, "learning_rate": 8.063177279338164e-06, "loss": 2.2901, "step": 480960 }, { "epoch": 0.84, "learning_rate": 8.062305339411336e-06, "loss": 2.3973, "step": 480970 }, { "epoch": 0.84, "learning_rate": 8.06143339948451e-06, "loss": 2.2896, "step": 480980 }, { "epoch": 0.84, "learning_rate": 8.060561459557684e-06, "loss": 2.3095, "step": 480990 }, { "epoch": 0.84, "learning_rate": 8.059689519630856e-06, "loss": 2.2738, "step": 481000 }, { "epoch": 0.84, "learning_rate": 8.05881757970403e-06, "loss": 2.2752, "step": 481010 }, { "epoch": 0.84, "learning_rate": 8.057945639777201e-06, "loss": 2.2745, "step": 481020 }, { "epoch": 0.84, "learning_rate": 8.057073699850375e-06, "loss": 2.3201, "step": 481030 }, { "epoch": 0.84, "learning_rate": 8.056201759923549e-06, "loss": 2.2116, "step": 481040 }, { "epoch": 0.84, "learning_rate": 8.055329819996723e-06, "loss": 2.1865, "step": 481050 }, { "epoch": 0.84, "learning_rate": 8.054457880069895e-06, "loss": 2.3133, "step": 481060 }, { "epoch": 0.84, "learning_rate": 8.053585940143069e-06, "loss": 2.3008, "step": 481070 }, { "epoch": 0.84, "learning_rate": 8.05271400021624e-06, "loss": 2.2959, "step": 481080 }, { "epoch": 0.84, "learning_rate": 8.051842060289414e-06, "loss": 2.2652, "step": 481090 }, { "epoch": 0.84, "learning_rate": 8.050970120362587e-06, "loss": 2.2254, "step": 481100 }, { "epoch": 0.84, "learning_rate": 8.05009818043576e-06, "loss": 2.1458, "step": 481110 }, { "epoch": 0.84, "learning_rate": 8.049226240508934e-06, "loss": 2.2771, "step": 481120 }, { "epoch": 0.84, "learning_rate": 8.048354300582108e-06, "loss": 2.3495, "step": 481130 }, { "epoch": 0.84, "learning_rate": 8.047482360655282e-06, "loss": 2.2648, "step": 481140 }, { "epoch": 0.84, "learning_rate": 8.046610420728454e-06, "loss": 2.2246, "step": 481150 }, { "epoch": 0.84, "learning_rate": 8.045738480801627e-06, "loss": 2.3191, "step": 481160 }, { "epoch": 0.84, "learning_rate": 8.0448665408748e-06, "loss": 2.2598, "step": 481170 }, { "epoch": 0.84, "learning_rate": 8.043994600947973e-06, "loss": 2.2898, "step": 481180 }, { "epoch": 0.84, "learning_rate": 8.043122661021147e-06, "loss": 2.395, "step": 481190 }, { "epoch": 0.84, "learning_rate": 8.042250721094321e-06, "loss": 2.2812, "step": 481200 }, { "epoch": 0.84, "learning_rate": 8.041378781167493e-06, "loss": 2.2365, "step": 481210 }, { "epoch": 0.84, "learning_rate": 8.040506841240667e-06, "loss": 2.2365, "step": 481220 }, { "epoch": 0.84, "learning_rate": 8.039634901313839e-06, "loss": 2.2912, "step": 481230 }, { "epoch": 0.84, "learning_rate": 8.038762961387013e-06, "loss": 2.3764, "step": 481240 }, { "epoch": 0.84, "learning_rate": 8.037891021460185e-06, "loss": 2.3605, "step": 481250 }, { "epoch": 0.84, "learning_rate": 8.037019081533358e-06, "loss": 2.3166, "step": 481260 }, { "epoch": 0.84, "learning_rate": 8.036147141606532e-06, "loss": 2.1232, "step": 481270 }, { "epoch": 0.84, "learning_rate": 8.035275201679706e-06, "loss": 2.2318, "step": 481280 }, { "epoch": 0.84, "learning_rate": 8.03440326175288e-06, "loss": 2.3441, "step": 481290 }, { "epoch": 0.84, "learning_rate": 8.033531321826052e-06, "loss": 2.2046, "step": 481300 }, { "epoch": 0.84, "learning_rate": 8.032659381899226e-06, "loss": 2.367, "step": 481310 }, { "epoch": 0.84, "learning_rate": 8.031787441972398e-06, "loss": 2.3114, "step": 481320 }, { "epoch": 0.84, "learning_rate": 8.030915502045571e-06, "loss": 2.3023, "step": 481330 }, { "epoch": 0.84, "learning_rate": 8.030043562118743e-06, "loss": 2.4063, "step": 481340 }, { "epoch": 0.84, "learning_rate": 8.029171622191917e-06, "loss": 2.2693, "step": 481350 }, { "epoch": 0.84, "learning_rate": 8.028299682265091e-06, "loss": 2.2747, "step": 481360 }, { "epoch": 0.84, "learning_rate": 8.027427742338265e-06, "loss": 2.2194, "step": 481370 }, { "epoch": 0.84, "learning_rate": 8.026555802411437e-06, "loss": 2.2243, "step": 481380 }, { "epoch": 0.84, "learning_rate": 8.02568386248461e-06, "loss": 2.1601, "step": 481390 }, { "epoch": 0.84, "learning_rate": 8.024811922557784e-06, "loss": 2.2541, "step": 481400 }, { "epoch": 0.84, "learning_rate": 8.023939982630956e-06, "loss": 2.2709, "step": 481410 }, { "epoch": 0.84, "learning_rate": 8.02306804270413e-06, "loss": 2.3189, "step": 481420 }, { "epoch": 0.84, "learning_rate": 8.022196102777304e-06, "loss": 2.2071, "step": 481430 }, { "epoch": 0.84, "learning_rate": 8.021324162850478e-06, "loss": 2.2273, "step": 481440 }, { "epoch": 0.84, "learning_rate": 8.02045222292365e-06, "loss": 2.2075, "step": 481450 }, { "epoch": 0.84, "learning_rate": 8.019580282996824e-06, "loss": 2.2585, "step": 481460 }, { "epoch": 0.84, "learning_rate": 8.018708343069996e-06, "loss": 2.3204, "step": 481470 }, { "epoch": 0.84, "learning_rate": 8.01783640314317e-06, "loss": 2.2644, "step": 481480 }, { "epoch": 0.84, "learning_rate": 8.016964463216342e-06, "loss": 2.3325, "step": 481490 }, { "epoch": 0.84, "learning_rate": 8.016092523289515e-06, "loss": 2.2745, "step": 481500 }, { "epoch": 0.84, "learning_rate": 8.015220583362689e-06, "loss": 2.2637, "step": 481510 }, { "epoch": 0.84, "learning_rate": 8.014348643435863e-06, "loss": 2.2673, "step": 481520 }, { "epoch": 0.84, "learning_rate": 8.013476703509037e-06, "loss": 2.246, "step": 481530 }, { "epoch": 0.84, "learning_rate": 8.012604763582209e-06, "loss": 2.2795, "step": 481540 }, { "epoch": 0.84, "learning_rate": 8.011732823655382e-06, "loss": 2.378, "step": 481550 }, { "epoch": 0.84, "learning_rate": 8.010860883728555e-06, "loss": 2.2295, "step": 481560 }, { "epoch": 0.84, "learning_rate": 8.009988943801728e-06, "loss": 2.2412, "step": 481570 }, { "epoch": 0.84, "learning_rate": 8.0091170038749e-06, "loss": 2.2282, "step": 481580 }, { "epoch": 0.84, "learning_rate": 8.008245063948074e-06, "loss": 2.1999, "step": 481590 }, { "epoch": 0.84, "learning_rate": 8.007373124021248e-06, "loss": 2.3233, "step": 481600 }, { "epoch": 0.84, "learning_rate": 8.006501184094422e-06, "loss": 2.3583, "step": 481610 }, { "epoch": 0.84, "learning_rate": 8.005629244167594e-06, "loss": 2.2688, "step": 481620 }, { "epoch": 0.84, "learning_rate": 8.004757304240768e-06, "loss": 2.3588, "step": 481630 }, { "epoch": 0.84, "learning_rate": 8.00388536431394e-06, "loss": 2.2733, "step": 481640 }, { "epoch": 0.84, "learning_rate": 8.003013424387113e-06, "loss": 2.2679, "step": 481650 }, { "epoch": 0.84, "learning_rate": 8.002141484460287e-06, "loss": 2.2973, "step": 481660 }, { "epoch": 0.84, "learning_rate": 8.001269544533461e-06, "loss": 2.2765, "step": 481670 }, { "epoch": 0.84, "learning_rate": 8.000397604606635e-06, "loss": 2.2661, "step": 481680 }, { "epoch": 0.84, "learning_rate": 7.999525664679807e-06, "loss": 2.2016, "step": 481690 }, { "epoch": 0.84, "learning_rate": 7.99865372475298e-06, "loss": 2.2232, "step": 481700 }, { "epoch": 0.84, "learning_rate": 7.997781784826153e-06, "loss": 2.4183, "step": 481710 }, { "epoch": 0.84, "learning_rate": 7.996909844899326e-06, "loss": 2.3699, "step": 481720 }, { "epoch": 0.84, "learning_rate": 7.996037904972498e-06, "loss": 2.3149, "step": 481730 }, { "epoch": 0.84, "learning_rate": 7.995165965045672e-06, "loss": 2.3297, "step": 481740 }, { "epoch": 0.84, "learning_rate": 7.994294025118846e-06, "loss": 2.3828, "step": 481750 }, { "epoch": 0.84, "learning_rate": 7.99342208519202e-06, "loss": 2.2527, "step": 481760 }, { "epoch": 0.84, "learning_rate": 7.992550145265192e-06, "loss": 2.2882, "step": 481770 }, { "epoch": 0.84, "learning_rate": 7.991678205338366e-06, "loss": 2.2035, "step": 481780 }, { "epoch": 0.84, "learning_rate": 7.99080626541154e-06, "loss": 2.3197, "step": 481790 }, { "epoch": 0.84, "learning_rate": 7.989934325484711e-06, "loss": 2.471, "step": 481800 }, { "epoch": 0.84, "learning_rate": 7.989062385557885e-06, "loss": 2.3108, "step": 481810 }, { "epoch": 0.84, "learning_rate": 7.988190445631057e-06, "loss": 2.1842, "step": 481820 }, { "epoch": 0.84, "learning_rate": 7.987318505704231e-06, "loss": 2.1747, "step": 481830 }, { "epoch": 0.84, "learning_rate": 7.986446565777405e-06, "loss": 2.3858, "step": 481840 }, { "epoch": 0.84, "learning_rate": 7.985574625850579e-06, "loss": 2.1945, "step": 481850 }, { "epoch": 0.84, "learning_rate": 7.98470268592375e-06, "loss": 2.3256, "step": 481860 }, { "epoch": 0.84, "learning_rate": 7.983830745996924e-06, "loss": 2.4069, "step": 481870 }, { "epoch": 0.84, "learning_rate": 7.982958806070097e-06, "loss": 2.3141, "step": 481880 }, { "epoch": 0.84, "learning_rate": 7.98208686614327e-06, "loss": 2.2631, "step": 481890 }, { "epoch": 0.84, "learning_rate": 7.981214926216442e-06, "loss": 2.2239, "step": 481900 }, { "epoch": 0.84, "learning_rate": 7.980342986289618e-06, "loss": 2.2283, "step": 481910 }, { "epoch": 0.84, "learning_rate": 7.979471046362792e-06, "loss": 2.1656, "step": 481920 }, { "epoch": 0.84, "learning_rate": 7.978599106435964e-06, "loss": 2.0981, "step": 481930 }, { "epoch": 0.84, "learning_rate": 7.977727166509137e-06, "loss": 2.2437, "step": 481940 }, { "epoch": 0.84, "learning_rate": 7.97685522658231e-06, "loss": 2.2785, "step": 481950 }, { "epoch": 0.84, "learning_rate": 7.975983286655483e-06, "loss": 2.2361, "step": 481960 }, { "epoch": 0.84, "learning_rate": 7.975111346728655e-06, "loss": 2.2487, "step": 481970 }, { "epoch": 0.84, "learning_rate": 7.97423940680183e-06, "loss": 2.182, "step": 481980 }, { "epoch": 0.84, "learning_rate": 7.973367466875003e-06, "loss": 2.3306, "step": 481990 }, { "epoch": 0.84, "learning_rate": 7.972495526948177e-06, "loss": 2.2524, "step": 482000 }, { "epoch": 0.84, "learning_rate": 7.971623587021349e-06, "loss": 2.2885, "step": 482010 }, { "epoch": 0.84, "learning_rate": 7.970751647094523e-06, "loss": 2.3216, "step": 482020 }, { "epoch": 0.84, "learning_rate": 7.969879707167695e-06, "loss": 2.248, "step": 482030 }, { "epoch": 0.84, "learning_rate": 7.969007767240868e-06, "loss": 2.2902, "step": 482040 }, { "epoch": 0.84, "learning_rate": 7.96813582731404e-06, "loss": 2.2923, "step": 482050 }, { "epoch": 0.84, "learning_rate": 7.967263887387214e-06, "loss": 2.3319, "step": 482060 }, { "epoch": 0.84, "learning_rate": 7.966391947460388e-06, "loss": 2.296, "step": 482070 }, { "epoch": 0.84, "learning_rate": 7.965520007533562e-06, "loss": 2.2802, "step": 482080 }, { "epoch": 0.84, "learning_rate": 7.964648067606736e-06, "loss": 2.2231, "step": 482090 }, { "epoch": 0.84, "learning_rate": 7.963776127679908e-06, "loss": 2.2073, "step": 482100 }, { "epoch": 0.84, "learning_rate": 7.962904187753081e-06, "loss": 2.2766, "step": 482110 }, { "epoch": 0.84, "learning_rate": 7.962032247826253e-06, "loss": 2.2343, "step": 482120 }, { "epoch": 0.84, "learning_rate": 7.961160307899427e-06, "loss": 2.2984, "step": 482130 }, { "epoch": 0.84, "learning_rate": 7.9602883679726e-06, "loss": 2.2662, "step": 482140 }, { "epoch": 0.84, "learning_rate": 7.959416428045773e-06, "loss": 2.2766, "step": 482150 }, { "epoch": 0.84, "learning_rate": 7.958544488118947e-06, "loss": 2.344, "step": 482160 }, { "epoch": 0.84, "learning_rate": 7.95767254819212e-06, "loss": 2.2194, "step": 482170 }, { "epoch": 0.84, "learning_rate": 7.956800608265293e-06, "loss": 2.433, "step": 482180 }, { "epoch": 0.84, "learning_rate": 7.955928668338466e-06, "loss": 2.2975, "step": 482190 }, { "epoch": 0.84, "learning_rate": 7.95505672841164e-06, "loss": 2.2771, "step": 482200 }, { "epoch": 0.84, "learning_rate": 7.954184788484812e-06, "loss": 2.3416, "step": 482210 }, { "epoch": 0.84, "learning_rate": 7.953312848557986e-06, "loss": 2.2482, "step": 482220 }, { "epoch": 0.84, "learning_rate": 7.95244090863116e-06, "loss": 2.0661, "step": 482230 }, { "epoch": 0.84, "learning_rate": 7.951568968704334e-06, "loss": 2.2038, "step": 482240 }, { "epoch": 0.84, "learning_rate": 7.950697028777506e-06, "loss": 2.1592, "step": 482250 }, { "epoch": 0.84, "learning_rate": 7.94982508885068e-06, "loss": 2.2229, "step": 482260 }, { "epoch": 0.84, "learning_rate": 7.948953148923852e-06, "loss": 2.3125, "step": 482270 }, { "epoch": 0.84, "learning_rate": 7.948081208997025e-06, "loss": 2.2692, "step": 482280 }, { "epoch": 0.84, "learning_rate": 7.947209269070197e-06, "loss": 2.1957, "step": 482290 }, { "epoch": 0.84, "learning_rate": 7.946337329143371e-06, "loss": 2.3325, "step": 482300 }, { "epoch": 0.84, "learning_rate": 7.945465389216545e-06, "loss": 2.2306, "step": 482310 }, { "epoch": 0.84, "learning_rate": 7.944593449289719e-06, "loss": 2.3139, "step": 482320 }, { "epoch": 0.84, "learning_rate": 7.943721509362892e-06, "loss": 2.2754, "step": 482330 }, { "epoch": 0.84, "learning_rate": 7.942849569436065e-06, "loss": 2.3058, "step": 482340 }, { "epoch": 0.84, "learning_rate": 7.941977629509238e-06, "loss": 2.2409, "step": 482350 }, { "epoch": 0.84, "learning_rate": 7.94110568958241e-06, "loss": 2.2294, "step": 482360 }, { "epoch": 0.84, "learning_rate": 7.940233749655584e-06, "loss": 2.478, "step": 482370 }, { "epoch": 0.84, "learning_rate": 7.939361809728756e-06, "loss": 2.2894, "step": 482380 }, { "epoch": 0.84, "learning_rate": 7.93848986980193e-06, "loss": 2.2221, "step": 482390 }, { "epoch": 0.84, "learning_rate": 7.937617929875104e-06, "loss": 2.2204, "step": 482400 }, { "epoch": 0.84, "learning_rate": 7.936745989948278e-06, "loss": 2.4318, "step": 482410 }, { "epoch": 0.84, "learning_rate": 7.93587405002145e-06, "loss": 2.1651, "step": 482420 }, { "epoch": 0.84, "learning_rate": 7.935002110094623e-06, "loss": 2.2457, "step": 482430 }, { "epoch": 0.84, "learning_rate": 7.934130170167795e-06, "loss": 2.1742, "step": 482440 }, { "epoch": 0.84, "learning_rate": 7.93325823024097e-06, "loss": 2.3201, "step": 482450 }, { "epoch": 0.84, "learning_rate": 7.932386290314143e-06, "loss": 2.2146, "step": 482460 }, { "epoch": 0.84, "learning_rate": 7.931514350387317e-06, "loss": 2.4478, "step": 482470 }, { "epoch": 0.84, "learning_rate": 7.93064241046049e-06, "loss": 2.2134, "step": 482480 }, { "epoch": 0.84, "learning_rate": 7.929770470533663e-06, "loss": 2.2311, "step": 482490 }, { "epoch": 0.84, "learning_rate": 7.928898530606836e-06, "loss": 2.2453, "step": 482500 }, { "epoch": 0.84, "learning_rate": 7.928026590680008e-06, "loss": 2.2199, "step": 482510 }, { "epoch": 0.84, "learning_rate": 7.927154650753182e-06, "loss": 2.2751, "step": 482520 }, { "epoch": 0.84, "learning_rate": 7.926282710826354e-06, "loss": 2.249, "step": 482530 }, { "epoch": 0.84, "learning_rate": 7.925410770899528e-06, "loss": 2.255, "step": 482540 }, { "epoch": 0.84, "learning_rate": 7.924538830972702e-06, "loss": 2.2289, "step": 482550 }, { "epoch": 0.84, "learning_rate": 7.923666891045876e-06, "loss": 2.2173, "step": 482560 }, { "epoch": 0.84, "learning_rate": 7.922794951119048e-06, "loss": 2.2612, "step": 482570 }, { "epoch": 0.84, "learning_rate": 7.921923011192221e-06, "loss": 2.2585, "step": 482580 }, { "epoch": 0.84, "learning_rate": 7.921051071265395e-06, "loss": 2.2574, "step": 482590 }, { "epoch": 0.84, "learning_rate": 7.920179131338567e-06, "loss": 2.3683, "step": 482600 }, { "epoch": 0.84, "learning_rate": 7.919307191411741e-06, "loss": 2.212, "step": 482610 }, { "epoch": 0.84, "learning_rate": 7.918435251484913e-06, "loss": 2.3168, "step": 482620 }, { "epoch": 0.84, "learning_rate": 7.917563311558087e-06, "loss": 2.3799, "step": 482630 }, { "epoch": 0.84, "learning_rate": 7.91669137163126e-06, "loss": 2.2189, "step": 482640 }, { "epoch": 0.84, "learning_rate": 7.915819431704434e-06, "loss": 2.1916, "step": 482650 }, { "epoch": 0.84, "learning_rate": 7.914947491777607e-06, "loss": 2.3723, "step": 482660 }, { "epoch": 0.84, "learning_rate": 7.91407555185078e-06, "loss": 2.2485, "step": 482670 }, { "epoch": 0.84, "learning_rate": 7.913203611923952e-06, "loss": 2.226, "step": 482680 }, { "epoch": 0.84, "learning_rate": 7.912331671997126e-06, "loss": 2.3607, "step": 482690 }, { "epoch": 0.84, "learning_rate": 7.911459732070298e-06, "loss": 2.244, "step": 482700 }, { "epoch": 0.84, "learning_rate": 7.910587792143474e-06, "loss": 2.2499, "step": 482710 }, { "epoch": 0.84, "learning_rate": 7.909715852216647e-06, "loss": 2.296, "step": 482720 }, { "epoch": 0.84, "learning_rate": 7.90884391228982e-06, "loss": 2.2911, "step": 482730 }, { "epoch": 0.84, "learning_rate": 7.907971972362993e-06, "loss": 2.2646, "step": 482740 }, { "epoch": 0.84, "learning_rate": 7.907100032436165e-06, "loss": 2.2111, "step": 482750 }, { "epoch": 0.84, "learning_rate": 7.90622809250934e-06, "loss": 2.3213, "step": 482760 }, { "epoch": 0.84, "learning_rate": 7.905356152582511e-06, "loss": 2.2885, "step": 482770 }, { "epoch": 0.84, "learning_rate": 7.904484212655685e-06, "loss": 2.2892, "step": 482780 }, { "epoch": 0.84, "learning_rate": 7.903612272728859e-06, "loss": 2.3201, "step": 482790 }, { "epoch": 0.84, "learning_rate": 7.902740332802033e-06, "loss": 2.264, "step": 482800 }, { "epoch": 0.84, "learning_rate": 7.901868392875205e-06, "loss": 2.2464, "step": 482810 }, { "epoch": 0.84, "learning_rate": 7.900996452948378e-06, "loss": 2.2318, "step": 482820 }, { "epoch": 0.84, "learning_rate": 7.90012451302155e-06, "loss": 2.3049, "step": 482830 }, { "epoch": 0.84, "learning_rate": 7.899252573094724e-06, "loss": 2.2443, "step": 482840 }, { "epoch": 0.84, "learning_rate": 7.898380633167898e-06, "loss": 2.4047, "step": 482850 }, { "epoch": 0.84, "learning_rate": 7.89750869324107e-06, "loss": 2.147, "step": 482860 }, { "epoch": 0.84, "learning_rate": 7.896636753314244e-06, "loss": 2.254, "step": 482870 }, { "epoch": 0.84, "learning_rate": 7.895764813387418e-06, "loss": 2.2875, "step": 482880 }, { "epoch": 0.84, "learning_rate": 7.894892873460591e-06, "loss": 2.2995, "step": 482890 }, { "epoch": 0.84, "learning_rate": 7.894020933533763e-06, "loss": 2.2593, "step": 482900 }, { "epoch": 0.84, "learning_rate": 7.893148993606937e-06, "loss": 2.2431, "step": 482910 }, { "epoch": 0.84, "learning_rate": 7.89227705368011e-06, "loss": 2.2541, "step": 482920 }, { "epoch": 0.84, "learning_rate": 7.891405113753283e-06, "loss": 2.2544, "step": 482930 }, { "epoch": 0.84, "learning_rate": 7.890533173826455e-06, "loss": 2.2175, "step": 482940 }, { "epoch": 0.84, "learning_rate": 7.88966123389963e-06, "loss": 2.2598, "step": 482950 }, { "epoch": 0.84, "learning_rate": 7.888789293972803e-06, "loss": 2.3284, "step": 482960 }, { "epoch": 0.84, "learning_rate": 7.887917354045976e-06, "loss": 2.2877, "step": 482970 }, { "epoch": 0.84, "learning_rate": 7.887045414119149e-06, "loss": 2.2957, "step": 482980 }, { "epoch": 0.84, "learning_rate": 7.886173474192322e-06, "loss": 2.264, "step": 482990 }, { "epoch": 0.84, "learning_rate": 7.885301534265496e-06, "loss": 2.2385, "step": 483000 }, { "epoch": 0.84, "learning_rate": 7.884429594338668e-06, "loss": 2.2109, "step": 483010 }, { "epoch": 0.84, "learning_rate": 7.883557654411842e-06, "loss": 2.2989, "step": 483020 }, { "epoch": 0.84, "learning_rate": 7.882685714485016e-06, "loss": 2.3738, "step": 483030 }, { "epoch": 0.84, "learning_rate": 7.88181377455819e-06, "loss": 2.1926, "step": 483040 }, { "epoch": 0.84, "learning_rate": 7.880941834631362e-06, "loss": 2.2615, "step": 483050 }, { "epoch": 0.84, "learning_rate": 7.880069894704535e-06, "loss": 2.2693, "step": 483060 }, { "epoch": 0.84, "learning_rate": 7.879197954777707e-06, "loss": 2.3208, "step": 483070 }, { "epoch": 0.84, "learning_rate": 7.878326014850881e-06, "loss": 2.1845, "step": 483080 }, { "epoch": 0.84, "learning_rate": 7.877454074924053e-06, "loss": 2.1984, "step": 483090 }, { "epoch": 0.84, "learning_rate": 7.876582134997227e-06, "loss": 2.2849, "step": 483100 }, { "epoch": 0.84, "learning_rate": 7.8757101950704e-06, "loss": 2.3199, "step": 483110 }, { "epoch": 0.84, "learning_rate": 7.874838255143575e-06, "loss": 2.2457, "step": 483120 }, { "epoch": 0.84, "learning_rate": 7.873966315216748e-06, "loss": 2.1525, "step": 483130 }, { "epoch": 0.84, "learning_rate": 7.87309437528992e-06, "loss": 2.272, "step": 483140 }, { "epoch": 0.84, "learning_rate": 7.872222435363094e-06, "loss": 2.2595, "step": 483150 }, { "epoch": 0.84, "learning_rate": 7.871350495436266e-06, "loss": 2.3661, "step": 483160 }, { "epoch": 0.84, "learning_rate": 7.87047855550944e-06, "loss": 2.2588, "step": 483170 }, { "epoch": 0.84, "learning_rate": 7.869606615582612e-06, "loss": 2.2744, "step": 483180 }, { "epoch": 0.84, "learning_rate": 7.868734675655786e-06, "loss": 2.3081, "step": 483190 }, { "epoch": 0.84, "learning_rate": 7.86786273572896e-06, "loss": 2.2567, "step": 483200 }, { "epoch": 0.84, "learning_rate": 7.866990795802133e-06, "loss": 2.202, "step": 483210 }, { "epoch": 0.84, "learning_rate": 7.866118855875305e-06, "loss": 2.2736, "step": 483220 }, { "epoch": 0.84, "learning_rate": 7.86524691594848e-06, "loss": 2.3138, "step": 483230 }, { "epoch": 0.84, "learning_rate": 7.864374976021651e-06, "loss": 2.3499, "step": 483240 }, { "epoch": 0.84, "learning_rate": 7.863503036094825e-06, "loss": 2.2265, "step": 483250 }, { "epoch": 0.84, "learning_rate": 7.862631096167999e-06, "loss": 2.3471, "step": 483260 }, { "epoch": 0.84, "learning_rate": 7.861759156241173e-06, "loss": 2.2015, "step": 483270 }, { "epoch": 0.84, "learning_rate": 7.860887216314346e-06, "loss": 2.2773, "step": 483280 }, { "epoch": 0.84, "learning_rate": 7.860015276387518e-06, "loss": 2.2228, "step": 483290 }, { "epoch": 0.84, "learning_rate": 7.859143336460692e-06, "loss": 2.1926, "step": 483300 }, { "epoch": 0.84, "learning_rate": 7.858271396533864e-06, "loss": 2.114, "step": 483310 }, { "epoch": 0.84, "learning_rate": 7.857399456607038e-06, "loss": 2.2676, "step": 483320 }, { "epoch": 0.84, "learning_rate": 7.85652751668021e-06, "loss": 2.2615, "step": 483330 }, { "epoch": 0.84, "learning_rate": 7.855655576753384e-06, "loss": 2.2116, "step": 483340 }, { "epoch": 0.84, "learning_rate": 7.854783636826558e-06, "loss": 2.2735, "step": 483350 }, { "epoch": 0.84, "learning_rate": 7.853911696899731e-06, "loss": 2.2699, "step": 483360 }, { "epoch": 0.84, "learning_rate": 7.853039756972904e-06, "loss": 2.2821, "step": 483370 }, { "epoch": 0.84, "learning_rate": 7.852167817046077e-06, "loss": 2.2151, "step": 483380 }, { "epoch": 0.84, "learning_rate": 7.851295877119251e-06, "loss": 2.2441, "step": 483390 }, { "epoch": 0.84, "learning_rate": 7.850423937192423e-06, "loss": 2.2649, "step": 483400 }, { "epoch": 0.84, "learning_rate": 7.849551997265597e-06, "loss": 2.2314, "step": 483410 }, { "epoch": 0.84, "learning_rate": 7.848680057338769e-06, "loss": 2.2964, "step": 483420 }, { "epoch": 0.84, "learning_rate": 7.847808117411943e-06, "loss": 2.2896, "step": 483430 }, { "epoch": 0.84, "learning_rate": 7.846936177485117e-06, "loss": 2.3486, "step": 483440 }, { "epoch": 0.84, "learning_rate": 7.84606423755829e-06, "loss": 2.2638, "step": 483450 }, { "epoch": 0.84, "learning_rate": 7.845192297631462e-06, "loss": 2.2792, "step": 483460 }, { "epoch": 0.84, "learning_rate": 7.844320357704636e-06, "loss": 2.274, "step": 483470 }, { "epoch": 0.84, "learning_rate": 7.843448417777808e-06, "loss": 2.2456, "step": 483480 }, { "epoch": 0.84, "learning_rate": 7.842576477850982e-06, "loss": 2.2642, "step": 483490 }, { "epoch": 0.84, "learning_rate": 7.841704537924154e-06, "loss": 2.2928, "step": 483500 }, { "epoch": 0.84, "learning_rate": 7.84083259799733e-06, "loss": 2.1762, "step": 483510 }, { "epoch": 0.84, "learning_rate": 7.839960658070503e-06, "loss": 2.2726, "step": 483520 }, { "epoch": 0.84, "learning_rate": 7.839088718143675e-06, "loss": 2.3034, "step": 483530 }, { "epoch": 0.84, "learning_rate": 7.83821677821685e-06, "loss": 2.1792, "step": 483540 }, { "epoch": 0.84, "learning_rate": 7.837344838290021e-06, "loss": 2.2649, "step": 483550 }, { "epoch": 0.84, "learning_rate": 7.836472898363195e-06, "loss": 2.2118, "step": 483560 }, { "epoch": 0.84, "learning_rate": 7.835600958436367e-06, "loss": 2.2619, "step": 483570 }, { "epoch": 0.84, "learning_rate": 7.834729018509541e-06, "loss": 2.2363, "step": 483580 }, { "epoch": 0.84, "learning_rate": 7.833857078582715e-06, "loss": 2.2621, "step": 483590 }, { "epoch": 0.84, "learning_rate": 7.832985138655888e-06, "loss": 2.3381, "step": 483600 }, { "epoch": 0.84, "learning_rate": 7.83211319872906e-06, "loss": 2.3934, "step": 483610 }, { "epoch": 0.84, "learning_rate": 7.831241258802234e-06, "loss": 2.1945, "step": 483620 }, { "epoch": 0.84, "learning_rate": 7.830369318875406e-06, "loss": 2.2771, "step": 483630 }, { "epoch": 0.84, "learning_rate": 7.82949737894858e-06, "loss": 2.1999, "step": 483640 }, { "epoch": 0.84, "learning_rate": 7.828625439021754e-06, "loss": 2.2997, "step": 483650 }, { "epoch": 0.84, "learning_rate": 7.827753499094926e-06, "loss": 2.2971, "step": 483660 }, { "epoch": 0.84, "learning_rate": 7.8268815591681e-06, "loss": 2.2908, "step": 483670 }, { "epoch": 0.84, "learning_rate": 7.826009619241273e-06, "loss": 2.1961, "step": 483680 }, { "epoch": 0.84, "learning_rate": 7.825137679314447e-06, "loss": 2.2858, "step": 483690 }, { "epoch": 0.84, "learning_rate": 7.82426573938762e-06, "loss": 2.2763, "step": 483700 }, { "epoch": 0.84, "learning_rate": 7.823393799460793e-06, "loss": 2.0637, "step": 483710 }, { "epoch": 0.84, "learning_rate": 7.822521859533965e-06, "loss": 2.2635, "step": 483720 }, { "epoch": 0.84, "learning_rate": 7.821649919607139e-06, "loss": 2.3286, "step": 483730 }, { "epoch": 0.84, "learning_rate": 7.820777979680311e-06, "loss": 2.2272, "step": 483740 }, { "epoch": 0.84, "learning_rate": 7.819906039753486e-06, "loss": 2.4018, "step": 483750 }, { "epoch": 0.84, "learning_rate": 7.819034099826659e-06, "loss": 2.3264, "step": 483760 }, { "epoch": 0.84, "learning_rate": 7.818162159899832e-06, "loss": 2.2522, "step": 483770 }, { "epoch": 0.84, "learning_rate": 7.817290219973004e-06, "loss": 2.2202, "step": 483780 }, { "epoch": 0.84, "learning_rate": 7.816418280046178e-06, "loss": 2.2429, "step": 483790 }, { "epoch": 0.84, "learning_rate": 7.815546340119352e-06, "loss": 2.269, "step": 483800 }, { "epoch": 0.84, "learning_rate": 7.814674400192524e-06, "loss": 2.3056, "step": 483810 }, { "epoch": 0.84, "learning_rate": 7.813802460265698e-06, "loss": 2.271, "step": 483820 }, { "epoch": 0.84, "learning_rate": 7.812930520338872e-06, "loss": 2.2494, "step": 483830 }, { "epoch": 0.84, "learning_rate": 7.812058580412045e-06, "loss": 2.2365, "step": 483840 }, { "epoch": 0.84, "learning_rate": 7.811186640485217e-06, "loss": 2.2356, "step": 483850 }, { "epoch": 0.84, "learning_rate": 7.810314700558391e-06, "loss": 2.2075, "step": 483860 }, { "epoch": 0.84, "learning_rate": 7.809442760631563e-06, "loss": 2.2118, "step": 483870 }, { "epoch": 0.84, "learning_rate": 7.808570820704737e-06, "loss": 2.2528, "step": 483880 }, { "epoch": 0.84, "learning_rate": 7.807698880777909e-06, "loss": 2.345, "step": 483890 }, { "epoch": 0.84, "learning_rate": 7.806826940851083e-06, "loss": 2.1163, "step": 483900 }, { "epoch": 0.84, "learning_rate": 7.805955000924257e-06, "loss": 2.1868, "step": 483910 }, { "epoch": 0.84, "learning_rate": 7.80508306099743e-06, "loss": 2.2573, "step": 483920 }, { "epoch": 0.84, "learning_rate": 7.804211121070604e-06, "loss": 2.2434, "step": 483930 }, { "epoch": 0.84, "learning_rate": 7.803339181143776e-06, "loss": 2.3736, "step": 483940 }, { "epoch": 0.84, "learning_rate": 7.80246724121695e-06, "loss": 2.2786, "step": 483950 }, { "epoch": 0.84, "learning_rate": 7.801595301290122e-06, "loss": 2.2668, "step": 483960 }, { "epoch": 0.84, "learning_rate": 7.800723361363296e-06, "loss": 2.3071, "step": 483970 }, { "epoch": 0.84, "learning_rate": 7.799851421436468e-06, "loss": 2.3283, "step": 483980 }, { "epoch": 0.84, "learning_rate": 7.798979481509643e-06, "loss": 2.2232, "step": 483990 }, { "epoch": 0.84, "learning_rate": 7.798107541582815e-06, "loss": 2.2561, "step": 484000 }, { "epoch": 0.84, "learning_rate": 7.79723560165599e-06, "loss": 2.3272, "step": 484010 }, { "epoch": 0.84, "learning_rate": 7.796363661729161e-06, "loss": 2.3263, "step": 484020 }, { "epoch": 0.84, "learning_rate": 7.795491721802335e-06, "loss": 2.3731, "step": 484030 }, { "epoch": 0.84, "learning_rate": 7.794619781875507e-06, "loss": 2.2418, "step": 484040 }, { "epoch": 0.84, "learning_rate": 7.793747841948681e-06, "loss": 2.248, "step": 484050 }, { "epoch": 0.84, "learning_rate": 7.792875902021855e-06, "loss": 2.2559, "step": 484060 }, { "epoch": 0.84, "learning_rate": 7.792003962095028e-06, "loss": 2.2633, "step": 484070 }, { "epoch": 0.84, "learning_rate": 7.791132022168202e-06, "loss": 2.3486, "step": 484080 }, { "epoch": 0.84, "learning_rate": 7.790260082241374e-06, "loss": 2.304, "step": 484090 }, { "epoch": 0.84, "learning_rate": 7.789388142314548e-06, "loss": 2.2317, "step": 484100 }, { "epoch": 0.84, "learning_rate": 7.78851620238772e-06, "loss": 2.3637, "step": 484110 }, { "epoch": 0.84, "learning_rate": 7.787644262460894e-06, "loss": 2.2878, "step": 484120 }, { "epoch": 0.84, "learning_rate": 7.786772322534066e-06, "loss": 2.3091, "step": 484130 }, { "epoch": 0.84, "learning_rate": 7.78590038260724e-06, "loss": 2.2362, "step": 484140 }, { "epoch": 0.84, "learning_rate": 7.785028442680414e-06, "loss": 2.2733, "step": 484150 }, { "epoch": 0.84, "learning_rate": 7.784156502753587e-06, "loss": 2.3058, "step": 484160 }, { "epoch": 0.84, "learning_rate": 7.78328456282676e-06, "loss": 2.3175, "step": 484170 }, { "epoch": 0.84, "learning_rate": 7.782412622899933e-06, "loss": 2.3108, "step": 484180 }, { "epoch": 0.84, "learning_rate": 7.781540682973107e-06, "loss": 2.2391, "step": 484190 }, { "epoch": 0.84, "learning_rate": 7.780668743046279e-06, "loss": 2.2223, "step": 484200 }, { "epoch": 0.84, "learning_rate": 7.779796803119453e-06, "loss": 2.2976, "step": 484210 }, { "epoch": 0.84, "learning_rate": 7.778924863192625e-06, "loss": 2.3151, "step": 484220 }, { "epoch": 0.84, "learning_rate": 7.778052923265799e-06, "loss": 2.3548, "step": 484230 }, { "epoch": 0.84, "learning_rate": 7.777180983338972e-06, "loss": 2.3421, "step": 484240 }, { "epoch": 0.84, "learning_rate": 7.776309043412146e-06, "loss": 2.2165, "step": 484250 }, { "epoch": 0.84, "learning_rate": 7.775437103485318e-06, "loss": 2.2888, "step": 484260 }, { "epoch": 0.84, "learning_rate": 7.774565163558492e-06, "loss": 2.2736, "step": 484270 }, { "epoch": 0.84, "learning_rate": 7.773693223631664e-06, "loss": 2.2908, "step": 484280 }, { "epoch": 0.84, "learning_rate": 7.772821283704838e-06, "loss": 2.3298, "step": 484290 }, { "epoch": 0.84, "learning_rate": 7.771949343778012e-06, "loss": 2.2873, "step": 484300 }, { "epoch": 0.84, "learning_rate": 7.771077403851185e-06, "loss": 2.3299, "step": 484310 }, { "epoch": 0.84, "learning_rate": 7.77020546392436e-06, "loss": 2.2875, "step": 484320 }, { "epoch": 0.84, "learning_rate": 7.769333523997531e-06, "loss": 2.32, "step": 484330 }, { "epoch": 0.84, "learning_rate": 7.768461584070705e-06, "loss": 2.2955, "step": 484340 }, { "epoch": 0.84, "learning_rate": 7.767589644143877e-06, "loss": 2.3086, "step": 484350 }, { "epoch": 0.84, "learning_rate": 7.766717704217051e-06, "loss": 2.3181, "step": 484360 }, { "epoch": 0.84, "learning_rate": 7.765845764290223e-06, "loss": 2.323, "step": 484370 }, { "epoch": 0.84, "learning_rate": 7.764973824363397e-06, "loss": 2.2557, "step": 484380 }, { "epoch": 0.84, "learning_rate": 7.76410188443657e-06, "loss": 2.2539, "step": 484390 }, { "epoch": 0.84, "learning_rate": 7.763229944509744e-06, "loss": 2.2526, "step": 484400 }, { "epoch": 0.84, "learning_rate": 7.762358004582916e-06, "loss": 2.4283, "step": 484410 }, { "epoch": 0.84, "learning_rate": 7.76148606465609e-06, "loss": 2.3352, "step": 484420 }, { "epoch": 0.84, "learning_rate": 7.760614124729262e-06, "loss": 2.2371, "step": 484430 }, { "epoch": 0.84, "learning_rate": 7.759742184802436e-06, "loss": 2.2171, "step": 484440 }, { "epoch": 0.84, "learning_rate": 7.75887024487561e-06, "loss": 2.2623, "step": 484450 }, { "epoch": 0.84, "learning_rate": 7.757998304948782e-06, "loss": 2.2231, "step": 484460 }, { "epoch": 0.84, "learning_rate": 7.757126365021956e-06, "loss": 2.2643, "step": 484470 }, { "epoch": 0.84, "learning_rate": 7.75625442509513e-06, "loss": 2.268, "step": 484480 }, { "epoch": 0.84, "learning_rate": 7.755382485168303e-06, "loss": 2.2968, "step": 484490 }, { "epoch": 0.84, "learning_rate": 7.754510545241475e-06, "loss": 2.3126, "step": 484500 }, { "epoch": 0.84, "learning_rate": 7.753638605314649e-06, "loss": 2.334, "step": 484510 }, { "epoch": 0.84, "learning_rate": 7.752766665387821e-06, "loss": 2.2026, "step": 484520 }, { "epoch": 0.84, "learning_rate": 7.751894725460995e-06, "loss": 2.249, "step": 484530 }, { "epoch": 0.84, "learning_rate": 7.751022785534167e-06, "loss": 2.3138, "step": 484540 }, { "epoch": 0.84, "learning_rate": 7.750150845607342e-06, "loss": 2.2811, "step": 484550 }, { "epoch": 0.85, "learning_rate": 7.749278905680514e-06, "loss": 2.3089, "step": 484560 }, { "epoch": 0.85, "learning_rate": 7.748406965753688e-06, "loss": 2.3342, "step": 484570 }, { "epoch": 0.85, "learning_rate": 7.747535025826862e-06, "loss": 2.2926, "step": 484580 }, { "epoch": 0.85, "learning_rate": 7.746663085900034e-06, "loss": 2.3253, "step": 484590 }, { "epoch": 0.85, "learning_rate": 7.745791145973208e-06, "loss": 2.3187, "step": 484600 }, { "epoch": 0.85, "learning_rate": 7.74491920604638e-06, "loss": 2.2676, "step": 484610 }, { "epoch": 0.85, "learning_rate": 7.744047266119554e-06, "loss": 2.1997, "step": 484620 }, { "epoch": 0.85, "learning_rate": 7.743175326192727e-06, "loss": 2.3419, "step": 484630 }, { "epoch": 0.85, "learning_rate": 7.742303386265901e-06, "loss": 2.393, "step": 484640 }, { "epoch": 0.85, "learning_rate": 7.741431446339073e-06, "loss": 2.4141, "step": 484650 }, { "epoch": 0.85, "learning_rate": 7.740559506412247e-06, "loss": 2.2358, "step": 484660 }, { "epoch": 0.85, "learning_rate": 7.739687566485419e-06, "loss": 2.2349, "step": 484670 }, { "epoch": 0.85, "learning_rate": 7.738815626558593e-06, "loss": 2.1731, "step": 484680 }, { "epoch": 0.85, "learning_rate": 7.737943686631765e-06, "loss": 2.2725, "step": 484690 }, { "epoch": 0.85, "learning_rate": 7.737071746704939e-06, "loss": 2.1843, "step": 484700 }, { "epoch": 0.85, "learning_rate": 7.736199806778112e-06, "loss": 2.2665, "step": 484710 }, { "epoch": 0.85, "learning_rate": 7.735327866851286e-06, "loss": 2.2645, "step": 484720 }, { "epoch": 0.85, "learning_rate": 7.73445592692446e-06, "loss": 2.3645, "step": 484730 }, { "epoch": 0.85, "learning_rate": 7.733583986997632e-06, "loss": 2.358, "step": 484740 }, { "epoch": 0.85, "learning_rate": 7.732712047070806e-06, "loss": 2.2633, "step": 484750 }, { "epoch": 0.85, "learning_rate": 7.731840107143978e-06, "loss": 2.3653, "step": 484760 }, { "epoch": 0.85, "learning_rate": 7.730968167217152e-06, "loss": 2.2654, "step": 484770 }, { "epoch": 0.85, "learning_rate": 7.730096227290324e-06, "loss": 2.2933, "step": 484780 }, { "epoch": 0.85, "learning_rate": 7.7292242873635e-06, "loss": 2.1925, "step": 484790 }, { "epoch": 0.85, "learning_rate": 7.728352347436671e-06, "loss": 2.3759, "step": 484800 }, { "epoch": 0.85, "learning_rate": 7.727480407509845e-06, "loss": 2.3295, "step": 484810 }, { "epoch": 0.85, "learning_rate": 7.726608467583017e-06, "loss": 2.3277, "step": 484820 }, { "epoch": 0.85, "learning_rate": 7.725736527656191e-06, "loss": 2.2654, "step": 484830 }, { "epoch": 0.85, "learning_rate": 7.724864587729363e-06, "loss": 2.1662, "step": 484840 }, { "epoch": 0.85, "learning_rate": 7.723992647802537e-06, "loss": 2.2701, "step": 484850 }, { "epoch": 0.85, "learning_rate": 7.72312070787571e-06, "loss": 2.2491, "step": 484860 }, { "epoch": 0.85, "learning_rate": 7.722248767948884e-06, "loss": 2.4304, "step": 484870 }, { "epoch": 0.85, "learning_rate": 7.721376828022058e-06, "loss": 2.1588, "step": 484880 }, { "epoch": 0.85, "learning_rate": 7.72050488809523e-06, "loss": 2.3052, "step": 484890 }, { "epoch": 0.85, "learning_rate": 7.719632948168404e-06, "loss": 2.2529, "step": 484900 }, { "epoch": 0.85, "learning_rate": 7.718761008241576e-06, "loss": 2.3276, "step": 484910 }, { "epoch": 0.85, "learning_rate": 7.71788906831475e-06, "loss": 2.3165, "step": 484920 }, { "epoch": 0.85, "learning_rate": 7.717017128387922e-06, "loss": 2.26, "step": 484930 }, { "epoch": 0.85, "learning_rate": 7.716145188461096e-06, "loss": 2.1396, "step": 484940 }, { "epoch": 0.85, "learning_rate": 7.71527324853427e-06, "loss": 2.1313, "step": 484950 }, { "epoch": 0.85, "learning_rate": 7.714401308607443e-06, "loss": 2.2277, "step": 484960 }, { "epoch": 0.85, "learning_rate": 7.713529368680615e-06, "loss": 2.1621, "step": 484970 }, { "epoch": 0.85, "learning_rate": 7.712657428753789e-06, "loss": 2.2454, "step": 484980 }, { "epoch": 0.85, "learning_rate": 7.711785488826963e-06, "loss": 2.2467, "step": 484990 }, { "epoch": 0.85, "learning_rate": 7.710913548900135e-06, "loss": 2.2044, "step": 485000 }, { "epoch": 0.85, "learning_rate": 7.710041608973309e-06, "loss": 2.2884, "step": 485010 }, { "epoch": 0.85, "learning_rate": 7.70916966904648e-06, "loss": 2.2872, "step": 485020 }, { "epoch": 0.85, "learning_rate": 7.708297729119656e-06, "loss": 2.2723, "step": 485030 }, { "epoch": 0.85, "learning_rate": 7.707425789192828e-06, "loss": 2.3601, "step": 485040 }, { "epoch": 0.85, "learning_rate": 7.706553849266002e-06, "loss": 2.3119, "step": 485050 }, { "epoch": 0.85, "learning_rate": 7.705681909339174e-06, "loss": 2.2233, "step": 485060 }, { "epoch": 0.85, "learning_rate": 7.704809969412348e-06, "loss": 2.3079, "step": 485070 }, { "epoch": 0.85, "learning_rate": 7.70393802948552e-06, "loss": 2.2534, "step": 485080 }, { "epoch": 0.85, "learning_rate": 7.703066089558694e-06, "loss": 2.4119, "step": 485090 }, { "epoch": 0.85, "learning_rate": 7.702194149631868e-06, "loss": 2.2984, "step": 485100 }, { "epoch": 0.85, "learning_rate": 7.701322209705041e-06, "loss": 2.2289, "step": 485110 }, { "epoch": 0.85, "learning_rate": 7.700450269778215e-06, "loss": 2.2811, "step": 485120 }, { "epoch": 0.85, "learning_rate": 7.699578329851387e-06, "loss": 2.306, "step": 485130 }, { "epoch": 0.85, "learning_rate": 7.698706389924561e-06, "loss": 2.326, "step": 485140 }, { "epoch": 0.85, "learning_rate": 7.697834449997733e-06, "loss": 2.3186, "step": 485150 }, { "epoch": 0.85, "learning_rate": 7.696962510070907e-06, "loss": 2.2661, "step": 485160 }, { "epoch": 0.85, "learning_rate": 7.696090570144079e-06, "loss": 2.3287, "step": 485170 }, { "epoch": 0.85, "learning_rate": 7.695218630217253e-06, "loss": 2.24, "step": 485180 }, { "epoch": 0.85, "learning_rate": 7.694346690290426e-06, "loss": 2.3606, "step": 485190 }, { "epoch": 0.85, "learning_rate": 7.6934747503636e-06, "loss": 2.3171, "step": 485200 }, { "epoch": 0.85, "learning_rate": 7.692602810436772e-06, "loss": 2.1413, "step": 485210 }, { "epoch": 0.85, "learning_rate": 7.691730870509946e-06, "loss": 2.3122, "step": 485220 }, { "epoch": 0.85, "learning_rate": 7.690858930583118e-06, "loss": 2.3129, "step": 485230 }, { "epoch": 0.85, "learning_rate": 7.689986990656292e-06, "loss": 2.3033, "step": 485240 }, { "epoch": 0.85, "learning_rate": 7.689115050729466e-06, "loss": 2.3307, "step": 485250 }, { "epoch": 0.85, "learning_rate": 7.688243110802638e-06, "loss": 2.2715, "step": 485260 }, { "epoch": 0.85, "learning_rate": 7.687371170875811e-06, "loss": 2.159, "step": 485270 }, { "epoch": 0.85, "learning_rate": 7.686499230948985e-06, "loss": 2.2846, "step": 485280 }, { "epoch": 0.85, "learning_rate": 7.685627291022159e-06, "loss": 2.2921, "step": 485290 }, { "epoch": 0.85, "learning_rate": 7.684755351095331e-06, "loss": 2.2583, "step": 485300 }, { "epoch": 0.85, "learning_rate": 7.683883411168505e-06, "loss": 2.361, "step": 485310 }, { "epoch": 0.85, "learning_rate": 7.683011471241677e-06, "loss": 2.2551, "step": 485320 }, { "epoch": 0.85, "learning_rate": 7.68213953131485e-06, "loss": 2.2036, "step": 485330 }, { "epoch": 0.85, "learning_rate": 7.681267591388024e-06, "loss": 2.2307, "step": 485340 }, { "epoch": 0.85, "learning_rate": 7.680395651461198e-06, "loss": 2.2709, "step": 485350 }, { "epoch": 0.85, "learning_rate": 7.67952371153437e-06, "loss": 2.2992, "step": 485360 }, { "epoch": 0.85, "learning_rate": 7.678651771607544e-06, "loss": 2.2997, "step": 485370 }, { "epoch": 0.85, "learning_rate": 7.677779831680718e-06, "loss": 2.2777, "step": 485380 }, { "epoch": 0.85, "learning_rate": 7.67690789175389e-06, "loss": 2.3082, "step": 485390 }, { "epoch": 0.85, "learning_rate": 7.676035951827064e-06, "loss": 2.2955, "step": 485400 }, { "epoch": 0.85, "learning_rate": 7.675164011900236e-06, "loss": 2.335, "step": 485410 }, { "epoch": 0.85, "learning_rate": 7.67429207197341e-06, "loss": 2.2998, "step": 485420 }, { "epoch": 0.85, "learning_rate": 7.673420132046583e-06, "loss": 2.1105, "step": 485430 }, { "epoch": 0.85, "learning_rate": 7.672548192119757e-06, "loss": 2.3399, "step": 485440 }, { "epoch": 0.85, "learning_rate": 7.671676252192929e-06, "loss": 2.2472, "step": 485450 }, { "epoch": 0.85, "learning_rate": 7.670804312266103e-06, "loss": 2.3351, "step": 485460 }, { "epoch": 0.85, "learning_rate": 7.669932372339275e-06, "loss": 2.3055, "step": 485470 }, { "epoch": 0.85, "learning_rate": 7.669060432412449e-06, "loss": 2.32, "step": 485480 }, { "epoch": 0.85, "learning_rate": 7.66818849248562e-06, "loss": 2.3373, "step": 485490 }, { "epoch": 0.85, "learning_rate": 7.667316552558795e-06, "loss": 2.2351, "step": 485500 }, { "epoch": 0.85, "learning_rate": 7.666444612631968e-06, "loss": 2.2511, "step": 485510 }, { "epoch": 0.85, "learning_rate": 7.665572672705142e-06, "loss": 2.2039, "step": 485520 }, { "epoch": 0.85, "learning_rate": 7.664700732778316e-06, "loss": 2.3319, "step": 485530 }, { "epoch": 0.85, "learning_rate": 7.663828792851488e-06, "loss": 2.1844, "step": 485540 }, { "epoch": 0.85, "learning_rate": 7.662956852924662e-06, "loss": 2.3083, "step": 485550 }, { "epoch": 0.85, "learning_rate": 7.662084912997834e-06, "loss": 2.3512, "step": 485560 }, { "epoch": 0.85, "learning_rate": 7.661212973071008e-06, "loss": 2.2928, "step": 485570 }, { "epoch": 0.85, "learning_rate": 7.66034103314418e-06, "loss": 2.2668, "step": 485580 }, { "epoch": 0.85, "learning_rate": 7.659469093217355e-06, "loss": 2.3348, "step": 485590 }, { "epoch": 0.85, "learning_rate": 7.658597153290527e-06, "loss": 2.2456, "step": 485600 }, { "epoch": 0.85, "learning_rate": 7.657725213363701e-06, "loss": 2.1811, "step": 485610 }, { "epoch": 0.85, "learning_rate": 7.656853273436873e-06, "loss": 2.2857, "step": 485620 }, { "epoch": 0.85, "learning_rate": 7.655981333510047e-06, "loss": 2.2511, "step": 485630 }, { "epoch": 0.85, "learning_rate": 7.655109393583219e-06, "loss": 2.1977, "step": 485640 }, { "epoch": 0.85, "learning_rate": 7.654237453656393e-06, "loss": 2.2263, "step": 485650 }, { "epoch": 0.85, "learning_rate": 7.653365513729566e-06, "loss": 2.1881, "step": 485660 }, { "epoch": 0.85, "learning_rate": 7.65249357380274e-06, "loss": 2.2875, "step": 485670 }, { "epoch": 0.85, "learning_rate": 7.651621633875914e-06, "loss": 2.2482, "step": 485680 }, { "epoch": 0.85, "learning_rate": 7.650749693949086e-06, "loss": 2.2775, "step": 485690 }, { "epoch": 0.85, "learning_rate": 7.64987775402226e-06, "loss": 2.3486, "step": 485700 }, { "epoch": 0.85, "learning_rate": 7.649005814095432e-06, "loss": 2.2916, "step": 485710 }, { "epoch": 0.85, "learning_rate": 7.648133874168606e-06, "loss": 2.2437, "step": 485720 }, { "epoch": 0.85, "learning_rate": 7.647261934241778e-06, "loss": 2.3511, "step": 485730 }, { "epoch": 0.85, "learning_rate": 7.646389994314952e-06, "loss": 2.1838, "step": 485740 }, { "epoch": 0.85, "learning_rate": 7.645518054388125e-06, "loss": 2.3624, "step": 485750 }, { "epoch": 0.85, "learning_rate": 7.644646114461299e-06, "loss": 2.2629, "step": 485760 }, { "epoch": 0.85, "learning_rate": 7.643774174534471e-06, "loss": 2.305, "step": 485770 }, { "epoch": 0.85, "learning_rate": 7.642902234607645e-06, "loss": 2.1795, "step": 485780 }, { "epoch": 0.85, "learning_rate": 7.642030294680819e-06, "loss": 2.2297, "step": 485790 }, { "epoch": 0.85, "learning_rate": 7.64115835475399e-06, "loss": 2.2627, "step": 485800 }, { "epoch": 0.85, "learning_rate": 7.640286414827165e-06, "loss": 2.364, "step": 485810 }, { "epoch": 0.85, "learning_rate": 7.639414474900337e-06, "loss": 2.1962, "step": 485820 }, { "epoch": 0.85, "learning_rate": 7.638542534973512e-06, "loss": 2.3892, "step": 485830 }, { "epoch": 0.85, "learning_rate": 7.637670595046684e-06, "loss": 2.3058, "step": 485840 }, { "epoch": 0.85, "learning_rate": 7.636798655119858e-06, "loss": 2.3093, "step": 485850 }, { "epoch": 0.85, "learning_rate": 7.63592671519303e-06, "loss": 2.2722, "step": 485860 }, { "epoch": 0.85, "learning_rate": 7.635054775266204e-06, "loss": 2.3481, "step": 485870 }, { "epoch": 0.85, "learning_rate": 7.634182835339376e-06, "loss": 2.2425, "step": 485880 }, { "epoch": 0.85, "learning_rate": 7.63331089541255e-06, "loss": 2.2236, "step": 485890 }, { "epoch": 0.85, "learning_rate": 7.632438955485723e-06, "loss": 2.3177, "step": 485900 }, { "epoch": 0.85, "learning_rate": 7.631567015558897e-06, "loss": 2.3645, "step": 485910 }, { "epoch": 0.85, "learning_rate": 7.630695075632071e-06, "loss": 2.2126, "step": 485920 }, { "epoch": 0.85, "learning_rate": 7.629823135705243e-06, "loss": 2.2845, "step": 485930 }, { "epoch": 0.85, "learning_rate": 7.628951195778417e-06, "loss": 2.2769, "step": 485940 }, { "epoch": 0.85, "learning_rate": 7.628079255851589e-06, "loss": 2.3101, "step": 485950 }, { "epoch": 0.85, "learning_rate": 7.627207315924763e-06, "loss": 2.2356, "step": 485960 }, { "epoch": 0.85, "learning_rate": 7.6263353759979355e-06, "loss": 2.2343, "step": 485970 }, { "epoch": 0.85, "learning_rate": 7.625463436071109e-06, "loss": 2.2893, "step": 485980 }, { "epoch": 0.85, "learning_rate": 7.624591496144281e-06, "loss": 2.3034, "step": 485990 }, { "epoch": 0.85, "learning_rate": 7.623719556217455e-06, "loss": 2.3118, "step": 486000 }, { "epoch": 0.85, "learning_rate": 7.622847616290628e-06, "loss": 2.2785, "step": 486010 }, { "epoch": 0.85, "learning_rate": 7.621975676363802e-06, "loss": 2.3328, "step": 486020 }, { "epoch": 0.85, "learning_rate": 7.621103736436974e-06, "loss": 2.3455, "step": 486030 }, { "epoch": 0.85, "learning_rate": 7.620231796510148e-06, "loss": 2.2331, "step": 486040 }, { "epoch": 0.85, "learning_rate": 7.6193598565833214e-06, "loss": 2.2217, "step": 486050 }, { "epoch": 0.85, "learning_rate": 7.618487916656494e-06, "loss": 2.3461, "step": 486060 }, { "epoch": 0.85, "learning_rate": 7.617615976729668e-06, "loss": 2.3637, "step": 486070 }, { "epoch": 0.85, "learning_rate": 7.61674403680284e-06, "loss": 2.2669, "step": 486080 }, { "epoch": 0.85, "learning_rate": 7.615872096876015e-06, "loss": 2.1995, "step": 486090 }, { "epoch": 0.85, "learning_rate": 7.615000156949187e-06, "loss": 2.2986, "step": 486100 }, { "epoch": 0.85, "learning_rate": 7.614128217022361e-06, "loss": 2.3728, "step": 486110 }, { "epoch": 0.85, "learning_rate": 7.613256277095534e-06, "loss": 2.2571, "step": 486120 }, { "epoch": 0.85, "learning_rate": 7.612384337168707e-06, "loss": 2.4478, "step": 486130 }, { "epoch": 0.85, "learning_rate": 7.6115123972418794e-06, "loss": 2.2601, "step": 486140 }, { "epoch": 0.85, "learning_rate": 7.610640457315053e-06, "loss": 2.3479, "step": 486150 }, { "epoch": 0.85, "learning_rate": 7.609768517388226e-06, "loss": 2.1764, "step": 486160 }, { "epoch": 0.85, "learning_rate": 7.6088965774614e-06, "loss": 2.1565, "step": 486170 }, { "epoch": 0.85, "learning_rate": 7.608024637534574e-06, "loss": 2.1417, "step": 486180 }, { "epoch": 0.85, "learning_rate": 7.607152697607746e-06, "loss": 2.2751, "step": 486190 }, { "epoch": 0.85, "learning_rate": 7.6062807576809195e-06, "loss": 2.1282, "step": 486200 }, { "epoch": 0.85, "learning_rate": 7.6054088177540924e-06, "loss": 2.208, "step": 486210 }, { "epoch": 0.85, "learning_rate": 7.604536877827266e-06, "loss": 2.2577, "step": 486220 }, { "epoch": 0.85, "learning_rate": 7.603664937900438e-06, "loss": 2.26, "step": 486230 }, { "epoch": 0.85, "learning_rate": 7.602792997973612e-06, "loss": 2.4519, "step": 486240 }, { "epoch": 0.85, "learning_rate": 7.601921058046785e-06, "loss": 2.3063, "step": 486250 }, { "epoch": 0.85, "learning_rate": 7.601049118119959e-06, "loss": 2.3331, "step": 486260 }, { "epoch": 0.85, "learning_rate": 7.600177178193131e-06, "loss": 2.3024, "step": 486270 }, { "epoch": 0.85, "learning_rate": 7.599305238266305e-06, "loss": 2.1673, "step": 486280 }, { "epoch": 0.85, "learning_rate": 7.5984332983394775e-06, "loss": 2.2991, "step": 486290 }, { "epoch": 0.85, "learning_rate": 7.597561358412651e-06, "loss": 2.287, "step": 486300 }, { "epoch": 0.85, "learning_rate": 7.596689418485825e-06, "loss": 2.2391, "step": 486310 }, { "epoch": 0.85, "learning_rate": 7.595817478558997e-06, "loss": 2.3477, "step": 486320 }, { "epoch": 0.85, "learning_rate": 7.594945538632172e-06, "loss": 2.2136, "step": 486330 }, { "epoch": 0.85, "learning_rate": 7.594073598705344e-06, "loss": 2.2098, "step": 486340 }, { "epoch": 0.85, "learning_rate": 7.593201658778518e-06, "loss": 2.2896, "step": 486350 }, { "epoch": 0.85, "learning_rate": 7.59232971885169e-06, "loss": 2.3196, "step": 486360 }, { "epoch": 0.85, "learning_rate": 7.591457778924864e-06, "loss": 2.1714, "step": 486370 }, { "epoch": 0.85, "learning_rate": 7.590585838998036e-06, "loss": 2.3018, "step": 486380 }, { "epoch": 0.85, "learning_rate": 7.58971389907121e-06, "loss": 2.3179, "step": 486390 }, { "epoch": 0.85, "learning_rate": 7.588841959144383e-06, "loss": 2.3275, "step": 486400 }, { "epoch": 0.85, "learning_rate": 7.587970019217557e-06, "loss": 2.3279, "step": 486410 }, { "epoch": 0.85, "learning_rate": 7.587098079290729e-06, "loss": 2.3503, "step": 486420 }, { "epoch": 0.85, "learning_rate": 7.586226139363903e-06, "loss": 2.32, "step": 486430 }, { "epoch": 0.85, "learning_rate": 7.585354199437076e-06, "loss": 2.2832, "step": 486440 }, { "epoch": 0.85, "learning_rate": 7.584482259510249e-06, "loss": 2.2844, "step": 486450 }, { "epoch": 0.85, "learning_rate": 7.583610319583423e-06, "loss": 2.1871, "step": 486460 }, { "epoch": 0.85, "learning_rate": 7.582738379656595e-06, "loss": 2.3042, "step": 486470 }, { "epoch": 0.85, "learning_rate": 7.581866439729769e-06, "loss": 2.1921, "step": 486480 }, { "epoch": 0.85, "learning_rate": 7.580994499802942e-06, "loss": 2.2958, "step": 486490 }, { "epoch": 0.85, "learning_rate": 7.580122559876116e-06, "loss": 2.2383, "step": 486500 }, { "epoch": 0.85, "learning_rate": 7.579250619949288e-06, "loss": 2.3124, "step": 486510 }, { "epoch": 0.85, "learning_rate": 7.5783786800224615e-06, "loss": 2.3111, "step": 486520 }, { "epoch": 0.85, "learning_rate": 7.5775067400956344e-06, "loss": 2.2648, "step": 486530 }, { "epoch": 0.85, "learning_rate": 7.576634800168808e-06, "loss": 2.2464, "step": 486540 }, { "epoch": 0.85, "learning_rate": 7.57576286024198e-06, "loss": 2.2251, "step": 486550 }, { "epoch": 0.85, "learning_rate": 7.574890920315154e-06, "loss": 2.2343, "step": 486560 }, { "epoch": 0.85, "learning_rate": 7.574018980388327e-06, "loss": 2.1838, "step": 486570 }, { "epoch": 0.85, "learning_rate": 7.573147040461501e-06, "loss": 2.2262, "step": 486580 }, { "epoch": 0.85, "learning_rate": 7.5722751005346745e-06, "loss": 2.3549, "step": 486590 }, { "epoch": 0.85, "learning_rate": 7.571403160607847e-06, "loss": 2.2804, "step": 486600 }, { "epoch": 0.85, "learning_rate": 7.570531220681021e-06, "loss": 2.2679, "step": 486610 }, { "epoch": 0.85, "learning_rate": 7.569659280754193e-06, "loss": 2.2875, "step": 486620 }, { "epoch": 0.85, "learning_rate": 7.568787340827367e-06, "loss": 2.2383, "step": 486630 }, { "epoch": 0.85, "learning_rate": 7.56791540090054e-06, "loss": 2.2306, "step": 486640 }, { "epoch": 0.85, "learning_rate": 7.567043460973714e-06, "loss": 2.2356, "step": 486650 }, { "epoch": 0.85, "learning_rate": 7.566171521046886e-06, "loss": 2.384, "step": 486660 }, { "epoch": 0.85, "learning_rate": 7.56529958112006e-06, "loss": 2.255, "step": 486670 }, { "epoch": 0.85, "learning_rate": 7.5644276411932325e-06, "loss": 2.1711, "step": 486680 }, { "epoch": 0.85, "learning_rate": 7.563555701266406e-06, "loss": 2.1872, "step": 486690 }, { "epoch": 0.85, "learning_rate": 7.562683761339578e-06, "loss": 2.2562, "step": 486700 }, { "epoch": 0.85, "learning_rate": 7.561811821412752e-06, "loss": 2.2386, "step": 486710 }, { "epoch": 0.85, "learning_rate": 7.560939881485926e-06, "loss": 2.2809, "step": 486720 }, { "epoch": 0.85, "learning_rate": 7.560067941559099e-06, "loss": 2.3796, "step": 486730 }, { "epoch": 0.85, "learning_rate": 7.559196001632273e-06, "loss": 2.2968, "step": 486740 }, { "epoch": 0.85, "learning_rate": 7.558324061705445e-06, "loss": 2.3429, "step": 486750 }, { "epoch": 0.85, "learning_rate": 7.5574521217786184e-06, "loss": 2.3267, "step": 486760 }, { "epoch": 0.85, "learning_rate": 7.556580181851791e-06, "loss": 2.292, "step": 486770 }, { "epoch": 0.85, "learning_rate": 7.555708241924965e-06, "loss": 2.2791, "step": 486780 }, { "epoch": 0.85, "learning_rate": 7.554836301998137e-06, "loss": 2.2913, "step": 486790 }, { "epoch": 0.85, "learning_rate": 7.553964362071311e-06, "loss": 2.3307, "step": 486800 }, { "epoch": 0.85, "learning_rate": 7.553092422144484e-06, "loss": 2.2825, "step": 486810 }, { "epoch": 0.85, "learning_rate": 7.552220482217658e-06, "loss": 2.3192, "step": 486820 }, { "epoch": 0.85, "learning_rate": 7.55134854229083e-06, "loss": 2.2921, "step": 486830 }, { "epoch": 0.85, "learning_rate": 7.5504766023640035e-06, "loss": 2.3547, "step": 486840 }, { "epoch": 0.85, "learning_rate": 7.549604662437178e-06, "loss": 2.1858, "step": 486850 }, { "epoch": 0.85, "learning_rate": 7.54873272251035e-06, "loss": 2.2401, "step": 486860 }, { "epoch": 0.85, "learning_rate": 7.547860782583524e-06, "loss": 2.1303, "step": 486870 }, { "epoch": 0.85, "learning_rate": 7.546988842656697e-06, "loss": 2.2987, "step": 486880 }, { "epoch": 0.85, "learning_rate": 7.546116902729871e-06, "loss": 2.3014, "step": 486890 }, { "epoch": 0.85, "learning_rate": 7.545244962803043e-06, "loss": 2.284, "step": 486900 }, { "epoch": 0.85, "learning_rate": 7.5443730228762165e-06, "loss": 2.313, "step": 486910 }, { "epoch": 0.85, "learning_rate": 7.5435010829493894e-06, "loss": 2.1366, "step": 486920 }, { "epoch": 0.85, "learning_rate": 7.542629143022563e-06, "loss": 2.286, "step": 486930 }, { "epoch": 0.85, "learning_rate": 7.541757203095735e-06, "loss": 2.2323, "step": 486940 }, { "epoch": 0.85, "learning_rate": 7.540885263168909e-06, "loss": 2.2169, "step": 486950 }, { "epoch": 0.85, "learning_rate": 7.540013323242082e-06, "loss": 2.1969, "step": 486960 }, { "epoch": 0.85, "learning_rate": 7.539141383315256e-06, "loss": 2.2009, "step": 486970 }, { "epoch": 0.85, "learning_rate": 7.5382694433884295e-06, "loss": 2.2584, "step": 486980 }, { "epoch": 0.85, "learning_rate": 7.537397503461602e-06, "loss": 2.1687, "step": 486990 }, { "epoch": 0.85, "learning_rate": 7.536525563534775e-06, "loss": 2.2942, "step": 487000 }, { "epoch": 0.85, "learning_rate": 7.535653623607948e-06, "loss": 2.2104, "step": 487010 }, { "epoch": 0.85, "learning_rate": 7.534781683681122e-06, "loss": 2.2686, "step": 487020 }, { "epoch": 0.85, "learning_rate": 7.533909743754294e-06, "loss": 2.427, "step": 487030 }, { "epoch": 0.85, "learning_rate": 7.533037803827468e-06, "loss": 2.2831, "step": 487040 }, { "epoch": 0.85, "learning_rate": 7.532165863900641e-06, "loss": 2.2973, "step": 487050 }, { "epoch": 0.85, "learning_rate": 7.531293923973815e-06, "loss": 2.1598, "step": 487060 }, { "epoch": 0.85, "learning_rate": 7.530421984046987e-06, "loss": 2.1756, "step": 487070 }, { "epoch": 0.85, "learning_rate": 7.5295500441201604e-06, "loss": 2.2231, "step": 487080 }, { "epoch": 0.85, "learning_rate": 7.528678104193333e-06, "loss": 2.3232, "step": 487090 }, { "epoch": 0.85, "learning_rate": 7.527806164266507e-06, "loss": 2.2239, "step": 487100 }, { "epoch": 0.85, "learning_rate": 7.526934224339681e-06, "loss": 2.3334, "step": 487110 }, { "epoch": 0.85, "learning_rate": 7.526062284412853e-06, "loss": 2.2613, "step": 487120 }, { "epoch": 0.85, "learning_rate": 7.525190344486028e-06, "loss": 2.251, "step": 487130 }, { "epoch": 0.85, "learning_rate": 7.5243184045592e-06, "loss": 2.2604, "step": 487140 }, { "epoch": 0.85, "learning_rate": 7.5234464646323734e-06, "loss": 2.3849, "step": 487150 }, { "epoch": 0.85, "learning_rate": 7.522574524705546e-06, "loss": 2.1162, "step": 487160 }, { "epoch": 0.85, "learning_rate": 7.52170258477872e-06, "loss": 2.2948, "step": 487170 }, { "epoch": 0.85, "learning_rate": 7.520830644851892e-06, "loss": 2.3177, "step": 487180 }, { "epoch": 0.85, "learning_rate": 7.519958704925066e-06, "loss": 2.2022, "step": 487190 }, { "epoch": 0.85, "learning_rate": 7.519086764998239e-06, "loss": 2.2748, "step": 487200 }, { "epoch": 0.85, "learning_rate": 7.518214825071413e-06, "loss": 2.256, "step": 487210 }, { "epoch": 0.85, "learning_rate": 7.517342885144585e-06, "loss": 2.2879, "step": 487220 }, { "epoch": 0.85, "learning_rate": 7.5164709452177585e-06, "loss": 2.2262, "step": 487230 }, { "epoch": 0.85, "learning_rate": 7.515599005290932e-06, "loss": 2.2635, "step": 487240 }, { "epoch": 0.85, "learning_rate": 7.514727065364105e-06, "loss": 2.2797, "step": 487250 }, { "epoch": 0.85, "learning_rate": 7.513855125437279e-06, "loss": 2.1437, "step": 487260 }, { "epoch": 0.85, "learning_rate": 7.512983185510451e-06, "loss": 2.3121, "step": 487270 }, { "epoch": 0.85, "learning_rate": 7.512111245583625e-06, "loss": 2.1767, "step": 487280 }, { "epoch": 0.85, "learning_rate": 7.511239305656798e-06, "loss": 2.2782, "step": 487290 }, { "epoch": 0.85, "learning_rate": 7.5103673657299715e-06, "loss": 2.2798, "step": 487300 }, { "epoch": 0.85, "learning_rate": 7.509495425803144e-06, "loss": 2.2335, "step": 487310 }, { "epoch": 0.85, "learning_rate": 7.508623485876317e-06, "loss": 2.3635, "step": 487320 }, { "epoch": 0.85, "learning_rate": 7.50775154594949e-06, "loss": 2.3183, "step": 487330 }, { "epoch": 0.85, "learning_rate": 7.506879606022664e-06, "loss": 2.2326, "step": 487340 }, { "epoch": 0.85, "learning_rate": 7.506007666095836e-06, "loss": 2.2571, "step": 487350 }, { "epoch": 0.85, "learning_rate": 7.50513572616901e-06, "loss": 2.4077, "step": 487360 }, { "epoch": 0.85, "learning_rate": 7.504263786242183e-06, "loss": 2.2621, "step": 487370 }, { "epoch": 0.85, "learning_rate": 7.503391846315357e-06, "loss": 2.2753, "step": 487380 }, { "epoch": 0.85, "learning_rate": 7.50251990638853e-06, "loss": 2.3506, "step": 487390 }, { "epoch": 0.85, "learning_rate": 7.501647966461703e-06, "loss": 2.265, "step": 487400 }, { "epoch": 0.85, "learning_rate": 7.500776026534877e-06, "loss": 2.2268, "step": 487410 }, { "epoch": 0.85, "learning_rate": 7.499904086608049e-06, "loss": 2.3303, "step": 487420 }, { "epoch": 0.85, "learning_rate": 7.499032146681223e-06, "loss": 2.3319, "step": 487430 }, { "epoch": 0.85, "learning_rate": 7.498160206754396e-06, "loss": 2.2101, "step": 487440 }, { "epoch": 0.85, "learning_rate": 7.49728826682757e-06, "loss": 2.3595, "step": 487450 }, { "epoch": 0.85, "learning_rate": 7.496416326900742e-06, "loss": 2.2228, "step": 487460 }, { "epoch": 0.85, "learning_rate": 7.4955443869739154e-06, "loss": 2.2563, "step": 487470 }, { "epoch": 0.85, "learning_rate": 7.494672447047088e-06, "loss": 2.2504, "step": 487480 }, { "epoch": 0.85, "learning_rate": 7.493800507120262e-06, "loss": 2.3041, "step": 487490 }, { "epoch": 0.85, "learning_rate": 7.492928567193434e-06, "loss": 2.3591, "step": 487500 }, { "epoch": 0.85, "learning_rate": 7.492056627266608e-06, "loss": 2.346, "step": 487510 }, { "epoch": 0.85, "learning_rate": 7.491184687339782e-06, "loss": 2.2341, "step": 487520 }, { "epoch": 0.85, "learning_rate": 7.490312747412955e-06, "loss": 2.2425, "step": 487530 }, { "epoch": 0.85, "learning_rate": 7.4894408074861284e-06, "loss": 2.3138, "step": 487540 }, { "epoch": 0.85, "learning_rate": 7.4885688675593005e-06, "loss": 2.3643, "step": 487550 }, { "epoch": 0.85, "learning_rate": 7.487696927632474e-06, "loss": 2.2012, "step": 487560 }, { "epoch": 0.85, "learning_rate": 7.486824987705647e-06, "loss": 2.1722, "step": 487570 }, { "epoch": 0.85, "learning_rate": 7.485953047778821e-06, "loss": 2.2643, "step": 487580 }, { "epoch": 0.85, "learning_rate": 7.485081107851993e-06, "loss": 2.2666, "step": 487590 }, { "epoch": 0.85, "learning_rate": 7.484209167925167e-06, "loss": 2.2925, "step": 487600 }, { "epoch": 0.85, "learning_rate": 7.48333722799834e-06, "loss": 2.3562, "step": 487610 }, { "epoch": 0.85, "learning_rate": 7.4824652880715135e-06, "loss": 2.1808, "step": 487620 }, { "epoch": 0.85, "learning_rate": 7.481593348144686e-06, "loss": 2.1558, "step": 487630 }, { "epoch": 0.85, "learning_rate": 7.480721408217859e-06, "loss": 2.2519, "step": 487640 }, { "epoch": 0.85, "learning_rate": 7.479849468291034e-06, "loss": 2.2337, "step": 487650 }, { "epoch": 0.85, "learning_rate": 7.478977528364206e-06, "loss": 2.2949, "step": 487660 }, { "epoch": 0.85, "learning_rate": 7.47810558843738e-06, "loss": 2.2147, "step": 487670 }, { "epoch": 0.85, "learning_rate": 7.477233648510553e-06, "loss": 2.2189, "step": 487680 }, { "epoch": 0.85, "learning_rate": 7.4763617085837265e-06, "loss": 2.2955, "step": 487690 }, { "epoch": 0.85, "learning_rate": 7.475489768656899e-06, "loss": 2.2588, "step": 487700 }, { "epoch": 0.85, "learning_rate": 7.474617828730072e-06, "loss": 2.2907, "step": 487710 }, { "epoch": 0.85, "learning_rate": 7.473745888803245e-06, "loss": 2.2112, "step": 487720 }, { "epoch": 0.85, "learning_rate": 7.472873948876419e-06, "loss": 2.2777, "step": 487730 }, { "epoch": 0.85, "learning_rate": 7.472002008949591e-06, "loss": 2.1689, "step": 487740 }, { "epoch": 0.85, "learning_rate": 7.471130069022765e-06, "loss": 2.2749, "step": 487750 }, { "epoch": 0.85, "learning_rate": 7.470258129095938e-06, "loss": 2.2954, "step": 487760 }, { "epoch": 0.85, "learning_rate": 7.469386189169112e-06, "loss": 2.3837, "step": 487770 }, { "epoch": 0.85, "learning_rate": 7.468514249242285e-06, "loss": 2.3991, "step": 487780 }, { "epoch": 0.85, "learning_rate": 7.4676423093154574e-06, "loss": 2.2795, "step": 487790 }, { "epoch": 0.85, "learning_rate": 7.466770369388631e-06, "loss": 2.3496, "step": 487800 }, { "epoch": 0.85, "learning_rate": 7.465898429461804e-06, "loss": 2.2487, "step": 487810 }, { "epoch": 0.85, "learning_rate": 7.465026489534978e-06, "loss": 2.2547, "step": 487820 }, { "epoch": 0.85, "learning_rate": 7.46415454960815e-06, "loss": 2.256, "step": 487830 }, { "epoch": 0.85, "learning_rate": 7.463282609681324e-06, "loss": 2.2997, "step": 487840 }, { "epoch": 0.85, "learning_rate": 7.462410669754497e-06, "loss": 2.2889, "step": 487850 }, { "epoch": 0.85, "learning_rate": 7.4615387298276704e-06, "loss": 2.3635, "step": 487860 }, { "epoch": 0.85, "learning_rate": 7.4606667899008425e-06, "loss": 2.3904, "step": 487870 }, { "epoch": 0.85, "learning_rate": 7.459794849974016e-06, "loss": 2.3115, "step": 487880 }, { "epoch": 0.85, "learning_rate": 7.458922910047189e-06, "loss": 2.297, "step": 487890 }, { "epoch": 0.85, "learning_rate": 7.458050970120363e-06, "loss": 2.3441, "step": 487900 }, { "epoch": 0.85, "learning_rate": 7.457179030193537e-06, "loss": 2.2392, "step": 487910 }, { "epoch": 0.85, "learning_rate": 7.45630709026671e-06, "loss": 2.2215, "step": 487920 }, { "epoch": 0.85, "learning_rate": 7.4554351503398834e-06, "loss": 2.2784, "step": 487930 }, { "epoch": 0.85, "learning_rate": 7.4545632104130555e-06, "loss": 2.18, "step": 487940 }, { "epoch": 0.85, "learning_rate": 7.453691270486229e-06, "loss": 2.267, "step": 487950 }, { "epoch": 0.85, "learning_rate": 7.452819330559402e-06, "loss": 2.1743, "step": 487960 }, { "epoch": 0.85, "learning_rate": 7.451947390632576e-06, "loss": 2.2988, "step": 487970 }, { "epoch": 0.85, "learning_rate": 7.451075450705748e-06, "loss": 2.2676, "step": 487980 }, { "epoch": 0.85, "learning_rate": 7.450203510778922e-06, "loss": 2.1717, "step": 487990 }, { "epoch": 0.85, "learning_rate": 7.449331570852095e-06, "loss": 2.365, "step": 488000 }, { "epoch": 0.85, "learning_rate": 7.4484596309252685e-06, "loss": 2.2207, "step": 488010 }, { "epoch": 0.85, "learning_rate": 7.447587690998441e-06, "loss": 2.1882, "step": 488020 }, { "epoch": 0.85, "learning_rate": 7.446715751071614e-06, "loss": 2.3069, "step": 488030 }, { "epoch": 0.85, "learning_rate": 7.445843811144788e-06, "loss": 2.3327, "step": 488040 }, { "epoch": 0.85, "learning_rate": 7.444971871217961e-06, "loss": 2.2388, "step": 488050 }, { "epoch": 0.85, "learning_rate": 7.444099931291135e-06, "loss": 2.3733, "step": 488060 }, { "epoch": 0.85, "learning_rate": 7.443227991364307e-06, "loss": 2.1782, "step": 488070 }, { "epoch": 0.85, "learning_rate": 7.442356051437481e-06, "loss": 2.1468, "step": 488080 }, { "epoch": 0.85, "learning_rate": 7.441484111510654e-06, "loss": 2.2498, "step": 488090 }, { "epoch": 0.85, "learning_rate": 7.440612171583827e-06, "loss": 2.2886, "step": 488100 }, { "epoch": 0.85, "learning_rate": 7.4397402316569994e-06, "loss": 2.25, "step": 488110 }, { "epoch": 0.85, "learning_rate": 7.438868291730173e-06, "loss": 2.2192, "step": 488120 }, { "epoch": 0.85, "learning_rate": 7.437996351803346e-06, "loss": 2.2734, "step": 488130 }, { "epoch": 0.85, "learning_rate": 7.43712441187652e-06, "loss": 2.2445, "step": 488140 }, { "epoch": 0.85, "learning_rate": 7.436252471949692e-06, "loss": 2.3195, "step": 488150 }, { "epoch": 0.85, "learning_rate": 7.435380532022866e-06, "loss": 2.2516, "step": 488160 }, { "epoch": 0.85, "learning_rate": 7.434508592096039e-06, "loss": 2.2615, "step": 488170 }, { "epoch": 0.85, "learning_rate": 7.4336366521692124e-06, "loss": 2.1851, "step": 488180 }, { "epoch": 0.85, "learning_rate": 7.432764712242386e-06, "loss": 2.2736, "step": 488190 }, { "epoch": 0.85, "learning_rate": 7.431892772315559e-06, "loss": 2.2339, "step": 488200 }, { "epoch": 0.85, "learning_rate": 7.431020832388733e-06, "loss": 2.2734, "step": 488210 }, { "epoch": 0.85, "learning_rate": 7.430148892461905e-06, "loss": 2.3155, "step": 488220 }, { "epoch": 0.85, "learning_rate": 7.429276952535079e-06, "loss": 2.2423, "step": 488230 }, { "epoch": 0.85, "learning_rate": 7.428405012608252e-06, "loss": 2.1962, "step": 488240 }, { "epoch": 0.85, "learning_rate": 7.4275330726814255e-06, "loss": 2.2171, "step": 488250 }, { "epoch": 0.85, "learning_rate": 7.4266611327545975e-06, "loss": 2.2701, "step": 488260 }, { "epoch": 0.85, "learning_rate": 7.425789192827771e-06, "loss": 2.3245, "step": 488270 }, { "epoch": 0.85, "learning_rate": 7.424917252900944e-06, "loss": 2.2043, "step": 488280 }, { "epoch": 0.85, "learning_rate": 7.424045312974118e-06, "loss": 2.2889, "step": 488290 }, { "epoch": 0.85, "learning_rate": 7.42317337304729e-06, "loss": 2.2216, "step": 488300 }, { "epoch": 0.85, "learning_rate": 7.422301433120464e-06, "loss": 2.2641, "step": 488310 }, { "epoch": 0.85, "learning_rate": 7.421429493193638e-06, "loss": 2.2366, "step": 488320 }, { "epoch": 0.85, "learning_rate": 7.4205575532668105e-06, "loss": 2.1707, "step": 488330 }, { "epoch": 0.85, "learning_rate": 7.419685613339984e-06, "loss": 2.2422, "step": 488340 }, { "epoch": 0.85, "learning_rate": 7.418813673413156e-06, "loss": 2.2985, "step": 488350 }, { "epoch": 0.85, "learning_rate": 7.41794173348633e-06, "loss": 2.2492, "step": 488360 }, { "epoch": 0.85, "learning_rate": 7.417069793559503e-06, "loss": 2.2119, "step": 488370 }, { "epoch": 0.85, "learning_rate": 7.416197853632677e-06, "loss": 2.3334, "step": 488380 }, { "epoch": 0.85, "learning_rate": 7.415325913705849e-06, "loss": 2.2824, "step": 488390 }, { "epoch": 0.85, "learning_rate": 7.414453973779023e-06, "loss": 2.2591, "step": 488400 }, { "epoch": 0.85, "learning_rate": 7.413582033852196e-06, "loss": 2.3258, "step": 488410 }, { "epoch": 0.85, "learning_rate": 7.412710093925369e-06, "loss": 2.4162, "step": 488420 }, { "epoch": 0.85, "learning_rate": 7.4118381539985415e-06, "loss": 2.2568, "step": 488430 }, { "epoch": 0.85, "learning_rate": 7.410966214071716e-06, "loss": 2.2738, "step": 488440 }, { "epoch": 0.85, "learning_rate": 7.41009427414489e-06, "loss": 2.2146, "step": 488450 }, { "epoch": 0.85, "learning_rate": 7.409222334218062e-06, "loss": 2.1826, "step": 488460 }, { "epoch": 0.85, "learning_rate": 7.408350394291236e-06, "loss": 2.1177, "step": 488470 }, { "epoch": 0.85, "learning_rate": 7.407478454364409e-06, "loss": 2.2278, "step": 488480 }, { "epoch": 0.85, "learning_rate": 7.406606514437582e-06, "loss": 2.2778, "step": 488490 }, { "epoch": 0.85, "learning_rate": 7.4057345745107545e-06, "loss": 2.3045, "step": 488500 }, { "epoch": 0.85, "learning_rate": 7.404862634583928e-06, "loss": 2.2331, "step": 488510 }, { "epoch": 0.85, "learning_rate": 7.403990694657101e-06, "loss": 2.1754, "step": 488520 }, { "epoch": 0.85, "learning_rate": 7.403118754730275e-06, "loss": 2.2963, "step": 488530 }, { "epoch": 0.85, "learning_rate": 7.402246814803447e-06, "loss": 2.3209, "step": 488540 }, { "epoch": 0.85, "learning_rate": 7.401374874876621e-06, "loss": 2.311, "step": 488550 }, { "epoch": 0.85, "learning_rate": 7.400502934949794e-06, "loss": 2.3281, "step": 488560 }, { "epoch": 0.85, "learning_rate": 7.3996309950229675e-06, "loss": 2.3034, "step": 488570 }, { "epoch": 0.85, "learning_rate": 7.398759055096141e-06, "loss": 2.2344, "step": 488580 }, { "epoch": 0.85, "learning_rate": 7.397887115169313e-06, "loss": 2.3145, "step": 488590 }, { "epoch": 0.85, "learning_rate": 7.397015175242487e-06, "loss": 2.2102, "step": 488600 }, { "epoch": 0.85, "learning_rate": 7.39614323531566e-06, "loss": 2.3309, "step": 488610 }, { "epoch": 0.85, "learning_rate": 7.395271295388834e-06, "loss": 2.2908, "step": 488620 }, { "epoch": 0.85, "learning_rate": 7.394399355462006e-06, "loss": 2.2114, "step": 488630 }, { "epoch": 0.85, "learning_rate": 7.39352741553518e-06, "loss": 2.3491, "step": 488640 }, { "epoch": 0.85, "learning_rate": 7.3926554756083525e-06, "loss": 2.1639, "step": 488650 }, { "epoch": 0.85, "learning_rate": 7.391783535681526e-06, "loss": 2.2653, "step": 488660 }, { "epoch": 0.85, "learning_rate": 7.390911595754698e-06, "loss": 2.162, "step": 488670 }, { "epoch": 0.85, "learning_rate": 7.390039655827872e-06, "loss": 2.2477, "step": 488680 }, { "epoch": 0.85, "learning_rate": 7.389167715901045e-06, "loss": 2.1763, "step": 488690 }, { "epoch": 0.85, "learning_rate": 7.388295775974219e-06, "loss": 2.2065, "step": 488700 }, { "epoch": 0.85, "learning_rate": 7.387423836047393e-06, "loss": 2.2691, "step": 488710 }, { "epoch": 0.85, "learning_rate": 7.3865518961205655e-06, "loss": 2.318, "step": 488720 }, { "epoch": 0.85, "learning_rate": 7.385679956193739e-06, "loss": 2.2995, "step": 488730 }, { "epoch": 0.85, "learning_rate": 7.384808016266911e-06, "loss": 2.4208, "step": 488740 }, { "epoch": 0.85, "learning_rate": 7.383936076340085e-06, "loss": 2.2747, "step": 488750 }, { "epoch": 0.85, "learning_rate": 7.383064136413258e-06, "loss": 2.2657, "step": 488760 }, { "epoch": 0.85, "learning_rate": 7.382192196486432e-06, "loss": 2.3187, "step": 488770 }, { "epoch": 0.85, "learning_rate": 7.381320256559604e-06, "loss": 2.1994, "step": 488780 }, { "epoch": 0.85, "learning_rate": 7.380448316632778e-06, "loss": 2.2621, "step": 488790 }, { "epoch": 0.85, "learning_rate": 7.379576376705951e-06, "loss": 2.3117, "step": 488800 }, { "epoch": 0.85, "learning_rate": 7.378704436779124e-06, "loss": 2.341, "step": 488810 }, { "epoch": 0.85, "learning_rate": 7.3778324968522965e-06, "loss": 2.1714, "step": 488820 }, { "epoch": 0.85, "learning_rate": 7.37696055692547e-06, "loss": 2.3251, "step": 488830 }, { "epoch": 0.85, "learning_rate": 7.376088616998644e-06, "loss": 2.3213, "step": 488840 }, { "epoch": 0.85, "learning_rate": 7.375216677071817e-06, "loss": 2.3351, "step": 488850 }, { "epoch": 0.85, "learning_rate": 7.374344737144991e-06, "loss": 2.2161, "step": 488860 }, { "epoch": 0.85, "learning_rate": 7.373472797218163e-06, "loss": 2.2426, "step": 488870 }, { "epoch": 0.85, "learning_rate": 7.3726008572913365e-06, "loss": 2.3433, "step": 488880 }, { "epoch": 0.85, "learning_rate": 7.3717289173645095e-06, "loss": 2.3313, "step": 488890 }, { "epoch": 0.85, "learning_rate": 7.370856977437683e-06, "loss": 2.3141, "step": 488900 }, { "epoch": 0.85, "learning_rate": 7.369985037510855e-06, "loss": 2.296, "step": 488910 }, { "epoch": 0.85, "learning_rate": 7.369113097584029e-06, "loss": 2.2954, "step": 488920 }, { "epoch": 0.85, "learning_rate": 7.368241157657202e-06, "loss": 2.1596, "step": 488930 }, { "epoch": 0.85, "learning_rate": 7.367369217730376e-06, "loss": 2.0843, "step": 488940 }, { "epoch": 0.85, "learning_rate": 7.366497277803548e-06, "loss": 2.2865, "step": 488950 }, { "epoch": 0.85, "learning_rate": 7.3656253378767225e-06, "loss": 2.2038, "step": 488960 }, { "epoch": 0.85, "learning_rate": 7.364753397949896e-06, "loss": 2.3094, "step": 488970 }, { "epoch": 0.85, "learning_rate": 7.363881458023068e-06, "loss": 2.0581, "step": 488980 }, { "epoch": 0.85, "learning_rate": 7.363009518096242e-06, "loss": 2.273, "step": 488990 }, { "epoch": 0.85, "learning_rate": 7.362137578169415e-06, "loss": 2.3308, "step": 489000 }, { "epoch": 0.85, "learning_rate": 7.361265638242589e-06, "loss": 2.1916, "step": 489010 }, { "epoch": 0.85, "learning_rate": 7.360393698315761e-06, "loss": 2.2316, "step": 489020 }, { "epoch": 0.85, "learning_rate": 7.359521758388935e-06, "loss": 2.2676, "step": 489030 }, { "epoch": 0.85, "learning_rate": 7.3586498184621075e-06, "loss": 2.3559, "step": 489040 }, { "epoch": 0.85, "learning_rate": 7.357777878535281e-06, "loss": 2.3371, "step": 489050 }, { "epoch": 0.85, "learning_rate": 7.356905938608453e-06, "loss": 2.0913, "step": 489060 }, { "epoch": 0.85, "learning_rate": 7.356033998681627e-06, "loss": 2.2731, "step": 489070 }, { "epoch": 0.85, "learning_rate": 7.3551620587548e-06, "loss": 2.2893, "step": 489080 }, { "epoch": 0.85, "learning_rate": 7.354290118827974e-06, "loss": 2.307, "step": 489090 }, { "epoch": 0.85, "learning_rate": 7.353418178901146e-06, "loss": 2.243, "step": 489100 }, { "epoch": 0.85, "learning_rate": 7.35254623897432e-06, "loss": 2.278, "step": 489110 }, { "epoch": 0.85, "learning_rate": 7.3516742990474935e-06, "loss": 2.3433, "step": 489120 }, { "epoch": 0.85, "learning_rate": 7.350802359120666e-06, "loss": 2.2911, "step": 489130 }, { "epoch": 0.85, "learning_rate": 7.34993041919384e-06, "loss": 2.2428, "step": 489140 }, { "epoch": 0.85, "learning_rate": 7.349058479267012e-06, "loss": 2.3332, "step": 489150 }, { "epoch": 0.85, "learning_rate": 7.348186539340186e-06, "loss": 2.1387, "step": 489160 }, { "epoch": 0.85, "learning_rate": 7.347314599413359e-06, "loss": 2.1746, "step": 489170 }, { "epoch": 0.85, "learning_rate": 7.346442659486533e-06, "loss": 2.2614, "step": 489180 }, { "epoch": 0.85, "learning_rate": 7.345570719559705e-06, "loss": 2.1747, "step": 489190 }, { "epoch": 0.85, "learning_rate": 7.3446987796328785e-06, "loss": 2.36, "step": 489200 }, { "epoch": 0.85, "learning_rate": 7.3438268397060515e-06, "loss": 2.2332, "step": 489210 }, { "epoch": 0.85, "learning_rate": 7.342954899779225e-06, "loss": 2.1985, "step": 489220 }, { "epoch": 0.85, "learning_rate": 7.342082959852397e-06, "loss": 2.2762, "step": 489230 }, { "epoch": 0.85, "learning_rate": 7.341211019925572e-06, "loss": 2.237, "step": 489240 }, { "epoch": 0.85, "learning_rate": 7.340339079998746e-06, "loss": 2.3834, "step": 489250 }, { "epoch": 0.85, "learning_rate": 7.339467140071918e-06, "loss": 2.2096, "step": 489260 }, { "epoch": 0.85, "learning_rate": 7.3385952001450915e-06, "loss": 2.3063, "step": 489270 }, { "epoch": 0.85, "learning_rate": 7.3377232602182645e-06, "loss": 2.2976, "step": 489280 }, { "epoch": 0.85, "learning_rate": 7.336851320291438e-06, "loss": 2.2913, "step": 489290 }, { "epoch": 0.85, "learning_rate": 7.33597938036461e-06, "loss": 2.4103, "step": 489300 }, { "epoch": 0.85, "learning_rate": 7.335107440437784e-06, "loss": 2.3401, "step": 489310 }, { "epoch": 0.85, "learning_rate": 7.334235500510957e-06, "loss": 2.3319, "step": 489320 }, { "epoch": 0.85, "learning_rate": 7.333363560584131e-06, "loss": 2.2605, "step": 489330 }, { "epoch": 0.85, "learning_rate": 7.332491620657303e-06, "loss": 2.2567, "step": 489340 }, { "epoch": 0.85, "learning_rate": 7.331619680730477e-06, "loss": 2.2418, "step": 489350 }, { "epoch": 0.85, "learning_rate": 7.3307477408036495e-06, "loss": 2.342, "step": 489360 }, { "epoch": 0.85, "learning_rate": 7.329875800876823e-06, "loss": 2.3049, "step": 489370 }, { "epoch": 0.85, "learning_rate": 7.329003860949997e-06, "loss": 2.3274, "step": 489380 }, { "epoch": 0.85, "learning_rate": 7.328131921023169e-06, "loss": 2.3493, "step": 489390 }, { "epoch": 0.85, "learning_rate": 7.327259981096343e-06, "loss": 2.2817, "step": 489400 }, { "epoch": 0.85, "learning_rate": 7.326388041169516e-06, "loss": 2.1627, "step": 489410 }, { "epoch": 0.85, "learning_rate": 7.32551610124269e-06, "loss": 2.1969, "step": 489420 }, { "epoch": 0.85, "learning_rate": 7.324644161315862e-06, "loss": 2.264, "step": 489430 }, { "epoch": 0.85, "learning_rate": 7.3237722213890355e-06, "loss": 2.2868, "step": 489440 }, { "epoch": 0.85, "learning_rate": 7.322900281462208e-06, "loss": 2.2036, "step": 489450 }, { "epoch": 0.85, "learning_rate": 7.322028341535382e-06, "loss": 2.2916, "step": 489460 }, { "epoch": 0.85, "learning_rate": 7.321156401608554e-06, "loss": 2.2892, "step": 489470 }, { "epoch": 0.85, "learning_rate": 7.320284461681729e-06, "loss": 2.2584, "step": 489480 }, { "epoch": 0.85, "learning_rate": 7.319412521754901e-06, "loss": 2.1255, "step": 489490 }, { "epoch": 0.85, "learning_rate": 7.318540581828075e-06, "loss": 2.2453, "step": 489500 }, { "epoch": 0.85, "learning_rate": 7.3176686419012485e-06, "loss": 2.3066, "step": 489510 }, { "epoch": 0.85, "learning_rate": 7.316796701974421e-06, "loss": 2.2188, "step": 489520 }, { "epoch": 0.85, "learning_rate": 7.315924762047595e-06, "loss": 2.2441, "step": 489530 }, { "epoch": 0.85, "learning_rate": 7.315052822120767e-06, "loss": 2.2616, "step": 489540 }, { "epoch": 0.85, "learning_rate": 7.314180882193941e-06, "loss": 2.2131, "step": 489550 }, { "epoch": 0.85, "learning_rate": 7.313308942267114e-06, "loss": 2.1966, "step": 489560 }, { "epoch": 0.85, "learning_rate": 7.312437002340288e-06, "loss": 2.3693, "step": 489570 }, { "epoch": 0.85, "learning_rate": 7.31156506241346e-06, "loss": 2.3017, "step": 489580 }, { "epoch": 0.85, "learning_rate": 7.3106931224866335e-06, "loss": 2.3305, "step": 489590 }, { "epoch": 0.85, "learning_rate": 7.3098211825598065e-06, "loss": 2.3194, "step": 489600 }, { "epoch": 0.85, "learning_rate": 7.30894924263298e-06, "loss": 2.2864, "step": 489610 }, { "epoch": 0.85, "learning_rate": 7.308077302706152e-06, "loss": 2.3317, "step": 489620 }, { "epoch": 0.85, "learning_rate": 7.307205362779326e-06, "loss": 2.2741, "step": 489630 }, { "epoch": 0.85, "learning_rate": 7.3063334228525e-06, "loss": 2.2116, "step": 489640 }, { "epoch": 0.85, "learning_rate": 7.305461482925673e-06, "loss": 2.2967, "step": 489650 }, { "epoch": 0.85, "learning_rate": 7.3045895429988465e-06, "loss": 2.2608, "step": 489660 }, { "epoch": 0.85, "learning_rate": 7.303717603072019e-06, "loss": 2.2642, "step": 489670 }, { "epoch": 0.85, "learning_rate": 7.302845663145192e-06, "loss": 2.2697, "step": 489680 }, { "epoch": 0.85, "learning_rate": 7.301973723218365e-06, "loss": 2.3391, "step": 489690 }, { "epoch": 0.85, "learning_rate": 7.301101783291539e-06, "loss": 2.2696, "step": 489700 }, { "epoch": 0.85, "learning_rate": 7.300229843364711e-06, "loss": 2.2739, "step": 489710 }, { "epoch": 0.85, "learning_rate": 7.299357903437885e-06, "loss": 2.1696, "step": 489720 }, { "epoch": 0.85, "learning_rate": 7.298485963511058e-06, "loss": 2.2714, "step": 489730 }, { "epoch": 0.85, "learning_rate": 7.297614023584232e-06, "loss": 2.2939, "step": 489740 }, { "epoch": 0.85, "learning_rate": 7.296742083657404e-06, "loss": 2.4328, "step": 489750 }, { "epoch": 0.85, "learning_rate": 7.295870143730578e-06, "loss": 2.1666, "step": 489760 }, { "epoch": 0.85, "learning_rate": 7.294998203803752e-06, "loss": 2.1896, "step": 489770 }, { "epoch": 0.85, "learning_rate": 7.294126263876924e-06, "loss": 2.3261, "step": 489780 }, { "epoch": 0.85, "learning_rate": 7.293254323950098e-06, "loss": 2.2662, "step": 489790 }, { "epoch": 0.85, "learning_rate": 7.292382384023271e-06, "loss": 2.2585, "step": 489800 }, { "epoch": 0.85, "learning_rate": 7.291510444096445e-06, "loss": 2.2884, "step": 489810 }, { "epoch": 0.85, "learning_rate": 7.290638504169617e-06, "loss": 2.3343, "step": 489820 }, { "epoch": 0.85, "learning_rate": 7.2897665642427905e-06, "loss": 2.2775, "step": 489830 }, { "epoch": 0.85, "learning_rate": 7.288894624315963e-06, "loss": 2.229, "step": 489840 }, { "epoch": 0.85, "learning_rate": 7.288022684389137e-06, "loss": 2.326, "step": 489850 }, { "epoch": 0.85, "learning_rate": 7.287150744462309e-06, "loss": 2.18, "step": 489860 }, { "epoch": 0.85, "learning_rate": 7.286278804535483e-06, "loss": 2.2859, "step": 489870 }, { "epoch": 0.85, "learning_rate": 7.285406864608656e-06, "loss": 2.2543, "step": 489880 }, { "epoch": 0.85, "learning_rate": 7.28453492468183e-06, "loss": 2.3532, "step": 489890 }, { "epoch": 0.85, "learning_rate": 7.2836629847550035e-06, "loss": 2.2402, "step": 489900 }, { "epoch": 0.85, "learning_rate": 7.2827910448281755e-06, "loss": 2.2813, "step": 489910 }, { "epoch": 0.85, "learning_rate": 7.281919104901349e-06, "loss": 2.329, "step": 489920 }, { "epoch": 0.85, "learning_rate": 7.281047164974522e-06, "loss": 2.1686, "step": 489930 }, { "epoch": 0.85, "learning_rate": 7.280175225047696e-06, "loss": 2.1193, "step": 489940 }, { "epoch": 0.85, "learning_rate": 7.279303285120868e-06, "loss": 2.3518, "step": 489950 }, { "epoch": 0.85, "learning_rate": 7.278431345194042e-06, "loss": 2.3028, "step": 489960 }, { "epoch": 0.85, "learning_rate": 7.277559405267215e-06, "loss": 2.2609, "step": 489970 }, { "epoch": 0.85, "learning_rate": 7.2766874653403885e-06, "loss": 2.3671, "step": 489980 }, { "epoch": 0.85, "learning_rate": 7.275815525413561e-06, "loss": 2.2513, "step": 489990 }, { "epoch": 0.85, "learning_rate": 7.274943585486735e-06, "loss": 2.2094, "step": 490000 }, { "epoch": 0.85, "learning_rate": 7.274071645559907e-06, "loss": 2.2535, "step": 490010 }, { "epoch": 0.85, "learning_rate": 7.273199705633081e-06, "loss": 2.2882, "step": 490020 }, { "epoch": 0.85, "learning_rate": 7.272327765706253e-06, "loss": 2.3013, "step": 490030 }, { "epoch": 0.85, "learning_rate": 7.271455825779428e-06, "loss": 2.2704, "step": 490040 }, { "epoch": 0.85, "learning_rate": 7.2705838858526015e-06, "loss": 2.3253, "step": 490050 }, { "epoch": 0.85, "learning_rate": 7.269711945925774e-06, "loss": 2.2121, "step": 490060 }, { "epoch": 0.85, "learning_rate": 7.268840005998947e-06, "loss": 2.2209, "step": 490070 }, { "epoch": 0.85, "learning_rate": 7.26796806607212e-06, "loss": 2.2641, "step": 490080 }, { "epoch": 0.85, "learning_rate": 7.267096126145294e-06, "loss": 2.3552, "step": 490090 }, { "epoch": 0.85, "learning_rate": 7.266224186218466e-06, "loss": 2.3753, "step": 490100 }, { "epoch": 0.85, "learning_rate": 7.26535224629164e-06, "loss": 2.3394, "step": 490110 }, { "epoch": 0.85, "learning_rate": 7.264480306364813e-06, "loss": 2.2483, "step": 490120 }, { "epoch": 0.85, "learning_rate": 7.263608366437987e-06, "loss": 2.1825, "step": 490130 }, { "epoch": 0.85, "learning_rate": 7.262736426511159e-06, "loss": 2.3079, "step": 490140 }, { "epoch": 0.85, "learning_rate": 7.2618644865843325e-06, "loss": 2.2183, "step": 490150 }, { "epoch": 0.85, "learning_rate": 7.260992546657505e-06, "loss": 2.3022, "step": 490160 }, { "epoch": 0.85, "learning_rate": 7.260120606730679e-06, "loss": 2.168, "step": 490170 }, { "epoch": 0.85, "learning_rate": 7.259248666803853e-06, "loss": 2.3101, "step": 490180 }, { "epoch": 0.85, "learning_rate": 7.258376726877025e-06, "loss": 2.3843, "step": 490190 }, { "epoch": 0.85, "learning_rate": 7.257504786950199e-06, "loss": 2.2365, "step": 490200 }, { "epoch": 0.85, "learning_rate": 7.256632847023372e-06, "loss": 2.375, "step": 490210 }, { "epoch": 0.85, "learning_rate": 7.2557609070965455e-06, "loss": 2.3023, "step": 490220 }, { "epoch": 0.85, "learning_rate": 7.2548889671697175e-06, "loss": 2.167, "step": 490230 }, { "epoch": 0.85, "learning_rate": 7.254017027242891e-06, "loss": 2.2414, "step": 490240 }, { "epoch": 0.85, "learning_rate": 7.253145087316064e-06, "loss": 2.3377, "step": 490250 }, { "epoch": 0.85, "learning_rate": 7.252273147389238e-06, "loss": 2.2582, "step": 490260 }, { "epoch": 0.85, "learning_rate": 7.25140120746241e-06, "loss": 2.2323, "step": 490270 }, { "epoch": 0.85, "learning_rate": 7.250529267535585e-06, "loss": 2.2128, "step": 490280 }, { "epoch": 0.86, "learning_rate": 7.249657327608757e-06, "loss": 2.1968, "step": 490290 }, { "epoch": 0.86, "learning_rate": 7.2487853876819305e-06, "loss": 2.3124, "step": 490300 }, { "epoch": 0.86, "learning_rate": 7.247913447755104e-06, "loss": 2.2026, "step": 490310 }, { "epoch": 0.86, "learning_rate": 7.247041507828277e-06, "loss": 2.34, "step": 490320 }, { "epoch": 0.86, "learning_rate": 7.246169567901451e-06, "loss": 2.2295, "step": 490330 }, { "epoch": 0.86, "learning_rate": 7.245297627974623e-06, "loss": 2.2798, "step": 490340 }, { "epoch": 0.86, "learning_rate": 7.244425688047797e-06, "loss": 2.2929, "step": 490350 }, { "epoch": 0.86, "learning_rate": 7.24355374812097e-06, "loss": 2.1791, "step": 490360 }, { "epoch": 0.86, "learning_rate": 7.2426818081941435e-06, "loss": 2.2333, "step": 490370 }, { "epoch": 0.86, "learning_rate": 7.241809868267316e-06, "loss": 2.2952, "step": 490380 }, { "epoch": 0.86, "learning_rate": 7.240937928340489e-06, "loss": 2.2817, "step": 490390 }, { "epoch": 0.86, "learning_rate": 7.240065988413662e-06, "loss": 2.2804, "step": 490400 }, { "epoch": 0.86, "learning_rate": 7.239194048486836e-06, "loss": 2.1985, "step": 490410 }, { "epoch": 0.86, "learning_rate": 7.238322108560008e-06, "loss": 2.179, "step": 490420 }, { "epoch": 0.86, "learning_rate": 7.237450168633182e-06, "loss": 2.1695, "step": 490430 }, { "epoch": 0.86, "learning_rate": 7.236578228706356e-06, "loss": 2.2148, "step": 490440 }, { "epoch": 0.86, "learning_rate": 7.235706288779529e-06, "loss": 2.2293, "step": 490450 }, { "epoch": 0.86, "learning_rate": 7.234834348852702e-06, "loss": 2.3529, "step": 490460 }, { "epoch": 0.86, "learning_rate": 7.2339624089258745e-06, "loss": 2.3419, "step": 490470 }, { "epoch": 0.86, "learning_rate": 7.233090468999048e-06, "loss": 2.2039, "step": 490480 }, { "epoch": 0.86, "learning_rate": 7.232218529072221e-06, "loss": 2.268, "step": 490490 }, { "epoch": 0.86, "learning_rate": 7.231346589145395e-06, "loss": 2.2708, "step": 490500 }, { "epoch": 0.86, "learning_rate": 7.230474649218567e-06, "loss": 2.2648, "step": 490510 }, { "epoch": 0.86, "learning_rate": 7.229602709291742e-06, "loss": 2.2154, "step": 490520 }, { "epoch": 0.86, "learning_rate": 7.228730769364914e-06, "loss": 2.2347, "step": 490530 }, { "epoch": 0.86, "learning_rate": 7.2278588294380875e-06, "loss": 2.4097, "step": 490540 }, { "epoch": 0.86, "learning_rate": 7.2269868895112595e-06, "loss": 2.2517, "step": 490550 }, { "epoch": 0.86, "learning_rate": 7.226114949584434e-06, "loss": 2.3174, "step": 490560 }, { "epoch": 0.86, "learning_rate": 7.225243009657608e-06, "loss": 2.1855, "step": 490570 }, { "epoch": 0.86, "learning_rate": 7.22437106973078e-06, "loss": 2.4178, "step": 490580 }, { "epoch": 0.86, "learning_rate": 7.223499129803954e-06, "loss": 2.3377, "step": 490590 }, { "epoch": 0.86, "learning_rate": 7.222627189877127e-06, "loss": 2.1377, "step": 490600 }, { "epoch": 0.86, "learning_rate": 7.2217552499503005e-06, "loss": 2.19, "step": 490610 }, { "epoch": 0.86, "learning_rate": 7.2208833100234725e-06, "loss": 2.2891, "step": 490620 }, { "epoch": 0.86, "learning_rate": 7.220011370096646e-06, "loss": 2.2361, "step": 490630 }, { "epoch": 0.86, "learning_rate": 7.219139430169819e-06, "loss": 2.2849, "step": 490640 }, { "epoch": 0.86, "learning_rate": 7.218267490242993e-06, "loss": 2.3665, "step": 490650 }, { "epoch": 0.86, "learning_rate": 7.217395550316165e-06, "loss": 2.2062, "step": 490660 }, { "epoch": 0.86, "learning_rate": 7.216523610389339e-06, "loss": 2.3396, "step": 490670 }, { "epoch": 0.86, "learning_rate": 7.215651670462512e-06, "loss": 2.2351, "step": 490680 }, { "epoch": 0.86, "learning_rate": 7.2147797305356855e-06, "loss": 2.3219, "step": 490690 }, { "epoch": 0.86, "learning_rate": 7.213907790608859e-06, "loss": 2.3861, "step": 490700 }, { "epoch": 0.86, "learning_rate": 7.213035850682031e-06, "loss": 2.2006, "step": 490710 }, { "epoch": 0.86, "learning_rate": 7.212163910755205e-06, "loss": 2.2352, "step": 490720 }, { "epoch": 0.86, "learning_rate": 7.211291970828378e-06, "loss": 2.3639, "step": 490730 }, { "epoch": 0.86, "learning_rate": 7.210420030901552e-06, "loss": 2.3061, "step": 490740 }, { "epoch": 0.86, "learning_rate": 7.209548090974724e-06, "loss": 2.2821, "step": 490750 }, { "epoch": 0.86, "learning_rate": 7.208676151047898e-06, "loss": 2.2808, "step": 490760 }, { "epoch": 0.86, "learning_rate": 7.207804211121071e-06, "loss": 2.2034, "step": 490770 }, { "epoch": 0.86, "learning_rate": 7.206932271194244e-06, "loss": 2.2106, "step": 490780 }, { "epoch": 0.86, "learning_rate": 7.2060603312674165e-06, "loss": 2.2655, "step": 490790 }, { "epoch": 0.86, "learning_rate": 7.205188391340591e-06, "loss": 2.2404, "step": 490800 }, { "epoch": 0.86, "learning_rate": 7.204316451413763e-06, "loss": 2.1837, "step": 490810 }, { "epoch": 0.86, "learning_rate": 7.203444511486937e-06, "loss": 2.2904, "step": 490820 }, { "epoch": 0.86, "learning_rate": 7.20257257156011e-06, "loss": 2.2536, "step": 490830 }, { "epoch": 0.86, "learning_rate": 7.201700631633284e-06, "loss": 2.2474, "step": 490840 }, { "epoch": 0.86, "learning_rate": 7.200828691706457e-06, "loss": 2.2436, "step": 490850 }, { "epoch": 0.86, "learning_rate": 7.1999567517796295e-06, "loss": 2.3284, "step": 490860 }, { "epoch": 0.86, "learning_rate": 7.199084811852803e-06, "loss": 2.2175, "step": 490870 }, { "epoch": 0.86, "learning_rate": 7.198212871925976e-06, "loss": 2.1309, "step": 490880 }, { "epoch": 0.86, "learning_rate": 7.19734093199915e-06, "loss": 2.2811, "step": 490890 }, { "epoch": 0.86, "learning_rate": 7.196468992072322e-06, "loss": 2.2327, "step": 490900 }, { "epoch": 0.86, "learning_rate": 7.195597052145496e-06, "loss": 2.333, "step": 490910 }, { "epoch": 0.86, "learning_rate": 7.194725112218669e-06, "loss": 2.3091, "step": 490920 }, { "epoch": 0.86, "learning_rate": 7.1938531722918425e-06, "loss": 2.2529, "step": 490930 }, { "epoch": 0.86, "learning_rate": 7.1929812323650145e-06, "loss": 2.2789, "step": 490940 }, { "epoch": 0.86, "learning_rate": 7.192109292438188e-06, "loss": 2.3151, "step": 490950 }, { "epoch": 0.86, "learning_rate": 7.191237352511361e-06, "loss": 2.2324, "step": 490960 }, { "epoch": 0.86, "learning_rate": 7.190365412584535e-06, "loss": 2.4171, "step": 490970 }, { "epoch": 0.86, "learning_rate": 7.189493472657709e-06, "loss": 2.2538, "step": 490980 }, { "epoch": 0.86, "learning_rate": 7.188621532730881e-06, "loss": 2.262, "step": 490990 }, { "epoch": 0.86, "learning_rate": 7.187749592804055e-06, "loss": 2.202, "step": 491000 }, { "epoch": 0.86, "learning_rate": 7.1868776528772276e-06, "loss": 2.3304, "step": 491010 }, { "epoch": 0.86, "learning_rate": 7.186005712950401e-06, "loss": 2.2938, "step": 491020 }, { "epoch": 0.86, "learning_rate": 7.185133773023573e-06, "loss": 2.2364, "step": 491030 }, { "epoch": 0.86, "learning_rate": 7.184261833096748e-06, "loss": 2.2575, "step": 491040 }, { "epoch": 0.86, "learning_rate": 7.18338989316992e-06, "loss": 2.2477, "step": 491050 }, { "epoch": 0.86, "learning_rate": 7.182517953243094e-06, "loss": 2.2819, "step": 491060 }, { "epoch": 0.86, "learning_rate": 7.181646013316266e-06, "loss": 2.2582, "step": 491070 }, { "epoch": 0.86, "learning_rate": 7.1807740733894406e-06, "loss": 2.2606, "step": 491080 }, { "epoch": 0.86, "learning_rate": 7.179902133462613e-06, "loss": 2.2452, "step": 491090 }, { "epoch": 0.86, "learning_rate": 7.179030193535786e-06, "loss": 2.1988, "step": 491100 }, { "epoch": 0.86, "learning_rate": 7.17815825360896e-06, "loss": 2.2147, "step": 491110 }, { "epoch": 0.86, "learning_rate": 7.177286313682133e-06, "loss": 2.2347, "step": 491120 }, { "epoch": 0.86, "learning_rate": 7.176414373755307e-06, "loss": 2.2959, "step": 491130 }, { "epoch": 0.86, "learning_rate": 7.175542433828479e-06, "loss": 2.3285, "step": 491140 }, { "epoch": 0.86, "learning_rate": 7.174670493901653e-06, "loss": 2.3505, "step": 491150 }, { "epoch": 0.86, "learning_rate": 7.173798553974826e-06, "loss": 2.2911, "step": 491160 }, { "epoch": 0.86, "learning_rate": 7.172926614047999e-06, "loss": 2.2617, "step": 491170 }, { "epoch": 0.86, "learning_rate": 7.1720546741211715e-06, "loss": 2.2367, "step": 491180 }, { "epoch": 0.86, "learning_rate": 7.171182734194345e-06, "loss": 2.2482, "step": 491190 }, { "epoch": 0.86, "learning_rate": 7.170310794267518e-06, "loss": 2.2833, "step": 491200 }, { "epoch": 0.86, "learning_rate": 7.169438854340692e-06, "loss": 2.2375, "step": 491210 }, { "epoch": 0.86, "learning_rate": 7.168566914413864e-06, "loss": 2.2774, "step": 491220 }, { "epoch": 0.86, "learning_rate": 7.167694974487038e-06, "loss": 2.2396, "step": 491230 }, { "epoch": 0.86, "learning_rate": 7.1668230345602116e-06, "loss": 2.2629, "step": 491240 }, { "epoch": 0.86, "learning_rate": 7.1659510946333845e-06, "loss": 2.2728, "step": 491250 }, { "epoch": 0.86, "learning_rate": 7.165079154706558e-06, "loss": 2.3715, "step": 491260 }, { "epoch": 0.86, "learning_rate": 7.16420721477973e-06, "loss": 2.3131, "step": 491270 }, { "epoch": 0.86, "learning_rate": 7.163335274852904e-06, "loss": 2.3197, "step": 491280 }, { "epoch": 0.86, "learning_rate": 7.162463334926077e-06, "loss": 2.3056, "step": 491290 }, { "epoch": 0.86, "learning_rate": 7.161591394999251e-06, "loss": 2.3058, "step": 491300 }, { "epoch": 0.86, "learning_rate": 7.160719455072423e-06, "loss": 2.1736, "step": 491310 }, { "epoch": 0.86, "learning_rate": 7.1598475151455975e-06, "loss": 2.285, "step": 491320 }, { "epoch": 0.86, "learning_rate": 7.1589755752187696e-06, "loss": 2.3253, "step": 491330 }, { "epoch": 0.86, "learning_rate": 7.158103635291943e-06, "loss": 2.1655, "step": 491340 }, { "epoch": 0.86, "learning_rate": 7.157231695365116e-06, "loss": 2.3626, "step": 491350 }, { "epoch": 0.86, "learning_rate": 7.15635975543829e-06, "loss": 2.2398, "step": 491360 }, { "epoch": 0.86, "learning_rate": 7.155487815511464e-06, "loss": 2.2916, "step": 491370 }, { "epoch": 0.86, "learning_rate": 7.154615875584636e-06, "loss": 2.2638, "step": 491380 }, { "epoch": 0.86, "learning_rate": 7.15374393565781e-06, "loss": 2.308, "step": 491390 }, { "epoch": 0.86, "learning_rate": 7.1528719957309826e-06, "loss": 2.4081, "step": 491400 }, { "epoch": 0.86, "learning_rate": 7.152000055804156e-06, "loss": 2.3345, "step": 491410 }, { "epoch": 0.86, "learning_rate": 7.151128115877328e-06, "loss": 2.2071, "step": 491420 }, { "epoch": 0.86, "learning_rate": 7.150256175950502e-06, "loss": 2.2828, "step": 491430 }, { "epoch": 0.86, "learning_rate": 7.149384236023675e-06, "loss": 2.2848, "step": 491440 }, { "epoch": 0.86, "learning_rate": 7.148512296096849e-06, "loss": 2.1753, "step": 491450 }, { "epoch": 0.86, "learning_rate": 7.147640356170021e-06, "loss": 2.3245, "step": 491460 }, { "epoch": 0.86, "learning_rate": 7.146768416243195e-06, "loss": 2.3237, "step": 491470 }, { "epoch": 0.86, "learning_rate": 7.145896476316368e-06, "loss": 2.3745, "step": 491480 }, { "epoch": 0.86, "learning_rate": 7.145024536389541e-06, "loss": 2.2108, "step": 491490 }, { "epoch": 0.86, "learning_rate": 7.144152596462715e-06, "loss": 2.2238, "step": 491500 }, { "epoch": 0.86, "learning_rate": 7.143280656535887e-06, "loss": 2.3076, "step": 491510 }, { "epoch": 0.86, "learning_rate": 7.142408716609061e-06, "loss": 2.252, "step": 491520 }, { "epoch": 0.86, "learning_rate": 7.141536776682234e-06, "loss": 2.3689, "step": 491530 }, { "epoch": 0.86, "learning_rate": 7.140664836755408e-06, "loss": 2.2149, "step": 491540 }, { "epoch": 0.86, "learning_rate": 7.13979289682858e-06, "loss": 2.4114, "step": 491550 }, { "epoch": 0.86, "learning_rate": 7.138920956901754e-06, "loss": 2.2376, "step": 491560 }, { "epoch": 0.86, "learning_rate": 7.1380490169749265e-06, "loss": 2.2119, "step": 491570 }, { "epoch": 0.86, "learning_rate": 7.1371770770481e-06, "loss": 2.2693, "step": 491580 }, { "epoch": 0.86, "learning_rate": 7.136305137121272e-06, "loss": 2.3823, "step": 491590 }, { "epoch": 0.86, "learning_rate": 7.135433197194447e-06, "loss": 2.3516, "step": 491600 }, { "epoch": 0.86, "learning_rate": 7.134561257267619e-06, "loss": 2.3695, "step": 491610 }, { "epoch": 0.86, "learning_rate": 7.133689317340793e-06, "loss": 2.2496, "step": 491620 }, { "epoch": 0.86, "learning_rate": 7.1328173774139666e-06, "loss": 2.2539, "step": 491630 }, { "epoch": 0.86, "learning_rate": 7.1319454374871395e-06, "loss": 2.2693, "step": 491640 }, { "epoch": 0.86, "learning_rate": 7.131073497560313e-06, "loss": 2.1577, "step": 491650 }, { "epoch": 0.86, "learning_rate": 7.130201557633485e-06, "loss": 2.2777, "step": 491660 }, { "epoch": 0.86, "learning_rate": 7.129329617706659e-06, "loss": 2.2711, "step": 491670 }, { "epoch": 0.86, "learning_rate": 7.128457677779832e-06, "loss": 2.2505, "step": 491680 }, { "epoch": 0.86, "learning_rate": 7.127585737853006e-06, "loss": 2.3252, "step": 491690 }, { "epoch": 0.86, "learning_rate": 7.126713797926178e-06, "loss": 2.2518, "step": 491700 }, { "epoch": 0.86, "learning_rate": 7.125841857999352e-06, "loss": 2.273, "step": 491710 }, { "epoch": 0.86, "learning_rate": 7.1249699180725246e-06, "loss": 2.3634, "step": 491720 }, { "epoch": 0.86, "learning_rate": 7.124097978145698e-06, "loss": 2.3221, "step": 491730 }, { "epoch": 0.86, "learning_rate": 7.12322603821887e-06, "loss": 2.2884, "step": 491740 }, { "epoch": 0.86, "learning_rate": 7.122354098292044e-06, "loss": 2.2642, "step": 491750 }, { "epoch": 0.86, "learning_rate": 7.121482158365217e-06, "loss": 2.2908, "step": 491760 }, { "epoch": 0.86, "learning_rate": 7.120610218438391e-06, "loss": 2.3513, "step": 491770 }, { "epoch": 0.86, "learning_rate": 7.119738278511565e-06, "loss": 2.1703, "step": 491780 }, { "epoch": 0.86, "learning_rate": 7.118866338584737e-06, "loss": 2.3353, "step": 491790 }, { "epoch": 0.86, "learning_rate": 7.1179943986579105e-06, "loss": 2.2966, "step": 491800 }, { "epoch": 0.86, "learning_rate": 7.117122458731083e-06, "loss": 2.3196, "step": 491810 }, { "epoch": 0.86, "learning_rate": 7.116250518804257e-06, "loss": 2.2236, "step": 491820 }, { "epoch": 0.86, "learning_rate": 7.115378578877429e-06, "loss": 2.3005, "step": 491830 }, { "epoch": 0.86, "learning_rate": 7.114506638950604e-06, "loss": 2.2306, "step": 491840 }, { "epoch": 0.86, "learning_rate": 7.113634699023776e-06, "loss": 2.3426, "step": 491850 }, { "epoch": 0.86, "learning_rate": 7.11276275909695e-06, "loss": 2.176, "step": 491860 }, { "epoch": 0.86, "learning_rate": 7.111890819170123e-06, "loss": 2.192, "step": 491870 }, { "epoch": 0.86, "learning_rate": 7.111018879243296e-06, "loss": 2.273, "step": 491880 }, { "epoch": 0.86, "learning_rate": 7.1101469393164685e-06, "loss": 2.148, "step": 491890 }, { "epoch": 0.86, "learning_rate": 7.109274999389642e-06, "loss": 2.3241, "step": 491900 }, { "epoch": 0.86, "learning_rate": 7.108403059462816e-06, "loss": 2.2953, "step": 491910 }, { "epoch": 0.86, "learning_rate": 7.107531119535989e-06, "loss": 2.197, "step": 491920 }, { "epoch": 0.86, "learning_rate": 7.106659179609163e-06, "loss": 2.2428, "step": 491930 }, { "epoch": 0.86, "learning_rate": 7.105787239682335e-06, "loss": 2.2842, "step": 491940 }, { "epoch": 0.86, "learning_rate": 7.1049152997555086e-06, "loss": 2.3542, "step": 491950 }, { "epoch": 0.86, "learning_rate": 7.1040433598286815e-06, "loss": 2.3086, "step": 491960 }, { "epoch": 0.86, "learning_rate": 7.103171419901855e-06, "loss": 2.188, "step": 491970 }, { "epoch": 0.86, "learning_rate": 7.102299479975027e-06, "loss": 2.3268, "step": 491980 }, { "epoch": 0.86, "learning_rate": 7.101427540048201e-06, "loss": 2.2068, "step": 491990 }, { "epoch": 0.86, "learning_rate": 7.100555600121374e-06, "loss": 2.2462, "step": 492000 }, { "epoch": 0.86, "learning_rate": 7.099683660194548e-06, "loss": 2.2604, "step": 492010 }, { "epoch": 0.86, "learning_rate": 7.09881172026772e-06, "loss": 2.3068, "step": 492020 }, { "epoch": 0.86, "learning_rate": 7.097939780340894e-06, "loss": 2.2627, "step": 492030 }, { "epoch": 0.86, "learning_rate": 7.097067840414067e-06, "loss": 2.3703, "step": 492040 }, { "epoch": 0.86, "learning_rate": 7.09619590048724e-06, "loss": 2.2649, "step": 492050 }, { "epoch": 0.86, "learning_rate": 7.095323960560414e-06, "loss": 2.267, "step": 492060 }, { "epoch": 0.86, "learning_rate": 7.094452020633586e-06, "loss": 2.2518, "step": 492070 }, { "epoch": 0.86, "learning_rate": 7.093580080706761e-06, "loss": 2.1402, "step": 492080 }, { "epoch": 0.86, "learning_rate": 7.092708140779933e-06, "loss": 2.2791, "step": 492090 }, { "epoch": 0.86, "learning_rate": 7.091836200853107e-06, "loss": 2.3716, "step": 492100 }, { "epoch": 0.86, "learning_rate": 7.090964260926279e-06, "loss": 2.2451, "step": 492110 }, { "epoch": 0.86, "learning_rate": 7.090092320999453e-06, "loss": 2.3976, "step": 492120 }, { "epoch": 0.86, "learning_rate": 7.089220381072625e-06, "loss": 2.415, "step": 492130 }, { "epoch": 0.86, "learning_rate": 7.088348441145799e-06, "loss": 2.241, "step": 492140 }, { "epoch": 0.86, "learning_rate": 7.087476501218972e-06, "loss": 2.1811, "step": 492150 }, { "epoch": 0.86, "learning_rate": 7.086604561292146e-06, "loss": 2.3021, "step": 492160 }, { "epoch": 0.86, "learning_rate": 7.08573262136532e-06, "loss": 2.1775, "step": 492170 }, { "epoch": 0.86, "learning_rate": 7.084860681438492e-06, "loss": 2.2876, "step": 492180 }, { "epoch": 0.86, "learning_rate": 7.0839887415116655e-06, "loss": 2.2662, "step": 492190 }, { "epoch": 0.86, "learning_rate": 7.083116801584838e-06, "loss": 2.2319, "step": 492200 }, { "epoch": 0.86, "learning_rate": 7.082244861658012e-06, "loss": 2.3639, "step": 492210 }, { "epoch": 0.86, "learning_rate": 7.081372921731184e-06, "loss": 2.2274, "step": 492220 }, { "epoch": 0.86, "learning_rate": 7.080500981804358e-06, "loss": 2.2304, "step": 492230 }, { "epoch": 0.86, "learning_rate": 7.079629041877531e-06, "loss": 2.3087, "step": 492240 }, { "epoch": 0.86, "learning_rate": 7.078757101950705e-06, "loss": 2.2185, "step": 492250 }, { "epoch": 0.86, "learning_rate": 7.077885162023877e-06, "loss": 2.3446, "step": 492260 }, { "epoch": 0.86, "learning_rate": 7.0770132220970506e-06, "loss": 2.29, "step": 492270 }, { "epoch": 0.86, "learning_rate": 7.0761412821702235e-06, "loss": 2.1773, "step": 492280 }, { "epoch": 0.86, "learning_rate": 7.075269342243397e-06, "loss": 2.2835, "step": 492290 }, { "epoch": 0.86, "learning_rate": 7.074397402316571e-06, "loss": 2.2067, "step": 492300 }, { "epoch": 0.86, "learning_rate": 7.073525462389743e-06, "loss": 2.1986, "step": 492310 }, { "epoch": 0.86, "learning_rate": 7.072653522462917e-06, "loss": 2.166, "step": 492320 }, { "epoch": 0.86, "learning_rate": 7.07178158253609e-06, "loss": 2.3822, "step": 492330 }, { "epoch": 0.86, "learning_rate": 7.0709096426092636e-06, "loss": 2.3889, "step": 492340 }, { "epoch": 0.86, "learning_rate": 7.070037702682436e-06, "loss": 2.2556, "step": 492350 }, { "epoch": 0.86, "learning_rate": 7.06916576275561e-06, "loss": 2.2898, "step": 492360 }, { "epoch": 0.86, "learning_rate": 7.068293822828782e-06, "loss": 2.3172, "step": 492370 }, { "epoch": 0.86, "learning_rate": 7.067421882901956e-06, "loss": 2.3715, "step": 492380 }, { "epoch": 0.86, "learning_rate": 7.066549942975129e-06, "loss": 2.252, "step": 492390 }, { "epoch": 0.86, "learning_rate": 7.065678003048303e-06, "loss": 2.4679, "step": 492400 }, { "epoch": 0.86, "learning_rate": 7.064806063121475e-06, "loss": 2.268, "step": 492410 }, { "epoch": 0.86, "learning_rate": 7.063934123194649e-06, "loss": 2.2387, "step": 492420 }, { "epoch": 0.86, "learning_rate": 7.063062183267822e-06, "loss": 2.3308, "step": 492430 }, { "epoch": 0.86, "learning_rate": 7.062190243340995e-06, "loss": 2.1983, "step": 492440 }, { "epoch": 0.86, "learning_rate": 7.061318303414169e-06, "loss": 2.2995, "step": 492450 }, { "epoch": 0.86, "learning_rate": 7.060446363487341e-06, "loss": 2.2759, "step": 492460 }, { "epoch": 0.86, "learning_rate": 7.059574423560515e-06, "loss": 2.2394, "step": 492470 }, { "epoch": 0.86, "learning_rate": 7.058702483633688e-06, "loss": 2.3107, "step": 492480 }, { "epoch": 0.86, "learning_rate": 7.057830543706862e-06, "loss": 2.2147, "step": 492490 }, { "epoch": 0.86, "learning_rate": 7.056958603780034e-06, "loss": 2.1598, "step": 492500 }, { "epoch": 0.86, "learning_rate": 7.0560866638532075e-06, "loss": 2.2757, "step": 492510 }, { "epoch": 0.86, "learning_rate": 7.05521472392638e-06, "loss": 2.2957, "step": 492520 }, { "epoch": 0.86, "learning_rate": 7.054342783999554e-06, "loss": 2.2083, "step": 492530 }, { "epoch": 0.86, "learning_rate": 7.053470844072726e-06, "loss": 2.3185, "step": 492540 }, { "epoch": 0.86, "learning_rate": 7.0525989041459e-06, "loss": 2.4051, "step": 492550 }, { "epoch": 0.86, "learning_rate": 7.051726964219074e-06, "loss": 2.2514, "step": 492560 }, { "epoch": 0.86, "learning_rate": 7.050855024292247e-06, "loss": 2.2199, "step": 492570 }, { "epoch": 0.86, "learning_rate": 7.0499830843654205e-06, "loss": 2.2839, "step": 492580 }, { "epoch": 0.86, "learning_rate": 7.0491111444385926e-06, "loss": 2.2525, "step": 492590 }, { "epoch": 0.86, "learning_rate": 7.048239204511767e-06, "loss": 2.3305, "step": 492600 }, { "epoch": 0.86, "learning_rate": 7.047367264584939e-06, "loss": 2.3163, "step": 492610 }, { "epoch": 0.86, "learning_rate": 7.046495324658113e-06, "loss": 2.3509, "step": 492620 }, { "epoch": 0.86, "learning_rate": 7.045623384731285e-06, "loss": 2.1959, "step": 492630 }, { "epoch": 0.86, "learning_rate": 7.04475144480446e-06, "loss": 2.2636, "step": 492640 }, { "epoch": 0.86, "learning_rate": 7.043879504877632e-06, "loss": 2.3846, "step": 492650 }, { "epoch": 0.86, "learning_rate": 7.0430075649508056e-06, "loss": 2.2863, "step": 492660 }, { "epoch": 0.86, "learning_rate": 7.0421356250239785e-06, "loss": 2.2983, "step": 492670 }, { "epoch": 0.86, "learning_rate": 7.041263685097152e-06, "loss": 2.3423, "step": 492680 }, { "epoch": 0.86, "learning_rate": 7.040391745170324e-06, "loss": 2.1202, "step": 492690 }, { "epoch": 0.86, "learning_rate": 7.039519805243498e-06, "loss": 2.1706, "step": 492700 }, { "epoch": 0.86, "learning_rate": 7.038647865316672e-06, "loss": 2.2813, "step": 492710 }, { "epoch": 0.86, "learning_rate": 7.037775925389845e-06, "loss": 2.2591, "step": 492720 }, { "epoch": 0.86, "learning_rate": 7.0369039854630186e-06, "loss": 2.2748, "step": 492730 }, { "epoch": 0.86, "learning_rate": 7.036032045536191e-06, "loss": 2.3331, "step": 492740 }, { "epoch": 0.86, "learning_rate": 7.035160105609364e-06, "loss": 2.1277, "step": 492750 }, { "epoch": 0.86, "learning_rate": 7.034288165682537e-06, "loss": 2.2513, "step": 492760 }, { "epoch": 0.86, "learning_rate": 7.033416225755711e-06, "loss": 2.2047, "step": 492770 }, { "epoch": 0.86, "learning_rate": 7.032544285828883e-06, "loss": 2.248, "step": 492780 }, { "epoch": 0.86, "learning_rate": 7.031672345902057e-06, "loss": 2.3164, "step": 492790 }, { "epoch": 0.86, "learning_rate": 7.03080040597523e-06, "loss": 2.2632, "step": 492800 }, { "epoch": 0.86, "learning_rate": 7.029928466048404e-06, "loss": 2.2293, "step": 492810 }, { "epoch": 0.86, "learning_rate": 7.029056526121576e-06, "loss": 2.2279, "step": 492820 }, { "epoch": 0.86, "learning_rate": 7.0281845861947495e-06, "loss": 2.3302, "step": 492830 }, { "epoch": 0.86, "learning_rate": 7.027312646267923e-06, "loss": 2.3197, "step": 492840 }, { "epoch": 0.86, "learning_rate": 7.026440706341096e-06, "loss": 2.229, "step": 492850 }, { "epoch": 0.86, "learning_rate": 7.02556876641427e-06, "loss": 2.2661, "step": 492860 }, { "epoch": 0.86, "learning_rate": 7.024696826487442e-06, "loss": 2.2234, "step": 492870 }, { "epoch": 0.86, "learning_rate": 7.023824886560617e-06, "loss": 2.2048, "step": 492880 }, { "epoch": 0.86, "learning_rate": 7.022952946633789e-06, "loss": 2.3769, "step": 492890 }, { "epoch": 0.86, "learning_rate": 7.0220810067069625e-06, "loss": 2.2381, "step": 492900 }, { "epoch": 0.86, "learning_rate": 7.021209066780135e-06, "loss": 2.2385, "step": 492910 }, { "epoch": 0.86, "learning_rate": 7.020337126853309e-06, "loss": 2.275, "step": 492920 }, { "epoch": 0.86, "learning_rate": 7.019465186926481e-06, "loss": 2.2692, "step": 492930 }, { "epoch": 0.86, "learning_rate": 7.018593246999655e-06, "loss": 2.2923, "step": 492940 }, { "epoch": 0.86, "learning_rate": 7.017721307072828e-06, "loss": 2.3301, "step": 492950 }, { "epoch": 0.86, "learning_rate": 7.016849367146002e-06, "loss": 2.2932, "step": 492960 }, { "epoch": 0.86, "learning_rate": 7.0159774272191755e-06, "loss": 2.1555, "step": 492970 }, { "epoch": 0.86, "learning_rate": 7.0151054872923476e-06, "loss": 2.247, "step": 492980 }, { "epoch": 0.86, "learning_rate": 7.014233547365521e-06, "loss": 2.3397, "step": 492990 }, { "epoch": 0.86, "learning_rate": 7.013361607438694e-06, "loss": 2.3298, "step": 493000 }, { "epoch": 0.86, "learning_rate": 7.012489667511868e-06, "loss": 2.1598, "step": 493010 }, { "epoch": 0.86, "learning_rate": 7.01161772758504e-06, "loss": 2.1671, "step": 493020 }, { "epoch": 0.86, "learning_rate": 7.010745787658214e-06, "loss": 2.3906, "step": 493030 }, { "epoch": 0.86, "learning_rate": 7.009873847731387e-06, "loss": 2.2771, "step": 493040 }, { "epoch": 0.86, "learning_rate": 7.0090019078045606e-06, "loss": 2.4038, "step": 493050 }, { "epoch": 0.86, "learning_rate": 7.008129967877733e-06, "loss": 2.3138, "step": 493060 }, { "epoch": 0.86, "learning_rate": 7.007258027950906e-06, "loss": 2.2129, "step": 493070 }, { "epoch": 0.86, "learning_rate": 7.006386088024079e-06, "loss": 2.3145, "step": 493080 }, { "epoch": 0.86, "learning_rate": 7.005514148097253e-06, "loss": 2.3518, "step": 493090 }, { "epoch": 0.86, "learning_rate": 7.004642208170427e-06, "loss": 2.2899, "step": 493100 }, { "epoch": 0.86, "learning_rate": 7.003770268243599e-06, "loss": 2.2048, "step": 493110 }, { "epoch": 0.86, "learning_rate": 7.0028983283167736e-06, "loss": 2.2867, "step": 493120 }, { "epoch": 0.86, "learning_rate": 7.002026388389946e-06, "loss": 2.2658, "step": 493130 }, { "epoch": 0.86, "learning_rate": 7.001154448463119e-06, "loss": 2.2669, "step": 493140 }, { "epoch": 0.86, "learning_rate": 7.000282508536292e-06, "loss": 2.2707, "step": 493150 }, { "epoch": 0.86, "learning_rate": 6.999410568609466e-06, "loss": 2.3003, "step": 493160 }, { "epoch": 0.86, "learning_rate": 6.998538628682638e-06, "loss": 2.246, "step": 493170 }, { "epoch": 0.86, "learning_rate": 6.997666688755812e-06, "loss": 2.1995, "step": 493180 }, { "epoch": 0.86, "learning_rate": 6.996794748828985e-06, "loss": 2.3261, "step": 493190 }, { "epoch": 0.86, "learning_rate": 6.995922808902159e-06, "loss": 2.2565, "step": 493200 }, { "epoch": 0.86, "learning_rate": 6.995050868975331e-06, "loss": 2.2452, "step": 493210 }, { "epoch": 0.86, "learning_rate": 6.9941789290485045e-06, "loss": 2.2415, "step": 493220 }, { "epoch": 0.86, "learning_rate": 6.993306989121678e-06, "loss": 2.232, "step": 493230 }, { "epoch": 0.86, "learning_rate": 6.992435049194851e-06, "loss": 2.2527, "step": 493240 }, { "epoch": 0.86, "learning_rate": 6.991563109268025e-06, "loss": 2.2259, "step": 493250 }, { "epoch": 0.86, "learning_rate": 6.990691169341197e-06, "loss": 2.2903, "step": 493260 }, { "epoch": 0.86, "learning_rate": 6.989819229414371e-06, "loss": 2.2564, "step": 493270 }, { "epoch": 0.86, "learning_rate": 6.988947289487544e-06, "loss": 2.3334, "step": 493280 }, { "epoch": 0.86, "learning_rate": 6.9880753495607175e-06, "loss": 2.249, "step": 493290 }, { "epoch": 0.86, "learning_rate": 6.9872034096338896e-06, "loss": 2.2013, "step": 493300 }, { "epoch": 0.86, "learning_rate": 6.986331469707063e-06, "loss": 2.3594, "step": 493310 }, { "epoch": 0.86, "learning_rate": 6.985459529780236e-06, "loss": 2.1805, "step": 493320 }, { "epoch": 0.86, "learning_rate": 6.98458758985341e-06, "loss": 2.2813, "step": 493330 }, { "epoch": 0.86, "learning_rate": 6.983715649926582e-06, "loss": 2.3558, "step": 493340 }, { "epoch": 0.86, "learning_rate": 6.982843709999756e-06, "loss": 2.2561, "step": 493350 }, { "epoch": 0.86, "learning_rate": 6.9819717700729305e-06, "loss": 2.3435, "step": 493360 }, { "epoch": 0.86, "learning_rate": 6.9810998301461026e-06, "loss": 2.3056, "step": 493370 }, { "epoch": 0.86, "learning_rate": 6.980227890219276e-06, "loss": 2.3097, "step": 493380 }, { "epoch": 0.86, "learning_rate": 6.979355950292448e-06, "loss": 2.3446, "step": 493390 }, { "epoch": 0.86, "learning_rate": 6.978484010365623e-06, "loss": 2.2499, "step": 493400 }, { "epoch": 0.86, "learning_rate": 6.977612070438795e-06, "loss": 2.2601, "step": 493410 }, { "epoch": 0.86, "learning_rate": 6.976740130511969e-06, "loss": 2.3857, "step": 493420 }, { "epoch": 0.86, "learning_rate": 6.975868190585142e-06, "loss": 2.2299, "step": 493430 }, { "epoch": 0.86, "learning_rate": 6.9749962506583156e-06, "loss": 2.2769, "step": 493440 }, { "epoch": 0.86, "learning_rate": 6.974124310731488e-06, "loss": 2.26, "step": 493450 }, { "epoch": 0.86, "learning_rate": 6.973252370804661e-06, "loss": 2.2788, "step": 493460 }, { "epoch": 0.86, "learning_rate": 6.972380430877834e-06, "loss": 2.2937, "step": 493470 }, { "epoch": 0.86, "learning_rate": 6.971508490951008e-06, "loss": 2.3094, "step": 493480 }, { "epoch": 0.86, "learning_rate": 6.97063655102418e-06, "loss": 2.2693, "step": 493490 }, { "epoch": 0.86, "learning_rate": 6.969764611097354e-06, "loss": 2.2856, "step": 493500 }, { "epoch": 0.86, "learning_rate": 6.968892671170528e-06, "loss": 2.2143, "step": 493510 }, { "epoch": 0.86, "learning_rate": 6.968020731243701e-06, "loss": 2.3052, "step": 493520 }, { "epoch": 0.86, "learning_rate": 6.967148791316874e-06, "loss": 2.2432, "step": 493530 }, { "epoch": 0.86, "learning_rate": 6.9662768513900465e-06, "loss": 2.2899, "step": 493540 }, { "epoch": 0.86, "learning_rate": 6.96540491146322e-06, "loss": 2.303, "step": 493550 }, { "epoch": 0.86, "learning_rate": 6.964532971536393e-06, "loss": 2.2357, "step": 493560 }, { "epoch": 0.86, "learning_rate": 6.963661031609567e-06, "loss": 2.2526, "step": 493570 }, { "epoch": 0.86, "learning_rate": 6.962789091682739e-06, "loss": 2.1885, "step": 493580 }, { "epoch": 0.86, "learning_rate": 6.961917151755913e-06, "loss": 2.2284, "step": 493590 }, { "epoch": 0.86, "learning_rate": 6.961045211829086e-06, "loss": 2.2116, "step": 493600 }, { "epoch": 0.86, "learning_rate": 6.9601732719022595e-06, "loss": 2.316, "step": 493610 }, { "epoch": 0.86, "learning_rate": 6.9593013319754316e-06, "loss": 2.2843, "step": 493620 }, { "epoch": 0.86, "learning_rate": 6.958429392048605e-06, "loss": 2.2663, "step": 493630 }, { "epoch": 0.86, "learning_rate": 6.95755745212178e-06, "loss": 2.3515, "step": 493640 }, { "epoch": 0.86, "learning_rate": 6.956685512194952e-06, "loss": 2.2624, "step": 493650 }, { "epoch": 0.86, "learning_rate": 6.955813572268126e-06, "loss": 2.2965, "step": 493660 }, { "epoch": 0.86, "learning_rate": 6.954941632341299e-06, "loss": 2.2894, "step": 493670 }, { "epoch": 0.86, "learning_rate": 6.9540696924144725e-06, "loss": 2.2458, "step": 493680 }, { "epoch": 0.86, "learning_rate": 6.9531977524876446e-06, "loss": 2.2076, "step": 493690 }, { "epoch": 0.86, "learning_rate": 6.952325812560818e-06, "loss": 2.2601, "step": 493700 }, { "epoch": 0.86, "learning_rate": 6.951453872633991e-06, "loss": 2.2887, "step": 493710 }, { "epoch": 0.86, "learning_rate": 6.950581932707165e-06, "loss": 2.2356, "step": 493720 }, { "epoch": 0.86, "learning_rate": 6.949709992780337e-06, "loss": 2.2468, "step": 493730 }, { "epoch": 0.86, "learning_rate": 6.948838052853511e-06, "loss": 2.2699, "step": 493740 }, { "epoch": 0.86, "learning_rate": 6.947966112926684e-06, "loss": 2.1775, "step": 493750 }, { "epoch": 0.86, "learning_rate": 6.9470941729998576e-06, "loss": 2.3336, "step": 493760 }, { "epoch": 0.86, "learning_rate": 6.946222233073031e-06, "loss": 2.3073, "step": 493770 }, { "epoch": 0.86, "learning_rate": 6.945350293146203e-06, "loss": 2.4057, "step": 493780 }, { "epoch": 0.86, "learning_rate": 6.944478353219377e-06, "loss": 2.1868, "step": 493790 }, { "epoch": 0.86, "learning_rate": 6.94360641329255e-06, "loss": 2.3896, "step": 493800 }, { "epoch": 0.86, "learning_rate": 6.942734473365724e-06, "loss": 2.3032, "step": 493810 }, { "epoch": 0.86, "learning_rate": 6.941862533438896e-06, "loss": 2.2338, "step": 493820 }, { "epoch": 0.86, "learning_rate": 6.94099059351207e-06, "loss": 2.2604, "step": 493830 }, { "epoch": 0.86, "learning_rate": 6.940118653585243e-06, "loss": 2.2255, "step": 493840 }, { "epoch": 0.86, "learning_rate": 6.939246713658416e-06, "loss": 2.4237, "step": 493850 }, { "epoch": 0.86, "learning_rate": 6.9383747737315885e-06, "loss": 2.1819, "step": 493860 }, { "epoch": 0.86, "learning_rate": 6.937502833804762e-06, "loss": 2.175, "step": 493870 }, { "epoch": 0.86, "learning_rate": 6.936630893877935e-06, "loss": 2.2294, "step": 493880 }, { "epoch": 0.86, "learning_rate": 6.935758953951109e-06, "loss": 2.4538, "step": 493890 }, { "epoch": 0.86, "learning_rate": 6.934887014024283e-06, "loss": 2.1606, "step": 493900 }, { "epoch": 0.86, "learning_rate": 6.934015074097455e-06, "loss": 2.3045, "step": 493910 }, { "epoch": 0.86, "learning_rate": 6.933143134170629e-06, "loss": 2.2781, "step": 493920 }, { "epoch": 0.86, "learning_rate": 6.9322711942438015e-06, "loss": 2.2394, "step": 493930 }, { "epoch": 0.86, "learning_rate": 6.931399254316975e-06, "loss": 2.2605, "step": 493940 }, { "epoch": 0.86, "learning_rate": 6.930527314390148e-06, "loss": 2.2258, "step": 493950 }, { "epoch": 0.86, "learning_rate": 6.929655374463322e-06, "loss": 2.1637, "step": 493960 }, { "epoch": 0.86, "learning_rate": 6.928783434536494e-06, "loss": 2.2622, "step": 493970 }, { "epoch": 0.86, "learning_rate": 6.927911494609668e-06, "loss": 2.213, "step": 493980 }, { "epoch": 0.86, "learning_rate": 6.927039554682841e-06, "loss": 2.3772, "step": 493990 }, { "epoch": 0.86, "learning_rate": 6.9261676147560145e-06, "loss": 2.1914, "step": 494000 }, { "epoch": 0.86, "learning_rate": 6.9252956748291866e-06, "loss": 2.1667, "step": 494010 }, { "epoch": 0.86, "learning_rate": 6.92442373490236e-06, "loss": 2.257, "step": 494020 }, { "epoch": 0.86, "learning_rate": 6.923551794975534e-06, "loss": 2.2518, "step": 494030 }, { "epoch": 0.86, "learning_rate": 6.922679855048707e-06, "loss": 2.2805, "step": 494040 }, { "epoch": 0.86, "learning_rate": 6.921807915121881e-06, "loss": 2.1944, "step": 494050 }, { "epoch": 0.86, "learning_rate": 6.920935975195053e-06, "loss": 2.2594, "step": 494060 }, { "epoch": 0.86, "learning_rate": 6.920064035268227e-06, "loss": 2.1558, "step": 494070 }, { "epoch": 0.86, "learning_rate": 6.9191920953414e-06, "loss": 2.2425, "step": 494080 }, { "epoch": 0.86, "learning_rate": 6.918320155414573e-06, "loss": 2.3517, "step": 494090 }, { "epoch": 0.86, "learning_rate": 6.917448215487745e-06, "loss": 2.3403, "step": 494100 }, { "epoch": 0.86, "learning_rate": 6.916576275560919e-06, "loss": 2.2275, "step": 494110 }, { "epoch": 0.86, "learning_rate": 6.915704335634092e-06, "loss": 2.2435, "step": 494120 }, { "epoch": 0.86, "learning_rate": 6.914832395707266e-06, "loss": 2.2853, "step": 494130 }, { "epoch": 0.86, "learning_rate": 6.913960455780438e-06, "loss": 2.3753, "step": 494140 }, { "epoch": 0.86, "learning_rate": 6.913088515853612e-06, "loss": 2.335, "step": 494150 }, { "epoch": 0.86, "learning_rate": 6.912216575926786e-06, "loss": 2.3265, "step": 494160 }, { "epoch": 0.86, "learning_rate": 6.9113446359999584e-06, "loss": 2.2078, "step": 494170 }, { "epoch": 0.86, "learning_rate": 6.910472696073132e-06, "loss": 2.3712, "step": 494180 }, { "epoch": 0.86, "learning_rate": 6.909600756146305e-06, "loss": 2.246, "step": 494190 }, { "epoch": 0.86, "learning_rate": 6.908728816219479e-06, "loss": 2.2593, "step": 494200 }, { "epoch": 0.86, "learning_rate": 6.907856876292651e-06, "loss": 2.2813, "step": 494210 }, { "epoch": 0.86, "learning_rate": 6.906984936365825e-06, "loss": 2.2689, "step": 494220 }, { "epoch": 0.86, "learning_rate": 6.906112996438998e-06, "loss": 2.3262, "step": 494230 }, { "epoch": 0.86, "learning_rate": 6.9052410565121714e-06, "loss": 2.2975, "step": 494240 }, { "epoch": 0.86, "learning_rate": 6.9043691165853435e-06, "loss": 2.3202, "step": 494250 }, { "epoch": 0.86, "learning_rate": 6.903497176658517e-06, "loss": 2.2635, "step": 494260 }, { "epoch": 0.86, "learning_rate": 6.90262523673169e-06, "loss": 2.1557, "step": 494270 }, { "epoch": 0.86, "learning_rate": 6.901753296804864e-06, "loss": 2.1736, "step": 494280 }, { "epoch": 0.86, "learning_rate": 6.900881356878038e-06, "loss": 2.3028, "step": 494290 }, { "epoch": 0.86, "learning_rate": 6.90000941695121e-06, "loss": 2.2788, "step": 494300 }, { "epoch": 0.86, "learning_rate": 6.899137477024384e-06, "loss": 2.2355, "step": 494310 }, { "epoch": 0.86, "learning_rate": 6.8982655370975565e-06, "loss": 2.4365, "step": 494320 }, { "epoch": 0.86, "learning_rate": 6.89739359717073e-06, "loss": 2.2381, "step": 494330 }, { "epoch": 0.86, "learning_rate": 6.896521657243902e-06, "loss": 2.2849, "step": 494340 }, { "epoch": 0.86, "learning_rate": 6.895649717317076e-06, "loss": 2.1855, "step": 494350 }, { "epoch": 0.86, "learning_rate": 6.894777777390249e-06, "loss": 2.2542, "step": 494360 }, { "epoch": 0.86, "learning_rate": 6.893905837463423e-06, "loss": 2.3094, "step": 494370 }, { "epoch": 0.86, "learning_rate": 6.893033897536595e-06, "loss": 2.1885, "step": 494380 }, { "epoch": 0.86, "learning_rate": 6.892161957609769e-06, "loss": 2.2973, "step": 494390 }, { "epoch": 0.86, "learning_rate": 6.891290017682942e-06, "loss": 2.3519, "step": 494400 }, { "epoch": 0.86, "learning_rate": 6.890418077756115e-06, "loss": 2.2632, "step": 494410 }, { "epoch": 0.86, "learning_rate": 6.8895461378292874e-06, "loss": 2.132, "step": 494420 }, { "epoch": 0.86, "learning_rate": 6.888674197902461e-06, "loss": 2.2477, "step": 494430 }, { "epoch": 0.86, "learning_rate": 6.887802257975636e-06, "loss": 2.3418, "step": 494440 }, { "epoch": 0.86, "learning_rate": 6.886930318048808e-06, "loss": 2.3013, "step": 494450 }, { "epoch": 0.86, "learning_rate": 6.886058378121982e-06, "loss": 2.3442, "step": 494460 }, { "epoch": 0.86, "learning_rate": 6.885186438195155e-06, "loss": 2.2954, "step": 494470 }, { "epoch": 0.86, "learning_rate": 6.884314498268328e-06, "loss": 2.2547, "step": 494480 }, { "epoch": 0.86, "learning_rate": 6.8834425583415004e-06, "loss": 2.1425, "step": 494490 }, { "epoch": 0.86, "learning_rate": 6.882570618414674e-06, "loss": 2.369, "step": 494500 }, { "epoch": 0.86, "learning_rate": 6.881698678487847e-06, "loss": 2.2156, "step": 494510 }, { "epoch": 0.86, "learning_rate": 6.880826738561021e-06, "loss": 2.3663, "step": 494520 }, { "epoch": 0.86, "learning_rate": 6.879954798634193e-06, "loss": 2.2695, "step": 494530 }, { "epoch": 0.86, "learning_rate": 6.879082858707367e-06, "loss": 2.2013, "step": 494540 }, { "epoch": 0.86, "learning_rate": 6.87821091878054e-06, "loss": 2.2853, "step": 494550 }, { "epoch": 0.86, "learning_rate": 6.8773389788537134e-06, "loss": 2.174, "step": 494560 }, { "epoch": 0.86, "learning_rate": 6.876467038926887e-06, "loss": 2.2519, "step": 494570 }, { "epoch": 0.86, "learning_rate": 6.875595099000059e-06, "loss": 2.4297, "step": 494580 }, { "epoch": 0.86, "learning_rate": 6.874723159073233e-06, "loss": 2.2577, "step": 494590 }, { "epoch": 0.86, "learning_rate": 6.873851219146406e-06, "loss": 2.2446, "step": 494600 }, { "epoch": 0.86, "learning_rate": 6.87297927921958e-06, "loss": 2.2195, "step": 494610 }, { "epoch": 0.86, "learning_rate": 6.872107339292752e-06, "loss": 2.3473, "step": 494620 }, { "epoch": 0.86, "learning_rate": 6.871235399365926e-06, "loss": 2.1609, "step": 494630 }, { "epoch": 0.86, "learning_rate": 6.8703634594390985e-06, "loss": 2.1663, "step": 494640 }, { "epoch": 0.86, "learning_rate": 6.869491519512272e-06, "loss": 2.2799, "step": 494650 }, { "epoch": 0.86, "learning_rate": 6.868619579585444e-06, "loss": 2.1754, "step": 494660 }, { "epoch": 0.86, "learning_rate": 6.867747639658618e-06, "loss": 2.3741, "step": 494670 }, { "epoch": 0.86, "learning_rate": 6.866875699731791e-06, "loss": 2.2911, "step": 494680 }, { "epoch": 0.86, "learning_rate": 6.866003759804965e-06, "loss": 2.2381, "step": 494690 }, { "epoch": 0.86, "learning_rate": 6.865131819878139e-06, "loss": 2.249, "step": 494700 }, { "epoch": 0.86, "learning_rate": 6.8642598799513115e-06, "loss": 2.2972, "step": 494710 }, { "epoch": 0.86, "learning_rate": 6.863387940024485e-06, "loss": 2.3474, "step": 494720 }, { "epoch": 0.86, "learning_rate": 6.862516000097657e-06, "loss": 2.2827, "step": 494730 }, { "epoch": 0.86, "learning_rate": 6.861644060170831e-06, "loss": 2.2396, "step": 494740 }, { "epoch": 0.86, "learning_rate": 6.860772120244004e-06, "loss": 2.2831, "step": 494750 }, { "epoch": 0.86, "learning_rate": 6.859900180317178e-06, "loss": 2.2551, "step": 494760 }, { "epoch": 0.86, "learning_rate": 6.85902824039035e-06, "loss": 2.3341, "step": 494770 }, { "epoch": 0.86, "learning_rate": 6.858156300463524e-06, "loss": 2.18, "step": 494780 }, { "epoch": 0.86, "learning_rate": 6.857284360536697e-06, "loss": 2.3317, "step": 494790 }, { "epoch": 0.86, "learning_rate": 6.85641242060987e-06, "loss": 2.3285, "step": 494800 }, { "epoch": 0.86, "learning_rate": 6.8555404806830424e-06, "loss": 2.1835, "step": 494810 }, { "epoch": 0.86, "learning_rate": 6.854668540756216e-06, "loss": 2.241, "step": 494820 }, { "epoch": 0.86, "learning_rate": 6.85379660082939e-06, "loss": 2.2664, "step": 494830 }, { "epoch": 0.86, "learning_rate": 6.852924660902563e-06, "loss": 2.3555, "step": 494840 }, { "epoch": 0.86, "learning_rate": 6.852052720975737e-06, "loss": 2.2827, "step": 494850 }, { "epoch": 0.86, "learning_rate": 6.851180781048909e-06, "loss": 2.2121, "step": 494860 }, { "epoch": 0.86, "learning_rate": 6.8503088411220825e-06, "loss": 2.3567, "step": 494870 }, { "epoch": 0.86, "learning_rate": 6.8494369011952554e-06, "loss": 2.3041, "step": 494880 }, { "epoch": 0.86, "learning_rate": 6.848564961268429e-06, "loss": 2.1218, "step": 494890 }, { "epoch": 0.86, "learning_rate": 6.847693021341601e-06, "loss": 2.3986, "step": 494900 }, { "epoch": 0.86, "learning_rate": 6.846821081414775e-06, "loss": 2.3006, "step": 494910 }, { "epoch": 0.86, "learning_rate": 6.845949141487948e-06, "loss": 2.3612, "step": 494920 }, { "epoch": 0.86, "learning_rate": 6.845077201561122e-06, "loss": 2.3564, "step": 494930 }, { "epoch": 0.86, "learning_rate": 6.844205261634294e-06, "loss": 2.2648, "step": 494940 }, { "epoch": 0.86, "learning_rate": 6.843333321707468e-06, "loss": 2.2063, "step": 494950 }, { "epoch": 0.86, "learning_rate": 6.842461381780642e-06, "loss": 2.3429, "step": 494960 }, { "epoch": 0.86, "learning_rate": 6.841589441853814e-06, "loss": 2.1973, "step": 494970 }, { "epoch": 0.86, "learning_rate": 6.840717501926988e-06, "loss": 2.2993, "step": 494980 }, { "epoch": 0.86, "learning_rate": 6.839845562000161e-06, "loss": 2.2689, "step": 494990 }, { "epoch": 0.86, "learning_rate": 6.838973622073335e-06, "loss": 2.1457, "step": 495000 }, { "epoch": 0.86, "learning_rate": 6.838101682146507e-06, "loss": 2.2821, "step": 495010 }, { "epoch": 0.86, "learning_rate": 6.837229742219681e-06, "loss": 2.3167, "step": 495020 }, { "epoch": 0.86, "learning_rate": 6.8363578022928535e-06, "loss": 2.3984, "step": 495030 }, { "epoch": 0.86, "learning_rate": 6.835485862366027e-06, "loss": 2.243, "step": 495040 }, { "epoch": 0.86, "learning_rate": 6.834613922439199e-06, "loss": 2.3946, "step": 495050 }, { "epoch": 0.86, "learning_rate": 6.833741982512373e-06, "loss": 2.2791, "step": 495060 }, { "epoch": 0.86, "learning_rate": 6.832870042585546e-06, "loss": 2.3226, "step": 495070 }, { "epoch": 0.86, "learning_rate": 6.83199810265872e-06, "loss": 2.2489, "step": 495080 }, { "epoch": 0.86, "learning_rate": 6.831126162731894e-06, "loss": 2.3572, "step": 495090 }, { "epoch": 0.86, "learning_rate": 6.830254222805066e-06, "loss": 2.2141, "step": 495100 }, { "epoch": 0.86, "learning_rate": 6.8293822828782394e-06, "loss": 2.2381, "step": 495110 }, { "epoch": 0.86, "learning_rate": 6.828510342951412e-06, "loss": 2.2641, "step": 495120 }, { "epoch": 0.86, "learning_rate": 6.827638403024586e-06, "loss": 2.3152, "step": 495130 }, { "epoch": 0.86, "learning_rate": 6.826766463097758e-06, "loss": 2.2922, "step": 495140 }, { "epoch": 0.86, "learning_rate": 6.825894523170932e-06, "loss": 2.2134, "step": 495150 }, { "epoch": 0.86, "learning_rate": 6.825022583244105e-06, "loss": 2.2382, "step": 495160 }, { "epoch": 0.86, "learning_rate": 6.824150643317279e-06, "loss": 2.294, "step": 495170 }, { "epoch": 0.86, "learning_rate": 6.823278703390451e-06, "loss": 2.257, "step": 495180 }, { "epoch": 0.86, "learning_rate": 6.8224067634636245e-06, "loss": 2.2597, "step": 495190 }, { "epoch": 0.86, "learning_rate": 6.8215348235367974e-06, "loss": 2.3223, "step": 495200 }, { "epoch": 0.86, "learning_rate": 6.820662883609971e-06, "loss": 2.3986, "step": 495210 }, { "epoch": 0.86, "learning_rate": 6.819790943683143e-06, "loss": 2.1784, "step": 495220 }, { "epoch": 0.86, "learning_rate": 6.818919003756318e-06, "loss": 2.3564, "step": 495230 }, { "epoch": 0.86, "learning_rate": 6.818047063829492e-06, "loss": 2.3773, "step": 495240 }, { "epoch": 0.86, "learning_rate": 6.817175123902664e-06, "loss": 2.1704, "step": 495250 }, { "epoch": 0.86, "learning_rate": 6.8163031839758375e-06, "loss": 2.3365, "step": 495260 }, { "epoch": 0.86, "learning_rate": 6.8154312440490104e-06, "loss": 2.2069, "step": 495270 }, { "epoch": 0.86, "learning_rate": 6.814559304122184e-06, "loss": 2.161, "step": 495280 }, { "epoch": 0.86, "learning_rate": 6.813687364195356e-06, "loss": 2.324, "step": 495290 }, { "epoch": 0.86, "learning_rate": 6.81281542426853e-06, "loss": 2.1686, "step": 495300 }, { "epoch": 0.86, "learning_rate": 6.811943484341703e-06, "loss": 2.3227, "step": 495310 }, { "epoch": 0.86, "learning_rate": 6.811071544414877e-06, "loss": 2.2339, "step": 495320 }, { "epoch": 0.86, "learning_rate": 6.810199604488049e-06, "loss": 2.272, "step": 495330 }, { "epoch": 0.86, "learning_rate": 6.809327664561223e-06, "loss": 2.2856, "step": 495340 }, { "epoch": 0.86, "learning_rate": 6.8084557246343955e-06, "loss": 2.224, "step": 495350 }, { "epoch": 0.86, "learning_rate": 6.807583784707569e-06, "loss": 2.2811, "step": 495360 }, { "epoch": 0.86, "learning_rate": 6.806711844780743e-06, "loss": 2.2378, "step": 495370 }, { "epoch": 0.86, "learning_rate": 6.805839904853915e-06, "loss": 2.2971, "step": 495380 }, { "epoch": 0.86, "learning_rate": 6.804967964927089e-06, "loss": 2.1687, "step": 495390 }, { "epoch": 0.86, "learning_rate": 6.804096025000262e-06, "loss": 2.3633, "step": 495400 }, { "epoch": 0.86, "learning_rate": 6.803224085073436e-06, "loss": 2.3449, "step": 495410 }, { "epoch": 0.86, "learning_rate": 6.802352145146608e-06, "loss": 2.0926, "step": 495420 }, { "epoch": 0.86, "learning_rate": 6.8014802052197814e-06, "loss": 2.2262, "step": 495430 }, { "epoch": 0.86, "learning_rate": 6.800608265292954e-06, "loss": 2.2498, "step": 495440 }, { "epoch": 0.86, "learning_rate": 6.799736325366128e-06, "loss": 2.2151, "step": 495450 }, { "epoch": 0.86, "learning_rate": 6.7988643854393e-06, "loss": 2.2798, "step": 495460 }, { "epoch": 0.86, "learning_rate": 6.797992445512474e-06, "loss": 2.2448, "step": 495470 }, { "epoch": 0.86, "learning_rate": 6.797120505585647e-06, "loss": 2.2446, "step": 495480 }, { "epoch": 0.86, "learning_rate": 6.796248565658821e-06, "loss": 2.3456, "step": 495490 }, { "epoch": 0.86, "learning_rate": 6.7953766257319944e-06, "loss": 2.2843, "step": 495500 }, { "epoch": 0.86, "learning_rate": 6.794504685805167e-06, "loss": 2.2169, "step": 495510 }, { "epoch": 0.86, "learning_rate": 6.793632745878341e-06, "loss": 2.2161, "step": 495520 }, { "epoch": 0.86, "learning_rate": 6.792760805951513e-06, "loss": 2.2914, "step": 495530 }, { "epoch": 0.86, "learning_rate": 6.791888866024687e-06, "loss": 2.2404, "step": 495540 }, { "epoch": 0.86, "learning_rate": 6.79101692609786e-06, "loss": 2.272, "step": 495550 }, { "epoch": 0.86, "learning_rate": 6.790144986171034e-06, "loss": 2.2701, "step": 495560 }, { "epoch": 0.86, "learning_rate": 6.789273046244206e-06, "loss": 2.2607, "step": 495570 }, { "epoch": 0.86, "learning_rate": 6.7884011063173795e-06, "loss": 2.1095, "step": 495580 }, { "epoch": 0.86, "learning_rate": 6.7875291663905524e-06, "loss": 2.2624, "step": 495590 }, { "epoch": 0.86, "learning_rate": 6.786657226463726e-06, "loss": 2.2299, "step": 495600 }, { "epoch": 0.86, "learning_rate": 6.785785286536898e-06, "loss": 2.1394, "step": 495610 }, { "epoch": 0.86, "learning_rate": 6.784913346610072e-06, "loss": 2.2946, "step": 495620 }, { "epoch": 0.86, "learning_rate": 6.784041406683246e-06, "loss": 2.2819, "step": 495630 }, { "epoch": 0.86, "learning_rate": 6.783169466756419e-06, "loss": 2.2586, "step": 495640 }, { "epoch": 0.86, "learning_rate": 6.7822975268295925e-06, "loss": 2.1604, "step": 495650 }, { "epoch": 0.86, "learning_rate": 6.781425586902765e-06, "loss": 2.2257, "step": 495660 }, { "epoch": 0.86, "learning_rate": 6.780553646975938e-06, "loss": 2.2917, "step": 495670 }, { "epoch": 0.86, "learning_rate": 6.779681707049111e-06, "loss": 2.2206, "step": 495680 }, { "epoch": 0.86, "learning_rate": 6.778809767122285e-06, "loss": 2.2187, "step": 495690 }, { "epoch": 0.86, "learning_rate": 6.777937827195457e-06, "loss": 2.1951, "step": 495700 }, { "epoch": 0.86, "learning_rate": 6.777065887268631e-06, "loss": 2.3185, "step": 495710 }, { "epoch": 0.86, "learning_rate": 6.776193947341804e-06, "loss": 2.3422, "step": 495720 }, { "epoch": 0.86, "learning_rate": 6.775322007414978e-06, "loss": 2.1997, "step": 495730 }, { "epoch": 0.86, "learning_rate": 6.77445006748815e-06, "loss": 2.193, "step": 495740 }, { "epoch": 0.86, "learning_rate": 6.773578127561324e-06, "loss": 2.2442, "step": 495750 }, { "epoch": 0.86, "learning_rate": 6.772706187634498e-06, "loss": 2.266, "step": 495760 }, { "epoch": 0.86, "learning_rate": 6.77183424770767e-06, "loss": 2.304, "step": 495770 }, { "epoch": 0.86, "learning_rate": 6.770962307780844e-06, "loss": 2.3616, "step": 495780 }, { "epoch": 0.86, "learning_rate": 6.770090367854017e-06, "loss": 2.3511, "step": 495790 }, { "epoch": 0.86, "learning_rate": 6.769218427927191e-06, "loss": 2.285, "step": 495800 }, { "epoch": 0.86, "learning_rate": 6.768346488000363e-06, "loss": 2.2403, "step": 495810 }, { "epoch": 0.86, "learning_rate": 6.7674745480735364e-06, "loss": 2.2594, "step": 495820 }, { "epoch": 0.86, "learning_rate": 6.766602608146709e-06, "loss": 2.129, "step": 495830 }, { "epoch": 0.86, "learning_rate": 6.765730668219883e-06, "loss": 2.1893, "step": 495840 }, { "epoch": 0.86, "learning_rate": 6.764858728293055e-06, "loss": 2.2369, "step": 495850 }, { "epoch": 0.86, "learning_rate": 6.763986788366229e-06, "loss": 2.3015, "step": 495860 }, { "epoch": 0.86, "learning_rate": 6.763114848439402e-06, "loss": 2.287, "step": 495870 }, { "epoch": 0.86, "learning_rate": 6.762242908512576e-06, "loss": 2.3251, "step": 495880 }, { "epoch": 0.86, "learning_rate": 6.7613709685857494e-06, "loss": 2.3067, "step": 495890 }, { "epoch": 0.86, "learning_rate": 6.7604990286589215e-06, "loss": 2.1939, "step": 495900 }, { "epoch": 0.86, "learning_rate": 6.759627088732095e-06, "loss": 2.11, "step": 495910 }, { "epoch": 0.86, "learning_rate": 6.758755148805268e-06, "loss": 2.2598, "step": 495920 }, { "epoch": 0.86, "learning_rate": 6.757883208878442e-06, "loss": 2.2402, "step": 495930 }, { "epoch": 0.86, "learning_rate": 6.757011268951614e-06, "loss": 2.3305, "step": 495940 }, { "epoch": 0.86, "learning_rate": 6.756139329024788e-06, "loss": 2.2203, "step": 495950 }, { "epoch": 0.86, "learning_rate": 6.755267389097961e-06, "loss": 2.2187, "step": 495960 }, { "epoch": 0.86, "learning_rate": 6.7543954491711345e-06, "loss": 2.2939, "step": 495970 }, { "epoch": 0.86, "learning_rate": 6.753523509244307e-06, "loss": 2.3299, "step": 495980 }, { "epoch": 0.86, "learning_rate": 6.75265156931748e-06, "loss": 2.2492, "step": 495990 }, { "epoch": 0.86, "learning_rate": 6.751779629390653e-06, "loss": 2.2995, "step": 496000 }, { "epoch": 0.86, "learning_rate": 6.750907689463827e-06, "loss": 2.3562, "step": 496010 }, { "epoch": 0.86, "learning_rate": 6.750035749537001e-06, "loss": 2.2835, "step": 496020 }, { "epoch": 0.87, "learning_rate": 6.749163809610174e-06, "loss": 2.3326, "step": 496030 }, { "epoch": 0.87, "learning_rate": 6.7482918696833475e-06, "loss": 2.2162, "step": 496040 }, { "epoch": 0.87, "learning_rate": 6.74741992975652e-06, "loss": 2.2491, "step": 496050 }, { "epoch": 0.87, "learning_rate": 6.746547989829693e-06, "loss": 2.0698, "step": 496060 }, { "epoch": 0.87, "learning_rate": 6.745676049902866e-06, "loss": 2.3627, "step": 496070 }, { "epoch": 0.87, "learning_rate": 6.74480410997604e-06, "loss": 2.3129, "step": 496080 }, { "epoch": 0.87, "learning_rate": 6.743932170049212e-06, "loss": 2.1984, "step": 496090 }, { "epoch": 0.87, "learning_rate": 6.743060230122386e-06, "loss": 2.2968, "step": 496100 }, { "epoch": 0.87, "learning_rate": 6.742188290195559e-06, "loss": 2.2669, "step": 496110 }, { "epoch": 0.87, "learning_rate": 6.741316350268733e-06, "loss": 2.2146, "step": 496120 }, { "epoch": 0.87, "learning_rate": 6.740444410341905e-06, "loss": 2.3552, "step": 496130 }, { "epoch": 0.87, "learning_rate": 6.7395724704150784e-06, "loss": 2.1588, "step": 496140 }, { "epoch": 0.87, "learning_rate": 6.738700530488251e-06, "loss": 2.2919, "step": 496150 }, { "epoch": 0.87, "learning_rate": 6.737828590561425e-06, "loss": 2.3535, "step": 496160 }, { "epoch": 0.87, "learning_rate": 6.736956650634599e-06, "loss": 2.1639, "step": 496170 }, { "epoch": 0.87, "learning_rate": 6.736084710707771e-06, "loss": 2.2413, "step": 496180 }, { "epoch": 0.87, "learning_rate": 6.735212770780945e-06, "loss": 2.3071, "step": 496190 }, { "epoch": 0.87, "learning_rate": 6.734340830854118e-06, "loss": 2.1466, "step": 496200 }, { "epoch": 0.87, "learning_rate": 6.7334688909272914e-06, "loss": 2.1824, "step": 496210 }, { "epoch": 0.87, "learning_rate": 6.7325969510004635e-06, "loss": 2.3701, "step": 496220 }, { "epoch": 0.87, "learning_rate": 6.731725011073637e-06, "loss": 2.2886, "step": 496230 }, { "epoch": 0.87, "learning_rate": 6.73085307114681e-06, "loss": 2.1967, "step": 496240 }, { "epoch": 0.87, "learning_rate": 6.729981131219984e-06, "loss": 2.2978, "step": 496250 }, { "epoch": 0.87, "learning_rate": 6.729109191293156e-06, "loss": 2.1873, "step": 496260 }, { "epoch": 0.87, "learning_rate": 6.728237251366331e-06, "loss": 2.1498, "step": 496270 }, { "epoch": 0.87, "learning_rate": 6.727365311439503e-06, "loss": 2.2573, "step": 496280 }, { "epoch": 0.87, "learning_rate": 6.7264933715126765e-06, "loss": 2.3332, "step": 496290 }, { "epoch": 0.87, "learning_rate": 6.72562143158585e-06, "loss": 2.164, "step": 496300 }, { "epoch": 0.87, "learning_rate": 6.724749491659023e-06, "loss": 2.2278, "step": 496310 }, { "epoch": 0.87, "learning_rate": 6.723877551732197e-06, "loss": 2.2725, "step": 496320 }, { "epoch": 0.87, "learning_rate": 6.723005611805369e-06, "loss": 2.3475, "step": 496330 }, { "epoch": 0.87, "learning_rate": 6.722133671878543e-06, "loss": 2.3727, "step": 496340 }, { "epoch": 0.87, "learning_rate": 6.721261731951716e-06, "loss": 2.3069, "step": 496350 }, { "epoch": 0.87, "learning_rate": 6.7203897920248895e-06, "loss": 2.301, "step": 496360 }, { "epoch": 0.87, "learning_rate": 6.719517852098062e-06, "loss": 2.3096, "step": 496370 }, { "epoch": 0.87, "learning_rate": 6.718645912171235e-06, "loss": 2.2701, "step": 496380 }, { "epoch": 0.87, "learning_rate": 6.717773972244408e-06, "loss": 2.2068, "step": 496390 }, { "epoch": 0.87, "learning_rate": 6.716902032317582e-06, "loss": 2.304, "step": 496400 }, { "epoch": 0.87, "learning_rate": 6.716030092390754e-06, "loss": 2.2702, "step": 496410 }, { "epoch": 0.87, "learning_rate": 6.715158152463928e-06, "loss": 2.2761, "step": 496420 }, { "epoch": 0.87, "learning_rate": 6.714286212537102e-06, "loss": 2.1879, "step": 496430 }, { "epoch": 0.87, "learning_rate": 6.713414272610275e-06, "loss": 2.2588, "step": 496440 }, { "epoch": 0.87, "learning_rate": 6.712542332683448e-06, "loss": 2.3045, "step": 496450 }, { "epoch": 0.87, "learning_rate": 6.7116703927566204e-06, "loss": 2.3466, "step": 496460 }, { "epoch": 0.87, "learning_rate": 6.710798452829794e-06, "loss": 2.3163, "step": 496470 }, { "epoch": 0.87, "learning_rate": 6.709926512902967e-06, "loss": 2.3681, "step": 496480 }, { "epoch": 0.87, "learning_rate": 6.709054572976141e-06, "loss": 2.2415, "step": 496490 }, { "epoch": 0.87, "learning_rate": 6.708182633049313e-06, "loss": 2.2988, "step": 496500 }, { "epoch": 0.87, "learning_rate": 6.707310693122487e-06, "loss": 2.3127, "step": 496510 }, { "epoch": 0.87, "learning_rate": 6.70643875319566e-06, "loss": 2.4065, "step": 496520 }, { "epoch": 0.87, "learning_rate": 6.7055668132688334e-06, "loss": 2.2302, "step": 496530 }, { "epoch": 0.87, "learning_rate": 6.7046948733420055e-06, "loss": 2.2056, "step": 496540 }, { "epoch": 0.87, "learning_rate": 6.70382293341518e-06, "loss": 2.3248, "step": 496550 }, { "epoch": 0.87, "learning_rate": 6.702950993488354e-06, "loss": 2.2207, "step": 496560 }, { "epoch": 0.87, "learning_rate": 6.702079053561526e-06, "loss": 2.2611, "step": 496570 }, { "epoch": 0.87, "learning_rate": 6.7012071136347e-06, "loss": 2.1848, "step": 496580 }, { "epoch": 0.87, "learning_rate": 6.700335173707873e-06, "loss": 2.3351, "step": 496590 }, { "epoch": 0.87, "learning_rate": 6.6994632337810464e-06, "loss": 2.2275, "step": 496600 }, { "epoch": 0.87, "learning_rate": 6.6985912938542185e-06, "loss": 2.2949, "step": 496610 }, { "epoch": 0.87, "learning_rate": 6.697719353927392e-06, "loss": 2.2873, "step": 496620 }, { "epoch": 0.87, "learning_rate": 6.696847414000565e-06, "loss": 2.4162, "step": 496630 }, { "epoch": 0.87, "learning_rate": 6.695975474073739e-06, "loss": 2.2596, "step": 496640 }, { "epoch": 0.87, "learning_rate": 6.695103534146911e-06, "loss": 2.2456, "step": 496650 }, { "epoch": 0.87, "learning_rate": 6.694231594220085e-06, "loss": 2.2713, "step": 496660 }, { "epoch": 0.87, "learning_rate": 6.693359654293258e-06, "loss": 2.3049, "step": 496670 }, { "epoch": 0.87, "learning_rate": 6.6924877143664315e-06, "loss": 2.1896, "step": 496680 }, { "epoch": 0.87, "learning_rate": 6.691615774439605e-06, "loss": 2.1907, "step": 496690 }, { "epoch": 0.87, "learning_rate": 6.690743834512777e-06, "loss": 2.2799, "step": 496700 }, { "epoch": 0.87, "learning_rate": 6.689871894585951e-06, "loss": 2.3016, "step": 496710 }, { "epoch": 0.87, "learning_rate": 6.688999954659124e-06, "loss": 2.3169, "step": 496720 }, { "epoch": 0.87, "learning_rate": 6.688128014732298e-06, "loss": 2.2664, "step": 496730 }, { "epoch": 0.87, "learning_rate": 6.68725607480547e-06, "loss": 2.2256, "step": 496740 }, { "epoch": 0.87, "learning_rate": 6.686384134878644e-06, "loss": 2.2203, "step": 496750 }, { "epoch": 0.87, "learning_rate": 6.685512194951817e-06, "loss": 2.1937, "step": 496760 }, { "epoch": 0.87, "learning_rate": 6.68464025502499e-06, "loss": 2.3157, "step": 496770 }, { "epoch": 0.87, "learning_rate": 6.6837683150981624e-06, "loss": 2.3031, "step": 496780 }, { "epoch": 0.87, "learning_rate": 6.682896375171337e-06, "loss": 2.3472, "step": 496790 }, { "epoch": 0.87, "learning_rate": 6.682024435244509e-06, "loss": 2.3385, "step": 496800 }, { "epoch": 0.87, "learning_rate": 6.681152495317683e-06, "loss": 2.1245, "step": 496810 }, { "epoch": 0.87, "learning_rate": 6.680280555390857e-06, "loss": 2.2813, "step": 496820 }, { "epoch": 0.87, "learning_rate": 6.67940861546403e-06, "loss": 2.3698, "step": 496830 }, { "epoch": 0.87, "learning_rate": 6.678536675537203e-06, "loss": 2.2705, "step": 496840 }, { "epoch": 0.87, "learning_rate": 6.6776647356103754e-06, "loss": 2.2508, "step": 496850 }, { "epoch": 0.87, "learning_rate": 6.676792795683549e-06, "loss": 2.4017, "step": 496860 }, { "epoch": 0.87, "learning_rate": 6.675920855756722e-06, "loss": 2.2243, "step": 496870 }, { "epoch": 0.87, "learning_rate": 6.675048915829896e-06, "loss": 2.2557, "step": 496880 }, { "epoch": 0.87, "learning_rate": 6.674176975903068e-06, "loss": 2.1204, "step": 496890 }, { "epoch": 0.87, "learning_rate": 6.673305035976242e-06, "loss": 2.2205, "step": 496900 }, { "epoch": 0.87, "learning_rate": 6.672433096049415e-06, "loss": 2.2811, "step": 496910 }, { "epoch": 0.87, "learning_rate": 6.6715611561225884e-06, "loss": 2.2715, "step": 496920 }, { "epoch": 0.87, "learning_rate": 6.6706892161957605e-06, "loss": 2.2494, "step": 496930 }, { "epoch": 0.87, "learning_rate": 6.669817276268934e-06, "loss": 2.1941, "step": 496940 }, { "epoch": 0.87, "learning_rate": 6.668945336342108e-06, "loss": 2.3087, "step": 496950 }, { "epoch": 0.87, "learning_rate": 6.668073396415281e-06, "loss": 2.1692, "step": 496960 }, { "epoch": 0.87, "learning_rate": 6.667201456488455e-06, "loss": 2.2045, "step": 496970 }, { "epoch": 0.87, "learning_rate": 6.666329516561627e-06, "loss": 2.227, "step": 496980 }, { "epoch": 0.87, "learning_rate": 6.665457576634801e-06, "loss": 2.3445, "step": 496990 }, { "epoch": 0.87, "learning_rate": 6.6645856367079735e-06, "loss": 2.2607, "step": 497000 }, { "epoch": 0.87, "learning_rate": 6.663713696781147e-06, "loss": 2.2094, "step": 497010 }, { "epoch": 0.87, "learning_rate": 6.662841756854319e-06, "loss": 2.3149, "step": 497020 }, { "epoch": 0.87, "learning_rate": 6.661969816927493e-06, "loss": 2.3336, "step": 497030 }, { "epoch": 0.87, "learning_rate": 6.661097877000666e-06, "loss": 2.329, "step": 497040 }, { "epoch": 0.87, "learning_rate": 6.66022593707384e-06, "loss": 2.3451, "step": 497050 }, { "epoch": 0.87, "learning_rate": 6.659353997147012e-06, "loss": 2.3543, "step": 497060 }, { "epoch": 0.87, "learning_rate": 6.6584820572201865e-06, "loss": 2.0888, "step": 497070 }, { "epoch": 0.87, "learning_rate": 6.657610117293359e-06, "loss": 2.2282, "step": 497080 }, { "epoch": 0.87, "learning_rate": 6.656738177366532e-06, "loss": 2.3113, "step": 497090 }, { "epoch": 0.87, "learning_rate": 6.655866237439706e-06, "loss": 2.2781, "step": 497100 }, { "epoch": 0.87, "learning_rate": 6.654994297512879e-06, "loss": 2.2673, "step": 497110 }, { "epoch": 0.87, "learning_rate": 6.654122357586053e-06, "loss": 2.2208, "step": 497120 }, { "epoch": 0.87, "learning_rate": 6.653250417659225e-06, "loss": 2.2407, "step": 497130 }, { "epoch": 0.87, "learning_rate": 6.652378477732399e-06, "loss": 2.3016, "step": 497140 }, { "epoch": 0.87, "learning_rate": 6.651506537805572e-06, "loss": 2.2859, "step": 497150 }, { "epoch": 0.87, "learning_rate": 6.650634597878745e-06, "loss": 2.3199, "step": 497160 }, { "epoch": 0.87, "learning_rate": 6.6497626579519174e-06, "loss": 2.2596, "step": 497170 }, { "epoch": 0.87, "learning_rate": 6.648890718025091e-06, "loss": 2.3318, "step": 497180 }, { "epoch": 0.87, "learning_rate": 6.648018778098264e-06, "loss": 2.2614, "step": 497190 }, { "epoch": 0.87, "learning_rate": 6.647146838171438e-06, "loss": 2.2251, "step": 497200 }, { "epoch": 0.87, "learning_rate": 6.64627489824461e-06, "loss": 2.2919, "step": 497210 }, { "epoch": 0.87, "learning_rate": 6.645402958317784e-06, "loss": 2.2478, "step": 497220 }, { "epoch": 0.87, "learning_rate": 6.6445310183909575e-06, "loss": 2.3767, "step": 497230 }, { "epoch": 0.87, "learning_rate": 6.6436590784641305e-06, "loss": 2.3291, "step": 497240 }, { "epoch": 0.87, "learning_rate": 6.642787138537304e-06, "loss": 2.176, "step": 497250 }, { "epoch": 0.87, "learning_rate": 6.641915198610476e-06, "loss": 2.2394, "step": 497260 }, { "epoch": 0.87, "learning_rate": 6.64104325868365e-06, "loss": 2.2757, "step": 497270 }, { "epoch": 0.87, "learning_rate": 6.640171318756823e-06, "loss": 2.2702, "step": 497280 }, { "epoch": 0.87, "learning_rate": 6.639299378829997e-06, "loss": 2.2739, "step": 497290 }, { "epoch": 0.87, "learning_rate": 6.638427438903169e-06, "loss": 2.2799, "step": 497300 }, { "epoch": 0.87, "learning_rate": 6.6375554989763435e-06, "loss": 2.2849, "step": 497310 }, { "epoch": 0.87, "learning_rate": 6.6366835590495155e-06, "loss": 2.3241, "step": 497320 }, { "epoch": 0.87, "learning_rate": 6.635811619122689e-06, "loss": 2.301, "step": 497330 }, { "epoch": 0.87, "learning_rate": 6.634939679195861e-06, "loss": 2.1314, "step": 497340 }, { "epoch": 0.87, "learning_rate": 6.634067739269036e-06, "loss": 2.2159, "step": 497350 }, { "epoch": 0.87, "learning_rate": 6.63319579934221e-06, "loss": 2.3009, "step": 497360 }, { "epoch": 0.87, "learning_rate": 6.632323859415382e-06, "loss": 2.1207, "step": 497370 }, { "epoch": 0.87, "learning_rate": 6.631451919488556e-06, "loss": 2.3404, "step": 497380 }, { "epoch": 0.87, "learning_rate": 6.6305799795617285e-06, "loss": 2.2425, "step": 497390 }, { "epoch": 0.87, "learning_rate": 6.629708039634902e-06, "loss": 2.2985, "step": 497400 }, { "epoch": 0.87, "learning_rate": 6.628836099708074e-06, "loss": 2.2844, "step": 497410 }, { "epoch": 0.87, "learning_rate": 6.627964159781248e-06, "loss": 2.2452, "step": 497420 }, { "epoch": 0.87, "learning_rate": 6.627092219854421e-06, "loss": 2.3098, "step": 497430 }, { "epoch": 0.87, "learning_rate": 6.626220279927595e-06, "loss": 2.2141, "step": 497440 }, { "epoch": 0.87, "learning_rate": 6.625348340000767e-06, "loss": 2.2374, "step": 497450 }, { "epoch": 0.87, "learning_rate": 6.624476400073941e-06, "loss": 2.2466, "step": 497460 }, { "epoch": 0.87, "learning_rate": 6.623604460147114e-06, "loss": 2.3086, "step": 497470 }, { "epoch": 0.87, "learning_rate": 6.622732520220287e-06, "loss": 2.2436, "step": 497480 }, { "epoch": 0.87, "learning_rate": 6.621860580293461e-06, "loss": 2.3492, "step": 497490 }, { "epoch": 0.87, "learning_rate": 6.620988640366633e-06, "loss": 2.2227, "step": 497500 }, { "epoch": 0.87, "learning_rate": 6.620116700439807e-06, "loss": 2.313, "step": 497510 }, { "epoch": 0.87, "learning_rate": 6.61924476051298e-06, "loss": 2.2208, "step": 497520 }, { "epoch": 0.87, "learning_rate": 6.618372820586154e-06, "loss": 2.1578, "step": 497530 }, { "epoch": 0.87, "learning_rate": 6.617500880659326e-06, "loss": 2.2955, "step": 497540 }, { "epoch": 0.87, "learning_rate": 6.6166289407324995e-06, "loss": 2.2413, "step": 497550 }, { "epoch": 0.87, "learning_rate": 6.6157570008056725e-06, "loss": 2.3287, "step": 497560 }, { "epoch": 0.87, "learning_rate": 6.614885060878846e-06, "loss": 2.2918, "step": 497570 }, { "epoch": 0.87, "learning_rate": 6.614013120952018e-06, "loss": 2.1891, "step": 497580 }, { "epoch": 0.87, "learning_rate": 6.613141181025193e-06, "loss": 2.1764, "step": 497590 }, { "epoch": 0.87, "learning_rate": 6.612269241098365e-06, "loss": 2.3685, "step": 497600 }, { "epoch": 0.87, "learning_rate": 6.611397301171539e-06, "loss": 2.2807, "step": 497610 }, { "epoch": 0.87, "learning_rate": 6.6105253612447125e-06, "loss": 2.2839, "step": 497620 }, { "epoch": 0.87, "learning_rate": 6.6096534213178855e-06, "loss": 2.2478, "step": 497630 }, { "epoch": 0.87, "learning_rate": 6.608781481391059e-06, "loss": 2.2923, "step": 497640 }, { "epoch": 0.87, "learning_rate": 6.607909541464231e-06, "loss": 2.3016, "step": 497650 }, { "epoch": 0.87, "learning_rate": 6.607037601537405e-06, "loss": 2.2717, "step": 497660 }, { "epoch": 0.87, "learning_rate": 6.606165661610578e-06, "loss": 2.2596, "step": 497670 }, { "epoch": 0.87, "learning_rate": 6.605293721683752e-06, "loss": 2.2362, "step": 497680 }, { "epoch": 0.87, "learning_rate": 6.604421781756924e-06, "loss": 2.304, "step": 497690 }, { "epoch": 0.87, "learning_rate": 6.603549841830098e-06, "loss": 2.2564, "step": 497700 }, { "epoch": 0.87, "learning_rate": 6.6026779019032705e-06, "loss": 2.3532, "step": 497710 }, { "epoch": 0.87, "learning_rate": 6.601805961976444e-06, "loss": 2.2758, "step": 497720 }, { "epoch": 0.87, "learning_rate": 6.600934022049616e-06, "loss": 2.2896, "step": 497730 }, { "epoch": 0.87, "learning_rate": 6.60006208212279e-06, "loss": 2.1937, "step": 497740 }, { "epoch": 0.87, "learning_rate": 6.599190142195964e-06, "loss": 2.1898, "step": 497750 }, { "epoch": 0.87, "learning_rate": 6.598318202269137e-06, "loss": 2.2814, "step": 497760 }, { "epoch": 0.87, "learning_rate": 6.597446262342311e-06, "loss": 2.1735, "step": 497770 }, { "epoch": 0.87, "learning_rate": 6.596574322415483e-06, "loss": 2.2067, "step": 497780 }, { "epoch": 0.87, "learning_rate": 6.5957023824886565e-06, "loss": 2.2177, "step": 497790 }, { "epoch": 0.87, "learning_rate": 6.594830442561829e-06, "loss": 2.3217, "step": 497800 }, { "epoch": 0.87, "learning_rate": 6.593958502635003e-06, "loss": 2.2764, "step": 497810 }, { "epoch": 0.87, "learning_rate": 6.593086562708175e-06, "loss": 2.3262, "step": 497820 }, { "epoch": 0.87, "learning_rate": 6.59221462278135e-06, "loss": 2.3219, "step": 497830 }, { "epoch": 0.87, "learning_rate": 6.591342682854522e-06, "loss": 2.2284, "step": 497840 }, { "epoch": 0.87, "learning_rate": 6.590470742927696e-06, "loss": 2.228, "step": 497850 }, { "epoch": 0.87, "learning_rate": 6.589598803000868e-06, "loss": 2.2296, "step": 497860 }, { "epoch": 0.87, "learning_rate": 6.588726863074042e-06, "loss": 2.1489, "step": 497870 }, { "epoch": 0.87, "learning_rate": 6.5878549231472145e-06, "loss": 2.335, "step": 497880 }, { "epoch": 0.87, "learning_rate": 6.586982983220388e-06, "loss": 2.1794, "step": 497890 }, { "epoch": 0.87, "learning_rate": 6.586111043293562e-06, "loss": 2.2348, "step": 497900 }, { "epoch": 0.87, "learning_rate": 6.585239103366735e-06, "loss": 2.1412, "step": 497910 }, { "epoch": 0.87, "learning_rate": 6.584367163439909e-06, "loss": 2.1341, "step": 497920 }, { "epoch": 0.87, "learning_rate": 6.583495223513081e-06, "loss": 2.2275, "step": 497930 }, { "epoch": 0.87, "learning_rate": 6.5826232835862545e-06, "loss": 2.2512, "step": 497940 }, { "epoch": 0.87, "learning_rate": 6.5817513436594275e-06, "loss": 2.3393, "step": 497950 }, { "epoch": 0.87, "learning_rate": 6.580879403732601e-06, "loss": 2.253, "step": 497960 }, { "epoch": 0.87, "learning_rate": 6.580007463805773e-06, "loss": 2.241, "step": 497970 }, { "epoch": 0.87, "learning_rate": 6.579135523878947e-06, "loss": 2.2782, "step": 497980 }, { "epoch": 0.87, "learning_rate": 6.57826358395212e-06, "loss": 2.2229, "step": 497990 }, { "epoch": 0.87, "learning_rate": 6.577391644025294e-06, "loss": 2.2057, "step": 498000 }, { "epoch": 0.87, "learning_rate": 6.576519704098466e-06, "loss": 2.3082, "step": 498010 }, { "epoch": 0.87, "learning_rate": 6.57564776417164e-06, "loss": 2.1696, "step": 498020 }, { "epoch": 0.87, "learning_rate": 6.574775824244813e-06, "loss": 2.2872, "step": 498030 }, { "epoch": 0.87, "learning_rate": 6.573903884317986e-06, "loss": 2.1235, "step": 498040 }, { "epoch": 0.87, "learning_rate": 6.57303194439116e-06, "loss": 2.2331, "step": 498050 }, { "epoch": 0.87, "learning_rate": 6.572160004464332e-06, "loss": 2.2611, "step": 498060 }, { "epoch": 0.87, "learning_rate": 6.571288064537506e-06, "loss": 2.2968, "step": 498070 }, { "epoch": 0.87, "learning_rate": 6.570416124610679e-06, "loss": 2.3134, "step": 498080 }, { "epoch": 0.87, "learning_rate": 6.569544184683853e-06, "loss": 2.2642, "step": 498090 }, { "epoch": 0.87, "learning_rate": 6.568672244757025e-06, "loss": 2.3128, "step": 498100 }, { "epoch": 0.87, "learning_rate": 6.567800304830199e-06, "loss": 2.363, "step": 498110 }, { "epoch": 0.87, "learning_rate": 6.566928364903371e-06, "loss": 2.2552, "step": 498120 }, { "epoch": 0.87, "learning_rate": 6.566056424976545e-06, "loss": 2.2726, "step": 498130 }, { "epoch": 0.87, "learning_rate": 6.565184485049718e-06, "loss": 2.3154, "step": 498140 }, { "epoch": 0.87, "learning_rate": 6.564312545122892e-06, "loss": 2.2463, "step": 498150 }, { "epoch": 0.87, "learning_rate": 6.563440605196066e-06, "loss": 2.2307, "step": 498160 }, { "epoch": 0.87, "learning_rate": 6.562568665269238e-06, "loss": 2.2806, "step": 498170 }, { "epoch": 0.87, "learning_rate": 6.5616967253424115e-06, "loss": 2.2261, "step": 498180 }, { "epoch": 0.87, "learning_rate": 6.560824785415584e-06, "loss": 2.3742, "step": 498190 }, { "epoch": 0.87, "learning_rate": 6.559952845488758e-06, "loss": 2.3112, "step": 498200 }, { "epoch": 0.87, "learning_rate": 6.55908090556193e-06, "loss": 2.2655, "step": 498210 }, { "epoch": 0.87, "learning_rate": 6.558208965635104e-06, "loss": 2.2361, "step": 498220 }, { "epoch": 0.87, "learning_rate": 6.557337025708277e-06, "loss": 2.3268, "step": 498230 }, { "epoch": 0.87, "learning_rate": 6.556465085781451e-06, "loss": 2.2815, "step": 498240 }, { "epoch": 0.87, "learning_rate": 6.555593145854623e-06, "loss": 2.2705, "step": 498250 }, { "epoch": 0.87, "learning_rate": 6.5547212059277965e-06, "loss": 2.2095, "step": 498260 }, { "epoch": 0.87, "learning_rate": 6.5538492660009695e-06, "loss": 2.2287, "step": 498270 }, { "epoch": 0.87, "learning_rate": 6.552977326074143e-06, "loss": 2.2173, "step": 498280 }, { "epoch": 0.87, "learning_rate": 6.552105386147317e-06, "loss": 2.2164, "step": 498290 }, { "epoch": 0.87, "learning_rate": 6.551233446220489e-06, "loss": 2.2719, "step": 498300 }, { "epoch": 0.87, "learning_rate": 6.550361506293663e-06, "loss": 2.2613, "step": 498310 }, { "epoch": 0.87, "learning_rate": 6.549489566366836e-06, "loss": 2.3216, "step": 498320 }, { "epoch": 0.87, "learning_rate": 6.5486176264400095e-06, "loss": 2.1718, "step": 498330 }, { "epoch": 0.87, "learning_rate": 6.547745686513182e-06, "loss": 2.2225, "step": 498340 }, { "epoch": 0.87, "learning_rate": 6.546873746586356e-06, "loss": 2.2677, "step": 498350 }, { "epoch": 0.87, "learning_rate": 6.546001806659528e-06, "loss": 2.327, "step": 498360 }, { "epoch": 0.87, "learning_rate": 6.545129866732702e-06, "loss": 2.3273, "step": 498370 }, { "epoch": 0.87, "learning_rate": 6.544257926805874e-06, "loss": 2.2488, "step": 498380 }, { "epoch": 0.87, "learning_rate": 6.543385986879049e-06, "loss": 2.2587, "step": 498390 }, { "epoch": 0.87, "learning_rate": 6.542514046952221e-06, "loss": 2.197, "step": 498400 }, { "epoch": 0.87, "learning_rate": 6.541642107025395e-06, "loss": 2.1263, "step": 498410 }, { "epoch": 0.87, "learning_rate": 6.540770167098568e-06, "loss": 2.2254, "step": 498420 }, { "epoch": 0.87, "learning_rate": 6.539898227171741e-06, "loss": 2.1753, "step": 498430 }, { "epoch": 0.87, "learning_rate": 6.539026287244915e-06, "loss": 2.308, "step": 498440 }, { "epoch": 0.87, "learning_rate": 6.538154347318087e-06, "loss": 2.1931, "step": 498450 }, { "epoch": 0.87, "learning_rate": 6.537282407391261e-06, "loss": 2.2116, "step": 498460 }, { "epoch": 0.87, "learning_rate": 6.536410467464434e-06, "loss": 2.3286, "step": 498470 }, { "epoch": 0.87, "learning_rate": 6.535538527537608e-06, "loss": 2.224, "step": 498480 }, { "epoch": 0.87, "learning_rate": 6.53466658761078e-06, "loss": 2.3616, "step": 498490 }, { "epoch": 0.87, "learning_rate": 6.5337946476839535e-06, "loss": 2.3033, "step": 498500 }, { "epoch": 0.87, "learning_rate": 6.532922707757126e-06, "loss": 2.2119, "step": 498510 }, { "epoch": 0.87, "learning_rate": 6.5320507678303e-06, "loss": 2.3236, "step": 498520 }, { "epoch": 0.87, "learning_rate": 6.531178827903472e-06, "loss": 2.1773, "step": 498530 }, { "epoch": 0.87, "learning_rate": 6.530306887976646e-06, "loss": 2.2974, "step": 498540 }, { "epoch": 0.87, "learning_rate": 6.52943494804982e-06, "loss": 2.3389, "step": 498550 }, { "epoch": 0.87, "learning_rate": 6.528563008122993e-06, "loss": 2.2076, "step": 498560 }, { "epoch": 0.87, "learning_rate": 6.5276910681961665e-06, "loss": 2.3385, "step": 498570 }, { "epoch": 0.87, "learning_rate": 6.5268191282693385e-06, "loss": 2.2404, "step": 498580 }, { "epoch": 0.87, "learning_rate": 6.525947188342512e-06, "loss": 2.2759, "step": 498590 }, { "epoch": 0.87, "learning_rate": 6.525075248415685e-06, "loss": 2.2613, "step": 498600 }, { "epoch": 0.87, "learning_rate": 6.524203308488859e-06, "loss": 2.2303, "step": 498610 }, { "epoch": 0.87, "learning_rate": 6.523331368562031e-06, "loss": 2.2349, "step": 498620 }, { "epoch": 0.87, "learning_rate": 6.522459428635206e-06, "loss": 2.3338, "step": 498630 }, { "epoch": 0.87, "learning_rate": 6.521587488708378e-06, "loss": 2.4016, "step": 498640 }, { "epoch": 0.87, "learning_rate": 6.5207155487815515e-06, "loss": 2.1868, "step": 498650 }, { "epoch": 0.87, "learning_rate": 6.5198436088547245e-06, "loss": 2.3032, "step": 498660 }, { "epoch": 0.87, "learning_rate": 6.518971668927898e-06, "loss": 2.3448, "step": 498670 }, { "epoch": 0.87, "learning_rate": 6.518099729001072e-06, "loss": 2.1882, "step": 498680 }, { "epoch": 0.87, "learning_rate": 6.517227789074244e-06, "loss": 2.3155, "step": 498690 }, { "epoch": 0.87, "learning_rate": 6.516355849147418e-06, "loss": 2.2741, "step": 498700 }, { "epoch": 0.87, "learning_rate": 6.515483909220591e-06, "loss": 2.3214, "step": 498710 }, { "epoch": 0.87, "learning_rate": 6.5146119692937645e-06, "loss": 2.2066, "step": 498720 }, { "epoch": 0.87, "learning_rate": 6.513740029366937e-06, "loss": 2.3949, "step": 498730 }, { "epoch": 0.87, "learning_rate": 6.51286808944011e-06, "loss": 2.2584, "step": 498740 }, { "epoch": 0.87, "learning_rate": 6.511996149513283e-06, "loss": 2.1812, "step": 498750 }, { "epoch": 0.87, "learning_rate": 6.511124209586457e-06, "loss": 2.291, "step": 498760 }, { "epoch": 0.87, "learning_rate": 6.510252269659629e-06, "loss": 2.2665, "step": 498770 }, { "epoch": 0.87, "learning_rate": 6.509380329732803e-06, "loss": 2.2607, "step": 498780 }, { "epoch": 0.87, "learning_rate": 6.508508389805976e-06, "loss": 2.1855, "step": 498790 }, { "epoch": 0.87, "learning_rate": 6.50763644987915e-06, "loss": 2.2916, "step": 498800 }, { "epoch": 0.87, "learning_rate": 6.506764509952322e-06, "loss": 2.2464, "step": 498810 }, { "epoch": 0.87, "learning_rate": 6.5058925700254955e-06, "loss": 2.3325, "step": 498820 }, { "epoch": 0.87, "learning_rate": 6.505020630098669e-06, "loss": 2.2917, "step": 498830 }, { "epoch": 0.87, "learning_rate": 6.504148690171842e-06, "loss": 2.1707, "step": 498840 }, { "epoch": 0.87, "learning_rate": 6.503276750245016e-06, "loss": 2.2581, "step": 498850 }, { "epoch": 0.87, "learning_rate": 6.502404810318188e-06, "loss": 2.1627, "step": 498860 }, { "epoch": 0.87, "learning_rate": 6.501532870391363e-06, "loss": 2.245, "step": 498870 }, { "epoch": 0.87, "learning_rate": 6.500660930464535e-06, "loss": 2.2638, "step": 498880 }, { "epoch": 0.87, "learning_rate": 6.4997889905377085e-06, "loss": 2.3052, "step": 498890 }, { "epoch": 0.87, "learning_rate": 6.4989170506108805e-06, "loss": 2.2942, "step": 498900 }, { "epoch": 0.87, "learning_rate": 6.498045110684055e-06, "loss": 2.1937, "step": 498910 }, { "epoch": 0.87, "learning_rate": 6.497173170757227e-06, "loss": 2.3353, "step": 498920 }, { "epoch": 0.87, "learning_rate": 6.496301230830401e-06, "loss": 2.3074, "step": 498930 }, { "epoch": 0.87, "learning_rate": 6.495429290903574e-06, "loss": 2.2816, "step": 498940 }, { "epoch": 0.87, "learning_rate": 6.494557350976748e-06, "loss": 2.2889, "step": 498950 }, { "epoch": 0.87, "learning_rate": 6.4936854110499215e-06, "loss": 2.3058, "step": 498960 }, { "epoch": 0.87, "learning_rate": 6.4928134711230935e-06, "loss": 2.2421, "step": 498970 }, { "epoch": 0.87, "learning_rate": 6.491941531196267e-06, "loss": 2.1909, "step": 498980 }, { "epoch": 0.87, "learning_rate": 6.49106959126944e-06, "loss": 2.1934, "step": 498990 }, { "epoch": 0.87, "learning_rate": 6.490197651342614e-06, "loss": 2.3474, "step": 499000 }, { "epoch": 0.87, "learning_rate": 6.489325711415786e-06, "loss": 2.2747, "step": 499010 }, { "epoch": 0.87, "learning_rate": 6.48845377148896e-06, "loss": 2.268, "step": 499020 }, { "epoch": 0.87, "learning_rate": 6.487581831562133e-06, "loss": 2.3106, "step": 499030 }, { "epoch": 0.87, "learning_rate": 6.4867098916353065e-06, "loss": 2.2857, "step": 499040 }, { "epoch": 0.87, "learning_rate": 6.485837951708479e-06, "loss": 2.3634, "step": 499050 }, { "epoch": 0.87, "learning_rate": 6.484966011781652e-06, "loss": 2.2039, "step": 499060 }, { "epoch": 0.87, "learning_rate": 6.484094071854825e-06, "loss": 2.2524, "step": 499070 }, { "epoch": 0.87, "learning_rate": 6.483222131927999e-06, "loss": 2.23, "step": 499080 }, { "epoch": 0.87, "learning_rate": 6.482350192001173e-06, "loss": 2.3385, "step": 499090 }, { "epoch": 0.87, "learning_rate": 6.481478252074345e-06, "loss": 2.2786, "step": 499100 }, { "epoch": 0.87, "learning_rate": 6.480606312147519e-06, "loss": 2.1769, "step": 499110 }, { "epoch": 0.87, "learning_rate": 6.479734372220692e-06, "loss": 2.1731, "step": 499120 }, { "epoch": 0.87, "learning_rate": 6.478862432293865e-06, "loss": 2.3326, "step": 499130 }, { "epoch": 0.87, "learning_rate": 6.4779904923670375e-06, "loss": 2.3854, "step": 499140 }, { "epoch": 0.87, "learning_rate": 6.477118552440212e-06, "loss": 2.2737, "step": 499150 }, { "epoch": 0.87, "learning_rate": 6.476246612513384e-06, "loss": 2.2221, "step": 499160 }, { "epoch": 0.87, "learning_rate": 6.475374672586558e-06, "loss": 2.2787, "step": 499170 }, { "epoch": 0.87, "learning_rate": 6.474502732659731e-06, "loss": 2.2923, "step": 499180 }, { "epoch": 0.87, "learning_rate": 6.473630792732905e-06, "loss": 2.3435, "step": 499190 }, { "epoch": 0.87, "learning_rate": 6.472758852806077e-06, "loss": 2.2098, "step": 499200 }, { "epoch": 0.87, "learning_rate": 6.4718869128792505e-06, "loss": 2.1515, "step": 499210 }, { "epoch": 0.87, "learning_rate": 6.471014972952424e-06, "loss": 2.291, "step": 499220 }, { "epoch": 0.87, "learning_rate": 6.470143033025597e-06, "loss": 2.318, "step": 499230 }, { "epoch": 0.87, "learning_rate": 6.469271093098771e-06, "loss": 2.3249, "step": 499240 }, { "epoch": 0.87, "learning_rate": 6.468399153171943e-06, "loss": 2.2203, "step": 499250 }, { "epoch": 0.87, "learning_rate": 6.467527213245117e-06, "loss": 2.2438, "step": 499260 }, { "epoch": 0.87, "learning_rate": 6.46665527331829e-06, "loss": 2.3548, "step": 499270 }, { "epoch": 0.87, "learning_rate": 6.4657833333914635e-06, "loss": 2.2404, "step": 499280 }, { "epoch": 0.87, "learning_rate": 6.4649113934646355e-06, "loss": 2.2624, "step": 499290 }, { "epoch": 0.87, "learning_rate": 6.464039453537809e-06, "loss": 2.1846, "step": 499300 }, { "epoch": 0.87, "learning_rate": 6.463167513610982e-06, "loss": 2.2327, "step": 499310 }, { "epoch": 0.87, "learning_rate": 6.462295573684156e-06, "loss": 2.3926, "step": 499320 }, { "epoch": 0.87, "learning_rate": 6.461423633757328e-06, "loss": 2.2635, "step": 499330 }, { "epoch": 0.87, "learning_rate": 6.460551693830502e-06, "loss": 2.3113, "step": 499340 }, { "epoch": 0.87, "learning_rate": 6.459679753903676e-06, "loss": 2.3495, "step": 499350 }, { "epoch": 0.87, "learning_rate": 6.4588078139768485e-06, "loss": 2.2396, "step": 499360 }, { "epoch": 0.87, "learning_rate": 6.457935874050022e-06, "loss": 2.2489, "step": 499370 }, { "epoch": 0.87, "learning_rate": 6.457063934123194e-06, "loss": 2.2225, "step": 499380 }, { "epoch": 0.87, "learning_rate": 6.456191994196369e-06, "loss": 2.2759, "step": 499390 }, { "epoch": 0.87, "learning_rate": 6.455320054269541e-06, "loss": 2.3294, "step": 499400 }, { "epoch": 0.87, "learning_rate": 6.454448114342715e-06, "loss": 2.1931, "step": 499410 }, { "epoch": 0.87, "learning_rate": 6.453576174415888e-06, "loss": 2.3295, "step": 499420 }, { "epoch": 0.87, "learning_rate": 6.4527042344890615e-06, "loss": 2.2764, "step": 499430 }, { "epoch": 0.87, "learning_rate": 6.451832294562234e-06, "loss": 2.0526, "step": 499440 }, { "epoch": 0.87, "learning_rate": 6.450960354635407e-06, "loss": 2.2423, "step": 499450 }, { "epoch": 0.87, "learning_rate": 6.45008841470858e-06, "loss": 2.3582, "step": 499460 }, { "epoch": 0.87, "learning_rate": 6.449216474781754e-06, "loss": 2.3281, "step": 499470 }, { "epoch": 0.87, "learning_rate": 6.448344534854928e-06, "loss": 2.3032, "step": 499480 }, { "epoch": 0.87, "learning_rate": 6.4474725949281e-06, "loss": 2.2486, "step": 499490 }, { "epoch": 0.87, "learning_rate": 6.446600655001274e-06, "loss": 2.482, "step": 499500 }, { "epoch": 0.87, "learning_rate": 6.445728715074447e-06, "loss": 2.3227, "step": 499510 }, { "epoch": 0.87, "learning_rate": 6.44485677514762e-06, "loss": 2.2508, "step": 499520 }, { "epoch": 0.87, "learning_rate": 6.4439848352207925e-06, "loss": 2.2386, "step": 499530 }, { "epoch": 0.87, "learning_rate": 6.443112895293966e-06, "loss": 2.1731, "step": 499540 }, { "epoch": 0.87, "learning_rate": 6.442240955367139e-06, "loss": 2.157, "step": 499550 }, { "epoch": 0.87, "learning_rate": 6.441369015440313e-06, "loss": 2.3516, "step": 499560 }, { "epoch": 0.87, "learning_rate": 6.440497075513485e-06, "loss": 2.2478, "step": 499570 }, { "epoch": 0.87, "learning_rate": 6.439625135586659e-06, "loss": 2.257, "step": 499580 }, { "epoch": 0.87, "learning_rate": 6.438753195659832e-06, "loss": 2.2879, "step": 499590 }, { "epoch": 0.87, "learning_rate": 6.4378812557330055e-06, "loss": 2.249, "step": 499600 }, { "epoch": 0.87, "learning_rate": 6.437009315806179e-06, "loss": 2.2173, "step": 499610 }, { "epoch": 0.87, "learning_rate": 6.436137375879351e-06, "loss": 2.302, "step": 499620 }, { "epoch": 0.87, "learning_rate": 6.435265435952526e-06, "loss": 2.284, "step": 499630 }, { "epoch": 0.87, "learning_rate": 6.434393496025698e-06, "loss": 2.3584, "step": 499640 }, { "epoch": 0.87, "learning_rate": 6.433521556098872e-06, "loss": 2.2245, "step": 499650 }, { "epoch": 0.87, "learning_rate": 6.432649616172044e-06, "loss": 2.3412, "step": 499660 }, { "epoch": 0.87, "learning_rate": 6.4317776762452185e-06, "loss": 2.2575, "step": 499670 }, { "epoch": 0.87, "learning_rate": 6.4309057363183905e-06, "loss": 2.2678, "step": 499680 }, { "epoch": 0.87, "learning_rate": 6.430033796391564e-06, "loss": 2.3505, "step": 499690 }, { "epoch": 0.87, "learning_rate": 6.429161856464737e-06, "loss": 2.258, "step": 499700 }, { "epoch": 0.87, "learning_rate": 6.428289916537911e-06, "loss": 2.2945, "step": 499710 }, { "epoch": 0.87, "learning_rate": 6.427417976611083e-06, "loss": 2.2827, "step": 499720 }, { "epoch": 0.87, "learning_rate": 6.426546036684257e-06, "loss": 2.3341, "step": 499730 }, { "epoch": 0.87, "learning_rate": 6.42567409675743e-06, "loss": 2.2713, "step": 499740 }, { "epoch": 0.87, "learning_rate": 6.4248021568306035e-06, "loss": 2.1662, "step": 499750 }, { "epoch": 0.87, "learning_rate": 6.423930216903777e-06, "loss": 2.3324, "step": 499760 }, { "epoch": 0.87, "learning_rate": 6.423058276976949e-06, "loss": 2.3939, "step": 499770 }, { "epoch": 0.87, "learning_rate": 6.422186337050123e-06, "loss": 2.4703, "step": 499780 }, { "epoch": 0.87, "learning_rate": 6.421314397123296e-06, "loss": 2.3147, "step": 499790 }, { "epoch": 0.87, "learning_rate": 6.42044245719647e-06, "loss": 2.201, "step": 499800 }, { "epoch": 0.87, "learning_rate": 6.419570517269642e-06, "loss": 2.2675, "step": 499810 }, { "epoch": 0.87, "learning_rate": 6.418698577342816e-06, "loss": 2.2701, "step": 499820 }, { "epoch": 0.87, "learning_rate": 6.417826637415989e-06, "loss": 2.3119, "step": 499830 }, { "epoch": 0.87, "learning_rate": 6.416954697489162e-06, "loss": 2.295, "step": 499840 }, { "epoch": 0.87, "learning_rate": 6.4160827575623345e-06, "loss": 2.3536, "step": 499850 }, { "epoch": 0.87, "learning_rate": 6.415210817635508e-06, "loss": 2.3161, "step": 499860 }, { "epoch": 0.87, "learning_rate": 6.414338877708681e-06, "loss": 2.2183, "step": 499870 }, { "epoch": 0.87, "learning_rate": 6.413466937781855e-06, "loss": 2.2751, "step": 499880 }, { "epoch": 0.87, "learning_rate": 6.412594997855029e-06, "loss": 2.267, "step": 499890 }, { "epoch": 0.87, "learning_rate": 6.411723057928201e-06, "loss": 2.2859, "step": 499900 }, { "epoch": 0.87, "learning_rate": 6.410851118001375e-06, "loss": 2.3136, "step": 499910 }, { "epoch": 0.87, "learning_rate": 6.4099791780745475e-06, "loss": 2.1233, "step": 499920 }, { "epoch": 0.87, "learning_rate": 6.409107238147721e-06, "loss": 2.1935, "step": 499930 }, { "epoch": 0.87, "learning_rate": 6.408235298220894e-06, "loss": 2.2883, "step": 499940 }, { "epoch": 0.87, "learning_rate": 6.407363358294068e-06, "loss": 2.2693, "step": 499950 }, { "epoch": 0.87, "learning_rate": 6.40649141836724e-06, "loss": 2.2949, "step": 499960 }, { "epoch": 0.87, "learning_rate": 6.405619478440414e-06, "loss": 2.4242, "step": 499970 }, { "epoch": 0.87, "learning_rate": 6.404747538513587e-06, "loss": 2.1458, "step": 499980 }, { "epoch": 0.87, "learning_rate": 6.4038755985867605e-06, "loss": 2.2496, "step": 499990 }, { "epoch": 0.87, "learning_rate": 6.4030036586599326e-06, "loss": 2.2421, "step": 500000 }, { "epoch": 0.87, "learning_rate": 6.402131718733106e-06, "loss": 2.3332, "step": 500010 }, { "epoch": 0.87, "learning_rate": 6.40125977880628e-06, "loss": 2.2208, "step": 500020 }, { "epoch": 0.87, "learning_rate": 6.400387838879453e-06, "loss": 2.2898, "step": 500030 }, { "epoch": 0.87, "learning_rate": 6.399515898952627e-06, "loss": 2.2042, "step": 500040 }, { "epoch": 0.87, "learning_rate": 6.398643959025799e-06, "loss": 2.3528, "step": 500050 }, { "epoch": 0.87, "learning_rate": 6.397772019098973e-06, "loss": 2.3925, "step": 500060 }, { "epoch": 0.87, "learning_rate": 6.3969000791721456e-06, "loss": 2.2716, "step": 500070 }, { "epoch": 0.87, "learning_rate": 6.396028139245319e-06, "loss": 2.2415, "step": 500080 }, { "epoch": 0.87, "learning_rate": 6.395156199318491e-06, "loss": 2.2198, "step": 500090 }, { "epoch": 0.87, "learning_rate": 6.394284259391665e-06, "loss": 2.2259, "step": 500100 }, { "epoch": 0.87, "learning_rate": 6.393412319464838e-06, "loss": 2.2742, "step": 500110 }, { "epoch": 0.87, "learning_rate": 6.392540379538012e-06, "loss": 2.1857, "step": 500120 }, { "epoch": 0.87, "learning_rate": 6.391668439611184e-06, "loss": 2.3398, "step": 500130 }, { "epoch": 0.87, "learning_rate": 6.390796499684358e-06, "loss": 2.263, "step": 500140 }, { "epoch": 0.87, "learning_rate": 6.389924559757532e-06, "loss": 2.2602, "step": 500150 }, { "epoch": 0.87, "learning_rate": 6.389052619830704e-06, "loss": 2.2097, "step": 500160 }, { "epoch": 0.87, "learning_rate": 6.388180679903878e-06, "loss": 2.1323, "step": 500170 }, { "epoch": 0.87, "learning_rate": 6.38730873997705e-06, "loss": 2.2409, "step": 500180 }, { "epoch": 0.87, "learning_rate": 6.386436800050225e-06, "loss": 2.2686, "step": 500190 }, { "epoch": 0.87, "learning_rate": 6.385564860123397e-06, "loss": 2.2216, "step": 500200 }, { "epoch": 0.87, "learning_rate": 6.384692920196571e-06, "loss": 2.2068, "step": 500210 }, { "epoch": 0.87, "learning_rate": 6.383820980269744e-06, "loss": 2.3252, "step": 500220 }, { "epoch": 0.87, "learning_rate": 6.382949040342917e-06, "loss": 2.2985, "step": 500230 }, { "epoch": 0.87, "learning_rate": 6.3820771004160895e-06, "loss": 2.2631, "step": 500240 }, { "epoch": 0.87, "learning_rate": 6.381205160489263e-06, "loss": 2.2294, "step": 500250 }, { "epoch": 0.87, "learning_rate": 6.380333220562436e-06, "loss": 2.2044, "step": 500260 }, { "epoch": 0.87, "learning_rate": 6.37946128063561e-06, "loss": 2.3103, "step": 500270 }, { "epoch": 0.87, "learning_rate": 6.378589340708784e-06, "loss": 2.2311, "step": 500280 }, { "epoch": 0.87, "learning_rate": 6.377717400781956e-06, "loss": 2.2914, "step": 500290 }, { "epoch": 0.87, "learning_rate": 6.3768454608551296e-06, "loss": 2.1067, "step": 500300 }, { "epoch": 0.87, "learning_rate": 6.3759735209283025e-06, "loss": 2.2371, "step": 500310 }, { "epoch": 0.87, "learning_rate": 6.375101581001476e-06, "loss": 2.3209, "step": 500320 }, { "epoch": 0.87, "learning_rate": 6.374229641074648e-06, "loss": 2.2413, "step": 500330 }, { "epoch": 0.87, "learning_rate": 6.373357701147822e-06, "loss": 2.2787, "step": 500340 }, { "epoch": 0.87, "learning_rate": 6.372485761220995e-06, "loss": 2.2704, "step": 500350 }, { "epoch": 0.87, "learning_rate": 6.371613821294169e-06, "loss": 2.1319, "step": 500360 }, { "epoch": 0.87, "learning_rate": 6.370741881367341e-06, "loss": 2.2345, "step": 500370 }, { "epoch": 0.87, "learning_rate": 6.369869941440515e-06, "loss": 2.3687, "step": 500380 }, { "epoch": 0.87, "learning_rate": 6.3689980015136876e-06, "loss": 2.1393, "step": 500390 }, { "epoch": 0.87, "learning_rate": 6.368126061586861e-06, "loss": 2.1953, "step": 500400 }, { "epoch": 0.87, "learning_rate": 6.367254121660035e-06, "loss": 2.211, "step": 500410 }, { "epoch": 0.87, "learning_rate": 6.366382181733207e-06, "loss": 2.215, "step": 500420 }, { "epoch": 0.87, "learning_rate": 6.365510241806382e-06, "loss": 2.2302, "step": 500430 }, { "epoch": 0.87, "learning_rate": 6.364638301879554e-06, "loss": 2.3597, "step": 500440 }, { "epoch": 0.87, "learning_rate": 6.363766361952728e-06, "loss": 2.1408, "step": 500450 }, { "epoch": 0.87, "learning_rate": 6.3628944220259006e-06, "loss": 2.2521, "step": 500460 }, { "epoch": 0.87, "learning_rate": 6.362022482099074e-06, "loss": 2.2135, "step": 500470 }, { "epoch": 0.87, "learning_rate": 6.361150542172246e-06, "loss": 2.2428, "step": 500480 }, { "epoch": 0.87, "learning_rate": 6.36027860224542e-06, "loss": 2.3035, "step": 500490 }, { "epoch": 0.87, "learning_rate": 6.359406662318593e-06, "loss": 2.3079, "step": 500500 }, { "epoch": 0.87, "learning_rate": 6.358534722391767e-06, "loss": 2.3362, "step": 500510 }, { "epoch": 0.87, "learning_rate": 6.357662782464939e-06, "loss": 2.2898, "step": 500520 }, { "epoch": 0.87, "learning_rate": 6.356790842538113e-06, "loss": 2.2604, "step": 500530 }, { "epoch": 0.87, "learning_rate": 6.355918902611286e-06, "loss": 2.3497, "step": 500540 }, { "epoch": 0.87, "learning_rate": 6.355046962684459e-06, "loss": 2.1422, "step": 500550 }, { "epoch": 0.87, "learning_rate": 6.354175022757633e-06, "loss": 2.2949, "step": 500560 }, { "epoch": 0.87, "learning_rate": 6.353303082830805e-06, "loss": 2.3505, "step": 500570 }, { "epoch": 0.87, "learning_rate": 6.352431142903979e-06, "loss": 2.1684, "step": 500580 }, { "epoch": 0.87, "learning_rate": 6.351559202977152e-06, "loss": 2.3015, "step": 500590 }, { "epoch": 0.87, "learning_rate": 6.350687263050326e-06, "loss": 2.225, "step": 500600 }, { "epoch": 0.87, "learning_rate": 6.349815323123498e-06, "loss": 2.2301, "step": 500610 }, { "epoch": 0.87, "learning_rate": 6.3489433831966716e-06, "loss": 2.2418, "step": 500620 }, { "epoch": 0.87, "learning_rate": 6.3480714432698445e-06, "loss": 2.2809, "step": 500630 }, { "epoch": 0.87, "learning_rate": 6.347199503343018e-06, "loss": 2.246, "step": 500640 }, { "epoch": 0.87, "learning_rate": 6.34632756341619e-06, "loss": 2.3246, "step": 500650 }, { "epoch": 0.87, "learning_rate": 6.345455623489364e-06, "loss": 2.111, "step": 500660 }, { "epoch": 0.87, "learning_rate": 6.344583683562537e-06, "loss": 2.2568, "step": 500670 }, { "epoch": 0.87, "learning_rate": 6.343711743635711e-06, "loss": 2.1685, "step": 500680 }, { "epoch": 0.87, "learning_rate": 6.3428398037088846e-06, "loss": 2.3374, "step": 500690 }, { "epoch": 0.87, "learning_rate": 6.341967863782057e-06, "loss": 2.2815, "step": 500700 }, { "epoch": 0.87, "learning_rate": 6.341095923855231e-06, "loss": 2.2834, "step": 500710 }, { "epoch": 0.87, "learning_rate": 6.340223983928403e-06, "loss": 2.3296, "step": 500720 }, { "epoch": 0.87, "learning_rate": 6.339352044001577e-06, "loss": 2.2576, "step": 500730 }, { "epoch": 0.87, "learning_rate": 6.33848010407475e-06, "loss": 2.3097, "step": 500740 }, { "epoch": 0.87, "learning_rate": 6.337608164147924e-06, "loss": 2.3379, "step": 500750 }, { "epoch": 0.87, "learning_rate": 6.336736224221096e-06, "loss": 2.2889, "step": 500760 }, { "epoch": 0.87, "learning_rate": 6.33586428429427e-06, "loss": 2.2348, "step": 500770 }, { "epoch": 0.87, "learning_rate": 6.3349923443674426e-06, "loss": 2.1828, "step": 500780 }, { "epoch": 0.87, "learning_rate": 6.334120404440616e-06, "loss": 2.2882, "step": 500790 }, { "epoch": 0.87, "learning_rate": 6.333248464513788e-06, "loss": 2.2353, "step": 500800 }, { "epoch": 0.87, "learning_rate": 6.332376524586962e-06, "loss": 2.2576, "step": 500810 }, { "epoch": 0.87, "learning_rate": 6.331504584660136e-06, "loss": 2.2172, "step": 500820 }, { "epoch": 0.87, "learning_rate": 6.330632644733309e-06, "loss": 2.1372, "step": 500830 }, { "epoch": 0.87, "learning_rate": 6.329760704806483e-06, "loss": 2.2122, "step": 500840 }, { "epoch": 0.87, "learning_rate": 6.328888764879655e-06, "loss": 2.2753, "step": 500850 }, { "epoch": 0.87, "learning_rate": 6.3280168249528285e-06, "loss": 2.297, "step": 500860 }, { "epoch": 0.87, "learning_rate": 6.327144885026001e-06, "loss": 2.2797, "step": 500870 }, { "epoch": 0.87, "learning_rate": 6.326272945099175e-06, "loss": 2.289, "step": 500880 }, { "epoch": 0.87, "learning_rate": 6.325401005172347e-06, "loss": 2.2051, "step": 500890 }, { "epoch": 0.87, "learning_rate": 6.324529065245521e-06, "loss": 2.3045, "step": 500900 }, { "epoch": 0.87, "learning_rate": 6.323657125318694e-06, "loss": 2.2798, "step": 500910 }, { "epoch": 0.87, "learning_rate": 6.322785185391868e-06, "loss": 2.2991, "step": 500920 }, { "epoch": 0.87, "learning_rate": 6.32191324546504e-06, "loss": 2.3561, "step": 500930 }, { "epoch": 0.87, "learning_rate": 6.3210413055382136e-06, "loss": 2.3479, "step": 500940 }, { "epoch": 0.87, "learning_rate": 6.320169365611388e-06, "loss": 2.2869, "step": 500950 }, { "epoch": 0.87, "learning_rate": 6.31929742568456e-06, "loss": 2.2811, "step": 500960 }, { "epoch": 0.87, "learning_rate": 6.318425485757734e-06, "loss": 2.2683, "step": 500970 }, { "epoch": 0.87, "learning_rate": 6.317553545830907e-06, "loss": 2.2276, "step": 500980 }, { "epoch": 0.87, "learning_rate": 6.316681605904081e-06, "loss": 2.1738, "step": 500990 }, { "epoch": 0.87, "learning_rate": 6.315809665977253e-06, "loss": 2.2791, "step": 501000 }, { "epoch": 0.87, "learning_rate": 6.3149377260504266e-06, "loss": 2.38, "step": 501010 }, { "epoch": 0.87, "learning_rate": 6.3140657861235995e-06, "loss": 2.2896, "step": 501020 }, { "epoch": 0.87, "learning_rate": 6.313193846196773e-06, "loss": 2.2731, "step": 501030 }, { "epoch": 0.87, "learning_rate": 6.312321906269945e-06, "loss": 2.3262, "step": 501040 }, { "epoch": 0.87, "learning_rate": 6.311449966343119e-06, "loss": 2.3911, "step": 501050 }, { "epoch": 0.87, "learning_rate": 6.310578026416292e-06, "loss": 2.174, "step": 501060 }, { "epoch": 0.87, "learning_rate": 6.309706086489466e-06, "loss": 2.2631, "step": 501070 }, { "epoch": 0.87, "learning_rate": 6.3088341465626396e-06, "loss": 2.2664, "step": 501080 }, { "epoch": 0.87, "learning_rate": 6.307962206635812e-06, "loss": 2.2414, "step": 501090 }, { "epoch": 0.87, "learning_rate": 6.307090266708985e-06, "loss": 2.2554, "step": 501100 }, { "epoch": 0.87, "learning_rate": 6.306218326782158e-06, "loss": 2.3292, "step": 501110 }, { "epoch": 0.87, "learning_rate": 6.305346386855332e-06, "loss": 2.2805, "step": 501120 }, { "epoch": 0.87, "learning_rate": 6.304474446928504e-06, "loss": 2.3584, "step": 501130 }, { "epoch": 0.87, "learning_rate": 6.303602507001678e-06, "loss": 2.2757, "step": 501140 }, { "epoch": 0.87, "learning_rate": 6.302730567074851e-06, "loss": 2.2463, "step": 501150 }, { "epoch": 0.87, "learning_rate": 6.301858627148025e-06, "loss": 2.2143, "step": 501160 }, { "epoch": 0.87, "learning_rate": 6.300986687221197e-06, "loss": 2.2835, "step": 501170 }, { "epoch": 0.87, "learning_rate": 6.3001147472943705e-06, "loss": 2.1911, "step": 501180 }, { "epoch": 0.87, "learning_rate": 6.299242807367543e-06, "loss": 2.1995, "step": 501190 }, { "epoch": 0.87, "learning_rate": 6.298370867440717e-06, "loss": 2.3001, "step": 501200 }, { "epoch": 0.87, "learning_rate": 6.297498927513891e-06, "loss": 2.1906, "step": 501210 }, { "epoch": 0.87, "learning_rate": 6.296626987587063e-06, "loss": 2.258, "step": 501220 }, { "epoch": 0.87, "learning_rate": 6.295755047660238e-06, "loss": 2.2151, "step": 501230 }, { "epoch": 0.87, "learning_rate": 6.29488310773341e-06, "loss": 2.2972, "step": 501240 }, { "epoch": 0.87, "learning_rate": 6.2940111678065835e-06, "loss": 2.3644, "step": 501250 }, { "epoch": 0.87, "learning_rate": 6.293139227879756e-06, "loss": 2.3537, "step": 501260 }, { "epoch": 0.87, "learning_rate": 6.29226728795293e-06, "loss": 2.2808, "step": 501270 }, { "epoch": 0.87, "learning_rate": 6.291395348026102e-06, "loss": 2.3265, "step": 501280 }, { "epoch": 0.87, "learning_rate": 6.290523408099276e-06, "loss": 2.2175, "step": 501290 }, { "epoch": 0.87, "learning_rate": 6.289651468172449e-06, "loss": 2.2653, "step": 501300 }, { "epoch": 0.87, "learning_rate": 6.288779528245623e-06, "loss": 2.2342, "step": 501310 }, { "epoch": 0.87, "learning_rate": 6.287907588318795e-06, "loss": 2.2997, "step": 501320 }, { "epoch": 0.87, "learning_rate": 6.2870356483919686e-06, "loss": 2.3674, "step": 501330 }, { "epoch": 0.87, "learning_rate": 6.286163708465142e-06, "loss": 2.2447, "step": 501340 }, { "epoch": 0.87, "learning_rate": 6.285291768538315e-06, "loss": 2.2001, "step": 501350 }, { "epoch": 0.87, "learning_rate": 6.284419828611489e-06, "loss": 2.2534, "step": 501360 }, { "epoch": 0.87, "learning_rate": 6.283547888684661e-06, "loss": 2.2117, "step": 501370 }, { "epoch": 0.87, "learning_rate": 6.282675948757835e-06, "loss": 2.3578, "step": 501380 }, { "epoch": 0.87, "learning_rate": 6.281804008831008e-06, "loss": 2.3648, "step": 501390 }, { "epoch": 0.87, "learning_rate": 6.2809320689041816e-06, "loss": 2.3638, "step": 501400 }, { "epoch": 0.87, "learning_rate": 6.280060128977354e-06, "loss": 2.2622, "step": 501410 }, { "epoch": 0.87, "learning_rate": 6.279188189050527e-06, "loss": 2.2662, "step": 501420 }, { "epoch": 0.87, "learning_rate": 6.2783162491237e-06, "loss": 2.2398, "step": 501430 }, { "epoch": 0.87, "learning_rate": 6.277444309196874e-06, "loss": 2.1692, "step": 501440 }, { "epoch": 0.87, "learning_rate": 6.276572369270046e-06, "loss": 2.2505, "step": 501450 }, { "epoch": 0.87, "learning_rate": 6.27570042934322e-06, "loss": 2.3539, "step": 501460 }, { "epoch": 0.87, "learning_rate": 6.274828489416393e-06, "loss": 2.2715, "step": 501470 }, { "epoch": 0.87, "learning_rate": 6.273956549489567e-06, "loss": 2.2269, "step": 501480 }, { "epoch": 0.87, "learning_rate": 6.27308460956274e-06, "loss": 2.287, "step": 501490 }, { "epoch": 0.87, "learning_rate": 6.272212669635913e-06, "loss": 2.4111, "step": 501500 }, { "epoch": 0.87, "learning_rate": 6.271340729709087e-06, "loss": 2.1125, "step": 501510 }, { "epoch": 0.87, "learning_rate": 6.270468789782259e-06, "loss": 2.2084, "step": 501520 }, { "epoch": 0.87, "learning_rate": 6.269596849855433e-06, "loss": 2.2129, "step": 501530 }, { "epoch": 0.87, "learning_rate": 6.268724909928606e-06, "loss": 2.145, "step": 501540 }, { "epoch": 0.87, "learning_rate": 6.26785297000178e-06, "loss": 2.2609, "step": 501550 }, { "epoch": 0.87, "learning_rate": 6.266981030074952e-06, "loss": 2.3183, "step": 501560 }, { "epoch": 0.87, "learning_rate": 6.2661090901481255e-06, "loss": 2.3174, "step": 501570 }, { "epoch": 0.87, "learning_rate": 6.265237150221298e-06, "loss": 2.2598, "step": 501580 }, { "epoch": 0.87, "learning_rate": 6.264365210294472e-06, "loss": 2.3058, "step": 501590 }, { "epoch": 0.87, "learning_rate": 6.263493270367644e-06, "loss": 2.2617, "step": 501600 }, { "epoch": 0.87, "learning_rate": 6.262621330440818e-06, "loss": 2.302, "step": 501610 }, { "epoch": 0.87, "learning_rate": 6.261749390513992e-06, "loss": 2.3612, "step": 501620 }, { "epoch": 0.87, "learning_rate": 6.260877450587165e-06, "loss": 2.239, "step": 501630 }, { "epoch": 0.87, "learning_rate": 6.2600055106603385e-06, "loss": 2.3514, "step": 501640 }, { "epoch": 0.87, "learning_rate": 6.2591335707335106e-06, "loss": 2.374, "step": 501650 }, { "epoch": 0.87, "learning_rate": 6.258261630806684e-06, "loss": 2.1015, "step": 501660 }, { "epoch": 0.87, "learning_rate": 6.257389690879857e-06, "loss": 2.2665, "step": 501670 }, { "epoch": 0.87, "learning_rate": 6.256517750953031e-06, "loss": 2.2074, "step": 501680 }, { "epoch": 0.87, "learning_rate": 6.255645811026203e-06, "loss": 2.2674, "step": 501690 }, { "epoch": 0.87, "learning_rate": 6.254773871099377e-06, "loss": 2.3677, "step": 501700 }, { "epoch": 0.87, "learning_rate": 6.25390193117255e-06, "loss": 2.3134, "step": 501710 }, { "epoch": 0.87, "learning_rate": 6.2530299912457236e-06, "loss": 2.235, "step": 501720 }, { "epoch": 0.87, "learning_rate": 6.252158051318896e-06, "loss": 2.2009, "step": 501730 }, { "epoch": 0.87, "learning_rate": 6.251286111392069e-06, "loss": 2.2837, "step": 501740 }, { "epoch": 0.87, "learning_rate": 6.250414171465244e-06, "loss": 2.1998, "step": 501750 }, { "epoch": 0.88, "learning_rate": 6.249542231538416e-06, "loss": 2.2533, "step": 501760 }, { "epoch": 0.88, "learning_rate": 6.248670291611589e-06, "loss": 2.2138, "step": 501770 }, { "epoch": 0.88, "learning_rate": 6.247798351684763e-06, "loss": 2.2734, "step": 501780 }, { "epoch": 0.88, "learning_rate": 6.246926411757936e-06, "loss": 2.2649, "step": 501790 }, { "epoch": 0.88, "learning_rate": 6.246054471831109e-06, "loss": 2.3235, "step": 501800 }, { "epoch": 0.88, "learning_rate": 6.245182531904282e-06, "loss": 2.2048, "step": 501810 }, { "epoch": 0.88, "learning_rate": 6.244310591977455e-06, "loss": 2.1426, "step": 501820 }, { "epoch": 0.88, "learning_rate": 6.243438652050629e-06, "loss": 2.2931, "step": 501830 }, { "epoch": 0.88, "learning_rate": 6.242566712123802e-06, "loss": 2.2571, "step": 501840 }, { "epoch": 0.88, "learning_rate": 6.241694772196975e-06, "loss": 2.1535, "step": 501850 }, { "epoch": 0.88, "learning_rate": 6.240822832270148e-06, "loss": 2.2192, "step": 501860 }, { "epoch": 0.88, "learning_rate": 6.239950892343322e-06, "loss": 2.1789, "step": 501870 }, { "epoch": 0.88, "learning_rate": 6.2390789524164946e-06, "loss": 2.2066, "step": 501880 }, { "epoch": 0.88, "learning_rate": 6.2382070124896675e-06, "loss": 2.2442, "step": 501890 }, { "epoch": 0.88, "learning_rate": 6.237335072562841e-06, "loss": 2.2635, "step": 501900 }, { "epoch": 0.88, "learning_rate": 6.236463132636014e-06, "loss": 2.2874, "step": 501910 }, { "epoch": 0.88, "learning_rate": 6.235591192709187e-06, "loss": 2.2955, "step": 501920 }, { "epoch": 0.88, "learning_rate": 6.23471925278236e-06, "loss": 2.3536, "step": 501930 }, { "epoch": 0.88, "learning_rate": 6.233847312855534e-06, "loss": 2.365, "step": 501940 }, { "epoch": 0.88, "learning_rate": 6.2329753729287076e-06, "loss": 2.2343, "step": 501950 }, { "epoch": 0.88, "learning_rate": 6.2321034330018805e-06, "loss": 2.2412, "step": 501960 }, { "epoch": 0.88, "learning_rate": 6.231231493075053e-06, "loss": 2.297, "step": 501970 }, { "epoch": 0.88, "learning_rate": 6.230359553148226e-06, "loss": 2.2162, "step": 501980 }, { "epoch": 0.88, "learning_rate": 6.2294876132214e-06, "loss": 2.3832, "step": 501990 }, { "epoch": 0.88, "learning_rate": 6.228615673294573e-06, "loss": 2.2731, "step": 502000 }, { "epoch": 0.88, "learning_rate": 6.227743733367746e-06, "loss": 2.2535, "step": 502010 }, { "epoch": 0.88, "learning_rate": 6.22687179344092e-06, "loss": 2.1911, "step": 502020 }, { "epoch": 0.88, "learning_rate": 6.225999853514093e-06, "loss": 2.3217, "step": 502030 }, { "epoch": 0.88, "learning_rate": 6.2251279135872656e-06, "loss": 2.321, "step": 502040 }, { "epoch": 0.88, "learning_rate": 6.2242559736604385e-06, "loss": 2.318, "step": 502050 }, { "epoch": 0.88, "learning_rate": 6.223384033733612e-06, "loss": 2.2277, "step": 502060 }, { "epoch": 0.88, "learning_rate": 6.222512093806785e-06, "loss": 2.2887, "step": 502070 }, { "epoch": 0.88, "learning_rate": 6.221640153879959e-06, "loss": 2.2113, "step": 502080 }, { "epoch": 0.88, "learning_rate": 6.220768213953132e-06, "loss": 2.2665, "step": 502090 }, { "epoch": 0.88, "learning_rate": 6.219896274026305e-06, "loss": 2.1246, "step": 502100 }, { "epoch": 0.88, "learning_rate": 6.2190243340994786e-06, "loss": 2.2417, "step": 502110 }, { "epoch": 0.88, "learning_rate": 6.2181523941726515e-06, "loss": 2.2818, "step": 502120 }, { "epoch": 0.88, "learning_rate": 6.217280454245824e-06, "loss": 2.3272, "step": 502130 }, { "epoch": 0.88, "learning_rate": 6.216408514318997e-06, "loss": 2.3612, "step": 502140 }, { "epoch": 0.88, "learning_rate": 6.215536574392171e-06, "loss": 2.2885, "step": 502150 }, { "epoch": 0.88, "learning_rate": 6.214664634465344e-06, "loss": 2.2033, "step": 502160 }, { "epoch": 0.88, "learning_rate": 6.213792694538517e-06, "loss": 2.2633, "step": 502170 }, { "epoch": 0.88, "learning_rate": 6.212920754611691e-06, "loss": 2.3387, "step": 502180 }, { "epoch": 0.88, "learning_rate": 6.212048814684864e-06, "loss": 2.2911, "step": 502190 }, { "epoch": 0.88, "learning_rate": 6.2111768747580366e-06, "loss": 2.3144, "step": 502200 }, { "epoch": 0.88, "learning_rate": 6.21030493483121e-06, "loss": 2.2786, "step": 502210 }, { "epoch": 0.88, "learning_rate": 6.209432994904383e-06, "loss": 2.2242, "step": 502220 }, { "epoch": 0.88, "learning_rate": 6.208561054977557e-06, "loss": 2.31, "step": 502230 }, { "epoch": 0.88, "learning_rate": 6.20768911505073e-06, "loss": 2.2305, "step": 502240 }, { "epoch": 0.88, "learning_rate": 6.206817175123903e-06, "loss": 2.2292, "step": 502250 }, { "epoch": 0.88, "learning_rate": 6.205945235197076e-06, "loss": 2.2512, "step": 502260 }, { "epoch": 0.88, "learning_rate": 6.2050732952702496e-06, "loss": 2.3828, "step": 502270 }, { "epoch": 0.88, "learning_rate": 6.2042013553434225e-06, "loss": 2.275, "step": 502280 }, { "epoch": 0.88, "learning_rate": 6.203329415416595e-06, "loss": 2.2548, "step": 502290 }, { "epoch": 0.88, "learning_rate": 6.202457475489769e-06, "loss": 2.2983, "step": 502300 }, { "epoch": 0.88, "learning_rate": 6.201585535562942e-06, "loss": 2.2263, "step": 502310 }, { "epoch": 0.88, "learning_rate": 6.200713595636115e-06, "loss": 2.3338, "step": 502320 }, { "epoch": 0.88, "learning_rate": 6.199841655709288e-06, "loss": 2.2187, "step": 502330 }, { "epoch": 0.88, "learning_rate": 6.198969715782462e-06, "loss": 2.258, "step": 502340 }, { "epoch": 0.88, "learning_rate": 6.1980977758556355e-06, "loss": 2.2603, "step": 502350 }, { "epoch": 0.88, "learning_rate": 6.197225835928808e-06, "loss": 2.2957, "step": 502360 }, { "epoch": 0.88, "learning_rate": 6.196353896001981e-06, "loss": 2.2864, "step": 502370 }, { "epoch": 0.88, "learning_rate": 6.195481956075154e-06, "loss": 2.3206, "step": 502380 }, { "epoch": 0.88, "learning_rate": 6.194610016148328e-06, "loss": 2.2552, "step": 502390 }, { "epoch": 0.88, "learning_rate": 6.193738076221501e-06, "loss": 2.3713, "step": 502400 }, { "epoch": 0.88, "learning_rate": 6.192866136294674e-06, "loss": 2.3164, "step": 502410 }, { "epoch": 0.88, "learning_rate": 6.191994196367848e-06, "loss": 2.2193, "step": 502420 }, { "epoch": 0.88, "learning_rate": 6.1911222564410206e-06, "loss": 2.2031, "step": 502430 }, { "epoch": 0.88, "learning_rate": 6.1902503165141935e-06, "loss": 2.2437, "step": 502440 }, { "epoch": 0.88, "learning_rate": 6.189378376587366e-06, "loss": 2.3648, "step": 502450 }, { "epoch": 0.88, "learning_rate": 6.18850643666054e-06, "loss": 2.3077, "step": 502460 }, { "epoch": 0.88, "learning_rate": 6.187634496733714e-06, "loss": 2.2532, "step": 502470 }, { "epoch": 0.88, "learning_rate": 6.186762556806887e-06, "loss": 2.2183, "step": 502480 }, { "epoch": 0.88, "learning_rate": 6.18589061688006e-06, "loss": 2.1425, "step": 502490 }, { "epoch": 0.88, "learning_rate": 6.185018676953233e-06, "loss": 2.1368, "step": 502500 }, { "epoch": 0.88, "learning_rate": 6.1841467370264065e-06, "loss": 2.2663, "step": 502510 }, { "epoch": 0.88, "learning_rate": 6.183274797099579e-06, "loss": 2.221, "step": 502520 }, { "epoch": 0.88, "learning_rate": 6.182402857172752e-06, "loss": 2.291, "step": 502530 }, { "epoch": 0.88, "learning_rate": 6.181530917245926e-06, "loss": 2.2433, "step": 502540 }, { "epoch": 0.88, "learning_rate": 6.180658977319099e-06, "loss": 2.2758, "step": 502550 }, { "epoch": 0.88, "learning_rate": 6.179787037392272e-06, "loss": 2.2706, "step": 502560 }, { "epoch": 0.88, "learning_rate": 6.178915097465445e-06, "loss": 2.3154, "step": 502570 }, { "epoch": 0.88, "learning_rate": 6.178043157538619e-06, "loss": 2.2916, "step": 502580 }, { "epoch": 0.88, "learning_rate": 6.1771712176117916e-06, "loss": 2.4584, "step": 502590 }, { "epoch": 0.88, "learning_rate": 6.1762992776849645e-06, "loss": 2.2252, "step": 502600 }, { "epoch": 0.88, "learning_rate": 6.175427337758138e-06, "loss": 2.3022, "step": 502610 }, { "epoch": 0.88, "learning_rate": 6.174555397831311e-06, "loss": 2.1847, "step": 502620 }, { "epoch": 0.88, "learning_rate": 6.173683457904485e-06, "loss": 2.2601, "step": 502630 }, { "epoch": 0.88, "learning_rate": 6.172811517977658e-06, "loss": 2.1647, "step": 502640 }, { "epoch": 0.88, "learning_rate": 6.171939578050831e-06, "loss": 2.4013, "step": 502650 }, { "epoch": 0.88, "learning_rate": 6.1710676381240046e-06, "loss": 2.1595, "step": 502660 }, { "epoch": 0.88, "learning_rate": 6.1701956981971775e-06, "loss": 2.2213, "step": 502670 }, { "epoch": 0.88, "learning_rate": 6.16932375827035e-06, "loss": 2.2757, "step": 502680 }, { "epoch": 0.88, "learning_rate": 6.168451818343523e-06, "loss": 2.3575, "step": 502690 }, { "epoch": 0.88, "learning_rate": 6.167579878416697e-06, "loss": 2.3443, "step": 502700 }, { "epoch": 0.88, "learning_rate": 6.16670793848987e-06, "loss": 2.2546, "step": 502710 }, { "epoch": 0.88, "learning_rate": 6.165835998563043e-06, "loss": 2.2963, "step": 502720 }, { "epoch": 0.88, "learning_rate": 6.164964058636216e-06, "loss": 2.2903, "step": 502730 }, { "epoch": 0.88, "learning_rate": 6.16409211870939e-06, "loss": 2.2862, "step": 502740 }, { "epoch": 0.88, "learning_rate": 6.163220178782563e-06, "loss": 2.2904, "step": 502750 }, { "epoch": 0.88, "learning_rate": 6.162348238855736e-06, "loss": 2.2397, "step": 502760 }, { "epoch": 0.88, "learning_rate": 6.161476298928909e-06, "loss": 2.2298, "step": 502770 }, { "epoch": 0.88, "learning_rate": 6.160604359002082e-06, "loss": 2.1525, "step": 502780 }, { "epoch": 0.88, "learning_rate": 6.159732419075256e-06, "loss": 2.3089, "step": 502790 }, { "epoch": 0.88, "learning_rate": 6.158860479148429e-06, "loss": 2.3739, "step": 502800 }, { "epoch": 0.88, "learning_rate": 6.157988539221602e-06, "loss": 2.3877, "step": 502810 }, { "epoch": 0.88, "learning_rate": 6.1571165992947756e-06, "loss": 2.3023, "step": 502820 }, { "epoch": 0.88, "learning_rate": 6.1562446593679485e-06, "loss": 2.2943, "step": 502830 }, { "epoch": 0.88, "learning_rate": 6.155372719441121e-06, "loss": 2.2968, "step": 502840 }, { "epoch": 0.88, "learning_rate": 6.154500779514294e-06, "loss": 2.1743, "step": 502850 }, { "epoch": 0.88, "learning_rate": 6.153628839587468e-06, "loss": 2.2356, "step": 502860 }, { "epoch": 0.88, "learning_rate": 6.152756899660642e-06, "loss": 2.2782, "step": 502870 }, { "epoch": 0.88, "learning_rate": 6.151884959733815e-06, "loss": 2.1589, "step": 502880 }, { "epoch": 0.88, "learning_rate": 6.151013019806988e-06, "loss": 2.1578, "step": 502890 }, { "epoch": 0.88, "learning_rate": 6.150141079880161e-06, "loss": 2.3311, "step": 502900 }, { "epoch": 0.88, "learning_rate": 6.149269139953334e-06, "loss": 2.2869, "step": 502910 }, { "epoch": 0.88, "learning_rate": 6.148397200026507e-06, "loss": 2.2978, "step": 502920 }, { "epoch": 0.88, "learning_rate": 6.14752526009968e-06, "loss": 2.3188, "step": 502930 }, { "epoch": 0.88, "learning_rate": 6.146653320172854e-06, "loss": 2.3747, "step": 502940 }, { "epoch": 0.88, "learning_rate": 6.145781380246027e-06, "loss": 2.3121, "step": 502950 }, { "epoch": 0.88, "learning_rate": 6.1449094403192e-06, "loss": 2.2794, "step": 502960 }, { "epoch": 0.88, "learning_rate": 6.144037500392373e-06, "loss": 2.2548, "step": 502970 }, { "epoch": 0.88, "learning_rate": 6.143165560465547e-06, "loss": 2.2328, "step": 502980 }, { "epoch": 0.88, "learning_rate": 6.1422936205387195e-06, "loss": 2.2272, "step": 502990 }, { "epoch": 0.88, "learning_rate": 6.141421680611892e-06, "loss": 2.2221, "step": 503000 }, { "epoch": 0.88, "learning_rate": 6.140549740685066e-06, "loss": 2.2594, "step": 503010 }, { "epoch": 0.88, "learning_rate": 6.139677800758239e-06, "loss": 2.3371, "step": 503020 }, { "epoch": 0.88, "learning_rate": 6.138805860831413e-06, "loss": 2.3756, "step": 503030 }, { "epoch": 0.88, "learning_rate": 6.137933920904586e-06, "loss": 2.2558, "step": 503040 }, { "epoch": 0.88, "learning_rate": 6.137061980977759e-06, "loss": 2.2564, "step": 503050 }, { "epoch": 0.88, "learning_rate": 6.1361900410509325e-06, "loss": 2.2399, "step": 503060 }, { "epoch": 0.88, "learning_rate": 6.1353181011241054e-06, "loss": 2.2326, "step": 503070 }, { "epoch": 0.88, "learning_rate": 6.134446161197278e-06, "loss": 2.3023, "step": 503080 }, { "epoch": 0.88, "learning_rate": 6.133574221270451e-06, "loss": 2.2165, "step": 503090 }, { "epoch": 0.88, "learning_rate": 6.132702281343625e-06, "loss": 2.1936, "step": 503100 }, { "epoch": 0.88, "learning_rate": 6.131830341416798e-06, "loss": 2.3687, "step": 503110 }, { "epoch": 0.88, "learning_rate": 6.130958401489971e-06, "loss": 2.3988, "step": 503120 }, { "epoch": 0.88, "learning_rate": 6.130086461563144e-06, "loss": 2.1694, "step": 503130 }, { "epoch": 0.88, "learning_rate": 6.129214521636318e-06, "loss": 2.4002, "step": 503140 }, { "epoch": 0.88, "learning_rate": 6.128342581709491e-06, "loss": 2.3012, "step": 503150 }, { "epoch": 0.88, "learning_rate": 6.127470641782664e-06, "loss": 2.3023, "step": 503160 }, { "epoch": 0.88, "learning_rate": 6.126598701855837e-06, "loss": 2.2928, "step": 503170 }, { "epoch": 0.88, "learning_rate": 6.125726761929011e-06, "loss": 2.1748, "step": 503180 }, { "epoch": 0.88, "learning_rate": 6.124854822002184e-06, "loss": 2.2303, "step": 503190 }, { "epoch": 0.88, "learning_rate": 6.123982882075357e-06, "loss": 2.2236, "step": 503200 }, { "epoch": 0.88, "learning_rate": 6.12311094214853e-06, "loss": 2.3132, "step": 503210 }, { "epoch": 0.88, "learning_rate": 6.1222390022217035e-06, "loss": 2.3672, "step": 503220 }, { "epoch": 0.88, "learning_rate": 6.1213670622948764e-06, "loss": 2.3187, "step": 503230 }, { "epoch": 0.88, "learning_rate": 6.120495122368049e-06, "loss": 2.3598, "step": 503240 }, { "epoch": 0.88, "learning_rate": 6.119623182441222e-06, "loss": 2.2127, "step": 503250 }, { "epoch": 0.88, "learning_rate": 6.118751242514396e-06, "loss": 2.3009, "step": 503260 }, { "epoch": 0.88, "learning_rate": 6.11787930258757e-06, "loss": 2.4085, "step": 503270 }, { "epoch": 0.88, "learning_rate": 6.117007362660743e-06, "loss": 2.1982, "step": 503280 }, { "epoch": 0.88, "learning_rate": 6.116135422733916e-06, "loss": 2.2798, "step": 503290 }, { "epoch": 0.88, "learning_rate": 6.115263482807089e-06, "loss": 2.3549, "step": 503300 }, { "epoch": 0.88, "learning_rate": 6.114391542880262e-06, "loss": 2.3395, "step": 503310 }, { "epoch": 0.88, "learning_rate": 6.113519602953435e-06, "loss": 2.1083, "step": 503320 }, { "epoch": 0.88, "learning_rate": 6.112647663026608e-06, "loss": 2.2785, "step": 503330 }, { "epoch": 0.88, "learning_rate": 6.111775723099782e-06, "loss": 2.2088, "step": 503340 }, { "epoch": 0.88, "learning_rate": 6.110903783172955e-06, "loss": 2.3008, "step": 503350 }, { "epoch": 0.88, "learning_rate": 6.110031843246128e-06, "loss": 2.3467, "step": 503360 }, { "epoch": 0.88, "learning_rate": 6.109159903319301e-06, "loss": 2.2852, "step": 503370 }, { "epoch": 0.88, "learning_rate": 6.1082879633924745e-06, "loss": 2.3214, "step": 503380 }, { "epoch": 0.88, "learning_rate": 6.1074160234656474e-06, "loss": 2.3271, "step": 503390 }, { "epoch": 0.88, "learning_rate": 6.10654408353882e-06, "loss": 2.248, "step": 503400 }, { "epoch": 0.88, "learning_rate": 6.105672143611994e-06, "loss": 2.3307, "step": 503410 }, { "epoch": 0.88, "learning_rate": 6.104800203685167e-06, "loss": 2.3284, "step": 503420 }, { "epoch": 0.88, "learning_rate": 6.103928263758341e-06, "loss": 2.2207, "step": 503430 }, { "epoch": 0.88, "learning_rate": 6.103056323831514e-06, "loss": 2.2188, "step": 503440 }, { "epoch": 0.88, "learning_rate": 6.102184383904687e-06, "loss": 2.2535, "step": 503450 }, { "epoch": 0.88, "learning_rate": 6.1013124439778604e-06, "loss": 2.333, "step": 503460 }, { "epoch": 0.88, "learning_rate": 6.100440504051033e-06, "loss": 2.3099, "step": 503470 }, { "epoch": 0.88, "learning_rate": 6.099568564124206e-06, "loss": 2.3169, "step": 503480 }, { "epoch": 0.88, "learning_rate": 6.098696624197379e-06, "loss": 2.2328, "step": 503490 }, { "epoch": 0.88, "learning_rate": 6.097824684270553e-06, "loss": 2.299, "step": 503500 }, { "epoch": 0.88, "learning_rate": 6.096952744343726e-06, "loss": 2.2947, "step": 503510 }, { "epoch": 0.88, "learning_rate": 6.096080804416899e-06, "loss": 2.3063, "step": 503520 }, { "epoch": 0.88, "learning_rate": 6.095208864490072e-06, "loss": 2.1897, "step": 503530 }, { "epoch": 0.88, "learning_rate": 6.0943369245632455e-06, "loss": 2.2391, "step": 503540 }, { "epoch": 0.88, "learning_rate": 6.093464984636419e-06, "loss": 2.2264, "step": 503550 }, { "epoch": 0.88, "learning_rate": 6.092593044709592e-06, "loss": 2.2294, "step": 503560 }, { "epoch": 0.88, "learning_rate": 6.091721104782765e-06, "loss": 2.3361, "step": 503570 }, { "epoch": 0.88, "learning_rate": 6.090849164855939e-06, "loss": 2.2565, "step": 503580 }, { "epoch": 0.88, "learning_rate": 6.089977224929112e-06, "loss": 2.2684, "step": 503590 }, { "epoch": 0.88, "learning_rate": 6.089105285002285e-06, "loss": 2.2345, "step": 503600 }, { "epoch": 0.88, "learning_rate": 6.088233345075458e-06, "loss": 2.2616, "step": 503610 }, { "epoch": 0.88, "learning_rate": 6.0873614051486314e-06, "loss": 2.1968, "step": 503620 }, { "epoch": 0.88, "learning_rate": 6.086489465221804e-06, "loss": 2.2128, "step": 503630 }, { "epoch": 0.88, "learning_rate": 6.085617525294977e-06, "loss": 2.1837, "step": 503640 }, { "epoch": 0.88, "learning_rate": 6.08474558536815e-06, "loss": 2.1963, "step": 503650 }, { "epoch": 0.88, "learning_rate": 6.083873645441324e-06, "loss": 2.3946, "step": 503660 }, { "epoch": 0.88, "learning_rate": 6.083001705514498e-06, "loss": 2.2932, "step": 503670 }, { "epoch": 0.88, "learning_rate": 6.082129765587671e-06, "loss": 2.2042, "step": 503680 }, { "epoch": 0.88, "learning_rate": 6.081257825660844e-06, "loss": 2.2688, "step": 503690 }, { "epoch": 0.88, "learning_rate": 6.080385885734017e-06, "loss": 2.285, "step": 503700 }, { "epoch": 0.88, "learning_rate": 6.07951394580719e-06, "loss": 2.2752, "step": 503710 }, { "epoch": 0.88, "learning_rate": 6.078642005880363e-06, "loss": 2.3406, "step": 503720 }, { "epoch": 0.88, "learning_rate": 6.077770065953536e-06, "loss": 2.2143, "step": 503730 }, { "epoch": 0.88, "learning_rate": 6.07689812602671e-06, "loss": 2.328, "step": 503740 }, { "epoch": 0.88, "learning_rate": 6.076026186099883e-06, "loss": 2.2449, "step": 503750 }, { "epoch": 0.88, "learning_rate": 6.075154246173056e-06, "loss": 2.179, "step": 503760 }, { "epoch": 0.88, "learning_rate": 6.074282306246229e-06, "loss": 2.2531, "step": 503770 }, { "epoch": 0.88, "learning_rate": 6.0734103663194024e-06, "loss": 2.2722, "step": 503780 }, { "epoch": 0.88, "learning_rate": 6.072538426392575e-06, "loss": 2.255, "step": 503790 }, { "epoch": 0.88, "learning_rate": 6.071666486465749e-06, "loss": 2.2671, "step": 503800 }, { "epoch": 0.88, "learning_rate": 6.070794546538922e-06, "loss": 2.1863, "step": 503810 }, { "epoch": 0.88, "learning_rate": 6.069922606612095e-06, "loss": 2.196, "step": 503820 }, { "epoch": 0.88, "learning_rate": 6.069050666685269e-06, "loss": 2.2472, "step": 503830 }, { "epoch": 0.88, "learning_rate": 6.068178726758442e-06, "loss": 2.2824, "step": 503840 }, { "epoch": 0.88, "learning_rate": 6.067306786831615e-06, "loss": 2.274, "step": 503850 }, { "epoch": 0.88, "learning_rate": 6.066434846904788e-06, "loss": 2.2509, "step": 503860 }, { "epoch": 0.88, "learning_rate": 6.065562906977961e-06, "loss": 2.3182, "step": 503870 }, { "epoch": 0.88, "learning_rate": 6.064690967051134e-06, "loss": 2.257, "step": 503880 }, { "epoch": 0.88, "learning_rate": 6.063819027124307e-06, "loss": 2.1844, "step": 503890 }, { "epoch": 0.88, "learning_rate": 6.062947087197481e-06, "loss": 2.2823, "step": 503900 }, { "epoch": 0.88, "learning_rate": 6.062075147270654e-06, "loss": 2.1947, "step": 503910 }, { "epoch": 0.88, "learning_rate": 6.061203207343827e-06, "loss": 2.166, "step": 503920 }, { "epoch": 0.88, "learning_rate": 6.060331267417e-06, "loss": 2.2796, "step": 503930 }, { "epoch": 0.88, "learning_rate": 6.0594593274901734e-06, "loss": 2.2683, "step": 503940 }, { "epoch": 0.88, "learning_rate": 6.058587387563347e-06, "loss": 2.1012, "step": 503950 }, { "epoch": 0.88, "learning_rate": 6.05771544763652e-06, "loss": 2.2116, "step": 503960 }, { "epoch": 0.88, "learning_rate": 6.056843507709693e-06, "loss": 2.2852, "step": 503970 }, { "epoch": 0.88, "learning_rate": 6.055971567782867e-06, "loss": 2.3761, "step": 503980 }, { "epoch": 0.88, "learning_rate": 6.05509962785604e-06, "loss": 2.3524, "step": 503990 }, { "epoch": 0.88, "learning_rate": 6.054227687929213e-06, "loss": 2.3603, "step": 504000 }, { "epoch": 0.88, "learning_rate": 6.053355748002386e-06, "loss": 2.2855, "step": 504010 }, { "epoch": 0.88, "learning_rate": 6.052483808075559e-06, "loss": 2.2876, "step": 504020 }, { "epoch": 0.88, "learning_rate": 6.051611868148732e-06, "loss": 2.214, "step": 504030 }, { "epoch": 0.88, "learning_rate": 6.050739928221905e-06, "loss": 2.2364, "step": 504040 }, { "epoch": 0.88, "learning_rate": 6.049867988295078e-06, "loss": 2.2753, "step": 504050 }, { "epoch": 0.88, "learning_rate": 6.048996048368252e-06, "loss": 2.2328, "step": 504060 }, { "epoch": 0.88, "learning_rate": 6.048124108441426e-06, "loss": 2.1637, "step": 504070 }, { "epoch": 0.88, "learning_rate": 6.047252168514599e-06, "loss": 2.1728, "step": 504080 }, { "epoch": 0.88, "learning_rate": 6.0463802285877715e-06, "loss": 2.3199, "step": 504090 }, { "epoch": 0.88, "learning_rate": 6.045508288660945e-06, "loss": 2.324, "step": 504100 }, { "epoch": 0.88, "learning_rate": 6.044636348734118e-06, "loss": 2.1746, "step": 504110 }, { "epoch": 0.88, "learning_rate": 6.043764408807291e-06, "loss": 2.305, "step": 504120 }, { "epoch": 0.88, "learning_rate": 6.042892468880464e-06, "loss": 2.2355, "step": 504130 }, { "epoch": 0.88, "learning_rate": 6.042020528953638e-06, "loss": 2.2908, "step": 504140 }, { "epoch": 0.88, "learning_rate": 6.041148589026811e-06, "loss": 2.3518, "step": 504150 }, { "epoch": 0.88, "learning_rate": 6.040276649099984e-06, "loss": 2.3325, "step": 504160 }, { "epoch": 0.88, "learning_rate": 6.039404709173157e-06, "loss": 2.305, "step": 504170 }, { "epoch": 0.88, "learning_rate": 6.03853276924633e-06, "loss": 2.2567, "step": 504180 }, { "epoch": 0.88, "learning_rate": 6.037660829319503e-06, "loss": 2.1234, "step": 504190 }, { "epoch": 0.88, "learning_rate": 6.036788889392677e-06, "loss": 2.3435, "step": 504200 }, { "epoch": 0.88, "learning_rate": 6.03591694946585e-06, "loss": 2.2623, "step": 504210 }, { "epoch": 0.88, "learning_rate": 6.035045009539024e-06, "loss": 2.2281, "step": 504220 }, { "epoch": 0.88, "learning_rate": 6.034173069612197e-06, "loss": 2.2201, "step": 504230 }, { "epoch": 0.88, "learning_rate": 6.03330112968537e-06, "loss": 2.2533, "step": 504240 }, { "epoch": 0.88, "learning_rate": 6.0324291897585425e-06, "loss": 2.2881, "step": 504250 }, { "epoch": 0.88, "learning_rate": 6.031557249831716e-06, "loss": 2.3189, "step": 504260 }, { "epoch": 0.88, "learning_rate": 6.030685309904889e-06, "loss": 2.2176, "step": 504270 }, { "epoch": 0.88, "learning_rate": 6.029813369978062e-06, "loss": 2.2414, "step": 504280 }, { "epoch": 0.88, "learning_rate": 6.028941430051235e-06, "loss": 2.2304, "step": 504290 }, { "epoch": 0.88, "learning_rate": 6.028069490124409e-06, "loss": 2.2351, "step": 504300 }, { "epoch": 0.88, "learning_rate": 6.027197550197582e-06, "loss": 2.2721, "step": 504310 }, { "epoch": 0.88, "learning_rate": 6.026325610270755e-06, "loss": 2.1513, "step": 504320 }, { "epoch": 0.88, "learning_rate": 6.025453670343928e-06, "loss": 2.3397, "step": 504330 }, { "epoch": 0.88, "learning_rate": 6.024581730417101e-06, "loss": 2.3377, "step": 504340 }, { "epoch": 0.88, "learning_rate": 6.023709790490275e-06, "loss": 2.2378, "step": 504350 }, { "epoch": 0.88, "learning_rate": 6.022837850563448e-06, "loss": 2.2486, "step": 504360 }, { "epoch": 0.88, "learning_rate": 6.021965910636621e-06, "loss": 2.1847, "step": 504370 }, { "epoch": 0.88, "learning_rate": 6.021093970709795e-06, "loss": 2.2553, "step": 504380 }, { "epoch": 0.88, "learning_rate": 6.020222030782968e-06, "loss": 2.2091, "step": 504390 }, { "epoch": 0.88, "learning_rate": 6.019350090856141e-06, "loss": 2.2609, "step": 504400 }, { "epoch": 0.88, "learning_rate": 6.0184781509293135e-06, "loss": 2.2416, "step": 504410 }, { "epoch": 0.88, "learning_rate": 6.017606211002487e-06, "loss": 2.3394, "step": 504420 }, { "epoch": 0.88, "learning_rate": 6.01673427107566e-06, "loss": 2.2591, "step": 504430 }, { "epoch": 0.88, "learning_rate": 6.015862331148833e-06, "loss": 2.3234, "step": 504440 }, { "epoch": 0.88, "learning_rate": 6.014990391222006e-06, "loss": 2.2538, "step": 504450 }, { "epoch": 0.88, "learning_rate": 6.01411845129518e-06, "loss": 2.1451, "step": 504460 }, { "epoch": 0.88, "learning_rate": 6.013246511368354e-06, "loss": 2.2928, "step": 504470 }, { "epoch": 0.88, "learning_rate": 6.0123745714415265e-06, "loss": 2.3485, "step": 504480 }, { "epoch": 0.88, "learning_rate": 6.0115026315146994e-06, "loss": 2.2812, "step": 504490 }, { "epoch": 0.88, "learning_rate": 6.010630691587873e-06, "loss": 2.2599, "step": 504500 }, { "epoch": 0.88, "learning_rate": 6.009758751661046e-06, "loss": 2.1919, "step": 504510 }, { "epoch": 0.88, "learning_rate": 6.008886811734219e-06, "loss": 2.1873, "step": 504520 }, { "epoch": 0.88, "learning_rate": 6.008014871807392e-06, "loss": 2.1192, "step": 504530 }, { "epoch": 0.88, "learning_rate": 6.007142931880566e-06, "loss": 2.2493, "step": 504540 }, { "epoch": 0.88, "learning_rate": 6.006270991953739e-06, "loss": 2.1024, "step": 504550 }, { "epoch": 0.88, "learning_rate": 6.005399052026912e-06, "loss": 2.2715, "step": 504560 }, { "epoch": 0.88, "learning_rate": 6.0045271121000845e-06, "loss": 2.1626, "step": 504570 }, { "epoch": 0.88, "learning_rate": 6.003655172173258e-06, "loss": 2.3375, "step": 504580 }, { "epoch": 0.88, "learning_rate": 6.002783232246431e-06, "loss": 2.283, "step": 504590 }, { "epoch": 0.88, "learning_rate": 6.001911292319605e-06, "loss": 2.422, "step": 504600 }, { "epoch": 0.88, "learning_rate": 6.001039352392778e-06, "loss": 2.3267, "step": 504610 }, { "epoch": 0.88, "learning_rate": 6.000167412465952e-06, "loss": 2.272, "step": 504620 }, { "epoch": 0.88, "learning_rate": 5.999295472539125e-06, "loss": 2.2836, "step": 504630 }, { "epoch": 0.88, "learning_rate": 5.9984235326122975e-06, "loss": 2.2458, "step": 504640 }, { "epoch": 0.88, "learning_rate": 5.9975515926854704e-06, "loss": 2.2765, "step": 504650 }, { "epoch": 0.88, "learning_rate": 5.996679652758644e-06, "loss": 2.269, "step": 504660 }, { "epoch": 0.88, "learning_rate": 5.995807712831817e-06, "loss": 2.3309, "step": 504670 }, { "epoch": 0.88, "learning_rate": 5.99493577290499e-06, "loss": 2.4122, "step": 504680 }, { "epoch": 0.88, "learning_rate": 5.994063832978163e-06, "loss": 2.3374, "step": 504690 }, { "epoch": 0.88, "learning_rate": 5.993191893051337e-06, "loss": 2.2533, "step": 504700 }, { "epoch": 0.88, "learning_rate": 5.99231995312451e-06, "loss": 2.2944, "step": 504710 }, { "epoch": 0.88, "learning_rate": 5.991448013197683e-06, "loss": 2.1812, "step": 504720 }, { "epoch": 0.88, "learning_rate": 5.9905760732708555e-06, "loss": 2.2835, "step": 504730 }, { "epoch": 0.88, "learning_rate": 5.98970413334403e-06, "loss": 2.5013, "step": 504740 }, { "epoch": 0.88, "learning_rate": 5.988832193417203e-06, "loss": 2.2331, "step": 504750 }, { "epoch": 0.88, "learning_rate": 5.987960253490376e-06, "loss": 2.3191, "step": 504760 }, { "epoch": 0.88, "learning_rate": 5.987088313563549e-06, "loss": 2.2918, "step": 504770 }, { "epoch": 0.88, "learning_rate": 5.986216373636723e-06, "loss": 2.2193, "step": 504780 }, { "epoch": 0.88, "learning_rate": 5.985344433709896e-06, "loss": 2.2609, "step": 504790 }, { "epoch": 0.88, "learning_rate": 5.9844724937830685e-06, "loss": 2.2938, "step": 504800 }, { "epoch": 0.88, "learning_rate": 5.9836005538562414e-06, "loss": 2.223, "step": 504810 }, { "epoch": 0.88, "learning_rate": 5.982728613929415e-06, "loss": 2.3108, "step": 504820 }, { "epoch": 0.88, "learning_rate": 5.981856674002588e-06, "loss": 2.3887, "step": 504830 }, { "epoch": 0.88, "learning_rate": 5.980984734075761e-06, "loss": 2.118, "step": 504840 }, { "epoch": 0.88, "learning_rate": 5.980112794148934e-06, "loss": 2.2887, "step": 504850 }, { "epoch": 0.88, "learning_rate": 5.979240854222108e-06, "loss": 2.2597, "step": 504860 }, { "epoch": 0.88, "learning_rate": 5.9783689142952815e-06, "loss": 2.326, "step": 504870 }, { "epoch": 0.88, "learning_rate": 5.9774969743684544e-06, "loss": 2.2691, "step": 504880 }, { "epoch": 0.88, "learning_rate": 5.976625034441627e-06, "loss": 2.0894, "step": 504890 }, { "epoch": 0.88, "learning_rate": 5.975753094514801e-06, "loss": 2.3005, "step": 504900 }, { "epoch": 0.88, "learning_rate": 5.974881154587974e-06, "loss": 2.2846, "step": 504910 }, { "epoch": 0.88, "learning_rate": 5.974009214661147e-06, "loss": 2.2827, "step": 504920 }, { "epoch": 0.88, "learning_rate": 5.97313727473432e-06, "loss": 2.2847, "step": 504930 }, { "epoch": 0.88, "learning_rate": 5.972265334807494e-06, "loss": 2.2287, "step": 504940 }, { "epoch": 0.88, "learning_rate": 5.971393394880667e-06, "loss": 2.1411, "step": 504950 }, { "epoch": 0.88, "learning_rate": 5.9705214549538395e-06, "loss": 2.2558, "step": 504960 }, { "epoch": 0.88, "learning_rate": 5.9696495150270124e-06, "loss": 2.2027, "step": 504970 }, { "epoch": 0.88, "learning_rate": 5.968777575100186e-06, "loss": 2.2661, "step": 504980 }, { "epoch": 0.88, "learning_rate": 5.967905635173359e-06, "loss": 2.2892, "step": 504990 }, { "epoch": 0.88, "learning_rate": 5.967033695246533e-06, "loss": 2.0233, "step": 505000 }, { "epoch": 0.88, "learning_rate": 5.966161755319706e-06, "loss": 2.3244, "step": 505010 }, { "epoch": 0.88, "learning_rate": 5.96528981539288e-06, "loss": 2.235, "step": 505020 }, { "epoch": 0.88, "learning_rate": 5.9644178754660525e-06, "loss": 2.2332, "step": 505030 }, { "epoch": 0.88, "learning_rate": 5.9635459355392254e-06, "loss": 2.3269, "step": 505040 }, { "epoch": 0.88, "learning_rate": 5.962673995612398e-06, "loss": 2.2901, "step": 505050 }, { "epoch": 0.88, "learning_rate": 5.961802055685572e-06, "loss": 2.2578, "step": 505060 }, { "epoch": 0.88, "learning_rate": 5.960930115758745e-06, "loss": 2.3126, "step": 505070 }, { "epoch": 0.88, "learning_rate": 5.960058175831918e-06, "loss": 2.2606, "step": 505080 }, { "epoch": 0.88, "learning_rate": 5.959186235905091e-06, "loss": 2.2293, "step": 505090 }, { "epoch": 0.88, "learning_rate": 5.958314295978265e-06, "loss": 2.3416, "step": 505100 }, { "epoch": 0.88, "learning_rate": 5.957442356051438e-06, "loss": 2.2432, "step": 505110 }, { "epoch": 0.88, "learning_rate": 5.9565704161246105e-06, "loss": 2.2655, "step": 505120 }, { "epoch": 0.88, "learning_rate": 5.9556984761977834e-06, "loss": 2.343, "step": 505130 }, { "epoch": 0.88, "learning_rate": 5.954826536270958e-06, "loss": 2.2262, "step": 505140 }, { "epoch": 0.88, "learning_rate": 5.953954596344131e-06, "loss": 2.3598, "step": 505150 }, { "epoch": 0.88, "learning_rate": 5.953082656417304e-06, "loss": 2.2133, "step": 505160 }, { "epoch": 0.88, "learning_rate": 5.952210716490477e-06, "loss": 2.3604, "step": 505170 }, { "epoch": 0.88, "learning_rate": 5.951338776563651e-06, "loss": 2.1591, "step": 505180 }, { "epoch": 0.88, "learning_rate": 5.9504668366368235e-06, "loss": 2.3171, "step": 505190 }, { "epoch": 0.88, "learning_rate": 5.9495948967099964e-06, "loss": 2.1952, "step": 505200 }, { "epoch": 0.88, "learning_rate": 5.948722956783169e-06, "loss": 2.2835, "step": 505210 }, { "epoch": 0.88, "learning_rate": 5.947851016856343e-06, "loss": 2.1934, "step": 505220 }, { "epoch": 0.88, "learning_rate": 5.946979076929516e-06, "loss": 2.2408, "step": 505230 }, { "epoch": 0.88, "learning_rate": 5.946107137002689e-06, "loss": 2.1946, "step": 505240 }, { "epoch": 0.88, "learning_rate": 5.945235197075862e-06, "loss": 2.2925, "step": 505250 }, { "epoch": 0.88, "learning_rate": 5.944363257149036e-06, "loss": 2.2929, "step": 505260 }, { "epoch": 0.88, "learning_rate": 5.9434913172222094e-06, "loss": 2.392, "step": 505270 }, { "epoch": 0.88, "learning_rate": 5.942619377295382e-06, "loss": 2.2917, "step": 505280 }, { "epoch": 0.88, "learning_rate": 5.941747437368555e-06, "loss": 2.2019, "step": 505290 }, { "epoch": 0.88, "learning_rate": 5.940875497441729e-06, "loss": 2.3115, "step": 505300 }, { "epoch": 0.88, "learning_rate": 5.940003557514902e-06, "loss": 2.2177, "step": 505310 }, { "epoch": 0.88, "learning_rate": 5.939131617588075e-06, "loss": 2.1573, "step": 505320 }, { "epoch": 0.88, "learning_rate": 5.938259677661248e-06, "loss": 2.3938, "step": 505330 }, { "epoch": 0.88, "learning_rate": 5.937387737734422e-06, "loss": 2.2405, "step": 505340 }, { "epoch": 0.88, "learning_rate": 5.9365157978075945e-06, "loss": 2.2734, "step": 505350 }, { "epoch": 0.88, "learning_rate": 5.9356438578807674e-06, "loss": 2.2592, "step": 505360 }, { "epoch": 0.88, "learning_rate": 5.93477191795394e-06, "loss": 2.3116, "step": 505370 }, { "epoch": 0.88, "learning_rate": 5.933899978027114e-06, "loss": 2.2581, "step": 505380 }, { "epoch": 0.88, "learning_rate": 5.933028038100287e-06, "loss": 2.3374, "step": 505390 }, { "epoch": 0.88, "learning_rate": 5.932156098173461e-06, "loss": 2.2194, "step": 505400 }, { "epoch": 0.88, "learning_rate": 5.931284158246634e-06, "loss": 2.2296, "step": 505410 }, { "epoch": 0.88, "learning_rate": 5.9304122183198075e-06, "loss": 2.2656, "step": 505420 }, { "epoch": 0.88, "learning_rate": 5.9295402783929804e-06, "loss": 2.3702, "step": 505430 }, { "epoch": 0.88, "learning_rate": 5.928668338466153e-06, "loss": 2.2552, "step": 505440 }, { "epoch": 0.88, "learning_rate": 5.927796398539326e-06, "loss": 2.2734, "step": 505450 }, { "epoch": 0.88, "learning_rate": 5.9269244586125e-06, "loss": 2.259, "step": 505460 }, { "epoch": 0.88, "learning_rate": 5.926052518685673e-06, "loss": 2.3049, "step": 505470 }, { "epoch": 0.88, "learning_rate": 5.925180578758846e-06, "loss": 2.2054, "step": 505480 }, { "epoch": 0.88, "learning_rate": 5.924308638832019e-06, "loss": 2.3534, "step": 505490 }, { "epoch": 0.88, "learning_rate": 5.923436698905193e-06, "loss": 2.3905, "step": 505500 }, { "epoch": 0.88, "learning_rate": 5.9225647589783655e-06, "loss": 2.3821, "step": 505510 }, { "epoch": 0.88, "learning_rate": 5.9216928190515384e-06, "loss": 2.2059, "step": 505520 }, { "epoch": 0.88, "learning_rate": 5.920820879124712e-06, "loss": 2.2774, "step": 505530 }, { "epoch": 0.88, "learning_rate": 5.919948939197886e-06, "loss": 2.2483, "step": 505540 }, { "epoch": 0.88, "learning_rate": 5.919076999271059e-06, "loss": 2.3305, "step": 505550 }, { "epoch": 0.88, "learning_rate": 5.918205059344232e-06, "loss": 2.2977, "step": 505560 }, { "epoch": 0.88, "learning_rate": 5.917333119417405e-06, "loss": 2.2344, "step": 505570 }, { "epoch": 0.88, "learning_rate": 5.9164611794905785e-06, "loss": 2.3334, "step": 505580 }, { "epoch": 0.88, "learning_rate": 5.9155892395637514e-06, "loss": 2.2496, "step": 505590 }, { "epoch": 0.88, "learning_rate": 5.914717299636924e-06, "loss": 2.2213, "step": 505600 }, { "epoch": 0.88, "learning_rate": 5.913845359710097e-06, "loss": 2.3434, "step": 505610 }, { "epoch": 0.88, "learning_rate": 5.912973419783271e-06, "loss": 2.2079, "step": 505620 }, { "epoch": 0.88, "learning_rate": 5.912101479856444e-06, "loss": 2.3473, "step": 505630 }, { "epoch": 0.88, "learning_rate": 5.911229539929617e-06, "loss": 2.3574, "step": 505640 }, { "epoch": 0.88, "learning_rate": 5.91035760000279e-06, "loss": 2.2323, "step": 505650 }, { "epoch": 0.88, "learning_rate": 5.909485660075964e-06, "loss": 2.2781, "step": 505660 }, { "epoch": 0.88, "learning_rate": 5.908613720149137e-06, "loss": 2.2111, "step": 505670 }, { "epoch": 0.88, "learning_rate": 5.90774178022231e-06, "loss": 2.3631, "step": 505680 }, { "epoch": 0.88, "learning_rate": 5.906869840295483e-06, "loss": 2.3411, "step": 505690 }, { "epoch": 0.88, "learning_rate": 5.905997900368657e-06, "loss": 2.3623, "step": 505700 }, { "epoch": 0.88, "learning_rate": 5.90512596044183e-06, "loss": 2.2026, "step": 505710 }, { "epoch": 0.88, "learning_rate": 5.904254020515003e-06, "loss": 2.3234, "step": 505720 }, { "epoch": 0.88, "learning_rate": 5.903382080588176e-06, "loss": 2.3293, "step": 505730 }, { "epoch": 0.88, "learning_rate": 5.9025101406613495e-06, "loss": 2.3164, "step": 505740 }, { "epoch": 0.88, "learning_rate": 5.9016382007345224e-06, "loss": 2.4097, "step": 505750 }, { "epoch": 0.88, "learning_rate": 5.900766260807695e-06, "loss": 2.3372, "step": 505760 }, { "epoch": 0.88, "learning_rate": 5.899894320880868e-06, "loss": 2.2314, "step": 505770 }, { "epoch": 0.88, "learning_rate": 5.899022380954042e-06, "loss": 2.2228, "step": 505780 }, { "epoch": 0.88, "learning_rate": 5.898150441027215e-06, "loss": 2.3019, "step": 505790 }, { "epoch": 0.88, "learning_rate": 5.897278501100389e-06, "loss": 2.2635, "step": 505800 }, { "epoch": 0.88, "learning_rate": 5.896406561173562e-06, "loss": 2.2029, "step": 505810 }, { "epoch": 0.88, "learning_rate": 5.8955346212467354e-06, "loss": 2.2756, "step": 505820 }, { "epoch": 0.88, "learning_rate": 5.894662681319908e-06, "loss": 2.2515, "step": 505830 }, { "epoch": 0.88, "learning_rate": 5.893790741393081e-06, "loss": 2.2345, "step": 505840 }, { "epoch": 0.88, "learning_rate": 5.892918801466254e-06, "loss": 2.2893, "step": 505850 }, { "epoch": 0.88, "learning_rate": 5.892046861539428e-06, "loss": 2.2091, "step": 505860 }, { "epoch": 0.88, "learning_rate": 5.891174921612601e-06, "loss": 2.2346, "step": 505870 }, { "epoch": 0.88, "learning_rate": 5.890302981685774e-06, "loss": 2.2947, "step": 505880 }, { "epoch": 0.88, "learning_rate": 5.889431041758947e-06, "loss": 2.2515, "step": 505890 }, { "epoch": 0.88, "learning_rate": 5.8885591018321205e-06, "loss": 2.1527, "step": 505900 }, { "epoch": 0.88, "learning_rate": 5.8876871619052934e-06, "loss": 2.328, "step": 505910 }, { "epoch": 0.88, "learning_rate": 5.886815221978466e-06, "loss": 2.2585, "step": 505920 }, { "epoch": 0.88, "learning_rate": 5.88594328205164e-06, "loss": 2.2678, "step": 505930 }, { "epoch": 0.88, "learning_rate": 5.885071342124814e-06, "loss": 2.3366, "step": 505940 }, { "epoch": 0.88, "learning_rate": 5.884199402197987e-06, "loss": 2.3573, "step": 505950 }, { "epoch": 0.88, "learning_rate": 5.88332746227116e-06, "loss": 2.2316, "step": 505960 }, { "epoch": 0.88, "learning_rate": 5.882455522344333e-06, "loss": 2.4203, "step": 505970 }, { "epoch": 0.88, "learning_rate": 5.8815835824175064e-06, "loss": 2.279, "step": 505980 }, { "epoch": 0.88, "learning_rate": 5.880711642490679e-06, "loss": 2.3188, "step": 505990 }, { "epoch": 0.88, "learning_rate": 5.879839702563852e-06, "loss": 2.1873, "step": 506000 }, { "epoch": 0.88, "learning_rate": 5.878967762637025e-06, "loss": 2.296, "step": 506010 }, { "epoch": 0.88, "learning_rate": 5.878095822710199e-06, "loss": 2.2989, "step": 506020 }, { "epoch": 0.88, "learning_rate": 5.877223882783372e-06, "loss": 2.2962, "step": 506030 }, { "epoch": 0.88, "learning_rate": 5.876351942856545e-06, "loss": 2.2517, "step": 506040 }, { "epoch": 0.88, "learning_rate": 5.875480002929718e-06, "loss": 2.28, "step": 506050 }, { "epoch": 0.88, "learning_rate": 5.8746080630028915e-06, "loss": 2.0983, "step": 506060 }, { "epoch": 0.88, "learning_rate": 5.873736123076065e-06, "loss": 2.1725, "step": 506070 }, { "epoch": 0.88, "learning_rate": 5.872864183149238e-06, "loss": 2.2885, "step": 506080 }, { "epoch": 0.88, "learning_rate": 5.871992243222411e-06, "loss": 2.3218, "step": 506090 }, { "epoch": 0.88, "learning_rate": 5.871120303295585e-06, "loss": 2.3351, "step": 506100 }, { "epoch": 0.88, "learning_rate": 5.870248363368758e-06, "loss": 2.315, "step": 506110 }, { "epoch": 0.88, "learning_rate": 5.869376423441931e-06, "loss": 2.2568, "step": 506120 }, { "epoch": 0.88, "learning_rate": 5.868504483515104e-06, "loss": 2.3316, "step": 506130 }, { "epoch": 0.88, "learning_rate": 5.8676325435882775e-06, "loss": 2.3978, "step": 506140 }, { "epoch": 0.88, "learning_rate": 5.86676060366145e-06, "loss": 2.3257, "step": 506150 }, { "epoch": 0.88, "learning_rate": 5.865888663734623e-06, "loss": 2.2531, "step": 506160 }, { "epoch": 0.88, "learning_rate": 5.865016723807796e-06, "loss": 2.2085, "step": 506170 }, { "epoch": 0.88, "learning_rate": 5.86414478388097e-06, "loss": 2.2197, "step": 506180 }, { "epoch": 0.88, "learning_rate": 5.863272843954143e-06, "loss": 2.3153, "step": 506190 }, { "epoch": 0.88, "learning_rate": 5.862400904027317e-06, "loss": 2.3282, "step": 506200 }, { "epoch": 0.88, "learning_rate": 5.86152896410049e-06, "loss": 2.2734, "step": 506210 }, { "epoch": 0.88, "learning_rate": 5.860657024173663e-06, "loss": 2.3093, "step": 506220 }, { "epoch": 0.88, "learning_rate": 5.859785084246836e-06, "loss": 2.2821, "step": 506230 }, { "epoch": 0.88, "learning_rate": 5.858913144320009e-06, "loss": 2.3079, "step": 506240 }, { "epoch": 0.88, "learning_rate": 5.858041204393182e-06, "loss": 2.1759, "step": 506250 }, { "epoch": 0.88, "learning_rate": 5.857169264466356e-06, "loss": 2.2268, "step": 506260 }, { "epoch": 0.88, "learning_rate": 5.856297324539529e-06, "loss": 2.2884, "step": 506270 }, { "epoch": 0.88, "learning_rate": 5.855425384612702e-06, "loss": 2.2753, "step": 506280 }, { "epoch": 0.88, "learning_rate": 5.854553444685875e-06, "loss": 2.2648, "step": 506290 }, { "epoch": 0.88, "learning_rate": 5.8536815047590485e-06, "loss": 2.1654, "step": 506300 }, { "epoch": 0.88, "learning_rate": 5.852809564832221e-06, "loss": 2.3206, "step": 506310 }, { "epoch": 0.88, "learning_rate": 5.851937624905394e-06, "loss": 2.1915, "step": 506320 }, { "epoch": 0.88, "learning_rate": 5.851065684978568e-06, "loss": 2.2022, "step": 506330 }, { "epoch": 0.88, "learning_rate": 5.850193745051742e-06, "loss": 2.3051, "step": 506340 }, { "epoch": 0.88, "learning_rate": 5.849321805124915e-06, "loss": 2.2439, "step": 506350 }, { "epoch": 0.88, "learning_rate": 5.848449865198088e-06, "loss": 2.254, "step": 506360 }, { "epoch": 0.88, "learning_rate": 5.847577925271261e-06, "loss": 2.3314, "step": 506370 }, { "epoch": 0.88, "learning_rate": 5.846705985344434e-06, "loss": 2.2831, "step": 506380 }, { "epoch": 0.88, "learning_rate": 5.845834045417607e-06, "loss": 2.1705, "step": 506390 }, { "epoch": 0.88, "learning_rate": 5.84496210549078e-06, "loss": 2.2739, "step": 506400 }, { "epoch": 0.88, "learning_rate": 5.844090165563953e-06, "loss": 2.3445, "step": 506410 }, { "epoch": 0.88, "learning_rate": 5.843218225637127e-06, "loss": 2.2613, "step": 506420 }, { "epoch": 0.88, "learning_rate": 5.8423462857103e-06, "loss": 2.2154, "step": 506430 }, { "epoch": 0.88, "learning_rate": 5.841474345783473e-06, "loss": 2.1861, "step": 506440 }, { "epoch": 0.88, "learning_rate": 5.840602405856646e-06, "loss": 2.1977, "step": 506450 }, { "epoch": 0.88, "learning_rate": 5.8397304659298195e-06, "loss": 2.2759, "step": 506460 }, { "epoch": 0.88, "learning_rate": 5.838858526002993e-06, "loss": 2.1746, "step": 506470 }, { "epoch": 0.88, "learning_rate": 5.837986586076166e-06, "loss": 2.3245, "step": 506480 }, { "epoch": 0.88, "learning_rate": 5.837114646149339e-06, "loss": 2.307, "step": 506490 }, { "epoch": 0.88, "learning_rate": 5.836242706222513e-06, "loss": 2.3257, "step": 506500 }, { "epoch": 0.88, "learning_rate": 5.835370766295686e-06, "loss": 2.3491, "step": 506510 }, { "epoch": 0.88, "learning_rate": 5.834498826368859e-06, "loss": 2.2192, "step": 506520 }, { "epoch": 0.88, "learning_rate": 5.833626886442032e-06, "loss": 2.1974, "step": 506530 }, { "epoch": 0.88, "learning_rate": 5.832754946515205e-06, "loss": 2.3456, "step": 506540 }, { "epoch": 0.88, "learning_rate": 5.831883006588378e-06, "loss": 2.3026, "step": 506550 }, { "epoch": 0.88, "learning_rate": 5.831011066661551e-06, "loss": 2.2649, "step": 506560 }, { "epoch": 0.88, "learning_rate": 5.830139126734724e-06, "loss": 2.2988, "step": 506570 }, { "epoch": 0.88, "learning_rate": 5.829267186807898e-06, "loss": 2.3582, "step": 506580 }, { "epoch": 0.88, "learning_rate": 5.828395246881071e-06, "loss": 2.2697, "step": 506590 }, { "epoch": 0.88, "learning_rate": 5.827523306954245e-06, "loss": 2.2404, "step": 506600 }, { "epoch": 0.88, "learning_rate": 5.8266513670274175e-06, "loss": 2.2176, "step": 506610 }, { "epoch": 0.88, "learning_rate": 5.825779427100591e-06, "loss": 2.3063, "step": 506620 }, { "epoch": 0.88, "learning_rate": 5.824907487173764e-06, "loss": 2.2959, "step": 506630 }, { "epoch": 0.88, "learning_rate": 5.824035547246937e-06, "loss": 2.2251, "step": 506640 }, { "epoch": 0.88, "learning_rate": 5.82316360732011e-06, "loss": 2.2855, "step": 506650 }, { "epoch": 0.88, "learning_rate": 5.822291667393284e-06, "loss": 2.2483, "step": 506660 }, { "epoch": 0.88, "learning_rate": 5.821419727466457e-06, "loss": 2.2547, "step": 506670 }, { "epoch": 0.88, "learning_rate": 5.82054778753963e-06, "loss": 2.2811, "step": 506680 }, { "epoch": 0.88, "learning_rate": 5.819675847612803e-06, "loss": 2.3059, "step": 506690 }, { "epoch": 0.88, "learning_rate": 5.818803907685976e-06, "loss": 2.3138, "step": 506700 }, { "epoch": 0.88, "learning_rate": 5.817931967759149e-06, "loss": 2.3022, "step": 506710 }, { "epoch": 0.88, "learning_rate": 5.817060027832322e-06, "loss": 2.2181, "step": 506720 }, { "epoch": 0.88, "learning_rate": 5.816188087905496e-06, "loss": 2.2574, "step": 506730 }, { "epoch": 0.88, "learning_rate": 5.81531614797867e-06, "loss": 2.2064, "step": 506740 }, { "epoch": 0.88, "learning_rate": 5.814444208051843e-06, "loss": 2.334, "step": 506750 }, { "epoch": 0.88, "learning_rate": 5.813572268125016e-06, "loss": 2.2757, "step": 506760 }, { "epoch": 0.88, "learning_rate": 5.8127003281981885e-06, "loss": 2.2326, "step": 506770 }, { "epoch": 0.88, "learning_rate": 5.811828388271362e-06, "loss": 2.2112, "step": 506780 }, { "epoch": 0.88, "learning_rate": 5.810956448344535e-06, "loss": 2.3646, "step": 506790 }, { "epoch": 0.88, "learning_rate": 5.810084508417708e-06, "loss": 2.28, "step": 506800 }, { "epoch": 0.88, "learning_rate": 5.809212568490881e-06, "loss": 2.4025, "step": 506810 }, { "epoch": 0.88, "learning_rate": 5.808340628564055e-06, "loss": 2.285, "step": 506820 }, { "epoch": 0.88, "learning_rate": 5.807468688637228e-06, "loss": 2.2277, "step": 506830 }, { "epoch": 0.88, "learning_rate": 5.806596748710401e-06, "loss": 2.2025, "step": 506840 }, { "epoch": 0.88, "learning_rate": 5.805724808783574e-06, "loss": 2.2385, "step": 506850 }, { "epoch": 0.88, "learning_rate": 5.804852868856748e-06, "loss": 2.279, "step": 506860 }, { "epoch": 0.88, "learning_rate": 5.803980928929921e-06, "loss": 2.2824, "step": 506870 }, { "epoch": 0.88, "learning_rate": 5.803108989003094e-06, "loss": 2.33, "step": 506880 }, { "epoch": 0.88, "learning_rate": 5.802237049076267e-06, "loss": 2.2934, "step": 506890 }, { "epoch": 0.88, "learning_rate": 5.801365109149441e-06, "loss": 2.3387, "step": 506900 }, { "epoch": 0.88, "learning_rate": 5.800493169222614e-06, "loss": 2.2666, "step": 506910 }, { "epoch": 0.88, "learning_rate": 5.799621229295787e-06, "loss": 2.1586, "step": 506920 }, { "epoch": 0.88, "learning_rate": 5.7987492893689595e-06, "loss": 2.4137, "step": 506930 }, { "epoch": 0.88, "learning_rate": 5.797877349442133e-06, "loss": 2.2563, "step": 506940 }, { "epoch": 0.88, "learning_rate": 5.797005409515306e-06, "loss": 2.3133, "step": 506950 }, { "epoch": 0.88, "learning_rate": 5.796133469588479e-06, "loss": 2.3061, "step": 506960 }, { "epoch": 0.88, "learning_rate": 5.795261529661652e-06, "loss": 2.2821, "step": 506970 }, { "epoch": 0.88, "learning_rate": 5.794389589734826e-06, "loss": 2.1772, "step": 506980 }, { "epoch": 0.88, "learning_rate": 5.793517649807999e-06, "loss": 2.2926, "step": 506990 }, { "epoch": 0.88, "learning_rate": 5.7926457098811725e-06, "loss": 2.1406, "step": 507000 }, { "epoch": 0.88, "learning_rate": 5.7917737699543455e-06, "loss": 2.2409, "step": 507010 }, { "epoch": 0.88, "learning_rate": 5.790901830027519e-06, "loss": 2.18, "step": 507020 }, { "epoch": 0.88, "learning_rate": 5.790029890100692e-06, "loss": 2.3222, "step": 507030 }, { "epoch": 0.88, "learning_rate": 5.789157950173865e-06, "loss": 2.2658, "step": 507040 }, { "epoch": 0.88, "learning_rate": 5.788286010247038e-06, "loss": 2.3395, "step": 507050 }, { "epoch": 0.88, "learning_rate": 5.787414070320212e-06, "loss": 2.2941, "step": 507060 }, { "epoch": 0.88, "learning_rate": 5.786542130393385e-06, "loss": 2.1891, "step": 507070 }, { "epoch": 0.88, "learning_rate": 5.785670190466558e-06, "loss": 2.3804, "step": 507080 }, { "epoch": 0.88, "learning_rate": 5.7847982505397305e-06, "loss": 2.3123, "step": 507090 }, { "epoch": 0.88, "learning_rate": 5.783926310612904e-06, "loss": 2.3092, "step": 507100 }, { "epoch": 0.88, "learning_rate": 5.783054370686077e-06, "loss": 2.2597, "step": 507110 }, { "epoch": 0.88, "learning_rate": 5.78218243075925e-06, "loss": 2.2342, "step": 507120 }, { "epoch": 0.88, "learning_rate": 5.781310490832424e-06, "loss": 2.3818, "step": 507130 }, { "epoch": 0.88, "learning_rate": 5.780438550905598e-06, "loss": 2.3167, "step": 507140 }, { "epoch": 0.88, "learning_rate": 5.779566610978771e-06, "loss": 2.1835, "step": 507150 }, { "epoch": 0.88, "learning_rate": 5.7786946710519435e-06, "loss": 2.3104, "step": 507160 }, { "epoch": 0.88, "learning_rate": 5.7778227311251165e-06, "loss": 2.2155, "step": 507170 }, { "epoch": 0.88, "learning_rate": 5.77695079119829e-06, "loss": 2.3822, "step": 507180 }, { "epoch": 0.88, "learning_rate": 5.776078851271463e-06, "loss": 2.2339, "step": 507190 }, { "epoch": 0.88, "learning_rate": 5.775206911344636e-06, "loss": 2.1568, "step": 507200 }, { "epoch": 0.88, "learning_rate": 5.774334971417809e-06, "loss": 2.2835, "step": 507210 }, { "epoch": 0.88, "learning_rate": 5.773463031490983e-06, "loss": 2.1812, "step": 507220 }, { "epoch": 0.88, "learning_rate": 5.772591091564156e-06, "loss": 2.207, "step": 507230 }, { "epoch": 0.88, "learning_rate": 5.771719151637329e-06, "loss": 2.2133, "step": 507240 }, { "epoch": 0.88, "learning_rate": 5.770847211710502e-06, "loss": 2.1831, "step": 507250 }, { "epoch": 0.88, "learning_rate": 5.769975271783676e-06, "loss": 2.1571, "step": 507260 }, { "epoch": 0.88, "learning_rate": 5.769103331856849e-06, "loss": 2.2771, "step": 507270 }, { "epoch": 0.88, "learning_rate": 5.768231391930022e-06, "loss": 2.2669, "step": 507280 }, { "epoch": 0.88, "learning_rate": 5.767359452003195e-06, "loss": 2.2692, "step": 507290 }, { "epoch": 0.88, "learning_rate": 5.766487512076369e-06, "loss": 2.2293, "step": 507300 }, { "epoch": 0.88, "learning_rate": 5.765615572149542e-06, "loss": 2.2946, "step": 507310 }, { "epoch": 0.88, "learning_rate": 5.7647436322227145e-06, "loss": 2.3794, "step": 507320 }, { "epoch": 0.88, "learning_rate": 5.7638716922958875e-06, "loss": 2.2572, "step": 507330 }, { "epoch": 0.88, "learning_rate": 5.762999752369061e-06, "loss": 2.2854, "step": 507340 }, { "epoch": 0.88, "learning_rate": 5.762127812442234e-06, "loss": 2.2377, "step": 507350 }, { "epoch": 0.88, "learning_rate": 5.761255872515407e-06, "loss": 2.3623, "step": 507360 }, { "epoch": 0.88, "learning_rate": 5.76038393258858e-06, "loss": 2.3184, "step": 507370 }, { "epoch": 0.88, "learning_rate": 5.759511992661754e-06, "loss": 2.2181, "step": 507380 }, { "epoch": 0.88, "learning_rate": 5.758640052734927e-06, "loss": 2.0929, "step": 507390 }, { "epoch": 0.88, "learning_rate": 5.7577681128081005e-06, "loss": 2.2355, "step": 507400 }, { "epoch": 0.88, "learning_rate": 5.756896172881273e-06, "loss": 2.2028, "step": 507410 }, { "epoch": 0.88, "learning_rate": 5.756024232954447e-06, "loss": 2.324, "step": 507420 }, { "epoch": 0.88, "learning_rate": 5.75515229302762e-06, "loss": 2.3351, "step": 507430 }, { "epoch": 0.88, "learning_rate": 5.754280353100793e-06, "loss": 2.2654, "step": 507440 }, { "epoch": 0.88, "learning_rate": 5.753408413173966e-06, "loss": 2.2679, "step": 507450 }, { "epoch": 0.88, "learning_rate": 5.75253647324714e-06, "loss": 2.2423, "step": 507460 }, { "epoch": 0.88, "learning_rate": 5.751664533320313e-06, "loss": 2.2844, "step": 507470 }, { "epoch": 0.88, "learning_rate": 5.7507925933934855e-06, "loss": 2.327, "step": 507480 }, { "epoch": 0.89, "learning_rate": 5.7499206534666585e-06, "loss": 2.1965, "step": 507490 }, { "epoch": 0.89, "learning_rate": 5.749048713539832e-06, "loss": 2.2727, "step": 507500 }, { "epoch": 0.89, "learning_rate": 5.748176773613005e-06, "loss": 2.2318, "step": 507510 }, { "epoch": 0.89, "learning_rate": 5.747304833686178e-06, "loss": 2.2222, "step": 507520 }, { "epoch": 0.89, "learning_rate": 5.746432893759352e-06, "loss": 2.2806, "step": 507530 }, { "epoch": 0.89, "learning_rate": 5.745560953832526e-06, "loss": 2.2742, "step": 507540 }, { "epoch": 0.89, "learning_rate": 5.7446890139056985e-06, "loss": 2.2687, "step": 507550 }, { "epoch": 0.89, "learning_rate": 5.7438170739788715e-06, "loss": 2.2482, "step": 507560 }, { "epoch": 0.89, "learning_rate": 5.742945134052044e-06, "loss": 2.2421, "step": 507570 }, { "epoch": 0.89, "learning_rate": 5.742073194125218e-06, "loss": 2.3521, "step": 507580 }, { "epoch": 0.89, "learning_rate": 5.741201254198391e-06, "loss": 2.2226, "step": 507590 }, { "epoch": 0.89, "learning_rate": 5.740329314271564e-06, "loss": 2.2991, "step": 507600 }, { "epoch": 0.89, "learning_rate": 5.739457374344737e-06, "loss": 2.1765, "step": 507610 }, { "epoch": 0.89, "learning_rate": 5.738585434417911e-06, "loss": 2.2347, "step": 507620 }, { "epoch": 0.89, "learning_rate": 5.737713494491084e-06, "loss": 2.3583, "step": 507630 }, { "epoch": 0.89, "learning_rate": 5.7368415545642565e-06, "loss": 2.337, "step": 507640 }, { "epoch": 0.89, "learning_rate": 5.73596961463743e-06, "loss": 2.2809, "step": 507650 }, { "epoch": 0.89, "learning_rate": 5.735097674710604e-06, "loss": 2.3128, "step": 507660 }, { "epoch": 0.89, "learning_rate": 5.734225734783777e-06, "loss": 2.2637, "step": 507670 }, { "epoch": 0.89, "learning_rate": 5.73335379485695e-06, "loss": 2.3128, "step": 507680 }, { "epoch": 0.89, "learning_rate": 5.732481854930123e-06, "loss": 2.3341, "step": 507690 }, { "epoch": 0.89, "learning_rate": 5.731609915003297e-06, "loss": 2.1824, "step": 507700 }, { "epoch": 0.89, "learning_rate": 5.7307379750764695e-06, "loss": 2.1223, "step": 507710 }, { "epoch": 0.89, "learning_rate": 5.7298660351496425e-06, "loss": 2.3157, "step": 507720 }, { "epoch": 0.89, "learning_rate": 5.728994095222815e-06, "loss": 2.2845, "step": 507730 }, { "epoch": 0.89, "learning_rate": 5.728122155295989e-06, "loss": 2.1556, "step": 507740 }, { "epoch": 0.89, "learning_rate": 5.727250215369162e-06, "loss": 2.1919, "step": 507750 }, { "epoch": 0.89, "learning_rate": 5.726378275442335e-06, "loss": 2.3584, "step": 507760 }, { "epoch": 0.89, "learning_rate": 5.725506335515509e-06, "loss": 2.3213, "step": 507770 }, { "epoch": 0.89, "learning_rate": 5.724634395588682e-06, "loss": 2.2011, "step": 507780 }, { "epoch": 0.89, "learning_rate": 5.723762455661855e-06, "loss": 2.2641, "step": 507790 }, { "epoch": 0.89, "learning_rate": 5.722890515735028e-06, "loss": 2.1921, "step": 507800 }, { "epoch": 0.89, "learning_rate": 5.722018575808201e-06, "loss": 2.2275, "step": 507810 }, { "epoch": 0.89, "learning_rate": 5.721146635881375e-06, "loss": 2.2031, "step": 507820 }, { "epoch": 0.89, "learning_rate": 5.720274695954548e-06, "loss": 2.1487, "step": 507830 }, { "epoch": 0.89, "learning_rate": 5.719402756027721e-06, "loss": 2.2538, "step": 507840 }, { "epoch": 0.89, "learning_rate": 5.718530816100894e-06, "loss": 2.275, "step": 507850 }, { "epoch": 0.89, "learning_rate": 5.717658876174068e-06, "loss": 2.2334, "step": 507860 }, { "epoch": 0.89, "learning_rate": 5.7167869362472405e-06, "loss": 2.2557, "step": 507870 }, { "epoch": 0.89, "learning_rate": 5.7159149963204135e-06, "loss": 2.256, "step": 507880 }, { "epoch": 0.89, "learning_rate": 5.715043056393586e-06, "loss": 2.4313, "step": 507890 }, { "epoch": 0.89, "learning_rate": 5.71417111646676e-06, "loss": 2.3864, "step": 507900 }, { "epoch": 0.89, "learning_rate": 5.713299176539933e-06, "loss": 2.2452, "step": 507910 }, { "epoch": 0.89, "learning_rate": 5.712427236613106e-06, "loss": 2.2527, "step": 507920 }, { "epoch": 0.89, "learning_rate": 5.71155529668628e-06, "loss": 2.2199, "step": 507930 }, { "epoch": 0.89, "learning_rate": 5.7106833567594535e-06, "loss": 2.2827, "step": 507940 }, { "epoch": 0.89, "learning_rate": 5.7098114168326265e-06, "loss": 2.222, "step": 507950 }, { "epoch": 0.89, "learning_rate": 5.708939476905799e-06, "loss": 2.2148, "step": 507960 }, { "epoch": 0.89, "learning_rate": 5.708067536978972e-06, "loss": 2.2388, "step": 507970 }, { "epoch": 0.89, "learning_rate": 5.707195597052146e-06, "loss": 2.3229, "step": 507980 }, { "epoch": 0.89, "learning_rate": 5.706323657125319e-06, "loss": 2.3126, "step": 507990 }, { "epoch": 0.89, "learning_rate": 5.705451717198492e-06, "loss": 2.1982, "step": 508000 }, { "epoch": 0.89, "learning_rate": 5.704579777271665e-06, "loss": 2.2714, "step": 508010 }, { "epoch": 0.89, "learning_rate": 5.703707837344839e-06, "loss": 2.3084, "step": 508020 }, { "epoch": 0.89, "learning_rate": 5.7028358974180115e-06, "loss": 2.2577, "step": 508030 }, { "epoch": 0.89, "learning_rate": 5.7019639574911845e-06, "loss": 2.2718, "step": 508040 }, { "epoch": 0.89, "learning_rate": 5.701092017564358e-06, "loss": 2.1751, "step": 508050 }, { "epoch": 0.89, "learning_rate": 5.700220077637532e-06, "loss": 2.3317, "step": 508060 }, { "epoch": 0.89, "learning_rate": 5.699348137710705e-06, "loss": 2.3454, "step": 508070 }, { "epoch": 0.89, "learning_rate": 5.698476197783878e-06, "loss": 2.2169, "step": 508080 }, { "epoch": 0.89, "learning_rate": 5.697604257857051e-06, "loss": 2.2388, "step": 508090 }, { "epoch": 0.89, "learning_rate": 5.6967323179302245e-06, "loss": 2.2028, "step": 508100 }, { "epoch": 0.89, "learning_rate": 5.6958603780033975e-06, "loss": 2.1465, "step": 508110 }, { "epoch": 0.89, "learning_rate": 5.69498843807657e-06, "loss": 2.3082, "step": 508120 }, { "epoch": 0.89, "learning_rate": 5.694116498149743e-06, "loss": 2.2831, "step": 508130 }, { "epoch": 0.89, "learning_rate": 5.693244558222917e-06, "loss": 2.2562, "step": 508140 }, { "epoch": 0.89, "learning_rate": 5.69237261829609e-06, "loss": 2.2695, "step": 508150 }, { "epoch": 0.89, "learning_rate": 5.691500678369263e-06, "loss": 2.1748, "step": 508160 }, { "epoch": 0.89, "learning_rate": 5.690628738442437e-06, "loss": 2.2731, "step": 508170 }, { "epoch": 0.89, "learning_rate": 5.68975679851561e-06, "loss": 2.2868, "step": 508180 }, { "epoch": 0.89, "learning_rate": 5.688884858588783e-06, "loss": 2.3056, "step": 508190 }, { "epoch": 0.89, "learning_rate": 5.688012918661956e-06, "loss": 2.2643, "step": 508200 }, { "epoch": 0.89, "learning_rate": 5.687140978735129e-06, "loss": 2.359, "step": 508210 }, { "epoch": 0.89, "learning_rate": 5.686269038808303e-06, "loss": 2.3279, "step": 508220 }, { "epoch": 0.89, "learning_rate": 5.685397098881476e-06, "loss": 2.2654, "step": 508230 }, { "epoch": 0.89, "learning_rate": 5.684525158954649e-06, "loss": 2.2779, "step": 508240 }, { "epoch": 0.89, "learning_rate": 5.683653219027822e-06, "loss": 2.2687, "step": 508250 }, { "epoch": 0.89, "learning_rate": 5.6827812791009955e-06, "loss": 2.3052, "step": 508260 }, { "epoch": 0.89, "learning_rate": 5.6819093391741685e-06, "loss": 2.149, "step": 508270 }, { "epoch": 0.89, "learning_rate": 5.681037399247341e-06, "loss": 2.3526, "step": 508280 }, { "epoch": 0.89, "learning_rate": 5.680165459320515e-06, "loss": 2.3333, "step": 508290 }, { "epoch": 0.89, "learning_rate": 5.679293519393688e-06, "loss": 2.2149, "step": 508300 }, { "epoch": 0.89, "learning_rate": 5.678421579466861e-06, "loss": 2.2141, "step": 508310 }, { "epoch": 0.89, "learning_rate": 5.677549639540034e-06, "loss": 2.2877, "step": 508320 }, { "epoch": 0.89, "learning_rate": 5.676677699613208e-06, "loss": 2.4112, "step": 508330 }, { "epoch": 0.89, "learning_rate": 5.6758057596863815e-06, "loss": 2.2136, "step": 508340 }, { "epoch": 0.89, "learning_rate": 5.674933819759554e-06, "loss": 2.4205, "step": 508350 }, { "epoch": 0.89, "learning_rate": 5.674061879832727e-06, "loss": 2.2566, "step": 508360 }, { "epoch": 0.89, "learning_rate": 5.6731899399059e-06, "loss": 2.2396, "step": 508370 }, { "epoch": 0.89, "learning_rate": 5.672317999979074e-06, "loss": 2.2402, "step": 508380 }, { "epoch": 0.89, "learning_rate": 5.671446060052247e-06, "loss": 2.2509, "step": 508390 }, { "epoch": 0.89, "learning_rate": 5.67057412012542e-06, "loss": 2.3423, "step": 508400 }, { "epoch": 0.89, "learning_rate": 5.669702180198593e-06, "loss": 2.2695, "step": 508410 }, { "epoch": 0.89, "learning_rate": 5.6688302402717665e-06, "loss": 2.2431, "step": 508420 }, { "epoch": 0.89, "learning_rate": 5.6679583003449395e-06, "loss": 2.3034, "step": 508430 }, { "epoch": 0.89, "learning_rate": 5.667086360418112e-06, "loss": 2.2382, "step": 508440 }, { "epoch": 0.89, "learning_rate": 5.666214420491286e-06, "loss": 2.2747, "step": 508450 }, { "epoch": 0.89, "learning_rate": 5.66534248056446e-06, "loss": 2.1605, "step": 508460 }, { "epoch": 0.89, "learning_rate": 5.664470540637633e-06, "loss": 2.1508, "step": 508470 }, { "epoch": 0.89, "learning_rate": 5.663598600710806e-06, "loss": 2.2271, "step": 508480 }, { "epoch": 0.89, "learning_rate": 5.662726660783979e-06, "loss": 2.2681, "step": 508490 }, { "epoch": 0.89, "learning_rate": 5.6618547208571525e-06, "loss": 2.3624, "step": 508500 }, { "epoch": 0.89, "learning_rate": 5.660982780930325e-06, "loss": 2.2473, "step": 508510 }, { "epoch": 0.89, "learning_rate": 5.660110841003498e-06, "loss": 2.2852, "step": 508520 }, { "epoch": 0.89, "learning_rate": 5.659238901076671e-06, "loss": 2.1924, "step": 508530 }, { "epoch": 0.89, "learning_rate": 5.658366961149845e-06, "loss": 2.3621, "step": 508540 }, { "epoch": 0.89, "learning_rate": 5.657495021223018e-06, "loss": 2.2584, "step": 508550 }, { "epoch": 0.89, "learning_rate": 5.656623081296191e-06, "loss": 2.1234, "step": 508560 }, { "epoch": 0.89, "learning_rate": 5.655751141369365e-06, "loss": 2.2888, "step": 508570 }, { "epoch": 0.89, "learning_rate": 5.6548792014425375e-06, "loss": 2.2229, "step": 508580 }, { "epoch": 0.89, "learning_rate": 5.654007261515711e-06, "loss": 2.1316, "step": 508590 }, { "epoch": 0.89, "learning_rate": 5.653135321588884e-06, "loss": 2.2716, "step": 508600 }, { "epoch": 0.89, "learning_rate": 5.652263381662057e-06, "loss": 2.3036, "step": 508610 }, { "epoch": 0.89, "learning_rate": 5.651391441735231e-06, "loss": 2.2546, "step": 508620 }, { "epoch": 0.89, "learning_rate": 5.650519501808404e-06, "loss": 2.276, "step": 508630 }, { "epoch": 0.89, "learning_rate": 5.649647561881577e-06, "loss": 2.1455, "step": 508640 }, { "epoch": 0.89, "learning_rate": 5.64877562195475e-06, "loss": 2.1219, "step": 508650 }, { "epoch": 0.89, "learning_rate": 5.6479036820279235e-06, "loss": 2.2864, "step": 508660 }, { "epoch": 0.89, "learning_rate": 5.647031742101096e-06, "loss": 2.2614, "step": 508670 }, { "epoch": 0.89, "learning_rate": 5.646159802174269e-06, "loss": 2.3457, "step": 508680 }, { "epoch": 0.89, "learning_rate": 5.645287862247443e-06, "loss": 2.3227, "step": 508690 }, { "epoch": 0.89, "learning_rate": 5.644415922320616e-06, "loss": 2.3275, "step": 508700 }, { "epoch": 0.89, "learning_rate": 5.643543982393789e-06, "loss": 2.3277, "step": 508710 }, { "epoch": 0.89, "learning_rate": 5.642672042466962e-06, "loss": 2.37, "step": 508720 }, { "epoch": 0.89, "learning_rate": 5.641800102540136e-06, "loss": 2.2139, "step": 508730 }, { "epoch": 0.89, "learning_rate": 5.640928162613309e-06, "loss": 2.2418, "step": 508740 }, { "epoch": 0.89, "learning_rate": 5.640056222686482e-06, "loss": 2.3203, "step": 508750 }, { "epoch": 0.89, "learning_rate": 5.639184282759655e-06, "loss": 2.2974, "step": 508760 }, { "epoch": 0.89, "learning_rate": 5.638312342832828e-06, "loss": 2.283, "step": 508770 }, { "epoch": 0.89, "learning_rate": 5.637440402906002e-06, "loss": 2.1615, "step": 508780 }, { "epoch": 0.89, "learning_rate": 5.636568462979175e-06, "loss": 2.3011, "step": 508790 }, { "epoch": 0.89, "learning_rate": 5.635696523052348e-06, "loss": 2.2619, "step": 508800 }, { "epoch": 0.89, "learning_rate": 5.6348245831255216e-06, "loss": 2.1892, "step": 508810 }, { "epoch": 0.89, "learning_rate": 5.6339526431986945e-06, "loss": 2.2376, "step": 508820 }, { "epoch": 0.89, "learning_rate": 5.633080703271867e-06, "loss": 2.2442, "step": 508830 }, { "epoch": 0.89, "learning_rate": 5.63220876334504e-06, "loss": 2.2402, "step": 508840 }, { "epoch": 0.89, "learning_rate": 5.631336823418214e-06, "loss": 2.2933, "step": 508850 }, { "epoch": 0.89, "learning_rate": 5.630464883491388e-06, "loss": 2.2493, "step": 508860 }, { "epoch": 0.89, "learning_rate": 5.629592943564561e-06, "loss": 2.3678, "step": 508870 }, { "epoch": 0.89, "learning_rate": 5.628721003637734e-06, "loss": 2.258, "step": 508880 }, { "epoch": 0.89, "learning_rate": 5.627849063710907e-06, "loss": 2.1946, "step": 508890 }, { "epoch": 0.89, "learning_rate": 5.62697712378408e-06, "loss": 2.3496, "step": 508900 }, { "epoch": 0.89, "learning_rate": 5.626105183857253e-06, "loss": 2.1847, "step": 508910 }, { "epoch": 0.89, "learning_rate": 5.625233243930426e-06, "loss": 2.2342, "step": 508920 }, { "epoch": 0.89, "learning_rate": 5.6243613040036e-06, "loss": 2.2799, "step": 508930 }, { "epoch": 0.89, "learning_rate": 5.623489364076773e-06, "loss": 2.1736, "step": 508940 }, { "epoch": 0.89, "learning_rate": 5.622617424149946e-06, "loss": 2.2335, "step": 508950 }, { "epoch": 0.89, "learning_rate": 5.621745484223119e-06, "loss": 2.2124, "step": 508960 }, { "epoch": 0.89, "learning_rate": 5.6208735442962926e-06, "loss": 2.2341, "step": 508970 }, { "epoch": 0.89, "learning_rate": 5.6200016043694655e-06, "loss": 2.2023, "step": 508980 }, { "epoch": 0.89, "learning_rate": 5.619129664442639e-06, "loss": 2.1772, "step": 508990 }, { "epoch": 0.89, "learning_rate": 5.618257724515812e-06, "loss": 2.2641, "step": 509000 }, { "epoch": 0.89, "learning_rate": 5.617385784588985e-06, "loss": 2.3531, "step": 509010 }, { "epoch": 0.89, "learning_rate": 5.616513844662159e-06, "loss": 2.3268, "step": 509020 }, { "epoch": 0.89, "learning_rate": 5.615641904735332e-06, "loss": 2.3518, "step": 509030 }, { "epoch": 0.89, "learning_rate": 5.614769964808505e-06, "loss": 2.1771, "step": 509040 }, { "epoch": 0.89, "learning_rate": 5.613898024881678e-06, "loss": 2.1436, "step": 509050 }, { "epoch": 0.89, "learning_rate": 5.613026084954851e-06, "loss": 2.2757, "step": 509060 }, { "epoch": 0.89, "learning_rate": 5.612154145028024e-06, "loss": 2.2329, "step": 509070 }, { "epoch": 0.89, "learning_rate": 5.611282205101197e-06, "loss": 2.1862, "step": 509080 }, { "epoch": 0.89, "learning_rate": 5.610410265174371e-06, "loss": 2.2006, "step": 509090 }, { "epoch": 0.89, "learning_rate": 5.609538325247544e-06, "loss": 2.2121, "step": 509100 }, { "epoch": 0.89, "learning_rate": 5.608666385320717e-06, "loss": 2.2618, "step": 509110 }, { "epoch": 0.89, "learning_rate": 5.60779444539389e-06, "loss": 2.1605, "step": 509120 }, { "epoch": 0.89, "learning_rate": 5.6069225054670636e-06, "loss": 2.2777, "step": 509130 }, { "epoch": 0.89, "learning_rate": 5.606050565540237e-06, "loss": 2.1992, "step": 509140 }, { "epoch": 0.89, "learning_rate": 5.60517862561341e-06, "loss": 2.4289, "step": 509150 }, { "epoch": 0.89, "learning_rate": 5.604306685686583e-06, "loss": 2.2566, "step": 509160 }, { "epoch": 0.89, "learning_rate": 5.603434745759756e-06, "loss": 2.1922, "step": 509170 }, { "epoch": 0.89, "learning_rate": 5.60256280583293e-06, "loss": 2.3092, "step": 509180 }, { "epoch": 0.89, "learning_rate": 5.601690865906103e-06, "loss": 2.256, "step": 509190 }, { "epoch": 0.89, "learning_rate": 5.600818925979276e-06, "loss": 2.3, "step": 509200 }, { "epoch": 0.89, "learning_rate": 5.5999469860524495e-06, "loss": 2.2695, "step": 509210 }, { "epoch": 0.89, "learning_rate": 5.599075046125622e-06, "loss": 2.2693, "step": 509220 }, { "epoch": 0.89, "learning_rate": 5.598203106198795e-06, "loss": 2.2433, "step": 509230 }, { "epoch": 0.89, "learning_rate": 5.597331166271968e-06, "loss": 2.3508, "step": 509240 }, { "epoch": 0.89, "learning_rate": 5.596459226345142e-06, "loss": 2.2617, "step": 509250 }, { "epoch": 0.89, "learning_rate": 5.595587286418316e-06, "loss": 2.3461, "step": 509260 }, { "epoch": 0.89, "learning_rate": 5.594715346491489e-06, "loss": 2.3406, "step": 509270 }, { "epoch": 0.89, "learning_rate": 5.593843406564662e-06, "loss": 2.2003, "step": 509280 }, { "epoch": 0.89, "learning_rate": 5.5929714666378346e-06, "loss": 2.3152, "step": 509290 }, { "epoch": 0.89, "learning_rate": 5.592099526711008e-06, "loss": 2.3209, "step": 509300 }, { "epoch": 0.89, "learning_rate": 5.591227586784181e-06, "loss": 2.316, "step": 509310 }, { "epoch": 0.89, "learning_rate": 5.590355646857354e-06, "loss": 2.2704, "step": 509320 }, { "epoch": 0.89, "learning_rate": 5.589483706930528e-06, "loss": 2.2949, "step": 509330 }, { "epoch": 0.89, "learning_rate": 5.588611767003701e-06, "loss": 2.2128, "step": 509340 }, { "epoch": 0.89, "learning_rate": 5.587739827076874e-06, "loss": 2.2718, "step": 509350 }, { "epoch": 0.89, "learning_rate": 5.586867887150047e-06, "loss": 2.2374, "step": 509360 }, { "epoch": 0.89, "learning_rate": 5.5859959472232205e-06, "loss": 2.3771, "step": 509370 }, { "epoch": 0.89, "learning_rate": 5.585124007296393e-06, "loss": 2.2608, "step": 509380 }, { "epoch": 0.89, "learning_rate": 5.584252067369567e-06, "loss": 2.3412, "step": 509390 }, { "epoch": 0.89, "learning_rate": 5.58338012744274e-06, "loss": 2.3458, "step": 509400 }, { "epoch": 0.89, "learning_rate": 5.582508187515913e-06, "loss": 2.229, "step": 509410 }, { "epoch": 0.89, "learning_rate": 5.581636247589087e-06, "loss": 2.1803, "step": 509420 }, { "epoch": 0.89, "learning_rate": 5.58076430766226e-06, "loss": 2.3263, "step": 509430 }, { "epoch": 0.89, "learning_rate": 5.579892367735433e-06, "loss": 2.3836, "step": 509440 }, { "epoch": 0.89, "learning_rate": 5.579020427808606e-06, "loss": 2.3734, "step": 509450 }, { "epoch": 0.89, "learning_rate": 5.578148487881779e-06, "loss": 2.2686, "step": 509460 }, { "epoch": 0.89, "learning_rate": 5.577276547954952e-06, "loss": 2.2114, "step": 509470 }, { "epoch": 0.89, "learning_rate": 5.576404608028125e-06, "loss": 2.2455, "step": 509480 }, { "epoch": 0.89, "learning_rate": 5.575532668101299e-06, "loss": 2.2265, "step": 509490 }, { "epoch": 0.89, "learning_rate": 5.574660728174472e-06, "loss": 2.2569, "step": 509500 }, { "epoch": 0.89, "learning_rate": 5.573788788247645e-06, "loss": 2.3354, "step": 509510 }, { "epoch": 0.89, "learning_rate": 5.5729168483208186e-06, "loss": 2.2563, "step": 509520 }, { "epoch": 0.89, "learning_rate": 5.5720449083939915e-06, "loss": 2.2377, "step": 509530 }, { "epoch": 0.89, "learning_rate": 5.571172968467165e-06, "loss": 2.1521, "step": 509540 }, { "epoch": 0.89, "learning_rate": 5.570301028540338e-06, "loss": 2.2455, "step": 509550 }, { "epoch": 0.89, "learning_rate": 5.569429088613511e-06, "loss": 2.2584, "step": 509560 }, { "epoch": 0.89, "learning_rate": 5.568557148686684e-06, "loss": 2.1928, "step": 509570 }, { "epoch": 0.89, "learning_rate": 5.567685208759858e-06, "loss": 2.3143, "step": 509580 }, { "epoch": 0.89, "learning_rate": 5.566813268833031e-06, "loss": 2.2344, "step": 509590 }, { "epoch": 0.89, "learning_rate": 5.565941328906204e-06, "loss": 2.2295, "step": 509600 }, { "epoch": 0.89, "learning_rate": 5.565069388979377e-06, "loss": 2.2551, "step": 509610 }, { "epoch": 0.89, "learning_rate": 5.56419744905255e-06, "loss": 2.1605, "step": 509620 }, { "epoch": 0.89, "learning_rate": 5.563325509125723e-06, "loss": 2.3948, "step": 509630 }, { "epoch": 0.89, "learning_rate": 5.562453569198896e-06, "loss": 2.2506, "step": 509640 }, { "epoch": 0.89, "learning_rate": 5.56158162927207e-06, "loss": 2.1878, "step": 509650 }, { "epoch": 0.89, "learning_rate": 5.560709689345244e-06, "loss": 2.1889, "step": 509660 }, { "epoch": 0.89, "learning_rate": 5.559837749418417e-06, "loss": 2.3158, "step": 509670 }, { "epoch": 0.89, "learning_rate": 5.5589658094915896e-06, "loss": 2.3191, "step": 509680 }, { "epoch": 0.89, "learning_rate": 5.5580938695647625e-06, "loss": 2.3427, "step": 509690 }, { "epoch": 0.89, "learning_rate": 5.557221929637936e-06, "loss": 2.2423, "step": 509700 }, { "epoch": 0.89, "learning_rate": 5.556349989711109e-06, "loss": 2.2898, "step": 509710 }, { "epoch": 0.89, "learning_rate": 5.555478049784282e-06, "loss": 2.2235, "step": 509720 }, { "epoch": 0.89, "learning_rate": 5.554606109857456e-06, "loss": 2.2739, "step": 509730 }, { "epoch": 0.89, "learning_rate": 5.553734169930629e-06, "loss": 2.2351, "step": 509740 }, { "epoch": 0.89, "learning_rate": 5.552862230003802e-06, "loss": 2.3216, "step": 509750 }, { "epoch": 0.89, "learning_rate": 5.551990290076975e-06, "loss": 2.2189, "step": 509760 }, { "epoch": 0.89, "learning_rate": 5.551118350150148e-06, "loss": 2.2153, "step": 509770 }, { "epoch": 0.89, "learning_rate": 5.550246410223321e-06, "loss": 2.3335, "step": 509780 }, { "epoch": 0.89, "learning_rate": 5.549374470296495e-06, "loss": 2.1769, "step": 509790 }, { "epoch": 0.89, "learning_rate": 5.548502530369668e-06, "loss": 2.3327, "step": 509800 }, { "epoch": 0.89, "learning_rate": 5.547630590442841e-06, "loss": 2.3144, "step": 509810 }, { "epoch": 0.89, "learning_rate": 5.546758650516015e-06, "loss": 2.3472, "step": 509820 }, { "epoch": 0.89, "learning_rate": 5.545886710589188e-06, "loss": 2.3731, "step": 509830 }, { "epoch": 0.89, "learning_rate": 5.5450147706623606e-06, "loss": 2.1678, "step": 509840 }, { "epoch": 0.89, "learning_rate": 5.544142830735534e-06, "loss": 2.2282, "step": 509850 }, { "epoch": 0.89, "learning_rate": 5.543270890808707e-06, "loss": 2.274, "step": 509860 }, { "epoch": 0.89, "learning_rate": 5.54239895088188e-06, "loss": 2.2727, "step": 509870 }, { "epoch": 0.89, "learning_rate": 5.541527010955053e-06, "loss": 2.2405, "step": 509880 }, { "epoch": 0.89, "learning_rate": 5.540655071028227e-06, "loss": 2.3198, "step": 509890 }, { "epoch": 0.89, "learning_rate": 5.5397831311014e-06, "loss": 2.1958, "step": 509900 }, { "epoch": 0.89, "learning_rate": 5.538911191174573e-06, "loss": 2.3599, "step": 509910 }, { "epoch": 0.89, "learning_rate": 5.5380392512477465e-06, "loss": 2.1867, "step": 509920 }, { "epoch": 0.89, "learning_rate": 5.537167311320919e-06, "loss": 2.3251, "step": 509930 }, { "epoch": 0.89, "learning_rate": 5.536295371394093e-06, "loss": 2.2423, "step": 509940 }, { "epoch": 0.89, "learning_rate": 5.535423431467266e-06, "loss": 2.2667, "step": 509950 }, { "epoch": 0.89, "learning_rate": 5.534551491540439e-06, "loss": 2.2884, "step": 509960 }, { "epoch": 0.89, "learning_rate": 5.533679551613613e-06, "loss": 2.3662, "step": 509970 }, { "epoch": 0.89, "learning_rate": 5.532807611686786e-06, "loss": 2.2808, "step": 509980 }, { "epoch": 0.89, "learning_rate": 5.531935671759959e-06, "loss": 2.3832, "step": 509990 }, { "epoch": 0.89, "learning_rate": 5.5310637318331316e-06, "loss": 2.4144, "step": 510000 }, { "epoch": 0.89, "learning_rate": 5.530191791906305e-06, "loss": 2.2125, "step": 510010 }, { "epoch": 0.89, "learning_rate": 5.529319851979478e-06, "loss": 2.3048, "step": 510020 }, { "epoch": 0.89, "learning_rate": 5.528447912052651e-06, "loss": 2.2973, "step": 510030 }, { "epoch": 0.89, "learning_rate": 5.527575972125824e-06, "loss": 2.3235, "step": 510040 }, { "epoch": 0.89, "learning_rate": 5.526704032198998e-06, "loss": 2.2495, "step": 510050 }, { "epoch": 0.89, "learning_rate": 5.525832092272172e-06, "loss": 2.2436, "step": 510060 }, { "epoch": 0.89, "learning_rate": 5.5249601523453446e-06, "loss": 2.3565, "step": 510070 }, { "epoch": 0.89, "learning_rate": 5.5240882124185175e-06, "loss": 2.2507, "step": 510080 }, { "epoch": 0.89, "learning_rate": 5.52321627249169e-06, "loss": 2.3677, "step": 510090 }, { "epoch": 0.89, "learning_rate": 5.522344332564864e-06, "loss": 2.2861, "step": 510100 }, { "epoch": 0.89, "learning_rate": 5.521472392638037e-06, "loss": 2.1411, "step": 510110 }, { "epoch": 0.89, "learning_rate": 5.52060045271121e-06, "loss": 2.1852, "step": 510120 }, { "epoch": 0.89, "learning_rate": 5.519728512784384e-06, "loss": 2.216, "step": 510130 }, { "epoch": 0.89, "learning_rate": 5.518856572857557e-06, "loss": 2.2152, "step": 510140 }, { "epoch": 0.89, "learning_rate": 5.51798463293073e-06, "loss": 2.1945, "step": 510150 }, { "epoch": 0.89, "learning_rate": 5.5171126930039026e-06, "loss": 2.2576, "step": 510160 }, { "epoch": 0.89, "learning_rate": 5.516240753077076e-06, "loss": 2.1602, "step": 510170 }, { "epoch": 0.89, "learning_rate": 5.515368813150249e-06, "loss": 2.2727, "step": 510180 }, { "epoch": 0.89, "learning_rate": 5.514496873223423e-06, "loss": 2.4091, "step": 510190 }, { "epoch": 0.89, "learning_rate": 5.513624933296596e-06, "loss": 2.4259, "step": 510200 }, { "epoch": 0.89, "learning_rate": 5.512752993369769e-06, "loss": 2.2588, "step": 510210 }, { "epoch": 0.89, "learning_rate": 5.511881053442943e-06, "loss": 2.2757, "step": 510220 }, { "epoch": 0.89, "learning_rate": 5.5110091135161156e-06, "loss": 2.2651, "step": 510230 }, { "epoch": 0.89, "learning_rate": 5.5101371735892885e-06, "loss": 2.2957, "step": 510240 }, { "epoch": 0.89, "learning_rate": 5.509265233662462e-06, "loss": 2.2636, "step": 510250 }, { "epoch": 0.89, "learning_rate": 5.508393293735635e-06, "loss": 2.3808, "step": 510260 }, { "epoch": 0.89, "learning_rate": 5.507521353808808e-06, "loss": 2.1696, "step": 510270 }, { "epoch": 0.89, "learning_rate": 5.506649413881981e-06, "loss": 2.4681, "step": 510280 }, { "epoch": 0.89, "learning_rate": 5.505777473955155e-06, "loss": 2.2999, "step": 510290 }, { "epoch": 0.89, "learning_rate": 5.504905534028328e-06, "loss": 2.3176, "step": 510300 }, { "epoch": 0.89, "learning_rate": 5.504033594101501e-06, "loss": 2.2589, "step": 510310 }, { "epoch": 0.89, "learning_rate": 5.503161654174674e-06, "loss": 2.1961, "step": 510320 }, { "epoch": 0.89, "learning_rate": 5.502289714247847e-06, "loss": 2.2342, "step": 510330 }, { "epoch": 0.89, "learning_rate": 5.501417774321021e-06, "loss": 2.2668, "step": 510340 }, { "epoch": 0.89, "learning_rate": 5.500545834394194e-06, "loss": 2.2841, "step": 510350 }, { "epoch": 0.89, "learning_rate": 5.499673894467367e-06, "loss": 2.2494, "step": 510360 }, { "epoch": 0.89, "learning_rate": 5.498801954540541e-06, "loss": 2.2685, "step": 510370 }, { "epoch": 0.89, "learning_rate": 5.497930014613714e-06, "loss": 2.2777, "step": 510380 }, { "epoch": 0.89, "learning_rate": 5.4970580746868866e-06, "loss": 2.246, "step": 510390 }, { "epoch": 0.89, "learning_rate": 5.4961861347600595e-06, "loss": 2.2426, "step": 510400 }, { "epoch": 0.89, "learning_rate": 5.495314194833233e-06, "loss": 2.2796, "step": 510410 }, { "epoch": 0.89, "learning_rate": 5.494442254906406e-06, "loss": 2.2836, "step": 510420 }, { "epoch": 0.89, "learning_rate": 5.493570314979579e-06, "loss": 2.1937, "step": 510430 }, { "epoch": 0.89, "learning_rate": 5.492698375052752e-06, "loss": 2.3509, "step": 510440 }, { "epoch": 0.89, "learning_rate": 5.491826435125926e-06, "loss": 2.3269, "step": 510450 }, { "epoch": 0.89, "learning_rate": 5.4909544951990996e-06, "loss": 2.2404, "step": 510460 }, { "epoch": 0.89, "learning_rate": 5.4900825552722725e-06, "loss": 2.3262, "step": 510470 }, { "epoch": 0.89, "learning_rate": 5.489210615345445e-06, "loss": 2.3424, "step": 510480 }, { "epoch": 0.89, "learning_rate": 5.488338675418619e-06, "loss": 2.2848, "step": 510490 }, { "epoch": 0.89, "learning_rate": 5.487466735491792e-06, "loss": 2.3122, "step": 510500 }, { "epoch": 0.89, "learning_rate": 5.486594795564965e-06, "loss": 2.2951, "step": 510510 }, { "epoch": 0.89, "learning_rate": 5.485722855638138e-06, "loss": 2.436, "step": 510520 }, { "epoch": 0.89, "learning_rate": 5.484850915711312e-06, "loss": 2.2551, "step": 510530 }, { "epoch": 0.89, "learning_rate": 5.483978975784485e-06, "loss": 2.3071, "step": 510540 }, { "epoch": 0.89, "learning_rate": 5.4831070358576576e-06, "loss": 2.2426, "step": 510550 }, { "epoch": 0.89, "learning_rate": 5.4822350959308305e-06, "loss": 2.2609, "step": 510560 }, { "epoch": 0.89, "learning_rate": 5.481363156004004e-06, "loss": 2.2851, "step": 510570 }, { "epoch": 0.89, "learning_rate": 5.480491216077177e-06, "loss": 2.3156, "step": 510580 }, { "epoch": 0.89, "learning_rate": 5.479619276150351e-06, "loss": 2.3329, "step": 510590 }, { "epoch": 0.89, "learning_rate": 5.478747336223524e-06, "loss": 2.2982, "step": 510600 }, { "epoch": 0.89, "learning_rate": 5.477875396296697e-06, "loss": 2.3496, "step": 510610 }, { "epoch": 0.89, "learning_rate": 5.4770034563698706e-06, "loss": 2.2336, "step": 510620 }, { "epoch": 0.89, "learning_rate": 5.4761315164430435e-06, "loss": 2.2675, "step": 510630 }, { "epoch": 0.89, "learning_rate": 5.475259576516216e-06, "loss": 2.3663, "step": 510640 }, { "epoch": 0.89, "learning_rate": 5.47438763658939e-06, "loss": 2.3795, "step": 510650 }, { "epoch": 0.89, "learning_rate": 5.473515696662563e-06, "loss": 2.233, "step": 510660 }, { "epoch": 0.89, "learning_rate": 5.472643756735736e-06, "loss": 2.1794, "step": 510670 }, { "epoch": 0.89, "learning_rate": 5.471771816808909e-06, "loss": 2.1895, "step": 510680 }, { "epoch": 0.89, "learning_rate": 5.470899876882083e-06, "loss": 2.2726, "step": 510690 }, { "epoch": 0.89, "learning_rate": 5.470027936955256e-06, "loss": 2.2078, "step": 510700 }, { "epoch": 0.89, "learning_rate": 5.4691559970284286e-06, "loss": 2.3125, "step": 510710 }, { "epoch": 0.89, "learning_rate": 5.468284057101602e-06, "loss": 2.1808, "step": 510720 }, { "epoch": 0.89, "learning_rate": 5.467412117174775e-06, "loss": 2.264, "step": 510730 }, { "epoch": 0.89, "learning_rate": 5.466540177247949e-06, "loss": 2.3058, "step": 510740 }, { "epoch": 0.89, "learning_rate": 5.465668237321122e-06, "loss": 2.2239, "step": 510750 }, { "epoch": 0.89, "learning_rate": 5.464796297394295e-06, "loss": 2.2397, "step": 510760 }, { "epoch": 0.89, "learning_rate": 5.463924357467469e-06, "loss": 2.2723, "step": 510770 }, { "epoch": 0.89, "learning_rate": 5.4630524175406416e-06, "loss": 2.3224, "step": 510780 }, { "epoch": 0.89, "learning_rate": 5.4621804776138145e-06, "loss": 2.238, "step": 510790 }, { "epoch": 0.89, "learning_rate": 5.461308537686987e-06, "loss": 2.2611, "step": 510800 }, { "epoch": 0.89, "learning_rate": 5.460436597760161e-06, "loss": 2.1392, "step": 510810 }, { "epoch": 0.89, "learning_rate": 5.459564657833334e-06, "loss": 2.3178, "step": 510820 }, { "epoch": 0.89, "learning_rate": 5.458692717906507e-06, "loss": 2.2393, "step": 510830 }, { "epoch": 0.89, "learning_rate": 5.45782077797968e-06, "loss": 2.2603, "step": 510840 }, { "epoch": 0.89, "learning_rate": 5.456948838052854e-06, "loss": 2.3749, "step": 510850 }, { "epoch": 0.89, "learning_rate": 5.4560768981260275e-06, "loss": 2.2313, "step": 510860 }, { "epoch": 0.89, "learning_rate": 5.4552049581992e-06, "loss": 2.2373, "step": 510870 }, { "epoch": 0.89, "learning_rate": 5.454333018272373e-06, "loss": 2.2272, "step": 510880 }, { "epoch": 0.89, "learning_rate": 5.453461078345547e-06, "loss": 2.2774, "step": 510890 }, { "epoch": 0.89, "learning_rate": 5.45258913841872e-06, "loss": 2.283, "step": 510900 }, { "epoch": 0.89, "learning_rate": 5.451717198491893e-06, "loss": 2.2939, "step": 510910 }, { "epoch": 0.89, "learning_rate": 5.450845258565066e-06, "loss": 2.2598, "step": 510920 }, { "epoch": 0.89, "learning_rate": 5.44997331863824e-06, "loss": 2.221, "step": 510930 }, { "epoch": 0.89, "learning_rate": 5.4491013787114126e-06, "loss": 2.1936, "step": 510940 }, { "epoch": 0.89, "learning_rate": 5.4482294387845855e-06, "loss": 2.1843, "step": 510950 }, { "epoch": 0.89, "learning_rate": 5.447357498857758e-06, "loss": 2.1677, "step": 510960 }, { "epoch": 0.89, "learning_rate": 5.446485558930932e-06, "loss": 2.2848, "step": 510970 }, { "epoch": 0.89, "learning_rate": 5.445613619004105e-06, "loss": 2.3419, "step": 510980 }, { "epoch": 0.89, "learning_rate": 5.444741679077279e-06, "loss": 2.1729, "step": 510990 }, { "epoch": 0.89, "learning_rate": 5.443869739150452e-06, "loss": 2.2758, "step": 511000 }, { "epoch": 0.89, "learning_rate": 5.4429977992236256e-06, "loss": 2.1078, "step": 511010 }, { "epoch": 0.89, "learning_rate": 5.4421258592967985e-06, "loss": 2.1945, "step": 511020 }, { "epoch": 0.89, "learning_rate": 5.441253919369971e-06, "loss": 2.1896, "step": 511030 }, { "epoch": 0.89, "learning_rate": 5.440381979443144e-06, "loss": 2.2856, "step": 511040 }, { "epoch": 0.89, "learning_rate": 5.439510039516318e-06, "loss": 2.2946, "step": 511050 }, { "epoch": 0.89, "learning_rate": 5.438638099589491e-06, "loss": 2.258, "step": 511060 }, { "epoch": 0.89, "learning_rate": 5.437766159662664e-06, "loss": 2.2819, "step": 511070 }, { "epoch": 0.89, "learning_rate": 5.436894219735837e-06, "loss": 2.2698, "step": 511080 }, { "epoch": 0.89, "learning_rate": 5.436022279809011e-06, "loss": 2.1662, "step": 511090 }, { "epoch": 0.89, "learning_rate": 5.4351503398821836e-06, "loss": 2.3341, "step": 511100 }, { "epoch": 0.89, "learning_rate": 5.4342783999553565e-06, "loss": 2.2918, "step": 511110 }, { "epoch": 0.89, "learning_rate": 5.43340646002853e-06, "loss": 2.3677, "step": 511120 }, { "epoch": 0.89, "learning_rate": 5.432534520101703e-06, "loss": 2.1571, "step": 511130 }, { "epoch": 0.89, "learning_rate": 5.431662580174877e-06, "loss": 2.2662, "step": 511140 }, { "epoch": 0.89, "learning_rate": 5.43079064024805e-06, "loss": 2.3866, "step": 511150 }, { "epoch": 0.89, "learning_rate": 5.429918700321223e-06, "loss": 2.2723, "step": 511160 }, { "epoch": 0.89, "learning_rate": 5.4290467603943966e-06, "loss": 2.3294, "step": 511170 }, { "epoch": 0.89, "learning_rate": 5.4281748204675695e-06, "loss": 2.3692, "step": 511180 }, { "epoch": 0.89, "learning_rate": 5.427302880540742e-06, "loss": 2.3073, "step": 511190 }, { "epoch": 0.89, "learning_rate": 5.426430940613915e-06, "loss": 2.2144, "step": 511200 }, { "epoch": 0.89, "learning_rate": 5.425559000687089e-06, "loss": 2.3322, "step": 511210 }, { "epoch": 0.89, "learning_rate": 5.424687060760262e-06, "loss": 2.302, "step": 511220 }, { "epoch": 0.89, "learning_rate": 5.423815120833435e-06, "loss": 2.2616, "step": 511230 }, { "epoch": 0.89, "learning_rate": 5.422943180906608e-06, "loss": 2.2938, "step": 511240 }, { "epoch": 0.89, "learning_rate": 5.422071240979782e-06, "loss": 2.2663, "step": 511250 }, { "epoch": 0.89, "learning_rate": 5.421199301052955e-06, "loss": 2.224, "step": 511260 }, { "epoch": 0.89, "learning_rate": 5.420327361126128e-06, "loss": 2.2447, "step": 511270 }, { "epoch": 0.89, "learning_rate": 5.419455421199301e-06, "loss": 2.2854, "step": 511280 }, { "epoch": 0.89, "learning_rate": 5.418583481272475e-06, "loss": 2.1463, "step": 511290 }, { "epoch": 0.89, "learning_rate": 5.417711541345648e-06, "loss": 2.2236, "step": 511300 }, { "epoch": 0.89, "learning_rate": 5.416839601418821e-06, "loss": 2.2563, "step": 511310 }, { "epoch": 0.89, "learning_rate": 5.415967661491994e-06, "loss": 2.2948, "step": 511320 }, { "epoch": 0.89, "learning_rate": 5.4150957215651676e-06, "loss": 2.2942, "step": 511330 }, { "epoch": 0.89, "learning_rate": 5.4142237816383405e-06, "loss": 2.2339, "step": 511340 }, { "epoch": 0.89, "learning_rate": 5.413351841711513e-06, "loss": 2.2539, "step": 511350 }, { "epoch": 0.89, "learning_rate": 5.412479901784686e-06, "loss": 2.1802, "step": 511360 }, { "epoch": 0.89, "learning_rate": 5.41160796185786e-06, "loss": 2.4136, "step": 511370 }, { "epoch": 0.89, "learning_rate": 5.410736021931033e-06, "loss": 2.3511, "step": 511380 }, { "epoch": 0.89, "learning_rate": 5.409864082004207e-06, "loss": 2.3067, "step": 511390 }, { "epoch": 0.89, "learning_rate": 5.40899214207738e-06, "loss": 2.124, "step": 511400 }, { "epoch": 0.89, "learning_rate": 5.4081202021505535e-06, "loss": 2.2015, "step": 511410 }, { "epoch": 0.89, "learning_rate": 5.407248262223726e-06, "loss": 2.3994, "step": 511420 }, { "epoch": 0.89, "learning_rate": 5.406376322296899e-06, "loss": 2.3992, "step": 511430 }, { "epoch": 0.89, "learning_rate": 5.405504382370072e-06, "loss": 2.3409, "step": 511440 }, { "epoch": 0.89, "learning_rate": 5.404632442443246e-06, "loss": 2.1062, "step": 511450 }, { "epoch": 0.89, "learning_rate": 5.403760502516419e-06, "loss": 2.3719, "step": 511460 }, { "epoch": 0.89, "learning_rate": 5.402888562589592e-06, "loss": 2.1949, "step": 511470 }, { "epoch": 0.89, "learning_rate": 5.402016622662765e-06, "loss": 2.2991, "step": 511480 }, { "epoch": 0.89, "learning_rate": 5.4011446827359386e-06, "loss": 2.2542, "step": 511490 }, { "epoch": 0.89, "learning_rate": 5.4002727428091115e-06, "loss": 2.1685, "step": 511500 }, { "epoch": 0.89, "learning_rate": 5.399400802882284e-06, "loss": 2.2354, "step": 511510 }, { "epoch": 0.89, "learning_rate": 5.398528862955458e-06, "loss": 2.3169, "step": 511520 }, { "epoch": 0.89, "learning_rate": 5.397656923028632e-06, "loss": 2.2275, "step": 511530 }, { "epoch": 0.89, "learning_rate": 5.396784983101805e-06, "loss": 2.2645, "step": 511540 }, { "epoch": 0.89, "learning_rate": 5.395913043174978e-06, "loss": 2.2077, "step": 511550 }, { "epoch": 0.89, "learning_rate": 5.395041103248151e-06, "loss": 2.1074, "step": 511560 }, { "epoch": 0.89, "learning_rate": 5.3941691633213245e-06, "loss": 2.1995, "step": 511570 }, { "epoch": 0.89, "learning_rate": 5.393297223394497e-06, "loss": 2.2277, "step": 511580 }, { "epoch": 0.89, "learning_rate": 5.39242528346767e-06, "loss": 2.3782, "step": 511590 }, { "epoch": 0.89, "learning_rate": 5.391553343540843e-06, "loss": 2.2061, "step": 511600 }, { "epoch": 0.89, "learning_rate": 5.390681403614017e-06, "loss": 2.1489, "step": 511610 }, { "epoch": 0.89, "learning_rate": 5.38980946368719e-06, "loss": 2.2483, "step": 511620 }, { "epoch": 0.89, "learning_rate": 5.388937523760363e-06, "loss": 2.2349, "step": 511630 }, { "epoch": 0.89, "learning_rate": 5.388065583833536e-06, "loss": 2.24, "step": 511640 }, { "epoch": 0.89, "learning_rate": 5.3871936439067096e-06, "loss": 2.3654, "step": 511650 }, { "epoch": 0.89, "learning_rate": 5.386321703979883e-06, "loss": 2.2811, "step": 511660 }, { "epoch": 0.89, "learning_rate": 5.385449764053056e-06, "loss": 2.2968, "step": 511670 }, { "epoch": 0.89, "learning_rate": 5.384577824126229e-06, "loss": 2.2853, "step": 511680 }, { "epoch": 0.89, "learning_rate": 5.383705884199403e-06, "loss": 2.2684, "step": 511690 }, { "epoch": 0.89, "learning_rate": 5.382833944272576e-06, "loss": 2.2308, "step": 511700 }, { "epoch": 0.89, "learning_rate": 5.381962004345749e-06, "loss": 2.2383, "step": 511710 }, { "epoch": 0.89, "learning_rate": 5.381090064418922e-06, "loss": 2.2661, "step": 511720 }, { "epoch": 0.89, "learning_rate": 5.3802181244920955e-06, "loss": 2.3197, "step": 511730 }, { "epoch": 0.89, "learning_rate": 5.379346184565268e-06, "loss": 2.2325, "step": 511740 }, { "epoch": 0.89, "learning_rate": 5.378474244638441e-06, "loss": 2.302, "step": 511750 }, { "epoch": 0.89, "learning_rate": 5.377602304711614e-06, "loss": 2.27, "step": 511760 }, { "epoch": 0.89, "learning_rate": 5.376730364784788e-06, "loss": 2.2423, "step": 511770 }, { "epoch": 0.89, "learning_rate": 5.375858424857961e-06, "loss": 2.2773, "step": 511780 }, { "epoch": 0.89, "learning_rate": 5.374986484931135e-06, "loss": 2.2993, "step": 511790 }, { "epoch": 0.89, "learning_rate": 5.374114545004308e-06, "loss": 2.3681, "step": 511800 }, { "epoch": 0.89, "learning_rate": 5.373242605077481e-06, "loss": 2.3318, "step": 511810 }, { "epoch": 0.89, "learning_rate": 5.372370665150654e-06, "loss": 2.2256, "step": 511820 }, { "epoch": 0.89, "learning_rate": 5.371498725223827e-06, "loss": 2.156, "step": 511830 }, { "epoch": 0.89, "learning_rate": 5.370626785297e-06, "loss": 2.2427, "step": 511840 }, { "epoch": 0.89, "learning_rate": 5.369754845370174e-06, "loss": 2.2281, "step": 511850 }, { "epoch": 0.89, "learning_rate": 5.368882905443347e-06, "loss": 2.3782, "step": 511860 }, { "epoch": 0.89, "learning_rate": 5.36801096551652e-06, "loss": 2.3052, "step": 511870 }, { "epoch": 0.89, "learning_rate": 5.367139025589693e-06, "loss": 2.2224, "step": 511880 }, { "epoch": 0.89, "learning_rate": 5.3662670856628665e-06, "loss": 2.2821, "step": 511890 }, { "epoch": 0.89, "learning_rate": 5.365395145736039e-06, "loss": 2.1424, "step": 511900 }, { "epoch": 0.89, "learning_rate": 5.364523205809212e-06, "loss": 2.293, "step": 511910 }, { "epoch": 0.89, "learning_rate": 5.363651265882386e-06, "loss": 2.2403, "step": 511920 }, { "epoch": 0.89, "learning_rate": 5.36277932595556e-06, "loss": 2.3008, "step": 511930 }, { "epoch": 0.89, "learning_rate": 5.361907386028733e-06, "loss": 2.2682, "step": 511940 }, { "epoch": 0.89, "learning_rate": 5.361035446101906e-06, "loss": 2.2489, "step": 511950 }, { "epoch": 0.89, "learning_rate": 5.360163506175079e-06, "loss": 2.2857, "step": 511960 }, { "epoch": 0.89, "learning_rate": 5.3592915662482524e-06, "loss": 2.1506, "step": 511970 }, { "epoch": 0.89, "learning_rate": 5.358419626321425e-06, "loss": 2.2695, "step": 511980 }, { "epoch": 0.89, "learning_rate": 5.357547686394598e-06, "loss": 2.2661, "step": 511990 }, { "epoch": 0.89, "learning_rate": 5.356675746467771e-06, "loss": 2.2549, "step": 512000 }, { "epoch": 0.89, "learning_rate": 5.355803806540945e-06, "loss": 2.2187, "step": 512010 }, { "epoch": 0.89, "learning_rate": 5.354931866614118e-06, "loss": 2.27, "step": 512020 }, { "epoch": 0.89, "learning_rate": 5.354059926687291e-06, "loss": 2.306, "step": 512030 }, { "epoch": 0.89, "learning_rate": 5.353187986760464e-06, "loss": 2.2194, "step": 512040 }, { "epoch": 0.89, "learning_rate": 5.352316046833638e-06, "loss": 2.3538, "step": 512050 }, { "epoch": 0.89, "learning_rate": 5.351444106906811e-06, "loss": 2.3239, "step": 512060 }, { "epoch": 0.89, "learning_rate": 5.350572166979984e-06, "loss": 2.3953, "step": 512070 }, { "epoch": 0.89, "learning_rate": 5.349700227053157e-06, "loss": 2.2457, "step": 512080 }, { "epoch": 0.89, "learning_rate": 5.348828287126331e-06, "loss": 2.2872, "step": 512090 }, { "epoch": 0.89, "learning_rate": 5.347956347199504e-06, "loss": 2.299, "step": 512100 }, { "epoch": 0.89, "learning_rate": 5.347084407272677e-06, "loss": 2.1982, "step": 512110 }, { "epoch": 0.89, "learning_rate": 5.34621246734585e-06, "loss": 2.3518, "step": 512120 }, { "epoch": 0.89, "learning_rate": 5.3453405274190234e-06, "loss": 2.2571, "step": 512130 }, { "epoch": 0.89, "learning_rate": 5.344468587492196e-06, "loss": 2.1696, "step": 512140 }, { "epoch": 0.89, "learning_rate": 5.343596647565369e-06, "loss": 2.2993, "step": 512150 }, { "epoch": 0.89, "learning_rate": 5.342724707638542e-06, "loss": 2.2531, "step": 512160 }, { "epoch": 0.89, "learning_rate": 5.341852767711716e-06, "loss": 2.2456, "step": 512170 }, { "epoch": 0.89, "learning_rate": 5.34098082778489e-06, "loss": 2.2739, "step": 512180 }, { "epoch": 0.89, "learning_rate": 5.340108887858063e-06, "loss": 2.2563, "step": 512190 }, { "epoch": 0.89, "learning_rate": 5.339236947931236e-06, "loss": 2.2973, "step": 512200 }, { "epoch": 0.89, "learning_rate": 5.338365008004409e-06, "loss": 2.351, "step": 512210 }, { "epoch": 0.89, "learning_rate": 5.337493068077582e-06, "loss": 2.3167, "step": 512220 }, { "epoch": 0.89, "learning_rate": 5.336621128150755e-06, "loss": 2.3529, "step": 512230 }, { "epoch": 0.89, "learning_rate": 5.335749188223928e-06, "loss": 2.3235, "step": 512240 }, { "epoch": 0.89, "learning_rate": 5.334877248297102e-06, "loss": 2.3297, "step": 512250 }, { "epoch": 0.89, "learning_rate": 5.334005308370275e-06, "loss": 2.2412, "step": 512260 }, { "epoch": 0.89, "learning_rate": 5.333133368443448e-06, "loss": 2.3433, "step": 512270 }, { "epoch": 0.89, "learning_rate": 5.332261428516621e-06, "loss": 2.3544, "step": 512280 }, { "epoch": 0.89, "learning_rate": 5.3313894885897944e-06, "loss": 2.2506, "step": 512290 }, { "epoch": 0.89, "learning_rate": 5.330517548662967e-06, "loss": 2.2883, "step": 512300 }, { "epoch": 0.89, "learning_rate": 5.32964560873614e-06, "loss": 2.4513, "step": 512310 }, { "epoch": 0.89, "learning_rate": 5.328773668809314e-06, "loss": 2.1872, "step": 512320 }, { "epoch": 0.89, "learning_rate": 5.327901728882488e-06, "loss": 2.274, "step": 512330 }, { "epoch": 0.89, "learning_rate": 5.327029788955661e-06, "loss": 2.2684, "step": 512340 }, { "epoch": 0.89, "learning_rate": 5.326157849028834e-06, "loss": 2.2136, "step": 512350 }, { "epoch": 0.89, "learning_rate": 5.325285909102007e-06, "loss": 2.2834, "step": 512360 }, { "epoch": 0.89, "learning_rate": 5.32441396917518e-06, "loss": 2.2629, "step": 512370 }, { "epoch": 0.89, "learning_rate": 5.323542029248353e-06, "loss": 2.2922, "step": 512380 }, { "epoch": 0.89, "learning_rate": 5.322670089321526e-06, "loss": 2.2504, "step": 512390 }, { "epoch": 0.89, "learning_rate": 5.321798149394699e-06, "loss": 2.2566, "step": 512400 }, { "epoch": 0.89, "learning_rate": 5.320926209467873e-06, "loss": 2.2666, "step": 512410 }, { "epoch": 0.89, "learning_rate": 5.320054269541046e-06, "loss": 2.2112, "step": 512420 }, { "epoch": 0.89, "learning_rate": 5.319182329614219e-06, "loss": 2.2987, "step": 512430 }, { "epoch": 0.89, "learning_rate": 5.318310389687392e-06, "loss": 2.2448, "step": 512440 }, { "epoch": 0.89, "learning_rate": 5.317438449760566e-06, "loss": 2.4219, "step": 512450 }, { "epoch": 0.89, "learning_rate": 5.316566509833739e-06, "loss": 2.3049, "step": 512460 }, { "epoch": 0.89, "learning_rate": 5.315694569906912e-06, "loss": 2.0955, "step": 512470 }, { "epoch": 0.89, "learning_rate": 5.314822629980085e-06, "loss": 2.2934, "step": 512480 }, { "epoch": 0.89, "learning_rate": 5.313950690053259e-06, "loss": 2.2965, "step": 512490 }, { "epoch": 0.89, "learning_rate": 5.313078750126432e-06, "loss": 2.2089, "step": 512500 }, { "epoch": 0.89, "learning_rate": 5.312206810199605e-06, "loss": 2.2439, "step": 512510 }, { "epoch": 0.89, "learning_rate": 5.311334870272778e-06, "loss": 2.1566, "step": 512520 }, { "epoch": 0.89, "learning_rate": 5.310462930345951e-06, "loss": 2.2268, "step": 512530 }, { "epoch": 0.89, "learning_rate": 5.309590990419124e-06, "loss": 2.2544, "step": 512540 }, { "epoch": 0.89, "learning_rate": 5.308719050492297e-06, "loss": 2.3779, "step": 512550 }, { "epoch": 0.89, "learning_rate": 5.30784711056547e-06, "loss": 2.2076, "step": 512560 }, { "epoch": 0.89, "learning_rate": 5.306975170638644e-06, "loss": 2.1645, "step": 512570 }, { "epoch": 0.89, "learning_rate": 5.306103230711818e-06, "loss": 2.3083, "step": 512580 }, { "epoch": 0.89, "learning_rate": 5.305231290784991e-06, "loss": 2.3269, "step": 512590 }, { "epoch": 0.89, "learning_rate": 5.3043593508581635e-06, "loss": 2.2693, "step": 512600 }, { "epoch": 0.89, "learning_rate": 5.303487410931337e-06, "loss": 2.2745, "step": 512610 }, { "epoch": 0.89, "learning_rate": 5.30261547100451e-06, "loss": 2.4016, "step": 512620 }, { "epoch": 0.89, "learning_rate": 5.301743531077683e-06, "loss": 2.2593, "step": 512630 }, { "epoch": 0.89, "learning_rate": 5.300871591150856e-06, "loss": 2.2923, "step": 512640 }, { "epoch": 0.89, "learning_rate": 5.29999965122403e-06, "loss": 2.1238, "step": 512650 }, { "epoch": 0.89, "learning_rate": 5.299127711297203e-06, "loss": 2.2287, "step": 512660 }, { "epoch": 0.89, "learning_rate": 5.298255771370376e-06, "loss": 2.3338, "step": 512670 }, { "epoch": 0.89, "learning_rate": 5.297383831443549e-06, "loss": 2.3479, "step": 512680 }, { "epoch": 0.89, "learning_rate": 5.296511891516722e-06, "loss": 2.2157, "step": 512690 }, { "epoch": 0.89, "learning_rate": 5.295639951589895e-06, "loss": 2.3302, "step": 512700 }, { "epoch": 0.89, "learning_rate": 5.294768011663068e-06, "loss": 2.2426, "step": 512710 }, { "epoch": 0.89, "learning_rate": 5.293896071736242e-06, "loss": 2.2872, "step": 512720 }, { "epoch": 0.89, "learning_rate": 5.293024131809416e-06, "loss": 2.3373, "step": 512730 }, { "epoch": 0.89, "learning_rate": 5.292152191882589e-06, "loss": 2.2322, "step": 512740 }, { "epoch": 0.89, "learning_rate": 5.291280251955762e-06, "loss": 2.3059, "step": 512750 }, { "epoch": 0.89, "learning_rate": 5.2904083120289345e-06, "loss": 2.3434, "step": 512760 }, { "epoch": 0.89, "learning_rate": 5.289536372102108e-06, "loss": 2.322, "step": 512770 }, { "epoch": 0.89, "learning_rate": 5.288664432175281e-06, "loss": 2.2284, "step": 512780 }, { "epoch": 0.89, "learning_rate": 5.287792492248454e-06, "loss": 2.1309, "step": 512790 }, { "epoch": 0.89, "learning_rate": 5.286920552321627e-06, "loss": 2.2271, "step": 512800 }, { "epoch": 0.89, "learning_rate": 5.286048612394801e-06, "loss": 2.344, "step": 512810 }, { "epoch": 0.89, "learning_rate": 5.285176672467974e-06, "loss": 2.2979, "step": 512820 }, { "epoch": 0.89, "learning_rate": 5.284304732541147e-06, "loss": 2.1304, "step": 512830 }, { "epoch": 0.89, "learning_rate": 5.28343279261432e-06, "loss": 2.3161, "step": 512840 }, { "epoch": 0.89, "learning_rate": 5.282560852687494e-06, "loss": 2.1802, "step": 512850 }, { "epoch": 0.89, "learning_rate": 5.281688912760667e-06, "loss": 2.3718, "step": 512860 }, { "epoch": 0.89, "learning_rate": 5.28081697283384e-06, "loss": 2.2452, "step": 512870 }, { "epoch": 0.89, "learning_rate": 5.279945032907013e-06, "loss": 2.315, "step": 512880 }, { "epoch": 0.89, "learning_rate": 5.279073092980187e-06, "loss": 2.2408, "step": 512890 }, { "epoch": 0.89, "learning_rate": 5.27820115305336e-06, "loss": 2.246, "step": 512900 }, { "epoch": 0.89, "learning_rate": 5.277329213126533e-06, "loss": 2.1831, "step": 512910 }, { "epoch": 0.89, "learning_rate": 5.2764572731997055e-06, "loss": 2.2811, "step": 512920 }, { "epoch": 0.89, "learning_rate": 5.275585333272879e-06, "loss": 2.2394, "step": 512930 }, { "epoch": 0.89, "learning_rate": 5.274713393346052e-06, "loss": 2.3966, "step": 512940 }, { "epoch": 0.89, "learning_rate": 5.273841453419225e-06, "loss": 2.2805, "step": 512950 }, { "epoch": 0.89, "learning_rate": 5.272969513492398e-06, "loss": 2.446, "step": 512960 }, { "epoch": 0.89, "learning_rate": 5.272097573565572e-06, "loss": 2.2132, "step": 512970 }, { "epoch": 0.89, "learning_rate": 5.271225633638746e-06, "loss": 2.3732, "step": 512980 }, { "epoch": 0.89, "learning_rate": 5.2703536937119185e-06, "loss": 2.2326, "step": 512990 }, { "epoch": 0.89, "learning_rate": 5.2694817537850914e-06, "loss": 2.2309, "step": 513000 }, { "epoch": 0.89, "learning_rate": 5.268609813858265e-06, "loss": 2.1917, "step": 513010 }, { "epoch": 0.89, "learning_rate": 5.267737873931438e-06, "loss": 2.2397, "step": 513020 }, { "epoch": 0.89, "learning_rate": 5.266865934004611e-06, "loss": 2.3611, "step": 513030 }, { "epoch": 0.89, "learning_rate": 5.265993994077784e-06, "loss": 2.2185, "step": 513040 }, { "epoch": 0.89, "learning_rate": 5.265122054150958e-06, "loss": 2.2885, "step": 513050 }, { "epoch": 0.89, "learning_rate": 5.264250114224131e-06, "loss": 2.2926, "step": 513060 }, { "epoch": 0.89, "learning_rate": 5.263378174297304e-06, "loss": 2.2783, "step": 513070 }, { "epoch": 0.89, "learning_rate": 5.2625062343704765e-06, "loss": 2.3394, "step": 513080 }, { "epoch": 0.89, "learning_rate": 5.26163429444365e-06, "loss": 2.2252, "step": 513090 }, { "epoch": 0.89, "learning_rate": 5.260762354516823e-06, "loss": 2.2015, "step": 513100 }, { "epoch": 0.89, "learning_rate": 5.259890414589996e-06, "loss": 2.3232, "step": 513110 }, { "epoch": 0.89, "learning_rate": 5.25901847466317e-06, "loss": 2.2167, "step": 513120 }, { "epoch": 0.89, "learning_rate": 5.258146534736344e-06, "loss": 2.3465, "step": 513130 }, { "epoch": 0.89, "learning_rate": 5.257274594809517e-06, "loss": 2.2193, "step": 513140 }, { "epoch": 0.89, "learning_rate": 5.2564026548826895e-06, "loss": 2.2969, "step": 513150 }, { "epoch": 0.89, "learning_rate": 5.2555307149558624e-06, "loss": 2.3211, "step": 513160 }, { "epoch": 0.89, "learning_rate": 5.254658775029036e-06, "loss": 2.1609, "step": 513170 }, { "epoch": 0.89, "learning_rate": 5.253786835102209e-06, "loss": 2.3062, "step": 513180 }, { "epoch": 0.89, "learning_rate": 5.252914895175382e-06, "loss": 2.1905, "step": 513190 }, { "epoch": 0.89, "learning_rate": 5.252042955248555e-06, "loss": 2.2434, "step": 513200 }, { "epoch": 0.89, "learning_rate": 5.251171015321729e-06, "loss": 2.2633, "step": 513210 }, { "epoch": 0.89, "learning_rate": 5.250299075394902e-06, "loss": 2.2319, "step": 513220 }, { "epoch": 0.9, "learning_rate": 5.249427135468075e-06, "loss": 2.2493, "step": 513230 }, { "epoch": 0.9, "learning_rate": 5.2485551955412475e-06, "loss": 2.2346, "step": 513240 }, { "epoch": 0.9, "learning_rate": 5.247683255614422e-06, "loss": 2.2032, "step": 513250 }, { "epoch": 0.9, "learning_rate": 5.246811315687595e-06, "loss": 2.1809, "step": 513260 }, { "epoch": 0.9, "learning_rate": 5.245939375760768e-06, "loss": 2.2361, "step": 513270 }, { "epoch": 0.9, "learning_rate": 5.245067435833941e-06, "loss": 2.2075, "step": 513280 }, { "epoch": 0.9, "learning_rate": 5.244195495907115e-06, "loss": 2.313, "step": 513290 }, { "epoch": 0.9, "learning_rate": 5.243323555980288e-06, "loss": 2.2252, "step": 513300 }, { "epoch": 0.9, "learning_rate": 5.2424516160534605e-06, "loss": 2.2204, "step": 513310 }, { "epoch": 0.9, "learning_rate": 5.2415796761266334e-06, "loss": 2.3906, "step": 513320 }, { "epoch": 0.9, "learning_rate": 5.240707736199807e-06, "loss": 2.18, "step": 513330 }, { "epoch": 0.9, "learning_rate": 5.23983579627298e-06, "loss": 2.3192, "step": 513340 }, { "epoch": 0.9, "learning_rate": 5.238963856346153e-06, "loss": 2.3066, "step": 513350 }, { "epoch": 0.9, "learning_rate": 5.238091916419326e-06, "loss": 2.2329, "step": 513360 }, { "epoch": 0.9, "learning_rate": 5.2372199764925e-06, "loss": 2.2315, "step": 513370 }, { "epoch": 0.9, "learning_rate": 5.2363480365656735e-06, "loss": 2.2982, "step": 513380 }, { "epoch": 0.9, "learning_rate": 5.2354760966388464e-06, "loss": 2.2814, "step": 513390 }, { "epoch": 0.9, "learning_rate": 5.234604156712019e-06, "loss": 2.2339, "step": 513400 }, { "epoch": 0.9, "learning_rate": 5.233732216785193e-06, "loss": 2.2323, "step": 513410 }, { "epoch": 0.9, "learning_rate": 5.232860276858366e-06, "loss": 2.1848, "step": 513420 }, { "epoch": 0.9, "learning_rate": 5.231988336931539e-06, "loss": 2.2788, "step": 513430 }, { "epoch": 0.9, "learning_rate": 5.231116397004712e-06, "loss": 2.2934, "step": 513440 }, { "epoch": 0.9, "learning_rate": 5.230244457077886e-06, "loss": 2.2143, "step": 513450 }, { "epoch": 0.9, "learning_rate": 5.229372517151059e-06, "loss": 2.2688, "step": 513460 }, { "epoch": 0.9, "learning_rate": 5.2285005772242315e-06, "loss": 2.19, "step": 513470 }, { "epoch": 0.9, "learning_rate": 5.2276286372974044e-06, "loss": 2.3097, "step": 513480 }, { "epoch": 0.9, "learning_rate": 5.226756697370578e-06, "loss": 2.2913, "step": 513490 }, { "epoch": 0.9, "learning_rate": 5.225884757443751e-06, "loss": 2.3146, "step": 513500 }, { "epoch": 0.9, "learning_rate": 5.225012817516924e-06, "loss": 2.2467, "step": 513510 }, { "epoch": 0.9, "learning_rate": 5.224140877590098e-06, "loss": 2.3027, "step": 513520 }, { "epoch": 0.9, "learning_rate": 5.223268937663272e-06, "loss": 2.2686, "step": 513530 }, { "epoch": 0.9, "learning_rate": 5.2223969977364445e-06, "loss": 2.2298, "step": 513540 }, { "epoch": 0.9, "learning_rate": 5.2215250578096174e-06, "loss": 2.3097, "step": 513550 }, { "epoch": 0.9, "learning_rate": 5.22065311788279e-06, "loss": 2.2786, "step": 513560 }, { "epoch": 0.9, "learning_rate": 5.219781177955964e-06, "loss": 2.2232, "step": 513570 }, { "epoch": 0.9, "learning_rate": 5.218909238029137e-06, "loss": 2.2427, "step": 513580 }, { "epoch": 0.9, "learning_rate": 5.21803729810231e-06, "loss": 2.2906, "step": 513590 }, { "epoch": 0.9, "learning_rate": 5.217165358175483e-06, "loss": 2.2631, "step": 513600 }, { "epoch": 0.9, "learning_rate": 5.216293418248657e-06, "loss": 2.2727, "step": 513610 }, { "epoch": 0.9, "learning_rate": 5.21542147832183e-06, "loss": 2.2733, "step": 513620 }, { "epoch": 0.9, "learning_rate": 5.2145495383950025e-06, "loss": 2.205, "step": 513630 }, { "epoch": 0.9, "learning_rate": 5.2136775984681754e-06, "loss": 2.2376, "step": 513640 }, { "epoch": 0.9, "learning_rate": 5.21280565854135e-06, "loss": 2.2815, "step": 513650 }, { "epoch": 0.9, "learning_rate": 5.211933718614523e-06, "loss": 2.2405, "step": 513660 }, { "epoch": 0.9, "learning_rate": 5.211061778687696e-06, "loss": 2.2366, "step": 513670 }, { "epoch": 0.9, "learning_rate": 5.210189838760869e-06, "loss": 2.3076, "step": 513680 }, { "epoch": 0.9, "learning_rate": 5.209317898834043e-06, "loss": 2.3428, "step": 513690 }, { "epoch": 0.9, "learning_rate": 5.2084459589072155e-06, "loss": 2.2164, "step": 513700 }, { "epoch": 0.9, "learning_rate": 5.2075740189803884e-06, "loss": 2.2783, "step": 513710 }, { "epoch": 0.9, "learning_rate": 5.206702079053561e-06, "loss": 2.2364, "step": 513720 }, { "epoch": 0.9, "learning_rate": 5.205830139126735e-06, "loss": 2.2361, "step": 513730 }, { "epoch": 0.9, "learning_rate": 5.204958199199908e-06, "loss": 2.2871, "step": 513740 }, { "epoch": 0.9, "learning_rate": 5.204086259273081e-06, "loss": 2.2327, "step": 513750 }, { "epoch": 0.9, "learning_rate": 5.203214319346254e-06, "loss": 2.2165, "step": 513760 }, { "epoch": 0.9, "learning_rate": 5.202342379419428e-06, "loss": 2.2321, "step": 513770 }, { "epoch": 0.9, "learning_rate": 5.2014704394926014e-06, "loss": 2.3313, "step": 513780 }, { "epoch": 0.9, "learning_rate": 5.200598499565774e-06, "loss": 2.2406, "step": 513790 }, { "epoch": 0.9, "learning_rate": 5.199726559638947e-06, "loss": 2.3602, "step": 513800 }, { "epoch": 0.9, "learning_rate": 5.198854619712121e-06, "loss": 2.2617, "step": 513810 }, { "epoch": 0.9, "learning_rate": 5.197982679785294e-06, "loss": 2.279, "step": 513820 }, { "epoch": 0.9, "learning_rate": 5.197110739858467e-06, "loss": 2.2192, "step": 513830 }, { "epoch": 0.9, "learning_rate": 5.19623879993164e-06, "loss": 2.3324, "step": 513840 }, { "epoch": 0.9, "learning_rate": 5.195366860004814e-06, "loss": 2.1915, "step": 513850 }, { "epoch": 0.9, "learning_rate": 5.1944949200779865e-06, "loss": 2.1952, "step": 513860 }, { "epoch": 0.9, "learning_rate": 5.1936229801511594e-06, "loss": 2.3669, "step": 513870 }, { "epoch": 0.9, "learning_rate": 5.192751040224332e-06, "loss": 2.2627, "step": 513880 }, { "epoch": 0.9, "learning_rate": 5.191879100297506e-06, "loss": 2.2434, "step": 513890 }, { "epoch": 0.9, "learning_rate": 5.191007160370679e-06, "loss": 2.2205, "step": 513900 }, { "epoch": 0.9, "learning_rate": 5.190135220443853e-06, "loss": 2.2157, "step": 513910 }, { "epoch": 0.9, "learning_rate": 5.189263280517026e-06, "loss": 2.3101, "step": 513920 }, { "epoch": 0.9, "learning_rate": 5.1883913405901995e-06, "loss": 2.2545, "step": 513930 }, { "epoch": 0.9, "learning_rate": 5.1875194006633724e-06, "loss": 2.1713, "step": 513940 }, { "epoch": 0.9, "learning_rate": 5.186647460736545e-06, "loss": 2.3031, "step": 513950 }, { "epoch": 0.9, "learning_rate": 5.185775520809718e-06, "loss": 2.3885, "step": 513960 }, { "epoch": 0.9, "learning_rate": 5.184903580882892e-06, "loss": 2.1403, "step": 513970 }, { "epoch": 0.9, "learning_rate": 5.184031640956065e-06, "loss": 2.2268, "step": 513980 }, { "epoch": 0.9, "learning_rate": 5.183159701029238e-06, "loss": 2.395, "step": 513990 }, { "epoch": 0.9, "learning_rate": 5.182287761102411e-06, "loss": 2.2282, "step": 514000 }, { "epoch": 0.9, "learning_rate": 5.181415821175585e-06, "loss": 2.2612, "step": 514010 }, { "epoch": 0.9, "learning_rate": 5.1805438812487575e-06, "loss": 2.1963, "step": 514020 }, { "epoch": 0.9, "learning_rate": 5.1796719413219304e-06, "loss": 2.3589, "step": 514030 }, { "epoch": 0.9, "learning_rate": 5.178800001395104e-06, "loss": 2.3, "step": 514040 }, { "epoch": 0.9, "learning_rate": 5.177928061468278e-06, "loss": 2.3973, "step": 514050 }, { "epoch": 0.9, "learning_rate": 5.177056121541451e-06, "loss": 2.2845, "step": 514060 }, { "epoch": 0.9, "learning_rate": 5.176184181614624e-06, "loss": 2.2899, "step": 514070 }, { "epoch": 0.9, "learning_rate": 5.175312241687797e-06, "loss": 2.2468, "step": 514080 }, { "epoch": 0.9, "learning_rate": 5.1744403017609705e-06, "loss": 2.2456, "step": 514090 }, { "epoch": 0.9, "learning_rate": 5.1735683618341434e-06, "loss": 2.3201, "step": 514100 }, { "epoch": 0.9, "learning_rate": 5.172696421907316e-06, "loss": 2.3784, "step": 514110 }, { "epoch": 0.9, "learning_rate": 5.171824481980489e-06, "loss": 2.2391, "step": 514120 }, { "epoch": 0.9, "learning_rate": 5.170952542053663e-06, "loss": 2.3727, "step": 514130 }, { "epoch": 0.9, "learning_rate": 5.170080602126836e-06, "loss": 2.215, "step": 514140 }, { "epoch": 0.9, "learning_rate": 5.169208662200009e-06, "loss": 2.2997, "step": 514150 }, { "epoch": 0.9, "learning_rate": 5.168336722273182e-06, "loss": 2.2188, "step": 514160 }, { "epoch": 0.9, "learning_rate": 5.167464782346356e-06, "loss": 2.1892, "step": 514170 }, { "epoch": 0.9, "learning_rate": 5.166592842419529e-06, "loss": 2.2618, "step": 514180 }, { "epoch": 0.9, "learning_rate": 5.165720902492702e-06, "loss": 2.1794, "step": 514190 }, { "epoch": 0.9, "learning_rate": 5.164848962565875e-06, "loss": 2.2582, "step": 514200 }, { "epoch": 0.9, "learning_rate": 5.163977022639049e-06, "loss": 2.2837, "step": 514210 }, { "epoch": 0.9, "learning_rate": 5.163105082712222e-06, "loss": 2.2692, "step": 514220 }, { "epoch": 0.9, "learning_rate": 5.162233142785395e-06, "loss": 2.2486, "step": 514230 }, { "epoch": 0.9, "learning_rate": 5.161361202858568e-06, "loss": 2.291, "step": 514240 }, { "epoch": 0.9, "learning_rate": 5.1604892629317415e-06, "loss": 2.317, "step": 514250 }, { "epoch": 0.9, "learning_rate": 5.1596173230049144e-06, "loss": 2.2754, "step": 514260 }, { "epoch": 0.9, "learning_rate": 5.158745383078087e-06, "loss": 2.3341, "step": 514270 }, { "epoch": 0.9, "learning_rate": 5.15787344315126e-06, "loss": 2.2683, "step": 514280 }, { "epoch": 0.9, "learning_rate": 5.157001503224434e-06, "loss": 2.3755, "step": 514290 }, { "epoch": 0.9, "learning_rate": 5.156129563297607e-06, "loss": 2.2242, "step": 514300 }, { "epoch": 0.9, "learning_rate": 5.155257623370781e-06, "loss": 2.3078, "step": 514310 }, { "epoch": 0.9, "learning_rate": 5.154385683443954e-06, "loss": 2.3127, "step": 514320 }, { "epoch": 0.9, "learning_rate": 5.1535137435171274e-06, "loss": 2.2057, "step": 514330 }, { "epoch": 0.9, "learning_rate": 5.1526418035903e-06, "loss": 2.1615, "step": 514340 }, { "epoch": 0.9, "learning_rate": 5.151769863663473e-06, "loss": 2.3326, "step": 514350 }, { "epoch": 0.9, "learning_rate": 5.150897923736646e-06, "loss": 2.2082, "step": 514360 }, { "epoch": 0.9, "learning_rate": 5.15002598380982e-06, "loss": 2.3897, "step": 514370 }, { "epoch": 0.9, "learning_rate": 5.149154043882993e-06, "loss": 2.2876, "step": 514380 }, { "epoch": 0.9, "learning_rate": 5.148282103956166e-06, "loss": 2.2841, "step": 514390 }, { "epoch": 0.9, "learning_rate": 5.147410164029339e-06, "loss": 2.3195, "step": 514400 }, { "epoch": 0.9, "learning_rate": 5.1465382241025125e-06, "loss": 2.1948, "step": 514410 }, { "epoch": 0.9, "learning_rate": 5.1456662841756854e-06, "loss": 2.2485, "step": 514420 }, { "epoch": 0.9, "learning_rate": 5.144794344248858e-06, "loss": 2.3106, "step": 514430 }, { "epoch": 0.9, "learning_rate": 5.143922404322032e-06, "loss": 2.2281, "step": 514440 }, { "epoch": 0.9, "learning_rate": 5.143050464395206e-06, "loss": 2.3458, "step": 514450 }, { "epoch": 0.9, "learning_rate": 5.142178524468379e-06, "loss": 2.3234, "step": 514460 }, { "epoch": 0.9, "learning_rate": 5.141306584541552e-06, "loss": 2.2389, "step": 514470 }, { "epoch": 0.9, "learning_rate": 5.140434644614725e-06, "loss": 2.3251, "step": 514480 }, { "epoch": 0.9, "learning_rate": 5.1395627046878984e-06, "loss": 2.3358, "step": 514490 }, { "epoch": 0.9, "learning_rate": 5.138690764761071e-06, "loss": 2.2691, "step": 514500 }, { "epoch": 0.9, "learning_rate": 5.137818824834244e-06, "loss": 2.2367, "step": 514510 }, { "epoch": 0.9, "learning_rate": 5.136946884907417e-06, "loss": 2.1643, "step": 514520 }, { "epoch": 0.9, "learning_rate": 5.136074944980591e-06, "loss": 2.2477, "step": 514530 }, { "epoch": 0.9, "learning_rate": 5.135203005053764e-06, "loss": 2.2165, "step": 514540 }, { "epoch": 0.9, "learning_rate": 5.134331065126937e-06, "loss": 2.3012, "step": 514550 }, { "epoch": 0.9, "learning_rate": 5.133459125200111e-06, "loss": 2.258, "step": 514560 }, { "epoch": 0.9, "learning_rate": 5.1325871852732835e-06, "loss": 2.1746, "step": 514570 }, { "epoch": 0.9, "learning_rate": 5.131715245346457e-06, "loss": 2.2574, "step": 514580 }, { "epoch": 0.9, "learning_rate": 5.13084330541963e-06, "loss": 2.1625, "step": 514590 }, { "epoch": 0.9, "learning_rate": 5.129971365492803e-06, "loss": 2.1993, "step": 514600 }, { "epoch": 0.9, "learning_rate": 5.129099425565977e-06, "loss": 2.2614, "step": 514610 }, { "epoch": 0.9, "learning_rate": 5.12822748563915e-06, "loss": 2.3084, "step": 514620 }, { "epoch": 0.9, "learning_rate": 5.127355545712323e-06, "loss": 2.3887, "step": 514630 }, { "epoch": 0.9, "learning_rate": 5.126483605785496e-06, "loss": 2.2438, "step": 514640 }, { "epoch": 0.9, "learning_rate": 5.1256116658586694e-06, "loss": 2.2365, "step": 514650 }, { "epoch": 0.9, "learning_rate": 5.124739725931842e-06, "loss": 2.1789, "step": 514660 }, { "epoch": 0.9, "learning_rate": 5.123867786005015e-06, "loss": 2.0957, "step": 514670 }, { "epoch": 0.9, "learning_rate": 5.122995846078188e-06, "loss": 2.2446, "step": 514680 }, { "epoch": 0.9, "learning_rate": 5.122123906151362e-06, "loss": 2.106, "step": 514690 }, { "epoch": 0.9, "learning_rate": 5.121251966224535e-06, "loss": 2.1888, "step": 514700 }, { "epoch": 0.9, "learning_rate": 5.120380026297709e-06, "loss": 2.3343, "step": 514710 }, { "epoch": 0.9, "learning_rate": 5.119508086370882e-06, "loss": 2.2012, "step": 514720 }, { "epoch": 0.9, "learning_rate": 5.118636146444055e-06, "loss": 2.2114, "step": 514730 }, { "epoch": 0.9, "learning_rate": 5.117764206517228e-06, "loss": 2.2862, "step": 514740 }, { "epoch": 0.9, "learning_rate": 5.116892266590401e-06, "loss": 2.2171, "step": 514750 }, { "epoch": 0.9, "learning_rate": 5.116020326663574e-06, "loss": 2.2877, "step": 514760 }, { "epoch": 0.9, "learning_rate": 5.115148386736748e-06, "loss": 2.2584, "step": 514770 }, { "epoch": 0.9, "learning_rate": 5.114276446809921e-06, "loss": 2.3612, "step": 514780 }, { "epoch": 0.9, "learning_rate": 5.113404506883094e-06, "loss": 2.225, "step": 514790 }, { "epoch": 0.9, "learning_rate": 5.112532566956267e-06, "loss": 2.1403, "step": 514800 }, { "epoch": 0.9, "learning_rate": 5.1116606270294404e-06, "loss": 2.2973, "step": 514810 }, { "epoch": 0.9, "learning_rate": 5.110788687102613e-06, "loss": 2.2042, "step": 514820 }, { "epoch": 0.9, "learning_rate": 5.109916747175786e-06, "loss": 2.2414, "step": 514830 }, { "epoch": 0.9, "learning_rate": 5.10904480724896e-06, "loss": 2.2583, "step": 514840 }, { "epoch": 0.9, "learning_rate": 5.108172867322134e-06, "loss": 2.1739, "step": 514850 }, { "epoch": 0.9, "learning_rate": 5.107300927395307e-06, "loss": 2.3166, "step": 514860 }, { "epoch": 0.9, "learning_rate": 5.10642898746848e-06, "loss": 2.1834, "step": 514870 }, { "epoch": 0.9, "learning_rate": 5.105557047541653e-06, "loss": 2.2431, "step": 514880 }, { "epoch": 0.9, "learning_rate": 5.104685107614826e-06, "loss": 2.2381, "step": 514890 }, { "epoch": 0.9, "learning_rate": 5.103813167687999e-06, "loss": 2.368, "step": 514900 }, { "epoch": 0.9, "learning_rate": 5.102941227761172e-06, "loss": 2.1904, "step": 514910 }, { "epoch": 0.9, "learning_rate": 5.102069287834345e-06, "loss": 2.2537, "step": 514920 }, { "epoch": 0.9, "learning_rate": 5.101197347907519e-06, "loss": 2.3752, "step": 514930 }, { "epoch": 0.9, "learning_rate": 5.100325407980692e-06, "loss": 2.3194, "step": 514940 }, { "epoch": 0.9, "learning_rate": 5.099453468053865e-06, "loss": 2.1961, "step": 514950 }, { "epoch": 0.9, "learning_rate": 5.0985815281270385e-06, "loss": 2.3353, "step": 514960 }, { "epoch": 0.9, "learning_rate": 5.0977095882002114e-06, "loss": 2.2617, "step": 514970 }, { "epoch": 0.9, "learning_rate": 5.096837648273385e-06, "loss": 2.3163, "step": 514980 }, { "epoch": 0.9, "learning_rate": 5.095965708346558e-06, "loss": 2.371, "step": 514990 }, { "epoch": 0.9, "learning_rate": 5.095093768419731e-06, "loss": 2.2294, "step": 515000 }, { "epoch": 0.9, "learning_rate": 5.094221828492905e-06, "loss": 2.3285, "step": 515010 }, { "epoch": 0.9, "learning_rate": 5.093349888566078e-06, "loss": 2.3376, "step": 515020 }, { "epoch": 0.9, "learning_rate": 5.092477948639251e-06, "loss": 2.283, "step": 515030 }, { "epoch": 0.9, "learning_rate": 5.091606008712424e-06, "loss": 2.3314, "step": 515040 }, { "epoch": 0.9, "learning_rate": 5.090734068785597e-06, "loss": 2.2515, "step": 515050 }, { "epoch": 0.9, "learning_rate": 5.08986212885877e-06, "loss": 2.209, "step": 515060 }, { "epoch": 0.9, "learning_rate": 5.088990188931943e-06, "loss": 2.2928, "step": 515070 }, { "epoch": 0.9, "learning_rate": 5.088118249005117e-06, "loss": 2.3726, "step": 515080 }, { "epoch": 0.9, "learning_rate": 5.08724630907829e-06, "loss": 2.2422, "step": 515090 }, { "epoch": 0.9, "learning_rate": 5.086374369151463e-06, "loss": 2.1573, "step": 515100 }, { "epoch": 0.9, "learning_rate": 5.085502429224637e-06, "loss": 2.3291, "step": 515110 }, { "epoch": 0.9, "learning_rate": 5.0846304892978095e-06, "loss": 2.2443, "step": 515120 }, { "epoch": 0.9, "learning_rate": 5.083758549370983e-06, "loss": 2.2336, "step": 515130 }, { "epoch": 0.9, "learning_rate": 5.082886609444156e-06, "loss": 2.2559, "step": 515140 }, { "epoch": 0.9, "learning_rate": 5.082014669517329e-06, "loss": 2.299, "step": 515150 }, { "epoch": 0.9, "learning_rate": 5.081142729590502e-06, "loss": 2.2009, "step": 515160 }, { "epoch": 0.9, "learning_rate": 5.080270789663676e-06, "loss": 2.3425, "step": 515170 }, { "epoch": 0.9, "learning_rate": 5.079398849736849e-06, "loss": 2.293, "step": 515180 }, { "epoch": 0.9, "learning_rate": 5.078526909810022e-06, "loss": 2.362, "step": 515190 }, { "epoch": 0.9, "learning_rate": 5.0776549698831955e-06, "loss": 2.2181, "step": 515200 }, { "epoch": 0.9, "learning_rate": 5.076783029956368e-06, "loss": 2.2915, "step": 515210 }, { "epoch": 0.9, "learning_rate": 5.075911090029541e-06, "loss": 2.2451, "step": 515220 }, { "epoch": 0.9, "learning_rate": 5.075039150102714e-06, "loss": 2.3105, "step": 515230 }, { "epoch": 0.9, "learning_rate": 5.074167210175888e-06, "loss": 2.0912, "step": 515240 }, { "epoch": 0.9, "learning_rate": 5.073295270249062e-06, "loss": 2.1843, "step": 515250 }, { "epoch": 0.9, "learning_rate": 5.072423330322235e-06, "loss": 2.2207, "step": 515260 }, { "epoch": 0.9, "learning_rate": 5.071551390395408e-06, "loss": 2.219, "step": 515270 }, { "epoch": 0.9, "learning_rate": 5.0706794504685805e-06, "loss": 2.2459, "step": 515280 }, { "epoch": 0.9, "learning_rate": 5.069807510541754e-06, "loss": 2.2264, "step": 515290 }, { "epoch": 0.9, "learning_rate": 5.068935570614927e-06, "loss": 2.2928, "step": 515300 }, { "epoch": 0.9, "learning_rate": 5.0680636306881e-06, "loss": 2.2671, "step": 515310 }, { "epoch": 0.9, "learning_rate": 5.067191690761273e-06, "loss": 2.3022, "step": 515320 }, { "epoch": 0.9, "learning_rate": 5.066319750834447e-06, "loss": 2.2385, "step": 515330 }, { "epoch": 0.9, "learning_rate": 5.06544781090762e-06, "loss": 2.2358, "step": 515340 }, { "epoch": 0.9, "learning_rate": 5.064575870980793e-06, "loss": 2.2837, "step": 515350 }, { "epoch": 0.9, "learning_rate": 5.0637039310539665e-06, "loss": 2.2385, "step": 515360 }, { "epoch": 0.9, "learning_rate": 5.062831991127139e-06, "loss": 2.271, "step": 515370 }, { "epoch": 0.9, "learning_rate": 5.061960051200313e-06, "loss": 2.3844, "step": 515380 }, { "epoch": 0.9, "learning_rate": 5.061088111273486e-06, "loss": 2.3452, "step": 515390 }, { "epoch": 0.9, "learning_rate": 5.060216171346659e-06, "loss": 2.3057, "step": 515400 }, { "epoch": 0.9, "learning_rate": 5.059344231419833e-06, "loss": 2.2243, "step": 515410 }, { "epoch": 0.9, "learning_rate": 5.058472291493006e-06, "loss": 2.2366, "step": 515420 }, { "epoch": 0.9, "learning_rate": 5.057600351566179e-06, "loss": 2.1997, "step": 515430 }, { "epoch": 0.9, "learning_rate": 5.0567284116393515e-06, "loss": 2.3399, "step": 515440 }, { "epoch": 0.9, "learning_rate": 5.055856471712525e-06, "loss": 2.2418, "step": 515450 }, { "epoch": 0.9, "learning_rate": 5.054984531785698e-06, "loss": 2.222, "step": 515460 }, { "epoch": 0.9, "learning_rate": 5.054112591858871e-06, "loss": 2.3959, "step": 515470 }, { "epoch": 0.9, "learning_rate": 5.053240651932045e-06, "loss": 2.3114, "step": 515480 }, { "epoch": 0.9, "learning_rate": 5.052368712005218e-06, "loss": 2.3983, "step": 515490 }, { "epoch": 0.9, "learning_rate": 5.051496772078391e-06, "loss": 2.2309, "step": 515500 }, { "epoch": 0.9, "learning_rate": 5.0506248321515645e-06, "loss": 2.2379, "step": 515510 }, { "epoch": 0.9, "learning_rate": 5.0497528922247375e-06, "loss": 2.3814, "step": 515520 }, { "epoch": 0.9, "learning_rate": 5.048880952297911e-06, "loss": 2.3612, "step": 515530 }, { "epoch": 0.9, "learning_rate": 5.048009012371084e-06, "loss": 2.3129, "step": 515540 }, { "epoch": 0.9, "learning_rate": 5.047137072444257e-06, "loss": 2.1822, "step": 515550 }, { "epoch": 0.9, "learning_rate": 5.04626513251743e-06, "loss": 2.233, "step": 515560 }, { "epoch": 0.9, "learning_rate": 5.045393192590604e-06, "loss": 2.2463, "step": 515570 }, { "epoch": 0.9, "learning_rate": 5.044521252663777e-06, "loss": 2.1413, "step": 515580 }, { "epoch": 0.9, "learning_rate": 5.04364931273695e-06, "loss": 2.1995, "step": 515590 }, { "epoch": 0.9, "learning_rate": 5.042777372810123e-06, "loss": 2.2349, "step": 515600 }, { "epoch": 0.9, "learning_rate": 5.041905432883296e-06, "loss": 2.2724, "step": 515610 }, { "epoch": 0.9, "learning_rate": 5.041033492956469e-06, "loss": 2.3007, "step": 515620 }, { "epoch": 0.9, "learning_rate": 5.040161553029642e-06, "loss": 2.2676, "step": 515630 }, { "epoch": 0.9, "learning_rate": 5.039289613102816e-06, "loss": 2.1814, "step": 515640 }, { "epoch": 0.9, "learning_rate": 5.03841767317599e-06, "loss": 2.3337, "step": 515650 }, { "epoch": 0.9, "learning_rate": 5.037545733249163e-06, "loss": 2.2476, "step": 515660 }, { "epoch": 0.9, "learning_rate": 5.0366737933223355e-06, "loss": 2.1537, "step": 515670 }, { "epoch": 0.9, "learning_rate": 5.0358018533955085e-06, "loss": 2.2787, "step": 515680 }, { "epoch": 0.9, "learning_rate": 5.034929913468682e-06, "loss": 2.3596, "step": 515690 }, { "epoch": 0.9, "learning_rate": 5.034057973541855e-06, "loss": 2.3354, "step": 515700 }, { "epoch": 0.9, "learning_rate": 5.033186033615028e-06, "loss": 2.1667, "step": 515710 }, { "epoch": 0.9, "learning_rate": 5.032314093688202e-06, "loss": 2.2424, "step": 515720 }, { "epoch": 0.9, "learning_rate": 5.031442153761375e-06, "loss": 2.2309, "step": 515730 }, { "epoch": 0.9, "learning_rate": 5.030570213834548e-06, "loss": 2.2756, "step": 515740 }, { "epoch": 0.9, "learning_rate": 5.029698273907721e-06, "loss": 2.3845, "step": 515750 }, { "epoch": 0.9, "learning_rate": 5.028826333980894e-06, "loss": 2.3226, "step": 515760 }, { "epoch": 0.9, "learning_rate": 5.027954394054067e-06, "loss": 2.2358, "step": 515770 }, { "epoch": 0.9, "learning_rate": 5.027082454127241e-06, "loss": 2.2563, "step": 515780 }, { "epoch": 0.9, "learning_rate": 5.026210514200414e-06, "loss": 2.3253, "step": 515790 }, { "epoch": 0.9, "learning_rate": 5.025338574273587e-06, "loss": 2.2957, "step": 515800 }, { "epoch": 0.9, "learning_rate": 5.024466634346761e-06, "loss": 2.4156, "step": 515810 }, { "epoch": 0.9, "learning_rate": 5.023594694419934e-06, "loss": 2.2477, "step": 515820 }, { "epoch": 0.9, "learning_rate": 5.0227227544931065e-06, "loss": 2.4053, "step": 515830 }, { "epoch": 0.9, "learning_rate": 5.0218508145662795e-06, "loss": 2.2033, "step": 515840 }, { "epoch": 0.9, "learning_rate": 5.020978874639453e-06, "loss": 2.1988, "step": 515850 }, { "epoch": 0.9, "learning_rate": 5.020106934712626e-06, "loss": 2.2329, "step": 515860 }, { "epoch": 0.9, "learning_rate": 5.019234994785799e-06, "loss": 2.2905, "step": 515870 }, { "epoch": 0.9, "learning_rate": 5.018363054858973e-06, "loss": 2.2456, "step": 515880 }, { "epoch": 0.9, "learning_rate": 5.017491114932146e-06, "loss": 2.1733, "step": 515890 }, { "epoch": 0.9, "learning_rate": 5.016619175005319e-06, "loss": 2.1341, "step": 515900 }, { "epoch": 0.9, "learning_rate": 5.0157472350784925e-06, "loss": 2.2859, "step": 515910 }, { "epoch": 0.9, "learning_rate": 5.014875295151665e-06, "loss": 2.2788, "step": 515920 }, { "epoch": 0.9, "learning_rate": 5.014003355224839e-06, "loss": 2.1581, "step": 515930 }, { "epoch": 0.9, "learning_rate": 5.013131415298012e-06, "loss": 2.274, "step": 515940 }, { "epoch": 0.9, "learning_rate": 5.012259475371185e-06, "loss": 2.3442, "step": 515950 }, { "epoch": 0.9, "learning_rate": 5.011387535444358e-06, "loss": 2.2392, "step": 515960 }, { "epoch": 0.9, "learning_rate": 5.010515595517532e-06, "loss": 2.1771, "step": 515970 }, { "epoch": 0.9, "learning_rate": 5.009643655590705e-06, "loss": 2.2765, "step": 515980 }, { "epoch": 0.9, "learning_rate": 5.0087717156638775e-06, "loss": 2.3045, "step": 515990 }, { "epoch": 0.9, "learning_rate": 5.007899775737051e-06, "loss": 2.3904, "step": 516000 }, { "epoch": 0.9, "learning_rate": 5.007027835810224e-06, "loss": 2.3085, "step": 516010 }, { "epoch": 0.9, "learning_rate": 5.006155895883397e-06, "loss": 2.2574, "step": 516020 }, { "epoch": 0.9, "learning_rate": 5.00528395595657e-06, "loss": 2.2557, "step": 516030 }, { "epoch": 0.9, "learning_rate": 5.004412016029744e-06, "loss": 2.2655, "step": 516040 }, { "epoch": 0.9, "learning_rate": 5.003540076102918e-06, "loss": 2.2381, "step": 516050 }, { "epoch": 0.9, "learning_rate": 5.0026681361760905e-06, "loss": 2.2262, "step": 516060 }, { "epoch": 0.9, "learning_rate": 5.0017961962492635e-06, "loss": 2.1584, "step": 516070 }, { "epoch": 0.9, "learning_rate": 5.000924256322436e-06, "loss": 2.2374, "step": 516080 }, { "epoch": 0.9, "learning_rate": 5.00005231639561e-06, "loss": 2.2973, "step": 516090 }, { "epoch": 0.9, "learning_rate": 4.999180376468783e-06, "loss": 2.3639, "step": 516100 }, { "epoch": 0.9, "learning_rate": 4.998308436541956e-06, "loss": 2.1865, "step": 516110 }, { "epoch": 0.9, "learning_rate": 4.99743649661513e-06, "loss": 2.2764, "step": 516120 }, { "epoch": 0.9, "learning_rate": 4.996564556688303e-06, "loss": 2.2123, "step": 516130 }, { "epoch": 0.9, "learning_rate": 4.995692616761476e-06, "loss": 2.2367, "step": 516140 }, { "epoch": 0.9, "learning_rate": 4.9948206768346485e-06, "loss": 2.3461, "step": 516150 }, { "epoch": 0.9, "learning_rate": 4.993948736907822e-06, "loss": 2.3886, "step": 516160 }, { "epoch": 0.9, "learning_rate": 4.993076796980995e-06, "loss": 2.136, "step": 516170 }, { "epoch": 0.9, "learning_rate": 4.992204857054169e-06, "loss": 2.3385, "step": 516180 }, { "epoch": 0.9, "learning_rate": 4.991332917127342e-06, "loss": 2.249, "step": 516190 }, { "epoch": 0.9, "learning_rate": 4.990460977200515e-06, "loss": 2.3329, "step": 516200 }, { "epoch": 0.9, "learning_rate": 4.989589037273689e-06, "loss": 2.3299, "step": 516210 }, { "epoch": 0.9, "learning_rate": 4.9887170973468615e-06, "loss": 2.2525, "step": 516220 }, { "epoch": 0.9, "learning_rate": 4.9878451574200345e-06, "loss": 2.2441, "step": 516230 }, { "epoch": 0.9, "learning_rate": 4.986973217493208e-06, "loss": 2.1992, "step": 516240 }, { "epoch": 0.9, "learning_rate": 4.986101277566381e-06, "loss": 2.2443, "step": 516250 }, { "epoch": 0.9, "learning_rate": 4.985229337639554e-06, "loss": 2.245, "step": 516260 }, { "epoch": 0.9, "learning_rate": 4.984357397712727e-06, "loss": 2.2566, "step": 516270 }, { "epoch": 0.9, "learning_rate": 4.983485457785901e-06, "loss": 2.2225, "step": 516280 }, { "epoch": 0.9, "learning_rate": 4.982613517859074e-06, "loss": 2.298, "step": 516290 }, { "epoch": 0.9, "learning_rate": 4.981741577932247e-06, "loss": 2.1575, "step": 516300 }, { "epoch": 0.9, "learning_rate": 4.98086963800542e-06, "loss": 2.2745, "step": 516310 }, { "epoch": 0.9, "learning_rate": 4.979997698078593e-06, "loss": 2.2714, "step": 516320 }, { "epoch": 0.9, "learning_rate": 4.979125758151767e-06, "loss": 2.3187, "step": 516330 }, { "epoch": 0.9, "learning_rate": 4.97825381822494e-06, "loss": 2.1677, "step": 516340 }, { "epoch": 0.9, "learning_rate": 4.977381878298113e-06, "loss": 2.3026, "step": 516350 }, { "epoch": 0.9, "learning_rate": 4.976509938371286e-06, "loss": 2.1221, "step": 516360 }, { "epoch": 0.9, "learning_rate": 4.97563799844446e-06, "loss": 2.1953, "step": 516370 }, { "epoch": 0.9, "learning_rate": 4.9747660585176325e-06, "loss": 2.167, "step": 516380 }, { "epoch": 0.9, "learning_rate": 4.9738941185908055e-06, "loss": 2.3566, "step": 516390 }, { "epoch": 0.9, "learning_rate": 4.973022178663979e-06, "loss": 2.2889, "step": 516400 }, { "epoch": 0.9, "learning_rate": 4.972150238737152e-06, "loss": 2.3423, "step": 516410 }, { "epoch": 0.9, "learning_rate": 4.971278298810325e-06, "loss": 2.1115, "step": 516420 }, { "epoch": 0.9, "learning_rate": 4.970406358883498e-06, "loss": 2.2903, "step": 516430 }, { "epoch": 0.9, "learning_rate": 4.969534418956672e-06, "loss": 2.3075, "step": 516440 }, { "epoch": 0.9, "learning_rate": 4.9686624790298455e-06, "loss": 2.1575, "step": 516450 }, { "epoch": 0.9, "learning_rate": 4.9677905391030185e-06, "loss": 2.2927, "step": 516460 }, { "epoch": 0.9, "learning_rate": 4.966918599176191e-06, "loss": 2.2265, "step": 516470 }, { "epoch": 0.9, "learning_rate": 4.966046659249364e-06, "loss": 2.2283, "step": 516480 }, { "epoch": 0.9, "learning_rate": 4.965174719322538e-06, "loss": 2.2185, "step": 516490 }, { "epoch": 0.9, "learning_rate": 4.964302779395711e-06, "loss": 2.1322, "step": 516500 }, { "epoch": 0.9, "learning_rate": 4.963430839468884e-06, "loss": 2.2759, "step": 516510 }, { "epoch": 0.9, "learning_rate": 4.962558899542058e-06, "loss": 2.2681, "step": 516520 }, { "epoch": 0.9, "learning_rate": 4.961686959615231e-06, "loss": 2.346, "step": 516530 }, { "epoch": 0.9, "learning_rate": 4.9608150196884035e-06, "loss": 2.2638, "step": 516540 }, { "epoch": 0.9, "learning_rate": 4.9599430797615765e-06, "loss": 2.2963, "step": 516550 }, { "epoch": 0.9, "learning_rate": 4.95907113983475e-06, "loss": 2.2735, "step": 516560 }, { "epoch": 0.9, "learning_rate": 4.958199199907924e-06, "loss": 2.1827, "step": 516570 }, { "epoch": 0.9, "learning_rate": 4.957327259981097e-06, "loss": 2.3428, "step": 516580 }, { "epoch": 0.9, "learning_rate": 4.95645532005427e-06, "loss": 2.295, "step": 516590 }, { "epoch": 0.9, "learning_rate": 4.955583380127443e-06, "loss": 2.165, "step": 516600 }, { "epoch": 0.9, "learning_rate": 4.9547114402006165e-06, "loss": 2.2697, "step": 516610 }, { "epoch": 0.9, "learning_rate": 4.9538395002737895e-06, "loss": 2.2651, "step": 516620 }, { "epoch": 0.9, "learning_rate": 4.952967560346962e-06, "loss": 2.2574, "step": 516630 }, { "epoch": 0.9, "learning_rate": 4.952095620420136e-06, "loss": 2.2722, "step": 516640 }, { "epoch": 0.9, "learning_rate": 4.951223680493309e-06, "loss": 2.2483, "step": 516650 }, { "epoch": 0.9, "learning_rate": 4.950351740566482e-06, "loss": 2.2582, "step": 516660 }, { "epoch": 0.9, "learning_rate": 4.949479800639655e-06, "loss": 2.2807, "step": 516670 }, { "epoch": 0.9, "learning_rate": 4.948607860712829e-06, "loss": 2.347, "step": 516680 }, { "epoch": 0.9, "learning_rate": 4.947735920786002e-06, "loss": 2.2594, "step": 516690 }, { "epoch": 0.9, "learning_rate": 4.9468639808591745e-06, "loss": 2.3294, "step": 516700 }, { "epoch": 0.9, "learning_rate": 4.945992040932348e-06, "loss": 2.2368, "step": 516710 }, { "epoch": 0.9, "learning_rate": 4.945120101005521e-06, "loss": 2.3005, "step": 516720 }, { "epoch": 0.9, "learning_rate": 4.944248161078695e-06, "loss": 2.2077, "step": 516730 }, { "epoch": 0.9, "learning_rate": 4.943376221151868e-06, "loss": 2.228, "step": 516740 }, { "epoch": 0.9, "learning_rate": 4.942504281225041e-06, "loss": 2.2913, "step": 516750 }, { "epoch": 0.9, "learning_rate": 4.941632341298215e-06, "loss": 2.3237, "step": 516760 }, { "epoch": 0.9, "learning_rate": 4.9407604013713875e-06, "loss": 2.156, "step": 516770 }, { "epoch": 0.9, "learning_rate": 4.9398884614445605e-06, "loss": 2.2199, "step": 516780 }, { "epoch": 0.9, "learning_rate": 4.939016521517733e-06, "loss": 2.3261, "step": 516790 }, { "epoch": 0.9, "learning_rate": 4.938144581590907e-06, "loss": 2.2322, "step": 516800 }, { "epoch": 0.9, "learning_rate": 4.93727264166408e-06, "loss": 2.313, "step": 516810 }, { "epoch": 0.9, "learning_rate": 4.936400701737253e-06, "loss": 2.2629, "step": 516820 }, { "epoch": 0.9, "learning_rate": 4.935528761810426e-06, "loss": 2.2396, "step": 516830 }, { "epoch": 0.9, "learning_rate": 4.9346568218836e-06, "loss": 2.2931, "step": 516840 }, { "epoch": 0.9, "learning_rate": 4.9337848819567735e-06, "loss": 2.3325, "step": 516850 }, { "epoch": 0.9, "learning_rate": 4.932912942029946e-06, "loss": 2.2249, "step": 516860 }, { "epoch": 0.9, "learning_rate": 4.932041002103119e-06, "loss": 2.2363, "step": 516870 }, { "epoch": 0.9, "learning_rate": 4.931169062176292e-06, "loss": 2.2975, "step": 516880 }, { "epoch": 0.9, "learning_rate": 4.930297122249466e-06, "loss": 2.312, "step": 516890 }, { "epoch": 0.9, "learning_rate": 4.929425182322639e-06, "loss": 2.1997, "step": 516900 }, { "epoch": 0.9, "learning_rate": 4.928553242395812e-06, "loss": 2.2384, "step": 516910 }, { "epoch": 0.9, "learning_rate": 4.927681302468986e-06, "loss": 2.2324, "step": 516920 }, { "epoch": 0.9, "learning_rate": 4.9268093625421585e-06, "loss": 2.3465, "step": 516930 }, { "epoch": 0.9, "learning_rate": 4.9259374226153315e-06, "loss": 2.3503, "step": 516940 }, { "epoch": 0.9, "learning_rate": 4.925065482688504e-06, "loss": 2.2614, "step": 516950 }, { "epoch": 0.9, "learning_rate": 4.924193542761678e-06, "loss": 2.1566, "step": 516960 }, { "epoch": 0.9, "learning_rate": 4.923321602834852e-06, "loss": 2.2764, "step": 516970 }, { "epoch": 0.9, "learning_rate": 4.922449662908025e-06, "loss": 2.2292, "step": 516980 }, { "epoch": 0.9, "learning_rate": 4.921577722981198e-06, "loss": 2.2491, "step": 516990 }, { "epoch": 0.9, "learning_rate": 4.920705783054371e-06, "loss": 2.021, "step": 517000 }, { "epoch": 0.9, "learning_rate": 4.9198338431275445e-06, "loss": 2.4153, "step": 517010 }, { "epoch": 0.9, "learning_rate": 4.918961903200717e-06, "loss": 2.2409, "step": 517020 }, { "epoch": 0.9, "learning_rate": 4.91808996327389e-06, "loss": 2.2498, "step": 517030 }, { "epoch": 0.9, "learning_rate": 4.917218023347064e-06, "loss": 2.2052, "step": 517040 }, { "epoch": 0.9, "learning_rate": 4.916346083420237e-06, "loss": 2.17, "step": 517050 }, { "epoch": 0.9, "learning_rate": 4.91547414349341e-06, "loss": 2.2164, "step": 517060 }, { "epoch": 0.9, "learning_rate": 4.914602203566583e-06, "loss": 2.2584, "step": 517070 }, { "epoch": 0.9, "learning_rate": 4.913730263639757e-06, "loss": 2.2216, "step": 517080 }, { "epoch": 0.9, "learning_rate": 4.9128583237129295e-06, "loss": 2.3262, "step": 517090 }, { "epoch": 0.9, "learning_rate": 4.9119863837861025e-06, "loss": 2.408, "step": 517100 }, { "epoch": 0.9, "learning_rate": 4.911114443859276e-06, "loss": 2.3195, "step": 517110 }, { "epoch": 0.9, "learning_rate": 4.910242503932449e-06, "loss": 2.2597, "step": 517120 }, { "epoch": 0.9, "learning_rate": 4.909370564005623e-06, "loss": 2.2937, "step": 517130 }, { "epoch": 0.9, "learning_rate": 4.908498624078796e-06, "loss": 2.1008, "step": 517140 }, { "epoch": 0.9, "learning_rate": 4.907626684151969e-06, "loss": 2.2273, "step": 517150 }, { "epoch": 0.9, "learning_rate": 4.9067547442251425e-06, "loss": 2.1828, "step": 517160 }, { "epoch": 0.9, "learning_rate": 4.9058828042983155e-06, "loss": 2.1789, "step": 517170 }, { "epoch": 0.9, "learning_rate": 4.905010864371488e-06, "loss": 2.2693, "step": 517180 }, { "epoch": 0.9, "learning_rate": 4.904138924444661e-06, "loss": 2.2206, "step": 517190 }, { "epoch": 0.9, "learning_rate": 4.903266984517835e-06, "loss": 2.3709, "step": 517200 }, { "epoch": 0.9, "learning_rate": 4.902395044591008e-06, "loss": 2.1628, "step": 517210 }, { "epoch": 0.9, "learning_rate": 4.901523104664181e-06, "loss": 2.3745, "step": 517220 }, { "epoch": 0.9, "learning_rate": 4.900651164737354e-06, "loss": 2.3108, "step": 517230 }, { "epoch": 0.9, "learning_rate": 4.899779224810528e-06, "loss": 2.2408, "step": 517240 }, { "epoch": 0.9, "learning_rate": 4.898907284883701e-06, "loss": 2.3299, "step": 517250 }, { "epoch": 0.9, "learning_rate": 4.898035344956874e-06, "loss": 2.3378, "step": 517260 }, { "epoch": 0.9, "learning_rate": 4.897163405030047e-06, "loss": 2.256, "step": 517270 }, { "epoch": 0.9, "learning_rate": 4.896291465103221e-06, "loss": 2.3389, "step": 517280 }, { "epoch": 0.9, "learning_rate": 4.895419525176394e-06, "loss": 2.3593, "step": 517290 }, { "epoch": 0.9, "learning_rate": 4.894547585249567e-06, "loss": 2.4192, "step": 517300 }, { "epoch": 0.9, "learning_rate": 4.89367564532274e-06, "loss": 2.2739, "step": 517310 }, { "epoch": 0.9, "learning_rate": 4.8928037053959135e-06, "loss": 2.2442, "step": 517320 }, { "epoch": 0.9, "learning_rate": 4.8919317654690865e-06, "loss": 2.2653, "step": 517330 }, { "epoch": 0.9, "learning_rate": 4.891059825542259e-06, "loss": 2.3294, "step": 517340 }, { "epoch": 0.9, "learning_rate": 4.890187885615432e-06, "loss": 2.4141, "step": 517350 }, { "epoch": 0.9, "learning_rate": 4.889315945688606e-06, "loss": 2.2614, "step": 517360 }, { "epoch": 0.9, "learning_rate": 4.88844400576178e-06, "loss": 2.3904, "step": 517370 }, { "epoch": 0.9, "learning_rate": 4.887572065834953e-06, "loss": 2.285, "step": 517380 }, { "epoch": 0.9, "learning_rate": 4.886700125908126e-06, "loss": 2.3902, "step": 517390 }, { "epoch": 0.9, "learning_rate": 4.885828185981299e-06, "loss": 2.2744, "step": 517400 }, { "epoch": 0.9, "learning_rate": 4.884956246054472e-06, "loss": 2.3109, "step": 517410 }, { "epoch": 0.9, "learning_rate": 4.884084306127645e-06, "loss": 2.3087, "step": 517420 }, { "epoch": 0.9, "learning_rate": 4.883212366200818e-06, "loss": 2.2958, "step": 517430 }, { "epoch": 0.9, "learning_rate": 4.882340426273992e-06, "loss": 2.2499, "step": 517440 }, { "epoch": 0.9, "learning_rate": 4.881468486347165e-06, "loss": 2.4022, "step": 517450 }, { "epoch": 0.9, "learning_rate": 4.880596546420338e-06, "loss": 2.2908, "step": 517460 }, { "epoch": 0.9, "learning_rate": 4.879724606493511e-06, "loss": 2.2606, "step": 517470 }, { "epoch": 0.9, "learning_rate": 4.8788526665666845e-06, "loss": 2.2385, "step": 517480 }, { "epoch": 0.9, "learning_rate": 4.8779807266398575e-06, "loss": 2.309, "step": 517490 }, { "epoch": 0.9, "learning_rate": 4.87710878671303e-06, "loss": 2.1161, "step": 517500 }, { "epoch": 0.9, "learning_rate": 4.876236846786204e-06, "loss": 2.2822, "step": 517510 }, { "epoch": 0.9, "learning_rate": 4.875364906859377e-06, "loss": 2.174, "step": 517520 }, { "epoch": 0.9, "learning_rate": 4.874492966932551e-06, "loss": 2.3102, "step": 517530 }, { "epoch": 0.9, "learning_rate": 4.873621027005724e-06, "loss": 2.2916, "step": 517540 }, { "epoch": 0.9, "learning_rate": 4.872749087078897e-06, "loss": 2.3445, "step": 517550 }, { "epoch": 0.9, "learning_rate": 4.8718771471520705e-06, "loss": 2.2016, "step": 517560 }, { "epoch": 0.9, "learning_rate": 4.871005207225243e-06, "loss": 2.2454, "step": 517570 }, { "epoch": 0.9, "learning_rate": 4.870133267298416e-06, "loss": 2.2614, "step": 517580 }, { "epoch": 0.9, "learning_rate": 4.869261327371589e-06, "loss": 2.3917, "step": 517590 }, { "epoch": 0.9, "learning_rate": 4.868389387444763e-06, "loss": 2.3839, "step": 517600 }, { "epoch": 0.9, "learning_rate": 4.867517447517936e-06, "loss": 2.2226, "step": 517610 }, { "epoch": 0.9, "learning_rate": 4.866645507591109e-06, "loss": 2.2344, "step": 517620 }, { "epoch": 0.9, "learning_rate": 4.865773567664282e-06, "loss": 2.1646, "step": 517630 }, { "epoch": 0.9, "learning_rate": 4.8649016277374555e-06, "loss": 2.3275, "step": 517640 }, { "epoch": 0.9, "learning_rate": 4.864029687810629e-06, "loss": 2.3507, "step": 517650 }, { "epoch": 0.9, "learning_rate": 4.863157747883802e-06, "loss": 2.293, "step": 517660 }, { "epoch": 0.9, "learning_rate": 4.862285807956975e-06, "loss": 2.298, "step": 517670 }, { "epoch": 0.9, "learning_rate": 4.861413868030149e-06, "loss": 2.252, "step": 517680 }, { "epoch": 0.9, "learning_rate": 4.860541928103322e-06, "loss": 2.1324, "step": 517690 }, { "epoch": 0.9, "learning_rate": 4.859669988176495e-06, "loss": 2.0959, "step": 517700 }, { "epoch": 0.9, "learning_rate": 4.858798048249668e-06, "loss": 2.2444, "step": 517710 }, { "epoch": 0.9, "learning_rate": 4.8579261083228415e-06, "loss": 2.3031, "step": 517720 }, { "epoch": 0.9, "learning_rate": 4.857054168396014e-06, "loss": 2.3105, "step": 517730 }, { "epoch": 0.9, "learning_rate": 4.856182228469187e-06, "loss": 2.2465, "step": 517740 }, { "epoch": 0.9, "learning_rate": 4.85531028854236e-06, "loss": 2.3536, "step": 517750 }, { "epoch": 0.9, "learning_rate": 4.854438348615534e-06, "loss": 2.2137, "step": 517760 }, { "epoch": 0.9, "learning_rate": 4.853566408688708e-06, "loss": 2.2788, "step": 517770 }, { "epoch": 0.9, "learning_rate": 4.852694468761881e-06, "loss": 2.2455, "step": 517780 }, { "epoch": 0.9, "learning_rate": 4.851822528835054e-06, "loss": 2.3437, "step": 517790 }, { "epoch": 0.9, "learning_rate": 4.850950588908227e-06, "loss": 2.2497, "step": 517800 }, { "epoch": 0.9, "learning_rate": 4.8500786489814e-06, "loss": 2.2132, "step": 517810 }, { "epoch": 0.9, "learning_rate": 4.849206709054573e-06, "loss": 2.1862, "step": 517820 }, { "epoch": 0.9, "learning_rate": 4.848334769127746e-06, "loss": 2.2844, "step": 517830 }, { "epoch": 0.9, "learning_rate": 4.84746282920092e-06, "loss": 2.2077, "step": 517840 }, { "epoch": 0.9, "learning_rate": 4.846590889274093e-06, "loss": 2.1901, "step": 517850 }, { "epoch": 0.9, "learning_rate": 4.845718949347266e-06, "loss": 2.2205, "step": 517860 }, { "epoch": 0.9, "learning_rate": 4.844847009420439e-06, "loss": 2.2424, "step": 517870 }, { "epoch": 0.9, "learning_rate": 4.8439750694936125e-06, "loss": 2.2203, "step": 517880 }, { "epoch": 0.9, "learning_rate": 4.843103129566785e-06, "loss": 2.3677, "step": 517890 }, { "epoch": 0.9, "learning_rate": 4.842231189639959e-06, "loss": 2.2976, "step": 517900 }, { "epoch": 0.9, "learning_rate": 4.841359249713132e-06, "loss": 2.243, "step": 517910 }, { "epoch": 0.9, "learning_rate": 4.840487309786305e-06, "loss": 2.2548, "step": 517920 }, { "epoch": 0.9, "learning_rate": 4.839615369859479e-06, "loss": 2.1795, "step": 517930 }, { "epoch": 0.9, "learning_rate": 4.838743429932652e-06, "loss": 2.3143, "step": 517940 }, { "epoch": 0.9, "learning_rate": 4.837871490005825e-06, "loss": 2.2133, "step": 517950 }, { "epoch": 0.9, "learning_rate": 4.836999550078998e-06, "loss": 2.3473, "step": 517960 }, { "epoch": 0.9, "learning_rate": 4.836127610152171e-06, "loss": 2.3385, "step": 517970 }, { "epoch": 0.9, "learning_rate": 4.835255670225344e-06, "loss": 2.1654, "step": 517980 }, { "epoch": 0.9, "learning_rate": 4.834383730298517e-06, "loss": 2.2415, "step": 517990 }, { "epoch": 0.9, "learning_rate": 4.833511790371691e-06, "loss": 2.2849, "step": 518000 }, { "epoch": 0.9, "learning_rate": 4.832639850444864e-06, "loss": 2.2003, "step": 518010 }, { "epoch": 0.9, "learning_rate": 4.831767910518037e-06, "loss": 2.3576, "step": 518020 }, { "epoch": 0.9, "learning_rate": 4.83089597059121e-06, "loss": 2.2044, "step": 518030 }, { "epoch": 0.9, "learning_rate": 4.8300240306643835e-06, "loss": 2.1732, "step": 518040 }, { "epoch": 0.9, "learning_rate": 4.829152090737557e-06, "loss": 2.3106, "step": 518050 }, { "epoch": 0.9, "learning_rate": 4.82828015081073e-06, "loss": 2.2601, "step": 518060 }, { "epoch": 0.9, "learning_rate": 4.827408210883903e-06, "loss": 2.2045, "step": 518070 }, { "epoch": 0.9, "learning_rate": 4.826536270957077e-06, "loss": 2.2676, "step": 518080 }, { "epoch": 0.9, "learning_rate": 4.82566433103025e-06, "loss": 2.3086, "step": 518090 }, { "epoch": 0.9, "learning_rate": 4.824792391103423e-06, "loss": 2.3402, "step": 518100 }, { "epoch": 0.9, "learning_rate": 4.823920451176596e-06, "loss": 2.1356, "step": 518110 }, { "epoch": 0.9, "learning_rate": 4.823048511249769e-06, "loss": 2.1805, "step": 518120 }, { "epoch": 0.9, "learning_rate": 4.822176571322942e-06, "loss": 2.2203, "step": 518130 }, { "epoch": 0.9, "learning_rate": 4.821304631396115e-06, "loss": 2.2753, "step": 518140 }, { "epoch": 0.9, "learning_rate": 4.820432691469288e-06, "loss": 2.2778, "step": 518150 }, { "epoch": 0.9, "learning_rate": 4.819560751542462e-06, "loss": 2.2145, "step": 518160 }, { "epoch": 0.9, "learning_rate": 4.818688811615636e-06, "loss": 2.2337, "step": 518170 }, { "epoch": 0.9, "learning_rate": 4.817816871688809e-06, "loss": 2.225, "step": 518180 }, { "epoch": 0.9, "learning_rate": 4.8169449317619816e-06, "loss": 2.3067, "step": 518190 }, { "epoch": 0.9, "learning_rate": 4.816072991835155e-06, "loss": 2.319, "step": 518200 }, { "epoch": 0.9, "learning_rate": 4.815201051908328e-06, "loss": 2.294, "step": 518210 }, { "epoch": 0.9, "learning_rate": 4.814329111981501e-06, "loss": 2.3031, "step": 518220 }, { "epoch": 0.9, "learning_rate": 4.813457172054674e-06, "loss": 2.332, "step": 518230 }, { "epoch": 0.9, "learning_rate": 4.812585232127848e-06, "loss": 2.2063, "step": 518240 }, { "epoch": 0.9, "learning_rate": 4.811713292201021e-06, "loss": 2.3409, "step": 518250 }, { "epoch": 0.9, "learning_rate": 4.810841352274194e-06, "loss": 2.319, "step": 518260 }, { "epoch": 0.9, "learning_rate": 4.809969412347367e-06, "loss": 2.3883, "step": 518270 }, { "epoch": 0.9, "learning_rate": 4.80909747242054e-06, "loss": 2.2975, "step": 518280 }, { "epoch": 0.9, "learning_rate": 4.808225532493713e-06, "loss": 2.3095, "step": 518290 }, { "epoch": 0.9, "learning_rate": 4.807353592566887e-06, "loss": 2.3051, "step": 518300 }, { "epoch": 0.9, "learning_rate": 4.80648165264006e-06, "loss": 2.249, "step": 518310 }, { "epoch": 0.9, "learning_rate": 4.805609712713234e-06, "loss": 2.2534, "step": 518320 }, { "epoch": 0.9, "learning_rate": 4.804737772786407e-06, "loss": 2.2529, "step": 518330 }, { "epoch": 0.9, "learning_rate": 4.80386583285958e-06, "loss": 2.2693, "step": 518340 }, { "epoch": 0.9, "learning_rate": 4.8029938929327526e-06, "loss": 2.3338, "step": 518350 }, { "epoch": 0.9, "learning_rate": 4.802121953005926e-06, "loss": 2.258, "step": 518360 }, { "epoch": 0.9, "learning_rate": 4.801250013079099e-06, "loss": 2.1887, "step": 518370 }, { "epoch": 0.9, "learning_rate": 4.800378073152272e-06, "loss": 2.1109, "step": 518380 }, { "epoch": 0.9, "learning_rate": 4.799506133225445e-06, "loss": 2.2301, "step": 518390 }, { "epoch": 0.9, "learning_rate": 4.798634193298619e-06, "loss": 2.2808, "step": 518400 }, { "epoch": 0.9, "learning_rate": 4.797762253371792e-06, "loss": 2.2619, "step": 518410 }, { "epoch": 0.9, "learning_rate": 4.796890313444965e-06, "loss": 2.3314, "step": 518420 }, { "epoch": 0.9, "learning_rate": 4.796018373518138e-06, "loss": 2.2917, "step": 518430 }, { "epoch": 0.9, "learning_rate": 4.795146433591312e-06, "loss": 2.1935, "step": 518440 }, { "epoch": 0.9, "learning_rate": 4.794274493664485e-06, "loss": 2.2761, "step": 518450 }, { "epoch": 0.9, "learning_rate": 4.793402553737658e-06, "loss": 2.1917, "step": 518460 }, { "epoch": 0.9, "learning_rate": 4.792530613810831e-06, "loss": 2.2842, "step": 518470 }, { "epoch": 0.9, "learning_rate": 4.791658673884005e-06, "loss": 2.324, "step": 518480 }, { "epoch": 0.9, "learning_rate": 4.790786733957178e-06, "loss": 2.2002, "step": 518490 }, { "epoch": 0.9, "learning_rate": 4.789914794030351e-06, "loss": 2.1899, "step": 518500 }, { "epoch": 0.9, "learning_rate": 4.7890428541035236e-06, "loss": 2.2465, "step": 518510 }, { "epoch": 0.9, "learning_rate": 4.788170914176697e-06, "loss": 2.3321, "step": 518520 }, { "epoch": 0.9, "learning_rate": 4.78729897424987e-06, "loss": 2.205, "step": 518530 }, { "epoch": 0.9, "learning_rate": 4.786427034323043e-06, "loss": 2.1979, "step": 518540 }, { "epoch": 0.9, "learning_rate": 4.785555094396216e-06, "loss": 2.2515, "step": 518550 }, { "epoch": 0.9, "learning_rate": 4.78468315446939e-06, "loss": 2.2574, "step": 518560 }, { "epoch": 0.9, "learning_rate": 4.783811214542564e-06, "loss": 2.1699, "step": 518570 }, { "epoch": 0.9, "learning_rate": 4.7829392746157366e-06, "loss": 2.2546, "step": 518580 }, { "epoch": 0.9, "learning_rate": 4.7820673346889095e-06, "loss": 2.2855, "step": 518590 }, { "epoch": 0.9, "learning_rate": 4.781195394762083e-06, "loss": 2.2718, "step": 518600 }, { "epoch": 0.9, "learning_rate": 4.780323454835256e-06, "loss": 2.1966, "step": 518610 }, { "epoch": 0.9, "learning_rate": 4.779451514908429e-06, "loss": 2.3435, "step": 518620 }, { "epoch": 0.9, "learning_rate": 4.778579574981602e-06, "loss": 2.3211, "step": 518630 }, { "epoch": 0.9, "learning_rate": 4.777707635054776e-06, "loss": 2.1434, "step": 518640 }, { "epoch": 0.9, "learning_rate": 4.776835695127949e-06, "loss": 2.1636, "step": 518650 }, { "epoch": 0.9, "learning_rate": 4.775963755201122e-06, "loss": 2.2717, "step": 518660 }, { "epoch": 0.9, "learning_rate": 4.7750918152742946e-06, "loss": 2.2347, "step": 518670 }, { "epoch": 0.9, "learning_rate": 4.774219875347468e-06, "loss": 2.203, "step": 518680 }, { "epoch": 0.9, "learning_rate": 4.773347935420641e-06, "loss": 2.2639, "step": 518690 }, { "epoch": 0.9, "learning_rate": 4.772475995493815e-06, "loss": 2.3326, "step": 518700 }, { "epoch": 0.9, "learning_rate": 4.771604055566988e-06, "loss": 2.2055, "step": 518710 }, { "epoch": 0.9, "learning_rate": 4.770732115640162e-06, "loss": 2.2069, "step": 518720 }, { "epoch": 0.9, "learning_rate": 4.769860175713335e-06, "loss": 2.2563, "step": 518730 }, { "epoch": 0.9, "learning_rate": 4.7689882357865076e-06, "loss": 2.293, "step": 518740 }, { "epoch": 0.9, "learning_rate": 4.7681162958596805e-06, "loss": 2.1521, "step": 518750 }, { "epoch": 0.9, "learning_rate": 4.767244355932854e-06, "loss": 2.3362, "step": 518760 }, { "epoch": 0.9, "learning_rate": 4.766372416006027e-06, "loss": 2.2801, "step": 518770 }, { "epoch": 0.9, "learning_rate": 4.7655004760792e-06, "loss": 2.306, "step": 518780 }, { "epoch": 0.9, "learning_rate": 4.764628536152373e-06, "loss": 2.3007, "step": 518790 }, { "epoch": 0.9, "learning_rate": 4.763756596225547e-06, "loss": 2.2216, "step": 518800 }, { "epoch": 0.9, "learning_rate": 4.76288465629872e-06, "loss": 2.3038, "step": 518810 }, { "epoch": 0.9, "learning_rate": 4.762012716371893e-06, "loss": 2.1701, "step": 518820 }, { "epoch": 0.9, "learning_rate": 4.7611407764450656e-06, "loss": 2.3011, "step": 518830 }, { "epoch": 0.9, "learning_rate": 4.76026883651824e-06, "loss": 2.325, "step": 518840 }, { "epoch": 0.9, "learning_rate": 4.759396896591413e-06, "loss": 2.367, "step": 518850 }, { "epoch": 0.9, "learning_rate": 4.758524956664586e-06, "loss": 2.2332, "step": 518860 }, { "epoch": 0.9, "learning_rate": 4.757653016737759e-06, "loss": 2.1726, "step": 518870 }, { "epoch": 0.9, "learning_rate": 4.756781076810933e-06, "loss": 2.2593, "step": 518880 }, { "epoch": 0.9, "learning_rate": 4.755909136884106e-06, "loss": 2.206, "step": 518890 }, { "epoch": 0.9, "learning_rate": 4.7550371969572786e-06, "loss": 2.1553, "step": 518900 }, { "epoch": 0.9, "learning_rate": 4.7541652570304515e-06, "loss": 2.3242, "step": 518910 }, { "epoch": 0.9, "learning_rate": 4.753293317103625e-06, "loss": 2.1702, "step": 518920 }, { "epoch": 0.9, "learning_rate": 4.752421377176798e-06, "loss": 2.2147, "step": 518930 }, { "epoch": 0.9, "learning_rate": 4.751549437249971e-06, "loss": 2.1708, "step": 518940 }, { "epoch": 0.9, "learning_rate": 4.750677497323144e-06, "loss": 2.2867, "step": 518950 }, { "epoch": 0.91, "learning_rate": 4.749805557396318e-06, "loss": 2.2438, "step": 518960 }, { "epoch": 0.91, "learning_rate": 4.7489336174694916e-06, "loss": 2.1737, "step": 518970 }, { "epoch": 0.91, "learning_rate": 4.7480616775426645e-06, "loss": 2.2318, "step": 518980 }, { "epoch": 0.91, "learning_rate": 4.747189737615837e-06, "loss": 2.3003, "step": 518990 }, { "epoch": 0.91, "learning_rate": 4.746317797689011e-06, "loss": 2.178, "step": 519000 }, { "epoch": 0.91, "learning_rate": 4.745445857762184e-06, "loss": 2.2521, "step": 519010 }, { "epoch": 0.91, "learning_rate": 4.744573917835357e-06, "loss": 2.2311, "step": 519020 }, { "epoch": 0.91, "learning_rate": 4.74370197790853e-06, "loss": 2.3246, "step": 519030 }, { "epoch": 0.91, "learning_rate": 4.742830037981704e-06, "loss": 2.2157, "step": 519040 }, { "epoch": 0.91, "learning_rate": 4.741958098054877e-06, "loss": 2.295, "step": 519050 }, { "epoch": 0.91, "learning_rate": 4.7410861581280496e-06, "loss": 2.2274, "step": 519060 }, { "epoch": 0.91, "learning_rate": 4.7402142182012225e-06, "loss": 2.2393, "step": 519070 }, { "epoch": 0.91, "learning_rate": 4.739342278274396e-06, "loss": 2.1999, "step": 519080 }, { "epoch": 0.91, "learning_rate": 4.738470338347569e-06, "loss": 2.2952, "step": 519090 }, { "epoch": 0.91, "learning_rate": 4.737598398420743e-06, "loss": 2.2439, "step": 519100 }, { "epoch": 0.91, "learning_rate": 4.736726458493916e-06, "loss": 2.3159, "step": 519110 }, { "epoch": 0.91, "learning_rate": 4.73585451856709e-06, "loss": 2.2118, "step": 519120 }, { "epoch": 0.91, "learning_rate": 4.7349825786402626e-06, "loss": 2.2365, "step": 519130 }, { "epoch": 0.91, "learning_rate": 4.7341106387134355e-06, "loss": 2.306, "step": 519140 }, { "epoch": 0.91, "learning_rate": 4.733238698786608e-06, "loss": 2.3649, "step": 519150 }, { "epoch": 0.91, "learning_rate": 4.732366758859782e-06, "loss": 2.2981, "step": 519160 }, { "epoch": 0.91, "learning_rate": 4.731494818932955e-06, "loss": 2.1671, "step": 519170 }, { "epoch": 0.91, "learning_rate": 4.730622879006128e-06, "loss": 2.2176, "step": 519180 }, { "epoch": 0.91, "learning_rate": 4.729750939079301e-06, "loss": 2.1458, "step": 519190 }, { "epoch": 0.91, "learning_rate": 4.728878999152475e-06, "loss": 2.2731, "step": 519200 }, { "epoch": 0.91, "learning_rate": 4.728007059225648e-06, "loss": 2.1592, "step": 519210 }, { "epoch": 0.91, "learning_rate": 4.7271351192988206e-06, "loss": 2.2031, "step": 519220 }, { "epoch": 0.91, "learning_rate": 4.726263179371994e-06, "loss": 2.391, "step": 519230 }, { "epoch": 0.91, "learning_rate": 4.725391239445168e-06, "loss": 2.2574, "step": 519240 }, { "epoch": 0.91, "learning_rate": 4.724519299518341e-06, "loss": 2.2277, "step": 519250 }, { "epoch": 0.91, "learning_rate": 4.723647359591514e-06, "loss": 2.2207, "step": 519260 }, { "epoch": 0.91, "learning_rate": 4.722775419664687e-06, "loss": 2.2143, "step": 519270 }, { "epoch": 0.91, "learning_rate": 4.721903479737861e-06, "loss": 2.2796, "step": 519280 }, { "epoch": 0.91, "learning_rate": 4.7210315398110336e-06, "loss": 2.2805, "step": 519290 }, { "epoch": 0.91, "learning_rate": 4.7201595998842065e-06, "loss": 2.347, "step": 519300 }, { "epoch": 0.91, "learning_rate": 4.719287659957379e-06, "loss": 2.2684, "step": 519310 }, { "epoch": 0.91, "learning_rate": 4.718415720030553e-06, "loss": 2.2481, "step": 519320 }, { "epoch": 0.91, "learning_rate": 4.717543780103726e-06, "loss": 2.2519, "step": 519330 }, { "epoch": 0.91, "learning_rate": 4.716671840176899e-06, "loss": 2.2758, "step": 519340 }, { "epoch": 0.91, "learning_rate": 4.715799900250072e-06, "loss": 2.3208, "step": 519350 }, { "epoch": 0.91, "learning_rate": 4.714927960323246e-06, "loss": 2.1506, "step": 519360 }, { "epoch": 0.91, "learning_rate": 4.7140560203964195e-06, "loss": 2.198, "step": 519370 }, { "epoch": 0.91, "learning_rate": 4.713184080469592e-06, "loss": 2.222, "step": 519380 }, { "epoch": 0.91, "learning_rate": 4.712312140542765e-06, "loss": 2.2739, "step": 519390 }, { "epoch": 0.91, "learning_rate": 4.711440200615939e-06, "loss": 2.3377, "step": 519400 }, { "epoch": 0.91, "learning_rate": 4.710568260689112e-06, "loss": 2.3312, "step": 519410 }, { "epoch": 0.91, "learning_rate": 4.709696320762285e-06, "loss": 2.1592, "step": 519420 }, { "epoch": 0.91, "learning_rate": 4.708824380835458e-06, "loss": 2.2814, "step": 519430 }, { "epoch": 0.91, "learning_rate": 4.707952440908632e-06, "loss": 2.268, "step": 519440 }, { "epoch": 0.91, "learning_rate": 4.7070805009818046e-06, "loss": 2.2954, "step": 519450 }, { "epoch": 0.91, "learning_rate": 4.7062085610549775e-06, "loss": 2.2689, "step": 519460 }, { "epoch": 0.91, "learning_rate": 4.70533662112815e-06, "loss": 2.2415, "step": 519470 }, { "epoch": 0.91, "learning_rate": 4.704464681201324e-06, "loss": 2.234, "step": 519480 }, { "epoch": 0.91, "learning_rate": 4.703592741274497e-06, "loss": 2.2008, "step": 519490 }, { "epoch": 0.91, "learning_rate": 4.702720801347671e-06, "loss": 2.1912, "step": 519500 }, { "epoch": 0.91, "learning_rate": 4.701848861420844e-06, "loss": 2.2668, "step": 519510 }, { "epoch": 0.91, "learning_rate": 4.7009769214940176e-06, "loss": 2.2157, "step": 519520 }, { "epoch": 0.91, "learning_rate": 4.7001049815671905e-06, "loss": 2.291, "step": 519530 }, { "epoch": 0.91, "learning_rate": 4.699233041640363e-06, "loss": 2.2927, "step": 519540 }, { "epoch": 0.91, "learning_rate": 4.698361101713536e-06, "loss": 2.3232, "step": 519550 }, { "epoch": 0.91, "learning_rate": 4.69748916178671e-06, "loss": 2.2606, "step": 519560 }, { "epoch": 0.91, "learning_rate": 4.696617221859883e-06, "loss": 2.3043, "step": 519570 }, { "epoch": 0.91, "learning_rate": 4.695745281933056e-06, "loss": 2.23, "step": 519580 }, { "epoch": 0.91, "learning_rate": 4.694873342006229e-06, "loss": 2.3128, "step": 519590 }, { "epoch": 0.91, "learning_rate": 4.694001402079403e-06, "loss": 2.1875, "step": 519600 }, { "epoch": 0.91, "learning_rate": 4.6931294621525756e-06, "loss": 2.2819, "step": 519610 }, { "epoch": 0.91, "learning_rate": 4.6922575222257485e-06, "loss": 2.1714, "step": 519620 }, { "epoch": 0.91, "learning_rate": 4.691385582298922e-06, "loss": 2.2599, "step": 519630 }, { "epoch": 0.91, "learning_rate": 4.690513642372096e-06, "loss": 2.2069, "step": 519640 }, { "epoch": 0.91, "learning_rate": 4.689641702445269e-06, "loss": 2.2624, "step": 519650 }, { "epoch": 0.91, "learning_rate": 4.688769762518442e-06, "loss": 2.2246, "step": 519660 }, { "epoch": 0.91, "learning_rate": 4.687897822591615e-06, "loss": 2.2216, "step": 519670 }, { "epoch": 0.91, "learning_rate": 4.6870258826647886e-06, "loss": 2.2127, "step": 519680 }, { "epoch": 0.91, "learning_rate": 4.6861539427379615e-06, "loss": 2.2759, "step": 519690 }, { "epoch": 0.91, "learning_rate": 4.685282002811134e-06, "loss": 2.2155, "step": 519700 }, { "epoch": 0.91, "learning_rate": 4.684410062884307e-06, "loss": 2.2671, "step": 519710 }, { "epoch": 0.91, "learning_rate": 4.683538122957481e-06, "loss": 2.2637, "step": 519720 }, { "epoch": 0.91, "learning_rate": 4.682666183030654e-06, "loss": 2.2963, "step": 519730 }, { "epoch": 0.91, "learning_rate": 4.681794243103827e-06, "loss": 2.1704, "step": 519740 }, { "epoch": 0.91, "learning_rate": 4.680922303177e-06, "loss": 2.2044, "step": 519750 }, { "epoch": 0.91, "learning_rate": 4.680050363250174e-06, "loss": 2.1472, "step": 519760 }, { "epoch": 0.91, "learning_rate": 4.679178423323347e-06, "loss": 2.2598, "step": 519770 }, { "epoch": 0.91, "learning_rate": 4.67830648339652e-06, "loss": 2.1935, "step": 519780 }, { "epoch": 0.91, "learning_rate": 4.677434543469693e-06, "loss": 2.2581, "step": 519790 }, { "epoch": 0.91, "learning_rate": 4.676562603542867e-06, "loss": 2.1783, "step": 519800 }, { "epoch": 0.91, "learning_rate": 4.67569066361604e-06, "loss": 2.273, "step": 519810 }, { "epoch": 0.91, "learning_rate": 4.674818723689213e-06, "loss": 2.3338, "step": 519820 }, { "epoch": 0.91, "learning_rate": 4.673946783762386e-06, "loss": 2.3115, "step": 519830 }, { "epoch": 0.91, "learning_rate": 4.6730748438355596e-06, "loss": 2.1326, "step": 519840 }, { "epoch": 0.91, "learning_rate": 4.6722029039087325e-06, "loss": 2.2006, "step": 519850 }, { "epoch": 0.91, "learning_rate": 4.671330963981905e-06, "loss": 2.2574, "step": 519860 }, { "epoch": 0.91, "learning_rate": 4.670459024055078e-06, "loss": 2.3322, "step": 519870 }, { "epoch": 0.91, "learning_rate": 4.669587084128252e-06, "loss": 2.245, "step": 519880 }, { "epoch": 0.91, "learning_rate": 4.668715144201425e-06, "loss": 2.2983, "step": 519890 }, { "epoch": 0.91, "learning_rate": 4.667843204274599e-06, "loss": 2.159, "step": 519900 }, { "epoch": 0.91, "learning_rate": 4.666971264347772e-06, "loss": 2.3708, "step": 519910 }, { "epoch": 0.91, "learning_rate": 4.6660993244209455e-06, "loss": 2.3166, "step": 519920 }, { "epoch": 0.91, "learning_rate": 4.665227384494118e-06, "loss": 2.2799, "step": 519930 }, { "epoch": 0.91, "learning_rate": 4.664355444567291e-06, "loss": 2.2539, "step": 519940 }, { "epoch": 0.91, "learning_rate": 4.663483504640464e-06, "loss": 2.3011, "step": 519950 }, { "epoch": 0.91, "learning_rate": 4.662611564713638e-06, "loss": 2.2846, "step": 519960 }, { "epoch": 0.91, "learning_rate": 4.661739624786811e-06, "loss": 2.3012, "step": 519970 }, { "epoch": 0.91, "learning_rate": 4.660867684859984e-06, "loss": 2.2712, "step": 519980 }, { "epoch": 0.91, "learning_rate": 4.659995744933157e-06, "loss": 2.3342, "step": 519990 }, { "epoch": 0.91, "learning_rate": 4.6591238050063306e-06, "loss": 2.1685, "step": 520000 }, { "epoch": 0.91, "learning_rate": 4.6582518650795035e-06, "loss": 2.3016, "step": 520010 }, { "epoch": 0.91, "learning_rate": 4.657379925152676e-06, "loss": 2.2537, "step": 520020 }, { "epoch": 0.91, "learning_rate": 4.65650798522585e-06, "loss": 2.3285, "step": 520030 }, { "epoch": 0.91, "learning_rate": 4.655636045299024e-06, "loss": 2.1658, "step": 520040 }, { "epoch": 0.91, "learning_rate": 4.654764105372197e-06, "loss": 2.35, "step": 520050 }, { "epoch": 0.91, "learning_rate": 4.65389216544537e-06, "loss": 2.3797, "step": 520060 }, { "epoch": 0.91, "learning_rate": 4.653020225518543e-06, "loss": 2.2385, "step": 520070 }, { "epoch": 0.91, "learning_rate": 4.6521482855917165e-06, "loss": 2.1436, "step": 520080 }, { "epoch": 0.91, "learning_rate": 4.651276345664889e-06, "loss": 2.3222, "step": 520090 }, { "epoch": 0.91, "learning_rate": 4.650404405738062e-06, "loss": 2.2467, "step": 520100 }, { "epoch": 0.91, "learning_rate": 4.649532465811235e-06, "loss": 2.2107, "step": 520110 }, { "epoch": 0.91, "learning_rate": 4.648660525884409e-06, "loss": 2.1603, "step": 520120 }, { "epoch": 0.91, "learning_rate": 4.647788585957582e-06, "loss": 2.1369, "step": 520130 }, { "epoch": 0.91, "learning_rate": 4.646916646030755e-06, "loss": 2.2594, "step": 520140 }, { "epoch": 0.91, "learning_rate": 4.646044706103928e-06, "loss": 2.4254, "step": 520150 }, { "epoch": 0.91, "learning_rate": 4.6451727661771016e-06, "loss": 2.2682, "step": 520160 }, { "epoch": 0.91, "learning_rate": 4.644300826250275e-06, "loss": 2.2347, "step": 520170 }, { "epoch": 0.91, "learning_rate": 4.643428886323448e-06, "loss": 2.2949, "step": 520180 }, { "epoch": 0.91, "learning_rate": 4.642556946396621e-06, "loss": 2.1521, "step": 520190 }, { "epoch": 0.91, "learning_rate": 4.641685006469795e-06, "loss": 2.315, "step": 520200 }, { "epoch": 0.91, "learning_rate": 4.640813066542968e-06, "loss": 2.2884, "step": 520210 }, { "epoch": 0.91, "learning_rate": 4.639941126616141e-06, "loss": 2.2692, "step": 520220 }, { "epoch": 0.91, "learning_rate": 4.639069186689314e-06, "loss": 2.2676, "step": 520230 }, { "epoch": 0.91, "learning_rate": 4.6381972467624875e-06, "loss": 2.203, "step": 520240 }, { "epoch": 0.91, "learning_rate": 4.63732530683566e-06, "loss": 2.2797, "step": 520250 }, { "epoch": 0.91, "learning_rate": 4.636453366908833e-06, "loss": 2.2721, "step": 520260 }, { "epoch": 0.91, "learning_rate": 4.635581426982006e-06, "loss": 2.2585, "step": 520270 }, { "epoch": 0.91, "learning_rate": 4.63470948705518e-06, "loss": 2.2067, "step": 520280 }, { "epoch": 0.91, "learning_rate": 4.633837547128353e-06, "loss": 2.3015, "step": 520290 }, { "epoch": 0.91, "learning_rate": 4.632965607201527e-06, "loss": 2.29, "step": 520300 }, { "epoch": 0.91, "learning_rate": 4.6320936672747e-06, "loss": 2.2389, "step": 520310 }, { "epoch": 0.91, "learning_rate": 4.631221727347873e-06, "loss": 2.1654, "step": 520320 }, { "epoch": 0.91, "learning_rate": 4.630349787421046e-06, "loss": 2.3011, "step": 520330 }, { "epoch": 0.91, "learning_rate": 4.629477847494219e-06, "loss": 2.2714, "step": 520340 }, { "epoch": 0.91, "learning_rate": 4.628605907567392e-06, "loss": 2.2411, "step": 520350 }, { "epoch": 0.91, "learning_rate": 4.627733967640566e-06, "loss": 2.3538, "step": 520360 }, { "epoch": 0.91, "learning_rate": 4.626862027713739e-06, "loss": 2.2988, "step": 520370 }, { "epoch": 0.91, "learning_rate": 4.625990087786912e-06, "loss": 2.2913, "step": 520380 }, { "epoch": 0.91, "learning_rate": 4.625118147860085e-06, "loss": 2.3293, "step": 520390 }, { "epoch": 0.91, "learning_rate": 4.6242462079332585e-06, "loss": 2.1829, "step": 520400 }, { "epoch": 0.91, "learning_rate": 4.623374268006431e-06, "loss": 2.3432, "step": 520410 }, { "epoch": 0.91, "learning_rate": 4.622502328079604e-06, "loss": 2.3285, "step": 520420 }, { "epoch": 0.91, "learning_rate": 4.621630388152778e-06, "loss": 2.3599, "step": 520430 }, { "epoch": 0.91, "learning_rate": 4.620758448225952e-06, "loss": 2.2147, "step": 520440 }, { "epoch": 0.91, "learning_rate": 4.619886508299125e-06, "loss": 2.1874, "step": 520450 }, { "epoch": 0.91, "learning_rate": 4.619014568372298e-06, "loss": 2.2609, "step": 520460 }, { "epoch": 0.91, "learning_rate": 4.618142628445471e-06, "loss": 2.2766, "step": 520470 }, { "epoch": 0.91, "learning_rate": 4.617270688518644e-06, "loss": 2.244, "step": 520480 }, { "epoch": 0.91, "learning_rate": 4.616398748591817e-06, "loss": 2.1716, "step": 520490 }, { "epoch": 0.91, "learning_rate": 4.61552680866499e-06, "loss": 2.2857, "step": 520500 }, { "epoch": 0.91, "learning_rate": 4.614654868738163e-06, "loss": 2.1742, "step": 520510 }, { "epoch": 0.91, "learning_rate": 4.613782928811337e-06, "loss": 2.2265, "step": 520520 }, { "epoch": 0.91, "learning_rate": 4.61291098888451e-06, "loss": 2.2155, "step": 520530 }, { "epoch": 0.91, "learning_rate": 4.612039048957683e-06, "loss": 2.2668, "step": 520540 }, { "epoch": 0.91, "learning_rate": 4.611167109030856e-06, "loss": 2.1951, "step": 520550 }, { "epoch": 0.91, "learning_rate": 4.61029516910403e-06, "loss": 2.1697, "step": 520560 }, { "epoch": 0.91, "learning_rate": 4.609423229177203e-06, "loss": 2.1701, "step": 520570 }, { "epoch": 0.91, "learning_rate": 4.608551289250376e-06, "loss": 2.2188, "step": 520580 }, { "epoch": 0.91, "learning_rate": 4.607679349323549e-06, "loss": 2.3005, "step": 520590 }, { "epoch": 0.91, "learning_rate": 4.606807409396723e-06, "loss": 2.3291, "step": 520600 }, { "epoch": 0.91, "learning_rate": 4.605935469469896e-06, "loss": 2.2166, "step": 520610 }, { "epoch": 0.91, "learning_rate": 4.605063529543069e-06, "loss": 2.2286, "step": 520620 }, { "epoch": 0.91, "learning_rate": 4.604191589616242e-06, "loss": 2.1674, "step": 520630 }, { "epoch": 0.91, "learning_rate": 4.603319649689415e-06, "loss": 2.2672, "step": 520640 }, { "epoch": 0.91, "learning_rate": 4.602447709762588e-06, "loss": 2.2692, "step": 520650 }, { "epoch": 0.91, "learning_rate": 4.601575769835761e-06, "loss": 2.3595, "step": 520660 }, { "epoch": 0.91, "learning_rate": 4.600703829908934e-06, "loss": 2.2824, "step": 520670 }, { "epoch": 0.91, "learning_rate": 4.599831889982108e-06, "loss": 2.3147, "step": 520680 }, { "epoch": 0.91, "learning_rate": 4.598959950055281e-06, "loss": 2.212, "step": 520690 }, { "epoch": 0.91, "learning_rate": 4.598088010128455e-06, "loss": 2.2772, "step": 520700 }, { "epoch": 0.91, "learning_rate": 4.5972160702016276e-06, "loss": 2.2945, "step": 520710 }, { "epoch": 0.91, "learning_rate": 4.596344130274801e-06, "loss": 2.2449, "step": 520720 }, { "epoch": 0.91, "learning_rate": 4.595472190347974e-06, "loss": 2.2391, "step": 520730 }, { "epoch": 0.91, "learning_rate": 4.594600250421147e-06, "loss": 2.3061, "step": 520740 }, { "epoch": 0.91, "learning_rate": 4.59372831049432e-06, "loss": 2.3927, "step": 520750 }, { "epoch": 0.91, "learning_rate": 4.592856370567494e-06, "loss": 2.1692, "step": 520760 }, { "epoch": 0.91, "learning_rate": 4.591984430640667e-06, "loss": 2.1208, "step": 520770 }, { "epoch": 0.91, "learning_rate": 4.59111249071384e-06, "loss": 2.3644, "step": 520780 }, { "epoch": 0.91, "learning_rate": 4.590240550787013e-06, "loss": 2.1738, "step": 520790 }, { "epoch": 0.91, "learning_rate": 4.589368610860186e-06, "loss": 2.2213, "step": 520800 }, { "epoch": 0.91, "learning_rate": 4.588496670933359e-06, "loss": 2.2286, "step": 520810 }, { "epoch": 0.91, "learning_rate": 4.587624731006532e-06, "loss": 2.2682, "step": 520820 }, { "epoch": 0.91, "learning_rate": 4.586752791079706e-06, "loss": 2.2426, "step": 520830 }, { "epoch": 0.91, "learning_rate": 4.58588085115288e-06, "loss": 2.3903, "step": 520840 }, { "epoch": 0.91, "learning_rate": 4.585008911226053e-06, "loss": 2.326, "step": 520850 }, { "epoch": 0.91, "learning_rate": 4.584136971299226e-06, "loss": 2.2706, "step": 520860 }, { "epoch": 0.91, "learning_rate": 4.583265031372399e-06, "loss": 2.2593, "step": 520870 }, { "epoch": 0.91, "learning_rate": 4.582393091445572e-06, "loss": 2.2249, "step": 520880 }, { "epoch": 0.91, "learning_rate": 4.581521151518745e-06, "loss": 2.3073, "step": 520890 }, { "epoch": 0.91, "learning_rate": 4.580649211591918e-06, "loss": 2.2803, "step": 520900 }, { "epoch": 0.91, "learning_rate": 4.579777271665091e-06, "loss": 2.1851, "step": 520910 }, { "epoch": 0.91, "learning_rate": 4.578905331738265e-06, "loss": 2.3609, "step": 520920 }, { "epoch": 0.91, "learning_rate": 4.578033391811438e-06, "loss": 2.2761, "step": 520930 }, { "epoch": 0.91, "learning_rate": 4.577161451884611e-06, "loss": 2.2159, "step": 520940 }, { "epoch": 0.91, "learning_rate": 4.576289511957784e-06, "loss": 2.2548, "step": 520950 }, { "epoch": 0.91, "learning_rate": 4.575417572030958e-06, "loss": 2.2635, "step": 520960 }, { "epoch": 0.91, "learning_rate": 4.574545632104131e-06, "loss": 2.2066, "step": 520970 }, { "epoch": 0.91, "learning_rate": 4.573673692177304e-06, "loss": 2.2074, "step": 520980 }, { "epoch": 0.91, "learning_rate": 4.572801752250477e-06, "loss": 2.3085, "step": 520990 }, { "epoch": 0.91, "learning_rate": 4.571929812323651e-06, "loss": 2.3399, "step": 521000 }, { "epoch": 0.91, "learning_rate": 4.571057872396824e-06, "loss": 2.2008, "step": 521010 }, { "epoch": 0.91, "learning_rate": 4.570185932469997e-06, "loss": 2.2416, "step": 521020 }, { "epoch": 0.91, "learning_rate": 4.56931399254317e-06, "loss": 2.2755, "step": 521030 }, { "epoch": 0.91, "learning_rate": 4.568442052616343e-06, "loss": 2.1817, "step": 521040 }, { "epoch": 0.91, "learning_rate": 4.567570112689516e-06, "loss": 2.2879, "step": 521050 }, { "epoch": 0.91, "learning_rate": 4.566698172762689e-06, "loss": 2.2524, "step": 521060 }, { "epoch": 0.91, "learning_rate": 4.565826232835862e-06, "loss": 2.1722, "step": 521070 }, { "epoch": 0.91, "learning_rate": 4.564954292909036e-06, "loss": 2.1678, "step": 521080 }, { "epoch": 0.91, "learning_rate": 4.564082352982209e-06, "loss": 2.3102, "step": 521090 }, { "epoch": 0.91, "learning_rate": 4.563210413055383e-06, "loss": 2.2194, "step": 521100 }, { "epoch": 0.91, "learning_rate": 4.5623384731285555e-06, "loss": 2.2301, "step": 521110 }, { "epoch": 0.91, "learning_rate": 4.561466533201729e-06, "loss": 2.3635, "step": 521120 }, { "epoch": 0.91, "learning_rate": 4.560594593274902e-06, "loss": 2.3131, "step": 521130 }, { "epoch": 0.91, "learning_rate": 4.559722653348075e-06, "loss": 2.3232, "step": 521140 }, { "epoch": 0.91, "learning_rate": 4.558850713421248e-06, "loss": 2.2839, "step": 521150 }, { "epoch": 0.91, "learning_rate": 4.557978773494422e-06, "loss": 2.1884, "step": 521160 }, { "epoch": 0.91, "learning_rate": 4.557106833567595e-06, "loss": 2.3465, "step": 521170 }, { "epoch": 0.91, "learning_rate": 4.556234893640768e-06, "loss": 2.1999, "step": 521180 }, { "epoch": 0.91, "learning_rate": 4.555362953713941e-06, "loss": 2.348, "step": 521190 }, { "epoch": 0.91, "learning_rate": 4.554491013787114e-06, "loss": 2.2628, "step": 521200 }, { "epoch": 0.91, "learning_rate": 4.553619073860287e-06, "loss": 2.1762, "step": 521210 }, { "epoch": 0.91, "learning_rate": 4.55274713393346e-06, "loss": 2.3473, "step": 521220 }, { "epoch": 0.91, "learning_rate": 4.551875194006634e-06, "loss": 2.3311, "step": 521230 }, { "epoch": 0.91, "learning_rate": 4.551003254079808e-06, "loss": 2.2614, "step": 521240 }, { "epoch": 0.91, "learning_rate": 4.550131314152981e-06, "loss": 2.3464, "step": 521250 }, { "epoch": 0.91, "learning_rate": 4.549259374226154e-06, "loss": 2.2444, "step": 521260 }, { "epoch": 0.91, "learning_rate": 4.5483874342993265e-06, "loss": 2.3506, "step": 521270 }, { "epoch": 0.91, "learning_rate": 4.5475154943725e-06, "loss": 2.2469, "step": 521280 }, { "epoch": 0.91, "learning_rate": 4.546643554445673e-06, "loss": 2.2461, "step": 521290 }, { "epoch": 0.91, "learning_rate": 4.545771614518846e-06, "loss": 2.2721, "step": 521300 }, { "epoch": 0.91, "learning_rate": 4.544899674592019e-06, "loss": 2.1982, "step": 521310 }, { "epoch": 0.91, "learning_rate": 4.544027734665193e-06, "loss": 2.3201, "step": 521320 }, { "epoch": 0.91, "learning_rate": 4.543155794738366e-06, "loss": 2.2216, "step": 521330 }, { "epoch": 0.91, "learning_rate": 4.542283854811539e-06, "loss": 2.229, "step": 521340 }, { "epoch": 0.91, "learning_rate": 4.5414119148847124e-06, "loss": 2.2788, "step": 521350 }, { "epoch": 0.91, "learning_rate": 4.540539974957886e-06, "loss": 2.2437, "step": 521360 }, { "epoch": 0.91, "learning_rate": 4.539668035031059e-06, "loss": 2.2655, "step": 521370 }, { "epoch": 0.91, "learning_rate": 4.538796095104232e-06, "loss": 2.2818, "step": 521380 }, { "epoch": 0.91, "learning_rate": 4.537924155177405e-06, "loss": 2.1202, "step": 521390 }, { "epoch": 0.91, "learning_rate": 4.537052215250579e-06, "loss": 2.3304, "step": 521400 }, { "epoch": 0.91, "learning_rate": 4.536180275323752e-06, "loss": 2.2397, "step": 521410 }, { "epoch": 0.91, "learning_rate": 4.535308335396925e-06, "loss": 2.2682, "step": 521420 }, { "epoch": 0.91, "learning_rate": 4.5344363954700975e-06, "loss": 2.1234, "step": 521430 }, { "epoch": 0.91, "learning_rate": 4.533564455543271e-06, "loss": 2.197, "step": 521440 }, { "epoch": 0.91, "learning_rate": 4.532692515616444e-06, "loss": 2.2653, "step": 521450 }, { "epoch": 0.91, "learning_rate": 4.531820575689617e-06, "loss": 2.2121, "step": 521460 }, { "epoch": 0.91, "learning_rate": 4.53094863576279e-06, "loss": 2.2759, "step": 521470 }, { "epoch": 0.91, "learning_rate": 4.530076695835964e-06, "loss": 2.2123, "step": 521480 }, { "epoch": 0.91, "learning_rate": 4.529204755909137e-06, "loss": 2.2254, "step": 521490 }, { "epoch": 0.91, "learning_rate": 4.5283328159823105e-06, "loss": 2.2612, "step": 521500 }, { "epoch": 0.91, "learning_rate": 4.5274608760554834e-06, "loss": 2.2731, "step": 521510 }, { "epoch": 0.91, "learning_rate": 4.526588936128657e-06, "loss": 2.21, "step": 521520 }, { "epoch": 0.91, "learning_rate": 4.52571699620183e-06, "loss": 2.3597, "step": 521530 }, { "epoch": 0.91, "learning_rate": 4.524845056275003e-06, "loss": 2.2603, "step": 521540 }, { "epoch": 0.91, "learning_rate": 4.523973116348176e-06, "loss": 2.2669, "step": 521550 }, { "epoch": 0.91, "learning_rate": 4.52310117642135e-06, "loss": 2.2558, "step": 521560 }, { "epoch": 0.91, "learning_rate": 4.522229236494523e-06, "loss": 2.2924, "step": 521570 }, { "epoch": 0.91, "learning_rate": 4.521357296567696e-06, "loss": 2.2186, "step": 521580 }, { "epoch": 0.91, "learning_rate": 4.5204853566408685e-06, "loss": 2.376, "step": 521590 }, { "epoch": 0.91, "learning_rate": 4.519613416714042e-06, "loss": 2.2943, "step": 521600 }, { "epoch": 0.91, "learning_rate": 4.518741476787215e-06, "loss": 2.2836, "step": 521610 }, { "epoch": 0.91, "learning_rate": 4.517869536860388e-06, "loss": 2.2854, "step": 521620 }, { "epoch": 0.91, "learning_rate": 4.516997596933562e-06, "loss": 2.2732, "step": 521630 }, { "epoch": 0.91, "learning_rate": 4.516125657006736e-06, "loss": 2.2073, "step": 521640 }, { "epoch": 0.91, "learning_rate": 4.515253717079909e-06, "loss": 2.2786, "step": 521650 }, { "epoch": 0.91, "learning_rate": 4.5143817771530815e-06, "loss": 2.1159, "step": 521660 }, { "epoch": 0.91, "learning_rate": 4.5135098372262544e-06, "loss": 2.2905, "step": 521670 }, { "epoch": 0.91, "learning_rate": 4.512637897299428e-06, "loss": 2.2582, "step": 521680 }, { "epoch": 0.91, "learning_rate": 4.511765957372601e-06, "loss": 2.3724, "step": 521690 }, { "epoch": 0.91, "learning_rate": 4.510894017445774e-06, "loss": 2.2298, "step": 521700 }, { "epoch": 0.91, "learning_rate": 4.510022077518947e-06, "loss": 2.4006, "step": 521710 }, { "epoch": 0.91, "learning_rate": 4.509150137592121e-06, "loss": 2.1767, "step": 521720 }, { "epoch": 0.91, "learning_rate": 4.508278197665294e-06, "loss": 2.2982, "step": 521730 }, { "epoch": 0.91, "learning_rate": 4.507406257738467e-06, "loss": 2.2558, "step": 521740 }, { "epoch": 0.91, "learning_rate": 4.50653431781164e-06, "loss": 2.1785, "step": 521750 }, { "epoch": 0.91, "learning_rate": 4.505662377884814e-06, "loss": 2.2843, "step": 521760 }, { "epoch": 0.91, "learning_rate": 4.504790437957987e-06, "loss": 2.2004, "step": 521770 }, { "epoch": 0.91, "learning_rate": 4.50391849803116e-06, "loss": 2.2653, "step": 521780 }, { "epoch": 0.91, "learning_rate": 4.503046558104333e-06, "loss": 2.24, "step": 521790 }, { "epoch": 0.91, "learning_rate": 4.502174618177507e-06, "loss": 2.2728, "step": 521800 }, { "epoch": 0.91, "learning_rate": 4.50130267825068e-06, "loss": 2.2372, "step": 521810 }, { "epoch": 0.91, "learning_rate": 4.5004307383238525e-06, "loss": 2.2197, "step": 521820 }, { "epoch": 0.91, "learning_rate": 4.4995587983970254e-06, "loss": 2.2801, "step": 521830 }, { "epoch": 0.91, "learning_rate": 4.498686858470199e-06, "loss": 2.3318, "step": 521840 }, { "epoch": 0.91, "learning_rate": 4.497814918543372e-06, "loss": 2.1956, "step": 521850 }, { "epoch": 0.91, "learning_rate": 4.496942978616545e-06, "loss": 2.246, "step": 521860 }, { "epoch": 0.91, "learning_rate": 4.496071038689719e-06, "loss": 2.2857, "step": 521870 }, { "epoch": 0.91, "learning_rate": 4.495199098762892e-06, "loss": 2.2168, "step": 521880 }, { "epoch": 0.91, "learning_rate": 4.494327158836065e-06, "loss": 2.2831, "step": 521890 }, { "epoch": 0.91, "learning_rate": 4.4934552189092384e-06, "loss": 2.2514, "step": 521900 }, { "epoch": 0.91, "learning_rate": 4.492583278982411e-06, "loss": 2.388, "step": 521910 }, { "epoch": 0.91, "learning_rate": 4.491711339055585e-06, "loss": 2.2675, "step": 521920 }, { "epoch": 0.91, "learning_rate": 4.490839399128758e-06, "loss": 2.2358, "step": 521930 }, { "epoch": 0.91, "learning_rate": 4.489967459201931e-06, "loss": 2.4247, "step": 521940 }, { "epoch": 0.91, "learning_rate": 4.489095519275104e-06, "loss": 2.3451, "step": 521950 }, { "epoch": 0.91, "learning_rate": 4.488223579348278e-06, "loss": 2.1031, "step": 521960 }, { "epoch": 0.91, "learning_rate": 4.487351639421451e-06, "loss": 2.2714, "step": 521970 }, { "epoch": 0.91, "learning_rate": 4.4864796994946235e-06, "loss": 2.2105, "step": 521980 }, { "epoch": 0.91, "learning_rate": 4.485607759567797e-06, "loss": 2.2386, "step": 521990 }, { "epoch": 0.91, "learning_rate": 4.48473581964097e-06, "loss": 2.2191, "step": 522000 }, { "epoch": 0.91, "learning_rate": 4.483863879714143e-06, "loss": 2.3744, "step": 522010 }, { "epoch": 0.91, "learning_rate": 4.482991939787316e-06, "loss": 2.2134, "step": 522020 }, { "epoch": 0.91, "learning_rate": 4.48211999986049e-06, "loss": 2.2435, "step": 522030 }, { "epoch": 0.91, "learning_rate": 4.481248059933664e-06, "loss": 2.3294, "step": 522040 }, { "epoch": 0.91, "learning_rate": 4.4803761200068365e-06, "loss": 2.378, "step": 522050 }, { "epoch": 0.91, "learning_rate": 4.4795041800800094e-06, "loss": 2.2273, "step": 522060 }, { "epoch": 0.91, "learning_rate": 4.478632240153182e-06, "loss": 2.2501, "step": 522070 }, { "epoch": 0.91, "learning_rate": 4.477760300226356e-06, "loss": 2.2528, "step": 522080 }, { "epoch": 0.91, "learning_rate": 4.476888360299529e-06, "loss": 2.2815, "step": 522090 }, { "epoch": 0.91, "learning_rate": 4.476016420372702e-06, "loss": 2.2052, "step": 522100 }, { "epoch": 0.91, "learning_rate": 4.475144480445875e-06, "loss": 2.3264, "step": 522110 }, { "epoch": 0.91, "learning_rate": 4.474272540519049e-06, "loss": 2.1876, "step": 522120 }, { "epoch": 0.91, "learning_rate": 4.473400600592222e-06, "loss": 2.2572, "step": 522130 }, { "epoch": 0.91, "learning_rate": 4.4725286606653945e-06, "loss": 2.246, "step": 522140 }, { "epoch": 0.91, "learning_rate": 4.471656720738568e-06, "loss": 2.2393, "step": 522150 }, { "epoch": 0.91, "learning_rate": 4.470784780811742e-06, "loss": 2.23, "step": 522160 }, { "epoch": 0.91, "learning_rate": 4.469912840884915e-06, "loss": 2.3891, "step": 522170 }, { "epoch": 0.91, "learning_rate": 4.469040900958088e-06, "loss": 2.2913, "step": 522180 }, { "epoch": 0.91, "learning_rate": 4.468168961031261e-06, "loss": 2.3577, "step": 522190 }, { "epoch": 0.91, "learning_rate": 4.467297021104435e-06, "loss": 2.3611, "step": 522200 }, { "epoch": 0.91, "learning_rate": 4.4664250811776075e-06, "loss": 2.2036, "step": 522210 }, { "epoch": 0.91, "learning_rate": 4.4655531412507804e-06, "loss": 2.2824, "step": 522220 }, { "epoch": 0.91, "learning_rate": 4.464681201323953e-06, "loss": 2.2213, "step": 522230 }, { "epoch": 0.91, "learning_rate": 4.463809261397127e-06, "loss": 2.2571, "step": 522240 }, { "epoch": 0.91, "learning_rate": 4.4629373214703e-06, "loss": 2.3081, "step": 522250 }, { "epoch": 0.91, "learning_rate": 4.462065381543473e-06, "loss": 2.2632, "step": 522260 }, { "epoch": 0.91, "learning_rate": 4.461193441616647e-06, "loss": 2.2238, "step": 522270 }, { "epoch": 0.91, "learning_rate": 4.46032150168982e-06, "loss": 2.2512, "step": 522280 }, { "epoch": 0.91, "learning_rate": 4.4594495617629934e-06, "loss": 2.1427, "step": 522290 }, { "epoch": 0.91, "learning_rate": 4.458577621836166e-06, "loss": 2.2568, "step": 522300 }, { "epoch": 0.91, "learning_rate": 4.457705681909339e-06, "loss": 2.2624, "step": 522310 }, { "epoch": 0.91, "learning_rate": 4.456833741982513e-06, "loss": 2.2634, "step": 522320 }, { "epoch": 0.91, "learning_rate": 4.455961802055686e-06, "loss": 2.3088, "step": 522330 }, { "epoch": 0.91, "learning_rate": 4.455089862128859e-06, "loss": 2.2338, "step": 522340 }, { "epoch": 0.91, "learning_rate": 4.454217922202032e-06, "loss": 2.24, "step": 522350 }, { "epoch": 0.91, "learning_rate": 4.453345982275206e-06, "loss": 2.2797, "step": 522360 }, { "epoch": 0.91, "learning_rate": 4.4524740423483785e-06, "loss": 2.2457, "step": 522370 }, { "epoch": 0.91, "learning_rate": 4.4516021024215514e-06, "loss": 2.2637, "step": 522380 }, { "epoch": 0.91, "learning_rate": 4.450730162494725e-06, "loss": 2.3, "step": 522390 }, { "epoch": 0.91, "learning_rate": 4.449858222567898e-06, "loss": 2.1743, "step": 522400 }, { "epoch": 0.91, "learning_rate": 4.448986282641071e-06, "loss": 2.246, "step": 522410 }, { "epoch": 0.91, "learning_rate": 4.448114342714244e-06, "loss": 2.2834, "step": 522420 }, { "epoch": 0.91, "learning_rate": 4.447242402787418e-06, "loss": 2.2142, "step": 522430 }, { "epoch": 0.91, "learning_rate": 4.4463704628605915e-06, "loss": 2.2216, "step": 522440 }, { "epoch": 0.91, "learning_rate": 4.4454985229337644e-06, "loss": 2.2062, "step": 522450 }, { "epoch": 0.91, "learning_rate": 4.444626583006937e-06, "loss": 2.2578, "step": 522460 }, { "epoch": 0.91, "learning_rate": 4.44375464308011e-06, "loss": 2.1922, "step": 522470 }, { "epoch": 0.91, "learning_rate": 4.442882703153284e-06, "loss": 2.2169, "step": 522480 }, { "epoch": 0.91, "learning_rate": 4.442010763226457e-06, "loss": 2.3594, "step": 522490 }, { "epoch": 0.91, "learning_rate": 4.44113882329963e-06, "loss": 2.3865, "step": 522500 }, { "epoch": 0.91, "learning_rate": 4.440266883372804e-06, "loss": 2.1929, "step": 522510 }, { "epoch": 0.91, "learning_rate": 4.439394943445977e-06, "loss": 2.3305, "step": 522520 }, { "epoch": 0.91, "learning_rate": 4.4385230035191495e-06, "loss": 2.4118, "step": 522530 }, { "epoch": 0.91, "learning_rate": 4.4376510635923224e-06, "loss": 2.2385, "step": 522540 }, { "epoch": 0.91, "learning_rate": 4.436779123665496e-06, "loss": 2.1673, "step": 522550 }, { "epoch": 0.91, "learning_rate": 4.43590718373867e-06, "loss": 2.1009, "step": 522560 }, { "epoch": 0.91, "learning_rate": 4.435035243811843e-06, "loss": 2.307, "step": 522570 }, { "epoch": 0.91, "learning_rate": 4.434163303885016e-06, "loss": 2.25, "step": 522580 }, { "epoch": 0.91, "learning_rate": 4.433291363958189e-06, "loss": 2.2726, "step": 522590 }, { "epoch": 0.91, "learning_rate": 4.4324194240313625e-06, "loss": 2.325, "step": 522600 }, { "epoch": 0.91, "learning_rate": 4.4315474841045354e-06, "loss": 2.3794, "step": 522610 }, { "epoch": 0.91, "learning_rate": 4.430675544177708e-06, "loss": 2.1977, "step": 522620 }, { "epoch": 0.91, "learning_rate": 4.429803604250881e-06, "loss": 2.1705, "step": 522630 }, { "epoch": 0.91, "learning_rate": 4.428931664324055e-06, "loss": 2.2186, "step": 522640 }, { "epoch": 0.91, "learning_rate": 4.428059724397228e-06, "loss": 2.3045, "step": 522650 }, { "epoch": 0.91, "learning_rate": 4.427187784470401e-06, "loss": 2.3445, "step": 522660 }, { "epoch": 0.91, "learning_rate": 4.426315844543575e-06, "loss": 2.2632, "step": 522670 }, { "epoch": 0.91, "learning_rate": 4.425443904616748e-06, "loss": 2.2751, "step": 522680 }, { "epoch": 0.91, "learning_rate": 4.424571964689921e-06, "loss": 2.2609, "step": 522690 }, { "epoch": 0.91, "learning_rate": 4.423700024763094e-06, "loss": 2.373, "step": 522700 }, { "epoch": 0.91, "learning_rate": 4.422828084836267e-06, "loss": 2.1794, "step": 522710 }, { "epoch": 0.91, "learning_rate": 4.421956144909441e-06, "loss": 2.2538, "step": 522720 }, { "epoch": 0.91, "learning_rate": 4.421084204982614e-06, "loss": 2.3618, "step": 522730 }, { "epoch": 0.91, "learning_rate": 4.420212265055787e-06, "loss": 2.2792, "step": 522740 }, { "epoch": 0.91, "learning_rate": 4.41934032512896e-06, "loss": 2.3149, "step": 522750 }, { "epoch": 0.91, "learning_rate": 4.4184683852021335e-06, "loss": 2.1791, "step": 522760 }, { "epoch": 0.91, "learning_rate": 4.4175964452753064e-06, "loss": 2.2557, "step": 522770 }, { "epoch": 0.91, "learning_rate": 4.416724505348479e-06, "loss": 2.3118, "step": 522780 }, { "epoch": 0.91, "learning_rate": 4.415852565421653e-06, "loss": 2.2866, "step": 522790 }, { "epoch": 0.91, "learning_rate": 4.414980625494826e-06, "loss": 2.1489, "step": 522800 }, { "epoch": 0.91, "learning_rate": 4.414108685567999e-06, "loss": 2.2303, "step": 522810 }, { "epoch": 0.91, "learning_rate": 4.413236745641172e-06, "loss": 2.1695, "step": 522820 }, { "epoch": 0.91, "learning_rate": 4.412364805714346e-06, "loss": 2.3656, "step": 522830 }, { "epoch": 0.91, "learning_rate": 4.4114928657875194e-06, "loss": 2.1515, "step": 522840 }, { "epoch": 0.91, "learning_rate": 4.410620925860692e-06, "loss": 2.2728, "step": 522850 }, { "epoch": 0.91, "learning_rate": 4.409748985933865e-06, "loss": 2.2534, "step": 522860 }, { "epoch": 0.91, "learning_rate": 4.408877046007038e-06, "loss": 2.2639, "step": 522870 }, { "epoch": 0.91, "learning_rate": 4.408005106080212e-06, "loss": 2.2781, "step": 522880 }, { "epoch": 0.91, "learning_rate": 4.407133166153385e-06, "loss": 2.2793, "step": 522890 }, { "epoch": 0.91, "learning_rate": 4.406261226226558e-06, "loss": 2.285, "step": 522900 }, { "epoch": 0.91, "learning_rate": 4.405389286299732e-06, "loss": 2.2699, "step": 522910 }, { "epoch": 0.91, "learning_rate": 4.4045173463729045e-06, "loss": 2.258, "step": 522920 }, { "epoch": 0.91, "learning_rate": 4.4036454064460774e-06, "loss": 2.2401, "step": 522930 }, { "epoch": 0.91, "learning_rate": 4.40277346651925e-06, "loss": 2.2836, "step": 522940 }, { "epoch": 0.91, "learning_rate": 4.401901526592424e-06, "loss": 2.1401, "step": 522950 }, { "epoch": 0.91, "learning_rate": 4.401029586665598e-06, "loss": 2.2195, "step": 522960 }, { "epoch": 0.91, "learning_rate": 4.400157646738771e-06, "loss": 2.2619, "step": 522970 }, { "epoch": 0.91, "learning_rate": 4.399285706811944e-06, "loss": 2.2969, "step": 522980 }, { "epoch": 0.91, "learning_rate": 4.398413766885117e-06, "loss": 2.2825, "step": 522990 }, { "epoch": 0.91, "learning_rate": 4.3975418269582904e-06, "loss": 2.2971, "step": 523000 }, { "epoch": 0.91, "learning_rate": 4.396669887031463e-06, "loss": 2.2427, "step": 523010 }, { "epoch": 0.91, "learning_rate": 4.395797947104636e-06, "loss": 2.4066, "step": 523020 }, { "epoch": 0.91, "learning_rate": 4.39492600717781e-06, "loss": 2.2377, "step": 523030 }, { "epoch": 0.91, "learning_rate": 4.394054067250983e-06, "loss": 2.2361, "step": 523040 }, { "epoch": 0.91, "learning_rate": 4.393182127324156e-06, "loss": 2.3028, "step": 523050 }, { "epoch": 0.91, "learning_rate": 4.392310187397329e-06, "loss": 2.208, "step": 523060 }, { "epoch": 0.91, "learning_rate": 4.391438247470503e-06, "loss": 2.2517, "step": 523070 }, { "epoch": 0.91, "learning_rate": 4.3905663075436755e-06, "loss": 2.2806, "step": 523080 }, { "epoch": 0.91, "learning_rate": 4.389694367616849e-06, "loss": 2.1425, "step": 523090 }, { "epoch": 0.91, "learning_rate": 4.388822427690022e-06, "loss": 2.2914, "step": 523100 }, { "epoch": 0.91, "learning_rate": 4.387950487763195e-06, "loss": 2.255, "step": 523110 }, { "epoch": 0.91, "learning_rate": 4.387078547836369e-06, "loss": 2.3288, "step": 523120 }, { "epoch": 0.91, "learning_rate": 4.386206607909542e-06, "loss": 2.241, "step": 523130 }, { "epoch": 0.91, "learning_rate": 4.385334667982715e-06, "loss": 2.2676, "step": 523140 }, { "epoch": 0.91, "learning_rate": 4.384462728055888e-06, "loss": 2.2661, "step": 523150 }, { "epoch": 0.91, "learning_rate": 4.3835907881290614e-06, "loss": 2.3039, "step": 523160 }, { "epoch": 0.91, "learning_rate": 4.382718848202234e-06, "loss": 2.2893, "step": 523170 }, { "epoch": 0.91, "learning_rate": 4.381846908275407e-06, "loss": 2.229, "step": 523180 }, { "epoch": 0.91, "learning_rate": 4.380974968348581e-06, "loss": 2.124, "step": 523190 }, { "epoch": 0.91, "learning_rate": 4.380103028421754e-06, "loss": 2.2696, "step": 523200 }, { "epoch": 0.91, "learning_rate": 4.379231088494927e-06, "loss": 2.2509, "step": 523210 }, { "epoch": 0.91, "learning_rate": 4.3783591485681e-06, "loss": 2.2396, "step": 523220 }, { "epoch": 0.91, "learning_rate": 4.377487208641274e-06, "loss": 2.1772, "step": 523230 }, { "epoch": 0.91, "learning_rate": 4.376615268714447e-06, "loss": 2.275, "step": 523240 }, { "epoch": 0.91, "learning_rate": 4.37574332878762e-06, "loss": 2.1885, "step": 523250 }, { "epoch": 0.91, "learning_rate": 4.374871388860793e-06, "loss": 2.1831, "step": 523260 }, { "epoch": 0.91, "learning_rate": 4.373999448933966e-06, "loss": 2.2609, "step": 523270 }, { "epoch": 0.91, "learning_rate": 4.37312750900714e-06, "loss": 2.2716, "step": 523280 }, { "epoch": 0.91, "learning_rate": 4.372255569080313e-06, "loss": 2.2767, "step": 523290 }, { "epoch": 0.91, "learning_rate": 4.371383629153486e-06, "loss": 2.2484, "step": 523300 }, { "epoch": 0.91, "learning_rate": 4.3705116892266595e-06, "loss": 2.1358, "step": 523310 }, { "epoch": 0.91, "learning_rate": 4.3696397492998324e-06, "loss": 2.3058, "step": 523320 }, { "epoch": 0.91, "learning_rate": 4.368767809373005e-06, "loss": 2.2636, "step": 523330 }, { "epoch": 0.91, "learning_rate": 4.367895869446178e-06, "loss": 2.1938, "step": 523340 }, { "epoch": 0.91, "learning_rate": 4.367023929519352e-06, "loss": 2.1991, "step": 523350 }, { "epoch": 0.91, "learning_rate": 4.366151989592526e-06, "loss": 2.3136, "step": 523360 }, { "epoch": 0.91, "learning_rate": 4.365280049665699e-06, "loss": 2.2655, "step": 523370 }, { "epoch": 0.91, "learning_rate": 4.364408109738872e-06, "loss": 2.1674, "step": 523380 }, { "epoch": 0.91, "learning_rate": 4.363536169812045e-06, "loss": 2.2408, "step": 523390 }, { "epoch": 0.91, "learning_rate": 4.362664229885218e-06, "loss": 2.2841, "step": 523400 }, { "epoch": 0.91, "learning_rate": 4.361792289958391e-06, "loss": 2.2889, "step": 523410 }, { "epoch": 0.91, "learning_rate": 4.360920350031564e-06, "loss": 2.0985, "step": 523420 }, { "epoch": 0.91, "learning_rate": 4.360048410104738e-06, "loss": 2.1592, "step": 523430 }, { "epoch": 0.91, "learning_rate": 4.359176470177911e-06, "loss": 2.3365, "step": 523440 }, { "epoch": 0.91, "learning_rate": 4.358304530251084e-06, "loss": 2.1893, "step": 523450 }, { "epoch": 0.91, "learning_rate": 4.357432590324257e-06, "loss": 2.3454, "step": 523460 }, { "epoch": 0.91, "learning_rate": 4.3565606503974305e-06, "loss": 2.2722, "step": 523470 }, { "epoch": 0.91, "learning_rate": 4.3556887104706034e-06, "loss": 2.3411, "step": 523480 }, { "epoch": 0.91, "learning_rate": 4.354816770543777e-06, "loss": 2.2835, "step": 523490 }, { "epoch": 0.91, "learning_rate": 4.35394483061695e-06, "loss": 2.3194, "step": 523500 }, { "epoch": 0.91, "learning_rate": 4.353072890690123e-06, "loss": 2.2758, "step": 523510 }, { "epoch": 0.91, "learning_rate": 4.352200950763297e-06, "loss": 2.3241, "step": 523520 }, { "epoch": 0.91, "learning_rate": 4.35132901083647e-06, "loss": 2.1809, "step": 523530 }, { "epoch": 0.91, "learning_rate": 4.350457070909643e-06, "loss": 2.1931, "step": 523540 }, { "epoch": 0.91, "learning_rate": 4.3495851309828164e-06, "loss": 2.3809, "step": 523550 }, { "epoch": 0.91, "learning_rate": 4.348713191055989e-06, "loss": 2.2213, "step": 523560 }, { "epoch": 0.91, "learning_rate": 4.347841251129162e-06, "loss": 2.2748, "step": 523570 }, { "epoch": 0.91, "learning_rate": 4.346969311202335e-06, "loss": 2.3982, "step": 523580 }, { "epoch": 0.91, "learning_rate": 4.346097371275509e-06, "loss": 2.2082, "step": 523590 }, { "epoch": 0.91, "learning_rate": 4.345225431348682e-06, "loss": 2.2654, "step": 523600 }, { "epoch": 0.91, "learning_rate": 4.344353491421855e-06, "loss": 2.1955, "step": 523610 }, { "epoch": 0.91, "learning_rate": 4.343481551495029e-06, "loss": 2.3126, "step": 523620 }, { "epoch": 0.91, "learning_rate": 4.3426096115682015e-06, "loss": 2.189, "step": 523630 }, { "epoch": 0.91, "learning_rate": 4.341737671641375e-06, "loss": 2.1327, "step": 523640 }, { "epoch": 0.91, "learning_rate": 4.340865731714548e-06, "loss": 2.2753, "step": 523650 }, { "epoch": 0.91, "learning_rate": 4.339993791787721e-06, "loss": 2.2809, "step": 523660 }, { "epoch": 0.91, "learning_rate": 4.339121851860894e-06, "loss": 2.2495, "step": 523670 }, { "epoch": 0.91, "learning_rate": 4.338249911934068e-06, "loss": 2.1929, "step": 523680 }, { "epoch": 0.91, "learning_rate": 4.337377972007241e-06, "loss": 2.0763, "step": 523690 }, { "epoch": 0.91, "learning_rate": 4.336506032080414e-06, "loss": 2.32, "step": 523700 }, { "epoch": 0.91, "learning_rate": 4.3356340921535874e-06, "loss": 2.1719, "step": 523710 }, { "epoch": 0.91, "learning_rate": 4.33476215222676e-06, "loss": 2.1905, "step": 523720 }, { "epoch": 0.91, "learning_rate": 4.333890212299933e-06, "loss": 2.2513, "step": 523730 }, { "epoch": 0.91, "learning_rate": 4.333018272373106e-06, "loss": 2.2131, "step": 523740 }, { "epoch": 0.91, "learning_rate": 4.33214633244628e-06, "loss": 2.3029, "step": 523750 }, { "epoch": 0.91, "learning_rate": 4.331274392519454e-06, "loss": 2.2545, "step": 523760 }, { "epoch": 0.91, "learning_rate": 4.330402452592627e-06, "loss": 2.2149, "step": 523770 }, { "epoch": 0.91, "learning_rate": 4.3295305126658e-06, "loss": 2.1568, "step": 523780 }, { "epoch": 0.91, "learning_rate": 4.3286585727389725e-06, "loss": 2.3272, "step": 523790 }, { "epoch": 0.91, "learning_rate": 4.327786632812146e-06, "loss": 2.3888, "step": 523800 }, { "epoch": 0.91, "learning_rate": 4.326914692885319e-06, "loss": 2.1563, "step": 523810 }, { "epoch": 0.91, "learning_rate": 4.326042752958492e-06, "loss": 2.2635, "step": 523820 }, { "epoch": 0.91, "learning_rate": 4.325170813031666e-06, "loss": 2.2907, "step": 523830 }, { "epoch": 0.91, "learning_rate": 4.324298873104839e-06, "loss": 2.3339, "step": 523840 }, { "epoch": 0.91, "learning_rate": 4.323426933178012e-06, "loss": 2.2755, "step": 523850 }, { "epoch": 0.91, "learning_rate": 4.322554993251185e-06, "loss": 2.2847, "step": 523860 }, { "epoch": 0.91, "learning_rate": 4.3216830533243584e-06, "loss": 2.1935, "step": 523870 }, { "epoch": 0.91, "learning_rate": 4.320811113397531e-06, "loss": 2.2794, "step": 523880 }, { "epoch": 0.91, "learning_rate": 4.319939173470705e-06, "loss": 2.3311, "step": 523890 }, { "epoch": 0.91, "learning_rate": 4.319067233543878e-06, "loss": 2.1107, "step": 523900 }, { "epoch": 0.91, "learning_rate": 4.318195293617051e-06, "loss": 2.2222, "step": 523910 }, { "epoch": 0.91, "learning_rate": 4.317323353690225e-06, "loss": 2.2201, "step": 523920 }, { "epoch": 0.91, "learning_rate": 4.316451413763398e-06, "loss": 2.1969, "step": 523930 }, { "epoch": 0.91, "learning_rate": 4.315579473836571e-06, "loss": 2.2537, "step": 523940 }, { "epoch": 0.91, "learning_rate": 4.314707533909744e-06, "loss": 2.2125, "step": 523950 }, { "epoch": 0.91, "learning_rate": 4.313835593982917e-06, "loss": 2.3324, "step": 523960 }, { "epoch": 0.91, "learning_rate": 4.31296365405609e-06, "loss": 2.3295, "step": 523970 }, { "epoch": 0.91, "learning_rate": 4.312091714129263e-06, "loss": 2.3567, "step": 523980 }, { "epoch": 0.91, "learning_rate": 4.311219774202437e-06, "loss": 2.2278, "step": 523990 }, { "epoch": 0.91, "learning_rate": 4.31034783427561e-06, "loss": 2.2195, "step": 524000 }, { "epoch": 0.91, "learning_rate": 4.309475894348783e-06, "loss": 2.194, "step": 524010 }, { "epoch": 0.91, "learning_rate": 4.3086039544219565e-06, "loss": 2.2129, "step": 524020 }, { "epoch": 0.91, "learning_rate": 4.3077320144951295e-06, "loss": 2.3386, "step": 524030 }, { "epoch": 0.91, "learning_rate": 4.306860074568303e-06, "loss": 2.2601, "step": 524040 }, { "epoch": 0.91, "learning_rate": 4.305988134641476e-06, "loss": 2.2428, "step": 524050 }, { "epoch": 0.91, "learning_rate": 4.305116194714649e-06, "loss": 2.2451, "step": 524060 }, { "epoch": 0.91, "learning_rate": 4.304244254787823e-06, "loss": 2.2863, "step": 524070 }, { "epoch": 0.91, "learning_rate": 4.303372314860996e-06, "loss": 2.2713, "step": 524080 }, { "epoch": 0.91, "learning_rate": 4.302500374934169e-06, "loss": 2.3861, "step": 524090 }, { "epoch": 0.91, "learning_rate": 4.301628435007342e-06, "loss": 2.2212, "step": 524100 }, { "epoch": 0.91, "learning_rate": 4.300756495080515e-06, "loss": 2.1726, "step": 524110 }, { "epoch": 0.91, "learning_rate": 4.299884555153688e-06, "loss": 2.2006, "step": 524120 }, { "epoch": 0.91, "learning_rate": 4.299012615226861e-06, "loss": 2.2635, "step": 524130 }, { "epoch": 0.91, "learning_rate": 4.298140675300034e-06, "loss": 2.1635, "step": 524140 }, { "epoch": 0.91, "learning_rate": 4.297268735373208e-06, "loss": 2.2922, "step": 524150 }, { "epoch": 0.91, "learning_rate": 4.296396795446382e-06, "loss": 2.2775, "step": 524160 }, { "epoch": 0.91, "learning_rate": 4.295524855519555e-06, "loss": 2.2788, "step": 524170 }, { "epoch": 0.91, "learning_rate": 4.2946529155927275e-06, "loss": 2.3075, "step": 524180 }, { "epoch": 0.91, "learning_rate": 4.2937809756659005e-06, "loss": 2.2584, "step": 524190 }, { "epoch": 0.91, "learning_rate": 4.292909035739074e-06, "loss": 2.3435, "step": 524200 }, { "epoch": 0.91, "learning_rate": 4.292037095812247e-06, "loss": 2.2588, "step": 524210 }, { "epoch": 0.91, "learning_rate": 4.29116515588542e-06, "loss": 2.2838, "step": 524220 }, { "epoch": 0.91, "learning_rate": 4.290293215958594e-06, "loss": 2.1948, "step": 524230 }, { "epoch": 0.91, "learning_rate": 4.289421276031767e-06, "loss": 2.2861, "step": 524240 }, { "epoch": 0.91, "learning_rate": 4.28854933610494e-06, "loss": 2.224, "step": 524250 }, { "epoch": 0.91, "learning_rate": 4.287677396178113e-06, "loss": 2.27, "step": 524260 }, { "epoch": 0.91, "learning_rate": 4.286805456251286e-06, "loss": 2.3412, "step": 524270 }, { "epoch": 0.91, "learning_rate": 4.285933516324459e-06, "loss": 2.2338, "step": 524280 }, { "epoch": 0.91, "learning_rate": 4.285061576397633e-06, "loss": 2.3385, "step": 524290 }, { "epoch": 0.91, "learning_rate": 4.284189636470806e-06, "loss": 2.311, "step": 524300 }, { "epoch": 0.91, "learning_rate": 4.283317696543979e-06, "loss": 2.1625, "step": 524310 }, { "epoch": 0.91, "learning_rate": 4.282445756617153e-06, "loss": 2.0859, "step": 524320 }, { "epoch": 0.91, "learning_rate": 4.281573816690326e-06, "loss": 2.2345, "step": 524330 }, { "epoch": 0.91, "learning_rate": 4.2807018767634985e-06, "loss": 2.3011, "step": 524340 }, { "epoch": 0.91, "learning_rate": 4.279829936836672e-06, "loss": 2.2709, "step": 524350 }, { "epoch": 0.91, "learning_rate": 4.278957996909845e-06, "loss": 2.3174, "step": 524360 }, { "epoch": 0.91, "learning_rate": 4.278086056983018e-06, "loss": 2.2861, "step": 524370 }, { "epoch": 0.91, "learning_rate": 4.277214117056191e-06, "loss": 2.2127, "step": 524380 }, { "epoch": 0.91, "learning_rate": 4.276342177129365e-06, "loss": 2.3079, "step": 524390 }, { "epoch": 0.91, "learning_rate": 4.275470237202538e-06, "loss": 2.1626, "step": 524400 }, { "epoch": 0.91, "learning_rate": 4.274598297275711e-06, "loss": 2.237, "step": 524410 }, { "epoch": 0.91, "learning_rate": 4.2737263573488845e-06, "loss": 2.1662, "step": 524420 }, { "epoch": 0.91, "learning_rate": 4.272854417422057e-06, "loss": 2.2173, "step": 524430 }, { "epoch": 0.91, "learning_rate": 4.271982477495231e-06, "loss": 2.217, "step": 524440 }, { "epoch": 0.91, "learning_rate": 4.271110537568404e-06, "loss": 2.2995, "step": 524450 }, { "epoch": 0.91, "learning_rate": 4.270238597641577e-06, "loss": 2.2609, "step": 524460 }, { "epoch": 0.91, "learning_rate": 4.269366657714751e-06, "loss": 2.3309, "step": 524470 }, { "epoch": 0.91, "learning_rate": 4.268494717787924e-06, "loss": 2.2072, "step": 524480 }, { "epoch": 0.91, "learning_rate": 4.267622777861097e-06, "loss": 2.269, "step": 524490 }, { "epoch": 0.91, "learning_rate": 4.2667508379342695e-06, "loss": 2.292, "step": 524500 }, { "epoch": 0.91, "learning_rate": 4.265878898007443e-06, "loss": 2.3779, "step": 524510 }, { "epoch": 0.91, "learning_rate": 4.265006958080616e-06, "loss": 2.2087, "step": 524520 }, { "epoch": 0.91, "learning_rate": 4.264135018153789e-06, "loss": 2.2291, "step": 524530 }, { "epoch": 0.91, "learning_rate": 4.263263078226962e-06, "loss": 2.3039, "step": 524540 }, { "epoch": 0.91, "learning_rate": 4.262391138300136e-06, "loss": 2.3413, "step": 524550 }, { "epoch": 0.91, "learning_rate": 4.26151919837331e-06, "loss": 2.2534, "step": 524560 }, { "epoch": 0.91, "learning_rate": 4.2606472584464825e-06, "loss": 2.3304, "step": 524570 }, { "epoch": 0.91, "learning_rate": 4.2597753185196555e-06, "loss": 2.3653, "step": 524580 }, { "epoch": 0.91, "learning_rate": 4.258903378592829e-06, "loss": 2.2174, "step": 524590 }, { "epoch": 0.91, "learning_rate": 4.258031438666002e-06, "loss": 2.34, "step": 524600 }, { "epoch": 0.91, "learning_rate": 4.257159498739175e-06, "loss": 2.3092, "step": 524610 }, { "epoch": 0.91, "learning_rate": 4.256287558812348e-06, "loss": 2.1299, "step": 524620 }, { "epoch": 0.91, "learning_rate": 4.255415618885522e-06, "loss": 2.2581, "step": 524630 }, { "epoch": 0.91, "learning_rate": 4.254543678958695e-06, "loss": 2.2446, "step": 524640 }, { "epoch": 0.91, "learning_rate": 4.253671739031868e-06, "loss": 2.2705, "step": 524650 }, { "epoch": 0.91, "learning_rate": 4.2527997991050405e-06, "loss": 2.2663, "step": 524660 }, { "epoch": 0.91, "learning_rate": 4.251927859178214e-06, "loss": 2.2988, "step": 524670 }, { "epoch": 0.91, "learning_rate": 4.251055919251387e-06, "loss": 2.3314, "step": 524680 }, { "epoch": 0.91, "learning_rate": 4.250183979324561e-06, "loss": 2.2478, "step": 524690 }, { "epoch": 0.92, "learning_rate": 4.249312039397734e-06, "loss": 2.1767, "step": 524700 }, { "epoch": 0.92, "learning_rate": 4.248440099470907e-06, "loss": 2.2016, "step": 524710 }, { "epoch": 0.92, "learning_rate": 4.247568159544081e-06, "loss": 2.231, "step": 524720 }, { "epoch": 0.92, "learning_rate": 4.2466962196172535e-06, "loss": 2.1828, "step": 524730 }, { "epoch": 0.92, "learning_rate": 4.2458242796904265e-06, "loss": 2.2944, "step": 524740 }, { "epoch": 0.92, "learning_rate": 4.2449523397636e-06, "loss": 2.2231, "step": 524750 }, { "epoch": 0.92, "learning_rate": 4.244080399836773e-06, "loss": 2.2405, "step": 524760 }, { "epoch": 0.92, "learning_rate": 4.243208459909946e-06, "loss": 2.2625, "step": 524770 }, { "epoch": 0.92, "learning_rate": 4.242336519983119e-06, "loss": 2.2583, "step": 524780 }, { "epoch": 0.92, "learning_rate": 4.241464580056293e-06, "loss": 2.2856, "step": 524790 }, { "epoch": 0.92, "learning_rate": 4.240592640129466e-06, "loss": 2.3381, "step": 524800 }, { "epoch": 0.92, "learning_rate": 4.239720700202639e-06, "loss": 2.2116, "step": 524810 }, { "epoch": 0.92, "learning_rate": 4.238848760275812e-06, "loss": 2.2969, "step": 524820 }, { "epoch": 0.92, "learning_rate": 4.237976820348985e-06, "loss": 2.2277, "step": 524830 }, { "epoch": 0.92, "learning_rate": 4.237104880422159e-06, "loss": 2.2164, "step": 524840 }, { "epoch": 0.92, "learning_rate": 4.236232940495332e-06, "loss": 2.3616, "step": 524850 }, { "epoch": 0.92, "learning_rate": 4.235361000568505e-06, "loss": 2.2364, "step": 524860 }, { "epoch": 0.92, "learning_rate": 4.234489060641679e-06, "loss": 2.1789, "step": 524870 }, { "epoch": 0.92, "learning_rate": 4.233617120714852e-06, "loss": 2.303, "step": 524880 }, { "epoch": 0.92, "learning_rate": 4.2327451807880245e-06, "loss": 2.2831, "step": 524890 }, { "epoch": 0.92, "learning_rate": 4.2318732408611975e-06, "loss": 2.2216, "step": 524900 }, { "epoch": 0.92, "learning_rate": 4.231001300934371e-06, "loss": 2.3201, "step": 524910 }, { "epoch": 0.92, "learning_rate": 4.230129361007544e-06, "loss": 2.092, "step": 524920 }, { "epoch": 0.92, "learning_rate": 4.229257421080717e-06, "loss": 2.4244, "step": 524930 }, { "epoch": 0.92, "learning_rate": 4.22838548115389e-06, "loss": 2.1549, "step": 524940 }, { "epoch": 0.92, "learning_rate": 4.227513541227064e-06, "loss": 2.3095, "step": 524950 }, { "epoch": 0.92, "learning_rate": 4.2266416013002375e-06, "loss": 2.3141, "step": 524960 }, { "epoch": 0.92, "learning_rate": 4.2257696613734105e-06, "loss": 2.0473, "step": 524970 }, { "epoch": 0.92, "learning_rate": 4.224897721446583e-06, "loss": 2.2837, "step": 524980 }, { "epoch": 0.92, "learning_rate": 4.224025781519757e-06, "loss": 2.3068, "step": 524990 }, { "epoch": 0.92, "learning_rate": 4.22315384159293e-06, "loss": 2.1835, "step": 525000 }, { "epoch": 0.92, "learning_rate": 4.222281901666103e-06, "loss": 2.2447, "step": 525010 }, { "epoch": 0.92, "learning_rate": 4.221409961739276e-06, "loss": 2.3238, "step": 525020 }, { "epoch": 0.92, "learning_rate": 4.22053802181245e-06, "loss": 2.2, "step": 525030 }, { "epoch": 0.92, "learning_rate": 4.219666081885623e-06, "loss": 2.2723, "step": 525040 }, { "epoch": 0.92, "learning_rate": 4.2187941419587955e-06, "loss": 2.3285, "step": 525050 }, { "epoch": 0.92, "learning_rate": 4.2179222020319685e-06, "loss": 2.1688, "step": 525060 }, { "epoch": 0.92, "learning_rate": 4.217050262105142e-06, "loss": 2.2522, "step": 525070 }, { "epoch": 0.92, "learning_rate": 4.216178322178315e-06, "loss": 2.3372, "step": 525080 }, { "epoch": 0.92, "learning_rate": 4.215306382251489e-06, "loss": 2.1993, "step": 525090 }, { "epoch": 0.92, "learning_rate": 4.214434442324662e-06, "loss": 2.2811, "step": 525100 }, { "epoch": 0.92, "learning_rate": 4.213562502397836e-06, "loss": 2.2924, "step": 525110 }, { "epoch": 0.92, "learning_rate": 4.2126905624710085e-06, "loss": 2.1553, "step": 525120 }, { "epoch": 0.92, "learning_rate": 4.2118186225441815e-06, "loss": 2.3028, "step": 525130 }, { "epoch": 0.92, "learning_rate": 4.210946682617354e-06, "loss": 2.1805, "step": 525140 }, { "epoch": 0.92, "learning_rate": 4.210074742690528e-06, "loss": 2.2228, "step": 525150 }, { "epoch": 0.92, "learning_rate": 4.209202802763701e-06, "loss": 2.2988, "step": 525160 }, { "epoch": 0.92, "learning_rate": 4.208330862836874e-06, "loss": 2.2497, "step": 525170 }, { "epoch": 0.92, "learning_rate": 4.207458922910047e-06, "loss": 2.2429, "step": 525180 }, { "epoch": 0.92, "learning_rate": 4.206586982983221e-06, "loss": 2.3436, "step": 525190 }, { "epoch": 0.92, "learning_rate": 4.205715043056394e-06, "loss": 2.3538, "step": 525200 }, { "epoch": 0.92, "learning_rate": 4.2048431031295665e-06, "loss": 2.2119, "step": 525210 }, { "epoch": 0.92, "learning_rate": 4.20397116320274e-06, "loss": 2.3014, "step": 525220 }, { "epoch": 0.92, "learning_rate": 4.203099223275914e-06, "loss": 2.0969, "step": 525230 }, { "epoch": 0.92, "learning_rate": 4.202227283349087e-06, "loss": 2.2711, "step": 525240 }, { "epoch": 0.92, "learning_rate": 4.20135534342226e-06, "loss": 2.3631, "step": 525250 }, { "epoch": 0.92, "learning_rate": 4.200483403495433e-06, "loss": 2.1742, "step": 525260 }, { "epoch": 0.92, "learning_rate": 4.199611463568607e-06, "loss": 2.2525, "step": 525270 }, { "epoch": 0.92, "learning_rate": 4.1987395236417795e-06, "loss": 2.3417, "step": 525280 }, { "epoch": 0.92, "learning_rate": 4.1978675837149525e-06, "loss": 2.1182, "step": 525290 }, { "epoch": 0.92, "learning_rate": 4.196995643788125e-06, "loss": 2.2201, "step": 525300 }, { "epoch": 0.92, "learning_rate": 4.196123703861299e-06, "loss": 2.3397, "step": 525310 }, { "epoch": 0.92, "learning_rate": 4.195251763934472e-06, "loss": 2.2416, "step": 525320 }, { "epoch": 0.92, "learning_rate": 4.194379824007645e-06, "loss": 2.2389, "step": 525330 }, { "epoch": 0.92, "learning_rate": 4.193507884080818e-06, "loss": 2.2053, "step": 525340 }, { "epoch": 0.92, "learning_rate": 4.192635944153992e-06, "loss": 2.3344, "step": 525350 }, { "epoch": 0.92, "learning_rate": 4.1917640042271655e-06, "loss": 2.1932, "step": 525360 }, { "epoch": 0.92, "learning_rate": 4.190892064300338e-06, "loss": 2.2534, "step": 525370 }, { "epoch": 0.92, "learning_rate": 4.190020124373511e-06, "loss": 2.2061, "step": 525380 }, { "epoch": 0.92, "learning_rate": 4.189148184446685e-06, "loss": 2.388, "step": 525390 }, { "epoch": 0.92, "learning_rate": 4.188276244519858e-06, "loss": 2.2649, "step": 525400 }, { "epoch": 0.92, "learning_rate": 4.187404304593031e-06, "loss": 2.3011, "step": 525410 }, { "epoch": 0.92, "learning_rate": 4.186532364666204e-06, "loss": 2.2205, "step": 525420 }, { "epoch": 0.92, "learning_rate": 4.185660424739378e-06, "loss": 2.3215, "step": 525430 }, { "epoch": 0.92, "learning_rate": 4.1847884848125505e-06, "loss": 2.1708, "step": 525440 }, { "epoch": 0.92, "learning_rate": 4.1839165448857235e-06, "loss": 2.2485, "step": 525450 }, { "epoch": 0.92, "learning_rate": 4.183044604958896e-06, "loss": 2.1665, "step": 525460 }, { "epoch": 0.92, "learning_rate": 4.18217266503207e-06, "loss": 2.2526, "step": 525470 }, { "epoch": 0.92, "learning_rate": 4.181300725105243e-06, "loss": 2.2074, "step": 525480 }, { "epoch": 0.92, "learning_rate": 4.180428785178417e-06, "loss": 2.2847, "step": 525490 }, { "epoch": 0.92, "learning_rate": 4.17955684525159e-06, "loss": 2.2469, "step": 525500 }, { "epoch": 0.92, "learning_rate": 4.1786849053247635e-06, "loss": 2.2725, "step": 525510 }, { "epoch": 0.92, "learning_rate": 4.1778129653979365e-06, "loss": 2.3005, "step": 525520 }, { "epoch": 0.92, "learning_rate": 4.176941025471109e-06, "loss": 2.204, "step": 525530 }, { "epoch": 0.92, "learning_rate": 4.176069085544282e-06, "loss": 2.3262, "step": 525540 }, { "epoch": 0.92, "learning_rate": 4.175197145617456e-06, "loss": 2.2414, "step": 525550 }, { "epoch": 0.92, "learning_rate": 4.174325205690629e-06, "loss": 2.304, "step": 525560 }, { "epoch": 0.92, "learning_rate": 4.173453265763802e-06, "loss": 2.359, "step": 525570 }, { "epoch": 0.92, "learning_rate": 4.172581325836975e-06, "loss": 2.3795, "step": 525580 }, { "epoch": 0.92, "learning_rate": 4.171709385910149e-06, "loss": 2.2151, "step": 525590 }, { "epoch": 0.92, "learning_rate": 4.1708374459833215e-06, "loss": 2.1345, "step": 525600 }, { "epoch": 0.92, "learning_rate": 4.1699655060564945e-06, "loss": 2.1767, "step": 525610 }, { "epoch": 0.92, "learning_rate": 4.169093566129668e-06, "loss": 2.2723, "step": 525620 }, { "epoch": 0.92, "learning_rate": 4.168221626202842e-06, "loss": 2.3386, "step": 525630 }, { "epoch": 0.92, "learning_rate": 4.167349686276015e-06, "loss": 2.3171, "step": 525640 }, { "epoch": 0.92, "learning_rate": 4.166477746349188e-06, "loss": 2.1866, "step": 525650 }, { "epoch": 0.92, "learning_rate": 4.165605806422361e-06, "loss": 2.3122, "step": 525660 }, { "epoch": 0.92, "learning_rate": 4.1647338664955345e-06, "loss": 2.2578, "step": 525670 }, { "epoch": 0.92, "learning_rate": 4.1638619265687075e-06, "loss": 2.3011, "step": 525680 }, { "epoch": 0.92, "learning_rate": 4.16298998664188e-06, "loss": 2.2281, "step": 525690 }, { "epoch": 0.92, "learning_rate": 4.162118046715053e-06, "loss": 2.2919, "step": 525700 }, { "epoch": 0.92, "learning_rate": 4.161246106788227e-06, "loss": 2.2264, "step": 525710 }, { "epoch": 0.92, "learning_rate": 4.1603741668614e-06, "loss": 2.2879, "step": 525720 }, { "epoch": 0.92, "learning_rate": 4.159502226934573e-06, "loss": 2.234, "step": 525730 }, { "epoch": 0.92, "learning_rate": 4.158630287007746e-06, "loss": 2.1407, "step": 525740 }, { "epoch": 0.92, "learning_rate": 4.1577583470809205e-06, "loss": 2.2943, "step": 525750 }, { "epoch": 0.92, "learning_rate": 4.156886407154093e-06, "loss": 2.275, "step": 525760 }, { "epoch": 0.92, "learning_rate": 4.156014467227266e-06, "loss": 2.2766, "step": 525770 }, { "epoch": 0.92, "learning_rate": 4.155142527300439e-06, "loss": 2.3296, "step": 525780 }, { "epoch": 0.92, "learning_rate": 4.154270587373613e-06, "loss": 2.2534, "step": 525790 }, { "epoch": 0.92, "learning_rate": 4.153398647446786e-06, "loss": 2.2264, "step": 525800 }, { "epoch": 0.92, "learning_rate": 4.152526707519959e-06, "loss": 2.2127, "step": 525810 }, { "epoch": 0.92, "learning_rate": 4.151654767593132e-06, "loss": 2.2569, "step": 525820 }, { "epoch": 0.92, "learning_rate": 4.1507828276663055e-06, "loss": 2.3557, "step": 525830 }, { "epoch": 0.92, "learning_rate": 4.1499108877394785e-06, "loss": 2.2681, "step": 525840 }, { "epoch": 0.92, "learning_rate": 4.149038947812651e-06, "loss": 2.2359, "step": 525850 }, { "epoch": 0.92, "learning_rate": 4.148167007885824e-06, "loss": 2.2085, "step": 525860 }, { "epoch": 0.92, "learning_rate": 4.147295067958998e-06, "loss": 2.1686, "step": 525870 }, { "epoch": 0.92, "learning_rate": 4.146423128032171e-06, "loss": 2.3166, "step": 525880 }, { "epoch": 0.92, "learning_rate": 4.145551188105345e-06, "loss": 2.2383, "step": 525890 }, { "epoch": 0.92, "learning_rate": 4.144679248178518e-06, "loss": 2.1974, "step": 525900 }, { "epoch": 0.92, "learning_rate": 4.1438073082516915e-06, "loss": 2.2717, "step": 525910 }, { "epoch": 0.92, "learning_rate": 4.142935368324864e-06, "loss": 2.2326, "step": 525920 }, { "epoch": 0.92, "learning_rate": 4.142063428398037e-06, "loss": 2.2403, "step": 525930 }, { "epoch": 0.92, "learning_rate": 4.14119148847121e-06, "loss": 2.2045, "step": 525940 }, { "epoch": 0.92, "learning_rate": 4.140319548544384e-06, "loss": 2.2893, "step": 525950 }, { "epoch": 0.92, "learning_rate": 4.139447608617557e-06, "loss": 2.2702, "step": 525960 }, { "epoch": 0.92, "learning_rate": 4.13857566869073e-06, "loss": 2.3295, "step": 525970 }, { "epoch": 0.92, "learning_rate": 4.137703728763903e-06, "loss": 2.219, "step": 525980 }, { "epoch": 0.92, "learning_rate": 4.1368317888370765e-06, "loss": 2.2874, "step": 525990 }, { "epoch": 0.92, "learning_rate": 4.1359598489102495e-06, "loss": 2.2038, "step": 526000 }, { "epoch": 0.92, "learning_rate": 4.135087908983422e-06, "loss": 2.3248, "step": 526010 }, { "epoch": 0.92, "learning_rate": 4.134215969056596e-06, "loss": 2.164, "step": 526020 }, { "epoch": 0.92, "learning_rate": 4.13334402912977e-06, "loss": 2.3733, "step": 526030 }, { "epoch": 0.92, "learning_rate": 4.132472089202943e-06, "loss": 2.1867, "step": 526040 }, { "epoch": 0.92, "learning_rate": 4.131600149276116e-06, "loss": 2.2794, "step": 526050 }, { "epoch": 0.92, "learning_rate": 4.130728209349289e-06, "loss": 2.2505, "step": 526060 }, { "epoch": 0.92, "learning_rate": 4.1298562694224625e-06, "loss": 2.2821, "step": 526070 }, { "epoch": 0.92, "learning_rate": 4.128984329495635e-06, "loss": 2.2083, "step": 526080 }, { "epoch": 0.92, "learning_rate": 4.128112389568808e-06, "loss": 2.1228, "step": 526090 }, { "epoch": 0.92, "learning_rate": 4.127240449641981e-06, "loss": 2.2392, "step": 526100 }, { "epoch": 0.92, "learning_rate": 4.126368509715155e-06, "loss": 2.2093, "step": 526110 }, { "epoch": 0.92, "learning_rate": 4.125496569788328e-06, "loss": 2.2158, "step": 526120 }, { "epoch": 0.92, "learning_rate": 4.124624629861501e-06, "loss": 2.2944, "step": 526130 }, { "epoch": 0.92, "learning_rate": 4.123752689934674e-06, "loss": 2.1447, "step": 526140 }, { "epoch": 0.92, "learning_rate": 4.122880750007848e-06, "loss": 2.377, "step": 526150 }, { "epoch": 0.92, "learning_rate": 4.122008810081021e-06, "loss": 2.2488, "step": 526160 }, { "epoch": 0.92, "learning_rate": 4.121136870154194e-06, "loss": 2.2675, "step": 526170 }, { "epoch": 0.92, "learning_rate": 4.120264930227367e-06, "loss": 2.309, "step": 526180 }, { "epoch": 0.92, "learning_rate": 4.119392990300541e-06, "loss": 2.2725, "step": 526190 }, { "epoch": 0.92, "learning_rate": 4.118521050373714e-06, "loss": 2.2767, "step": 526200 }, { "epoch": 0.92, "learning_rate": 4.117649110446887e-06, "loss": 2.3226, "step": 526210 }, { "epoch": 0.92, "learning_rate": 4.11677717052006e-06, "loss": 2.307, "step": 526220 }, { "epoch": 0.92, "learning_rate": 4.1159052305932335e-06, "loss": 2.3517, "step": 526230 }, { "epoch": 0.92, "learning_rate": 4.115033290666406e-06, "loss": 2.1607, "step": 526240 }, { "epoch": 0.92, "learning_rate": 4.114161350739579e-06, "loss": 2.2584, "step": 526250 }, { "epoch": 0.92, "learning_rate": 4.113289410812752e-06, "loss": 2.2097, "step": 526260 }, { "epoch": 0.92, "learning_rate": 4.112417470885926e-06, "loss": 2.335, "step": 526270 }, { "epoch": 0.92, "learning_rate": 4.1115455309591e-06, "loss": 2.2114, "step": 526280 }, { "epoch": 0.92, "learning_rate": 4.110673591032273e-06, "loss": 2.1757, "step": 526290 }, { "epoch": 0.92, "learning_rate": 4.109801651105446e-06, "loss": 2.2542, "step": 526300 }, { "epoch": 0.92, "learning_rate": 4.108929711178619e-06, "loss": 2.3363, "step": 526310 }, { "epoch": 0.92, "learning_rate": 4.108057771251792e-06, "loss": 2.2447, "step": 526320 }, { "epoch": 0.92, "learning_rate": 4.107185831324965e-06, "loss": 2.2973, "step": 526330 }, { "epoch": 0.92, "learning_rate": 4.106313891398138e-06, "loss": 2.2709, "step": 526340 }, { "epoch": 0.92, "learning_rate": 4.105441951471312e-06, "loss": 2.3695, "step": 526350 }, { "epoch": 0.92, "learning_rate": 4.104570011544485e-06, "loss": 2.3727, "step": 526360 }, { "epoch": 0.92, "learning_rate": 4.103698071617658e-06, "loss": 2.1751, "step": 526370 }, { "epoch": 0.92, "learning_rate": 4.102826131690831e-06, "loss": 2.3086, "step": 526380 }, { "epoch": 0.92, "learning_rate": 4.1019541917640045e-06, "loss": 2.3918, "step": 526390 }, { "epoch": 0.92, "learning_rate": 4.101082251837177e-06, "loss": 2.2846, "step": 526400 }, { "epoch": 0.92, "learning_rate": 4.10021031191035e-06, "loss": 2.183, "step": 526410 }, { "epoch": 0.92, "learning_rate": 4.099338371983524e-06, "loss": 2.2612, "step": 526420 }, { "epoch": 0.92, "learning_rate": 4.098466432056698e-06, "loss": 2.281, "step": 526430 }, { "epoch": 0.92, "learning_rate": 4.097594492129871e-06, "loss": 2.2789, "step": 526440 }, { "epoch": 0.92, "learning_rate": 4.096722552203044e-06, "loss": 2.3434, "step": 526450 }, { "epoch": 0.92, "learning_rate": 4.095850612276217e-06, "loss": 2.3214, "step": 526460 }, { "epoch": 0.92, "learning_rate": 4.09497867234939e-06, "loss": 2.2796, "step": 526470 }, { "epoch": 0.92, "learning_rate": 4.094106732422563e-06, "loss": 2.2638, "step": 526480 }, { "epoch": 0.92, "learning_rate": 4.093234792495736e-06, "loss": 2.1996, "step": 526490 }, { "epoch": 0.92, "learning_rate": 4.092362852568909e-06, "loss": 2.2768, "step": 526500 }, { "epoch": 0.92, "learning_rate": 4.091490912642083e-06, "loss": 2.1659, "step": 526510 }, { "epoch": 0.92, "learning_rate": 4.090618972715256e-06, "loss": 2.2286, "step": 526520 }, { "epoch": 0.92, "learning_rate": 4.089747032788429e-06, "loss": 2.1999, "step": 526530 }, { "epoch": 0.92, "learning_rate": 4.088875092861602e-06, "loss": 2.2197, "step": 526540 }, { "epoch": 0.92, "learning_rate": 4.088003152934776e-06, "loss": 2.3097, "step": 526550 }, { "epoch": 0.92, "learning_rate": 4.087131213007949e-06, "loss": 2.3029, "step": 526560 }, { "epoch": 0.92, "learning_rate": 4.086259273081122e-06, "loss": 2.2483, "step": 526570 }, { "epoch": 0.92, "learning_rate": 4.085387333154295e-06, "loss": 2.2688, "step": 526580 }, { "epoch": 0.92, "learning_rate": 4.084515393227469e-06, "loss": 2.3244, "step": 526590 }, { "epoch": 0.92, "learning_rate": 4.083643453300642e-06, "loss": 2.2282, "step": 526600 }, { "epoch": 0.92, "learning_rate": 4.082771513373815e-06, "loss": 2.2642, "step": 526610 }, { "epoch": 0.92, "learning_rate": 4.081899573446988e-06, "loss": 2.3301, "step": 526620 }, { "epoch": 0.92, "learning_rate": 4.081027633520161e-06, "loss": 2.1841, "step": 526630 }, { "epoch": 0.92, "learning_rate": 4.080155693593334e-06, "loss": 2.1505, "step": 526640 }, { "epoch": 0.92, "learning_rate": 4.079283753666507e-06, "loss": 2.1908, "step": 526650 }, { "epoch": 0.92, "learning_rate": 4.07841181373968e-06, "loss": 2.2076, "step": 526660 }, { "epoch": 0.92, "learning_rate": 4.077539873812854e-06, "loss": 2.3354, "step": 526670 }, { "epoch": 0.92, "learning_rate": 4.076667933886028e-06, "loss": 2.2379, "step": 526680 }, { "epoch": 0.92, "learning_rate": 4.075795993959201e-06, "loss": 2.275, "step": 526690 }, { "epoch": 0.92, "learning_rate": 4.0749240540323736e-06, "loss": 2.1511, "step": 526700 }, { "epoch": 0.92, "learning_rate": 4.074052114105547e-06, "loss": 2.3195, "step": 526710 }, { "epoch": 0.92, "learning_rate": 4.07318017417872e-06, "loss": 2.1612, "step": 526720 }, { "epoch": 0.92, "learning_rate": 4.072308234251893e-06, "loss": 2.3068, "step": 526730 }, { "epoch": 0.92, "learning_rate": 4.071436294325066e-06, "loss": 2.3423, "step": 526740 }, { "epoch": 0.92, "learning_rate": 4.07056435439824e-06, "loss": 2.1899, "step": 526750 }, { "epoch": 0.92, "learning_rate": 4.069692414471413e-06, "loss": 2.241, "step": 526760 }, { "epoch": 0.92, "learning_rate": 4.068820474544586e-06, "loss": 2.2165, "step": 526770 }, { "epoch": 0.92, "learning_rate": 4.067948534617759e-06, "loss": 2.2441, "step": 526780 }, { "epoch": 0.92, "learning_rate": 4.067076594690932e-06, "loss": 2.3173, "step": 526790 }, { "epoch": 0.92, "learning_rate": 4.066204654764105e-06, "loss": 2.3008, "step": 526800 }, { "epoch": 0.92, "learning_rate": 4.065332714837278e-06, "loss": 2.1971, "step": 526810 }, { "epoch": 0.92, "learning_rate": 4.064460774910452e-06, "loss": 2.2885, "step": 526820 }, { "epoch": 0.92, "learning_rate": 4.063588834983626e-06, "loss": 2.2869, "step": 526830 }, { "epoch": 0.92, "learning_rate": 4.062716895056799e-06, "loss": 2.2346, "step": 526840 }, { "epoch": 0.92, "learning_rate": 4.061844955129972e-06, "loss": 2.2611, "step": 526850 }, { "epoch": 0.92, "learning_rate": 4.0609730152031446e-06, "loss": 2.2892, "step": 526860 }, { "epoch": 0.92, "learning_rate": 4.060101075276318e-06, "loss": 2.2345, "step": 526870 }, { "epoch": 0.92, "learning_rate": 4.059229135349491e-06, "loss": 2.1319, "step": 526880 }, { "epoch": 0.92, "learning_rate": 4.058357195422664e-06, "loss": 2.2496, "step": 526890 }, { "epoch": 0.92, "learning_rate": 4.057485255495837e-06, "loss": 2.2792, "step": 526900 }, { "epoch": 0.92, "learning_rate": 4.056613315569011e-06, "loss": 2.3585, "step": 526910 }, { "epoch": 0.92, "learning_rate": 4.055741375642184e-06, "loss": 2.2754, "step": 526920 }, { "epoch": 0.92, "learning_rate": 4.054869435715357e-06, "loss": 2.239, "step": 526930 }, { "epoch": 0.92, "learning_rate": 4.05399749578853e-06, "loss": 2.339, "step": 526940 }, { "epoch": 0.92, "learning_rate": 4.053125555861704e-06, "loss": 2.3632, "step": 526950 }, { "epoch": 0.92, "learning_rate": 4.052253615934877e-06, "loss": 2.2536, "step": 526960 }, { "epoch": 0.92, "learning_rate": 4.05138167600805e-06, "loss": 2.2613, "step": 526970 }, { "epoch": 0.92, "learning_rate": 4.050509736081223e-06, "loss": 2.3474, "step": 526980 }, { "epoch": 0.92, "learning_rate": 4.049637796154397e-06, "loss": 2.2979, "step": 526990 }, { "epoch": 0.92, "learning_rate": 4.04876585622757e-06, "loss": 2.2537, "step": 527000 }, { "epoch": 0.92, "learning_rate": 4.047893916300743e-06, "loss": 2.3303, "step": 527010 }, { "epoch": 0.92, "learning_rate": 4.0470219763739156e-06, "loss": 2.3239, "step": 527020 }, { "epoch": 0.92, "learning_rate": 4.046150036447089e-06, "loss": 2.2694, "step": 527030 }, { "epoch": 0.92, "learning_rate": 4.045278096520262e-06, "loss": 2.2977, "step": 527040 }, { "epoch": 0.92, "learning_rate": 4.044406156593435e-06, "loss": 2.2209, "step": 527050 }, { "epoch": 0.92, "learning_rate": 4.043534216666608e-06, "loss": 2.2043, "step": 527060 }, { "epoch": 0.92, "learning_rate": 4.042662276739782e-06, "loss": 2.2195, "step": 527070 }, { "epoch": 0.92, "learning_rate": 4.041790336812956e-06, "loss": 2.2269, "step": 527080 }, { "epoch": 0.92, "learning_rate": 4.0409183968861286e-06, "loss": 2.4366, "step": 527090 }, { "epoch": 0.92, "learning_rate": 4.0400464569593015e-06, "loss": 2.2583, "step": 527100 }, { "epoch": 0.92, "learning_rate": 4.039174517032475e-06, "loss": 2.2263, "step": 527110 }, { "epoch": 0.92, "learning_rate": 4.038302577105648e-06, "loss": 2.2255, "step": 527120 }, { "epoch": 0.92, "learning_rate": 4.037430637178821e-06, "loss": 2.3571, "step": 527130 }, { "epoch": 0.92, "learning_rate": 4.036558697251994e-06, "loss": 2.2686, "step": 527140 }, { "epoch": 0.92, "learning_rate": 4.035686757325168e-06, "loss": 2.1992, "step": 527150 }, { "epoch": 0.92, "learning_rate": 4.034814817398341e-06, "loss": 2.2058, "step": 527160 }, { "epoch": 0.92, "learning_rate": 4.033942877471514e-06, "loss": 2.3167, "step": 527170 }, { "epoch": 0.92, "learning_rate": 4.0330709375446866e-06, "loss": 2.2181, "step": 527180 }, { "epoch": 0.92, "learning_rate": 4.03219899761786e-06, "loss": 2.2527, "step": 527190 }, { "epoch": 0.92, "learning_rate": 4.031327057691033e-06, "loss": 2.191, "step": 527200 }, { "epoch": 0.92, "learning_rate": 4.030455117764206e-06, "loss": 2.2868, "step": 527210 }, { "epoch": 0.92, "learning_rate": 4.02958317783738e-06, "loss": 2.3074, "step": 527220 }, { "epoch": 0.92, "learning_rate": 4.028711237910554e-06, "loss": 2.2522, "step": 527230 }, { "epoch": 0.92, "learning_rate": 4.027839297983727e-06, "loss": 2.2763, "step": 527240 }, { "epoch": 0.92, "learning_rate": 4.0269673580568996e-06, "loss": 2.2701, "step": 527250 }, { "epoch": 0.92, "learning_rate": 4.0260954181300725e-06, "loss": 2.34, "step": 527260 }, { "epoch": 0.92, "learning_rate": 4.025223478203246e-06, "loss": 2.1928, "step": 527270 }, { "epoch": 0.92, "learning_rate": 4.024351538276419e-06, "loss": 2.2227, "step": 527280 }, { "epoch": 0.92, "learning_rate": 4.023479598349592e-06, "loss": 2.2964, "step": 527290 }, { "epoch": 0.92, "learning_rate": 4.022607658422765e-06, "loss": 2.3117, "step": 527300 }, { "epoch": 0.92, "learning_rate": 4.021735718495939e-06, "loss": 2.1696, "step": 527310 }, { "epoch": 0.92, "learning_rate": 4.020863778569112e-06, "loss": 2.2097, "step": 527320 }, { "epoch": 0.92, "learning_rate": 4.019991838642285e-06, "loss": 2.2953, "step": 527330 }, { "epoch": 0.92, "learning_rate": 4.0191198987154576e-06, "loss": 2.228, "step": 527340 }, { "epoch": 0.92, "learning_rate": 4.018247958788632e-06, "loss": 2.3049, "step": 527350 }, { "epoch": 0.92, "learning_rate": 4.017376018861805e-06, "loss": 2.3029, "step": 527360 }, { "epoch": 0.92, "learning_rate": 4.016504078934978e-06, "loss": 2.2321, "step": 527370 }, { "epoch": 0.92, "learning_rate": 4.015632139008151e-06, "loss": 2.3452, "step": 527380 }, { "epoch": 0.92, "learning_rate": 4.014760199081325e-06, "loss": 2.2498, "step": 527390 }, { "epoch": 0.92, "learning_rate": 4.013888259154498e-06, "loss": 2.339, "step": 527400 }, { "epoch": 0.92, "learning_rate": 4.0130163192276706e-06, "loss": 2.2688, "step": 527410 }, { "epoch": 0.92, "learning_rate": 4.0121443793008435e-06, "loss": 2.2345, "step": 527420 }, { "epoch": 0.92, "learning_rate": 4.011272439374017e-06, "loss": 2.2583, "step": 527430 }, { "epoch": 0.92, "learning_rate": 4.01040049944719e-06, "loss": 2.3136, "step": 527440 }, { "epoch": 0.92, "learning_rate": 4.009528559520363e-06, "loss": 2.3222, "step": 527450 }, { "epoch": 0.92, "learning_rate": 4.008656619593536e-06, "loss": 2.1823, "step": 527460 }, { "epoch": 0.92, "learning_rate": 4.00778467966671e-06, "loss": 2.2457, "step": 527470 }, { "epoch": 0.92, "learning_rate": 4.0069127397398836e-06, "loss": 2.3609, "step": 527480 }, { "epoch": 0.92, "learning_rate": 4.0060407998130565e-06, "loss": 2.2309, "step": 527490 }, { "epoch": 0.92, "learning_rate": 4.005168859886229e-06, "loss": 2.3113, "step": 527500 }, { "epoch": 0.92, "learning_rate": 4.004296919959403e-06, "loss": 2.3069, "step": 527510 }, { "epoch": 0.92, "learning_rate": 4.003424980032576e-06, "loss": 2.2096, "step": 527520 }, { "epoch": 0.92, "learning_rate": 4.002553040105749e-06, "loss": 2.1956, "step": 527530 }, { "epoch": 0.92, "learning_rate": 4.001681100178922e-06, "loss": 2.2356, "step": 527540 }, { "epoch": 0.92, "learning_rate": 4.000809160252096e-06, "loss": 2.2159, "step": 527550 }, { "epoch": 0.92, "learning_rate": 3.999937220325269e-06, "loss": 2.2556, "step": 527560 }, { "epoch": 0.92, "learning_rate": 3.9990652803984416e-06, "loss": 2.3314, "step": 527570 }, { "epoch": 0.92, "learning_rate": 3.9981933404716145e-06, "loss": 2.3466, "step": 527580 }, { "epoch": 0.92, "learning_rate": 3.997321400544788e-06, "loss": 2.2307, "step": 527590 }, { "epoch": 0.92, "learning_rate": 3.996449460617961e-06, "loss": 2.2271, "step": 527600 }, { "epoch": 0.92, "learning_rate": 3.995577520691135e-06, "loss": 2.3454, "step": 527610 }, { "epoch": 0.92, "learning_rate": 3.994705580764308e-06, "loss": 2.2227, "step": 527620 }, { "epoch": 0.92, "learning_rate": 3.993833640837482e-06, "loss": 2.2691, "step": 527630 }, { "epoch": 0.92, "learning_rate": 3.9929617009106546e-06, "loss": 2.2316, "step": 527640 }, { "epoch": 0.92, "learning_rate": 3.9920897609838275e-06, "loss": 2.2441, "step": 527650 }, { "epoch": 0.92, "learning_rate": 3.991217821057e-06, "loss": 2.2461, "step": 527660 }, { "epoch": 0.92, "learning_rate": 3.990345881130174e-06, "loss": 2.2502, "step": 527670 }, { "epoch": 0.92, "learning_rate": 3.989473941203347e-06, "loss": 2.2748, "step": 527680 }, { "epoch": 0.92, "learning_rate": 3.98860200127652e-06, "loss": 2.2449, "step": 527690 }, { "epoch": 0.92, "learning_rate": 3.987730061349693e-06, "loss": 2.2761, "step": 527700 }, { "epoch": 0.92, "learning_rate": 3.986858121422867e-06, "loss": 2.2865, "step": 527710 }, { "epoch": 0.92, "learning_rate": 3.98598618149604e-06, "loss": 2.2278, "step": 527720 }, { "epoch": 0.92, "learning_rate": 3.9851142415692126e-06, "loss": 2.2691, "step": 527730 }, { "epoch": 0.92, "learning_rate": 3.9842423016423855e-06, "loss": 2.254, "step": 527740 }, { "epoch": 0.92, "learning_rate": 3.98337036171556e-06, "loss": 2.2851, "step": 527750 }, { "epoch": 0.92, "learning_rate": 3.982498421788733e-06, "loss": 2.2058, "step": 527760 }, { "epoch": 0.92, "learning_rate": 3.981626481861906e-06, "loss": 2.385, "step": 527770 }, { "epoch": 0.92, "learning_rate": 3.980754541935079e-06, "loss": 2.3016, "step": 527780 }, { "epoch": 0.92, "learning_rate": 3.979882602008253e-06, "loss": 2.2447, "step": 527790 }, { "epoch": 0.92, "learning_rate": 3.9790106620814256e-06, "loss": 2.3309, "step": 527800 }, { "epoch": 0.92, "learning_rate": 3.9781387221545985e-06, "loss": 2.3085, "step": 527810 }, { "epoch": 0.92, "learning_rate": 3.977266782227771e-06, "loss": 2.2069, "step": 527820 }, { "epoch": 0.92, "learning_rate": 3.976394842300945e-06, "loss": 2.2713, "step": 527830 }, { "epoch": 0.92, "learning_rate": 3.975522902374118e-06, "loss": 2.3137, "step": 527840 }, { "epoch": 0.92, "learning_rate": 3.974650962447291e-06, "loss": 2.1463, "step": 527850 }, { "epoch": 0.92, "learning_rate": 3.973779022520464e-06, "loss": 2.2211, "step": 527860 }, { "epoch": 0.92, "learning_rate": 3.972907082593638e-06, "loss": 2.3777, "step": 527870 }, { "epoch": 0.92, "learning_rate": 3.9720351426668115e-06, "loss": 2.2397, "step": 527880 }, { "epoch": 0.92, "learning_rate": 3.971163202739984e-06, "loss": 2.4369, "step": 527890 }, { "epoch": 0.92, "learning_rate": 3.970291262813157e-06, "loss": 2.1798, "step": 527900 }, { "epoch": 0.92, "learning_rate": 3.969419322886331e-06, "loss": 2.249, "step": 527910 }, { "epoch": 0.92, "learning_rate": 3.968547382959504e-06, "loss": 2.1415, "step": 527920 }, { "epoch": 0.92, "learning_rate": 3.967675443032677e-06, "loss": 2.2752, "step": 527930 }, { "epoch": 0.92, "learning_rate": 3.96680350310585e-06, "loss": 2.3479, "step": 527940 }, { "epoch": 0.92, "learning_rate": 3.965931563179024e-06, "loss": 2.2582, "step": 527950 }, { "epoch": 0.92, "learning_rate": 3.9650596232521966e-06, "loss": 2.1987, "step": 527960 }, { "epoch": 0.92, "learning_rate": 3.9641876833253695e-06, "loss": 2.3131, "step": 527970 }, { "epoch": 0.92, "learning_rate": 3.963315743398542e-06, "loss": 2.3295, "step": 527980 }, { "epoch": 0.92, "learning_rate": 3.962443803471716e-06, "loss": 2.2973, "step": 527990 }, { "epoch": 0.92, "learning_rate": 3.961571863544889e-06, "loss": 2.3396, "step": 528000 }, { "epoch": 0.92, "learning_rate": 3.960699923618063e-06, "loss": 2.2433, "step": 528010 }, { "epoch": 0.92, "learning_rate": 3.959827983691236e-06, "loss": 2.2913, "step": 528020 }, { "epoch": 0.92, "learning_rate": 3.9589560437644096e-06, "loss": 2.2854, "step": 528030 }, { "epoch": 0.92, "learning_rate": 3.9580841038375825e-06, "loss": 2.1932, "step": 528040 }, { "epoch": 0.92, "learning_rate": 3.957212163910755e-06, "loss": 2.2231, "step": 528050 }, { "epoch": 0.92, "learning_rate": 3.956340223983928e-06, "loss": 2.2105, "step": 528060 }, { "epoch": 0.92, "learning_rate": 3.955468284057102e-06, "loss": 2.1757, "step": 528070 }, { "epoch": 0.92, "learning_rate": 3.954596344130275e-06, "loss": 2.2595, "step": 528080 }, { "epoch": 0.92, "learning_rate": 3.953724404203448e-06, "loss": 2.2567, "step": 528090 }, { "epoch": 0.92, "learning_rate": 3.952852464276621e-06, "loss": 2.3215, "step": 528100 }, { "epoch": 0.92, "learning_rate": 3.951980524349795e-06, "loss": 2.3092, "step": 528110 }, { "epoch": 0.92, "learning_rate": 3.9511085844229676e-06, "loss": 2.187, "step": 528120 }, { "epoch": 0.92, "learning_rate": 3.9502366444961405e-06, "loss": 2.2467, "step": 528130 }, { "epoch": 0.92, "learning_rate": 3.949364704569314e-06, "loss": 2.2985, "step": 528140 }, { "epoch": 0.92, "learning_rate": 3.948492764642488e-06, "loss": 2.2686, "step": 528150 }, { "epoch": 0.92, "learning_rate": 3.947620824715661e-06, "loss": 2.2456, "step": 528160 }, { "epoch": 0.92, "learning_rate": 3.946748884788834e-06, "loss": 2.3095, "step": 528170 }, { "epoch": 0.92, "learning_rate": 3.945876944862007e-06, "loss": 2.286, "step": 528180 }, { "epoch": 0.92, "learning_rate": 3.9450050049351806e-06, "loss": 2.2551, "step": 528190 }, { "epoch": 0.92, "learning_rate": 3.9441330650083535e-06, "loss": 2.2478, "step": 528200 }, { "epoch": 0.92, "learning_rate": 3.943261125081526e-06, "loss": 2.257, "step": 528210 }, { "epoch": 0.92, "learning_rate": 3.942389185154699e-06, "loss": 2.1974, "step": 528220 }, { "epoch": 0.92, "learning_rate": 3.941517245227873e-06, "loss": 2.2346, "step": 528230 }, { "epoch": 0.92, "learning_rate": 3.940645305301046e-06, "loss": 2.2197, "step": 528240 }, { "epoch": 0.92, "learning_rate": 3.939773365374219e-06, "loss": 2.3732, "step": 528250 }, { "epoch": 0.92, "learning_rate": 3.938901425447393e-06, "loss": 2.2154, "step": 528260 }, { "epoch": 0.92, "learning_rate": 3.938029485520566e-06, "loss": 2.2959, "step": 528270 }, { "epoch": 0.92, "learning_rate": 3.937157545593739e-06, "loss": 2.2118, "step": 528280 }, { "epoch": 0.92, "learning_rate": 3.936285605666912e-06, "loss": 2.2474, "step": 528290 }, { "epoch": 0.92, "learning_rate": 3.935413665740085e-06, "loss": 2.3191, "step": 528300 }, { "epoch": 0.92, "learning_rate": 3.934541725813259e-06, "loss": 2.2538, "step": 528310 }, { "epoch": 0.92, "learning_rate": 3.933669785886432e-06, "loss": 2.2869, "step": 528320 }, { "epoch": 0.92, "learning_rate": 3.932797845959605e-06, "loss": 2.2409, "step": 528330 }, { "epoch": 0.92, "learning_rate": 3.931925906032778e-06, "loss": 2.2917, "step": 528340 }, { "epoch": 0.92, "learning_rate": 3.9310539661059516e-06, "loss": 2.3185, "step": 528350 }, { "epoch": 0.92, "learning_rate": 3.9301820261791245e-06, "loss": 2.2106, "step": 528360 }, { "epoch": 0.92, "learning_rate": 3.929310086252297e-06, "loss": 2.3676, "step": 528370 }, { "epoch": 0.92, "learning_rate": 3.92843814632547e-06, "loss": 2.2674, "step": 528380 }, { "epoch": 0.92, "learning_rate": 3.927566206398644e-06, "loss": 2.1977, "step": 528390 }, { "epoch": 0.92, "learning_rate": 3.926694266471817e-06, "loss": 2.07, "step": 528400 }, { "epoch": 0.92, "learning_rate": 3.925822326544991e-06, "loss": 2.2054, "step": 528410 }, { "epoch": 0.92, "learning_rate": 3.924950386618164e-06, "loss": 2.2063, "step": 528420 }, { "epoch": 0.92, "learning_rate": 3.9240784466913375e-06, "loss": 2.3726, "step": 528430 }, { "epoch": 0.92, "learning_rate": 3.92320650676451e-06, "loss": 2.2558, "step": 528440 }, { "epoch": 0.92, "learning_rate": 3.922334566837683e-06, "loss": 2.2481, "step": 528450 }, { "epoch": 0.92, "learning_rate": 3.921462626910856e-06, "loss": 2.2905, "step": 528460 }, { "epoch": 0.92, "learning_rate": 3.92059068698403e-06, "loss": 2.3244, "step": 528470 }, { "epoch": 0.92, "learning_rate": 3.919718747057203e-06, "loss": 2.1739, "step": 528480 }, { "epoch": 0.92, "learning_rate": 3.918846807130376e-06, "loss": 2.1749, "step": 528490 }, { "epoch": 0.92, "learning_rate": 3.917974867203549e-06, "loss": 2.2803, "step": 528500 }, { "epoch": 0.92, "learning_rate": 3.9171029272767226e-06, "loss": 2.2765, "step": 528510 }, { "epoch": 0.92, "learning_rate": 3.9162309873498955e-06, "loss": 2.2405, "step": 528520 }, { "epoch": 0.92, "learning_rate": 3.915359047423068e-06, "loss": 2.2172, "step": 528530 }, { "epoch": 0.92, "learning_rate": 3.914487107496242e-06, "loss": 2.3489, "step": 528540 }, { "epoch": 0.92, "learning_rate": 3.913615167569416e-06, "loss": 2.3097, "step": 528550 }, { "epoch": 0.92, "learning_rate": 3.912743227642589e-06, "loss": 2.2798, "step": 528560 }, { "epoch": 0.92, "learning_rate": 3.911871287715762e-06, "loss": 2.279, "step": 528570 }, { "epoch": 0.92, "learning_rate": 3.910999347788935e-06, "loss": 2.2782, "step": 528580 }, { "epoch": 0.92, "learning_rate": 3.9101274078621085e-06, "loss": 2.2503, "step": 528590 }, { "epoch": 0.92, "learning_rate": 3.909255467935281e-06, "loss": 2.3154, "step": 528600 }, { "epoch": 0.92, "learning_rate": 3.908383528008454e-06, "loss": 2.2351, "step": 528610 }, { "epoch": 0.92, "learning_rate": 3.907511588081627e-06, "loss": 2.1463, "step": 528620 }, { "epoch": 0.92, "learning_rate": 3.906639648154801e-06, "loss": 2.4308, "step": 528630 }, { "epoch": 0.92, "learning_rate": 3.905767708227974e-06, "loss": 2.2107, "step": 528640 }, { "epoch": 0.92, "learning_rate": 3.904895768301147e-06, "loss": 2.3068, "step": 528650 }, { "epoch": 0.92, "learning_rate": 3.904023828374321e-06, "loss": 2.2423, "step": 528660 }, { "epoch": 0.92, "learning_rate": 3.9031518884474936e-06, "loss": 2.2561, "step": 528670 }, { "epoch": 0.92, "learning_rate": 3.902279948520667e-06, "loss": 2.1994, "step": 528680 }, { "epoch": 0.92, "learning_rate": 3.90140800859384e-06, "loss": 2.3444, "step": 528690 }, { "epoch": 0.92, "learning_rate": 3.900536068667013e-06, "loss": 2.1698, "step": 528700 }, { "epoch": 0.92, "learning_rate": 3.899664128740187e-06, "loss": 2.2861, "step": 528710 }, { "epoch": 0.92, "learning_rate": 3.89879218881336e-06, "loss": 2.3246, "step": 528720 }, { "epoch": 0.92, "learning_rate": 3.897920248886533e-06, "loss": 2.3169, "step": 528730 }, { "epoch": 0.92, "learning_rate": 3.897048308959706e-06, "loss": 2.311, "step": 528740 }, { "epoch": 0.92, "learning_rate": 3.8961763690328795e-06, "loss": 2.2523, "step": 528750 }, { "epoch": 0.92, "learning_rate": 3.895304429106052e-06, "loss": 2.3164, "step": 528760 }, { "epoch": 0.92, "learning_rate": 3.894432489179225e-06, "loss": 2.1571, "step": 528770 }, { "epoch": 0.92, "learning_rate": 3.893560549252399e-06, "loss": 2.2802, "step": 528780 }, { "epoch": 0.92, "learning_rate": 3.892688609325572e-06, "loss": 2.249, "step": 528790 }, { "epoch": 0.92, "learning_rate": 3.891816669398745e-06, "loss": 2.2856, "step": 528800 }, { "epoch": 0.92, "learning_rate": 3.890944729471919e-06, "loss": 2.3186, "step": 528810 }, { "epoch": 0.92, "learning_rate": 3.890072789545092e-06, "loss": 2.3591, "step": 528820 }, { "epoch": 0.92, "learning_rate": 3.889200849618265e-06, "loss": 2.3525, "step": 528830 }, { "epoch": 0.92, "learning_rate": 3.888328909691438e-06, "loss": 2.3595, "step": 528840 }, { "epoch": 0.92, "learning_rate": 3.887456969764611e-06, "loss": 2.2556, "step": 528850 }, { "epoch": 0.92, "learning_rate": 3.886585029837784e-06, "loss": 2.2157, "step": 528860 }, { "epoch": 0.92, "learning_rate": 3.885713089910958e-06, "loss": 2.1867, "step": 528870 }, { "epoch": 0.92, "learning_rate": 3.884841149984131e-06, "loss": 2.3758, "step": 528880 }, { "epoch": 0.92, "learning_rate": 3.883969210057304e-06, "loss": 2.3033, "step": 528890 }, { "epoch": 0.92, "learning_rate": 3.883097270130477e-06, "loss": 2.2239, "step": 528900 }, { "epoch": 0.92, "learning_rate": 3.8822253302036505e-06, "loss": 2.17, "step": 528910 }, { "epoch": 0.92, "learning_rate": 3.881353390276823e-06, "loss": 2.3107, "step": 528920 }, { "epoch": 0.92, "learning_rate": 3.880481450349996e-06, "loss": 2.3168, "step": 528930 }, { "epoch": 0.92, "learning_rate": 3.87960951042317e-06, "loss": 2.3086, "step": 528940 }, { "epoch": 0.92, "learning_rate": 3.878737570496344e-06, "loss": 2.3326, "step": 528950 }, { "epoch": 0.92, "learning_rate": 3.877865630569517e-06, "loss": 2.2973, "step": 528960 }, { "epoch": 0.92, "learning_rate": 3.87699369064269e-06, "loss": 2.2107, "step": 528970 }, { "epoch": 0.92, "learning_rate": 3.876121750715863e-06, "loss": 2.3097, "step": 528980 }, { "epoch": 0.92, "learning_rate": 3.875249810789036e-06, "loss": 2.2641, "step": 528990 }, { "epoch": 0.92, "learning_rate": 3.874377870862209e-06, "loss": 2.1811, "step": 529000 }, { "epoch": 0.92, "learning_rate": 3.873505930935382e-06, "loss": 2.2345, "step": 529010 }, { "epoch": 0.92, "learning_rate": 3.872633991008555e-06, "loss": 2.2934, "step": 529020 }, { "epoch": 0.92, "learning_rate": 3.871762051081729e-06, "loss": 2.3385, "step": 529030 }, { "epoch": 0.92, "learning_rate": 3.870890111154902e-06, "loss": 2.2787, "step": 529040 }, { "epoch": 0.92, "learning_rate": 3.870018171228075e-06, "loss": 2.3171, "step": 529050 }, { "epoch": 0.92, "learning_rate": 3.8691462313012486e-06, "loss": 2.3983, "step": 529060 }, { "epoch": 0.92, "learning_rate": 3.8682742913744215e-06, "loss": 2.4258, "step": 529070 }, { "epoch": 0.92, "learning_rate": 3.867402351447595e-06, "loss": 2.2776, "step": 529080 }, { "epoch": 0.92, "learning_rate": 3.866530411520768e-06, "loss": 2.2025, "step": 529090 }, { "epoch": 0.92, "learning_rate": 3.865658471593941e-06, "loss": 2.2437, "step": 529100 }, { "epoch": 0.92, "learning_rate": 3.864786531667115e-06, "loss": 2.3038, "step": 529110 }, { "epoch": 0.92, "learning_rate": 3.863914591740288e-06, "loss": 2.2225, "step": 529120 }, { "epoch": 0.92, "learning_rate": 3.863042651813461e-06, "loss": 2.2331, "step": 529130 }, { "epoch": 0.92, "learning_rate": 3.862170711886634e-06, "loss": 2.1838, "step": 529140 }, { "epoch": 0.92, "learning_rate": 3.861298771959807e-06, "loss": 2.1961, "step": 529150 }, { "epoch": 0.92, "learning_rate": 3.86042683203298e-06, "loss": 2.2117, "step": 529160 }, { "epoch": 0.92, "learning_rate": 3.859554892106153e-06, "loss": 2.3353, "step": 529170 }, { "epoch": 0.92, "learning_rate": 3.858682952179327e-06, "loss": 2.2302, "step": 529180 }, { "epoch": 0.92, "learning_rate": 3.8578110122525e-06, "loss": 2.2929, "step": 529190 }, { "epoch": 0.92, "learning_rate": 3.856939072325673e-06, "loss": 2.3193, "step": 529200 }, { "epoch": 0.92, "learning_rate": 3.856067132398847e-06, "loss": 2.285, "step": 529210 }, { "epoch": 0.92, "learning_rate": 3.8551951924720196e-06, "loss": 2.218, "step": 529220 }, { "epoch": 0.92, "learning_rate": 3.854323252545193e-06, "loss": 2.1947, "step": 529230 }, { "epoch": 0.92, "learning_rate": 3.853451312618366e-06, "loss": 2.2639, "step": 529240 }, { "epoch": 0.92, "learning_rate": 3.852579372691539e-06, "loss": 2.2939, "step": 529250 }, { "epoch": 0.92, "learning_rate": 3.851707432764712e-06, "loss": 2.1668, "step": 529260 }, { "epoch": 0.92, "learning_rate": 3.850835492837886e-06, "loss": 2.2045, "step": 529270 }, { "epoch": 0.92, "learning_rate": 3.849963552911059e-06, "loss": 2.1408, "step": 529280 }, { "epoch": 0.92, "learning_rate": 3.849091612984232e-06, "loss": 2.2926, "step": 529290 }, { "epoch": 0.92, "learning_rate": 3.8482196730574055e-06, "loss": 2.2405, "step": 529300 }, { "epoch": 0.92, "learning_rate": 3.847347733130578e-06, "loss": 2.2676, "step": 529310 }, { "epoch": 0.92, "learning_rate": 3.846475793203751e-06, "loss": 2.2342, "step": 529320 }, { "epoch": 0.92, "learning_rate": 3.845603853276924e-06, "loss": 2.1874, "step": 529330 }, { "epoch": 0.92, "learning_rate": 3.844731913350098e-06, "loss": 2.3103, "step": 529340 }, { "epoch": 0.92, "learning_rate": 3.843859973423272e-06, "loss": 2.1242, "step": 529350 }, { "epoch": 0.92, "learning_rate": 3.842988033496445e-06, "loss": 2.2337, "step": 529360 }, { "epoch": 0.92, "learning_rate": 3.842116093569618e-06, "loss": 2.2281, "step": 529370 }, { "epoch": 0.92, "learning_rate": 3.8412441536427906e-06, "loss": 2.2996, "step": 529380 }, { "epoch": 0.92, "learning_rate": 3.840372213715964e-06, "loss": 2.2428, "step": 529390 }, { "epoch": 0.92, "learning_rate": 3.839500273789137e-06, "loss": 2.3157, "step": 529400 }, { "epoch": 0.92, "learning_rate": 3.83862833386231e-06, "loss": 2.3267, "step": 529410 }, { "epoch": 0.92, "learning_rate": 3.837756393935483e-06, "loss": 2.3833, "step": 529420 }, { "epoch": 0.92, "learning_rate": 3.836884454008657e-06, "loss": 2.2929, "step": 529430 }, { "epoch": 0.92, "learning_rate": 3.83601251408183e-06, "loss": 2.1754, "step": 529440 }, { "epoch": 0.92, "learning_rate": 3.835140574155003e-06, "loss": 2.2474, "step": 529450 }, { "epoch": 0.92, "learning_rate": 3.8342686342281765e-06, "loss": 2.2271, "step": 529460 }, { "epoch": 0.92, "learning_rate": 3.833396694301349e-06, "loss": 2.1705, "step": 529470 }, { "epoch": 0.92, "learning_rate": 3.832524754374523e-06, "loss": 2.2791, "step": 529480 }, { "epoch": 0.92, "learning_rate": 3.831652814447696e-06, "loss": 2.3624, "step": 529490 }, { "epoch": 0.92, "learning_rate": 3.830780874520869e-06, "loss": 2.2585, "step": 529500 }, { "epoch": 0.92, "learning_rate": 3.829908934594043e-06, "loss": 2.2992, "step": 529510 }, { "epoch": 0.92, "learning_rate": 3.829036994667216e-06, "loss": 2.2235, "step": 529520 }, { "epoch": 0.92, "learning_rate": 3.828165054740389e-06, "loss": 2.263, "step": 529530 }, { "epoch": 0.92, "learning_rate": 3.8272931148135616e-06, "loss": 2.3141, "step": 529540 }, { "epoch": 0.92, "learning_rate": 3.826421174886735e-06, "loss": 2.2888, "step": 529550 }, { "epoch": 0.92, "learning_rate": 3.825549234959908e-06, "loss": 2.253, "step": 529560 }, { "epoch": 0.92, "learning_rate": 3.824677295033081e-06, "loss": 2.1746, "step": 529570 }, { "epoch": 0.92, "learning_rate": 3.823805355106255e-06, "loss": 2.293, "step": 529580 }, { "epoch": 0.92, "learning_rate": 3.822933415179428e-06, "loss": 2.2782, "step": 529590 }, { "epoch": 0.92, "learning_rate": 3.822061475252601e-06, "loss": 2.254, "step": 529600 }, { "epoch": 0.92, "learning_rate": 3.8211895353257746e-06, "loss": 2.329, "step": 529610 }, { "epoch": 0.92, "learning_rate": 3.8203175953989475e-06, "loss": 2.2292, "step": 529620 }, { "epoch": 0.92, "learning_rate": 3.819445655472121e-06, "loss": 2.2585, "step": 529630 }, { "epoch": 0.92, "learning_rate": 3.818573715545294e-06, "loss": 2.343, "step": 529640 }, { "epoch": 0.92, "learning_rate": 3.817701775618467e-06, "loss": 2.0914, "step": 529650 }, { "epoch": 0.92, "learning_rate": 3.81682983569164e-06, "loss": 2.3212, "step": 529660 }, { "epoch": 0.92, "learning_rate": 3.815957895764814e-06, "loss": 2.361, "step": 529670 }, { "epoch": 0.92, "learning_rate": 3.815085955837987e-06, "loss": 2.3497, "step": 529680 }, { "epoch": 0.92, "learning_rate": 3.81421401591116e-06, "loss": 2.2011, "step": 529690 }, { "epoch": 0.92, "learning_rate": 3.813342075984333e-06, "loss": 2.174, "step": 529700 }, { "epoch": 0.92, "learning_rate": 3.8124701360575063e-06, "loss": 2.1365, "step": 529710 }, { "epoch": 0.92, "learning_rate": 3.8115981961306793e-06, "loss": 2.1215, "step": 529720 }, { "epoch": 0.92, "learning_rate": 3.8107262562038526e-06, "loss": 2.3216, "step": 529730 }, { "epoch": 0.92, "learning_rate": 3.8098543162770264e-06, "loss": 2.3235, "step": 529740 }, { "epoch": 0.92, "learning_rate": 3.8089823763501993e-06, "loss": 2.2905, "step": 529750 }, { "epoch": 0.92, "learning_rate": 3.8081104364233727e-06, "loss": 2.1971, "step": 529760 }, { "epoch": 0.92, "learning_rate": 3.8072384964965456e-06, "loss": 2.2566, "step": 529770 }, { "epoch": 0.92, "learning_rate": 3.806366556569719e-06, "loss": 2.2751, "step": 529780 }, { "epoch": 0.92, "learning_rate": 3.805494616642892e-06, "loss": 2.3119, "step": 529790 }, { "epoch": 0.92, "learning_rate": 3.804622676716065e-06, "loss": 2.224, "step": 529800 }, { "epoch": 0.92, "learning_rate": 3.803750736789238e-06, "loss": 2.3261, "step": 529810 }, { "epoch": 0.92, "learning_rate": 3.8028787968624115e-06, "loss": 2.3354, "step": 529820 }, { "epoch": 0.92, "learning_rate": 3.802006856935585e-06, "loss": 2.2237, "step": 529830 }, { "epoch": 0.92, "learning_rate": 3.8011349170087577e-06, "loss": 2.3126, "step": 529840 }, { "epoch": 0.92, "learning_rate": 3.800262977081931e-06, "loss": 2.2227, "step": 529850 }, { "epoch": 0.92, "learning_rate": 3.799391037155104e-06, "loss": 2.2999, "step": 529860 }, { "epoch": 0.92, "learning_rate": 3.7985190972282773e-06, "loss": 2.3102, "step": 529870 }, { "epoch": 0.92, "learning_rate": 3.797647157301451e-06, "loss": 2.1868, "step": 529880 }, { "epoch": 0.92, "learning_rate": 3.796775217374624e-06, "loss": 2.3093, "step": 529890 }, { "epoch": 0.92, "learning_rate": 3.7959032774477974e-06, "loss": 2.3609, "step": 529900 }, { "epoch": 0.92, "learning_rate": 3.7950313375209703e-06, "loss": 2.2522, "step": 529910 }, { "epoch": 0.92, "learning_rate": 3.7941593975941437e-06, "loss": 2.1952, "step": 529920 }, { "epoch": 0.92, "learning_rate": 3.7932874576673166e-06, "loss": 2.4004, "step": 529930 }, { "epoch": 0.92, "learning_rate": 3.79241551774049e-06, "loss": 2.3281, "step": 529940 }, { "epoch": 0.92, "learning_rate": 3.7915435778136633e-06, "loss": 2.2447, "step": 529950 }, { "epoch": 0.92, "learning_rate": 3.790671637886836e-06, "loss": 2.218, "step": 529960 }, { "epoch": 0.92, "learning_rate": 3.7897996979600095e-06, "loss": 2.1908, "step": 529970 }, { "epoch": 0.92, "learning_rate": 3.7889277580331825e-06, "loss": 2.2895, "step": 529980 }, { "epoch": 0.92, "learning_rate": 3.788055818106356e-06, "loss": 2.281, "step": 529990 }, { "epoch": 0.92, "learning_rate": 3.7871838781795287e-06, "loss": 2.2828, "step": 530000 }, { "epoch": 0.92, "learning_rate": 3.7863119382527025e-06, "loss": 2.1907, "step": 530010 }, { "epoch": 0.92, "learning_rate": 3.785439998325876e-06, "loss": 2.2742, "step": 530020 }, { "epoch": 0.92, "learning_rate": 3.7845680583990488e-06, "loss": 2.1436, "step": 530030 }, { "epoch": 0.92, "learning_rate": 3.783696118472222e-06, "loss": 2.309, "step": 530040 }, { "epoch": 0.92, "learning_rate": 3.782824178545395e-06, "loss": 2.2215, "step": 530050 }, { "epoch": 0.92, "learning_rate": 3.7819522386185684e-06, "loss": 2.2464, "step": 530060 }, { "epoch": 0.92, "learning_rate": 3.7810802986917413e-06, "loss": 2.2355, "step": 530070 }, { "epoch": 0.92, "learning_rate": 3.7802083587649147e-06, "loss": 2.2877, "step": 530080 }, { "epoch": 0.92, "learning_rate": 3.779336418838088e-06, "loss": 2.2456, "step": 530090 }, { "epoch": 0.92, "learning_rate": 3.778464478911261e-06, "loss": 2.1406, "step": 530100 }, { "epoch": 0.92, "learning_rate": 3.7775925389844343e-06, "loss": 2.2534, "step": 530110 }, { "epoch": 0.92, "learning_rate": 3.776720599057607e-06, "loss": 2.2977, "step": 530120 }, { "epoch": 0.92, "learning_rate": 3.7758486591307805e-06, "loss": 2.2675, "step": 530130 }, { "epoch": 0.92, "learning_rate": 3.7749767192039543e-06, "loss": 2.3178, "step": 530140 }, { "epoch": 0.92, "learning_rate": 3.7741047792771272e-06, "loss": 2.2713, "step": 530150 }, { "epoch": 0.92, "learning_rate": 3.7732328393503006e-06, "loss": 2.1764, "step": 530160 }, { "epoch": 0.92, "learning_rate": 3.7723608994234735e-06, "loss": 2.2213, "step": 530170 }, { "epoch": 0.92, "learning_rate": 3.771488959496647e-06, "loss": 2.3288, "step": 530180 }, { "epoch": 0.92, "learning_rate": 3.7706170195698198e-06, "loss": 2.3528, "step": 530190 }, { "epoch": 0.92, "learning_rate": 3.769745079642993e-06, "loss": 2.2147, "step": 530200 }, { "epoch": 0.92, "learning_rate": 3.7688731397161665e-06, "loss": 2.1127, "step": 530210 }, { "epoch": 0.92, "learning_rate": 3.7680011997893394e-06, "loss": 2.2387, "step": 530220 }, { "epoch": 0.92, "learning_rate": 3.7671292598625127e-06, "loss": 2.1301, "step": 530230 }, { "epoch": 0.92, "learning_rate": 3.7662573199356857e-06, "loss": 2.2443, "step": 530240 }, { "epoch": 0.92, "learning_rate": 3.765385380008859e-06, "loss": 2.3442, "step": 530250 }, { "epoch": 0.92, "learning_rate": 3.764513440082032e-06, "loss": 2.3322, "step": 530260 }, { "epoch": 0.92, "learning_rate": 3.7636415001552053e-06, "loss": 2.319, "step": 530270 }, { "epoch": 0.92, "learning_rate": 3.762769560228379e-06, "loss": 2.2485, "step": 530280 }, { "epoch": 0.92, "learning_rate": 3.761897620301552e-06, "loss": 2.3177, "step": 530290 }, { "epoch": 0.92, "learning_rate": 3.7610256803747253e-06, "loss": 2.3409, "step": 530300 }, { "epoch": 0.92, "learning_rate": 3.7601537404478982e-06, "loss": 2.261, "step": 530310 }, { "epoch": 0.92, "learning_rate": 3.7592818005210716e-06, "loss": 2.1737, "step": 530320 }, { "epoch": 0.92, "learning_rate": 3.7584098605942445e-06, "loss": 2.257, "step": 530330 }, { "epoch": 0.92, "learning_rate": 3.757537920667418e-06, "loss": 2.1924, "step": 530340 }, { "epoch": 0.92, "learning_rate": 3.756665980740591e-06, "loss": 2.2326, "step": 530350 }, { "epoch": 0.92, "learning_rate": 3.755794040813764e-06, "loss": 2.3009, "step": 530360 }, { "epoch": 0.92, "learning_rate": 3.7549221008869375e-06, "loss": 2.3173, "step": 530370 }, { "epoch": 0.92, "learning_rate": 3.7540501609601104e-06, "loss": 2.3047, "step": 530380 }, { "epoch": 0.92, "learning_rate": 3.7531782210332837e-06, "loss": 2.2725, "step": 530390 }, { "epoch": 0.92, "learning_rate": 3.7523062811064567e-06, "loss": 2.2791, "step": 530400 }, { "epoch": 0.92, "learning_rate": 3.7514343411796304e-06, "loss": 2.224, "step": 530410 }, { "epoch": 0.92, "learning_rate": 3.7505624012528038e-06, "loss": 2.2095, "step": 530420 }, { "epoch": 0.93, "learning_rate": 3.7496904613259767e-06, "loss": 2.2576, "step": 530430 }, { "epoch": 0.93, "learning_rate": 3.74881852139915e-06, "loss": 2.1874, "step": 530440 }, { "epoch": 0.93, "learning_rate": 3.747946581472323e-06, "loss": 2.2145, "step": 530450 }, { "epoch": 0.93, "learning_rate": 3.7470746415454963e-06, "loss": 2.2775, "step": 530460 }, { "epoch": 0.93, "learning_rate": 3.7462027016186697e-06, "loss": 2.1692, "step": 530470 }, { "epoch": 0.93, "learning_rate": 3.7453307616918426e-06, "loss": 2.3202, "step": 530480 }, { "epoch": 0.93, "learning_rate": 3.744458821765016e-06, "loss": 2.311, "step": 530490 }, { "epoch": 0.93, "learning_rate": 3.743586881838189e-06, "loss": 2.1241, "step": 530500 }, { "epoch": 0.93, "learning_rate": 3.742714941911362e-06, "loss": 2.2372, "step": 530510 }, { "epoch": 0.93, "learning_rate": 3.741843001984535e-06, "loss": 2.3876, "step": 530520 }, { "epoch": 0.93, "learning_rate": 3.7409710620577085e-06, "loss": 2.0389, "step": 530530 }, { "epoch": 0.93, "learning_rate": 3.7400991221308822e-06, "loss": 2.2576, "step": 530540 }, { "epoch": 0.93, "learning_rate": 3.739227182204055e-06, "loss": 2.2618, "step": 530550 }, { "epoch": 0.93, "learning_rate": 3.7383552422772285e-06, "loss": 2.3099, "step": 530560 }, { "epoch": 0.93, "learning_rate": 3.7374833023504014e-06, "loss": 2.2231, "step": 530570 }, { "epoch": 0.93, "learning_rate": 3.7366113624235748e-06, "loss": 2.1881, "step": 530580 }, { "epoch": 0.93, "learning_rate": 3.7357394224967477e-06, "loss": 2.1861, "step": 530590 }, { "epoch": 0.93, "learning_rate": 3.734867482569921e-06, "loss": 2.2241, "step": 530600 }, { "epoch": 0.93, "learning_rate": 3.7339955426430944e-06, "loss": 2.2315, "step": 530610 }, { "epoch": 0.93, "learning_rate": 3.7331236027162673e-06, "loss": 2.1618, "step": 530620 }, { "epoch": 0.93, "learning_rate": 3.7322516627894407e-06, "loss": 2.3327, "step": 530630 }, { "epoch": 0.93, "learning_rate": 3.7313797228626136e-06, "loss": 2.2402, "step": 530640 }, { "epoch": 0.93, "learning_rate": 3.730507782935787e-06, "loss": 2.1857, "step": 530650 }, { "epoch": 0.93, "learning_rate": 3.72963584300896e-06, "loss": 2.3156, "step": 530660 }, { "epoch": 0.93, "learning_rate": 3.7287639030821336e-06, "loss": 2.3496, "step": 530670 }, { "epoch": 0.93, "learning_rate": 3.727891963155307e-06, "loss": 2.275, "step": 530680 }, { "epoch": 0.93, "learning_rate": 3.72702002322848e-06, "loss": 2.1659, "step": 530690 }, { "epoch": 0.93, "learning_rate": 3.7261480833016532e-06, "loss": 2.2946, "step": 530700 }, { "epoch": 0.93, "learning_rate": 3.725276143374826e-06, "loss": 2.2618, "step": 530710 }, { "epoch": 0.93, "learning_rate": 3.7244042034479995e-06, "loss": 2.2274, "step": 530720 }, { "epoch": 0.93, "learning_rate": 3.723532263521173e-06, "loss": 2.2916, "step": 530730 }, { "epoch": 0.93, "learning_rate": 3.7226603235943458e-06, "loss": 2.1984, "step": 530740 }, { "epoch": 0.93, "learning_rate": 3.721788383667519e-06, "loss": 2.2969, "step": 530750 }, { "epoch": 0.93, "learning_rate": 3.720916443740692e-06, "loss": 2.288, "step": 530760 }, { "epoch": 0.93, "learning_rate": 3.7200445038138654e-06, "loss": 2.3209, "step": 530770 }, { "epoch": 0.93, "learning_rate": 3.7191725638870383e-06, "loss": 2.272, "step": 530780 }, { "epoch": 0.93, "learning_rate": 3.7183006239602117e-06, "loss": 2.1877, "step": 530790 }, { "epoch": 0.93, "learning_rate": 3.7174286840333846e-06, "loss": 2.2782, "step": 530800 }, { "epoch": 0.93, "learning_rate": 3.7165567441065584e-06, "loss": 2.2273, "step": 530810 }, { "epoch": 0.93, "learning_rate": 3.7156848041797317e-06, "loss": 2.2624, "step": 530820 }, { "epoch": 0.93, "learning_rate": 3.7148128642529046e-06, "loss": 2.1843, "step": 530830 }, { "epoch": 0.93, "learning_rate": 3.713940924326078e-06, "loss": 2.2825, "step": 530840 }, { "epoch": 0.93, "learning_rate": 3.713068984399251e-06, "loss": 2.2386, "step": 530850 }, { "epoch": 0.93, "learning_rate": 3.7121970444724242e-06, "loss": 2.1365, "step": 530860 }, { "epoch": 0.93, "learning_rate": 3.7113251045455976e-06, "loss": 2.1917, "step": 530870 }, { "epoch": 0.93, "learning_rate": 3.7104531646187705e-06, "loss": 2.303, "step": 530880 }, { "epoch": 0.93, "learning_rate": 3.709581224691944e-06, "loss": 2.2696, "step": 530890 }, { "epoch": 0.93, "learning_rate": 3.7087092847651168e-06, "loss": 2.2281, "step": 530900 }, { "epoch": 0.93, "learning_rate": 3.70783734483829e-06, "loss": 2.1166, "step": 530910 }, { "epoch": 0.93, "learning_rate": 3.706965404911463e-06, "loss": 2.2791, "step": 530920 }, { "epoch": 0.93, "learning_rate": 3.7060934649846364e-06, "loss": 2.3143, "step": 530930 }, { "epoch": 0.93, "learning_rate": 3.70522152505781e-06, "loss": 2.1888, "step": 530940 }, { "epoch": 0.93, "learning_rate": 3.704349585130983e-06, "loss": 2.2018, "step": 530950 }, { "epoch": 0.93, "learning_rate": 3.7034776452041564e-06, "loss": 2.2419, "step": 530960 }, { "epoch": 0.93, "learning_rate": 3.7026057052773294e-06, "loss": 2.3235, "step": 530970 }, { "epoch": 0.93, "learning_rate": 3.7017337653505027e-06, "loss": 2.4075, "step": 530980 }, { "epoch": 0.93, "learning_rate": 3.700861825423676e-06, "loss": 2.2271, "step": 530990 }, { "epoch": 0.93, "learning_rate": 3.699989885496849e-06, "loss": 2.2836, "step": 531000 }, { "epoch": 0.93, "learning_rate": 3.6991179455700223e-06, "loss": 2.2379, "step": 531010 }, { "epoch": 0.93, "learning_rate": 3.6982460056431952e-06, "loss": 2.226, "step": 531020 }, { "epoch": 0.93, "learning_rate": 3.6973740657163686e-06, "loss": 2.3035, "step": 531030 }, { "epoch": 0.93, "learning_rate": 3.6965021257895415e-06, "loss": 2.3299, "step": 531040 }, { "epoch": 0.93, "learning_rate": 3.695630185862715e-06, "loss": 2.2689, "step": 531050 }, { "epoch": 0.93, "learning_rate": 3.6947582459358878e-06, "loss": 2.083, "step": 531060 }, { "epoch": 0.93, "learning_rate": 3.6938863060090616e-06, "loss": 2.3011, "step": 531070 }, { "epoch": 0.93, "learning_rate": 3.693014366082235e-06, "loss": 2.3382, "step": 531080 }, { "epoch": 0.93, "learning_rate": 3.692142426155408e-06, "loss": 2.2576, "step": 531090 }, { "epoch": 0.93, "learning_rate": 3.691270486228581e-06, "loss": 2.2803, "step": 531100 }, { "epoch": 0.93, "learning_rate": 3.690398546301754e-06, "loss": 2.2515, "step": 531110 }, { "epoch": 0.93, "learning_rate": 3.6895266063749274e-06, "loss": 2.2292, "step": 531120 }, { "epoch": 0.93, "learning_rate": 3.6886546664481008e-06, "loss": 2.3099, "step": 531130 }, { "epoch": 0.93, "learning_rate": 3.6877827265212737e-06, "loss": 2.2523, "step": 531140 }, { "epoch": 0.93, "learning_rate": 3.686910786594447e-06, "loss": 2.342, "step": 531150 }, { "epoch": 0.93, "learning_rate": 3.68603884666762e-06, "loss": 2.3068, "step": 531160 }, { "epoch": 0.93, "learning_rate": 3.6851669067407933e-06, "loss": 2.2895, "step": 531170 }, { "epoch": 0.93, "learning_rate": 3.6842949668139662e-06, "loss": 2.1714, "step": 531180 }, { "epoch": 0.93, "learning_rate": 3.6834230268871396e-06, "loss": 2.2728, "step": 531190 }, { "epoch": 0.93, "learning_rate": 3.6825510869603125e-06, "loss": 2.2842, "step": 531200 }, { "epoch": 0.93, "learning_rate": 3.6816791470334863e-06, "loss": 2.153, "step": 531210 }, { "epoch": 0.93, "learning_rate": 3.6808072071066596e-06, "loss": 2.3774, "step": 531220 }, { "epoch": 0.93, "learning_rate": 3.6799352671798326e-06, "loss": 2.3966, "step": 531230 }, { "epoch": 0.93, "learning_rate": 3.679063327253006e-06, "loss": 2.2222, "step": 531240 }, { "epoch": 0.93, "learning_rate": 3.6781913873261792e-06, "loss": 2.2868, "step": 531250 }, { "epoch": 0.93, "learning_rate": 3.677319447399352e-06, "loss": 2.2377, "step": 531260 }, { "epoch": 0.93, "learning_rate": 3.6764475074725255e-06, "loss": 2.3106, "step": 531270 }, { "epoch": 0.93, "learning_rate": 3.6755755675456984e-06, "loss": 2.3176, "step": 531280 }, { "epoch": 0.93, "learning_rate": 3.6747036276188718e-06, "loss": 2.2431, "step": 531290 }, { "epoch": 0.93, "learning_rate": 3.6738316876920447e-06, "loss": 2.2523, "step": 531300 }, { "epoch": 0.93, "learning_rate": 3.672959747765218e-06, "loss": 2.1491, "step": 531310 }, { "epoch": 0.93, "learning_rate": 3.672087807838391e-06, "loss": 2.228, "step": 531320 }, { "epoch": 0.93, "learning_rate": 3.6712158679115643e-06, "loss": 2.276, "step": 531330 }, { "epoch": 0.93, "learning_rate": 3.670343927984738e-06, "loss": 2.1837, "step": 531340 }, { "epoch": 0.93, "learning_rate": 3.669471988057911e-06, "loss": 2.3741, "step": 531350 }, { "epoch": 0.93, "learning_rate": 3.6686000481310844e-06, "loss": 2.2402, "step": 531360 }, { "epoch": 0.93, "learning_rate": 3.6677281082042577e-06, "loss": 2.209, "step": 531370 }, { "epoch": 0.93, "learning_rate": 3.6668561682774306e-06, "loss": 2.3007, "step": 531380 }, { "epoch": 0.93, "learning_rate": 3.665984228350604e-06, "loss": 2.2506, "step": 531390 }, { "epoch": 0.93, "learning_rate": 3.665112288423777e-06, "loss": 2.1751, "step": 531400 }, { "epoch": 0.93, "learning_rate": 3.6642403484969502e-06, "loss": 2.2998, "step": 531410 }, { "epoch": 0.93, "learning_rate": 3.663368408570123e-06, "loss": 2.3238, "step": 531420 }, { "epoch": 0.93, "learning_rate": 3.6624964686432965e-06, "loss": 2.2079, "step": 531430 }, { "epoch": 0.93, "learning_rate": 3.6616245287164694e-06, "loss": 2.1828, "step": 531440 }, { "epoch": 0.93, "learning_rate": 3.6607525887896428e-06, "loss": 2.284, "step": 531450 }, { "epoch": 0.93, "learning_rate": 3.6598806488628157e-06, "loss": 2.1897, "step": 531460 }, { "epoch": 0.93, "learning_rate": 3.6590087089359895e-06, "loss": 2.3235, "step": 531470 }, { "epoch": 0.93, "learning_rate": 3.658136769009163e-06, "loss": 2.2138, "step": 531480 }, { "epoch": 0.93, "learning_rate": 3.6572648290823357e-06, "loss": 2.2282, "step": 531490 }, { "epoch": 0.93, "learning_rate": 3.656392889155509e-06, "loss": 2.2667, "step": 531500 }, { "epoch": 0.93, "learning_rate": 3.6555209492286824e-06, "loss": 2.3041, "step": 531510 }, { "epoch": 0.93, "learning_rate": 3.6546490093018554e-06, "loss": 2.3017, "step": 531520 }, { "epoch": 0.93, "learning_rate": 3.6537770693750287e-06, "loss": 2.3076, "step": 531530 }, { "epoch": 0.93, "learning_rate": 3.6529051294482016e-06, "loss": 2.1581, "step": 531540 }, { "epoch": 0.93, "learning_rate": 3.652033189521375e-06, "loss": 2.1707, "step": 531550 }, { "epoch": 0.93, "learning_rate": 3.651161249594548e-06, "loss": 2.2171, "step": 531560 }, { "epoch": 0.93, "learning_rate": 3.6502893096677212e-06, "loss": 2.2004, "step": 531570 }, { "epoch": 0.93, "learning_rate": 3.649417369740894e-06, "loss": 2.2313, "step": 531580 }, { "epoch": 0.93, "learning_rate": 3.6485454298140675e-06, "loss": 2.2715, "step": 531590 }, { "epoch": 0.93, "learning_rate": 3.6476734898872404e-06, "loss": 2.3293, "step": 531600 }, { "epoch": 0.93, "learning_rate": 3.646801549960414e-06, "loss": 2.2932, "step": 531610 }, { "epoch": 0.93, "learning_rate": 3.6459296100335876e-06, "loss": 2.2361, "step": 531620 }, { "epoch": 0.93, "learning_rate": 3.645057670106761e-06, "loss": 2.3005, "step": 531630 }, { "epoch": 0.93, "learning_rate": 3.644185730179934e-06, "loss": 2.2168, "step": 531640 }, { "epoch": 0.93, "learning_rate": 3.643313790253107e-06, "loss": 2.3165, "step": 531650 }, { "epoch": 0.93, "learning_rate": 3.64244185032628e-06, "loss": 2.2469, "step": 531660 }, { "epoch": 0.93, "learning_rate": 3.6415699103994534e-06, "loss": 2.3345, "step": 531670 }, { "epoch": 0.93, "learning_rate": 3.6406979704726264e-06, "loss": 2.3305, "step": 531680 }, { "epoch": 0.93, "learning_rate": 3.6398260305457997e-06, "loss": 2.2385, "step": 531690 }, { "epoch": 0.93, "learning_rate": 3.6389540906189726e-06, "loss": 2.3255, "step": 531700 }, { "epoch": 0.93, "learning_rate": 3.638082150692146e-06, "loss": 2.2056, "step": 531710 }, { "epoch": 0.93, "learning_rate": 3.637210210765319e-06, "loss": 2.1902, "step": 531720 }, { "epoch": 0.93, "learning_rate": 3.6363382708384922e-06, "loss": 2.218, "step": 531730 }, { "epoch": 0.93, "learning_rate": 3.635466330911666e-06, "loss": 2.2024, "step": 531740 }, { "epoch": 0.93, "learning_rate": 3.634594390984839e-06, "loss": 2.1747, "step": 531750 }, { "epoch": 0.93, "learning_rate": 3.6337224510580123e-06, "loss": 2.319, "step": 531760 }, { "epoch": 0.93, "learning_rate": 3.6328505111311856e-06, "loss": 2.243, "step": 531770 }, { "epoch": 0.93, "learning_rate": 3.6319785712043586e-06, "loss": 2.1829, "step": 531780 }, { "epoch": 0.93, "learning_rate": 3.631106631277532e-06, "loss": 2.2186, "step": 531790 }, { "epoch": 0.93, "learning_rate": 3.630234691350705e-06, "loss": 2.1927, "step": 531800 }, { "epoch": 0.93, "learning_rate": 3.629362751423878e-06, "loss": 2.2249, "step": 531810 }, { "epoch": 0.93, "learning_rate": 3.628490811497051e-06, "loss": 2.2447, "step": 531820 }, { "epoch": 0.93, "learning_rate": 3.6276188715702244e-06, "loss": 2.1663, "step": 531830 }, { "epoch": 0.93, "learning_rate": 3.6267469316433974e-06, "loss": 2.3668, "step": 531840 }, { "epoch": 0.93, "learning_rate": 3.6258749917165707e-06, "loss": 2.2507, "step": 531850 }, { "epoch": 0.93, "learning_rate": 3.6250030517897436e-06, "loss": 2.3141, "step": 531860 }, { "epoch": 0.93, "learning_rate": 3.6241311118629174e-06, "loss": 2.188, "step": 531870 }, { "epoch": 0.93, "learning_rate": 3.6232591719360907e-06, "loss": 2.1261, "step": 531880 }, { "epoch": 0.93, "learning_rate": 3.622387232009264e-06, "loss": 2.2262, "step": 531890 }, { "epoch": 0.93, "learning_rate": 3.621515292082437e-06, "loss": 2.213, "step": 531900 }, { "epoch": 0.93, "learning_rate": 3.6206433521556104e-06, "loss": 2.2301, "step": 531910 }, { "epoch": 0.93, "learning_rate": 3.6197714122287833e-06, "loss": 2.2684, "step": 531920 }, { "epoch": 0.93, "learning_rate": 3.6188994723019566e-06, "loss": 2.1987, "step": 531930 }, { "epoch": 0.93, "learning_rate": 3.6180275323751296e-06, "loss": 2.3346, "step": 531940 }, { "epoch": 0.93, "learning_rate": 3.617155592448303e-06, "loss": 2.2453, "step": 531950 }, { "epoch": 0.93, "learning_rate": 3.616283652521476e-06, "loss": 2.2199, "step": 531960 }, { "epoch": 0.93, "learning_rate": 3.615411712594649e-06, "loss": 2.3475, "step": 531970 }, { "epoch": 0.93, "learning_rate": 3.614539772667822e-06, "loss": 2.3182, "step": 531980 }, { "epoch": 0.93, "learning_rate": 3.6136678327409954e-06, "loss": 2.0041, "step": 531990 }, { "epoch": 0.93, "learning_rate": 3.6127958928141692e-06, "loss": 2.2182, "step": 532000 }, { "epoch": 0.93, "learning_rate": 3.611923952887342e-06, "loss": 2.1656, "step": 532010 }, { "epoch": 0.93, "learning_rate": 3.6110520129605155e-06, "loss": 2.3005, "step": 532020 }, { "epoch": 0.93, "learning_rate": 3.610180073033689e-06, "loss": 2.2463, "step": 532030 }, { "epoch": 0.93, "learning_rate": 3.6093081331068618e-06, "loss": 2.1894, "step": 532040 }, { "epoch": 0.93, "learning_rate": 3.608436193180035e-06, "loss": 2.3269, "step": 532050 }, { "epoch": 0.93, "learning_rate": 3.607564253253208e-06, "loss": 2.3251, "step": 532060 }, { "epoch": 0.93, "learning_rate": 3.6066923133263814e-06, "loss": 2.3544, "step": 532070 }, { "epoch": 0.93, "learning_rate": 3.6058203733995543e-06, "loss": 2.3052, "step": 532080 }, { "epoch": 0.93, "learning_rate": 3.6049484334727276e-06, "loss": 2.1812, "step": 532090 }, { "epoch": 0.93, "learning_rate": 3.6040764935459006e-06, "loss": 2.2686, "step": 532100 }, { "epoch": 0.93, "learning_rate": 3.603204553619074e-06, "loss": 2.2499, "step": 532110 }, { "epoch": 0.93, "learning_rate": 3.602332613692247e-06, "loss": 2.1908, "step": 532120 }, { "epoch": 0.93, "learning_rate": 3.60146067376542e-06, "loss": 2.3209, "step": 532130 }, { "epoch": 0.93, "learning_rate": 3.600588733838594e-06, "loss": 2.2806, "step": 532140 }, { "epoch": 0.93, "learning_rate": 3.5997167939117673e-06, "loss": 2.3178, "step": 532150 }, { "epoch": 0.93, "learning_rate": 3.5988448539849402e-06, "loss": 2.2125, "step": 532160 }, { "epoch": 0.93, "learning_rate": 3.5979729140581136e-06, "loss": 2.2375, "step": 532170 }, { "epoch": 0.93, "learning_rate": 3.5971009741312865e-06, "loss": 2.2681, "step": 532180 }, { "epoch": 0.93, "learning_rate": 3.59622903420446e-06, "loss": 2.2903, "step": 532190 }, { "epoch": 0.93, "learning_rate": 3.5953570942776328e-06, "loss": 2.2666, "step": 532200 }, { "epoch": 0.93, "learning_rate": 3.594485154350806e-06, "loss": 2.3087, "step": 532210 }, { "epoch": 0.93, "learning_rate": 3.593613214423979e-06, "loss": 2.2813, "step": 532220 }, { "epoch": 0.93, "learning_rate": 3.5927412744971524e-06, "loss": 2.283, "step": 532230 }, { "epoch": 0.93, "learning_rate": 3.5918693345703253e-06, "loss": 2.3044, "step": 532240 }, { "epoch": 0.93, "learning_rate": 3.5909973946434986e-06, "loss": 2.257, "step": 532250 }, { "epoch": 0.93, "learning_rate": 3.5901254547166716e-06, "loss": 2.2303, "step": 532260 }, { "epoch": 0.93, "learning_rate": 3.5892535147898453e-06, "loss": 2.0543, "step": 532270 }, { "epoch": 0.93, "learning_rate": 3.5883815748630187e-06, "loss": 2.3175, "step": 532280 }, { "epoch": 0.93, "learning_rate": 3.587509634936192e-06, "loss": 2.1778, "step": 532290 }, { "epoch": 0.93, "learning_rate": 3.586637695009365e-06, "loss": 2.279, "step": 532300 }, { "epoch": 0.93, "learning_rate": 3.5857657550825383e-06, "loss": 2.2472, "step": 532310 }, { "epoch": 0.93, "learning_rate": 3.5848938151557112e-06, "loss": 2.1796, "step": 532320 }, { "epoch": 0.93, "learning_rate": 3.5840218752288846e-06, "loss": 2.2346, "step": 532330 }, { "epoch": 0.93, "learning_rate": 3.5831499353020575e-06, "loss": 2.207, "step": 532340 }, { "epoch": 0.93, "learning_rate": 3.582277995375231e-06, "loss": 2.3044, "step": 532350 }, { "epoch": 0.93, "learning_rate": 3.5814060554484038e-06, "loss": 2.2831, "step": 532360 }, { "epoch": 0.93, "learning_rate": 3.580534115521577e-06, "loss": 2.3154, "step": 532370 }, { "epoch": 0.93, "learning_rate": 3.57966217559475e-06, "loss": 2.3359, "step": 532380 }, { "epoch": 0.93, "learning_rate": 3.5787902356679234e-06, "loss": 2.2497, "step": 532390 }, { "epoch": 0.93, "learning_rate": 3.577918295741097e-06, "loss": 2.1722, "step": 532400 }, { "epoch": 0.93, "learning_rate": 3.5770463558142705e-06, "loss": 2.3471, "step": 532410 }, { "epoch": 0.93, "learning_rate": 3.5761744158874434e-06, "loss": 2.2032, "step": 532420 }, { "epoch": 0.93, "learning_rate": 3.5753024759606168e-06, "loss": 2.2162, "step": 532430 }, { "epoch": 0.93, "learning_rate": 3.5744305360337897e-06, "loss": 2.2597, "step": 532440 }, { "epoch": 0.93, "learning_rate": 3.573558596106963e-06, "loss": 2.3014, "step": 532450 }, { "epoch": 0.93, "learning_rate": 3.572686656180136e-06, "loss": 2.3223, "step": 532460 }, { "epoch": 0.93, "learning_rate": 3.5718147162533093e-06, "loss": 2.2229, "step": 532470 }, { "epoch": 0.93, "learning_rate": 3.5709427763264822e-06, "loss": 2.2874, "step": 532480 }, { "epoch": 0.93, "learning_rate": 3.5700708363996556e-06, "loss": 2.1721, "step": 532490 }, { "epoch": 0.93, "learning_rate": 3.5691988964728285e-06, "loss": 2.3954, "step": 532500 }, { "epoch": 0.93, "learning_rate": 3.568326956546002e-06, "loss": 2.2023, "step": 532510 }, { "epoch": 0.93, "learning_rate": 3.5674550166191748e-06, "loss": 2.2505, "step": 532520 }, { "epoch": 0.93, "learning_rate": 3.566583076692348e-06, "loss": 2.3498, "step": 532530 }, { "epoch": 0.93, "learning_rate": 3.565711136765522e-06, "loss": 2.3234, "step": 532540 }, { "epoch": 0.93, "learning_rate": 3.5648391968386952e-06, "loss": 2.32, "step": 532550 }, { "epoch": 0.93, "learning_rate": 3.563967256911868e-06, "loss": 2.2989, "step": 532560 }, { "epoch": 0.93, "learning_rate": 3.5630953169850415e-06, "loss": 2.1259, "step": 532570 }, { "epoch": 0.93, "learning_rate": 3.5622233770582144e-06, "loss": 2.3008, "step": 532580 }, { "epoch": 0.93, "learning_rate": 3.5613514371313878e-06, "loss": 2.2789, "step": 532590 }, { "epoch": 0.93, "learning_rate": 3.5604794972045607e-06, "loss": 2.1415, "step": 532600 }, { "epoch": 0.93, "learning_rate": 3.559607557277734e-06, "loss": 2.2772, "step": 532610 }, { "epoch": 0.93, "learning_rate": 3.558735617350907e-06, "loss": 2.1764, "step": 532620 }, { "epoch": 0.93, "learning_rate": 3.5578636774240803e-06, "loss": 2.2841, "step": 532630 }, { "epoch": 0.93, "learning_rate": 3.5569917374972532e-06, "loss": 2.3178, "step": 532640 }, { "epoch": 0.93, "learning_rate": 3.5561197975704266e-06, "loss": 2.3074, "step": 532650 }, { "epoch": 0.93, "learning_rate": 3.5552478576435995e-06, "loss": 2.2043, "step": 532660 }, { "epoch": 0.93, "learning_rate": 3.5543759177167737e-06, "loss": 2.3038, "step": 532670 }, { "epoch": 0.93, "learning_rate": 3.5535039777899466e-06, "loss": 2.2804, "step": 532680 }, { "epoch": 0.93, "learning_rate": 3.55263203786312e-06, "loss": 2.1827, "step": 532690 }, { "epoch": 0.93, "learning_rate": 3.551760097936293e-06, "loss": 2.163, "step": 532700 }, { "epoch": 0.93, "learning_rate": 3.5508881580094662e-06, "loss": 2.2345, "step": 532710 }, { "epoch": 0.93, "learning_rate": 3.550016218082639e-06, "loss": 2.3177, "step": 532720 }, { "epoch": 0.93, "learning_rate": 3.5491442781558125e-06, "loss": 2.1984, "step": 532730 }, { "epoch": 0.93, "learning_rate": 3.5482723382289854e-06, "loss": 2.2816, "step": 532740 }, { "epoch": 0.93, "learning_rate": 3.5474003983021588e-06, "loss": 2.2675, "step": 532750 }, { "epoch": 0.93, "learning_rate": 3.5465284583753317e-06, "loss": 2.3153, "step": 532760 }, { "epoch": 0.93, "learning_rate": 3.545656518448505e-06, "loss": 2.1843, "step": 532770 }, { "epoch": 0.93, "learning_rate": 3.544784578521678e-06, "loss": 2.235, "step": 532780 }, { "epoch": 0.93, "learning_rate": 3.5439126385948513e-06, "loss": 2.1979, "step": 532790 }, { "epoch": 0.93, "learning_rate": 3.543040698668025e-06, "loss": 2.2039, "step": 532800 }, { "epoch": 0.93, "learning_rate": 3.5421687587411984e-06, "loss": 2.2391, "step": 532810 }, { "epoch": 0.93, "learning_rate": 3.5412968188143713e-06, "loss": 2.2328, "step": 532820 }, { "epoch": 0.93, "learning_rate": 3.5404248788875447e-06, "loss": 2.3527, "step": 532830 }, { "epoch": 0.93, "learning_rate": 3.5395529389607176e-06, "loss": 2.3501, "step": 532840 }, { "epoch": 0.93, "learning_rate": 3.538680999033891e-06, "loss": 2.3038, "step": 532850 }, { "epoch": 0.93, "learning_rate": 3.537809059107064e-06, "loss": 2.3055, "step": 532860 }, { "epoch": 0.93, "learning_rate": 3.5369371191802372e-06, "loss": 2.3335, "step": 532870 }, { "epoch": 0.93, "learning_rate": 3.53606517925341e-06, "loss": 2.1543, "step": 532880 }, { "epoch": 0.93, "learning_rate": 3.5351932393265835e-06, "loss": 2.3897, "step": 532890 }, { "epoch": 0.93, "learning_rate": 3.5343212993997564e-06, "loss": 2.345, "step": 532900 }, { "epoch": 0.93, "learning_rate": 3.5334493594729298e-06, "loss": 2.2098, "step": 532910 }, { "epoch": 0.93, "learning_rate": 3.5325774195461027e-06, "loss": 2.2146, "step": 532920 }, { "epoch": 0.93, "learning_rate": 3.531705479619276e-06, "loss": 2.3104, "step": 532930 }, { "epoch": 0.93, "learning_rate": 3.53083353969245e-06, "loss": 2.2872, "step": 532940 }, { "epoch": 0.93, "learning_rate": 3.529961599765623e-06, "loss": 2.1525, "step": 532950 }, { "epoch": 0.93, "learning_rate": 3.529089659838796e-06, "loss": 2.2936, "step": 532960 }, { "epoch": 0.93, "learning_rate": 3.5282177199119694e-06, "loss": 2.2488, "step": 532970 }, { "epoch": 0.93, "learning_rate": 3.5273457799851423e-06, "loss": 2.2132, "step": 532980 }, { "epoch": 0.93, "learning_rate": 3.5264738400583157e-06, "loss": 2.1815, "step": 532990 }, { "epoch": 0.93, "learning_rate": 3.5256019001314886e-06, "loss": 2.1018, "step": 533000 }, { "epoch": 0.93, "learning_rate": 3.524729960204662e-06, "loss": 2.2702, "step": 533010 }, { "epoch": 0.93, "learning_rate": 3.523858020277835e-06, "loss": 2.2127, "step": 533020 }, { "epoch": 0.93, "learning_rate": 3.5229860803510082e-06, "loss": 2.3189, "step": 533030 }, { "epoch": 0.93, "learning_rate": 3.522114140424181e-06, "loss": 2.1812, "step": 533040 }, { "epoch": 0.93, "learning_rate": 3.5212422004973545e-06, "loss": 2.3011, "step": 533050 }, { "epoch": 0.93, "learning_rate": 3.5203702605705274e-06, "loss": 2.1871, "step": 533060 }, { "epoch": 0.93, "learning_rate": 3.5194983206437016e-06, "loss": 2.2964, "step": 533070 }, { "epoch": 0.93, "learning_rate": 3.5186263807168745e-06, "loss": 2.2158, "step": 533080 }, { "epoch": 0.93, "learning_rate": 3.517754440790048e-06, "loss": 2.2663, "step": 533090 }, { "epoch": 0.93, "learning_rate": 3.516882500863221e-06, "loss": 2.3093, "step": 533100 }, { "epoch": 0.93, "learning_rate": 3.516010560936394e-06, "loss": 2.2594, "step": 533110 }, { "epoch": 0.93, "learning_rate": 3.515138621009567e-06, "loss": 2.3665, "step": 533120 }, { "epoch": 0.93, "learning_rate": 3.5142666810827404e-06, "loss": 2.1679, "step": 533130 }, { "epoch": 0.93, "learning_rate": 3.5133947411559133e-06, "loss": 2.3013, "step": 533140 }, { "epoch": 0.93, "learning_rate": 3.5125228012290867e-06, "loss": 2.3236, "step": 533150 }, { "epoch": 0.93, "learning_rate": 3.5116508613022596e-06, "loss": 2.2488, "step": 533160 }, { "epoch": 0.93, "learning_rate": 3.510778921375433e-06, "loss": 2.3885, "step": 533170 }, { "epoch": 0.93, "learning_rate": 3.509906981448606e-06, "loss": 2.1666, "step": 533180 }, { "epoch": 0.93, "learning_rate": 3.5090350415217792e-06, "loss": 2.3521, "step": 533190 }, { "epoch": 0.93, "learning_rate": 3.508163101594953e-06, "loss": 2.2115, "step": 533200 }, { "epoch": 0.93, "learning_rate": 3.5072911616681263e-06, "loss": 2.2578, "step": 533210 }, { "epoch": 0.93, "learning_rate": 3.5064192217412993e-06, "loss": 2.1985, "step": 533220 }, { "epoch": 0.93, "learning_rate": 3.5055472818144726e-06, "loss": 2.2874, "step": 533230 }, { "epoch": 0.93, "learning_rate": 3.5046753418876455e-06, "loss": 2.239, "step": 533240 }, { "epoch": 0.93, "learning_rate": 3.503803401960819e-06, "loss": 2.2371, "step": 533250 }, { "epoch": 0.93, "learning_rate": 3.502931462033992e-06, "loss": 2.2925, "step": 533260 }, { "epoch": 0.93, "learning_rate": 3.502059522107165e-06, "loss": 2.2873, "step": 533270 }, { "epoch": 0.93, "learning_rate": 3.501187582180338e-06, "loss": 2.3071, "step": 533280 }, { "epoch": 0.93, "learning_rate": 3.5003156422535114e-06, "loss": 2.1931, "step": 533290 }, { "epoch": 0.93, "learning_rate": 3.4994437023266843e-06, "loss": 2.284, "step": 533300 }, { "epoch": 0.93, "learning_rate": 3.4985717623998577e-06, "loss": 2.3184, "step": 533310 }, { "epoch": 0.93, "learning_rate": 3.4976998224730306e-06, "loss": 2.265, "step": 533320 }, { "epoch": 0.93, "learning_rate": 3.496827882546205e-06, "loss": 2.2631, "step": 533330 }, { "epoch": 0.93, "learning_rate": 3.4959559426193777e-06, "loss": 2.2034, "step": 533340 }, { "epoch": 0.93, "learning_rate": 3.495084002692551e-06, "loss": 2.265, "step": 533350 }, { "epoch": 0.93, "learning_rate": 3.494212062765724e-06, "loss": 2.402, "step": 533360 }, { "epoch": 0.93, "learning_rate": 3.4933401228388973e-06, "loss": 2.4324, "step": 533370 }, { "epoch": 0.93, "learning_rate": 3.4924681829120703e-06, "loss": 2.2677, "step": 533380 }, { "epoch": 0.93, "learning_rate": 3.4915962429852436e-06, "loss": 2.255, "step": 533390 }, { "epoch": 0.93, "learning_rate": 3.4907243030584165e-06, "loss": 2.1521, "step": 533400 }, { "epoch": 0.93, "learning_rate": 3.48985236313159e-06, "loss": 2.3285, "step": 533410 }, { "epoch": 0.93, "learning_rate": 3.488980423204763e-06, "loss": 2.1899, "step": 533420 }, { "epoch": 0.93, "learning_rate": 3.488108483277936e-06, "loss": 2.1583, "step": 533430 }, { "epoch": 0.93, "learning_rate": 3.487236543351109e-06, "loss": 2.2142, "step": 533440 }, { "epoch": 0.93, "learning_rate": 3.4863646034242824e-06, "loss": 2.2307, "step": 533450 }, { "epoch": 0.93, "learning_rate": 3.4854926634974553e-06, "loss": 2.129, "step": 533460 }, { "epoch": 0.93, "learning_rate": 3.4846207235706295e-06, "loss": 2.299, "step": 533470 }, { "epoch": 0.93, "learning_rate": 3.4837487836438025e-06, "loss": 2.226, "step": 533480 }, { "epoch": 0.93, "learning_rate": 3.482876843716976e-06, "loss": 2.18, "step": 533490 }, { "epoch": 0.93, "learning_rate": 3.4820049037901487e-06, "loss": 2.3491, "step": 533500 }, { "epoch": 0.93, "learning_rate": 3.481132963863322e-06, "loss": 2.2945, "step": 533510 }, { "epoch": 0.93, "learning_rate": 3.480261023936495e-06, "loss": 2.2743, "step": 533520 }, { "epoch": 0.93, "learning_rate": 3.4793890840096683e-06, "loss": 2.281, "step": 533530 }, { "epoch": 0.93, "learning_rate": 3.4785171440828413e-06, "loss": 2.3046, "step": 533540 }, { "epoch": 0.93, "learning_rate": 3.4776452041560146e-06, "loss": 2.1625, "step": 533550 }, { "epoch": 0.93, "learning_rate": 3.4767732642291875e-06, "loss": 2.2506, "step": 533560 }, { "epoch": 0.93, "learning_rate": 3.475901324302361e-06, "loss": 2.2378, "step": 533570 }, { "epoch": 0.93, "learning_rate": 3.475029384375534e-06, "loss": 2.2099, "step": 533580 }, { "epoch": 0.93, "learning_rate": 3.474157444448707e-06, "loss": 2.2845, "step": 533590 }, { "epoch": 0.93, "learning_rate": 3.473285504521881e-06, "loss": 2.307, "step": 533600 }, { "epoch": 0.93, "learning_rate": 3.4724135645950543e-06, "loss": 2.2424, "step": 533610 }, { "epoch": 0.93, "learning_rate": 3.471541624668227e-06, "loss": 2.2955, "step": 533620 }, { "epoch": 0.93, "learning_rate": 3.4706696847414005e-06, "loss": 2.2231, "step": 533630 }, { "epoch": 0.93, "learning_rate": 3.4697977448145735e-06, "loss": 2.2253, "step": 533640 }, { "epoch": 0.93, "learning_rate": 3.468925804887747e-06, "loss": 2.2533, "step": 533650 }, { "epoch": 0.93, "learning_rate": 3.4680538649609197e-06, "loss": 2.3474, "step": 533660 }, { "epoch": 0.93, "learning_rate": 3.467181925034093e-06, "loss": 2.3044, "step": 533670 }, { "epoch": 0.93, "learning_rate": 3.466309985107266e-06, "loss": 2.2864, "step": 533680 }, { "epoch": 0.93, "learning_rate": 3.4654380451804393e-06, "loss": 2.2088, "step": 533690 }, { "epoch": 0.93, "learning_rate": 3.4645661052536123e-06, "loss": 2.288, "step": 533700 }, { "epoch": 0.93, "learning_rate": 3.4636941653267856e-06, "loss": 2.2948, "step": 533710 }, { "epoch": 0.93, "learning_rate": 3.4628222253999585e-06, "loss": 2.2674, "step": 533720 }, { "epoch": 0.93, "learning_rate": 3.4619502854731327e-06, "loss": 2.1449, "step": 533730 }, { "epoch": 0.93, "learning_rate": 3.4610783455463057e-06, "loss": 2.1584, "step": 533740 }, { "epoch": 0.93, "learning_rate": 3.460206405619479e-06, "loss": 2.2557, "step": 533750 }, { "epoch": 0.93, "learning_rate": 3.459334465692652e-06, "loss": 2.2228, "step": 533760 }, { "epoch": 0.93, "learning_rate": 3.4584625257658253e-06, "loss": 2.2678, "step": 533770 }, { "epoch": 0.93, "learning_rate": 3.457590585838998e-06, "loss": 2.1563, "step": 533780 }, { "epoch": 0.93, "learning_rate": 3.4567186459121715e-06, "loss": 2.3384, "step": 533790 }, { "epoch": 0.93, "learning_rate": 3.4558467059853445e-06, "loss": 2.2342, "step": 533800 }, { "epoch": 0.93, "learning_rate": 3.454974766058518e-06, "loss": 2.2086, "step": 533810 }, { "epoch": 0.93, "learning_rate": 3.4541028261316907e-06, "loss": 2.2482, "step": 533820 }, { "epoch": 0.93, "learning_rate": 3.453230886204864e-06, "loss": 2.3153, "step": 533830 }, { "epoch": 0.93, "learning_rate": 3.452358946278037e-06, "loss": 2.2546, "step": 533840 }, { "epoch": 0.93, "learning_rate": 3.4514870063512103e-06, "loss": 2.2646, "step": 533850 }, { "epoch": 0.93, "learning_rate": 3.4506150664243833e-06, "loss": 2.0877, "step": 533860 }, { "epoch": 0.93, "learning_rate": 3.4497431264975575e-06, "loss": 2.2811, "step": 533870 }, { "epoch": 0.93, "learning_rate": 3.4488711865707304e-06, "loss": 2.2165, "step": 533880 }, { "epoch": 0.93, "learning_rate": 3.4479992466439037e-06, "loss": 2.2715, "step": 533890 }, { "epoch": 0.93, "learning_rate": 3.4471273067170767e-06, "loss": 2.2576, "step": 533900 }, { "epoch": 0.93, "learning_rate": 3.44625536679025e-06, "loss": 2.2876, "step": 533910 }, { "epoch": 0.93, "learning_rate": 3.445383426863423e-06, "loss": 2.2891, "step": 533920 }, { "epoch": 0.93, "learning_rate": 3.4445114869365963e-06, "loss": 2.1243, "step": 533930 }, { "epoch": 0.93, "learning_rate": 3.443639547009769e-06, "loss": 2.2856, "step": 533940 }, { "epoch": 0.93, "learning_rate": 3.4427676070829425e-06, "loss": 2.2452, "step": 533950 }, { "epoch": 0.93, "learning_rate": 3.4418956671561155e-06, "loss": 2.3078, "step": 533960 }, { "epoch": 0.93, "learning_rate": 3.441023727229289e-06, "loss": 2.2704, "step": 533970 }, { "epoch": 0.93, "learning_rate": 3.4401517873024617e-06, "loss": 2.396, "step": 533980 }, { "epoch": 0.93, "learning_rate": 3.439279847375635e-06, "loss": 2.2718, "step": 533990 }, { "epoch": 0.93, "learning_rate": 3.438407907448809e-06, "loss": 2.1842, "step": 534000 }, { "epoch": 0.93, "learning_rate": 3.437535967521982e-06, "loss": 2.2311, "step": 534010 }, { "epoch": 0.93, "learning_rate": 3.436664027595155e-06, "loss": 2.1971, "step": 534020 }, { "epoch": 0.93, "learning_rate": 3.4357920876683285e-06, "loss": 2.2959, "step": 534030 }, { "epoch": 0.93, "learning_rate": 3.4349201477415014e-06, "loss": 2.2511, "step": 534040 }, { "epoch": 0.93, "learning_rate": 3.4340482078146747e-06, "loss": 2.225, "step": 534050 }, { "epoch": 0.93, "learning_rate": 3.4331762678878477e-06, "loss": 2.3078, "step": 534060 }, { "epoch": 0.93, "learning_rate": 3.432304327961021e-06, "loss": 2.2912, "step": 534070 }, { "epoch": 0.93, "learning_rate": 3.431432388034194e-06, "loss": 2.3061, "step": 534080 }, { "epoch": 0.93, "learning_rate": 3.4305604481073673e-06, "loss": 2.2225, "step": 534090 }, { "epoch": 0.93, "learning_rate": 3.42968850818054e-06, "loss": 2.2274, "step": 534100 }, { "epoch": 0.93, "learning_rate": 3.4288165682537135e-06, "loss": 2.353, "step": 534110 }, { "epoch": 0.93, "learning_rate": 3.4279446283268865e-06, "loss": 2.2081, "step": 534120 }, { "epoch": 0.93, "learning_rate": 3.4270726884000607e-06, "loss": 2.2648, "step": 534130 }, { "epoch": 0.93, "learning_rate": 3.4262007484732336e-06, "loss": 2.282, "step": 534140 }, { "epoch": 0.93, "learning_rate": 3.425328808546407e-06, "loss": 2.3338, "step": 534150 }, { "epoch": 0.93, "learning_rate": 3.42445686861958e-06, "loss": 2.3397, "step": 534160 }, { "epoch": 0.93, "learning_rate": 3.423584928692753e-06, "loss": 2.2898, "step": 534170 }, { "epoch": 0.93, "learning_rate": 3.422712988765926e-06, "loss": 2.2992, "step": 534180 }, { "epoch": 0.93, "learning_rate": 3.4218410488390995e-06, "loss": 2.2678, "step": 534190 }, { "epoch": 0.93, "learning_rate": 3.4209691089122724e-06, "loss": 2.1875, "step": 534200 }, { "epoch": 0.93, "learning_rate": 3.4200971689854457e-06, "loss": 2.2489, "step": 534210 }, { "epoch": 0.93, "learning_rate": 3.4192252290586187e-06, "loss": 2.3225, "step": 534220 }, { "epoch": 0.93, "learning_rate": 3.418353289131792e-06, "loss": 2.2155, "step": 534230 }, { "epoch": 0.93, "learning_rate": 3.417481349204965e-06, "loss": 2.2621, "step": 534240 }, { "epoch": 0.93, "learning_rate": 3.4166094092781383e-06, "loss": 2.2432, "step": 534250 }, { "epoch": 0.93, "learning_rate": 3.415737469351311e-06, "loss": 2.2718, "step": 534260 }, { "epoch": 0.93, "learning_rate": 3.4148655294244854e-06, "loss": 2.2298, "step": 534270 }, { "epoch": 0.93, "learning_rate": 3.4139935894976583e-06, "loss": 2.2712, "step": 534280 }, { "epoch": 0.93, "learning_rate": 3.4131216495708317e-06, "loss": 2.2153, "step": 534290 }, { "epoch": 0.93, "learning_rate": 3.4122497096440046e-06, "loss": 2.2556, "step": 534300 }, { "epoch": 0.93, "learning_rate": 3.411377769717178e-06, "loss": 2.1313, "step": 534310 }, { "epoch": 0.93, "learning_rate": 3.410505829790351e-06, "loss": 2.2606, "step": 534320 }, { "epoch": 0.93, "learning_rate": 3.409633889863524e-06, "loss": 2.2666, "step": 534330 }, { "epoch": 0.93, "learning_rate": 3.408761949936697e-06, "loss": 2.2232, "step": 534340 }, { "epoch": 0.93, "learning_rate": 3.4078900100098705e-06, "loss": 2.2947, "step": 534350 }, { "epoch": 0.93, "learning_rate": 3.4070180700830434e-06, "loss": 2.199, "step": 534360 }, { "epoch": 0.93, "learning_rate": 3.4061461301562167e-06, "loss": 2.3334, "step": 534370 }, { "epoch": 0.93, "learning_rate": 3.4052741902293897e-06, "loss": 2.2286, "step": 534380 }, { "epoch": 0.93, "learning_rate": 3.404402250302563e-06, "loss": 2.1579, "step": 534390 }, { "epoch": 0.93, "learning_rate": 3.4035303103757368e-06, "loss": 2.2231, "step": 534400 }, { "epoch": 0.93, "learning_rate": 3.40265837044891e-06, "loss": 2.143, "step": 534410 }, { "epoch": 0.93, "learning_rate": 3.401786430522083e-06, "loss": 2.1563, "step": 534420 }, { "epoch": 0.93, "learning_rate": 3.4009144905952564e-06, "loss": 2.1365, "step": 534430 }, { "epoch": 0.93, "learning_rate": 3.4000425506684293e-06, "loss": 2.1862, "step": 534440 }, { "epoch": 0.93, "learning_rate": 3.3991706107416027e-06, "loss": 2.3183, "step": 534450 }, { "epoch": 0.93, "learning_rate": 3.3982986708147756e-06, "loss": 2.2022, "step": 534460 }, { "epoch": 0.93, "learning_rate": 3.397426730887949e-06, "loss": 2.2973, "step": 534470 }, { "epoch": 0.93, "learning_rate": 3.396554790961122e-06, "loss": 2.1479, "step": 534480 }, { "epoch": 0.93, "learning_rate": 3.395682851034295e-06, "loss": 2.3197, "step": 534490 }, { "epoch": 0.93, "learning_rate": 3.394810911107468e-06, "loss": 2.3254, "step": 534500 }, { "epoch": 0.93, "learning_rate": 3.3939389711806415e-06, "loss": 2.2445, "step": 534510 }, { "epoch": 0.93, "learning_rate": 3.3930670312538144e-06, "loss": 2.2181, "step": 534520 }, { "epoch": 0.93, "learning_rate": 3.3921950913269886e-06, "loss": 2.1547, "step": 534530 }, { "epoch": 0.93, "learning_rate": 3.3913231514001615e-06, "loss": 2.4095, "step": 534540 }, { "epoch": 0.93, "learning_rate": 3.390451211473335e-06, "loss": 2.1781, "step": 534550 }, { "epoch": 0.93, "learning_rate": 3.3895792715465078e-06, "loss": 2.2839, "step": 534560 }, { "epoch": 0.93, "learning_rate": 3.388707331619681e-06, "loss": 2.2618, "step": 534570 }, { "epoch": 0.93, "learning_rate": 3.387835391692854e-06, "loss": 2.3502, "step": 534580 }, { "epoch": 0.93, "learning_rate": 3.3869634517660274e-06, "loss": 2.2531, "step": 534590 }, { "epoch": 0.93, "learning_rate": 3.3860915118392003e-06, "loss": 2.1683, "step": 534600 }, { "epoch": 0.93, "learning_rate": 3.3852195719123737e-06, "loss": 2.2914, "step": 534610 }, { "epoch": 0.93, "learning_rate": 3.3843476319855466e-06, "loss": 2.2209, "step": 534620 }, { "epoch": 0.93, "learning_rate": 3.38347569205872e-06, "loss": 2.1329, "step": 534630 }, { "epoch": 0.93, "learning_rate": 3.382603752131893e-06, "loss": 2.2614, "step": 534640 }, { "epoch": 0.93, "learning_rate": 3.381731812205066e-06, "loss": 2.2779, "step": 534650 }, { "epoch": 0.93, "learning_rate": 3.38085987227824e-06, "loss": 2.1359, "step": 534660 }, { "epoch": 0.93, "learning_rate": 3.3799879323514133e-06, "loss": 2.1651, "step": 534670 }, { "epoch": 0.93, "learning_rate": 3.3791159924245862e-06, "loss": 2.2805, "step": 534680 }, { "epoch": 0.93, "learning_rate": 3.3782440524977596e-06, "loss": 2.3253, "step": 534690 }, { "epoch": 0.93, "learning_rate": 3.3773721125709325e-06, "loss": 2.2763, "step": 534700 }, { "epoch": 0.93, "learning_rate": 3.376500172644106e-06, "loss": 2.1133, "step": 534710 }, { "epoch": 0.93, "learning_rate": 3.3756282327172788e-06, "loss": 2.28, "step": 534720 }, { "epoch": 0.93, "learning_rate": 3.374756292790452e-06, "loss": 2.2504, "step": 534730 }, { "epoch": 0.93, "learning_rate": 3.373884352863625e-06, "loss": 2.3417, "step": 534740 }, { "epoch": 0.93, "learning_rate": 3.3730124129367984e-06, "loss": 2.1796, "step": 534750 }, { "epoch": 0.93, "learning_rate": 3.3721404730099713e-06, "loss": 2.2775, "step": 534760 }, { "epoch": 0.93, "learning_rate": 3.3712685330831447e-06, "loss": 2.2932, "step": 534770 }, { "epoch": 0.93, "learning_rate": 3.3703965931563176e-06, "loss": 2.2224, "step": 534780 }, { "epoch": 0.93, "learning_rate": 3.369524653229491e-06, "loss": 2.3642, "step": 534790 }, { "epoch": 0.93, "learning_rate": 3.3686527133026647e-06, "loss": 2.2552, "step": 534800 }, { "epoch": 0.93, "learning_rate": 3.367780773375838e-06, "loss": 2.253, "step": 534810 }, { "epoch": 0.93, "learning_rate": 3.366908833449011e-06, "loss": 2.2611, "step": 534820 }, { "epoch": 0.93, "learning_rate": 3.3660368935221843e-06, "loss": 2.3071, "step": 534830 }, { "epoch": 0.93, "learning_rate": 3.3651649535953572e-06, "loss": 2.2476, "step": 534840 }, { "epoch": 0.93, "learning_rate": 3.3642930136685306e-06, "loss": 2.2678, "step": 534850 }, { "epoch": 0.93, "learning_rate": 3.3634210737417035e-06, "loss": 2.2939, "step": 534860 }, { "epoch": 0.93, "learning_rate": 3.362549133814877e-06, "loss": 2.2695, "step": 534870 }, { "epoch": 0.93, "learning_rate": 3.3616771938880498e-06, "loss": 2.1956, "step": 534880 }, { "epoch": 0.93, "learning_rate": 3.360805253961223e-06, "loss": 2.2643, "step": 534890 }, { "epoch": 0.93, "learning_rate": 3.359933314034396e-06, "loss": 2.1824, "step": 534900 }, { "epoch": 0.93, "learning_rate": 3.3590613741075694e-06, "loss": 2.2407, "step": 534910 }, { "epoch": 0.93, "learning_rate": 3.3581894341807427e-06, "loss": 2.2691, "step": 534920 }, { "epoch": 0.93, "learning_rate": 3.3573174942539165e-06, "loss": 2.241, "step": 534930 }, { "epoch": 0.93, "learning_rate": 3.3564455543270894e-06, "loss": 2.2839, "step": 534940 }, { "epoch": 0.93, "learning_rate": 3.3555736144002628e-06, "loss": 2.2307, "step": 534950 }, { "epoch": 0.93, "learning_rate": 3.3547016744734357e-06, "loss": 2.2294, "step": 534960 }, { "epoch": 0.93, "learning_rate": 3.353829734546609e-06, "loss": 2.279, "step": 534970 }, { "epoch": 0.93, "learning_rate": 3.352957794619782e-06, "loss": 2.2433, "step": 534980 }, { "epoch": 0.93, "learning_rate": 3.3520858546929553e-06, "loss": 2.2397, "step": 534990 }, { "epoch": 0.93, "learning_rate": 3.3512139147661282e-06, "loss": 2.3348, "step": 535000 }, { "epoch": 0.93, "learning_rate": 3.3503419748393016e-06, "loss": 2.3274, "step": 535010 }, { "epoch": 0.93, "learning_rate": 3.3494700349124745e-06, "loss": 2.2107, "step": 535020 }, { "epoch": 0.93, "learning_rate": 3.348598094985648e-06, "loss": 2.301, "step": 535030 }, { "epoch": 0.93, "learning_rate": 3.3477261550588208e-06, "loss": 2.3355, "step": 535040 }, { "epoch": 0.93, "learning_rate": 3.346854215131994e-06, "loss": 2.3201, "step": 535050 }, { "epoch": 0.93, "learning_rate": 3.345982275205168e-06, "loss": 2.3214, "step": 535060 }, { "epoch": 0.93, "learning_rate": 3.3451103352783412e-06, "loss": 2.1851, "step": 535070 }, { "epoch": 0.93, "learning_rate": 3.344238395351514e-06, "loss": 2.2501, "step": 535080 }, { "epoch": 0.93, "learning_rate": 3.3433664554246875e-06, "loss": 2.2748, "step": 535090 }, { "epoch": 0.93, "learning_rate": 3.3424945154978604e-06, "loss": 2.1218, "step": 535100 }, { "epoch": 0.93, "learning_rate": 3.3416225755710338e-06, "loss": 2.2084, "step": 535110 }, { "epoch": 0.93, "learning_rate": 3.3407506356442067e-06, "loss": 2.2043, "step": 535120 }, { "epoch": 0.93, "learning_rate": 3.33987869571738e-06, "loss": 2.1721, "step": 535130 }, { "epoch": 0.93, "learning_rate": 3.339006755790553e-06, "loss": 2.2642, "step": 535140 }, { "epoch": 0.93, "learning_rate": 3.3381348158637263e-06, "loss": 2.2685, "step": 535150 }, { "epoch": 0.93, "learning_rate": 3.3372628759368992e-06, "loss": 2.2938, "step": 535160 }, { "epoch": 0.93, "learning_rate": 3.3363909360100726e-06, "loss": 2.3086, "step": 535170 }, { "epoch": 0.93, "learning_rate": 3.335518996083246e-06, "loss": 2.2737, "step": 535180 }, { "epoch": 0.93, "learning_rate": 3.334647056156419e-06, "loss": 2.3166, "step": 535190 }, { "epoch": 0.93, "learning_rate": 3.3337751162295926e-06, "loss": 2.2667, "step": 535200 }, { "epoch": 0.93, "learning_rate": 3.332903176302766e-06, "loss": 2.2067, "step": 535210 }, { "epoch": 0.93, "learning_rate": 3.332031236375939e-06, "loss": 2.3123, "step": 535220 }, { "epoch": 0.93, "learning_rate": 3.3311592964491122e-06, "loss": 2.2458, "step": 535230 }, { "epoch": 0.93, "learning_rate": 3.330287356522285e-06, "loss": 2.198, "step": 535240 }, { "epoch": 0.93, "learning_rate": 3.3294154165954585e-06, "loss": 2.1825, "step": 535250 }, { "epoch": 0.93, "learning_rate": 3.3285434766686314e-06, "loss": 2.3119, "step": 535260 }, { "epoch": 0.93, "learning_rate": 3.3276715367418048e-06, "loss": 2.2547, "step": 535270 }, { "epoch": 0.93, "learning_rate": 3.3267995968149777e-06, "loss": 2.1329, "step": 535280 }, { "epoch": 0.93, "learning_rate": 3.325927656888151e-06, "loss": 2.2197, "step": 535290 }, { "epoch": 0.93, "learning_rate": 3.325055716961324e-06, "loss": 2.3162, "step": 535300 }, { "epoch": 0.93, "learning_rate": 3.3241837770344973e-06, "loss": 2.2555, "step": 535310 }, { "epoch": 0.93, "learning_rate": 3.3233118371076707e-06, "loss": 2.3087, "step": 535320 }, { "epoch": 0.93, "learning_rate": 3.3224398971808444e-06, "loss": 2.2921, "step": 535330 }, { "epoch": 0.93, "learning_rate": 3.3215679572540174e-06, "loss": 2.2476, "step": 535340 }, { "epoch": 0.93, "learning_rate": 3.3206960173271907e-06, "loss": 2.2516, "step": 535350 }, { "epoch": 0.93, "learning_rate": 3.3198240774003636e-06, "loss": 2.1826, "step": 535360 }, { "epoch": 0.93, "learning_rate": 3.318952137473537e-06, "loss": 2.2514, "step": 535370 }, { "epoch": 0.93, "learning_rate": 3.31808019754671e-06, "loss": 2.3359, "step": 535380 }, { "epoch": 0.93, "learning_rate": 3.3172082576198832e-06, "loss": 2.2104, "step": 535390 }, { "epoch": 0.93, "learning_rate": 3.316336317693056e-06, "loss": 2.1037, "step": 535400 }, { "epoch": 0.93, "learning_rate": 3.3154643777662295e-06, "loss": 2.3122, "step": 535410 }, { "epoch": 0.93, "learning_rate": 3.3145924378394024e-06, "loss": 2.286, "step": 535420 }, { "epoch": 0.93, "learning_rate": 3.3137204979125758e-06, "loss": 2.317, "step": 535430 }, { "epoch": 0.93, "learning_rate": 3.312848557985749e-06, "loss": 2.2106, "step": 535440 }, { "epoch": 0.93, "learning_rate": 3.311976618058922e-06, "loss": 2.2187, "step": 535450 }, { "epoch": 0.93, "learning_rate": 3.311104678132096e-06, "loss": 2.291, "step": 535460 }, { "epoch": 0.93, "learning_rate": 3.310232738205269e-06, "loss": 2.2479, "step": 535470 }, { "epoch": 0.93, "learning_rate": 3.309360798278442e-06, "loss": 2.2038, "step": 535480 }, { "epoch": 0.93, "learning_rate": 3.3084888583516154e-06, "loss": 2.1474, "step": 535490 }, { "epoch": 0.93, "learning_rate": 3.3076169184247884e-06, "loss": 2.2648, "step": 535500 }, { "epoch": 0.93, "learning_rate": 3.3067449784979617e-06, "loss": 2.1899, "step": 535510 }, { "epoch": 0.93, "learning_rate": 3.3058730385711346e-06, "loss": 2.2674, "step": 535520 }, { "epoch": 0.93, "learning_rate": 3.305001098644308e-06, "loss": 2.2722, "step": 535530 }, { "epoch": 0.93, "learning_rate": 3.304129158717481e-06, "loss": 2.2693, "step": 535540 }, { "epoch": 0.93, "learning_rate": 3.3032572187906542e-06, "loss": 2.2177, "step": 535550 }, { "epoch": 0.93, "learning_rate": 3.302385278863827e-06, "loss": 2.2165, "step": 535560 }, { "epoch": 0.93, "learning_rate": 3.3015133389370005e-06, "loss": 2.2643, "step": 535570 }, { "epoch": 0.93, "learning_rate": 3.300641399010174e-06, "loss": 2.2669, "step": 535580 }, { "epoch": 0.93, "learning_rate": 3.2997694590833468e-06, "loss": 2.2574, "step": 535590 }, { "epoch": 0.93, "learning_rate": 3.2988975191565206e-06, "loss": 2.3148, "step": 535600 }, { "epoch": 0.93, "learning_rate": 3.298025579229694e-06, "loss": 2.3414, "step": 535610 }, { "epoch": 0.93, "learning_rate": 3.297153639302867e-06, "loss": 2.2758, "step": 535620 }, { "epoch": 0.93, "learning_rate": 3.29628169937604e-06, "loss": 2.2296, "step": 535630 }, { "epoch": 0.93, "learning_rate": 3.295409759449213e-06, "loss": 2.2938, "step": 535640 }, { "epoch": 0.93, "learning_rate": 3.2945378195223864e-06, "loss": 2.2688, "step": 535650 }, { "epoch": 0.93, "learning_rate": 3.2936658795955594e-06, "loss": 2.3066, "step": 535660 }, { "epoch": 0.93, "learning_rate": 3.2927939396687327e-06, "loss": 2.3637, "step": 535670 }, { "epoch": 0.93, "learning_rate": 3.2919219997419056e-06, "loss": 2.1657, "step": 535680 }, { "epoch": 0.93, "learning_rate": 3.291050059815079e-06, "loss": 2.212, "step": 535690 }, { "epoch": 0.93, "learning_rate": 3.2901781198882523e-06, "loss": 2.323, "step": 535700 }, { "epoch": 0.93, "learning_rate": 3.2893061799614252e-06, "loss": 2.2901, "step": 535710 }, { "epoch": 0.93, "learning_rate": 3.2884342400345986e-06, "loss": 2.1724, "step": 535720 }, { "epoch": 0.93, "learning_rate": 3.2875623001077724e-06, "loss": 2.344, "step": 535730 }, { "epoch": 0.93, "learning_rate": 3.2866903601809453e-06, "loss": 2.3463, "step": 535740 }, { "epoch": 0.93, "learning_rate": 3.2858184202541186e-06, "loss": 2.1896, "step": 535750 }, { "epoch": 0.93, "learning_rate": 3.2849464803272916e-06, "loss": 2.2397, "step": 535760 }, { "epoch": 0.93, "learning_rate": 3.284074540400465e-06, "loss": 2.2323, "step": 535770 }, { "epoch": 0.93, "learning_rate": 3.283202600473638e-06, "loss": 2.2906, "step": 535780 }, { "epoch": 0.93, "learning_rate": 3.282330660546811e-06, "loss": 2.1888, "step": 535790 }, { "epoch": 0.93, "learning_rate": 3.281458720619984e-06, "loss": 2.2675, "step": 535800 }, { "epoch": 0.93, "learning_rate": 3.2805867806931574e-06, "loss": 2.2495, "step": 535810 }, { "epoch": 0.93, "learning_rate": 3.2797148407663304e-06, "loss": 2.2783, "step": 535820 }, { "epoch": 0.93, "learning_rate": 3.2788429008395037e-06, "loss": 2.2552, "step": 535830 }, { "epoch": 0.93, "learning_rate": 3.277970960912677e-06, "loss": 2.2055, "step": 535840 }, { "epoch": 0.93, "learning_rate": 3.27709902098585e-06, "loss": 2.1947, "step": 535850 }, { "epoch": 0.93, "learning_rate": 3.2762270810590237e-06, "loss": 2.1378, "step": 535860 }, { "epoch": 0.93, "learning_rate": 3.275355141132197e-06, "loss": 2.2285, "step": 535870 }, { "epoch": 0.93, "learning_rate": 3.27448320120537e-06, "loss": 2.178, "step": 535880 }, { "epoch": 0.93, "learning_rate": 3.2736112612785434e-06, "loss": 2.2436, "step": 535890 }, { "epoch": 0.93, "learning_rate": 3.2727393213517163e-06, "loss": 2.2486, "step": 535900 }, { "epoch": 0.93, "learning_rate": 3.2718673814248896e-06, "loss": 2.3218, "step": 535910 }, { "epoch": 0.93, "learning_rate": 3.2709954414980626e-06, "loss": 2.2781, "step": 535920 }, { "epoch": 0.93, "learning_rate": 3.270123501571236e-06, "loss": 2.202, "step": 535930 }, { "epoch": 0.93, "learning_rate": 3.269251561644409e-06, "loss": 2.2034, "step": 535940 }, { "epoch": 0.93, "learning_rate": 3.268379621717582e-06, "loss": 2.286, "step": 535950 }, { "epoch": 0.93, "learning_rate": 3.2675076817907555e-06, "loss": 2.2337, "step": 535960 }, { "epoch": 0.93, "learning_rate": 3.2666357418639284e-06, "loss": 2.1801, "step": 535970 }, { "epoch": 0.93, "learning_rate": 3.2657638019371018e-06, "loss": 2.3168, "step": 535980 }, { "epoch": 0.93, "learning_rate": 3.2648918620102756e-06, "loss": 2.2644, "step": 535990 }, { "epoch": 0.93, "learning_rate": 3.2640199220834485e-06, "loss": 2.2873, "step": 536000 }, { "epoch": 0.93, "learning_rate": 3.263147982156622e-06, "loss": 2.229, "step": 536010 }, { "epoch": 0.93, "learning_rate": 3.2622760422297947e-06, "loss": 2.2341, "step": 536020 }, { "epoch": 0.93, "learning_rate": 3.261404102302968e-06, "loss": 2.1947, "step": 536030 }, { "epoch": 0.93, "learning_rate": 3.260532162376141e-06, "loss": 2.4571, "step": 536040 }, { "epoch": 0.93, "learning_rate": 3.2596602224493144e-06, "loss": 2.3251, "step": 536050 }, { "epoch": 0.93, "learning_rate": 3.2587882825224873e-06, "loss": 2.2201, "step": 536060 }, { "epoch": 0.93, "learning_rate": 3.2579163425956606e-06, "loss": 2.2249, "step": 536070 }, { "epoch": 0.93, "learning_rate": 3.2570444026688336e-06, "loss": 2.2656, "step": 536080 }, { "epoch": 0.93, "learning_rate": 3.256172462742007e-06, "loss": 2.2806, "step": 536090 }, { "epoch": 0.93, "learning_rate": 3.2553005228151802e-06, "loss": 2.2444, "step": 536100 }, { "epoch": 0.93, "learning_rate": 3.254428582888353e-06, "loss": 2.399, "step": 536110 }, { "epoch": 0.93, "learning_rate": 3.2535566429615265e-06, "loss": 2.1222, "step": 536120 }, { "epoch": 0.93, "learning_rate": 3.2526847030347003e-06, "loss": 2.2786, "step": 536130 }, { "epoch": 0.93, "learning_rate": 3.251812763107873e-06, "loss": 2.2067, "step": 536140 }, { "epoch": 0.93, "learning_rate": 3.2509408231810466e-06, "loss": 2.2573, "step": 536150 }, { "epoch": 0.93, "learning_rate": 3.2500688832542195e-06, "loss": 2.1837, "step": 536160 }, { "epoch": 0.94, "learning_rate": 3.249196943327393e-06, "loss": 2.1983, "step": 536170 }, { "epoch": 0.94, "learning_rate": 3.2483250034005657e-06, "loss": 2.2212, "step": 536180 }, { "epoch": 0.94, "learning_rate": 3.247453063473739e-06, "loss": 2.3439, "step": 536190 }, { "epoch": 0.94, "learning_rate": 3.246581123546912e-06, "loss": 2.3146, "step": 536200 }, { "epoch": 0.94, "learning_rate": 3.2457091836200854e-06, "loss": 2.2567, "step": 536210 }, { "epoch": 0.94, "learning_rate": 3.2448372436932587e-06, "loss": 2.2441, "step": 536220 }, { "epoch": 0.94, "learning_rate": 3.2439653037664316e-06, "loss": 2.2706, "step": 536230 }, { "epoch": 0.94, "learning_rate": 3.243093363839605e-06, "loss": 2.3006, "step": 536240 }, { "epoch": 0.94, "learning_rate": 3.242221423912778e-06, "loss": 2.2381, "step": 536250 }, { "epoch": 0.94, "learning_rate": 3.2413494839859517e-06, "loss": 2.392, "step": 536260 }, { "epoch": 0.94, "learning_rate": 3.240477544059125e-06, "loss": 2.2326, "step": 536270 }, { "epoch": 0.94, "learning_rate": 3.239605604132298e-06, "loss": 2.24, "step": 536280 }, { "epoch": 0.94, "learning_rate": 3.2387336642054713e-06, "loss": 2.0923, "step": 536290 }, { "epoch": 0.94, "learning_rate": 3.237861724278644e-06, "loss": 2.1709, "step": 536300 }, { "epoch": 0.94, "learning_rate": 3.2369897843518176e-06, "loss": 2.1517, "step": 536310 }, { "epoch": 0.94, "learning_rate": 3.2361178444249905e-06, "loss": 2.2985, "step": 536320 }, { "epoch": 0.94, "learning_rate": 3.235245904498164e-06, "loss": 2.3014, "step": 536330 }, { "epoch": 0.94, "learning_rate": 3.2343739645713367e-06, "loss": 2.3085, "step": 536340 }, { "epoch": 0.94, "learning_rate": 3.23350202464451e-06, "loss": 2.3036, "step": 536350 }, { "epoch": 0.94, "learning_rate": 3.2326300847176834e-06, "loss": 2.2863, "step": 536360 }, { "epoch": 0.94, "learning_rate": 3.2317581447908564e-06, "loss": 2.3914, "step": 536370 }, { "epoch": 0.94, "learning_rate": 3.2308862048640297e-06, "loss": 2.2307, "step": 536380 }, { "epoch": 0.94, "learning_rate": 3.2300142649372035e-06, "loss": 2.1266, "step": 536390 }, { "epoch": 0.94, "learning_rate": 3.2291423250103764e-06, "loss": 2.2812, "step": 536400 }, { "epoch": 0.94, "learning_rate": 3.2282703850835498e-06, "loss": 2.3657, "step": 536410 }, { "epoch": 0.94, "learning_rate": 3.2273984451567227e-06, "loss": 2.122, "step": 536420 }, { "epoch": 0.94, "learning_rate": 3.226526505229896e-06, "loss": 2.2138, "step": 536430 }, { "epoch": 0.94, "learning_rate": 3.225654565303069e-06, "loss": 2.2666, "step": 536440 }, { "epoch": 0.94, "learning_rate": 3.2247826253762423e-06, "loss": 2.2036, "step": 536450 }, { "epoch": 0.94, "learning_rate": 3.2239106854494152e-06, "loss": 2.2021, "step": 536460 }, { "epoch": 0.94, "learning_rate": 3.2230387455225886e-06, "loss": 2.293, "step": 536470 }, { "epoch": 0.94, "learning_rate": 3.222166805595762e-06, "loss": 2.1794, "step": 536480 }, { "epoch": 0.94, "learning_rate": 3.221294865668935e-06, "loss": 2.2521, "step": 536490 }, { "epoch": 0.94, "learning_rate": 3.220422925742108e-06, "loss": 2.1766, "step": 536500 }, { "epoch": 0.94, "learning_rate": 3.219550985815281e-06, "loss": 2.2993, "step": 536510 }, { "epoch": 0.94, "learning_rate": 3.2186790458884544e-06, "loss": 2.2886, "step": 536520 }, { "epoch": 0.94, "learning_rate": 3.2178071059616282e-06, "loss": 2.3214, "step": 536530 }, { "epoch": 0.94, "learning_rate": 3.216935166034801e-06, "loss": 2.1927, "step": 536540 }, { "epoch": 0.94, "learning_rate": 3.2160632261079745e-06, "loss": 2.2478, "step": 536550 }, { "epoch": 0.94, "learning_rate": 3.2151912861811474e-06, "loss": 2.2278, "step": 536560 }, { "epoch": 0.94, "learning_rate": 3.2143193462543208e-06, "loss": 2.2832, "step": 536570 }, { "epoch": 0.94, "learning_rate": 3.2134474063274937e-06, "loss": 2.3393, "step": 536580 }, { "epoch": 0.94, "learning_rate": 3.212575466400667e-06, "loss": 2.2266, "step": 536590 }, { "epoch": 0.94, "learning_rate": 3.21170352647384e-06, "loss": 2.2304, "step": 536600 }, { "epoch": 0.94, "learning_rate": 3.2108315865470133e-06, "loss": 2.2773, "step": 536610 }, { "epoch": 0.94, "learning_rate": 3.2099596466201866e-06, "loss": 2.2542, "step": 536620 }, { "epoch": 0.94, "learning_rate": 3.2090877066933596e-06, "loss": 2.1482, "step": 536630 }, { "epoch": 0.94, "learning_rate": 3.208215766766533e-06, "loss": 2.2627, "step": 536640 }, { "epoch": 0.94, "learning_rate": 3.207343826839706e-06, "loss": 2.3117, "step": 536650 }, { "epoch": 0.94, "learning_rate": 3.2064718869128796e-06, "loss": 2.3057, "step": 536660 }, { "epoch": 0.94, "learning_rate": 3.205599946986053e-06, "loss": 2.1842, "step": 536670 }, { "epoch": 0.94, "learning_rate": 3.204728007059226e-06, "loss": 2.1814, "step": 536680 }, { "epoch": 0.94, "learning_rate": 3.2038560671323992e-06, "loss": 2.1736, "step": 536690 }, { "epoch": 0.94, "learning_rate": 3.202984127205572e-06, "loss": 2.3084, "step": 536700 }, { "epoch": 0.94, "learning_rate": 3.2021121872787455e-06, "loss": 2.3203, "step": 536710 }, { "epoch": 0.94, "learning_rate": 3.2012402473519184e-06, "loss": 2.2249, "step": 536720 }, { "epoch": 0.94, "learning_rate": 3.2003683074250918e-06, "loss": 2.3413, "step": 536730 }, { "epoch": 0.94, "learning_rate": 3.199496367498265e-06, "loss": 2.2555, "step": 536740 }, { "epoch": 0.94, "learning_rate": 3.198624427571438e-06, "loss": 2.316, "step": 536750 }, { "epoch": 0.94, "learning_rate": 3.1977524876446114e-06, "loss": 2.1765, "step": 536760 }, { "epoch": 0.94, "learning_rate": 3.1968805477177843e-06, "loss": 2.2823, "step": 536770 }, { "epoch": 0.94, "learning_rate": 3.1960086077909576e-06, "loss": 2.2221, "step": 536780 }, { "epoch": 0.94, "learning_rate": 3.1951366678641314e-06, "loss": 2.3498, "step": 536790 }, { "epoch": 0.94, "learning_rate": 3.1942647279373043e-06, "loss": 2.1695, "step": 536800 }, { "epoch": 0.94, "learning_rate": 3.1933927880104777e-06, "loss": 2.2141, "step": 536810 }, { "epoch": 0.94, "learning_rate": 3.1925208480836506e-06, "loss": 2.3309, "step": 536820 }, { "epoch": 0.94, "learning_rate": 3.191648908156824e-06, "loss": 2.2212, "step": 536830 }, { "epoch": 0.94, "learning_rate": 3.190776968229997e-06, "loss": 2.2307, "step": 536840 }, { "epoch": 0.94, "learning_rate": 3.1899050283031702e-06, "loss": 2.3116, "step": 536850 }, { "epoch": 0.94, "learning_rate": 3.189033088376343e-06, "loss": 2.3307, "step": 536860 }, { "epoch": 0.94, "learning_rate": 3.1881611484495165e-06, "loss": 2.3183, "step": 536870 }, { "epoch": 0.94, "learning_rate": 3.18728920852269e-06, "loss": 2.2587, "step": 536880 }, { "epoch": 0.94, "learning_rate": 3.1864172685958628e-06, "loss": 2.3687, "step": 536890 }, { "epoch": 0.94, "learning_rate": 3.185545328669036e-06, "loss": 2.1713, "step": 536900 }, { "epoch": 0.94, "learning_rate": 3.184673388742209e-06, "loss": 2.3361, "step": 536910 }, { "epoch": 0.94, "learning_rate": 3.1838014488153824e-06, "loss": 2.3099, "step": 536920 }, { "epoch": 0.94, "learning_rate": 3.182929508888556e-06, "loss": 2.3755, "step": 536930 }, { "epoch": 0.94, "learning_rate": 3.182057568961729e-06, "loss": 2.2319, "step": 536940 }, { "epoch": 0.94, "learning_rate": 3.1811856290349024e-06, "loss": 2.2196, "step": 536950 }, { "epoch": 0.94, "learning_rate": 3.1803136891080753e-06, "loss": 2.2917, "step": 536960 }, { "epoch": 0.94, "learning_rate": 3.1794417491812487e-06, "loss": 2.3442, "step": 536970 }, { "epoch": 0.94, "learning_rate": 3.1785698092544216e-06, "loss": 2.2319, "step": 536980 }, { "epoch": 0.94, "learning_rate": 3.177697869327595e-06, "loss": 2.2195, "step": 536990 }, { "epoch": 0.94, "learning_rate": 3.1768259294007683e-06, "loss": 2.1825, "step": 537000 }, { "epoch": 0.94, "learning_rate": 3.1759539894739412e-06, "loss": 2.2083, "step": 537010 }, { "epoch": 0.94, "learning_rate": 3.1750820495471146e-06, "loss": 2.1925, "step": 537020 }, { "epoch": 0.94, "learning_rate": 3.1742101096202875e-06, "loss": 2.2748, "step": 537030 }, { "epoch": 0.94, "learning_rate": 3.173338169693461e-06, "loss": 2.2268, "step": 537040 }, { "epoch": 0.94, "learning_rate": 3.1724662297666338e-06, "loss": 2.3471, "step": 537050 }, { "epoch": 0.94, "learning_rate": 3.1715942898398075e-06, "loss": 2.2587, "step": 537060 }, { "epoch": 0.94, "learning_rate": 3.170722349912981e-06, "loss": 2.1665, "step": 537070 }, { "epoch": 0.94, "learning_rate": 3.169850409986154e-06, "loss": 2.2729, "step": 537080 }, { "epoch": 0.94, "learning_rate": 3.168978470059327e-06, "loss": 2.2281, "step": 537090 }, { "epoch": 0.94, "learning_rate": 3.1681065301325e-06, "loss": 2.3033, "step": 537100 }, { "epoch": 0.94, "learning_rate": 3.1672345902056734e-06, "loss": 2.2519, "step": 537110 }, { "epoch": 0.94, "learning_rate": 3.1663626502788463e-06, "loss": 2.239, "step": 537120 }, { "epoch": 0.94, "learning_rate": 3.1654907103520197e-06, "loss": 2.2318, "step": 537130 }, { "epoch": 0.94, "learning_rate": 3.164618770425193e-06, "loss": 2.2499, "step": 537140 }, { "epoch": 0.94, "learning_rate": 3.163746830498366e-06, "loss": 2.2372, "step": 537150 }, { "epoch": 0.94, "learning_rate": 3.1628748905715393e-06, "loss": 2.0954, "step": 537160 }, { "epoch": 0.94, "learning_rate": 3.1620029506447122e-06, "loss": 2.1726, "step": 537170 }, { "epoch": 0.94, "learning_rate": 3.1611310107178856e-06, "loss": 2.144, "step": 537180 }, { "epoch": 0.94, "learning_rate": 3.1602590707910593e-06, "loss": 2.2116, "step": 537190 }, { "epoch": 0.94, "learning_rate": 3.1593871308642323e-06, "loss": 2.2739, "step": 537200 }, { "epoch": 0.94, "learning_rate": 3.1585151909374056e-06, "loss": 2.3296, "step": 537210 }, { "epoch": 0.94, "learning_rate": 3.1576432510105785e-06, "loss": 2.191, "step": 537220 }, { "epoch": 0.94, "learning_rate": 3.156771311083752e-06, "loss": 2.3443, "step": 537230 }, { "epoch": 0.94, "learning_rate": 3.155899371156925e-06, "loss": 2.3893, "step": 537240 }, { "epoch": 0.94, "learning_rate": 3.155027431230098e-06, "loss": 2.2076, "step": 537250 }, { "epoch": 0.94, "learning_rate": 3.1541554913032715e-06, "loss": 2.276, "step": 537260 }, { "epoch": 0.94, "learning_rate": 3.1532835513764444e-06, "loss": 2.2453, "step": 537270 }, { "epoch": 0.94, "learning_rate": 3.1524116114496178e-06, "loss": 2.1982, "step": 537280 }, { "epoch": 0.94, "learning_rate": 3.1515396715227907e-06, "loss": 2.3439, "step": 537290 }, { "epoch": 0.94, "learning_rate": 3.150667731595964e-06, "loss": 2.347, "step": 537300 }, { "epoch": 0.94, "learning_rate": 3.149795791669137e-06, "loss": 2.259, "step": 537310 }, { "epoch": 0.94, "learning_rate": 3.1489238517423103e-06, "loss": 2.2691, "step": 537320 }, { "epoch": 0.94, "learning_rate": 3.148051911815484e-06, "loss": 2.2693, "step": 537330 }, { "epoch": 0.94, "learning_rate": 3.147179971888657e-06, "loss": 2.2585, "step": 537340 }, { "epoch": 0.94, "learning_rate": 3.1463080319618303e-06, "loss": 2.2635, "step": 537350 }, { "epoch": 0.94, "learning_rate": 3.1454360920350033e-06, "loss": 2.2717, "step": 537360 }, { "epoch": 0.94, "learning_rate": 3.1445641521081766e-06, "loss": 2.3047, "step": 537370 }, { "epoch": 0.94, "learning_rate": 3.1436922121813495e-06, "loss": 2.3806, "step": 537380 }, { "epoch": 0.94, "learning_rate": 3.142820272254523e-06, "loss": 2.2675, "step": 537390 }, { "epoch": 0.94, "learning_rate": 3.1419483323276962e-06, "loss": 2.1566, "step": 537400 }, { "epoch": 0.94, "learning_rate": 3.141076392400869e-06, "loss": 2.2624, "step": 537410 }, { "epoch": 0.94, "learning_rate": 3.1402044524740425e-06, "loss": 2.2903, "step": 537420 }, { "epoch": 0.94, "learning_rate": 3.1393325125472154e-06, "loss": 2.1672, "step": 537430 }, { "epoch": 0.94, "learning_rate": 3.1384605726203888e-06, "loss": 2.2072, "step": 537440 }, { "epoch": 0.94, "learning_rate": 3.1375886326935617e-06, "loss": 2.197, "step": 537450 }, { "epoch": 0.94, "learning_rate": 3.1367166927667355e-06, "loss": 2.2747, "step": 537460 }, { "epoch": 0.94, "learning_rate": 3.135844752839909e-06, "loss": 2.2124, "step": 537470 }, { "epoch": 0.94, "learning_rate": 3.1349728129130817e-06, "loss": 2.2018, "step": 537480 }, { "epoch": 0.94, "learning_rate": 3.134100872986255e-06, "loss": 2.2206, "step": 537490 }, { "epoch": 0.94, "learning_rate": 3.133228933059428e-06, "loss": 2.2808, "step": 537500 }, { "epoch": 0.94, "learning_rate": 3.1323569931326013e-06, "loss": 2.2972, "step": 537510 }, { "epoch": 0.94, "learning_rate": 3.1314850532057747e-06, "loss": 2.2253, "step": 537520 }, { "epoch": 0.94, "learning_rate": 3.1306131132789476e-06, "loss": 2.253, "step": 537530 }, { "epoch": 0.94, "learning_rate": 3.129741173352121e-06, "loss": 2.2628, "step": 537540 }, { "epoch": 0.94, "learning_rate": 3.128869233425294e-06, "loss": 2.2365, "step": 537550 }, { "epoch": 0.94, "learning_rate": 3.1279972934984672e-06, "loss": 2.2695, "step": 537560 }, { "epoch": 0.94, "learning_rate": 3.12712535357164e-06, "loss": 2.2909, "step": 537570 }, { "epoch": 0.94, "learning_rate": 3.1262534136448135e-06, "loss": 2.2352, "step": 537580 }, { "epoch": 0.94, "learning_rate": 3.1253814737179873e-06, "loss": 2.3245, "step": 537590 }, { "epoch": 0.94, "learning_rate": 3.12450953379116e-06, "loss": 2.202, "step": 537600 }, { "epoch": 0.94, "learning_rate": 3.123637593864333e-06, "loss": 2.1498, "step": 537610 }, { "epoch": 0.94, "learning_rate": 3.1227656539375065e-06, "loss": 2.3136, "step": 537620 }, { "epoch": 0.94, "learning_rate": 3.12189371401068e-06, "loss": 2.2406, "step": 537630 }, { "epoch": 0.94, "learning_rate": 3.121021774083853e-06, "loss": 2.2072, "step": 537640 }, { "epoch": 0.94, "learning_rate": 3.120149834157026e-06, "loss": 2.1767, "step": 537650 }, { "epoch": 0.94, "learning_rate": 3.1192778942301994e-06, "loss": 2.3305, "step": 537660 }, { "epoch": 0.94, "learning_rate": 3.1184059543033723e-06, "loss": 2.331, "step": 537670 }, { "epoch": 0.94, "learning_rate": 3.1175340143765457e-06, "loss": 2.2184, "step": 537680 }, { "epoch": 0.94, "learning_rate": 3.116662074449719e-06, "loss": 2.3048, "step": 537690 }, { "epoch": 0.94, "learning_rate": 3.115790134522892e-06, "loss": 2.3394, "step": 537700 }, { "epoch": 0.94, "learning_rate": 3.1149181945960653e-06, "loss": 2.3074, "step": 537710 }, { "epoch": 0.94, "learning_rate": 3.1140462546692386e-06, "loss": 2.1718, "step": 537720 }, { "epoch": 0.94, "learning_rate": 3.1131743147424116e-06, "loss": 2.2154, "step": 537730 }, { "epoch": 0.94, "learning_rate": 3.112302374815585e-06, "loss": 2.2192, "step": 537740 }, { "epoch": 0.94, "learning_rate": 3.111430434888758e-06, "loss": 2.2203, "step": 537750 }, { "epoch": 0.94, "learning_rate": 3.110558494961931e-06, "loss": 2.2006, "step": 537760 }, { "epoch": 0.94, "learning_rate": 3.1096865550351045e-06, "loss": 2.358, "step": 537770 }, { "epoch": 0.94, "learning_rate": 3.108814615108278e-06, "loss": 2.3073, "step": 537780 }, { "epoch": 0.94, "learning_rate": 3.107942675181451e-06, "loss": 2.342, "step": 537790 }, { "epoch": 0.94, "learning_rate": 3.107070735254624e-06, "loss": 2.3046, "step": 537800 }, { "epoch": 0.94, "learning_rate": 3.106198795327797e-06, "loss": 2.3038, "step": 537810 }, { "epoch": 0.94, "learning_rate": 3.1053268554009704e-06, "loss": 2.1727, "step": 537820 }, { "epoch": 0.94, "learning_rate": 3.1044549154741438e-06, "loss": 2.2889, "step": 537830 }, { "epoch": 0.94, "learning_rate": 3.103582975547317e-06, "loss": 2.1305, "step": 537840 }, { "epoch": 0.94, "learning_rate": 3.10271103562049e-06, "loss": 2.1498, "step": 537850 }, { "epoch": 0.94, "learning_rate": 3.1018390956936634e-06, "loss": 2.2472, "step": 537860 }, { "epoch": 0.94, "learning_rate": 3.1009671557668363e-06, "loss": 2.1019, "step": 537870 }, { "epoch": 0.94, "learning_rate": 3.1000952158400096e-06, "loss": 2.2235, "step": 537880 }, { "epoch": 0.94, "learning_rate": 3.099223275913183e-06, "loss": 2.2897, "step": 537890 }, { "epoch": 0.94, "learning_rate": 3.0983513359863563e-06, "loss": 2.279, "step": 537900 }, { "epoch": 0.94, "learning_rate": 3.0974793960595293e-06, "loss": 2.29, "step": 537910 }, { "epoch": 0.94, "learning_rate": 3.0966074561327026e-06, "loss": 2.1617, "step": 537920 }, { "epoch": 0.94, "learning_rate": 3.0957355162058755e-06, "loss": 2.198, "step": 537930 }, { "epoch": 0.94, "learning_rate": 3.094863576279049e-06, "loss": 2.2504, "step": 537940 }, { "epoch": 0.94, "learning_rate": 3.093991636352222e-06, "loss": 2.2537, "step": 537950 }, { "epoch": 0.94, "learning_rate": 3.093119696425395e-06, "loss": 2.1914, "step": 537960 }, { "epoch": 0.94, "learning_rate": 3.0922477564985685e-06, "loss": 2.3215, "step": 537970 }, { "epoch": 0.94, "learning_rate": 3.091375816571742e-06, "loss": 2.3401, "step": 537980 }, { "epoch": 0.94, "learning_rate": 3.0905038766449148e-06, "loss": 2.271, "step": 537990 }, { "epoch": 0.94, "learning_rate": 3.089631936718088e-06, "loss": 2.2241, "step": 538000 }, { "epoch": 0.94, "learning_rate": 3.088759996791261e-06, "loss": 2.2137, "step": 538010 }, { "epoch": 0.94, "learning_rate": 3.0878880568644344e-06, "loss": 2.3792, "step": 538020 }, { "epoch": 0.94, "learning_rate": 3.0870161169376077e-06, "loss": 2.3484, "step": 538030 }, { "epoch": 0.94, "learning_rate": 3.086144177010781e-06, "loss": 2.2959, "step": 538040 }, { "epoch": 0.94, "learning_rate": 3.085272237083954e-06, "loss": 2.3472, "step": 538050 }, { "epoch": 0.94, "learning_rate": 3.0844002971571273e-06, "loss": 2.2093, "step": 538060 }, { "epoch": 0.94, "learning_rate": 3.0835283572303003e-06, "loss": 2.2218, "step": 538070 }, { "epoch": 0.94, "learning_rate": 3.0826564173034736e-06, "loss": 2.2519, "step": 538080 }, { "epoch": 0.94, "learning_rate": 3.081784477376647e-06, "loss": 2.2299, "step": 538090 }, { "epoch": 0.94, "learning_rate": 3.0809125374498203e-06, "loss": 2.333, "step": 538100 }, { "epoch": 0.94, "learning_rate": 3.0800405975229932e-06, "loss": 2.2391, "step": 538110 }, { "epoch": 0.94, "learning_rate": 3.0791686575961666e-06, "loss": 2.2007, "step": 538120 }, { "epoch": 0.94, "learning_rate": 3.0782967176693395e-06, "loss": 2.335, "step": 538130 }, { "epoch": 0.94, "learning_rate": 3.077424777742513e-06, "loss": 2.2149, "step": 538140 }, { "epoch": 0.94, "learning_rate": 3.0765528378156858e-06, "loss": 2.2026, "step": 538150 }, { "epoch": 0.94, "learning_rate": 3.0756808978888595e-06, "loss": 2.2326, "step": 538160 }, { "epoch": 0.94, "learning_rate": 3.0748089579620325e-06, "loss": 2.2673, "step": 538170 }, { "epoch": 0.94, "learning_rate": 3.073937018035206e-06, "loss": 2.156, "step": 538180 }, { "epoch": 0.94, "learning_rate": 3.0730650781083787e-06, "loss": 2.3259, "step": 538190 }, { "epoch": 0.94, "learning_rate": 3.072193138181552e-06, "loss": 2.3315, "step": 538200 }, { "epoch": 0.94, "learning_rate": 3.071321198254725e-06, "loss": 2.336, "step": 538210 }, { "epoch": 0.94, "learning_rate": 3.0704492583278983e-06, "loss": 2.2484, "step": 538220 }, { "epoch": 0.94, "learning_rate": 3.0695773184010717e-06, "loss": 2.2614, "step": 538230 }, { "epoch": 0.94, "learning_rate": 3.068705378474245e-06, "loss": 2.1838, "step": 538240 }, { "epoch": 0.94, "learning_rate": 3.067833438547418e-06, "loss": 2.3151, "step": 538250 }, { "epoch": 0.94, "learning_rate": 3.0669614986205913e-06, "loss": 2.4027, "step": 538260 }, { "epoch": 0.94, "learning_rate": 3.0660895586937642e-06, "loss": 2.2875, "step": 538270 }, { "epoch": 0.94, "learning_rate": 3.0652176187669376e-06, "loss": 2.2285, "step": 538280 }, { "epoch": 0.94, "learning_rate": 3.064345678840111e-06, "loss": 2.2681, "step": 538290 }, { "epoch": 0.94, "learning_rate": 3.0634737389132843e-06, "loss": 2.2327, "step": 538300 }, { "epoch": 0.94, "learning_rate": 3.062601798986457e-06, "loss": 2.3268, "step": 538310 }, { "epoch": 0.94, "learning_rate": 3.0617298590596305e-06, "loss": 2.2679, "step": 538320 }, { "epoch": 0.94, "learning_rate": 3.0608579191328035e-06, "loss": 2.1337, "step": 538330 }, { "epoch": 0.94, "learning_rate": 3.059985979205977e-06, "loss": 2.2828, "step": 538340 }, { "epoch": 0.94, "learning_rate": 3.0591140392791497e-06, "loss": 2.2102, "step": 538350 }, { "epoch": 0.94, "learning_rate": 3.0582420993523235e-06, "loss": 2.2311, "step": 538360 }, { "epoch": 0.94, "learning_rate": 3.0573701594254964e-06, "loss": 2.2303, "step": 538370 }, { "epoch": 0.94, "learning_rate": 3.0564982194986698e-06, "loss": 2.3625, "step": 538380 }, { "epoch": 0.94, "learning_rate": 3.0556262795718427e-06, "loss": 2.2991, "step": 538390 }, { "epoch": 0.94, "learning_rate": 3.054754339645016e-06, "loss": 2.2171, "step": 538400 }, { "epoch": 0.94, "learning_rate": 3.053882399718189e-06, "loss": 2.2216, "step": 538410 }, { "epoch": 0.94, "learning_rate": 3.0530104597913627e-06, "loss": 2.2384, "step": 538420 }, { "epoch": 0.94, "learning_rate": 3.0521385198645357e-06, "loss": 2.203, "step": 538430 }, { "epoch": 0.94, "learning_rate": 3.051266579937709e-06, "loss": 2.3495, "step": 538440 }, { "epoch": 0.94, "learning_rate": 3.050394640010882e-06, "loss": 2.3383, "step": 538450 }, { "epoch": 0.94, "learning_rate": 3.0495227000840553e-06, "loss": 2.2315, "step": 538460 }, { "epoch": 0.94, "learning_rate": 3.048650760157228e-06, "loss": 2.2375, "step": 538470 }, { "epoch": 0.94, "learning_rate": 3.0477788202304015e-06, "loss": 2.325, "step": 538480 }, { "epoch": 0.94, "learning_rate": 3.046906880303575e-06, "loss": 2.1858, "step": 538490 }, { "epoch": 0.94, "learning_rate": 3.0460349403767482e-06, "loss": 2.2176, "step": 538500 }, { "epoch": 0.94, "learning_rate": 3.045163000449921e-06, "loss": 2.362, "step": 538510 }, { "epoch": 0.94, "learning_rate": 3.0442910605230945e-06, "loss": 2.231, "step": 538520 }, { "epoch": 0.94, "learning_rate": 3.0434191205962674e-06, "loss": 2.2626, "step": 538530 }, { "epoch": 0.94, "learning_rate": 3.0425471806694408e-06, "loss": 2.0989, "step": 538540 }, { "epoch": 0.94, "learning_rate": 3.0416752407426137e-06, "loss": 2.2577, "step": 538550 }, { "epoch": 0.94, "learning_rate": 3.0408033008157875e-06, "loss": 2.231, "step": 538560 }, { "epoch": 0.94, "learning_rate": 3.0399313608889604e-06, "loss": 2.2074, "step": 538570 }, { "epoch": 0.94, "learning_rate": 3.0390594209621337e-06, "loss": 2.268, "step": 538580 }, { "epoch": 0.94, "learning_rate": 3.0381874810353067e-06, "loss": 2.2338, "step": 538590 }, { "epoch": 0.94, "learning_rate": 3.03731554110848e-06, "loss": 2.2253, "step": 538600 }, { "epoch": 0.94, "learning_rate": 3.036443601181653e-06, "loss": 2.36, "step": 538610 }, { "epoch": 0.94, "learning_rate": 3.0355716612548267e-06, "loss": 2.1486, "step": 538620 }, { "epoch": 0.94, "learning_rate": 3.0346997213279996e-06, "loss": 2.2602, "step": 538630 }, { "epoch": 0.94, "learning_rate": 3.033827781401173e-06, "loss": 2.2557, "step": 538640 }, { "epoch": 0.94, "learning_rate": 3.032955841474346e-06, "loss": 2.2848, "step": 538650 }, { "epoch": 0.94, "learning_rate": 3.0320839015475192e-06, "loss": 2.3446, "step": 538660 }, { "epoch": 0.94, "learning_rate": 3.031211961620692e-06, "loss": 2.2588, "step": 538670 }, { "epoch": 0.94, "learning_rate": 3.0303400216938655e-06, "loss": 2.2247, "step": 538680 }, { "epoch": 0.94, "learning_rate": 3.029468081767039e-06, "loss": 2.317, "step": 538690 }, { "epoch": 0.94, "learning_rate": 3.028596141840212e-06, "loss": 2.1933, "step": 538700 }, { "epoch": 0.94, "learning_rate": 3.027724201913385e-06, "loss": 2.341, "step": 538710 }, { "epoch": 0.94, "learning_rate": 3.0268522619865585e-06, "loss": 2.1921, "step": 538720 }, { "epoch": 0.94, "learning_rate": 3.0259803220597314e-06, "loss": 2.2067, "step": 538730 }, { "epoch": 0.94, "learning_rate": 3.0251083821329047e-06, "loss": 2.2744, "step": 538740 }, { "epoch": 0.94, "learning_rate": 3.024236442206078e-06, "loss": 2.2983, "step": 538750 }, { "epoch": 0.94, "learning_rate": 3.0233645022792514e-06, "loss": 2.2492, "step": 538760 }, { "epoch": 0.94, "learning_rate": 3.0224925623524243e-06, "loss": 2.2708, "step": 538770 }, { "epoch": 0.94, "learning_rate": 3.0216206224255977e-06, "loss": 2.3082, "step": 538780 }, { "epoch": 0.94, "learning_rate": 3.0207486824987706e-06, "loss": 2.2357, "step": 538790 }, { "epoch": 0.94, "learning_rate": 3.019876742571944e-06, "loss": 2.2389, "step": 538800 }, { "epoch": 0.94, "learning_rate": 3.019004802645117e-06, "loss": 2.2049, "step": 538810 }, { "epoch": 0.94, "learning_rate": 3.0181328627182907e-06, "loss": 2.2336, "step": 538820 }, { "epoch": 0.94, "learning_rate": 3.0172609227914636e-06, "loss": 2.2695, "step": 538830 }, { "epoch": 0.94, "learning_rate": 3.016388982864637e-06, "loss": 2.1233, "step": 538840 }, { "epoch": 0.94, "learning_rate": 3.01551704293781e-06, "loss": 2.1803, "step": 538850 }, { "epoch": 0.94, "learning_rate": 3.014645103010983e-06, "loss": 2.2154, "step": 538860 }, { "epoch": 0.94, "learning_rate": 3.013773163084156e-06, "loss": 2.1458, "step": 538870 }, { "epoch": 0.94, "learning_rate": 3.0129012231573295e-06, "loss": 2.2503, "step": 538880 }, { "epoch": 0.94, "learning_rate": 3.012029283230503e-06, "loss": 2.1722, "step": 538890 }, { "epoch": 0.94, "learning_rate": 3.011157343303676e-06, "loss": 2.2256, "step": 538900 }, { "epoch": 0.94, "learning_rate": 3.010285403376849e-06, "loss": 2.326, "step": 538910 }, { "epoch": 0.94, "learning_rate": 3.0094134634500224e-06, "loss": 2.2235, "step": 538920 }, { "epoch": 0.94, "learning_rate": 3.0085415235231953e-06, "loss": 2.3167, "step": 538930 }, { "epoch": 0.94, "learning_rate": 3.0076695835963687e-06, "loss": 2.2821, "step": 538940 }, { "epoch": 0.94, "learning_rate": 3.006797643669542e-06, "loss": 2.3024, "step": 538950 }, { "epoch": 0.94, "learning_rate": 3.0059257037427154e-06, "loss": 2.168, "step": 538960 }, { "epoch": 0.94, "learning_rate": 3.0050537638158883e-06, "loss": 2.2276, "step": 538970 }, { "epoch": 0.94, "learning_rate": 3.0041818238890617e-06, "loss": 2.2684, "step": 538980 }, { "epoch": 0.94, "learning_rate": 3.0033098839622346e-06, "loss": 2.2646, "step": 538990 }, { "epoch": 0.94, "learning_rate": 3.002437944035408e-06, "loss": 2.302, "step": 539000 }, { "epoch": 0.94, "learning_rate": 3.001566004108581e-06, "loss": 2.2066, "step": 539010 }, { "epoch": 0.94, "learning_rate": 3.0006940641817546e-06, "loss": 2.2302, "step": 539020 }, { "epoch": 0.94, "learning_rate": 2.9998221242549275e-06, "loss": 2.2653, "step": 539030 }, { "epoch": 0.94, "learning_rate": 2.998950184328101e-06, "loss": 2.0885, "step": 539040 }, { "epoch": 0.94, "learning_rate": 2.998078244401274e-06, "loss": 2.3462, "step": 539050 }, { "epoch": 0.94, "learning_rate": 2.997206304474447e-06, "loss": 2.3821, "step": 539060 }, { "epoch": 0.94, "learning_rate": 2.99633436454762e-06, "loss": 2.2756, "step": 539070 }, { "epoch": 0.94, "learning_rate": 2.9954624246207934e-06, "loss": 2.1996, "step": 539080 }, { "epoch": 0.94, "learning_rate": 2.9945904846939668e-06, "loss": 2.3177, "step": 539090 }, { "epoch": 0.94, "learning_rate": 2.99371854476714e-06, "loss": 2.1772, "step": 539100 }, { "epoch": 0.94, "learning_rate": 2.992846604840313e-06, "loss": 2.1176, "step": 539110 }, { "epoch": 0.94, "learning_rate": 2.9919746649134864e-06, "loss": 2.2484, "step": 539120 }, { "epoch": 0.94, "learning_rate": 2.9911027249866593e-06, "loss": 2.1558, "step": 539130 }, { "epoch": 0.94, "learning_rate": 2.9902307850598327e-06, "loss": 2.2883, "step": 539140 }, { "epoch": 0.94, "learning_rate": 2.989358845133006e-06, "loss": 2.2449, "step": 539150 }, { "epoch": 0.94, "learning_rate": 2.9884869052061794e-06, "loss": 2.235, "step": 539160 }, { "epoch": 0.94, "learning_rate": 2.9876149652793523e-06, "loss": 2.2053, "step": 539170 }, { "epoch": 0.94, "learning_rate": 2.9867430253525256e-06, "loss": 2.2278, "step": 539180 }, { "epoch": 0.94, "learning_rate": 2.9858710854256985e-06, "loss": 2.3148, "step": 539190 }, { "epoch": 0.94, "learning_rate": 2.984999145498872e-06, "loss": 2.1276, "step": 539200 }, { "epoch": 0.94, "learning_rate": 2.984127205572045e-06, "loss": 2.2232, "step": 539210 }, { "epoch": 0.94, "learning_rate": 2.9832552656452186e-06, "loss": 2.1979, "step": 539220 }, { "epoch": 0.94, "learning_rate": 2.9823833257183915e-06, "loss": 2.2856, "step": 539230 }, { "epoch": 0.94, "learning_rate": 2.981511385791565e-06, "loss": 2.3332, "step": 539240 }, { "epoch": 0.94, "learning_rate": 2.9806394458647378e-06, "loss": 2.239, "step": 539250 }, { "epoch": 0.94, "learning_rate": 2.979767505937911e-06, "loss": 2.2871, "step": 539260 }, { "epoch": 0.94, "learning_rate": 2.978895566011084e-06, "loss": 2.3672, "step": 539270 }, { "epoch": 0.94, "learning_rate": 2.9780236260842574e-06, "loss": 2.3777, "step": 539280 }, { "epoch": 0.94, "learning_rate": 2.9771516861574307e-06, "loss": 2.2182, "step": 539290 }, { "epoch": 0.94, "learning_rate": 2.976279746230604e-06, "loss": 2.1132, "step": 539300 }, { "epoch": 0.94, "learning_rate": 2.975407806303777e-06, "loss": 2.2654, "step": 539310 }, { "epoch": 0.94, "learning_rate": 2.9745358663769504e-06, "loss": 2.1756, "step": 539320 }, { "epoch": 0.94, "learning_rate": 2.9736639264501233e-06, "loss": 2.3638, "step": 539330 }, { "epoch": 0.94, "learning_rate": 2.9727919865232966e-06, "loss": 2.3133, "step": 539340 }, { "epoch": 0.94, "learning_rate": 2.97192004659647e-06, "loss": 2.128, "step": 539350 }, { "epoch": 0.94, "learning_rate": 2.9710481066696433e-06, "loss": 2.2716, "step": 539360 }, { "epoch": 0.94, "learning_rate": 2.9701761667428162e-06, "loss": 2.2794, "step": 539370 }, { "epoch": 0.94, "learning_rate": 2.9693042268159896e-06, "loss": 2.2574, "step": 539380 }, { "epoch": 0.94, "learning_rate": 2.9684322868891625e-06, "loss": 2.3982, "step": 539390 }, { "epoch": 0.94, "learning_rate": 2.967560346962336e-06, "loss": 2.2724, "step": 539400 }, { "epoch": 0.94, "learning_rate": 2.9666884070355088e-06, "loss": 2.097, "step": 539410 }, { "epoch": 0.94, "learning_rate": 2.9658164671086825e-06, "loss": 2.2299, "step": 539420 }, { "epoch": 0.94, "learning_rate": 2.9649445271818555e-06, "loss": 2.2144, "step": 539430 }, { "epoch": 0.94, "learning_rate": 2.964072587255029e-06, "loss": 2.1987, "step": 539440 }, { "epoch": 0.94, "learning_rate": 2.9632006473282017e-06, "loss": 2.2401, "step": 539450 }, { "epoch": 0.94, "learning_rate": 2.962328707401375e-06, "loss": 2.2864, "step": 539460 }, { "epoch": 0.94, "learning_rate": 2.961456767474548e-06, "loss": 2.3012, "step": 539470 }, { "epoch": 0.94, "learning_rate": 2.9605848275477214e-06, "loss": 2.25, "step": 539480 }, { "epoch": 0.94, "learning_rate": 2.9597128876208947e-06, "loss": 2.2975, "step": 539490 }, { "epoch": 0.94, "learning_rate": 2.958840947694068e-06, "loss": 2.222, "step": 539500 }, { "epoch": 0.94, "learning_rate": 2.957969007767241e-06, "loss": 2.3901, "step": 539510 }, { "epoch": 0.94, "learning_rate": 2.9570970678404143e-06, "loss": 2.2003, "step": 539520 }, { "epoch": 0.94, "learning_rate": 2.9562251279135872e-06, "loss": 2.2822, "step": 539530 }, { "epoch": 0.94, "learning_rate": 2.9553531879867606e-06, "loss": 2.2553, "step": 539540 }, { "epoch": 0.94, "learning_rate": 2.954481248059934e-06, "loss": 2.2627, "step": 539550 }, { "epoch": 0.94, "learning_rate": 2.9536093081331073e-06, "loss": 2.3358, "step": 539560 }, { "epoch": 0.94, "learning_rate": 2.95273736820628e-06, "loss": 2.0655, "step": 539570 }, { "epoch": 0.94, "learning_rate": 2.9518654282794535e-06, "loss": 2.228, "step": 539580 }, { "epoch": 0.94, "learning_rate": 2.9509934883526265e-06, "loss": 2.1838, "step": 539590 }, { "epoch": 0.94, "learning_rate": 2.9501215484258e-06, "loss": 2.256, "step": 539600 }, { "epoch": 0.94, "learning_rate": 2.9492496084989727e-06, "loss": 2.2456, "step": 539610 }, { "epoch": 0.94, "learning_rate": 2.9483776685721465e-06, "loss": 2.3102, "step": 539620 }, { "epoch": 0.94, "learning_rate": 2.9475057286453194e-06, "loss": 2.2184, "step": 539630 }, { "epoch": 0.94, "learning_rate": 2.9466337887184928e-06, "loss": 2.2501, "step": 539640 }, { "epoch": 0.94, "learning_rate": 2.9457618487916657e-06, "loss": 2.2602, "step": 539650 }, { "epoch": 0.94, "learning_rate": 2.944889908864839e-06, "loss": 2.324, "step": 539660 }, { "epoch": 0.94, "learning_rate": 2.944017968938012e-06, "loss": 2.2136, "step": 539670 }, { "epoch": 0.94, "learning_rate": 2.9431460290111853e-06, "loss": 2.217, "step": 539680 }, { "epoch": 0.94, "learning_rate": 2.9422740890843587e-06, "loss": 2.3251, "step": 539690 }, { "epoch": 0.94, "learning_rate": 2.941402149157532e-06, "loss": 2.2054, "step": 539700 }, { "epoch": 0.94, "learning_rate": 2.940530209230705e-06, "loss": 2.1712, "step": 539710 }, { "epoch": 0.94, "learning_rate": 2.9396582693038783e-06, "loss": 2.1703, "step": 539720 }, { "epoch": 0.94, "learning_rate": 2.938786329377051e-06, "loss": 2.2816, "step": 539730 }, { "epoch": 0.94, "learning_rate": 2.9379143894502245e-06, "loss": 2.2571, "step": 539740 }, { "epoch": 0.94, "learning_rate": 2.937042449523398e-06, "loss": 2.2897, "step": 539750 }, { "epoch": 0.94, "learning_rate": 2.9361705095965712e-06, "loss": 2.2736, "step": 539760 }, { "epoch": 0.94, "learning_rate": 2.935298569669744e-06, "loss": 2.3179, "step": 539770 }, { "epoch": 0.94, "learning_rate": 2.9344266297429175e-06, "loss": 2.1965, "step": 539780 }, { "epoch": 0.94, "learning_rate": 2.9335546898160904e-06, "loss": 2.3385, "step": 539790 }, { "epoch": 0.94, "learning_rate": 2.9326827498892638e-06, "loss": 2.2129, "step": 539800 }, { "epoch": 0.94, "learning_rate": 2.9318108099624367e-06, "loss": 2.2405, "step": 539810 }, { "epoch": 0.94, "learning_rate": 2.9309388700356105e-06, "loss": 2.2127, "step": 539820 }, { "epoch": 0.94, "learning_rate": 2.9300669301087834e-06, "loss": 2.3267, "step": 539830 }, { "epoch": 0.94, "learning_rate": 2.9291949901819567e-06, "loss": 2.1402, "step": 539840 }, { "epoch": 0.94, "learning_rate": 2.9283230502551297e-06, "loss": 2.2536, "step": 539850 }, { "epoch": 0.94, "learning_rate": 2.927451110328303e-06, "loss": 2.2806, "step": 539860 }, { "epoch": 0.94, "learning_rate": 2.926579170401476e-06, "loss": 2.2737, "step": 539870 }, { "epoch": 0.94, "learning_rate": 2.9257072304746493e-06, "loss": 2.2023, "step": 539880 }, { "epoch": 0.94, "learning_rate": 2.9248352905478226e-06, "loss": 2.138, "step": 539890 }, { "epoch": 0.94, "learning_rate": 2.923963350620996e-06, "loss": 2.207, "step": 539900 }, { "epoch": 0.94, "learning_rate": 2.923091410694169e-06, "loss": 2.1866, "step": 539910 }, { "epoch": 0.94, "learning_rate": 2.9222194707673422e-06, "loss": 2.1378, "step": 539920 }, { "epoch": 0.94, "learning_rate": 2.921347530840515e-06, "loss": 2.2999, "step": 539930 }, { "epoch": 0.94, "learning_rate": 2.9204755909136885e-06, "loss": 2.3994, "step": 539940 }, { "epoch": 0.94, "learning_rate": 2.919603650986862e-06, "loss": 2.2017, "step": 539950 }, { "epoch": 0.94, "learning_rate": 2.918731711060035e-06, "loss": 2.2468, "step": 539960 }, { "epoch": 0.94, "learning_rate": 2.917859771133208e-06, "loss": 2.2979, "step": 539970 }, { "epoch": 0.94, "learning_rate": 2.9169878312063815e-06, "loss": 2.3121, "step": 539980 }, { "epoch": 0.94, "learning_rate": 2.9161158912795544e-06, "loss": 2.2874, "step": 539990 }, { "epoch": 0.94, "learning_rate": 2.9152439513527277e-06, "loss": 2.2134, "step": 540000 }, { "epoch": 0.94, "learning_rate": 2.9143720114259007e-06, "loss": 2.2113, "step": 540010 }, { "epoch": 0.94, "learning_rate": 2.9135000714990744e-06, "loss": 2.2596, "step": 540020 }, { "epoch": 0.94, "learning_rate": 2.9126281315722474e-06, "loss": 2.3426, "step": 540030 }, { "epoch": 0.94, "learning_rate": 2.9117561916454207e-06, "loss": 2.1943, "step": 540040 }, { "epoch": 0.94, "learning_rate": 2.9108842517185936e-06, "loss": 2.2508, "step": 540050 }, { "epoch": 0.94, "learning_rate": 2.910012311791767e-06, "loss": 2.2456, "step": 540060 }, { "epoch": 0.94, "learning_rate": 2.90914037186494e-06, "loss": 2.3432, "step": 540070 }, { "epoch": 0.94, "learning_rate": 2.9082684319381132e-06, "loss": 2.282, "step": 540080 }, { "epoch": 0.94, "learning_rate": 2.9073964920112866e-06, "loss": 2.151, "step": 540090 }, { "epoch": 0.94, "learning_rate": 2.90652455208446e-06, "loss": 2.2381, "step": 540100 }, { "epoch": 0.94, "learning_rate": 2.905652612157633e-06, "loss": 2.3599, "step": 540110 }, { "epoch": 0.94, "learning_rate": 2.904780672230806e-06, "loss": 2.343, "step": 540120 }, { "epoch": 0.94, "learning_rate": 2.903908732303979e-06, "loss": 2.2384, "step": 540130 }, { "epoch": 0.94, "learning_rate": 2.9030367923771525e-06, "loss": 2.1882, "step": 540140 }, { "epoch": 0.94, "learning_rate": 2.902164852450326e-06, "loss": 2.2624, "step": 540150 }, { "epoch": 0.94, "learning_rate": 2.901292912523499e-06, "loss": 2.1403, "step": 540160 }, { "epoch": 0.94, "learning_rate": 2.900420972596672e-06, "loss": 2.2205, "step": 540170 }, { "epoch": 0.94, "learning_rate": 2.8995490326698454e-06, "loss": 2.3256, "step": 540180 }, { "epoch": 0.94, "learning_rate": 2.8986770927430184e-06, "loss": 2.2557, "step": 540190 }, { "epoch": 0.94, "learning_rate": 2.8978051528161917e-06, "loss": 2.1819, "step": 540200 }, { "epoch": 0.94, "learning_rate": 2.8969332128893646e-06, "loss": 2.2904, "step": 540210 }, { "epoch": 0.94, "learning_rate": 2.8960612729625384e-06, "loss": 2.2203, "step": 540220 }, { "epoch": 0.94, "learning_rate": 2.8951893330357113e-06, "loss": 2.2878, "step": 540230 }, { "epoch": 0.94, "learning_rate": 2.8943173931088847e-06, "loss": 2.2856, "step": 540240 }, { "epoch": 0.94, "learning_rate": 2.8934454531820576e-06, "loss": 2.2974, "step": 540250 }, { "epoch": 0.94, "learning_rate": 2.892573513255231e-06, "loss": 2.3288, "step": 540260 }, { "epoch": 0.94, "learning_rate": 2.891701573328404e-06, "loss": 2.3138, "step": 540270 }, { "epoch": 0.94, "learning_rate": 2.8908296334015776e-06, "loss": 2.2988, "step": 540280 }, { "epoch": 0.94, "learning_rate": 2.8899576934747506e-06, "loss": 2.2295, "step": 540290 }, { "epoch": 0.94, "learning_rate": 2.889085753547924e-06, "loss": 2.2917, "step": 540300 }, { "epoch": 0.94, "learning_rate": 2.888213813621097e-06, "loss": 2.1653, "step": 540310 }, { "epoch": 0.94, "learning_rate": 2.88734187369427e-06, "loss": 2.309, "step": 540320 }, { "epoch": 0.94, "learning_rate": 2.886469933767443e-06, "loss": 2.299, "step": 540330 }, { "epoch": 0.94, "learning_rate": 2.8855979938406164e-06, "loss": 2.2283, "step": 540340 }, { "epoch": 0.94, "learning_rate": 2.8847260539137898e-06, "loss": 2.334, "step": 540350 }, { "epoch": 0.94, "learning_rate": 2.883854113986963e-06, "loss": 2.2694, "step": 540360 }, { "epoch": 0.94, "learning_rate": 2.882982174060136e-06, "loss": 2.2008, "step": 540370 }, { "epoch": 0.94, "learning_rate": 2.8821102341333094e-06, "loss": 2.3084, "step": 540380 }, { "epoch": 0.94, "learning_rate": 2.8812382942064823e-06, "loss": 2.2588, "step": 540390 }, { "epoch": 0.94, "learning_rate": 2.8803663542796557e-06, "loss": 2.3873, "step": 540400 }, { "epoch": 0.94, "learning_rate": 2.8794944143528286e-06, "loss": 2.2096, "step": 540410 }, { "epoch": 0.94, "learning_rate": 2.8786224744260024e-06, "loss": 2.3244, "step": 540420 }, { "epoch": 0.94, "learning_rate": 2.8777505344991753e-06, "loss": 2.1248, "step": 540430 }, { "epoch": 0.94, "learning_rate": 2.8768785945723486e-06, "loss": 2.2167, "step": 540440 }, { "epoch": 0.94, "learning_rate": 2.8760066546455216e-06, "loss": 2.2877, "step": 540450 }, { "epoch": 0.94, "learning_rate": 2.875134714718695e-06, "loss": 2.3946, "step": 540460 }, { "epoch": 0.94, "learning_rate": 2.874262774791868e-06, "loss": 2.2434, "step": 540470 }, { "epoch": 0.94, "learning_rate": 2.8733908348650416e-06, "loss": 2.2508, "step": 540480 }, { "epoch": 0.94, "learning_rate": 2.8725188949382145e-06, "loss": 2.421, "step": 540490 }, { "epoch": 0.94, "learning_rate": 2.871646955011388e-06, "loss": 2.2716, "step": 540500 }, { "epoch": 0.94, "learning_rate": 2.8707750150845608e-06, "loss": 2.3113, "step": 540510 }, { "epoch": 0.94, "learning_rate": 2.869903075157734e-06, "loss": 2.2386, "step": 540520 }, { "epoch": 0.94, "learning_rate": 2.869031135230907e-06, "loss": 2.2159, "step": 540530 }, { "epoch": 0.94, "learning_rate": 2.8681591953040804e-06, "loss": 2.3384, "step": 540540 }, { "epoch": 0.94, "learning_rate": 2.8672872553772537e-06, "loss": 2.2309, "step": 540550 }, { "epoch": 0.94, "learning_rate": 2.866415315450427e-06, "loss": 2.2789, "step": 540560 }, { "epoch": 0.94, "learning_rate": 2.8655433755236e-06, "loss": 2.3167, "step": 540570 }, { "epoch": 0.94, "learning_rate": 2.8646714355967734e-06, "loss": 2.2653, "step": 540580 }, { "epoch": 0.94, "learning_rate": 2.8637994956699463e-06, "loss": 2.3175, "step": 540590 }, { "epoch": 0.94, "learning_rate": 2.8629275557431196e-06, "loss": 2.2194, "step": 540600 }, { "epoch": 0.94, "learning_rate": 2.8620556158162926e-06, "loss": 2.2829, "step": 540610 }, { "epoch": 0.94, "learning_rate": 2.8611836758894663e-06, "loss": 2.3105, "step": 540620 }, { "epoch": 0.94, "learning_rate": 2.8603117359626392e-06, "loss": 2.2302, "step": 540630 }, { "epoch": 0.94, "learning_rate": 2.8594397960358126e-06, "loss": 2.2409, "step": 540640 }, { "epoch": 0.94, "learning_rate": 2.8585678561089855e-06, "loss": 2.1455, "step": 540650 }, { "epoch": 0.94, "learning_rate": 2.857695916182159e-06, "loss": 2.186, "step": 540660 }, { "epoch": 0.94, "learning_rate": 2.8568239762553318e-06, "loss": 2.4162, "step": 540670 }, { "epoch": 0.94, "learning_rate": 2.8559520363285056e-06, "loss": 2.2992, "step": 540680 }, { "epoch": 0.94, "learning_rate": 2.8550800964016785e-06, "loss": 2.3027, "step": 540690 }, { "epoch": 0.94, "learning_rate": 2.854208156474852e-06, "loss": 2.29, "step": 540700 }, { "epoch": 0.94, "learning_rate": 2.8533362165480247e-06, "loss": 2.3895, "step": 540710 }, { "epoch": 0.94, "learning_rate": 2.852464276621198e-06, "loss": 2.3049, "step": 540720 }, { "epoch": 0.94, "learning_rate": 2.851592336694371e-06, "loss": 2.265, "step": 540730 }, { "epoch": 0.94, "learning_rate": 2.8507203967675444e-06, "loss": 2.3475, "step": 540740 }, { "epoch": 0.94, "learning_rate": 2.8498484568407177e-06, "loss": 2.261, "step": 540750 }, { "epoch": 0.94, "learning_rate": 2.848976516913891e-06, "loss": 2.241, "step": 540760 }, { "epoch": 0.94, "learning_rate": 2.848104576987064e-06, "loss": 2.2555, "step": 540770 }, { "epoch": 0.94, "learning_rate": 2.8472326370602373e-06, "loss": 2.2443, "step": 540780 }, { "epoch": 0.94, "learning_rate": 2.8463606971334102e-06, "loss": 2.272, "step": 540790 }, { "epoch": 0.94, "learning_rate": 2.8454887572065836e-06, "loss": 2.2289, "step": 540800 }, { "epoch": 0.94, "learning_rate": 2.8446168172797565e-06, "loss": 2.1593, "step": 540810 }, { "epoch": 0.94, "learning_rate": 2.8437448773529303e-06, "loss": 2.3521, "step": 540820 }, { "epoch": 0.94, "learning_rate": 2.842872937426103e-06, "loss": 2.2919, "step": 540830 }, { "epoch": 0.94, "learning_rate": 2.8420009974992766e-06, "loss": 2.2447, "step": 540840 }, { "epoch": 0.94, "learning_rate": 2.8411290575724495e-06, "loss": 2.3496, "step": 540850 }, { "epoch": 0.94, "learning_rate": 2.840257117645623e-06, "loss": 2.3239, "step": 540860 }, { "epoch": 0.94, "learning_rate": 2.8393851777187957e-06, "loss": 2.2108, "step": 540870 }, { "epoch": 0.94, "learning_rate": 2.8385132377919695e-06, "loss": 2.2232, "step": 540880 }, { "epoch": 0.94, "learning_rate": 2.8376412978651424e-06, "loss": 2.2325, "step": 540890 }, { "epoch": 0.94, "learning_rate": 2.836769357938316e-06, "loss": 2.2405, "step": 540900 }, { "epoch": 0.94, "learning_rate": 2.8358974180114887e-06, "loss": 2.2198, "step": 540910 }, { "epoch": 0.94, "learning_rate": 2.835025478084662e-06, "loss": 2.2733, "step": 540920 }, { "epoch": 0.94, "learning_rate": 2.834153538157835e-06, "loss": 2.1588, "step": 540930 }, { "epoch": 0.94, "learning_rate": 2.8332815982310083e-06, "loss": 2.1059, "step": 540940 }, { "epoch": 0.94, "learning_rate": 2.8324096583041817e-06, "loss": 2.2738, "step": 540950 }, { "epoch": 0.94, "learning_rate": 2.831537718377355e-06, "loss": 2.2489, "step": 540960 }, { "epoch": 0.94, "learning_rate": 2.830665778450528e-06, "loss": 2.2083, "step": 540970 }, { "epoch": 0.94, "learning_rate": 2.8297938385237013e-06, "loss": 2.2335, "step": 540980 }, { "epoch": 0.94, "learning_rate": 2.8289218985968742e-06, "loss": 2.1287, "step": 540990 }, { "epoch": 0.94, "learning_rate": 2.8280499586700476e-06, "loss": 2.2468, "step": 541000 }, { "epoch": 0.94, "learning_rate": 2.8271780187432205e-06, "loss": 2.3236, "step": 541010 }, { "epoch": 0.94, "learning_rate": 2.8263060788163943e-06, "loss": 2.3914, "step": 541020 }, { "epoch": 0.94, "learning_rate": 2.825434138889567e-06, "loss": 2.2496, "step": 541030 }, { "epoch": 0.94, "learning_rate": 2.8245621989627405e-06, "loss": 2.1572, "step": 541040 }, { "epoch": 0.94, "learning_rate": 2.8236902590359134e-06, "loss": 2.2968, "step": 541050 }, { "epoch": 0.94, "learning_rate": 2.822818319109087e-06, "loss": 2.2623, "step": 541060 }, { "epoch": 0.94, "learning_rate": 2.8219463791822597e-06, "loss": 2.2851, "step": 541070 }, { "epoch": 0.94, "learning_rate": 2.8210744392554335e-06, "loss": 2.1921, "step": 541080 }, { "epoch": 0.94, "learning_rate": 2.8202024993286064e-06, "loss": 2.2444, "step": 541090 }, { "epoch": 0.94, "learning_rate": 2.8193305594017798e-06, "loss": 2.2458, "step": 541100 }, { "epoch": 0.94, "learning_rate": 2.8184586194749527e-06, "loss": 2.1417, "step": 541110 }, { "epoch": 0.94, "learning_rate": 2.817586679548126e-06, "loss": 2.2236, "step": 541120 }, { "epoch": 0.94, "learning_rate": 2.816714739621299e-06, "loss": 2.2748, "step": 541130 }, { "epoch": 0.94, "learning_rate": 2.8158427996944723e-06, "loss": 2.3522, "step": 541140 }, { "epoch": 0.94, "learning_rate": 2.8149708597676456e-06, "loss": 2.2961, "step": 541150 }, { "epoch": 0.94, "learning_rate": 2.814098919840819e-06, "loss": 2.2983, "step": 541160 }, { "epoch": 0.94, "learning_rate": 2.813226979913992e-06, "loss": 2.3057, "step": 541170 }, { "epoch": 0.94, "learning_rate": 2.8123550399871653e-06, "loss": 2.1915, "step": 541180 }, { "epoch": 0.94, "learning_rate": 2.811483100060338e-06, "loss": 2.1937, "step": 541190 }, { "epoch": 0.94, "learning_rate": 2.8106111601335115e-06, "loss": 2.2664, "step": 541200 }, { "epoch": 0.94, "learning_rate": 2.8097392202066844e-06, "loss": 2.1822, "step": 541210 }, { "epoch": 0.94, "learning_rate": 2.8088672802798582e-06, "loss": 2.3907, "step": 541220 }, { "epoch": 0.94, "learning_rate": 2.807995340353031e-06, "loss": 2.3318, "step": 541230 }, { "epoch": 0.94, "learning_rate": 2.8071234004262045e-06, "loss": 2.1943, "step": 541240 }, { "epoch": 0.94, "learning_rate": 2.8062514604993774e-06, "loss": 2.3491, "step": 541250 }, { "epoch": 0.94, "learning_rate": 2.8053795205725508e-06, "loss": 2.1221, "step": 541260 }, { "epoch": 0.94, "learning_rate": 2.8045075806457237e-06, "loss": 2.2213, "step": 541270 }, { "epoch": 0.94, "learning_rate": 2.8036356407188974e-06, "loss": 2.1274, "step": 541280 }, { "epoch": 0.94, "learning_rate": 2.8027637007920704e-06, "loss": 2.2496, "step": 541290 }, { "epoch": 0.94, "learning_rate": 2.8018917608652437e-06, "loss": 2.2521, "step": 541300 }, { "epoch": 0.94, "learning_rate": 2.8010198209384166e-06, "loss": 2.3243, "step": 541310 }, { "epoch": 0.94, "learning_rate": 2.80014788101159e-06, "loss": 2.2248, "step": 541320 }, { "epoch": 0.94, "learning_rate": 2.799275941084763e-06, "loss": 2.2542, "step": 541330 }, { "epoch": 0.94, "learning_rate": 2.7984040011579363e-06, "loss": 2.3226, "step": 541340 }, { "epoch": 0.94, "learning_rate": 2.7975320612311096e-06, "loss": 2.2503, "step": 541350 }, { "epoch": 0.94, "learning_rate": 2.796660121304283e-06, "loss": 2.2996, "step": 541360 }, { "epoch": 0.94, "learning_rate": 2.795788181377456e-06, "loss": 2.295, "step": 541370 }, { "epoch": 0.94, "learning_rate": 2.7949162414506292e-06, "loss": 2.2106, "step": 541380 }, { "epoch": 0.94, "learning_rate": 2.794044301523802e-06, "loss": 2.3409, "step": 541390 }, { "epoch": 0.94, "learning_rate": 2.7931723615969755e-06, "loss": 2.2292, "step": 541400 }, { "epoch": 0.94, "learning_rate": 2.7923004216701484e-06, "loss": 2.2278, "step": 541410 }, { "epoch": 0.94, "learning_rate": 2.791428481743322e-06, "loss": 2.2276, "step": 541420 }, { "epoch": 0.94, "learning_rate": 2.790556541816495e-06, "loss": 2.263, "step": 541430 }, { "epoch": 0.94, "learning_rate": 2.7896846018896684e-06, "loss": 2.2881, "step": 541440 }, { "epoch": 0.94, "learning_rate": 2.7888126619628414e-06, "loss": 2.1251, "step": 541450 }, { "epoch": 0.94, "learning_rate": 2.7879407220360147e-06, "loss": 2.3008, "step": 541460 }, { "epoch": 0.94, "learning_rate": 2.7870687821091876e-06, "loss": 2.342, "step": 541470 }, { "epoch": 0.94, "learning_rate": 2.7861968421823614e-06, "loss": 2.2441, "step": 541480 }, { "epoch": 0.94, "learning_rate": 2.7853249022555343e-06, "loss": 2.3613, "step": 541490 }, { "epoch": 0.94, "learning_rate": 2.7844529623287077e-06, "loss": 2.1987, "step": 541500 }, { "epoch": 0.94, "learning_rate": 2.7835810224018806e-06, "loss": 2.2505, "step": 541510 }, { "epoch": 0.94, "learning_rate": 2.782709082475054e-06, "loss": 2.2227, "step": 541520 }, { "epoch": 0.94, "learning_rate": 2.781837142548227e-06, "loss": 2.3024, "step": 541530 }, { "epoch": 0.94, "learning_rate": 2.7809652026214002e-06, "loss": 2.2036, "step": 541540 }, { "epoch": 0.94, "learning_rate": 2.7800932626945736e-06, "loss": 2.304, "step": 541550 }, { "epoch": 0.94, "learning_rate": 2.779221322767747e-06, "loss": 2.321, "step": 541560 }, { "epoch": 0.94, "learning_rate": 2.77834938284092e-06, "loss": 2.3093, "step": 541570 }, { "epoch": 0.94, "learning_rate": 2.777477442914093e-06, "loss": 2.2561, "step": 541580 }, { "epoch": 0.94, "learning_rate": 2.776605502987266e-06, "loss": 2.3034, "step": 541590 }, { "epoch": 0.94, "learning_rate": 2.7757335630604394e-06, "loss": 2.1889, "step": 541600 }, { "epoch": 0.94, "learning_rate": 2.774861623133613e-06, "loss": 2.1813, "step": 541610 }, { "epoch": 0.94, "learning_rate": 2.773989683206786e-06, "loss": 2.2896, "step": 541620 }, { "epoch": 0.94, "learning_rate": 2.773117743279959e-06, "loss": 2.3173, "step": 541630 }, { "epoch": 0.94, "learning_rate": 2.7722458033531324e-06, "loss": 2.1663, "step": 541640 }, { "epoch": 0.94, "learning_rate": 2.7713738634263053e-06, "loss": 2.263, "step": 541650 }, { "epoch": 0.94, "learning_rate": 2.7705019234994787e-06, "loss": 2.2263, "step": 541660 }, { "epoch": 0.94, "learning_rate": 2.7696299835726516e-06, "loss": 2.1989, "step": 541670 }, { "epoch": 0.94, "learning_rate": 2.7687580436458254e-06, "loss": 2.2914, "step": 541680 }, { "epoch": 0.94, "learning_rate": 2.7678861037189983e-06, "loss": 2.3203, "step": 541690 }, { "epoch": 0.94, "learning_rate": 2.7670141637921716e-06, "loss": 2.3471, "step": 541700 }, { "epoch": 0.94, "learning_rate": 2.7661422238653446e-06, "loss": 2.3099, "step": 541710 }, { "epoch": 0.94, "learning_rate": 2.765270283938518e-06, "loss": 2.1245, "step": 541720 }, { "epoch": 0.94, "learning_rate": 2.764398344011691e-06, "loss": 2.2202, "step": 541730 }, { "epoch": 0.94, "learning_rate": 2.763526404084864e-06, "loss": 2.2339, "step": 541740 }, { "epoch": 0.94, "learning_rate": 2.7626544641580375e-06, "loss": 2.2455, "step": 541750 }, { "epoch": 0.94, "learning_rate": 2.761782524231211e-06, "loss": 2.1982, "step": 541760 }, { "epoch": 0.94, "learning_rate": 2.760910584304384e-06, "loss": 2.3577, "step": 541770 }, { "epoch": 0.94, "learning_rate": 2.760038644377557e-06, "loss": 2.2907, "step": 541780 }, { "epoch": 0.94, "learning_rate": 2.75916670445073e-06, "loss": 2.2584, "step": 541790 }, { "epoch": 0.94, "learning_rate": 2.7582947645239034e-06, "loss": 2.2408, "step": 541800 }, { "epoch": 0.94, "learning_rate": 2.7574228245970768e-06, "loss": 2.2726, "step": 541810 }, { "epoch": 0.94, "learning_rate": 2.75655088467025e-06, "loss": 2.3176, "step": 541820 }, { "epoch": 0.94, "learning_rate": 2.755678944743423e-06, "loss": 2.4122, "step": 541830 }, { "epoch": 0.94, "learning_rate": 2.7548070048165964e-06, "loss": 2.2176, "step": 541840 }, { "epoch": 0.94, "learning_rate": 2.7539350648897693e-06, "loss": 2.3301, "step": 541850 }, { "epoch": 0.94, "learning_rate": 2.7530631249629426e-06, "loss": 2.1891, "step": 541860 }, { "epoch": 0.94, "learning_rate": 2.7521911850361156e-06, "loss": 2.2989, "step": 541870 }, { "epoch": 0.94, "learning_rate": 2.7513192451092893e-06, "loss": 2.2439, "step": 541880 }, { "epoch": 0.94, "learning_rate": 2.7504473051824623e-06, "loss": 2.2117, "step": 541890 }, { "epoch": 0.95, "learning_rate": 2.7495753652556356e-06, "loss": 2.1015, "step": 541900 }, { "epoch": 0.95, "learning_rate": 2.7487034253288085e-06, "loss": 2.2446, "step": 541910 }, { "epoch": 0.95, "learning_rate": 2.747831485401982e-06, "loss": 2.3763, "step": 541920 }, { "epoch": 0.95, "learning_rate": 2.746959545475155e-06, "loss": 2.2387, "step": 541930 }, { "epoch": 0.95, "learning_rate": 2.746087605548328e-06, "loss": 2.2434, "step": 541940 }, { "epoch": 0.95, "learning_rate": 2.7452156656215015e-06, "loss": 2.2584, "step": 541950 }, { "epoch": 0.95, "learning_rate": 2.744343725694675e-06, "loss": 2.2054, "step": 541960 }, { "epoch": 0.95, "learning_rate": 2.7434717857678478e-06, "loss": 2.2764, "step": 541970 }, { "epoch": 0.95, "learning_rate": 2.742599845841021e-06, "loss": 2.1751, "step": 541980 }, { "epoch": 0.95, "learning_rate": 2.741727905914194e-06, "loss": 2.2874, "step": 541990 }, { "epoch": 0.95, "learning_rate": 2.7408559659873674e-06, "loss": 2.2982, "step": 542000 }, { "epoch": 0.95, "learning_rate": 2.7399840260605407e-06, "loss": 2.1865, "step": 542010 }, { "epoch": 0.95, "learning_rate": 2.739112086133714e-06, "loss": 2.231, "step": 542020 }, { "epoch": 0.95, "learning_rate": 2.738240146206887e-06, "loss": 2.2745, "step": 542030 }, { "epoch": 0.95, "learning_rate": 2.7373682062800603e-06, "loss": 2.2183, "step": 542040 }, { "epoch": 0.95, "learning_rate": 2.7364962663532333e-06, "loss": 2.293, "step": 542050 }, { "epoch": 0.95, "learning_rate": 2.7356243264264066e-06, "loss": 2.2182, "step": 542060 }, { "epoch": 0.95, "learning_rate": 2.7347523864995795e-06, "loss": 2.2624, "step": 542070 }, { "epoch": 0.95, "learning_rate": 2.7338804465727533e-06, "loss": 2.2767, "step": 542080 }, { "epoch": 0.95, "learning_rate": 2.7330085066459262e-06, "loss": 2.1843, "step": 542090 }, { "epoch": 0.95, "learning_rate": 2.7321365667190996e-06, "loss": 2.2788, "step": 542100 }, { "epoch": 0.95, "learning_rate": 2.7312646267922725e-06, "loss": 2.4059, "step": 542110 }, { "epoch": 0.95, "learning_rate": 2.730392686865446e-06, "loss": 2.3118, "step": 542120 }, { "epoch": 0.95, "learning_rate": 2.7295207469386188e-06, "loss": 2.287, "step": 542130 }, { "epoch": 0.95, "learning_rate": 2.728648807011792e-06, "loss": 2.2732, "step": 542140 }, { "epoch": 0.95, "learning_rate": 2.7277768670849655e-06, "loss": 2.1569, "step": 542150 }, { "epoch": 0.95, "learning_rate": 2.726904927158139e-06, "loss": 2.3242, "step": 542160 }, { "epoch": 0.95, "learning_rate": 2.7260329872313117e-06, "loss": 2.2388, "step": 542170 }, { "epoch": 0.95, "learning_rate": 2.725161047304485e-06, "loss": 2.2865, "step": 542180 }, { "epoch": 0.95, "learning_rate": 2.724289107377658e-06, "loss": 2.3761, "step": 542190 }, { "epoch": 0.95, "learning_rate": 2.7234171674508313e-06, "loss": 2.3591, "step": 542200 }, { "epoch": 0.95, "learning_rate": 2.7225452275240047e-06, "loss": 2.2767, "step": 542210 }, { "epoch": 0.95, "learning_rate": 2.721673287597178e-06, "loss": 2.2714, "step": 542220 }, { "epoch": 0.95, "learning_rate": 2.720801347670351e-06, "loss": 2.1954, "step": 542230 }, { "epoch": 0.95, "learning_rate": 2.7199294077435243e-06, "loss": 2.2514, "step": 542240 }, { "epoch": 0.95, "learning_rate": 2.7190574678166972e-06, "loss": 2.2663, "step": 542250 }, { "epoch": 0.95, "learning_rate": 2.7181855278898706e-06, "loss": 2.2491, "step": 542260 }, { "epoch": 0.95, "learning_rate": 2.7173135879630435e-06, "loss": 2.3274, "step": 542270 }, { "epoch": 0.95, "learning_rate": 2.7164416480362173e-06, "loss": 2.1346, "step": 542280 }, { "epoch": 0.95, "learning_rate": 2.71556970810939e-06, "loss": 2.2683, "step": 542290 }, { "epoch": 0.95, "learning_rate": 2.7146977681825635e-06, "loss": 2.3552, "step": 542300 }, { "epoch": 0.95, "learning_rate": 2.7138258282557365e-06, "loss": 2.2762, "step": 542310 }, { "epoch": 0.95, "learning_rate": 2.71295388832891e-06, "loss": 2.3246, "step": 542320 }, { "epoch": 0.95, "learning_rate": 2.7120819484020827e-06, "loss": 2.328, "step": 542330 }, { "epoch": 0.95, "learning_rate": 2.711210008475256e-06, "loss": 2.3488, "step": 542340 }, { "epoch": 0.95, "learning_rate": 2.7103380685484294e-06, "loss": 2.1645, "step": 542350 }, { "epoch": 0.95, "learning_rate": 2.7094661286216028e-06, "loss": 2.2161, "step": 542360 }, { "epoch": 0.95, "learning_rate": 2.7085941886947757e-06, "loss": 2.3565, "step": 542370 }, { "epoch": 0.95, "learning_rate": 2.707722248767949e-06, "loss": 2.314, "step": 542380 }, { "epoch": 0.95, "learning_rate": 2.706850308841122e-06, "loss": 2.203, "step": 542390 }, { "epoch": 0.95, "learning_rate": 2.7059783689142953e-06, "loss": 2.27, "step": 542400 }, { "epoch": 0.95, "learning_rate": 2.7051064289874686e-06, "loss": 2.0449, "step": 542410 }, { "epoch": 0.95, "learning_rate": 2.704234489060642e-06, "loss": 2.2567, "step": 542420 }, { "epoch": 0.95, "learning_rate": 2.703362549133815e-06, "loss": 2.192, "step": 542430 }, { "epoch": 0.95, "learning_rate": 2.7024906092069883e-06, "loss": 2.2177, "step": 542440 }, { "epoch": 0.95, "learning_rate": 2.701618669280161e-06, "loss": 2.2, "step": 542450 }, { "epoch": 0.95, "learning_rate": 2.7007467293533345e-06, "loss": 2.2507, "step": 542460 }, { "epoch": 0.95, "learning_rate": 2.6998747894265075e-06, "loss": 2.3072, "step": 542470 }, { "epoch": 0.95, "learning_rate": 2.6990028494996812e-06, "loss": 2.2949, "step": 542480 }, { "epoch": 0.95, "learning_rate": 2.698130909572854e-06, "loss": 2.3034, "step": 542490 }, { "epoch": 0.95, "learning_rate": 2.6972589696460275e-06, "loss": 2.3105, "step": 542500 }, { "epoch": 0.95, "learning_rate": 2.6963870297192004e-06, "loss": 2.1524, "step": 542510 }, { "epoch": 0.95, "learning_rate": 2.6955150897923738e-06, "loss": 2.2648, "step": 542520 }, { "epoch": 0.95, "learning_rate": 2.6946431498655467e-06, "loss": 2.1524, "step": 542530 }, { "epoch": 0.95, "learning_rate": 2.69377120993872e-06, "loss": 2.3211, "step": 542540 }, { "epoch": 0.95, "learning_rate": 2.6928992700118934e-06, "loss": 2.2292, "step": 542550 }, { "epoch": 0.95, "learning_rate": 2.6920273300850667e-06, "loss": 2.1146, "step": 542560 }, { "epoch": 0.95, "learning_rate": 2.6911553901582396e-06, "loss": 2.2195, "step": 542570 }, { "epoch": 0.95, "learning_rate": 2.690283450231413e-06, "loss": 2.3257, "step": 542580 }, { "epoch": 0.95, "learning_rate": 2.689411510304586e-06, "loss": 2.19, "step": 542590 }, { "epoch": 0.95, "learning_rate": 2.6885395703777593e-06, "loss": 2.3293, "step": 542600 }, { "epoch": 0.95, "learning_rate": 2.6876676304509326e-06, "loss": 2.2646, "step": 542610 }, { "epoch": 0.95, "learning_rate": 2.686795690524106e-06, "loss": 2.3193, "step": 542620 }, { "epoch": 0.95, "learning_rate": 2.685923750597279e-06, "loss": 2.2391, "step": 542630 }, { "epoch": 0.95, "learning_rate": 2.6850518106704522e-06, "loss": 2.2322, "step": 542640 }, { "epoch": 0.95, "learning_rate": 2.684179870743625e-06, "loss": 2.2417, "step": 542650 }, { "epoch": 0.95, "learning_rate": 2.6833079308167985e-06, "loss": 2.1089, "step": 542660 }, { "epoch": 0.95, "learning_rate": 2.6824359908899714e-06, "loss": 2.1256, "step": 542670 }, { "epoch": 0.95, "learning_rate": 2.681564050963145e-06, "loss": 2.2517, "step": 542680 }, { "epoch": 0.95, "learning_rate": 2.680692111036318e-06, "loss": 2.1697, "step": 542690 }, { "epoch": 0.95, "learning_rate": 2.6798201711094915e-06, "loss": 2.338, "step": 542700 }, { "epoch": 0.95, "learning_rate": 2.6789482311826644e-06, "loss": 2.3024, "step": 542710 }, { "epoch": 0.95, "learning_rate": 2.6780762912558377e-06, "loss": 2.2246, "step": 542720 }, { "epoch": 0.95, "learning_rate": 2.6772043513290107e-06, "loss": 2.313, "step": 542730 }, { "epoch": 0.95, "learning_rate": 2.676332411402184e-06, "loss": 2.1964, "step": 542740 }, { "epoch": 0.95, "learning_rate": 2.6754604714753573e-06, "loss": 2.2752, "step": 542750 }, { "epoch": 0.95, "learning_rate": 2.6745885315485307e-06, "loss": 2.2693, "step": 542760 }, { "epoch": 0.95, "learning_rate": 2.6737165916217036e-06, "loss": 2.1416, "step": 542770 }, { "epoch": 0.95, "learning_rate": 2.672844651694877e-06, "loss": 2.2308, "step": 542780 }, { "epoch": 0.95, "learning_rate": 2.67197271176805e-06, "loss": 2.1081, "step": 542790 }, { "epoch": 0.95, "learning_rate": 2.6711007718412232e-06, "loss": 2.1882, "step": 542800 }, { "epoch": 0.95, "learning_rate": 2.6702288319143966e-06, "loss": 2.2281, "step": 542810 }, { "epoch": 0.95, "learning_rate": 2.66935689198757e-06, "loss": 2.1907, "step": 542820 }, { "epoch": 0.95, "learning_rate": 2.668484952060743e-06, "loss": 2.2475, "step": 542830 }, { "epoch": 0.95, "learning_rate": 2.667613012133916e-06, "loss": 2.2082, "step": 542840 }, { "epoch": 0.95, "learning_rate": 2.666741072207089e-06, "loss": 2.31, "step": 542850 }, { "epoch": 0.95, "learning_rate": 2.6658691322802625e-06, "loss": 2.2796, "step": 542860 }, { "epoch": 0.95, "learning_rate": 2.6649971923534354e-06, "loss": 2.3255, "step": 542870 }, { "epoch": 0.95, "learning_rate": 2.664125252426609e-06, "loss": 2.2165, "step": 542880 }, { "epoch": 0.95, "learning_rate": 2.663253312499782e-06, "loss": 2.2226, "step": 542890 }, { "epoch": 0.95, "learning_rate": 2.6623813725729554e-06, "loss": 2.353, "step": 542900 }, { "epoch": 0.95, "learning_rate": 2.6615094326461283e-06, "loss": 2.2204, "step": 542910 }, { "epoch": 0.95, "learning_rate": 2.6606374927193017e-06, "loss": 2.2835, "step": 542920 }, { "epoch": 0.95, "learning_rate": 2.6597655527924746e-06, "loss": 2.282, "step": 542930 }, { "epoch": 0.95, "learning_rate": 2.6588936128656484e-06, "loss": 2.1742, "step": 542940 }, { "epoch": 0.95, "learning_rate": 2.6580216729388213e-06, "loss": 2.2272, "step": 542950 }, { "epoch": 0.95, "learning_rate": 2.6571497330119947e-06, "loss": 2.2137, "step": 542960 }, { "epoch": 0.95, "learning_rate": 2.6562777930851676e-06, "loss": 2.3083, "step": 542970 }, { "epoch": 0.95, "learning_rate": 2.655405853158341e-06, "loss": 2.163, "step": 542980 }, { "epoch": 0.95, "learning_rate": 2.654533913231514e-06, "loss": 2.2642, "step": 542990 }, { "epoch": 0.95, "learning_rate": 2.653661973304687e-06, "loss": 2.2568, "step": 543000 }, { "epoch": 0.95, "learning_rate": 2.6527900333778605e-06, "loss": 2.2644, "step": 543010 }, { "epoch": 0.95, "learning_rate": 2.651918093451034e-06, "loss": 2.1923, "step": 543020 }, { "epoch": 0.95, "learning_rate": 2.651046153524207e-06, "loss": 2.2127, "step": 543030 }, { "epoch": 0.95, "learning_rate": 2.65017421359738e-06, "loss": 2.2218, "step": 543040 }, { "epoch": 0.95, "learning_rate": 2.649302273670553e-06, "loss": 2.0549, "step": 543050 }, { "epoch": 0.95, "learning_rate": 2.6484303337437264e-06, "loss": 2.3251, "step": 543060 }, { "epoch": 0.95, "learning_rate": 2.6475583938168998e-06, "loss": 2.2968, "step": 543070 }, { "epoch": 0.95, "learning_rate": 2.646686453890073e-06, "loss": 2.2509, "step": 543080 }, { "epoch": 0.95, "learning_rate": 2.645814513963246e-06, "loss": 2.3343, "step": 543090 }, { "epoch": 0.95, "learning_rate": 2.6449425740364194e-06, "loss": 2.2422, "step": 543100 }, { "epoch": 0.95, "learning_rate": 2.6440706341095923e-06, "loss": 2.2182, "step": 543110 }, { "epoch": 0.95, "learning_rate": 2.6431986941827657e-06, "loss": 2.3742, "step": 543120 }, { "epoch": 0.95, "learning_rate": 2.6423267542559386e-06, "loss": 2.3237, "step": 543130 }, { "epoch": 0.95, "learning_rate": 2.6414548143291123e-06, "loss": 2.2463, "step": 543140 }, { "epoch": 0.95, "learning_rate": 2.6405828744022853e-06, "loss": 2.2592, "step": 543150 }, { "epoch": 0.95, "learning_rate": 2.6397109344754586e-06, "loss": 2.3101, "step": 543160 }, { "epoch": 0.95, "learning_rate": 2.6388389945486315e-06, "loss": 2.2334, "step": 543170 }, { "epoch": 0.95, "learning_rate": 2.637967054621805e-06, "loss": 2.2268, "step": 543180 }, { "epoch": 0.95, "learning_rate": 2.637095114694978e-06, "loss": 2.1403, "step": 543190 }, { "epoch": 0.95, "learning_rate": 2.636223174768151e-06, "loss": 2.2605, "step": 543200 }, { "epoch": 0.95, "learning_rate": 2.6353512348413245e-06, "loss": 2.2981, "step": 543210 }, { "epoch": 0.95, "learning_rate": 2.634479294914498e-06, "loss": 2.3147, "step": 543220 }, { "epoch": 0.95, "learning_rate": 2.6336073549876708e-06, "loss": 2.3118, "step": 543230 }, { "epoch": 0.95, "learning_rate": 2.632735415060844e-06, "loss": 2.1757, "step": 543240 }, { "epoch": 0.95, "learning_rate": 2.631863475134017e-06, "loss": 2.3479, "step": 543250 }, { "epoch": 0.95, "learning_rate": 2.6309915352071904e-06, "loss": 2.2171, "step": 543260 }, { "epoch": 0.95, "learning_rate": 2.6301195952803637e-06, "loss": 2.3316, "step": 543270 }, { "epoch": 0.95, "learning_rate": 2.629247655353537e-06, "loss": 2.2638, "step": 543280 }, { "epoch": 0.95, "learning_rate": 2.62837571542671e-06, "loss": 2.1645, "step": 543290 }, { "epoch": 0.95, "learning_rate": 2.6275037754998833e-06, "loss": 2.2728, "step": 543300 }, { "epoch": 0.95, "learning_rate": 2.6266318355730563e-06, "loss": 2.2189, "step": 543310 }, { "epoch": 0.95, "learning_rate": 2.6257598956462296e-06, "loss": 2.1662, "step": 543320 }, { "epoch": 0.95, "learning_rate": 2.624887955719403e-06, "loss": 2.3045, "step": 543330 }, { "epoch": 0.95, "learning_rate": 2.6240160157925763e-06, "loss": 2.0843, "step": 543340 }, { "epoch": 0.95, "learning_rate": 2.6231440758657492e-06, "loss": 2.2851, "step": 543350 }, { "epoch": 0.95, "learning_rate": 2.6222721359389226e-06, "loss": 2.1663, "step": 543360 }, { "epoch": 0.95, "learning_rate": 2.6214001960120955e-06, "loss": 2.2716, "step": 543370 }, { "epoch": 0.95, "learning_rate": 2.620528256085269e-06, "loss": 2.1842, "step": 543380 }, { "epoch": 0.95, "learning_rate": 2.6196563161584418e-06, "loss": 2.2985, "step": 543390 }, { "epoch": 0.95, "learning_rate": 2.618784376231615e-06, "loss": 2.2749, "step": 543400 }, { "epoch": 0.95, "learning_rate": 2.6179124363047885e-06, "loss": 2.3029, "step": 543410 }, { "epoch": 0.95, "learning_rate": 2.617040496377962e-06, "loss": 2.2788, "step": 543420 }, { "epoch": 0.95, "learning_rate": 2.6161685564511347e-06, "loss": 2.3096, "step": 543430 }, { "epoch": 0.95, "learning_rate": 2.615296616524308e-06, "loss": 2.1936, "step": 543440 }, { "epoch": 0.95, "learning_rate": 2.614424676597481e-06, "loss": 2.2127, "step": 543450 }, { "epoch": 0.95, "learning_rate": 2.6135527366706543e-06, "loss": 2.2605, "step": 543460 }, { "epoch": 0.95, "learning_rate": 2.6126807967438277e-06, "loss": 2.2964, "step": 543470 }, { "epoch": 0.95, "learning_rate": 2.611808856817001e-06, "loss": 2.3369, "step": 543480 }, { "epoch": 0.95, "learning_rate": 2.610936916890174e-06, "loss": 2.155, "step": 543490 }, { "epoch": 0.95, "learning_rate": 2.6100649769633473e-06, "loss": 2.3023, "step": 543500 }, { "epoch": 0.95, "learning_rate": 2.6091930370365202e-06, "loss": 2.2857, "step": 543510 }, { "epoch": 0.95, "learning_rate": 2.6083210971096936e-06, "loss": 2.19, "step": 543520 }, { "epoch": 0.95, "learning_rate": 2.607449157182867e-06, "loss": 2.3202, "step": 543530 }, { "epoch": 0.95, "learning_rate": 2.6065772172560403e-06, "loss": 2.1464, "step": 543540 }, { "epoch": 0.95, "learning_rate": 2.605705277329213e-06, "loss": 2.0498, "step": 543550 }, { "epoch": 0.95, "learning_rate": 2.6048333374023865e-06, "loss": 2.3068, "step": 543560 }, { "epoch": 0.95, "learning_rate": 2.6039613974755595e-06, "loss": 2.3308, "step": 543570 }, { "epoch": 0.95, "learning_rate": 2.603089457548733e-06, "loss": 2.2498, "step": 543580 }, { "epoch": 0.95, "learning_rate": 2.602217517621906e-06, "loss": 2.2576, "step": 543590 }, { "epoch": 0.95, "learning_rate": 2.601345577695079e-06, "loss": 2.1605, "step": 543600 }, { "epoch": 0.95, "learning_rate": 2.6004736377682524e-06, "loss": 2.2711, "step": 543610 }, { "epoch": 0.95, "learning_rate": 2.5996016978414258e-06, "loss": 2.2722, "step": 543620 }, { "epoch": 0.95, "learning_rate": 2.5987297579145987e-06, "loss": 2.2055, "step": 543630 }, { "epoch": 0.95, "learning_rate": 2.597857817987772e-06, "loss": 2.1815, "step": 543640 }, { "epoch": 0.95, "learning_rate": 2.596985878060945e-06, "loss": 2.3642, "step": 543650 }, { "epoch": 0.95, "learning_rate": 2.5961139381341183e-06, "loss": 2.2899, "step": 543660 }, { "epoch": 0.95, "learning_rate": 2.5952419982072917e-06, "loss": 2.1949, "step": 543670 }, { "epoch": 0.95, "learning_rate": 2.594370058280465e-06, "loss": 2.269, "step": 543680 }, { "epoch": 0.95, "learning_rate": 2.593498118353638e-06, "loss": 2.2939, "step": 543690 }, { "epoch": 0.95, "learning_rate": 2.5926261784268113e-06, "loss": 2.3265, "step": 543700 }, { "epoch": 0.95, "learning_rate": 2.591754238499984e-06, "loss": 2.28, "step": 543710 }, { "epoch": 0.95, "learning_rate": 2.5908822985731575e-06, "loss": 2.119, "step": 543720 }, { "epoch": 0.95, "learning_rate": 2.590010358646331e-06, "loss": 2.4113, "step": 543730 }, { "epoch": 0.95, "learning_rate": 2.5891384187195042e-06, "loss": 2.2507, "step": 543740 }, { "epoch": 0.95, "learning_rate": 2.588266478792677e-06, "loss": 2.1589, "step": 543750 }, { "epoch": 0.95, "learning_rate": 2.5873945388658505e-06, "loss": 2.2475, "step": 543760 }, { "epoch": 0.95, "learning_rate": 2.5865225989390234e-06, "loss": 2.2911, "step": 543770 }, { "epoch": 0.95, "learning_rate": 2.5856506590121968e-06, "loss": 2.2108, "step": 543780 }, { "epoch": 0.95, "learning_rate": 2.58477871908537e-06, "loss": 2.346, "step": 543790 }, { "epoch": 0.95, "learning_rate": 2.583906779158543e-06, "loss": 2.1875, "step": 543800 }, { "epoch": 0.95, "learning_rate": 2.5830348392317164e-06, "loss": 2.2479, "step": 543810 }, { "epoch": 0.95, "learning_rate": 2.5821628993048897e-06, "loss": 2.3395, "step": 543820 }, { "epoch": 0.95, "learning_rate": 2.5812909593780627e-06, "loss": 2.2599, "step": 543830 }, { "epoch": 0.95, "learning_rate": 2.580419019451236e-06, "loss": 2.2114, "step": 543840 }, { "epoch": 0.95, "learning_rate": 2.5795470795244094e-06, "loss": 2.1499, "step": 543850 }, { "epoch": 0.95, "learning_rate": 2.5786751395975823e-06, "loss": 2.2229, "step": 543860 }, { "epoch": 0.95, "learning_rate": 2.5778031996707556e-06, "loss": 2.269, "step": 543870 }, { "epoch": 0.95, "learning_rate": 2.576931259743929e-06, "loss": 2.1191, "step": 543880 }, { "epoch": 0.95, "learning_rate": 2.576059319817102e-06, "loss": 2.3093, "step": 543890 }, { "epoch": 0.95, "learning_rate": 2.5751873798902752e-06, "loss": 2.3097, "step": 543900 }, { "epoch": 0.95, "learning_rate": 2.574315439963448e-06, "loss": 2.2516, "step": 543910 }, { "epoch": 0.95, "learning_rate": 2.5734435000366215e-06, "loss": 2.2993, "step": 543920 }, { "epoch": 0.95, "learning_rate": 2.572571560109795e-06, "loss": 2.235, "step": 543930 }, { "epoch": 0.95, "learning_rate": 2.571699620182968e-06, "loss": 2.1701, "step": 543940 }, { "epoch": 0.95, "learning_rate": 2.570827680256141e-06, "loss": 2.297, "step": 543950 }, { "epoch": 0.95, "learning_rate": 2.5699557403293145e-06, "loss": 2.2669, "step": 543960 }, { "epoch": 0.95, "learning_rate": 2.5690838004024874e-06, "loss": 2.1571, "step": 543970 }, { "epoch": 0.95, "learning_rate": 2.5682118604756607e-06, "loss": 2.2778, "step": 543980 }, { "epoch": 0.95, "learning_rate": 2.567339920548834e-06, "loss": 2.3698, "step": 543990 }, { "epoch": 0.95, "learning_rate": 2.566467980622007e-06, "loss": 2.1493, "step": 544000 }, { "epoch": 0.95, "learning_rate": 2.5655960406951804e-06, "loss": 2.2864, "step": 544010 }, { "epoch": 0.95, "learning_rate": 2.5647241007683537e-06, "loss": 2.2517, "step": 544020 }, { "epoch": 0.95, "learning_rate": 2.5638521608415266e-06, "loss": 2.3508, "step": 544030 }, { "epoch": 0.95, "learning_rate": 2.5629802209147e-06, "loss": 2.1819, "step": 544040 }, { "epoch": 0.95, "learning_rate": 2.5621082809878733e-06, "loss": 2.1974, "step": 544050 }, { "epoch": 0.95, "learning_rate": 2.5612363410610462e-06, "loss": 2.2557, "step": 544060 }, { "epoch": 0.95, "learning_rate": 2.5603644011342196e-06, "loss": 2.1219, "step": 544070 }, { "epoch": 0.95, "learning_rate": 2.559492461207393e-06, "loss": 2.216, "step": 544080 }, { "epoch": 0.95, "learning_rate": 2.558620521280566e-06, "loss": 2.2217, "step": 544090 }, { "epoch": 0.95, "learning_rate": 2.557748581353739e-06, "loss": 2.2263, "step": 544100 }, { "epoch": 0.95, "learning_rate": 2.5568766414269125e-06, "loss": 2.2696, "step": 544110 }, { "epoch": 0.95, "learning_rate": 2.5560047015000855e-06, "loss": 2.2584, "step": 544120 }, { "epoch": 0.95, "learning_rate": 2.555132761573259e-06, "loss": 2.281, "step": 544130 }, { "epoch": 0.95, "learning_rate": 2.554260821646432e-06, "loss": 2.3413, "step": 544140 }, { "epoch": 0.95, "learning_rate": 2.553388881719605e-06, "loss": 2.2642, "step": 544150 }, { "epoch": 0.95, "learning_rate": 2.5525169417927784e-06, "loss": 2.3207, "step": 544160 }, { "epoch": 0.95, "learning_rate": 2.5516450018659518e-06, "loss": 2.2741, "step": 544170 }, { "epoch": 0.95, "learning_rate": 2.5507730619391247e-06, "loss": 2.272, "step": 544180 }, { "epoch": 0.95, "learning_rate": 2.549901122012298e-06, "loss": 2.2075, "step": 544190 }, { "epoch": 0.95, "learning_rate": 2.549029182085471e-06, "loss": 2.3438, "step": 544200 }, { "epoch": 0.95, "learning_rate": 2.5481572421586443e-06, "loss": 2.2739, "step": 544210 }, { "epoch": 0.95, "learning_rate": 2.5472853022318177e-06, "loss": 2.326, "step": 544220 }, { "epoch": 0.95, "learning_rate": 2.5464133623049906e-06, "loss": 2.2058, "step": 544230 }, { "epoch": 0.95, "learning_rate": 2.545541422378164e-06, "loss": 2.2055, "step": 544240 }, { "epoch": 0.95, "learning_rate": 2.5446694824513373e-06, "loss": 2.2434, "step": 544250 }, { "epoch": 0.95, "learning_rate": 2.54379754252451e-06, "loss": 2.1337, "step": 544260 }, { "epoch": 0.95, "learning_rate": 2.5429256025976835e-06, "loss": 2.2736, "step": 544270 }, { "epoch": 0.95, "learning_rate": 2.542053662670857e-06, "loss": 2.2926, "step": 544280 }, { "epoch": 0.95, "learning_rate": 2.54118172274403e-06, "loss": 2.2843, "step": 544290 }, { "epoch": 0.95, "learning_rate": 2.540309782817203e-06, "loss": 2.3947, "step": 544300 }, { "epoch": 0.95, "learning_rate": 2.5394378428903765e-06, "loss": 2.2809, "step": 544310 }, { "epoch": 0.95, "learning_rate": 2.5385659029635494e-06, "loss": 2.2993, "step": 544320 }, { "epoch": 0.95, "learning_rate": 2.5376939630367228e-06, "loss": 2.2124, "step": 544330 }, { "epoch": 0.95, "learning_rate": 2.536822023109896e-06, "loss": 2.4059, "step": 544340 }, { "epoch": 0.95, "learning_rate": 2.535950083183069e-06, "loss": 2.3454, "step": 544350 }, { "epoch": 0.95, "learning_rate": 2.5350781432562424e-06, "loss": 2.2322, "step": 544360 }, { "epoch": 0.95, "learning_rate": 2.5342062033294157e-06, "loss": 2.2385, "step": 544370 }, { "epoch": 0.95, "learning_rate": 2.5333342634025887e-06, "loss": 2.2068, "step": 544380 }, { "epoch": 0.95, "learning_rate": 2.532462323475762e-06, "loss": 2.2872, "step": 544390 }, { "epoch": 0.95, "learning_rate": 2.531590383548935e-06, "loss": 2.2398, "step": 544400 }, { "epoch": 0.95, "learning_rate": 2.5307184436221083e-06, "loss": 2.1245, "step": 544410 }, { "epoch": 0.95, "learning_rate": 2.5298465036952816e-06, "loss": 2.3552, "step": 544420 }, { "epoch": 0.95, "learning_rate": 2.528974563768455e-06, "loss": 2.2119, "step": 544430 }, { "epoch": 0.95, "learning_rate": 2.528102623841628e-06, "loss": 2.3118, "step": 544440 }, { "epoch": 0.95, "learning_rate": 2.5272306839148012e-06, "loss": 2.2709, "step": 544450 }, { "epoch": 0.95, "learning_rate": 2.526358743987974e-06, "loss": 2.2983, "step": 544460 }, { "epoch": 0.95, "learning_rate": 2.5254868040611475e-06, "loss": 2.2849, "step": 544470 }, { "epoch": 0.95, "learning_rate": 2.524614864134321e-06, "loss": 2.1921, "step": 544480 }, { "epoch": 0.95, "learning_rate": 2.5237429242074938e-06, "loss": 2.2888, "step": 544490 }, { "epoch": 0.95, "learning_rate": 2.522870984280667e-06, "loss": 2.2396, "step": 544500 }, { "epoch": 0.95, "learning_rate": 2.5219990443538405e-06, "loss": 2.1193, "step": 544510 }, { "epoch": 0.95, "learning_rate": 2.5211271044270134e-06, "loss": 2.3253, "step": 544520 }, { "epoch": 0.95, "learning_rate": 2.5202551645001867e-06, "loss": 2.1952, "step": 544530 }, { "epoch": 0.95, "learning_rate": 2.51938322457336e-06, "loss": 2.2469, "step": 544540 }, { "epoch": 0.95, "learning_rate": 2.518511284646533e-06, "loss": 2.2822, "step": 544550 }, { "epoch": 0.95, "learning_rate": 2.5176393447197064e-06, "loss": 2.2287, "step": 544560 }, { "epoch": 0.95, "learning_rate": 2.5167674047928797e-06, "loss": 2.285, "step": 544570 }, { "epoch": 0.95, "learning_rate": 2.5158954648660526e-06, "loss": 2.4004, "step": 544580 }, { "epoch": 0.95, "learning_rate": 2.515023524939226e-06, "loss": 2.27, "step": 544590 }, { "epoch": 0.95, "learning_rate": 2.514151585012399e-06, "loss": 2.2398, "step": 544600 }, { "epoch": 0.95, "learning_rate": 2.5132796450855722e-06, "loss": 2.2618, "step": 544610 }, { "epoch": 0.95, "learning_rate": 2.5124077051587456e-06, "loss": 2.2678, "step": 544620 }, { "epoch": 0.95, "learning_rate": 2.511535765231919e-06, "loss": 2.2477, "step": 544630 }, { "epoch": 0.95, "learning_rate": 2.510663825305092e-06, "loss": 2.2156, "step": 544640 }, { "epoch": 0.95, "learning_rate": 2.509791885378265e-06, "loss": 2.2105, "step": 544650 }, { "epoch": 0.95, "learning_rate": 2.508919945451438e-06, "loss": 2.2446, "step": 544660 }, { "epoch": 0.95, "learning_rate": 2.5080480055246115e-06, "loss": 2.2738, "step": 544670 }, { "epoch": 0.95, "learning_rate": 2.507176065597785e-06, "loss": 2.2045, "step": 544680 }, { "epoch": 0.95, "learning_rate": 2.506304125670958e-06, "loss": 2.2266, "step": 544690 }, { "epoch": 0.95, "learning_rate": 2.505432185744131e-06, "loss": 2.1725, "step": 544700 }, { "epoch": 0.95, "learning_rate": 2.5045602458173044e-06, "loss": 2.2779, "step": 544710 }, { "epoch": 0.95, "learning_rate": 2.5036883058904774e-06, "loss": 2.3916, "step": 544720 }, { "epoch": 0.95, "learning_rate": 2.5028163659636507e-06, "loss": 2.1494, "step": 544730 }, { "epoch": 0.95, "learning_rate": 2.501944426036824e-06, "loss": 2.1204, "step": 544740 }, { "epoch": 0.95, "learning_rate": 2.501072486109997e-06, "loss": 2.2106, "step": 544750 }, { "epoch": 0.95, "learning_rate": 2.5002005461831703e-06, "loss": 2.2678, "step": 544760 }, { "epoch": 0.95, "learning_rate": 2.4993286062563437e-06, "loss": 2.3199, "step": 544770 }, { "epoch": 0.95, "learning_rate": 2.4984566663295166e-06, "loss": 2.1956, "step": 544780 }, { "epoch": 0.95, "learning_rate": 2.49758472640269e-06, "loss": 2.153, "step": 544790 }, { "epoch": 0.95, "learning_rate": 2.496712786475863e-06, "loss": 2.2359, "step": 544800 }, { "epoch": 0.95, "learning_rate": 2.495840846549036e-06, "loss": 2.2833, "step": 544810 }, { "epoch": 0.95, "learning_rate": 2.4949689066222096e-06, "loss": 2.2076, "step": 544820 }, { "epoch": 0.95, "learning_rate": 2.494096966695383e-06, "loss": 2.0867, "step": 544830 }, { "epoch": 0.95, "learning_rate": 2.493225026768556e-06, "loss": 2.2388, "step": 544840 }, { "epoch": 0.95, "learning_rate": 2.492353086841729e-06, "loss": 2.3474, "step": 544850 }, { "epoch": 0.95, "learning_rate": 2.491481146914902e-06, "loss": 2.2093, "step": 544860 }, { "epoch": 0.95, "learning_rate": 2.4906092069880754e-06, "loss": 2.2256, "step": 544870 }, { "epoch": 0.95, "learning_rate": 2.4897372670612488e-06, "loss": 2.2515, "step": 544880 }, { "epoch": 0.95, "learning_rate": 2.488865327134422e-06, "loss": 2.2327, "step": 544890 }, { "epoch": 0.95, "learning_rate": 2.487993387207595e-06, "loss": 2.1421, "step": 544900 }, { "epoch": 0.95, "learning_rate": 2.4871214472807684e-06, "loss": 2.1358, "step": 544910 }, { "epoch": 0.95, "learning_rate": 2.4862495073539413e-06, "loss": 2.2707, "step": 544920 }, { "epoch": 0.95, "learning_rate": 2.4853775674271147e-06, "loss": 2.3101, "step": 544930 }, { "epoch": 0.95, "learning_rate": 2.484505627500288e-06, "loss": 2.3213, "step": 544940 }, { "epoch": 0.95, "learning_rate": 2.4836336875734614e-06, "loss": 2.2114, "step": 544950 }, { "epoch": 0.95, "learning_rate": 2.4827617476466343e-06, "loss": 2.2298, "step": 544960 }, { "epoch": 0.95, "learning_rate": 2.4818898077198076e-06, "loss": 2.1848, "step": 544970 }, { "epoch": 0.95, "learning_rate": 2.4810178677929806e-06, "loss": 2.2756, "step": 544980 }, { "epoch": 0.95, "learning_rate": 2.480145927866154e-06, "loss": 2.2417, "step": 544990 }, { "epoch": 0.95, "learning_rate": 2.479273987939327e-06, "loss": 2.2328, "step": 545000 }, { "epoch": 0.95, "learning_rate": 2.4784020480125e-06, "loss": 2.312, "step": 545010 }, { "epoch": 0.95, "learning_rate": 2.4775301080856735e-06, "loss": 2.3354, "step": 545020 }, { "epoch": 0.95, "learning_rate": 2.476658168158847e-06, "loss": 2.1976, "step": 545030 }, { "epoch": 0.95, "learning_rate": 2.4757862282320198e-06, "loss": 2.2623, "step": 545040 }, { "epoch": 0.95, "learning_rate": 2.474914288305193e-06, "loss": 2.1757, "step": 545050 }, { "epoch": 0.95, "learning_rate": 2.474042348378366e-06, "loss": 2.263, "step": 545060 }, { "epoch": 0.95, "learning_rate": 2.4731704084515394e-06, "loss": 2.1892, "step": 545070 }, { "epoch": 0.95, "learning_rate": 2.4722984685247127e-06, "loss": 2.3593, "step": 545080 }, { "epoch": 0.95, "learning_rate": 2.471426528597886e-06, "loss": 2.3011, "step": 545090 }, { "epoch": 0.95, "learning_rate": 2.470554588671059e-06, "loss": 2.2, "step": 545100 }, { "epoch": 0.95, "learning_rate": 2.4696826487442324e-06, "loss": 2.2158, "step": 545110 }, { "epoch": 0.95, "learning_rate": 2.4688107088174053e-06, "loss": 2.2828, "step": 545120 }, { "epoch": 0.95, "learning_rate": 2.4679387688905786e-06, "loss": 2.2866, "step": 545130 }, { "epoch": 0.95, "learning_rate": 2.467066828963752e-06, "loss": 2.1983, "step": 545140 }, { "epoch": 0.95, "learning_rate": 2.4661948890369253e-06, "loss": 2.2994, "step": 545150 }, { "epoch": 0.95, "learning_rate": 2.4653229491100982e-06, "loss": 2.3157, "step": 545160 }, { "epoch": 0.95, "learning_rate": 2.4644510091832716e-06, "loss": 2.1165, "step": 545170 }, { "epoch": 0.95, "learning_rate": 2.4635790692564445e-06, "loss": 2.2817, "step": 545180 }, { "epoch": 0.95, "learning_rate": 2.462707129329618e-06, "loss": 2.1859, "step": 545190 }, { "epoch": 0.95, "learning_rate": 2.4618351894027908e-06, "loss": 2.3134, "step": 545200 }, { "epoch": 0.95, "learning_rate": 2.4609632494759646e-06, "loss": 2.2209, "step": 545210 }, { "epoch": 0.95, "learning_rate": 2.4600913095491375e-06, "loss": 2.3163, "step": 545220 }, { "epoch": 0.95, "learning_rate": 2.459219369622311e-06, "loss": 2.2983, "step": 545230 }, { "epoch": 0.95, "learning_rate": 2.4583474296954837e-06, "loss": 2.2761, "step": 545240 }, { "epoch": 0.95, "learning_rate": 2.457475489768657e-06, "loss": 2.2094, "step": 545250 }, { "epoch": 0.95, "learning_rate": 2.45660354984183e-06, "loss": 2.108, "step": 545260 }, { "epoch": 0.95, "learning_rate": 2.4557316099150034e-06, "loss": 2.2564, "step": 545270 }, { "epoch": 0.95, "learning_rate": 2.4548596699881767e-06, "loss": 2.2008, "step": 545280 }, { "epoch": 0.95, "learning_rate": 2.45398773006135e-06, "loss": 2.2437, "step": 545290 }, { "epoch": 0.95, "learning_rate": 2.453115790134523e-06, "loss": 2.2615, "step": 545300 }, { "epoch": 0.95, "learning_rate": 2.4522438502076963e-06, "loss": 2.3225, "step": 545310 }, { "epoch": 0.95, "learning_rate": 2.4513719102808692e-06, "loss": 2.2736, "step": 545320 }, { "epoch": 0.95, "learning_rate": 2.4504999703540426e-06, "loss": 2.1832, "step": 545330 }, { "epoch": 0.95, "learning_rate": 2.449628030427216e-06, "loss": 2.2579, "step": 545340 }, { "epoch": 0.95, "learning_rate": 2.4487560905003893e-06, "loss": 2.1994, "step": 545350 }, { "epoch": 0.95, "learning_rate": 2.4478841505735622e-06, "loss": 2.3694, "step": 545360 }, { "epoch": 0.95, "learning_rate": 2.4470122106467356e-06, "loss": 2.2571, "step": 545370 }, { "epoch": 0.95, "learning_rate": 2.4461402707199085e-06, "loss": 2.1509, "step": 545380 }, { "epoch": 0.95, "learning_rate": 2.445268330793082e-06, "loss": 2.2328, "step": 545390 }, { "epoch": 0.95, "learning_rate": 2.4443963908662548e-06, "loss": 2.3319, "step": 545400 }, { "epoch": 0.95, "learning_rate": 2.4435244509394285e-06, "loss": 2.2635, "step": 545410 }, { "epoch": 0.95, "learning_rate": 2.4426525110126014e-06, "loss": 2.2592, "step": 545420 }, { "epoch": 0.95, "learning_rate": 2.441780571085775e-06, "loss": 2.1532, "step": 545430 }, { "epoch": 0.95, "learning_rate": 2.4409086311589477e-06, "loss": 2.2211, "step": 545440 }, { "epoch": 0.95, "learning_rate": 2.440036691232121e-06, "loss": 2.2978, "step": 545450 }, { "epoch": 0.95, "learning_rate": 2.439164751305294e-06, "loss": 2.2862, "step": 545460 }, { "epoch": 0.95, "learning_rate": 2.4382928113784678e-06, "loss": 2.2549, "step": 545470 }, { "epoch": 0.95, "learning_rate": 2.4374208714516407e-06, "loss": 2.2473, "step": 545480 }, { "epoch": 0.95, "learning_rate": 2.436548931524814e-06, "loss": 2.3084, "step": 545490 }, { "epoch": 0.95, "learning_rate": 2.435676991597987e-06, "loss": 2.1976, "step": 545500 }, { "epoch": 0.95, "learning_rate": 2.4348050516711603e-06, "loss": 2.1313, "step": 545510 }, { "epoch": 0.95, "learning_rate": 2.4339331117443332e-06, "loss": 2.2891, "step": 545520 }, { "epoch": 0.95, "learning_rate": 2.4330611718175066e-06, "loss": 2.2785, "step": 545530 }, { "epoch": 0.95, "learning_rate": 2.43218923189068e-06, "loss": 2.2639, "step": 545540 }, { "epoch": 0.95, "learning_rate": 2.4313172919638533e-06, "loss": 2.2013, "step": 545550 }, { "epoch": 0.95, "learning_rate": 2.430445352037026e-06, "loss": 2.3245, "step": 545560 }, { "epoch": 0.95, "learning_rate": 2.4295734121101995e-06, "loss": 2.2147, "step": 545570 }, { "epoch": 0.95, "learning_rate": 2.4287014721833724e-06, "loss": 2.2235, "step": 545580 }, { "epoch": 0.95, "learning_rate": 2.427829532256546e-06, "loss": 2.2633, "step": 545590 }, { "epoch": 0.95, "learning_rate": 2.4269575923297187e-06, "loss": 2.2725, "step": 545600 }, { "epoch": 0.95, "learning_rate": 2.4260856524028925e-06, "loss": 2.2017, "step": 545610 }, { "epoch": 0.95, "learning_rate": 2.4252137124760654e-06, "loss": 2.2619, "step": 545620 }, { "epoch": 0.95, "learning_rate": 2.4243417725492388e-06, "loss": 2.2781, "step": 545630 }, { "epoch": 0.95, "learning_rate": 2.4234698326224117e-06, "loss": 2.3427, "step": 545640 }, { "epoch": 0.95, "learning_rate": 2.422597892695585e-06, "loss": 2.2573, "step": 545650 }, { "epoch": 0.95, "learning_rate": 2.421725952768758e-06, "loss": 2.1072, "step": 545660 }, { "epoch": 0.95, "learning_rate": 2.4208540128419317e-06, "loss": 2.3521, "step": 545670 }, { "epoch": 0.95, "learning_rate": 2.4199820729151046e-06, "loss": 2.1925, "step": 545680 }, { "epoch": 0.95, "learning_rate": 2.419110132988278e-06, "loss": 2.4101, "step": 545690 }, { "epoch": 0.95, "learning_rate": 2.418238193061451e-06, "loss": 2.2786, "step": 545700 }, { "epoch": 0.95, "learning_rate": 2.4173662531346243e-06, "loss": 2.3245, "step": 545710 }, { "epoch": 0.95, "learning_rate": 2.416494313207797e-06, "loss": 2.3808, "step": 545720 }, { "epoch": 0.95, "learning_rate": 2.4156223732809705e-06, "loss": 2.3069, "step": 545730 }, { "epoch": 0.95, "learning_rate": 2.414750433354144e-06, "loss": 2.2514, "step": 545740 }, { "epoch": 0.95, "learning_rate": 2.4138784934273172e-06, "loss": 2.3171, "step": 545750 }, { "epoch": 0.95, "learning_rate": 2.41300655350049e-06, "loss": 2.3116, "step": 545760 }, { "epoch": 0.95, "learning_rate": 2.4121346135736635e-06, "loss": 2.2331, "step": 545770 }, { "epoch": 0.95, "learning_rate": 2.4112626736468364e-06, "loss": 2.2581, "step": 545780 }, { "epoch": 0.95, "learning_rate": 2.4103907337200098e-06, "loss": 2.2611, "step": 545790 }, { "epoch": 0.95, "learning_rate": 2.409518793793183e-06, "loss": 2.3104, "step": 545800 }, { "epoch": 0.95, "learning_rate": 2.4086468538663564e-06, "loss": 2.2208, "step": 545810 }, { "epoch": 0.95, "learning_rate": 2.4077749139395294e-06, "loss": 2.154, "step": 545820 }, { "epoch": 0.95, "learning_rate": 2.4069029740127027e-06, "loss": 2.3364, "step": 545830 }, { "epoch": 0.95, "learning_rate": 2.4060310340858756e-06, "loss": 2.2608, "step": 545840 }, { "epoch": 0.95, "learning_rate": 2.405159094159049e-06, "loss": 2.1997, "step": 545850 }, { "epoch": 0.95, "learning_rate": 2.404287154232222e-06, "loss": 2.2819, "step": 545860 }, { "epoch": 0.95, "learning_rate": 2.4034152143053957e-06, "loss": 2.2785, "step": 545870 }, { "epoch": 0.95, "learning_rate": 2.4025432743785686e-06, "loss": 2.3315, "step": 545880 }, { "epoch": 0.95, "learning_rate": 2.401671334451742e-06, "loss": 2.375, "step": 545890 }, { "epoch": 0.95, "learning_rate": 2.400799394524915e-06, "loss": 2.3274, "step": 545900 }, { "epoch": 0.95, "learning_rate": 2.3999274545980882e-06, "loss": 2.2501, "step": 545910 }, { "epoch": 0.95, "learning_rate": 2.399055514671261e-06, "loss": 2.2307, "step": 545920 }, { "epoch": 0.95, "learning_rate": 2.3981835747444345e-06, "loss": 2.164, "step": 545930 }, { "epoch": 0.95, "learning_rate": 2.397311634817608e-06, "loss": 2.1375, "step": 545940 }, { "epoch": 0.95, "learning_rate": 2.396439694890781e-06, "loss": 2.2169, "step": 545950 }, { "epoch": 0.95, "learning_rate": 2.395567754963954e-06, "loss": 2.3007, "step": 545960 }, { "epoch": 0.95, "learning_rate": 2.3946958150371274e-06, "loss": 2.1939, "step": 545970 }, { "epoch": 0.95, "learning_rate": 2.3938238751103004e-06, "loss": 2.2579, "step": 545980 }, { "epoch": 0.95, "learning_rate": 2.3929519351834737e-06, "loss": 2.2623, "step": 545990 }, { "epoch": 0.95, "learning_rate": 2.392079995256647e-06, "loss": 2.1107, "step": 546000 }, { "epoch": 0.95, "learning_rate": 2.3912080553298204e-06, "loss": 2.2154, "step": 546010 }, { "epoch": 0.95, "learning_rate": 2.3903361154029933e-06, "loss": 2.3147, "step": 546020 }, { "epoch": 0.95, "learning_rate": 2.3894641754761667e-06, "loss": 2.2499, "step": 546030 }, { "epoch": 0.95, "learning_rate": 2.3885922355493396e-06, "loss": 2.2636, "step": 546040 }, { "epoch": 0.95, "learning_rate": 2.387720295622513e-06, "loss": 2.1825, "step": 546050 }, { "epoch": 0.95, "learning_rate": 2.386848355695686e-06, "loss": 2.3019, "step": 546060 }, { "epoch": 0.95, "learning_rate": 2.3859764157688596e-06, "loss": 2.2237, "step": 546070 }, { "epoch": 0.95, "learning_rate": 2.3851044758420326e-06, "loss": 2.2071, "step": 546080 }, { "epoch": 0.95, "learning_rate": 2.384232535915206e-06, "loss": 2.2997, "step": 546090 }, { "epoch": 0.95, "learning_rate": 2.383360595988379e-06, "loss": 2.1521, "step": 546100 }, { "epoch": 0.95, "learning_rate": 2.382488656061552e-06, "loss": 2.351, "step": 546110 }, { "epoch": 0.95, "learning_rate": 2.381616716134725e-06, "loss": 2.2448, "step": 546120 }, { "epoch": 0.95, "learning_rate": 2.3807447762078984e-06, "loss": 2.267, "step": 546130 }, { "epoch": 0.95, "learning_rate": 2.379872836281072e-06, "loss": 2.3421, "step": 546140 }, { "epoch": 0.95, "learning_rate": 2.379000896354245e-06, "loss": 2.2389, "step": 546150 }, { "epoch": 0.95, "learning_rate": 2.378128956427418e-06, "loss": 2.2053, "step": 546160 }, { "epoch": 0.95, "learning_rate": 2.3772570165005914e-06, "loss": 2.2504, "step": 546170 }, { "epoch": 0.95, "learning_rate": 2.3763850765737643e-06, "loss": 2.2459, "step": 546180 }, { "epoch": 0.95, "learning_rate": 2.3755131366469377e-06, "loss": 2.225, "step": 546190 }, { "epoch": 0.95, "learning_rate": 2.374641196720111e-06, "loss": 2.2955, "step": 546200 }, { "epoch": 0.95, "learning_rate": 2.3737692567932844e-06, "loss": 2.2561, "step": 546210 }, { "epoch": 0.95, "learning_rate": 2.3728973168664573e-06, "loss": 2.1852, "step": 546220 }, { "epoch": 0.95, "learning_rate": 2.3720253769396306e-06, "loss": 2.243, "step": 546230 }, { "epoch": 0.95, "learning_rate": 2.3711534370128036e-06, "loss": 2.216, "step": 546240 }, { "epoch": 0.95, "learning_rate": 2.370281497085977e-06, "loss": 2.2331, "step": 546250 }, { "epoch": 0.95, "learning_rate": 2.36940955715915e-06, "loss": 2.3522, "step": 546260 }, { "epoch": 0.95, "learning_rate": 2.3685376172323236e-06, "loss": 2.3059, "step": 546270 }, { "epoch": 0.95, "learning_rate": 2.3676656773054965e-06, "loss": 2.308, "step": 546280 }, { "epoch": 0.95, "learning_rate": 2.36679373737867e-06, "loss": 2.2304, "step": 546290 }, { "epoch": 0.95, "learning_rate": 2.365921797451843e-06, "loss": 2.1864, "step": 546300 }, { "epoch": 0.95, "learning_rate": 2.365049857525016e-06, "loss": 2.0917, "step": 546310 }, { "epoch": 0.95, "learning_rate": 2.364177917598189e-06, "loss": 2.2946, "step": 546320 }, { "epoch": 0.95, "learning_rate": 2.3633059776713624e-06, "loss": 2.3124, "step": 546330 }, { "epoch": 0.95, "learning_rate": 2.3624340377445358e-06, "loss": 2.3082, "step": 546340 }, { "epoch": 0.95, "learning_rate": 2.361562097817709e-06, "loss": 2.4248, "step": 546350 }, { "epoch": 0.95, "learning_rate": 2.360690157890882e-06, "loss": 2.1653, "step": 546360 }, { "epoch": 0.95, "learning_rate": 2.3598182179640554e-06, "loss": 2.3416, "step": 546370 }, { "epoch": 0.95, "learning_rate": 2.3589462780372283e-06, "loss": 2.2055, "step": 546380 }, { "epoch": 0.95, "learning_rate": 2.3580743381104016e-06, "loss": 2.2958, "step": 546390 }, { "epoch": 0.95, "learning_rate": 2.357202398183575e-06, "loss": 2.2981, "step": 546400 }, { "epoch": 0.95, "learning_rate": 2.3563304582567483e-06, "loss": 2.2739, "step": 546410 }, { "epoch": 0.95, "learning_rate": 2.3554585183299213e-06, "loss": 2.2434, "step": 546420 }, { "epoch": 0.95, "learning_rate": 2.3545865784030946e-06, "loss": 2.1919, "step": 546430 }, { "epoch": 0.95, "learning_rate": 2.3537146384762675e-06, "loss": 2.3015, "step": 546440 }, { "epoch": 0.95, "learning_rate": 2.352842698549441e-06, "loss": 2.2654, "step": 546450 }, { "epoch": 0.95, "learning_rate": 2.351970758622614e-06, "loss": 2.1999, "step": 546460 }, { "epoch": 0.95, "learning_rate": 2.3510988186957876e-06, "loss": 2.234, "step": 546470 }, { "epoch": 0.95, "learning_rate": 2.3502268787689605e-06, "loss": 2.3861, "step": 546480 }, { "epoch": 0.95, "learning_rate": 2.349354938842134e-06, "loss": 2.2771, "step": 546490 }, { "epoch": 0.95, "learning_rate": 2.3484829989153068e-06, "loss": 2.2003, "step": 546500 }, { "epoch": 0.95, "learning_rate": 2.34761105898848e-06, "loss": 2.1573, "step": 546510 }, { "epoch": 0.95, "learning_rate": 2.346739119061653e-06, "loss": 2.206, "step": 546520 }, { "epoch": 0.95, "learning_rate": 2.3458671791348264e-06, "loss": 2.1976, "step": 546530 }, { "epoch": 0.95, "learning_rate": 2.3449952392079997e-06, "loss": 2.2254, "step": 546540 }, { "epoch": 0.95, "learning_rate": 2.344123299281173e-06, "loss": 2.2502, "step": 546550 }, { "epoch": 0.95, "learning_rate": 2.343251359354346e-06, "loss": 2.3419, "step": 546560 }, { "epoch": 0.95, "learning_rate": 2.3423794194275193e-06, "loss": 2.3007, "step": 546570 }, { "epoch": 0.95, "learning_rate": 2.3415074795006923e-06, "loss": 2.2496, "step": 546580 }, { "epoch": 0.95, "learning_rate": 2.3406355395738656e-06, "loss": 2.2267, "step": 546590 }, { "epoch": 0.95, "learning_rate": 2.339763599647039e-06, "loss": 2.235, "step": 546600 }, { "epoch": 0.95, "learning_rate": 2.3388916597202123e-06, "loss": 2.2486, "step": 546610 }, { "epoch": 0.95, "learning_rate": 2.3380197197933852e-06, "loss": 2.274, "step": 546620 }, { "epoch": 0.95, "learning_rate": 2.3371477798665586e-06, "loss": 2.2604, "step": 546630 }, { "epoch": 0.95, "learning_rate": 2.3362758399397315e-06, "loss": 2.3021, "step": 546640 }, { "epoch": 0.95, "learning_rate": 2.335403900012905e-06, "loss": 2.2332, "step": 546650 }, { "epoch": 0.95, "learning_rate": 2.3345319600860778e-06, "loss": 2.2688, "step": 546660 }, { "epoch": 0.95, "learning_rate": 2.3336600201592515e-06, "loss": 2.2771, "step": 546670 }, { "epoch": 0.95, "learning_rate": 2.3327880802324245e-06, "loss": 2.344, "step": 546680 }, { "epoch": 0.95, "learning_rate": 2.331916140305598e-06, "loss": 2.2443, "step": 546690 }, { "epoch": 0.95, "learning_rate": 2.3310442003787707e-06, "loss": 2.2089, "step": 546700 }, { "epoch": 0.95, "learning_rate": 2.330172260451944e-06, "loss": 2.281, "step": 546710 }, { "epoch": 0.95, "learning_rate": 2.329300320525117e-06, "loss": 2.1677, "step": 546720 }, { "epoch": 0.95, "learning_rate": 2.3284283805982903e-06, "loss": 2.1939, "step": 546730 }, { "epoch": 0.95, "learning_rate": 2.3275564406714637e-06, "loss": 2.3583, "step": 546740 }, { "epoch": 0.95, "learning_rate": 2.326684500744637e-06, "loss": 2.2376, "step": 546750 }, { "epoch": 0.95, "learning_rate": 2.32581256081781e-06, "loss": 2.3141, "step": 546760 }, { "epoch": 0.95, "learning_rate": 2.3249406208909833e-06, "loss": 2.2933, "step": 546770 }, { "epoch": 0.95, "learning_rate": 2.3240686809641562e-06, "loss": 2.2202, "step": 546780 }, { "epoch": 0.95, "learning_rate": 2.3231967410373296e-06, "loss": 2.2829, "step": 546790 }, { "epoch": 0.95, "learning_rate": 2.322324801110503e-06, "loss": 2.2842, "step": 546800 }, { "epoch": 0.95, "learning_rate": 2.3214528611836763e-06, "loss": 2.2399, "step": 546810 }, { "epoch": 0.95, "learning_rate": 2.320580921256849e-06, "loss": 2.2808, "step": 546820 }, { "epoch": 0.95, "learning_rate": 2.3197089813300225e-06, "loss": 2.305, "step": 546830 }, { "epoch": 0.95, "learning_rate": 2.3188370414031955e-06, "loss": 2.3999, "step": 546840 }, { "epoch": 0.95, "learning_rate": 2.317965101476369e-06, "loss": 2.3725, "step": 546850 }, { "epoch": 0.95, "learning_rate": 2.3170931615495417e-06, "loss": 2.1977, "step": 546860 }, { "epoch": 0.95, "learning_rate": 2.3162212216227155e-06, "loss": 2.2745, "step": 546870 }, { "epoch": 0.95, "learning_rate": 2.3153492816958884e-06, "loss": 2.301, "step": 546880 }, { "epoch": 0.95, "learning_rate": 2.3144773417690618e-06, "loss": 2.2798, "step": 546890 }, { "epoch": 0.95, "learning_rate": 2.3136054018422347e-06, "loss": 2.2484, "step": 546900 }, { "epoch": 0.95, "learning_rate": 2.312733461915408e-06, "loss": 2.3052, "step": 546910 }, { "epoch": 0.95, "learning_rate": 2.311861521988581e-06, "loss": 2.223, "step": 546920 }, { "epoch": 0.95, "learning_rate": 2.3109895820617543e-06, "loss": 2.2238, "step": 546930 }, { "epoch": 0.95, "learning_rate": 2.3101176421349276e-06, "loss": 2.3042, "step": 546940 }, { "epoch": 0.95, "learning_rate": 2.309245702208101e-06, "loss": 2.3014, "step": 546950 }, { "epoch": 0.95, "learning_rate": 2.308373762281274e-06, "loss": 2.2912, "step": 546960 }, { "epoch": 0.95, "learning_rate": 2.3075018223544473e-06, "loss": 2.2321, "step": 546970 }, { "epoch": 0.95, "learning_rate": 2.30662988242762e-06, "loss": 2.2372, "step": 546980 }, { "epoch": 0.95, "learning_rate": 2.3057579425007935e-06, "loss": 2.2261, "step": 546990 }, { "epoch": 0.95, "learning_rate": 2.304886002573967e-06, "loss": 2.2528, "step": 547000 }, { "epoch": 0.95, "learning_rate": 2.3040140626471402e-06, "loss": 2.3404, "step": 547010 }, { "epoch": 0.95, "learning_rate": 2.303142122720313e-06, "loss": 2.3461, "step": 547020 }, { "epoch": 0.95, "learning_rate": 2.3022701827934865e-06, "loss": 2.3317, "step": 547030 }, { "epoch": 0.95, "learning_rate": 2.3013982428666594e-06, "loss": 2.246, "step": 547040 }, { "epoch": 0.95, "learning_rate": 2.3005263029398328e-06, "loss": 2.1873, "step": 547050 }, { "epoch": 0.95, "learning_rate": 2.2996543630130057e-06, "loss": 2.3561, "step": 547060 }, { "epoch": 0.95, "learning_rate": 2.2987824230861795e-06, "loss": 2.2678, "step": 547070 }, { "epoch": 0.95, "learning_rate": 2.2979104831593524e-06, "loss": 2.2016, "step": 547080 }, { "epoch": 0.95, "learning_rate": 2.2970385432325257e-06, "loss": 2.2192, "step": 547090 }, { "epoch": 0.95, "learning_rate": 2.2961666033056986e-06, "loss": 2.2594, "step": 547100 }, { "epoch": 0.95, "learning_rate": 2.295294663378872e-06, "loss": 2.3505, "step": 547110 }, { "epoch": 0.95, "learning_rate": 2.294422723452045e-06, "loss": 2.2501, "step": 547120 }, { "epoch": 0.95, "learning_rate": 2.2935507835252187e-06, "loss": 2.2323, "step": 547130 }, { "epoch": 0.95, "learning_rate": 2.2926788435983916e-06, "loss": 2.1234, "step": 547140 }, { "epoch": 0.95, "learning_rate": 2.291806903671565e-06, "loss": 2.0985, "step": 547150 }, { "epoch": 0.95, "learning_rate": 2.290934963744738e-06, "loss": 2.3311, "step": 547160 }, { "epoch": 0.95, "learning_rate": 2.2900630238179112e-06, "loss": 2.233, "step": 547170 }, { "epoch": 0.95, "learning_rate": 2.289191083891084e-06, "loss": 2.2663, "step": 547180 }, { "epoch": 0.95, "learning_rate": 2.2883191439642575e-06, "loss": 2.2596, "step": 547190 }, { "epoch": 0.95, "learning_rate": 2.287447204037431e-06, "loss": 2.2153, "step": 547200 }, { "epoch": 0.95, "learning_rate": 2.286575264110604e-06, "loss": 2.1509, "step": 547210 }, { "epoch": 0.95, "learning_rate": 2.285703324183777e-06, "loss": 2.2355, "step": 547220 }, { "epoch": 0.95, "learning_rate": 2.2848313842569505e-06, "loss": 2.3394, "step": 547230 }, { "epoch": 0.95, "learning_rate": 2.2839594443301234e-06, "loss": 2.0861, "step": 547240 }, { "epoch": 0.95, "learning_rate": 2.2830875044032967e-06, "loss": 2.3179, "step": 547250 }, { "epoch": 0.95, "learning_rate": 2.2822155644764697e-06, "loss": 2.4755, "step": 547260 }, { "epoch": 0.95, "learning_rate": 2.2813436245496434e-06, "loss": 2.2912, "step": 547270 }, { "epoch": 0.95, "learning_rate": 2.2804716846228163e-06, "loss": 2.2019, "step": 547280 }, { "epoch": 0.95, "learning_rate": 2.2795997446959897e-06, "loss": 2.2186, "step": 547290 }, { "epoch": 0.95, "learning_rate": 2.2787278047691626e-06, "loss": 2.2714, "step": 547300 }, { "epoch": 0.95, "learning_rate": 2.277855864842336e-06, "loss": 2.3745, "step": 547310 }, { "epoch": 0.95, "learning_rate": 2.276983924915509e-06, "loss": 2.2315, "step": 547320 }, { "epoch": 0.95, "learning_rate": 2.2761119849886827e-06, "loss": 2.2822, "step": 547330 }, { "epoch": 0.95, "learning_rate": 2.2752400450618556e-06, "loss": 2.2022, "step": 547340 }, { "epoch": 0.95, "learning_rate": 2.274368105135029e-06, "loss": 2.2784, "step": 547350 }, { "epoch": 0.95, "learning_rate": 2.273496165208202e-06, "loss": 2.2043, "step": 547360 }, { "epoch": 0.95, "learning_rate": 2.272624225281375e-06, "loss": 2.3141, "step": 547370 }, { "epoch": 0.95, "learning_rate": 2.271752285354548e-06, "loss": 2.2086, "step": 547380 }, { "epoch": 0.95, "learning_rate": 2.2708803454277215e-06, "loss": 2.2828, "step": 547390 }, { "epoch": 0.95, "learning_rate": 2.270008405500895e-06, "loss": 2.1905, "step": 547400 }, { "epoch": 0.95, "learning_rate": 2.269136465574068e-06, "loss": 2.3122, "step": 547410 }, { "epoch": 0.95, "learning_rate": 2.268264525647241e-06, "loss": 2.2688, "step": 547420 }, { "epoch": 0.95, "learning_rate": 2.2673925857204144e-06, "loss": 2.1581, "step": 547430 }, { "epoch": 0.95, "learning_rate": 2.2665206457935873e-06, "loss": 2.3199, "step": 547440 }, { "epoch": 0.95, "learning_rate": 2.2656487058667607e-06, "loss": 2.1878, "step": 547450 }, { "epoch": 0.95, "learning_rate": 2.2647767659399336e-06, "loss": 2.0662, "step": 547460 }, { "epoch": 0.95, "learning_rate": 2.2639048260131074e-06, "loss": 2.2949, "step": 547470 }, { "epoch": 0.95, "learning_rate": 2.2630328860862803e-06, "loss": 2.1925, "step": 547480 }, { "epoch": 0.95, "learning_rate": 2.2621609461594537e-06, "loss": 2.1069, "step": 547490 }, { "epoch": 0.95, "learning_rate": 2.2612890062326266e-06, "loss": 2.2431, "step": 547500 }, { "epoch": 0.95, "learning_rate": 2.2604170663058e-06, "loss": 2.2422, "step": 547510 }, { "epoch": 0.95, "learning_rate": 2.259545126378973e-06, "loss": 2.2959, "step": 547520 }, { "epoch": 0.95, "learning_rate": 2.2586731864521466e-06, "loss": 2.2155, "step": 547530 }, { "epoch": 0.95, "learning_rate": 2.2578012465253195e-06, "loss": 2.3109, "step": 547540 }, { "epoch": 0.95, "learning_rate": 2.256929306598493e-06, "loss": 2.2589, "step": 547550 }, { "epoch": 0.95, "learning_rate": 2.256057366671666e-06, "loss": 2.2799, "step": 547560 }, { "epoch": 0.95, "learning_rate": 2.255185426744839e-06, "loss": 2.2483, "step": 547570 }, { "epoch": 0.95, "learning_rate": 2.254313486818012e-06, "loss": 2.2025, "step": 547580 }, { "epoch": 0.95, "learning_rate": 2.2534415468911854e-06, "loss": 2.2733, "step": 547590 }, { "epoch": 0.95, "learning_rate": 2.2525696069643588e-06, "loss": 2.3538, "step": 547600 }, { "epoch": 0.95, "learning_rate": 2.251697667037532e-06, "loss": 2.3007, "step": 547610 }, { "epoch": 0.95, "learning_rate": 2.250825727110705e-06, "loss": 2.3888, "step": 547620 }, { "epoch": 0.96, "learning_rate": 2.2499537871838784e-06, "loss": 2.2001, "step": 547630 }, { "epoch": 0.96, "learning_rate": 2.2490818472570513e-06, "loss": 2.3206, "step": 547640 }, { "epoch": 0.96, "learning_rate": 2.2482099073302247e-06, "loss": 2.2795, "step": 547650 }, { "epoch": 0.96, "learning_rate": 2.2473379674033976e-06, "loss": 2.1441, "step": 547660 }, { "epoch": 0.96, "learning_rate": 2.2464660274765713e-06, "loss": 2.3291, "step": 547670 }, { "epoch": 0.96, "learning_rate": 2.2455940875497443e-06, "loss": 2.3019, "step": 547680 }, { "epoch": 0.96, "learning_rate": 2.2447221476229176e-06, "loss": 2.1395, "step": 547690 }, { "epoch": 0.96, "learning_rate": 2.2438502076960905e-06, "loss": 2.4181, "step": 547700 }, { "epoch": 0.96, "learning_rate": 2.242978267769264e-06, "loss": 2.3326, "step": 547710 }, { "epoch": 0.96, "learning_rate": 2.242106327842437e-06, "loss": 2.2458, "step": 547720 }, { "epoch": 0.96, "learning_rate": 2.2412343879156106e-06, "loss": 2.252, "step": 547730 }, { "epoch": 0.96, "learning_rate": 2.2403624479887835e-06, "loss": 2.2049, "step": 547740 }, { "epoch": 0.96, "learning_rate": 2.239490508061957e-06, "loss": 2.196, "step": 547750 }, { "epoch": 0.96, "learning_rate": 2.2386185681351298e-06, "loss": 2.3516, "step": 547760 }, { "epoch": 0.96, "learning_rate": 2.237746628208303e-06, "loss": 2.2954, "step": 547770 }, { "epoch": 0.96, "learning_rate": 2.236874688281476e-06, "loss": 2.1983, "step": 547780 }, { "epoch": 0.96, "learning_rate": 2.2360027483546494e-06, "loss": 2.146, "step": 547790 }, { "epoch": 0.96, "learning_rate": 2.2351308084278227e-06, "loss": 2.2141, "step": 547800 }, { "epoch": 0.96, "learning_rate": 2.234258868500996e-06, "loss": 2.2574, "step": 547810 }, { "epoch": 0.96, "learning_rate": 2.233386928574169e-06, "loss": 2.1786, "step": 547820 }, { "epoch": 0.96, "learning_rate": 2.2325149886473423e-06, "loss": 2.2283, "step": 547830 }, { "epoch": 0.96, "learning_rate": 2.2316430487205153e-06, "loss": 2.232, "step": 547840 }, { "epoch": 0.96, "learning_rate": 2.2307711087936886e-06, "loss": 2.2842, "step": 547850 }, { "epoch": 0.96, "learning_rate": 2.2298991688668615e-06, "loss": 2.2714, "step": 547860 }, { "epoch": 0.96, "learning_rate": 2.2290272289400353e-06, "loss": 2.1873, "step": 547870 }, { "epoch": 0.96, "learning_rate": 2.2281552890132082e-06, "loss": 2.2551, "step": 547880 }, { "epoch": 0.96, "learning_rate": 2.2272833490863816e-06, "loss": 2.2201, "step": 547890 }, { "epoch": 0.96, "learning_rate": 2.2264114091595545e-06, "loss": 2.1522, "step": 547900 }, { "epoch": 0.96, "learning_rate": 2.225539469232728e-06, "loss": 2.3391, "step": 547910 }, { "epoch": 0.96, "learning_rate": 2.2246675293059008e-06, "loss": 2.2814, "step": 547920 }, { "epoch": 0.96, "learning_rate": 2.2237955893790745e-06, "loss": 2.287, "step": 547930 }, { "epoch": 0.96, "learning_rate": 2.2229236494522475e-06, "loss": 2.3146, "step": 547940 }, { "epoch": 0.96, "learning_rate": 2.222051709525421e-06, "loss": 2.1639, "step": 547950 }, { "epoch": 0.96, "learning_rate": 2.2211797695985937e-06, "loss": 2.3047, "step": 547960 }, { "epoch": 0.96, "learning_rate": 2.220307829671767e-06, "loss": 2.2788, "step": 547970 }, { "epoch": 0.96, "learning_rate": 2.21943588974494e-06, "loss": 2.2073, "step": 547980 }, { "epoch": 0.96, "learning_rate": 2.2185639498181133e-06, "loss": 2.2876, "step": 547990 }, { "epoch": 0.96, "learning_rate": 2.2176920098912867e-06, "loss": 2.2736, "step": 548000 }, { "epoch": 0.96, "learning_rate": 2.21682006996446e-06, "loss": 2.265, "step": 548010 }, { "epoch": 0.96, "learning_rate": 2.215948130037633e-06, "loss": 2.2266, "step": 548020 }, { "epoch": 0.96, "learning_rate": 2.2150761901108063e-06, "loss": 2.2271, "step": 548030 }, { "epoch": 0.96, "learning_rate": 2.2142042501839792e-06, "loss": 2.2247, "step": 548040 }, { "epoch": 0.96, "learning_rate": 2.2133323102571526e-06, "loss": 2.2552, "step": 548050 }, { "epoch": 0.96, "learning_rate": 2.2124603703303255e-06, "loss": 2.2627, "step": 548060 }, { "epoch": 0.96, "learning_rate": 2.2115884304034993e-06, "loss": 2.2483, "step": 548070 }, { "epoch": 0.96, "learning_rate": 2.210716490476672e-06, "loss": 2.3368, "step": 548080 }, { "epoch": 0.96, "learning_rate": 2.2098445505498455e-06, "loss": 2.2257, "step": 548090 }, { "epoch": 0.96, "learning_rate": 2.2089726106230185e-06, "loss": 2.2755, "step": 548100 }, { "epoch": 0.96, "learning_rate": 2.208100670696192e-06, "loss": 2.2692, "step": 548110 }, { "epoch": 0.96, "learning_rate": 2.2072287307693647e-06, "loss": 2.2085, "step": 548120 }, { "epoch": 0.96, "learning_rate": 2.2063567908425385e-06, "loss": 2.1802, "step": 548130 }, { "epoch": 0.96, "learning_rate": 2.2054848509157114e-06, "loss": 2.1915, "step": 548140 }, { "epoch": 0.96, "learning_rate": 2.2046129109888848e-06, "loss": 2.2696, "step": 548150 }, { "epoch": 0.96, "learning_rate": 2.2037409710620577e-06, "loss": 2.2594, "step": 548160 }, { "epoch": 0.96, "learning_rate": 2.202869031135231e-06, "loss": 2.3258, "step": 548170 }, { "epoch": 0.96, "learning_rate": 2.201997091208404e-06, "loss": 2.2721, "step": 548180 }, { "epoch": 0.96, "learning_rate": 2.2011251512815773e-06, "loss": 2.2186, "step": 548190 }, { "epoch": 0.96, "learning_rate": 2.2002532113547507e-06, "loss": 2.3382, "step": 548200 }, { "epoch": 0.96, "learning_rate": 2.199381271427924e-06, "loss": 2.3268, "step": 548210 }, { "epoch": 0.96, "learning_rate": 2.198509331501097e-06, "loss": 2.3425, "step": 548220 }, { "epoch": 0.96, "learning_rate": 2.1976373915742703e-06, "loss": 2.1319, "step": 548230 }, { "epoch": 0.96, "learning_rate": 2.196765451647443e-06, "loss": 2.2031, "step": 548240 }, { "epoch": 0.96, "learning_rate": 2.1958935117206165e-06, "loss": 2.2311, "step": 548250 }, { "epoch": 0.96, "learning_rate": 2.1950215717937895e-06, "loss": 2.2964, "step": 548260 }, { "epoch": 0.96, "learning_rate": 2.1941496318669632e-06, "loss": 2.241, "step": 548270 }, { "epoch": 0.96, "learning_rate": 2.193277691940136e-06, "loss": 2.1729, "step": 548280 }, { "epoch": 0.96, "learning_rate": 2.1924057520133095e-06, "loss": 2.1319, "step": 548290 }, { "epoch": 0.96, "learning_rate": 2.1915338120864824e-06, "loss": 2.2774, "step": 548300 }, { "epoch": 0.96, "learning_rate": 2.1906618721596558e-06, "loss": 2.3251, "step": 548310 }, { "epoch": 0.96, "learning_rate": 2.1897899322328287e-06, "loss": 2.2287, "step": 548320 }, { "epoch": 0.96, "learning_rate": 2.1889179923060025e-06, "loss": 2.2735, "step": 548330 }, { "epoch": 0.96, "learning_rate": 2.1880460523791754e-06, "loss": 2.3578, "step": 548340 }, { "epoch": 0.96, "learning_rate": 2.1871741124523487e-06, "loss": 2.3219, "step": 548350 }, { "epoch": 0.96, "learning_rate": 2.1863021725255217e-06, "loss": 2.285, "step": 548360 }, { "epoch": 0.96, "learning_rate": 2.185430232598695e-06, "loss": 2.2455, "step": 548370 }, { "epoch": 0.96, "learning_rate": 2.184558292671868e-06, "loss": 2.2134, "step": 548380 }, { "epoch": 0.96, "learning_rate": 2.1836863527450413e-06, "loss": 2.3495, "step": 548390 }, { "epoch": 0.96, "learning_rate": 2.1828144128182146e-06, "loss": 2.2239, "step": 548400 }, { "epoch": 0.96, "learning_rate": 2.181942472891388e-06, "loss": 2.2084, "step": 548410 }, { "epoch": 0.96, "learning_rate": 2.181070532964561e-06, "loss": 2.2495, "step": 548420 }, { "epoch": 0.96, "learning_rate": 2.1801985930377342e-06, "loss": 2.2749, "step": 548430 }, { "epoch": 0.96, "learning_rate": 2.179326653110907e-06, "loss": 2.2085, "step": 548440 }, { "epoch": 0.96, "learning_rate": 2.1784547131840805e-06, "loss": 2.2028, "step": 548450 }, { "epoch": 0.96, "learning_rate": 2.1775827732572534e-06, "loss": 2.2778, "step": 548460 }, { "epoch": 0.96, "learning_rate": 2.176710833330427e-06, "loss": 2.3775, "step": 548470 }, { "epoch": 0.96, "learning_rate": 2.1758388934036e-06, "loss": 2.1392, "step": 548480 }, { "epoch": 0.96, "learning_rate": 2.1749669534767735e-06, "loss": 2.2315, "step": 548490 }, { "epoch": 0.96, "learning_rate": 2.1740950135499464e-06, "loss": 2.3304, "step": 548500 }, { "epoch": 0.96, "learning_rate": 2.1732230736231197e-06, "loss": 2.2791, "step": 548510 }, { "epoch": 0.96, "learning_rate": 2.1723511336962927e-06, "loss": 2.2093, "step": 548520 }, { "epoch": 0.96, "learning_rate": 2.1714791937694664e-06, "loss": 2.2383, "step": 548530 }, { "epoch": 0.96, "learning_rate": 2.1706072538426394e-06, "loss": 2.4283, "step": 548540 }, { "epoch": 0.96, "learning_rate": 2.1697353139158127e-06, "loss": 2.2694, "step": 548550 }, { "epoch": 0.96, "learning_rate": 2.1688633739889856e-06, "loss": 2.1701, "step": 548560 }, { "epoch": 0.96, "learning_rate": 2.167991434062159e-06, "loss": 2.2412, "step": 548570 }, { "epoch": 0.96, "learning_rate": 2.167119494135332e-06, "loss": 2.2505, "step": 548580 }, { "epoch": 0.96, "learning_rate": 2.1662475542085052e-06, "loss": 2.2266, "step": 548590 }, { "epoch": 0.96, "learning_rate": 2.1653756142816786e-06, "loss": 2.3442, "step": 548600 }, { "epoch": 0.96, "learning_rate": 2.164503674354852e-06, "loss": 2.3059, "step": 548610 }, { "epoch": 0.96, "learning_rate": 2.163631734428025e-06, "loss": 2.3164, "step": 548620 }, { "epoch": 0.96, "learning_rate": 2.162759794501198e-06, "loss": 2.4074, "step": 548630 }, { "epoch": 0.96, "learning_rate": 2.161887854574371e-06, "loss": 2.3199, "step": 548640 }, { "epoch": 0.96, "learning_rate": 2.1610159146475445e-06, "loss": 2.1971, "step": 548650 }, { "epoch": 0.96, "learning_rate": 2.160143974720718e-06, "loss": 2.2494, "step": 548660 }, { "epoch": 0.96, "learning_rate": 2.159272034793891e-06, "loss": 2.3235, "step": 548670 }, { "epoch": 0.96, "learning_rate": 2.158400094867064e-06, "loss": 2.3405, "step": 548680 }, { "epoch": 0.96, "learning_rate": 2.1575281549402374e-06, "loss": 2.2133, "step": 548690 }, { "epoch": 0.96, "learning_rate": 2.1566562150134104e-06, "loss": 2.3514, "step": 548700 }, { "epoch": 0.96, "learning_rate": 2.1557842750865837e-06, "loss": 2.2337, "step": 548710 }, { "epoch": 0.96, "learning_rate": 2.1549123351597566e-06, "loss": 2.2102, "step": 548720 }, { "epoch": 0.96, "learning_rate": 2.1540403952329304e-06, "loss": 2.2615, "step": 548730 }, { "epoch": 0.96, "learning_rate": 2.1531684553061033e-06, "loss": 2.2055, "step": 548740 }, { "epoch": 0.96, "learning_rate": 2.1522965153792767e-06, "loss": 2.2878, "step": 548750 }, { "epoch": 0.96, "learning_rate": 2.1514245754524496e-06, "loss": 2.3249, "step": 548760 }, { "epoch": 0.96, "learning_rate": 2.150552635525623e-06, "loss": 2.3096, "step": 548770 }, { "epoch": 0.96, "learning_rate": 2.149680695598796e-06, "loss": 2.3044, "step": 548780 }, { "epoch": 0.96, "learning_rate": 2.148808755671969e-06, "loss": 2.2532, "step": 548790 }, { "epoch": 0.96, "learning_rate": 2.1479368157451425e-06, "loss": 2.2492, "step": 548800 }, { "epoch": 0.96, "learning_rate": 2.147064875818316e-06, "loss": 2.161, "step": 548810 }, { "epoch": 0.96, "learning_rate": 2.146192935891489e-06, "loss": 2.2425, "step": 548820 }, { "epoch": 0.96, "learning_rate": 2.145320995964662e-06, "loss": 2.2544, "step": 548830 }, { "epoch": 0.96, "learning_rate": 2.144449056037835e-06, "loss": 2.2085, "step": 548840 }, { "epoch": 0.96, "learning_rate": 2.1435771161110084e-06, "loss": 2.1969, "step": 548850 }, { "epoch": 0.96, "learning_rate": 2.1427051761841818e-06, "loss": 2.2056, "step": 548860 }, { "epoch": 0.96, "learning_rate": 2.141833236257355e-06, "loss": 2.1675, "step": 548870 }, { "epoch": 0.96, "learning_rate": 2.140961296330528e-06, "loss": 2.3683, "step": 548880 }, { "epoch": 0.96, "learning_rate": 2.1400893564037014e-06, "loss": 2.2568, "step": 548890 }, { "epoch": 0.96, "learning_rate": 2.1392174164768743e-06, "loss": 2.2644, "step": 548900 }, { "epoch": 0.96, "learning_rate": 2.1383454765500477e-06, "loss": 2.2656, "step": 548910 }, { "epoch": 0.96, "learning_rate": 2.1374735366232206e-06, "loss": 2.2273, "step": 548920 }, { "epoch": 0.96, "learning_rate": 2.1366015966963944e-06, "loss": 2.2378, "step": 548930 }, { "epoch": 0.96, "learning_rate": 2.1357296567695673e-06, "loss": 2.2276, "step": 548940 }, { "epoch": 0.96, "learning_rate": 2.1348577168427406e-06, "loss": 2.3637, "step": 548950 }, { "epoch": 0.96, "learning_rate": 2.1339857769159136e-06, "loss": 2.2605, "step": 548960 }, { "epoch": 0.96, "learning_rate": 2.133113836989087e-06, "loss": 2.232, "step": 548970 }, { "epoch": 0.96, "learning_rate": 2.13224189706226e-06, "loss": 2.2656, "step": 548980 }, { "epoch": 0.96, "learning_rate": 2.131369957135433e-06, "loss": 2.3304, "step": 548990 }, { "epoch": 0.96, "learning_rate": 2.1304980172086065e-06, "loss": 2.1228, "step": 549000 }, { "epoch": 0.96, "learning_rate": 2.12962607728178e-06, "loss": 2.3305, "step": 549010 }, { "epoch": 0.96, "learning_rate": 2.1287541373549528e-06, "loss": 2.308, "step": 549020 }, { "epoch": 0.96, "learning_rate": 2.127882197428126e-06, "loss": 2.2958, "step": 549030 }, { "epoch": 0.96, "learning_rate": 2.127010257501299e-06, "loss": 2.2719, "step": 549040 }, { "epoch": 0.96, "learning_rate": 2.1261383175744724e-06, "loss": 2.3376, "step": 549050 }, { "epoch": 0.96, "learning_rate": 2.1252663776476457e-06, "loss": 2.2011, "step": 549060 }, { "epoch": 0.96, "learning_rate": 2.124394437720819e-06, "loss": 2.2153, "step": 549070 }, { "epoch": 0.96, "learning_rate": 2.123522497793992e-06, "loss": 2.2211, "step": 549080 }, { "epoch": 0.96, "learning_rate": 2.1226505578671654e-06, "loss": 2.2413, "step": 549090 }, { "epoch": 0.96, "learning_rate": 2.1217786179403383e-06, "loss": 2.2932, "step": 549100 }, { "epoch": 0.96, "learning_rate": 2.1209066780135116e-06, "loss": 2.2626, "step": 549110 }, { "epoch": 0.96, "learning_rate": 2.1200347380866846e-06, "loss": 2.2682, "step": 549120 }, { "epoch": 0.96, "learning_rate": 2.1191627981598583e-06, "loss": 2.3554, "step": 549130 }, { "epoch": 0.96, "learning_rate": 2.1182908582330312e-06, "loss": 2.2765, "step": 549140 }, { "epoch": 0.96, "learning_rate": 2.1174189183062046e-06, "loss": 2.3049, "step": 549150 }, { "epoch": 0.96, "learning_rate": 2.1165469783793775e-06, "loss": 2.3702, "step": 549160 }, { "epoch": 0.96, "learning_rate": 2.115675038452551e-06, "loss": 2.1818, "step": 549170 }, { "epoch": 0.96, "learning_rate": 2.1148030985257238e-06, "loss": 2.2866, "step": 549180 }, { "epoch": 0.96, "learning_rate": 2.113931158598897e-06, "loss": 2.3641, "step": 549190 }, { "epoch": 0.96, "learning_rate": 2.1130592186720705e-06, "loss": 2.2369, "step": 549200 }, { "epoch": 0.96, "learning_rate": 2.112187278745244e-06, "loss": 2.3028, "step": 549210 }, { "epoch": 0.96, "learning_rate": 2.1113153388184167e-06, "loss": 2.3245, "step": 549220 }, { "epoch": 0.96, "learning_rate": 2.11044339889159e-06, "loss": 2.1161, "step": 549230 }, { "epoch": 0.96, "learning_rate": 2.109571458964763e-06, "loss": 2.3191, "step": 549240 }, { "epoch": 0.96, "learning_rate": 2.1086995190379364e-06, "loss": 2.2109, "step": 549250 }, { "epoch": 0.96, "learning_rate": 2.1078275791111097e-06, "loss": 2.1694, "step": 549260 }, { "epoch": 0.96, "learning_rate": 2.106955639184283e-06, "loss": 2.3058, "step": 549270 }, { "epoch": 0.96, "learning_rate": 2.106083699257456e-06, "loss": 2.3565, "step": 549280 }, { "epoch": 0.96, "learning_rate": 2.1052117593306293e-06, "loss": 2.2459, "step": 549290 }, { "epoch": 0.96, "learning_rate": 2.1043398194038022e-06, "loss": 2.3758, "step": 549300 }, { "epoch": 0.96, "learning_rate": 2.1034678794769756e-06, "loss": 2.252, "step": 549310 }, { "epoch": 0.96, "learning_rate": 2.1025959395501485e-06, "loss": 2.2538, "step": 549320 }, { "epoch": 0.96, "learning_rate": 2.1017239996233223e-06, "loss": 2.2192, "step": 549330 }, { "epoch": 0.96, "learning_rate": 2.100852059696495e-06, "loss": 2.2591, "step": 549340 }, { "epoch": 0.96, "learning_rate": 2.0999801197696686e-06, "loss": 2.2811, "step": 549350 }, { "epoch": 0.96, "learning_rate": 2.0991081798428415e-06, "loss": 2.2203, "step": 549360 }, { "epoch": 0.96, "learning_rate": 2.098236239916015e-06, "loss": 2.2842, "step": 549370 }, { "epoch": 0.96, "learning_rate": 2.0973642999891877e-06, "loss": 2.314, "step": 549380 }, { "epoch": 0.96, "learning_rate": 2.096492360062361e-06, "loss": 2.2475, "step": 549390 }, { "epoch": 0.96, "learning_rate": 2.0956204201355344e-06, "loss": 2.3045, "step": 549400 }, { "epoch": 0.96, "learning_rate": 2.0947484802087078e-06, "loss": 2.3666, "step": 549410 }, { "epoch": 0.96, "learning_rate": 2.0938765402818807e-06, "loss": 2.2596, "step": 549420 }, { "epoch": 0.96, "learning_rate": 2.093004600355054e-06, "loss": 2.2387, "step": 549430 }, { "epoch": 0.96, "learning_rate": 2.092132660428227e-06, "loss": 2.224, "step": 549440 }, { "epoch": 0.96, "learning_rate": 2.0912607205014003e-06, "loss": 2.3323, "step": 549450 }, { "epoch": 0.96, "learning_rate": 2.0903887805745737e-06, "loss": 2.2351, "step": 549460 }, { "epoch": 0.96, "learning_rate": 2.089516840647747e-06, "loss": 2.2693, "step": 549470 }, { "epoch": 0.96, "learning_rate": 2.08864490072092e-06, "loss": 2.193, "step": 549480 }, { "epoch": 0.96, "learning_rate": 2.0877729607940933e-06, "loss": 2.3525, "step": 549490 }, { "epoch": 0.96, "learning_rate": 2.086901020867266e-06, "loss": 2.272, "step": 549500 }, { "epoch": 0.96, "learning_rate": 2.0860290809404396e-06, "loss": 2.2348, "step": 549510 }, { "epoch": 0.96, "learning_rate": 2.0851571410136125e-06, "loss": 2.2678, "step": 549520 }, { "epoch": 0.96, "learning_rate": 2.0842852010867862e-06, "loss": 2.1919, "step": 549530 }, { "epoch": 0.96, "learning_rate": 2.083413261159959e-06, "loss": 2.2756, "step": 549540 }, { "epoch": 0.96, "learning_rate": 2.0825413212331325e-06, "loss": 2.3498, "step": 549550 }, { "epoch": 0.96, "learning_rate": 2.0816693813063054e-06, "loss": 2.199, "step": 549560 }, { "epoch": 0.96, "learning_rate": 2.0807974413794788e-06, "loss": 2.2142, "step": 549570 }, { "epoch": 0.96, "learning_rate": 2.0799255014526517e-06, "loss": 2.0132, "step": 549580 }, { "epoch": 0.96, "learning_rate": 2.079053561525825e-06, "loss": 2.2042, "step": 549590 }, { "epoch": 0.96, "learning_rate": 2.0781816215989984e-06, "loss": 2.2316, "step": 549600 }, { "epoch": 0.96, "learning_rate": 2.0773096816721717e-06, "loss": 2.297, "step": 549610 }, { "epoch": 0.96, "learning_rate": 2.0764377417453447e-06, "loss": 2.1572, "step": 549620 }, { "epoch": 0.96, "learning_rate": 2.075565801818518e-06, "loss": 2.1747, "step": 549630 }, { "epoch": 0.96, "learning_rate": 2.074693861891691e-06, "loss": 2.2471, "step": 549640 }, { "epoch": 0.96, "learning_rate": 2.0738219219648643e-06, "loss": 2.2145, "step": 549650 }, { "epoch": 0.96, "learning_rate": 2.0729499820380376e-06, "loss": 2.2956, "step": 549660 }, { "epoch": 0.96, "learning_rate": 2.072078042111211e-06, "loss": 2.2143, "step": 549670 }, { "epoch": 0.96, "learning_rate": 2.071206102184384e-06, "loss": 2.211, "step": 549680 }, { "epoch": 0.96, "learning_rate": 2.0703341622575572e-06, "loss": 2.2311, "step": 549690 }, { "epoch": 0.96, "learning_rate": 2.06946222233073e-06, "loss": 2.2775, "step": 549700 }, { "epoch": 0.96, "learning_rate": 2.0685902824039035e-06, "loss": 2.313, "step": 549710 }, { "epoch": 0.96, "learning_rate": 2.0677183424770764e-06, "loss": 2.2429, "step": 549720 }, { "epoch": 0.96, "learning_rate": 2.06684640255025e-06, "loss": 2.2047, "step": 549730 }, { "epoch": 0.96, "learning_rate": 2.065974462623423e-06, "loss": 2.2742, "step": 549740 }, { "epoch": 0.96, "learning_rate": 2.0651025226965965e-06, "loss": 2.1623, "step": 549750 }, { "epoch": 0.96, "learning_rate": 2.0642305827697694e-06, "loss": 2.2385, "step": 549760 }, { "epoch": 0.96, "learning_rate": 2.0633586428429427e-06, "loss": 2.2121, "step": 549770 }, { "epoch": 0.96, "learning_rate": 2.0624867029161157e-06, "loss": 2.2441, "step": 549780 }, { "epoch": 0.96, "learning_rate": 2.061614762989289e-06, "loss": 2.2667, "step": 549790 }, { "epoch": 0.96, "learning_rate": 2.0607428230624624e-06, "loss": 2.3278, "step": 549800 }, { "epoch": 0.96, "learning_rate": 2.0598708831356357e-06, "loss": 2.1885, "step": 549810 }, { "epoch": 0.96, "learning_rate": 2.0589989432088086e-06, "loss": 2.1507, "step": 549820 }, { "epoch": 0.96, "learning_rate": 2.058127003281982e-06, "loss": 2.2038, "step": 549830 }, { "epoch": 0.96, "learning_rate": 2.057255063355155e-06, "loss": 2.1565, "step": 549840 }, { "epoch": 0.96, "learning_rate": 2.0563831234283283e-06, "loss": 2.4138, "step": 549850 }, { "epoch": 0.96, "learning_rate": 2.0555111835015016e-06, "loss": 2.2313, "step": 549860 }, { "epoch": 0.96, "learning_rate": 2.054639243574675e-06, "loss": 2.3024, "step": 549870 }, { "epoch": 0.96, "learning_rate": 2.053767303647848e-06, "loss": 2.196, "step": 549880 }, { "epoch": 0.96, "learning_rate": 2.0528953637210212e-06, "loss": 2.2501, "step": 549890 }, { "epoch": 0.96, "learning_rate": 2.052023423794194e-06, "loss": 2.2949, "step": 549900 }, { "epoch": 0.96, "learning_rate": 2.0511514838673675e-06, "loss": 2.2572, "step": 549910 }, { "epoch": 0.96, "learning_rate": 2.0502795439405404e-06, "loss": 2.3009, "step": 549920 }, { "epoch": 0.96, "learning_rate": 2.049407604013714e-06, "loss": 2.1467, "step": 549930 }, { "epoch": 0.96, "learning_rate": 2.048535664086887e-06, "loss": 2.2156, "step": 549940 }, { "epoch": 0.96, "learning_rate": 2.0476637241600604e-06, "loss": 2.2554, "step": 549950 }, { "epoch": 0.96, "learning_rate": 2.0467917842332334e-06, "loss": 2.4111, "step": 549960 }, { "epoch": 0.96, "learning_rate": 2.0459198443064067e-06, "loss": 2.2792, "step": 549970 }, { "epoch": 0.96, "learning_rate": 2.0450479043795796e-06, "loss": 2.1987, "step": 549980 }, { "epoch": 0.96, "learning_rate": 2.0441759644527534e-06, "loss": 2.2193, "step": 549990 }, { "epoch": 0.96, "learning_rate": 2.0433040245259263e-06, "loss": 2.233, "step": 550000 }, { "epoch": 0.96, "learning_rate": 2.0424320845990997e-06, "loss": 2.2137, "step": 550010 }, { "epoch": 0.96, "learning_rate": 2.0415601446722726e-06, "loss": 2.224, "step": 550020 }, { "epoch": 0.96, "learning_rate": 2.040688204745446e-06, "loss": 2.2596, "step": 550030 }, { "epoch": 0.96, "learning_rate": 2.039816264818619e-06, "loss": 2.2274, "step": 550040 }, { "epoch": 0.96, "learning_rate": 2.0389443248917922e-06, "loss": 2.3068, "step": 550050 }, { "epoch": 0.96, "learning_rate": 2.0380723849649656e-06, "loss": 2.2634, "step": 550060 }, { "epoch": 0.96, "learning_rate": 2.037200445038139e-06, "loss": 2.2667, "step": 550070 }, { "epoch": 0.96, "learning_rate": 2.036328505111312e-06, "loss": 2.2477, "step": 550080 }, { "epoch": 0.96, "learning_rate": 2.035456565184485e-06, "loss": 2.2404, "step": 550090 }, { "epoch": 0.96, "learning_rate": 2.034584625257658e-06, "loss": 2.3097, "step": 550100 }, { "epoch": 0.96, "learning_rate": 2.0337126853308314e-06, "loss": 2.2108, "step": 550110 }, { "epoch": 0.96, "learning_rate": 2.032840745404005e-06, "loss": 2.2717, "step": 550120 }, { "epoch": 0.96, "learning_rate": 2.031968805477178e-06, "loss": 2.18, "step": 550130 }, { "epoch": 0.96, "learning_rate": 2.031096865550351e-06, "loss": 2.2825, "step": 550140 }, { "epoch": 0.96, "learning_rate": 2.0302249256235244e-06, "loss": 2.2011, "step": 550150 }, { "epoch": 0.96, "learning_rate": 2.0293529856966973e-06, "loss": 2.3342, "step": 550160 }, { "epoch": 0.96, "learning_rate": 2.0284810457698707e-06, "loss": 2.334, "step": 550170 }, { "epoch": 0.96, "learning_rate": 2.0276091058430436e-06, "loss": 2.3034, "step": 550180 }, { "epoch": 0.96, "learning_rate": 2.0267371659162174e-06, "loss": 2.2741, "step": 550190 }, { "epoch": 0.96, "learning_rate": 2.0258652259893903e-06, "loss": 2.2089, "step": 550200 }, { "epoch": 0.96, "learning_rate": 2.0249932860625636e-06, "loss": 2.2486, "step": 550210 }, { "epoch": 0.96, "learning_rate": 2.0241213461357366e-06, "loss": 2.2691, "step": 550220 }, { "epoch": 0.96, "learning_rate": 2.02324940620891e-06, "loss": 2.2506, "step": 550230 }, { "epoch": 0.96, "learning_rate": 2.022377466282083e-06, "loss": 2.2759, "step": 550240 }, { "epoch": 0.96, "learning_rate": 2.021505526355256e-06, "loss": 2.2623, "step": 550250 }, { "epoch": 0.96, "learning_rate": 2.0206335864284295e-06, "loss": 2.3624, "step": 550260 }, { "epoch": 0.96, "learning_rate": 2.019761646501603e-06, "loss": 2.2381, "step": 550270 }, { "epoch": 0.96, "learning_rate": 2.018889706574776e-06, "loss": 2.2783, "step": 550280 }, { "epoch": 0.96, "learning_rate": 2.018017766647949e-06, "loss": 2.2405, "step": 550290 }, { "epoch": 0.96, "learning_rate": 2.017145826721122e-06, "loss": 2.2536, "step": 550300 }, { "epoch": 0.96, "learning_rate": 2.0162738867942954e-06, "loss": 2.2682, "step": 550310 }, { "epoch": 0.96, "learning_rate": 2.0154019468674688e-06, "loss": 2.2475, "step": 550320 }, { "epoch": 0.96, "learning_rate": 2.014530006940642e-06, "loss": 2.2928, "step": 550330 }, { "epoch": 0.96, "learning_rate": 2.013658067013815e-06, "loss": 2.2551, "step": 550340 }, { "epoch": 0.96, "learning_rate": 2.0127861270869884e-06, "loss": 2.3168, "step": 550350 }, { "epoch": 0.96, "learning_rate": 2.0119141871601613e-06, "loss": 2.2481, "step": 550360 }, { "epoch": 0.96, "learning_rate": 2.0110422472333346e-06, "loss": 2.2395, "step": 550370 }, { "epoch": 0.96, "learning_rate": 2.010170307306508e-06, "loss": 2.2371, "step": 550380 }, { "epoch": 0.96, "learning_rate": 2.0092983673796813e-06, "loss": 2.1903, "step": 550390 }, { "epoch": 0.96, "learning_rate": 2.0084264274528543e-06, "loss": 2.1325, "step": 550400 }, { "epoch": 0.96, "learning_rate": 2.0075544875260276e-06, "loss": 2.2045, "step": 550410 }, { "epoch": 0.96, "learning_rate": 2.0066825475992005e-06, "loss": 2.2285, "step": 550420 }, { "epoch": 0.96, "learning_rate": 2.005810607672374e-06, "loss": 2.2945, "step": 550430 }, { "epoch": 0.96, "learning_rate": 2.0049386677455472e-06, "loss": 2.2642, "step": 550440 }, { "epoch": 0.96, "learning_rate": 2.00406672781872e-06, "loss": 2.2451, "step": 550450 }, { "epoch": 0.96, "learning_rate": 2.0031947878918935e-06, "loss": 2.1505, "step": 550460 }, { "epoch": 0.96, "learning_rate": 2.002322847965067e-06, "loss": 2.2826, "step": 550470 }, { "epoch": 0.96, "learning_rate": 2.0014509080382398e-06, "loss": 2.1626, "step": 550480 }, { "epoch": 0.96, "learning_rate": 2.000578968111413e-06, "loss": 2.2798, "step": 550490 }, { "epoch": 0.96, "learning_rate": 1.999707028184586e-06, "loss": 2.2426, "step": 550500 }, { "epoch": 0.96, "learning_rate": 1.9988350882577594e-06, "loss": 2.2846, "step": 550510 }, { "epoch": 0.96, "learning_rate": 1.9979631483309327e-06, "loss": 2.2586, "step": 550520 }, { "epoch": 0.96, "learning_rate": 1.997091208404106e-06, "loss": 2.2094, "step": 550530 }, { "epoch": 0.96, "learning_rate": 1.996219268477279e-06, "loss": 2.1888, "step": 550540 }, { "epoch": 0.96, "learning_rate": 1.9953473285504523e-06, "loss": 2.1734, "step": 550550 }, { "epoch": 0.96, "learning_rate": 1.9944753886236253e-06, "loss": 2.3198, "step": 550560 }, { "epoch": 0.96, "learning_rate": 1.9936034486967986e-06, "loss": 2.1513, "step": 550570 }, { "epoch": 0.96, "learning_rate": 1.992731508769972e-06, "loss": 2.2692, "step": 550580 }, { "epoch": 0.96, "learning_rate": 1.9918595688431453e-06, "loss": 2.2369, "step": 550590 }, { "epoch": 0.96, "learning_rate": 1.9909876289163182e-06, "loss": 2.2818, "step": 550600 }, { "epoch": 0.96, "learning_rate": 1.9901156889894916e-06, "loss": 2.2742, "step": 550610 }, { "epoch": 0.96, "learning_rate": 1.9892437490626645e-06, "loss": 2.1107, "step": 550620 }, { "epoch": 0.96, "learning_rate": 1.988371809135838e-06, "loss": 2.2136, "step": 550630 }, { "epoch": 0.96, "learning_rate": 1.987499869209011e-06, "loss": 2.2626, "step": 550640 }, { "epoch": 0.96, "learning_rate": 1.986627929282184e-06, "loss": 2.1764, "step": 550650 }, { "epoch": 0.96, "learning_rate": 1.9857559893553574e-06, "loss": 2.1722, "step": 550660 }, { "epoch": 0.96, "learning_rate": 1.984884049428531e-06, "loss": 2.3007, "step": 550670 }, { "epoch": 0.96, "learning_rate": 1.9840121095017037e-06, "loss": 2.3462, "step": 550680 }, { "epoch": 0.96, "learning_rate": 1.983140169574877e-06, "loss": 2.3655, "step": 550690 }, { "epoch": 0.96, "learning_rate": 1.9822682296480504e-06, "loss": 2.288, "step": 550700 }, { "epoch": 0.96, "learning_rate": 1.9813962897212233e-06, "loss": 2.3511, "step": 550710 }, { "epoch": 0.96, "learning_rate": 1.9805243497943967e-06, "loss": 2.1934, "step": 550720 }, { "epoch": 0.96, "learning_rate": 1.97965240986757e-06, "loss": 2.2678, "step": 550730 }, { "epoch": 0.96, "learning_rate": 1.978780469940743e-06, "loss": 2.3617, "step": 550740 }, { "epoch": 0.96, "learning_rate": 1.9779085300139163e-06, "loss": 2.3644, "step": 550750 }, { "epoch": 0.96, "learning_rate": 1.9770365900870892e-06, "loss": 2.1546, "step": 550760 }, { "epoch": 0.96, "learning_rate": 1.9761646501602626e-06, "loss": 2.3161, "step": 550770 }, { "epoch": 0.96, "learning_rate": 1.975292710233436e-06, "loss": 2.3406, "step": 550780 }, { "epoch": 0.96, "learning_rate": 1.9744207703066093e-06, "loss": 2.2442, "step": 550790 }, { "epoch": 0.96, "learning_rate": 1.973548830379782e-06, "loss": 2.2272, "step": 550800 }, { "epoch": 0.96, "learning_rate": 1.9726768904529555e-06, "loss": 2.2034, "step": 550810 }, { "epoch": 0.96, "learning_rate": 1.9718049505261285e-06, "loss": 2.2605, "step": 550820 }, { "epoch": 0.96, "learning_rate": 1.970933010599302e-06, "loss": 2.2596, "step": 550830 }, { "epoch": 0.96, "learning_rate": 1.970061070672475e-06, "loss": 2.3294, "step": 550840 }, { "epoch": 0.96, "learning_rate": 1.969189130745648e-06, "loss": 2.1313, "step": 550850 }, { "epoch": 0.96, "learning_rate": 1.9683171908188214e-06, "loss": 2.2056, "step": 550860 }, { "epoch": 0.96, "learning_rate": 1.9674452508919948e-06, "loss": 2.3046, "step": 550870 }, { "epoch": 0.96, "learning_rate": 1.9665733109651677e-06, "loss": 2.3104, "step": 550880 }, { "epoch": 0.96, "learning_rate": 1.965701371038341e-06, "loss": 2.1023, "step": 550890 }, { "epoch": 0.96, "learning_rate": 1.9648294311115144e-06, "loss": 2.2828, "step": 550900 }, { "epoch": 0.96, "learning_rate": 1.9639574911846873e-06, "loss": 2.3221, "step": 550910 }, { "epoch": 0.96, "learning_rate": 1.9630855512578606e-06, "loss": 2.1929, "step": 550920 }, { "epoch": 0.96, "learning_rate": 1.962213611331034e-06, "loss": 2.189, "step": 550930 }, { "epoch": 0.96, "learning_rate": 1.961341671404207e-06, "loss": 2.2766, "step": 550940 }, { "epoch": 0.96, "learning_rate": 1.9604697314773803e-06, "loss": 2.124, "step": 550950 }, { "epoch": 0.96, "learning_rate": 1.9595977915505536e-06, "loss": 2.2524, "step": 550960 }, { "epoch": 0.96, "learning_rate": 1.9587258516237265e-06, "loss": 2.2324, "step": 550970 }, { "epoch": 0.96, "learning_rate": 1.9578539116969e-06, "loss": 2.3051, "step": 550980 }, { "epoch": 0.96, "learning_rate": 1.9569819717700732e-06, "loss": 2.3175, "step": 550990 }, { "epoch": 0.96, "learning_rate": 1.956110031843246e-06, "loss": 2.2662, "step": 551000 }, { "epoch": 0.96, "learning_rate": 1.9552380919164195e-06, "loss": 2.3021, "step": 551010 }, { "epoch": 0.96, "learning_rate": 1.9543661519895924e-06, "loss": 2.2099, "step": 551020 }, { "epoch": 0.96, "learning_rate": 1.9534942120627658e-06, "loss": 2.1783, "step": 551030 }, { "epoch": 0.96, "learning_rate": 1.952622272135939e-06, "loss": 2.2927, "step": 551040 }, { "epoch": 0.96, "learning_rate": 1.951750332209112e-06, "loss": 2.3145, "step": 551050 }, { "epoch": 0.96, "learning_rate": 1.9508783922822854e-06, "loss": 2.3566, "step": 551060 }, { "epoch": 0.96, "learning_rate": 1.9500064523554587e-06, "loss": 2.2983, "step": 551070 }, { "epoch": 0.96, "learning_rate": 1.9491345124286316e-06, "loss": 2.2202, "step": 551080 }, { "epoch": 0.96, "learning_rate": 1.948262572501805e-06, "loss": 2.1849, "step": 551090 }, { "epoch": 0.96, "learning_rate": 1.9473906325749783e-06, "loss": 2.2116, "step": 551100 }, { "epoch": 0.96, "learning_rate": 1.9465186926481513e-06, "loss": 2.2921, "step": 551110 }, { "epoch": 0.96, "learning_rate": 1.9456467527213246e-06, "loss": 2.4628, "step": 551120 }, { "epoch": 0.96, "learning_rate": 1.944774812794498e-06, "loss": 2.2863, "step": 551130 }, { "epoch": 0.96, "learning_rate": 1.943902872867671e-06, "loss": 2.1973, "step": 551140 }, { "epoch": 0.96, "learning_rate": 1.9430309329408442e-06, "loss": 2.3097, "step": 551150 }, { "epoch": 0.96, "learning_rate": 1.9421589930140176e-06, "loss": 2.3081, "step": 551160 }, { "epoch": 0.96, "learning_rate": 1.9412870530871905e-06, "loss": 2.241, "step": 551170 }, { "epoch": 0.96, "learning_rate": 1.940415113160364e-06, "loss": 2.1982, "step": 551180 }, { "epoch": 0.96, "learning_rate": 1.939543173233537e-06, "loss": 2.2838, "step": 551190 }, { "epoch": 0.96, "learning_rate": 1.93867123330671e-06, "loss": 2.3082, "step": 551200 }, { "epoch": 0.96, "learning_rate": 1.9377992933798835e-06, "loss": 2.2891, "step": 551210 }, { "epoch": 0.96, "learning_rate": 1.936927353453057e-06, "loss": 2.1735, "step": 551220 }, { "epoch": 0.96, "learning_rate": 1.9360554135262297e-06, "loss": 2.2645, "step": 551230 }, { "epoch": 0.96, "learning_rate": 1.935183473599403e-06, "loss": 2.269, "step": 551240 }, { "epoch": 0.96, "learning_rate": 1.934311533672576e-06, "loss": 2.2991, "step": 551250 }, { "epoch": 0.96, "learning_rate": 1.9334395937457493e-06, "loss": 2.2868, "step": 551260 }, { "epoch": 0.96, "learning_rate": 1.9325676538189227e-06, "loss": 2.3244, "step": 551270 }, { "epoch": 0.96, "learning_rate": 1.9316957138920956e-06, "loss": 2.2505, "step": 551280 }, { "epoch": 0.96, "learning_rate": 1.930823773965269e-06, "loss": 2.2732, "step": 551290 }, { "epoch": 0.96, "learning_rate": 1.9299518340384423e-06, "loss": 2.1887, "step": 551300 }, { "epoch": 0.96, "learning_rate": 1.9290798941116152e-06, "loss": 2.2848, "step": 551310 }, { "epoch": 0.96, "learning_rate": 1.9282079541847886e-06, "loss": 2.2294, "step": 551320 }, { "epoch": 0.96, "learning_rate": 1.927336014257962e-06, "loss": 2.1747, "step": 551330 }, { "epoch": 0.96, "learning_rate": 1.926464074331135e-06, "loss": 2.33, "step": 551340 }, { "epoch": 0.96, "learning_rate": 1.925592134404308e-06, "loss": 2.1724, "step": 551350 }, { "epoch": 0.96, "learning_rate": 1.9247201944774815e-06, "loss": 2.3032, "step": 551360 }, { "epoch": 0.96, "learning_rate": 1.9238482545506545e-06, "loss": 2.235, "step": 551370 }, { "epoch": 0.96, "learning_rate": 1.922976314623828e-06, "loss": 2.267, "step": 551380 }, { "epoch": 0.96, "learning_rate": 1.922104374697001e-06, "loss": 2.226, "step": 551390 }, { "epoch": 0.96, "learning_rate": 1.921232434770174e-06, "loss": 2.2197, "step": 551400 }, { "epoch": 0.96, "learning_rate": 1.9203604948433474e-06, "loss": 2.2292, "step": 551410 }, { "epoch": 0.96, "learning_rate": 1.9194885549165208e-06, "loss": 2.2012, "step": 551420 }, { "epoch": 0.96, "learning_rate": 1.9186166149896937e-06, "loss": 2.2295, "step": 551430 }, { "epoch": 0.96, "learning_rate": 1.917744675062867e-06, "loss": 2.3263, "step": 551440 }, { "epoch": 0.96, "learning_rate": 1.91687273513604e-06, "loss": 2.2882, "step": 551450 }, { "epoch": 0.96, "learning_rate": 1.9160007952092133e-06, "loss": 2.2617, "step": 551460 }, { "epoch": 0.96, "learning_rate": 1.9151288552823866e-06, "loss": 2.2816, "step": 551470 }, { "epoch": 0.96, "learning_rate": 1.91425691535556e-06, "loss": 2.243, "step": 551480 }, { "epoch": 0.96, "learning_rate": 1.913384975428733e-06, "loss": 2.2922, "step": 551490 }, { "epoch": 0.96, "learning_rate": 1.9125130355019063e-06, "loss": 2.1378, "step": 551500 }, { "epoch": 0.96, "learning_rate": 1.911641095575079e-06, "loss": 2.3663, "step": 551510 }, { "epoch": 0.96, "learning_rate": 1.9107691556482525e-06, "loss": 2.2003, "step": 551520 }, { "epoch": 0.96, "learning_rate": 1.909897215721426e-06, "loss": 2.1962, "step": 551530 }, { "epoch": 0.96, "learning_rate": 1.909025275794599e-06, "loss": 2.1229, "step": 551540 }, { "epoch": 0.96, "learning_rate": 1.908153335867772e-06, "loss": 2.2654, "step": 551550 }, { "epoch": 0.96, "learning_rate": 1.9072813959409453e-06, "loss": 2.2426, "step": 551560 }, { "epoch": 0.96, "learning_rate": 1.9064094560141184e-06, "loss": 2.2591, "step": 551570 }, { "epoch": 0.96, "learning_rate": 1.9055375160872916e-06, "loss": 2.2525, "step": 551580 }, { "epoch": 0.96, "learning_rate": 1.9046655761604651e-06, "loss": 2.3497, "step": 551590 }, { "epoch": 0.96, "learning_rate": 1.9037936362336382e-06, "loss": 2.2373, "step": 551600 }, { "epoch": 0.96, "learning_rate": 1.9029216963068114e-06, "loss": 2.094, "step": 551610 }, { "epoch": 0.96, "learning_rate": 1.9020497563799845e-06, "loss": 2.1656, "step": 551620 }, { "epoch": 0.96, "learning_rate": 1.9011778164531577e-06, "loss": 2.267, "step": 551630 }, { "epoch": 0.96, "learning_rate": 1.9003058765263308e-06, "loss": 2.2511, "step": 551640 }, { "epoch": 0.96, "learning_rate": 1.899433936599504e-06, "loss": 2.3047, "step": 551650 }, { "epoch": 0.96, "learning_rate": 1.8985619966726775e-06, "loss": 2.2751, "step": 551660 }, { "epoch": 0.96, "learning_rate": 1.8976900567458506e-06, "loss": 2.2888, "step": 551670 }, { "epoch": 0.96, "learning_rate": 1.8968181168190237e-06, "loss": 2.3028, "step": 551680 }, { "epoch": 0.96, "learning_rate": 1.8959461768921969e-06, "loss": 2.3219, "step": 551690 }, { "epoch": 0.96, "learning_rate": 1.89507423696537e-06, "loss": 2.3045, "step": 551700 }, { "epoch": 0.96, "learning_rate": 1.8942022970385432e-06, "loss": 2.2194, "step": 551710 }, { "epoch": 0.96, "learning_rate": 1.8933303571117167e-06, "loss": 2.2948, "step": 551720 }, { "epoch": 0.96, "learning_rate": 1.8924584171848898e-06, "loss": 2.2159, "step": 551730 }, { "epoch": 0.96, "learning_rate": 1.891586477258063e-06, "loss": 2.2528, "step": 551740 }, { "epoch": 0.96, "learning_rate": 1.8907145373312361e-06, "loss": 2.3496, "step": 551750 }, { "epoch": 0.96, "learning_rate": 1.8898425974044092e-06, "loss": 2.2518, "step": 551760 }, { "epoch": 0.96, "learning_rate": 1.8889706574775824e-06, "loss": 2.1767, "step": 551770 }, { "epoch": 0.96, "learning_rate": 1.8880987175507555e-06, "loss": 2.2376, "step": 551780 }, { "epoch": 0.96, "learning_rate": 1.887226777623929e-06, "loss": 2.2406, "step": 551790 }, { "epoch": 0.96, "learning_rate": 1.8863548376971022e-06, "loss": 2.3826, "step": 551800 }, { "epoch": 0.96, "learning_rate": 1.8854828977702753e-06, "loss": 2.1954, "step": 551810 }, { "epoch": 0.96, "learning_rate": 1.8846109578434485e-06, "loss": 2.3046, "step": 551820 }, { "epoch": 0.96, "learning_rate": 1.8837390179166216e-06, "loss": 2.2776, "step": 551830 }, { "epoch": 0.96, "learning_rate": 1.8828670779897947e-06, "loss": 2.3111, "step": 551840 }, { "epoch": 0.96, "learning_rate": 1.8819951380629679e-06, "loss": 2.2894, "step": 551850 }, { "epoch": 0.96, "learning_rate": 1.8811231981361414e-06, "loss": 2.2037, "step": 551860 }, { "epoch": 0.96, "learning_rate": 1.8802512582093146e-06, "loss": 2.2353, "step": 551870 }, { "epoch": 0.96, "learning_rate": 1.8793793182824877e-06, "loss": 2.2409, "step": 551880 }, { "epoch": 0.96, "learning_rate": 1.8785073783556608e-06, "loss": 2.2054, "step": 551890 }, { "epoch": 0.96, "learning_rate": 1.877635438428834e-06, "loss": 2.2473, "step": 551900 }, { "epoch": 0.96, "learning_rate": 1.8767634985020071e-06, "loss": 2.3203, "step": 551910 }, { "epoch": 0.96, "learning_rate": 1.8758915585751807e-06, "loss": 2.2967, "step": 551920 }, { "epoch": 0.96, "learning_rate": 1.8750196186483538e-06, "loss": 2.2635, "step": 551930 }, { "epoch": 0.96, "learning_rate": 1.874147678721527e-06, "loss": 2.2932, "step": 551940 }, { "epoch": 0.96, "learning_rate": 1.8732757387947e-06, "loss": 2.2163, "step": 551950 }, { "epoch": 0.96, "learning_rate": 1.8724037988678732e-06, "loss": 2.2227, "step": 551960 }, { "epoch": 0.96, "learning_rate": 1.8715318589410463e-06, "loss": 2.274, "step": 551970 }, { "epoch": 0.96, "learning_rate": 1.8706599190142195e-06, "loss": 2.3497, "step": 551980 }, { "epoch": 0.96, "learning_rate": 1.869787979087393e-06, "loss": 2.3136, "step": 551990 }, { "epoch": 0.96, "learning_rate": 1.8689160391605662e-06, "loss": 2.2337, "step": 552000 }, { "epoch": 0.96, "learning_rate": 1.8680440992337393e-06, "loss": 2.194, "step": 552010 }, { "epoch": 0.96, "learning_rate": 1.8671721593069124e-06, "loss": 2.4179, "step": 552020 }, { "epoch": 0.96, "learning_rate": 1.8663002193800856e-06, "loss": 2.2832, "step": 552030 }, { "epoch": 0.96, "learning_rate": 1.8654282794532587e-06, "loss": 2.2109, "step": 552040 }, { "epoch": 0.96, "learning_rate": 1.8645563395264318e-06, "loss": 2.3328, "step": 552050 }, { "epoch": 0.96, "learning_rate": 1.8636843995996054e-06, "loss": 2.1954, "step": 552060 }, { "epoch": 0.96, "learning_rate": 1.8628124596727785e-06, "loss": 2.1698, "step": 552070 }, { "epoch": 0.96, "learning_rate": 1.8619405197459517e-06, "loss": 2.2372, "step": 552080 }, { "epoch": 0.96, "learning_rate": 1.8610685798191248e-06, "loss": 2.1831, "step": 552090 }, { "epoch": 0.96, "learning_rate": 1.860196639892298e-06, "loss": 2.3198, "step": 552100 }, { "epoch": 0.96, "learning_rate": 1.859324699965471e-06, "loss": 2.1868, "step": 552110 }, { "epoch": 0.96, "learning_rate": 1.8584527600386446e-06, "loss": 2.2697, "step": 552120 }, { "epoch": 0.96, "learning_rate": 1.8575808201118178e-06, "loss": 2.1802, "step": 552130 }, { "epoch": 0.96, "learning_rate": 1.856708880184991e-06, "loss": 2.2026, "step": 552140 }, { "epoch": 0.96, "learning_rate": 1.855836940258164e-06, "loss": 2.2473, "step": 552150 }, { "epoch": 0.96, "learning_rate": 1.8549650003313372e-06, "loss": 2.3191, "step": 552160 }, { "epoch": 0.96, "learning_rate": 1.8540930604045103e-06, "loss": 2.4016, "step": 552170 }, { "epoch": 0.96, "learning_rate": 1.8532211204776834e-06, "loss": 2.2182, "step": 552180 }, { "epoch": 0.96, "learning_rate": 1.852349180550857e-06, "loss": 2.2538, "step": 552190 }, { "epoch": 0.96, "learning_rate": 1.8514772406240301e-06, "loss": 2.2405, "step": 552200 }, { "epoch": 0.96, "learning_rate": 1.8506053006972033e-06, "loss": 2.2943, "step": 552210 }, { "epoch": 0.96, "learning_rate": 1.8497333607703764e-06, "loss": 2.1779, "step": 552220 }, { "epoch": 0.96, "learning_rate": 1.8488614208435495e-06, "loss": 2.3304, "step": 552230 }, { "epoch": 0.96, "learning_rate": 1.8479894809167227e-06, "loss": 2.3454, "step": 552240 }, { "epoch": 0.96, "learning_rate": 1.8471175409898958e-06, "loss": 2.1409, "step": 552250 }, { "epoch": 0.96, "learning_rate": 1.8462456010630694e-06, "loss": 2.2056, "step": 552260 }, { "epoch": 0.96, "learning_rate": 1.8453736611362425e-06, "loss": 2.2273, "step": 552270 }, { "epoch": 0.96, "learning_rate": 1.8445017212094156e-06, "loss": 2.2739, "step": 552280 }, { "epoch": 0.96, "learning_rate": 1.8436297812825888e-06, "loss": 2.3057, "step": 552290 }, { "epoch": 0.96, "learning_rate": 1.842757841355762e-06, "loss": 2.2, "step": 552300 }, { "epoch": 0.96, "learning_rate": 1.841885901428935e-06, "loss": 2.2718, "step": 552310 }, { "epoch": 0.96, "learning_rate": 1.8410139615021086e-06, "loss": 2.1524, "step": 552320 }, { "epoch": 0.96, "learning_rate": 1.8401420215752817e-06, "loss": 2.3101, "step": 552330 }, { "epoch": 0.96, "learning_rate": 1.8392700816484549e-06, "loss": 2.1887, "step": 552340 }, { "epoch": 0.96, "learning_rate": 1.838398141721628e-06, "loss": 2.3018, "step": 552350 }, { "epoch": 0.96, "learning_rate": 1.8375262017948011e-06, "loss": 2.2816, "step": 552360 }, { "epoch": 0.96, "learning_rate": 1.8366542618679743e-06, "loss": 2.2158, "step": 552370 }, { "epoch": 0.96, "learning_rate": 1.8357823219411474e-06, "loss": 2.2361, "step": 552380 }, { "epoch": 0.96, "learning_rate": 1.834910382014321e-06, "loss": 2.2731, "step": 552390 }, { "epoch": 0.96, "learning_rate": 1.834038442087494e-06, "loss": 2.2669, "step": 552400 }, { "epoch": 0.96, "learning_rate": 1.8331665021606672e-06, "loss": 2.3504, "step": 552410 }, { "epoch": 0.96, "learning_rate": 1.8322945622338404e-06, "loss": 2.2293, "step": 552420 }, { "epoch": 0.96, "learning_rate": 1.8314226223070135e-06, "loss": 2.2698, "step": 552430 }, { "epoch": 0.96, "learning_rate": 1.8305506823801866e-06, "loss": 2.2858, "step": 552440 }, { "epoch": 0.96, "learning_rate": 1.8296787424533598e-06, "loss": 2.2318, "step": 552450 }, { "epoch": 0.96, "learning_rate": 1.8288068025265333e-06, "loss": 2.3177, "step": 552460 }, { "epoch": 0.96, "learning_rate": 1.8279348625997065e-06, "loss": 2.2286, "step": 552470 }, { "epoch": 0.96, "learning_rate": 1.8270629226728796e-06, "loss": 2.2512, "step": 552480 }, { "epoch": 0.96, "learning_rate": 1.8261909827460527e-06, "loss": 2.3272, "step": 552490 }, { "epoch": 0.96, "learning_rate": 1.8253190428192259e-06, "loss": 2.2255, "step": 552500 }, { "epoch": 0.96, "learning_rate": 1.824447102892399e-06, "loss": 2.1682, "step": 552510 }, { "epoch": 0.96, "learning_rate": 1.8235751629655726e-06, "loss": 2.2626, "step": 552520 }, { "epoch": 0.96, "learning_rate": 1.8227032230387457e-06, "loss": 2.1825, "step": 552530 }, { "epoch": 0.96, "learning_rate": 1.8218312831119188e-06, "loss": 2.3173, "step": 552540 }, { "epoch": 0.96, "learning_rate": 1.820959343185092e-06, "loss": 2.2592, "step": 552550 }, { "epoch": 0.96, "learning_rate": 1.820087403258265e-06, "loss": 2.3082, "step": 552560 }, { "epoch": 0.96, "learning_rate": 1.8192154633314382e-06, "loss": 2.2512, "step": 552570 }, { "epoch": 0.96, "learning_rate": 1.8183435234046114e-06, "loss": 2.2687, "step": 552580 }, { "epoch": 0.96, "learning_rate": 1.817471583477785e-06, "loss": 2.2291, "step": 552590 }, { "epoch": 0.96, "learning_rate": 1.816599643550958e-06, "loss": 2.2665, "step": 552600 }, { "epoch": 0.96, "learning_rate": 1.8157277036241312e-06, "loss": 2.3579, "step": 552610 }, { "epoch": 0.96, "learning_rate": 1.8148557636973043e-06, "loss": 2.2447, "step": 552620 }, { "epoch": 0.96, "learning_rate": 1.8139838237704775e-06, "loss": 2.2538, "step": 552630 }, { "epoch": 0.96, "learning_rate": 1.8131118838436506e-06, "loss": 2.157, "step": 552640 }, { "epoch": 0.96, "learning_rate": 1.8122399439168237e-06, "loss": 2.3167, "step": 552650 }, { "epoch": 0.96, "learning_rate": 1.8113680039899973e-06, "loss": 2.427, "step": 552660 }, { "epoch": 0.96, "learning_rate": 1.8104960640631704e-06, "loss": 2.281, "step": 552670 }, { "epoch": 0.96, "learning_rate": 1.8096241241363436e-06, "loss": 2.2491, "step": 552680 }, { "epoch": 0.96, "learning_rate": 1.8087521842095167e-06, "loss": 2.2694, "step": 552690 }, { "epoch": 0.96, "learning_rate": 1.8078802442826898e-06, "loss": 2.275, "step": 552700 }, { "epoch": 0.96, "learning_rate": 1.807008304355863e-06, "loss": 2.3274, "step": 552710 }, { "epoch": 0.96, "learning_rate": 1.8061363644290365e-06, "loss": 2.3189, "step": 552720 }, { "epoch": 0.96, "learning_rate": 1.8052644245022097e-06, "loss": 2.2287, "step": 552730 }, { "epoch": 0.96, "learning_rate": 1.8043924845753828e-06, "loss": 2.2174, "step": 552740 }, { "epoch": 0.96, "learning_rate": 1.803520544648556e-06, "loss": 2.2923, "step": 552750 }, { "epoch": 0.96, "learning_rate": 1.802648604721729e-06, "loss": 2.2849, "step": 552760 }, { "epoch": 0.96, "learning_rate": 1.8017766647949022e-06, "loss": 2.2156, "step": 552770 }, { "epoch": 0.96, "learning_rate": 1.8009047248680753e-06, "loss": 2.1536, "step": 552780 }, { "epoch": 0.96, "learning_rate": 1.8000327849412489e-06, "loss": 2.2014, "step": 552790 }, { "epoch": 0.96, "learning_rate": 1.799160845014422e-06, "loss": 2.2737, "step": 552800 }, { "epoch": 0.96, "learning_rate": 1.7982889050875952e-06, "loss": 2.3023, "step": 552810 }, { "epoch": 0.96, "learning_rate": 1.7974169651607683e-06, "loss": 2.2478, "step": 552820 }, { "epoch": 0.96, "learning_rate": 1.7965450252339414e-06, "loss": 2.3029, "step": 552830 }, { "epoch": 0.96, "learning_rate": 1.7956730853071146e-06, "loss": 2.3484, "step": 552840 }, { "epoch": 0.96, "learning_rate": 1.7948011453802881e-06, "loss": 2.3055, "step": 552850 }, { "epoch": 0.96, "learning_rate": 1.7939292054534613e-06, "loss": 2.2635, "step": 552860 }, { "epoch": 0.96, "learning_rate": 1.7930572655266344e-06, "loss": 2.3619, "step": 552870 }, { "epoch": 0.96, "learning_rate": 1.7921853255998075e-06, "loss": 2.1922, "step": 552880 }, { "epoch": 0.96, "learning_rate": 1.7913133856729807e-06, "loss": 2.2854, "step": 552890 }, { "epoch": 0.96, "learning_rate": 1.7904414457461538e-06, "loss": 2.2297, "step": 552900 }, { "epoch": 0.96, "learning_rate": 1.789569505819327e-06, "loss": 2.3282, "step": 552910 }, { "epoch": 0.96, "learning_rate": 1.7886975658925005e-06, "loss": 2.3598, "step": 552920 }, { "epoch": 0.96, "learning_rate": 1.7878256259656736e-06, "loss": 2.3253, "step": 552930 }, { "epoch": 0.96, "learning_rate": 1.7869536860388468e-06, "loss": 2.2163, "step": 552940 }, { "epoch": 0.96, "learning_rate": 1.7860817461120199e-06, "loss": 2.3038, "step": 552950 }, { "epoch": 0.96, "learning_rate": 1.785209806185193e-06, "loss": 2.1539, "step": 552960 }, { "epoch": 0.96, "learning_rate": 1.7843378662583662e-06, "loss": 2.3165, "step": 552970 }, { "epoch": 0.96, "learning_rate": 1.7834659263315393e-06, "loss": 2.2569, "step": 552980 }, { "epoch": 0.96, "learning_rate": 1.7825939864047129e-06, "loss": 2.175, "step": 552990 }, { "epoch": 0.96, "learning_rate": 1.781722046477886e-06, "loss": 2.325, "step": 553000 }, { "epoch": 0.96, "learning_rate": 1.7808501065510591e-06, "loss": 2.2807, "step": 553010 }, { "epoch": 0.96, "learning_rate": 1.7799781666242323e-06, "loss": 2.32, "step": 553020 }, { "epoch": 0.96, "learning_rate": 1.7791062266974054e-06, "loss": 2.2674, "step": 553030 }, { "epoch": 0.96, "learning_rate": 1.7782342867705785e-06, "loss": 2.3068, "step": 553040 }, { "epoch": 0.96, "learning_rate": 1.777362346843752e-06, "loss": 2.2626, "step": 553050 }, { "epoch": 0.96, "learning_rate": 1.7764904069169252e-06, "loss": 2.2435, "step": 553060 }, { "epoch": 0.96, "learning_rate": 1.7756184669900984e-06, "loss": 2.2644, "step": 553070 }, { "epoch": 0.96, "learning_rate": 1.7747465270632715e-06, "loss": 2.267, "step": 553080 }, { "epoch": 0.96, "learning_rate": 1.7738745871364446e-06, "loss": 2.3047, "step": 553090 }, { "epoch": 0.96, "learning_rate": 1.7730026472096178e-06, "loss": 2.2573, "step": 553100 }, { "epoch": 0.96, "learning_rate": 1.7721307072827909e-06, "loss": 2.1954, "step": 553110 }, { "epoch": 0.96, "learning_rate": 1.7712587673559645e-06, "loss": 2.1124, "step": 553120 }, { "epoch": 0.96, "learning_rate": 1.7703868274291376e-06, "loss": 2.291, "step": 553130 }, { "epoch": 0.96, "learning_rate": 1.7695148875023107e-06, "loss": 2.323, "step": 553140 }, { "epoch": 0.96, "learning_rate": 1.7686429475754839e-06, "loss": 2.1658, "step": 553150 }, { "epoch": 0.96, "learning_rate": 1.767771007648657e-06, "loss": 2.1501, "step": 553160 }, { "epoch": 0.96, "learning_rate": 1.7668990677218301e-06, "loss": 2.241, "step": 553170 }, { "epoch": 0.96, "learning_rate": 1.7660271277950033e-06, "loss": 2.2042, "step": 553180 }, { "epoch": 0.96, "learning_rate": 1.7651551878681768e-06, "loss": 2.2815, "step": 553190 }, { "epoch": 0.96, "learning_rate": 1.76428324794135e-06, "loss": 2.2974, "step": 553200 }, { "epoch": 0.96, "learning_rate": 1.763411308014523e-06, "loss": 2.259, "step": 553210 }, { "epoch": 0.96, "learning_rate": 1.7625393680876962e-06, "loss": 2.2552, "step": 553220 }, { "epoch": 0.96, "learning_rate": 1.7616674281608694e-06, "loss": 2.1913, "step": 553230 }, { "epoch": 0.96, "learning_rate": 1.7607954882340425e-06, "loss": 2.211, "step": 553240 }, { "epoch": 0.96, "learning_rate": 1.759923548307216e-06, "loss": 2.1047, "step": 553250 }, { "epoch": 0.96, "learning_rate": 1.7590516083803892e-06, "loss": 2.2718, "step": 553260 }, { "epoch": 0.96, "learning_rate": 1.7581796684535623e-06, "loss": 2.3275, "step": 553270 }, { "epoch": 0.96, "learning_rate": 1.7573077285267355e-06, "loss": 2.3052, "step": 553280 }, { "epoch": 0.96, "learning_rate": 1.7564357885999086e-06, "loss": 2.3094, "step": 553290 }, { "epoch": 0.96, "learning_rate": 1.7555638486730817e-06, "loss": 2.3273, "step": 553300 }, { "epoch": 0.96, "learning_rate": 1.7546919087462549e-06, "loss": 2.3653, "step": 553310 }, { "epoch": 0.96, "learning_rate": 1.7538199688194284e-06, "loss": 2.2131, "step": 553320 }, { "epoch": 0.96, "learning_rate": 1.7529480288926015e-06, "loss": 2.1681, "step": 553330 }, { "epoch": 0.96, "learning_rate": 1.7520760889657747e-06, "loss": 2.131, "step": 553340 }, { "epoch": 0.96, "learning_rate": 1.7512041490389478e-06, "loss": 2.3241, "step": 553350 }, { "epoch": 0.96, "learning_rate": 1.750332209112121e-06, "loss": 2.3555, "step": 553360 }, { "epoch": 0.97, "learning_rate": 1.749460269185294e-06, "loss": 2.3085, "step": 553370 }, { "epoch": 0.97, "learning_rate": 1.7485883292584672e-06, "loss": 2.2096, "step": 553380 }, { "epoch": 0.97, "learning_rate": 1.7477163893316408e-06, "loss": 2.1571, "step": 553390 }, { "epoch": 0.97, "learning_rate": 1.746844449404814e-06, "loss": 2.3937, "step": 553400 }, { "epoch": 0.97, "learning_rate": 1.745972509477987e-06, "loss": 2.252, "step": 553410 }, { "epoch": 0.97, "learning_rate": 1.7451005695511602e-06, "loss": 2.2851, "step": 553420 }, { "epoch": 0.97, "learning_rate": 1.7442286296243333e-06, "loss": 2.3478, "step": 553430 }, { "epoch": 0.97, "learning_rate": 1.7433566896975065e-06, "loss": 2.1997, "step": 553440 }, { "epoch": 0.97, "learning_rate": 1.74248474977068e-06, "loss": 2.2476, "step": 553450 }, { "epoch": 0.97, "learning_rate": 1.7416128098438531e-06, "loss": 2.3198, "step": 553460 }, { "epoch": 0.97, "learning_rate": 1.7407408699170263e-06, "loss": 2.1941, "step": 553470 }, { "epoch": 0.97, "learning_rate": 1.7398689299901994e-06, "loss": 2.1799, "step": 553480 }, { "epoch": 0.97, "learning_rate": 1.7389969900633726e-06, "loss": 2.1985, "step": 553490 }, { "epoch": 0.97, "learning_rate": 1.7381250501365457e-06, "loss": 2.1746, "step": 553500 }, { "epoch": 0.97, "learning_rate": 1.7372531102097188e-06, "loss": 2.2752, "step": 553510 }, { "epoch": 0.97, "learning_rate": 1.7363811702828924e-06, "loss": 2.3473, "step": 553520 }, { "epoch": 0.97, "learning_rate": 1.7355092303560655e-06, "loss": 2.3697, "step": 553530 }, { "epoch": 0.97, "learning_rate": 1.7346372904292386e-06, "loss": 2.3522, "step": 553540 }, { "epoch": 0.97, "learning_rate": 1.7337653505024118e-06, "loss": 2.2706, "step": 553550 }, { "epoch": 0.97, "learning_rate": 1.732893410575585e-06, "loss": 2.1929, "step": 553560 }, { "epoch": 0.97, "learning_rate": 1.732021470648758e-06, "loss": 2.303, "step": 553570 }, { "epoch": 0.97, "learning_rate": 1.7311495307219314e-06, "loss": 2.1921, "step": 553580 }, { "epoch": 0.97, "learning_rate": 1.7302775907951047e-06, "loss": 2.3248, "step": 553590 }, { "epoch": 0.97, "learning_rate": 1.7294056508682779e-06, "loss": 2.2501, "step": 553600 }, { "epoch": 0.97, "learning_rate": 1.728533710941451e-06, "loss": 2.2211, "step": 553610 }, { "epoch": 0.97, "learning_rate": 1.7276617710146241e-06, "loss": 2.2948, "step": 553620 }, { "epoch": 0.97, "learning_rate": 1.7267898310877973e-06, "loss": 2.2848, "step": 553630 }, { "epoch": 0.97, "learning_rate": 1.7259178911609706e-06, "loss": 2.181, "step": 553640 }, { "epoch": 0.97, "learning_rate": 1.725045951234144e-06, "loss": 2.3184, "step": 553650 }, { "epoch": 0.97, "learning_rate": 1.7241740113073171e-06, "loss": 2.1916, "step": 553660 }, { "epoch": 0.97, "learning_rate": 1.7233020713804902e-06, "loss": 2.2737, "step": 553670 }, { "epoch": 0.97, "learning_rate": 1.7224301314536634e-06, "loss": 2.3077, "step": 553680 }, { "epoch": 0.97, "learning_rate": 1.7215581915268365e-06, "loss": 2.2741, "step": 553690 }, { "epoch": 0.97, "learning_rate": 1.7206862516000096e-06, "loss": 2.181, "step": 553700 }, { "epoch": 0.97, "learning_rate": 1.719814311673183e-06, "loss": 2.3821, "step": 553710 }, { "epoch": 0.97, "learning_rate": 1.7189423717463563e-06, "loss": 2.1242, "step": 553720 }, { "epoch": 0.97, "learning_rate": 1.7180704318195295e-06, "loss": 2.1756, "step": 553730 }, { "epoch": 0.97, "learning_rate": 1.7171984918927026e-06, "loss": 2.2809, "step": 553740 }, { "epoch": 0.97, "learning_rate": 1.7163265519658757e-06, "loss": 2.1752, "step": 553750 }, { "epoch": 0.97, "learning_rate": 1.7154546120390489e-06, "loss": 2.3747, "step": 553760 }, { "epoch": 0.97, "learning_rate": 1.7145826721122222e-06, "loss": 2.2294, "step": 553770 }, { "epoch": 0.97, "learning_rate": 1.7137107321853954e-06, "loss": 2.2404, "step": 553780 }, { "epoch": 0.97, "learning_rate": 1.7128387922585687e-06, "loss": 2.2205, "step": 553790 }, { "epoch": 0.97, "learning_rate": 1.7119668523317418e-06, "loss": 2.1693, "step": 553800 }, { "epoch": 0.97, "learning_rate": 1.711094912404915e-06, "loss": 2.2301, "step": 553810 }, { "epoch": 0.97, "learning_rate": 1.7102229724780881e-06, "loss": 2.2516, "step": 553820 }, { "epoch": 0.97, "learning_rate": 1.7093510325512612e-06, "loss": 2.2237, "step": 553830 }, { "epoch": 0.97, "learning_rate": 1.7084790926244346e-06, "loss": 2.1335, "step": 553840 }, { "epoch": 0.97, "learning_rate": 1.707607152697608e-06, "loss": 2.2342, "step": 553850 }, { "epoch": 0.97, "learning_rate": 1.706735212770781e-06, "loss": 2.2849, "step": 553860 }, { "epoch": 0.97, "learning_rate": 1.7058632728439542e-06, "loss": 2.3399, "step": 553870 }, { "epoch": 0.97, "learning_rate": 1.7049913329171273e-06, "loss": 2.2417, "step": 553880 }, { "epoch": 0.97, "learning_rate": 1.7041193929903005e-06, "loss": 2.3057, "step": 553890 }, { "epoch": 0.97, "learning_rate": 1.7032474530634738e-06, "loss": 2.4038, "step": 553900 }, { "epoch": 0.97, "learning_rate": 1.702375513136647e-06, "loss": 2.2919, "step": 553910 }, { "epoch": 0.97, "learning_rate": 1.7015035732098203e-06, "loss": 2.3155, "step": 553920 }, { "epoch": 0.97, "learning_rate": 1.7006316332829934e-06, "loss": 2.2119, "step": 553930 }, { "epoch": 0.97, "learning_rate": 1.6997596933561666e-06, "loss": 2.3619, "step": 553940 }, { "epoch": 0.97, "learning_rate": 1.6988877534293397e-06, "loss": 2.294, "step": 553950 }, { "epoch": 0.97, "learning_rate": 1.6980158135025128e-06, "loss": 2.2218, "step": 553960 }, { "epoch": 0.97, "learning_rate": 1.6971438735756862e-06, "loss": 2.3403, "step": 553970 }, { "epoch": 0.97, "learning_rate": 1.6962719336488593e-06, "loss": 2.2258, "step": 553980 }, { "epoch": 0.97, "learning_rate": 1.6953999937220327e-06, "loss": 2.2204, "step": 553990 }, { "epoch": 0.97, "learning_rate": 1.6945280537952058e-06, "loss": 2.1147, "step": 554000 }, { "epoch": 0.97, "learning_rate": 1.693656113868379e-06, "loss": 2.2985, "step": 554010 }, { "epoch": 0.97, "learning_rate": 1.692784173941552e-06, "loss": 2.252, "step": 554020 }, { "epoch": 0.97, "learning_rate": 1.6919122340147254e-06, "loss": 2.2344, "step": 554030 }, { "epoch": 0.97, "learning_rate": 1.6910402940878986e-06, "loss": 2.318, "step": 554040 }, { "epoch": 0.97, "learning_rate": 1.690168354161072e-06, "loss": 2.3401, "step": 554050 }, { "epoch": 0.97, "learning_rate": 1.689296414234245e-06, "loss": 2.2197, "step": 554060 }, { "epoch": 0.97, "learning_rate": 1.6884244743074182e-06, "loss": 2.1917, "step": 554070 }, { "epoch": 0.97, "learning_rate": 1.6875525343805913e-06, "loss": 2.2286, "step": 554080 }, { "epoch": 0.97, "learning_rate": 1.6866805944537644e-06, "loss": 2.2192, "step": 554090 }, { "epoch": 0.97, "learning_rate": 1.6858086545269378e-06, "loss": 2.1195, "step": 554100 }, { "epoch": 0.97, "learning_rate": 1.684936714600111e-06, "loss": 2.3637, "step": 554110 }, { "epoch": 0.97, "learning_rate": 1.6840647746732843e-06, "loss": 2.2766, "step": 554120 }, { "epoch": 0.97, "learning_rate": 1.6831928347464574e-06, "loss": 2.3601, "step": 554130 }, { "epoch": 0.97, "learning_rate": 1.6823208948196305e-06, "loss": 2.1361, "step": 554140 }, { "epoch": 0.97, "learning_rate": 1.6814489548928037e-06, "loss": 2.1989, "step": 554150 }, { "epoch": 0.97, "learning_rate": 1.680577014965977e-06, "loss": 2.227, "step": 554160 }, { "epoch": 0.97, "learning_rate": 1.6797050750391502e-06, "loss": 2.2987, "step": 554170 }, { "epoch": 0.97, "learning_rate": 1.6788331351123235e-06, "loss": 2.1902, "step": 554180 }, { "epoch": 0.97, "learning_rate": 1.6779611951854966e-06, "loss": 2.3424, "step": 554190 }, { "epoch": 0.97, "learning_rate": 1.6770892552586698e-06, "loss": 2.301, "step": 554200 }, { "epoch": 0.97, "learning_rate": 1.676217315331843e-06, "loss": 2.1808, "step": 554210 }, { "epoch": 0.97, "learning_rate": 1.675345375405016e-06, "loss": 2.2922, "step": 554220 }, { "epoch": 0.97, "learning_rate": 1.6744734354781894e-06, "loss": 2.3374, "step": 554230 }, { "epoch": 0.97, "learning_rate": 1.6736014955513625e-06, "loss": 2.3415, "step": 554240 }, { "epoch": 0.97, "learning_rate": 1.6727295556245359e-06, "loss": 2.2748, "step": 554250 }, { "epoch": 0.97, "learning_rate": 1.671857615697709e-06, "loss": 2.2454, "step": 554260 }, { "epoch": 0.97, "learning_rate": 1.6709856757708821e-06, "loss": 2.2884, "step": 554270 }, { "epoch": 0.97, "learning_rate": 1.6701137358440553e-06, "loss": 2.2739, "step": 554280 }, { "epoch": 0.97, "learning_rate": 1.6692417959172286e-06, "loss": 2.1906, "step": 554290 }, { "epoch": 0.97, "learning_rate": 1.6683698559904018e-06, "loss": 2.3138, "step": 554300 }, { "epoch": 0.97, "learning_rate": 1.6674979160635749e-06, "loss": 2.1153, "step": 554310 }, { "epoch": 0.97, "learning_rate": 1.6666259761367482e-06, "loss": 2.2674, "step": 554320 }, { "epoch": 0.97, "learning_rate": 1.6657540362099214e-06, "loss": 2.3433, "step": 554330 }, { "epoch": 0.97, "learning_rate": 1.6648820962830945e-06, "loss": 2.3748, "step": 554340 }, { "epoch": 0.97, "learning_rate": 1.6640101563562676e-06, "loss": 2.2691, "step": 554350 }, { "epoch": 0.97, "learning_rate": 1.663138216429441e-06, "loss": 2.2277, "step": 554360 }, { "epoch": 0.97, "learning_rate": 1.6622662765026141e-06, "loss": 2.3055, "step": 554370 }, { "epoch": 0.97, "learning_rate": 1.6613943365757875e-06, "loss": 2.2573, "step": 554380 }, { "epoch": 0.97, "learning_rate": 1.6605223966489606e-06, "loss": 2.244, "step": 554390 }, { "epoch": 0.97, "learning_rate": 1.6596504567221337e-06, "loss": 2.273, "step": 554400 }, { "epoch": 0.97, "learning_rate": 1.6587785167953069e-06, "loss": 2.2629, "step": 554410 }, { "epoch": 0.97, "learning_rate": 1.6579065768684802e-06, "loss": 2.2635, "step": 554420 }, { "epoch": 0.97, "learning_rate": 1.6570346369416533e-06, "loss": 2.243, "step": 554430 }, { "epoch": 0.97, "learning_rate": 1.6561626970148265e-06, "loss": 2.2626, "step": 554440 }, { "epoch": 0.97, "learning_rate": 1.6552907570879998e-06, "loss": 2.2504, "step": 554450 }, { "epoch": 0.97, "learning_rate": 1.654418817161173e-06, "loss": 2.254, "step": 554460 }, { "epoch": 0.97, "learning_rate": 1.653546877234346e-06, "loss": 2.2493, "step": 554470 }, { "epoch": 0.97, "learning_rate": 1.6526749373075192e-06, "loss": 2.2131, "step": 554480 }, { "epoch": 0.97, "learning_rate": 1.6518029973806926e-06, "loss": 2.2277, "step": 554490 }, { "epoch": 0.97, "learning_rate": 1.6509310574538657e-06, "loss": 2.1969, "step": 554500 }, { "epoch": 0.97, "learning_rate": 1.6500591175270388e-06, "loss": 2.2662, "step": 554510 }, { "epoch": 0.97, "learning_rate": 1.6491871776002122e-06, "loss": 2.2429, "step": 554520 }, { "epoch": 0.97, "learning_rate": 1.6483152376733853e-06, "loss": 2.2458, "step": 554530 }, { "epoch": 0.97, "learning_rate": 1.6474432977465585e-06, "loss": 2.264, "step": 554540 }, { "epoch": 0.97, "learning_rate": 1.6465713578197318e-06, "loss": 2.2421, "step": 554550 }, { "epoch": 0.97, "learning_rate": 1.645699417892905e-06, "loss": 2.229, "step": 554560 }, { "epoch": 0.97, "learning_rate": 1.644827477966078e-06, "loss": 2.259, "step": 554570 }, { "epoch": 0.97, "learning_rate": 1.6439555380392514e-06, "loss": 2.3506, "step": 554580 }, { "epoch": 0.97, "learning_rate": 1.6430835981124246e-06, "loss": 2.12, "step": 554590 }, { "epoch": 0.97, "learning_rate": 1.6422116581855977e-06, "loss": 2.1462, "step": 554600 }, { "epoch": 0.97, "learning_rate": 1.6413397182587708e-06, "loss": 2.2328, "step": 554610 }, { "epoch": 0.97, "learning_rate": 1.6404677783319442e-06, "loss": 2.2884, "step": 554620 }, { "epoch": 0.97, "learning_rate": 1.6395958384051173e-06, "loss": 2.3023, "step": 554630 }, { "epoch": 0.97, "learning_rate": 1.6387238984782904e-06, "loss": 2.2997, "step": 554640 }, { "epoch": 0.97, "learning_rate": 1.6378519585514638e-06, "loss": 2.2715, "step": 554650 }, { "epoch": 0.97, "learning_rate": 1.636980018624637e-06, "loss": 2.212, "step": 554660 }, { "epoch": 0.97, "learning_rate": 1.63610807869781e-06, "loss": 2.2865, "step": 554670 }, { "epoch": 0.97, "learning_rate": 1.6352361387709834e-06, "loss": 2.2824, "step": 554680 }, { "epoch": 0.97, "learning_rate": 1.6343641988441565e-06, "loss": 2.2597, "step": 554690 }, { "epoch": 0.97, "learning_rate": 1.6334922589173297e-06, "loss": 2.225, "step": 554700 }, { "epoch": 0.97, "learning_rate": 1.6326203189905028e-06, "loss": 2.2208, "step": 554710 }, { "epoch": 0.97, "learning_rate": 1.6317483790636762e-06, "loss": 2.251, "step": 554720 }, { "epoch": 0.97, "learning_rate": 1.6308764391368493e-06, "loss": 2.316, "step": 554730 }, { "epoch": 0.97, "learning_rate": 1.6300044992100224e-06, "loss": 2.246, "step": 554740 }, { "epoch": 0.97, "learning_rate": 1.6291325592831958e-06, "loss": 2.1604, "step": 554750 }, { "epoch": 0.97, "learning_rate": 1.628260619356369e-06, "loss": 2.2608, "step": 554760 }, { "epoch": 0.97, "learning_rate": 1.627388679429542e-06, "loss": 2.2199, "step": 554770 }, { "epoch": 0.97, "learning_rate": 1.6265167395027154e-06, "loss": 2.3545, "step": 554780 }, { "epoch": 0.97, "learning_rate": 1.6256447995758885e-06, "loss": 2.2729, "step": 554790 }, { "epoch": 0.97, "learning_rate": 1.6247728596490617e-06, "loss": 2.2121, "step": 554800 }, { "epoch": 0.97, "learning_rate": 1.623900919722235e-06, "loss": 2.3864, "step": 554810 }, { "epoch": 0.97, "learning_rate": 1.6230289797954081e-06, "loss": 2.3141, "step": 554820 }, { "epoch": 0.97, "learning_rate": 1.6221570398685813e-06, "loss": 2.1324, "step": 554830 }, { "epoch": 0.97, "learning_rate": 1.6212850999417544e-06, "loss": 2.251, "step": 554840 }, { "epoch": 0.97, "learning_rate": 1.6204131600149278e-06, "loss": 2.2826, "step": 554850 }, { "epoch": 0.97, "learning_rate": 1.6195412200881009e-06, "loss": 2.3082, "step": 554860 }, { "epoch": 0.97, "learning_rate": 1.618669280161274e-06, "loss": 2.2582, "step": 554870 }, { "epoch": 0.97, "learning_rate": 1.6177973402344474e-06, "loss": 2.1674, "step": 554880 }, { "epoch": 0.97, "learning_rate": 1.6169254003076205e-06, "loss": 2.224, "step": 554890 }, { "epoch": 0.97, "learning_rate": 1.6160534603807936e-06, "loss": 2.2808, "step": 554900 }, { "epoch": 0.97, "learning_rate": 1.6151815204539668e-06, "loss": 2.2951, "step": 554910 }, { "epoch": 0.97, "learning_rate": 1.6143095805271401e-06, "loss": 2.2683, "step": 554920 }, { "epoch": 0.97, "learning_rate": 1.6134376406003133e-06, "loss": 2.2188, "step": 554930 }, { "epoch": 0.97, "learning_rate": 1.6125657006734866e-06, "loss": 2.2146, "step": 554940 }, { "epoch": 0.97, "learning_rate": 1.6116937607466597e-06, "loss": 2.3173, "step": 554950 }, { "epoch": 0.97, "learning_rate": 1.6108218208198329e-06, "loss": 2.2339, "step": 554960 }, { "epoch": 0.97, "learning_rate": 1.609949880893006e-06, "loss": 2.1198, "step": 554970 }, { "epoch": 0.97, "learning_rate": 1.6090779409661794e-06, "loss": 2.4139, "step": 554980 }, { "epoch": 0.97, "learning_rate": 1.6082060010393525e-06, "loss": 2.3212, "step": 554990 }, { "epoch": 0.97, "learning_rate": 1.6073340611125256e-06, "loss": 2.3449, "step": 555000 }, { "epoch": 0.97, "learning_rate": 1.606462121185699e-06, "loss": 2.2039, "step": 555010 }, { "epoch": 0.97, "learning_rate": 1.605590181258872e-06, "loss": 2.1972, "step": 555020 }, { "epoch": 0.97, "learning_rate": 1.6047182413320452e-06, "loss": 2.2929, "step": 555030 }, { "epoch": 0.97, "learning_rate": 1.6038463014052184e-06, "loss": 2.2426, "step": 555040 }, { "epoch": 0.97, "learning_rate": 1.6029743614783917e-06, "loss": 2.3362, "step": 555050 }, { "epoch": 0.97, "learning_rate": 1.6021024215515649e-06, "loss": 2.2201, "step": 555060 }, { "epoch": 0.97, "learning_rate": 1.6012304816247382e-06, "loss": 2.2887, "step": 555070 }, { "epoch": 0.97, "learning_rate": 1.6003585416979113e-06, "loss": 2.2736, "step": 555080 }, { "epoch": 0.97, "learning_rate": 1.5994866017710845e-06, "loss": 2.257, "step": 555090 }, { "epoch": 0.97, "learning_rate": 1.5986146618442576e-06, "loss": 2.2901, "step": 555100 }, { "epoch": 0.97, "learning_rate": 1.5977427219174307e-06, "loss": 2.2906, "step": 555110 }, { "epoch": 0.97, "learning_rate": 1.596870781990604e-06, "loss": 2.129, "step": 555120 }, { "epoch": 0.97, "learning_rate": 1.5959988420637772e-06, "loss": 2.2973, "step": 555130 }, { "epoch": 0.97, "learning_rate": 1.5951269021369506e-06, "loss": 2.2271, "step": 555140 }, { "epoch": 0.97, "learning_rate": 1.5942549622101237e-06, "loss": 2.2339, "step": 555150 }, { "epoch": 0.97, "learning_rate": 1.5933830222832968e-06, "loss": 2.3421, "step": 555160 }, { "epoch": 0.97, "learning_rate": 1.59251108235647e-06, "loss": 2.3837, "step": 555170 }, { "epoch": 0.97, "learning_rate": 1.5916391424296433e-06, "loss": 2.2561, "step": 555180 }, { "epoch": 0.97, "learning_rate": 1.5907672025028165e-06, "loss": 2.2621, "step": 555190 }, { "epoch": 0.97, "learning_rate": 1.5898952625759898e-06, "loss": 2.3197, "step": 555200 }, { "epoch": 0.97, "learning_rate": 1.589023322649163e-06, "loss": 2.2127, "step": 555210 }, { "epoch": 0.97, "learning_rate": 1.588151382722336e-06, "loss": 2.2264, "step": 555220 }, { "epoch": 0.97, "learning_rate": 1.5872794427955092e-06, "loss": 2.3189, "step": 555230 }, { "epoch": 0.97, "learning_rate": 1.5864075028686823e-06, "loss": 2.2904, "step": 555240 }, { "epoch": 0.97, "learning_rate": 1.5855355629418557e-06, "loss": 2.2969, "step": 555250 }, { "epoch": 0.97, "learning_rate": 1.584663623015029e-06, "loss": 2.3153, "step": 555260 }, { "epoch": 0.97, "learning_rate": 1.5837916830882022e-06, "loss": 2.2445, "step": 555270 }, { "epoch": 0.97, "learning_rate": 1.5829197431613753e-06, "loss": 2.2881, "step": 555280 }, { "epoch": 0.97, "learning_rate": 1.5820478032345484e-06, "loss": 2.284, "step": 555290 }, { "epoch": 0.97, "learning_rate": 1.5811758633077216e-06, "loss": 2.2476, "step": 555300 }, { "epoch": 0.97, "learning_rate": 1.5803039233808947e-06, "loss": 2.207, "step": 555310 }, { "epoch": 0.97, "learning_rate": 1.579431983454068e-06, "loss": 2.2626, "step": 555320 }, { "epoch": 0.97, "learning_rate": 1.5785600435272414e-06, "loss": 2.1805, "step": 555330 }, { "epoch": 0.97, "learning_rate": 1.5776881036004145e-06, "loss": 2.2812, "step": 555340 }, { "epoch": 0.97, "learning_rate": 1.5768161636735877e-06, "loss": 2.1062, "step": 555350 }, { "epoch": 0.97, "learning_rate": 1.5759442237467608e-06, "loss": 2.2624, "step": 555360 }, { "epoch": 0.97, "learning_rate": 1.575072283819934e-06, "loss": 2.2567, "step": 555370 }, { "epoch": 0.97, "learning_rate": 1.5742003438931073e-06, "loss": 2.1279, "step": 555380 }, { "epoch": 0.97, "learning_rate": 1.5733284039662806e-06, "loss": 2.2571, "step": 555390 }, { "epoch": 0.97, "learning_rate": 1.5724564640394538e-06, "loss": 2.2348, "step": 555400 }, { "epoch": 0.97, "learning_rate": 1.571584524112627e-06, "loss": 2.3653, "step": 555410 }, { "epoch": 0.97, "learning_rate": 1.5707125841858e-06, "loss": 2.2842, "step": 555420 }, { "epoch": 0.97, "learning_rate": 1.5698406442589732e-06, "loss": 2.3318, "step": 555430 }, { "epoch": 0.97, "learning_rate": 1.5689687043321463e-06, "loss": 2.3517, "step": 555440 }, { "epoch": 0.97, "learning_rate": 1.5680967644053196e-06, "loss": 2.2991, "step": 555450 }, { "epoch": 0.97, "learning_rate": 1.567224824478493e-06, "loss": 2.2404, "step": 555460 }, { "epoch": 0.97, "learning_rate": 1.5663528845516661e-06, "loss": 2.2132, "step": 555470 }, { "epoch": 0.97, "learning_rate": 1.5654809446248393e-06, "loss": 2.2334, "step": 555480 }, { "epoch": 0.97, "learning_rate": 1.5646090046980124e-06, "loss": 2.2079, "step": 555490 }, { "epoch": 0.97, "learning_rate": 1.5637370647711855e-06, "loss": 2.2957, "step": 555500 }, { "epoch": 0.97, "learning_rate": 1.5628651248443587e-06, "loss": 2.2932, "step": 555510 }, { "epoch": 0.97, "learning_rate": 1.561993184917532e-06, "loss": 2.1311, "step": 555520 }, { "epoch": 0.97, "learning_rate": 1.5611212449907054e-06, "loss": 2.1689, "step": 555530 }, { "epoch": 0.97, "learning_rate": 1.5602493050638785e-06, "loss": 2.3365, "step": 555540 }, { "epoch": 0.97, "learning_rate": 1.5593773651370516e-06, "loss": 2.2702, "step": 555550 }, { "epoch": 0.97, "learning_rate": 1.558505425210225e-06, "loss": 2.3433, "step": 555560 }, { "epoch": 0.97, "learning_rate": 1.5576334852833981e-06, "loss": 2.3235, "step": 555570 }, { "epoch": 0.97, "learning_rate": 1.5567615453565712e-06, "loss": 2.2545, "step": 555580 }, { "epoch": 0.97, "learning_rate": 1.5558896054297444e-06, "loss": 2.3105, "step": 555590 }, { "epoch": 0.97, "learning_rate": 1.5550176655029177e-06, "loss": 2.3016, "step": 555600 }, { "epoch": 0.97, "learning_rate": 1.5541457255760909e-06, "loss": 2.2619, "step": 555610 }, { "epoch": 0.97, "learning_rate": 1.553273785649264e-06, "loss": 2.2994, "step": 555620 }, { "epoch": 0.97, "learning_rate": 1.5524018457224373e-06, "loss": 2.2392, "step": 555630 }, { "epoch": 0.97, "learning_rate": 1.5515299057956105e-06, "loss": 2.3068, "step": 555640 }, { "epoch": 0.97, "learning_rate": 1.5506579658687836e-06, "loss": 2.2707, "step": 555650 }, { "epoch": 0.97, "learning_rate": 1.549786025941957e-06, "loss": 2.242, "step": 555660 }, { "epoch": 0.97, "learning_rate": 1.54891408601513e-06, "loss": 2.2699, "step": 555670 }, { "epoch": 0.97, "learning_rate": 1.5480421460883032e-06, "loss": 2.3619, "step": 555680 }, { "epoch": 0.97, "learning_rate": 1.5471702061614764e-06, "loss": 2.2337, "step": 555690 }, { "epoch": 0.97, "learning_rate": 1.5462982662346497e-06, "loss": 2.2171, "step": 555700 }, { "epoch": 0.97, "learning_rate": 1.5454263263078228e-06, "loss": 2.2539, "step": 555710 }, { "epoch": 0.97, "learning_rate": 1.544554386380996e-06, "loss": 2.3429, "step": 555720 }, { "epoch": 0.97, "learning_rate": 1.5436824464541693e-06, "loss": 2.281, "step": 555730 }, { "epoch": 0.97, "learning_rate": 1.5428105065273425e-06, "loss": 2.3049, "step": 555740 }, { "epoch": 0.97, "learning_rate": 1.5419385666005156e-06, "loss": 2.1721, "step": 555750 }, { "epoch": 0.97, "learning_rate": 1.541066626673689e-06, "loss": 2.4376, "step": 555760 }, { "epoch": 0.97, "learning_rate": 1.540194686746862e-06, "loss": 2.3109, "step": 555770 }, { "epoch": 0.97, "learning_rate": 1.5393227468200352e-06, "loss": 2.2443, "step": 555780 }, { "epoch": 0.97, "learning_rate": 1.5384508068932083e-06, "loss": 2.1826, "step": 555790 }, { "epoch": 0.97, "learning_rate": 1.5375788669663817e-06, "loss": 2.2966, "step": 555800 }, { "epoch": 0.97, "learning_rate": 1.5367069270395548e-06, "loss": 2.2749, "step": 555810 }, { "epoch": 0.97, "learning_rate": 1.535834987112728e-06, "loss": 2.2512, "step": 555820 }, { "epoch": 0.97, "learning_rate": 1.5349630471859013e-06, "loss": 2.3076, "step": 555830 }, { "epoch": 0.97, "learning_rate": 1.5340911072590744e-06, "loss": 2.2531, "step": 555840 }, { "epoch": 0.97, "learning_rate": 1.5332191673322476e-06, "loss": 2.2215, "step": 555850 }, { "epoch": 0.97, "learning_rate": 1.532347227405421e-06, "loss": 2.2785, "step": 555860 }, { "epoch": 0.97, "learning_rate": 1.531475287478594e-06, "loss": 2.2501, "step": 555870 }, { "epoch": 0.97, "learning_rate": 1.5306033475517672e-06, "loss": 2.3064, "step": 555880 }, { "epoch": 0.97, "learning_rate": 1.5297314076249403e-06, "loss": 2.2887, "step": 555890 }, { "epoch": 0.97, "learning_rate": 1.5288594676981137e-06, "loss": 2.3909, "step": 555900 }, { "epoch": 0.97, "learning_rate": 1.5279875277712868e-06, "loss": 2.2474, "step": 555910 }, { "epoch": 0.97, "learning_rate": 1.52711558784446e-06, "loss": 2.3194, "step": 555920 }, { "epoch": 0.97, "learning_rate": 1.5262436479176333e-06, "loss": 2.1862, "step": 555930 }, { "epoch": 0.97, "learning_rate": 1.5253717079908064e-06, "loss": 2.2852, "step": 555940 }, { "epoch": 0.97, "learning_rate": 1.5244997680639796e-06, "loss": 2.21, "step": 555950 }, { "epoch": 0.97, "learning_rate": 1.523627828137153e-06, "loss": 2.2061, "step": 555960 }, { "epoch": 0.97, "learning_rate": 1.522755888210326e-06, "loss": 2.1962, "step": 555970 }, { "epoch": 0.97, "learning_rate": 1.5218839482834992e-06, "loss": 2.3278, "step": 555980 }, { "epoch": 0.97, "learning_rate": 1.5210120083566723e-06, "loss": 2.3555, "step": 555990 }, { "epoch": 0.97, "learning_rate": 1.5201400684298456e-06, "loss": 2.2766, "step": 556000 }, { "epoch": 0.97, "learning_rate": 1.5192681285030188e-06, "loss": 2.2627, "step": 556010 }, { "epoch": 0.97, "learning_rate": 1.518396188576192e-06, "loss": 2.2313, "step": 556020 }, { "epoch": 0.97, "learning_rate": 1.5175242486493653e-06, "loss": 2.264, "step": 556030 }, { "epoch": 0.97, "learning_rate": 1.5166523087225384e-06, "loss": 2.2079, "step": 556040 }, { "epoch": 0.97, "learning_rate": 1.5157803687957115e-06, "loss": 2.3158, "step": 556050 }, { "epoch": 0.97, "learning_rate": 1.5149084288688849e-06, "loss": 2.2848, "step": 556060 }, { "epoch": 0.97, "learning_rate": 1.514036488942058e-06, "loss": 2.2374, "step": 556070 }, { "epoch": 0.97, "learning_rate": 1.5131645490152312e-06, "loss": 2.2489, "step": 556080 }, { "epoch": 0.97, "learning_rate": 1.5122926090884043e-06, "loss": 2.2706, "step": 556090 }, { "epoch": 0.97, "learning_rate": 1.5114206691615776e-06, "loss": 2.3939, "step": 556100 }, { "epoch": 0.97, "learning_rate": 1.5105487292347508e-06, "loss": 2.3169, "step": 556110 }, { "epoch": 0.97, "learning_rate": 1.509676789307924e-06, "loss": 2.2499, "step": 556120 }, { "epoch": 0.97, "learning_rate": 1.5088048493810972e-06, "loss": 2.1636, "step": 556130 }, { "epoch": 0.97, "learning_rate": 1.5079329094542704e-06, "loss": 2.1416, "step": 556140 }, { "epoch": 0.97, "learning_rate": 1.5070609695274435e-06, "loss": 2.2278, "step": 556150 }, { "epoch": 0.97, "learning_rate": 1.5061890296006169e-06, "loss": 2.1529, "step": 556160 }, { "epoch": 0.97, "learning_rate": 1.50531708967379e-06, "loss": 2.2838, "step": 556170 }, { "epoch": 0.97, "learning_rate": 1.5044451497469631e-06, "loss": 2.2997, "step": 556180 }, { "epoch": 0.97, "learning_rate": 1.5035732098201363e-06, "loss": 2.2549, "step": 556190 }, { "epoch": 0.97, "learning_rate": 1.5027012698933096e-06, "loss": 2.2632, "step": 556200 }, { "epoch": 0.97, "learning_rate": 1.5018293299664827e-06, "loss": 2.2286, "step": 556210 }, { "epoch": 0.97, "learning_rate": 1.5009573900396559e-06, "loss": 2.2266, "step": 556220 }, { "epoch": 0.97, "learning_rate": 1.5000854501128292e-06, "loss": 2.1704, "step": 556230 }, { "epoch": 0.97, "learning_rate": 1.4992135101860024e-06, "loss": 2.196, "step": 556240 }, { "epoch": 0.97, "learning_rate": 1.4983415702591755e-06, "loss": 2.0888, "step": 556250 }, { "epoch": 0.97, "learning_rate": 1.4974696303323488e-06, "loss": 2.346, "step": 556260 }, { "epoch": 0.97, "learning_rate": 1.496597690405522e-06, "loss": 2.2748, "step": 556270 }, { "epoch": 0.97, "learning_rate": 1.4957257504786951e-06, "loss": 2.3429, "step": 556280 }, { "epoch": 0.97, "learning_rate": 1.4948538105518682e-06, "loss": 2.2014, "step": 556290 }, { "epoch": 0.97, "learning_rate": 1.4939818706250416e-06, "loss": 2.2558, "step": 556300 }, { "epoch": 0.97, "learning_rate": 1.4931099306982147e-06, "loss": 2.3525, "step": 556310 }, { "epoch": 0.97, "learning_rate": 1.4922379907713879e-06, "loss": 2.2544, "step": 556320 }, { "epoch": 0.97, "learning_rate": 1.4913660508445612e-06, "loss": 2.2916, "step": 556330 }, { "epoch": 0.97, "learning_rate": 1.4904941109177343e-06, "loss": 2.231, "step": 556340 }, { "epoch": 0.97, "learning_rate": 1.4896221709909075e-06, "loss": 2.2176, "step": 556350 }, { "epoch": 0.97, "learning_rate": 1.4887502310640808e-06, "loss": 2.2391, "step": 556360 }, { "epoch": 0.97, "learning_rate": 1.487878291137254e-06, "loss": 2.2239, "step": 556370 }, { "epoch": 0.97, "learning_rate": 1.487006351210427e-06, "loss": 2.1511, "step": 556380 }, { "epoch": 0.97, "learning_rate": 1.4861344112836002e-06, "loss": 2.3223, "step": 556390 }, { "epoch": 0.97, "learning_rate": 1.4852624713567736e-06, "loss": 2.2759, "step": 556400 }, { "epoch": 0.97, "learning_rate": 1.4843905314299467e-06, "loss": 2.2577, "step": 556410 }, { "epoch": 0.97, "learning_rate": 1.4835185915031198e-06, "loss": 2.168, "step": 556420 }, { "epoch": 0.97, "learning_rate": 1.4826466515762932e-06, "loss": 2.2506, "step": 556430 }, { "epoch": 0.97, "learning_rate": 1.4817747116494663e-06, "loss": 2.2292, "step": 556440 }, { "epoch": 0.97, "learning_rate": 1.4809027717226395e-06, "loss": 2.2864, "step": 556450 }, { "epoch": 0.97, "learning_rate": 1.4800308317958128e-06, "loss": 2.1869, "step": 556460 }, { "epoch": 0.97, "learning_rate": 1.479158891868986e-06, "loss": 2.3212, "step": 556470 }, { "epoch": 0.97, "learning_rate": 1.478286951942159e-06, "loss": 2.3397, "step": 556480 }, { "epoch": 0.97, "learning_rate": 1.4774150120153322e-06, "loss": 2.3069, "step": 556490 }, { "epoch": 0.97, "learning_rate": 1.4765430720885056e-06, "loss": 2.2283, "step": 556500 }, { "epoch": 0.97, "learning_rate": 1.4756711321616787e-06, "loss": 2.2471, "step": 556510 }, { "epoch": 0.97, "learning_rate": 1.4747991922348518e-06, "loss": 2.1821, "step": 556520 }, { "epoch": 0.97, "learning_rate": 1.4739272523080252e-06, "loss": 2.2605, "step": 556530 }, { "epoch": 0.97, "learning_rate": 1.4730553123811983e-06, "loss": 2.2762, "step": 556540 }, { "epoch": 0.97, "learning_rate": 1.4721833724543714e-06, "loss": 2.2054, "step": 556550 }, { "epoch": 0.97, "learning_rate": 1.4713114325275448e-06, "loss": 2.2169, "step": 556560 }, { "epoch": 0.97, "learning_rate": 1.470439492600718e-06, "loss": 2.2147, "step": 556570 }, { "epoch": 0.97, "learning_rate": 1.469567552673891e-06, "loss": 2.3589, "step": 556580 }, { "epoch": 0.97, "learning_rate": 1.4686956127470642e-06, "loss": 2.2304, "step": 556590 }, { "epoch": 0.97, "learning_rate": 1.4678236728202375e-06, "loss": 2.2363, "step": 556600 }, { "epoch": 0.97, "learning_rate": 1.4669517328934107e-06, "loss": 2.2838, "step": 556610 }, { "epoch": 0.97, "learning_rate": 1.4660797929665838e-06, "loss": 2.2719, "step": 556620 }, { "epoch": 0.97, "learning_rate": 1.4652078530397572e-06, "loss": 2.2487, "step": 556630 }, { "epoch": 0.97, "learning_rate": 1.4643359131129303e-06, "loss": 2.2318, "step": 556640 }, { "epoch": 0.97, "learning_rate": 1.4634639731861034e-06, "loss": 2.2873, "step": 556650 }, { "epoch": 0.97, "learning_rate": 1.4625920332592768e-06, "loss": 2.2771, "step": 556660 }, { "epoch": 0.97, "learning_rate": 1.46172009333245e-06, "loss": 2.1261, "step": 556670 }, { "epoch": 0.97, "learning_rate": 1.460848153405623e-06, "loss": 2.3138, "step": 556680 }, { "epoch": 0.97, "learning_rate": 1.4599762134787962e-06, "loss": 2.1783, "step": 556690 }, { "epoch": 0.97, "learning_rate": 1.4591042735519695e-06, "loss": 2.2976, "step": 556700 }, { "epoch": 0.97, "learning_rate": 1.4582323336251427e-06, "loss": 2.2825, "step": 556710 }, { "epoch": 0.97, "learning_rate": 1.4573603936983158e-06, "loss": 2.2415, "step": 556720 }, { "epoch": 0.97, "learning_rate": 1.4564884537714891e-06, "loss": 2.2896, "step": 556730 }, { "epoch": 0.97, "learning_rate": 1.4556165138446623e-06, "loss": 2.2563, "step": 556740 }, { "epoch": 0.97, "learning_rate": 1.4547445739178354e-06, "loss": 2.2992, "step": 556750 }, { "epoch": 0.97, "learning_rate": 1.4538726339910088e-06, "loss": 2.3119, "step": 556760 }, { "epoch": 0.97, "learning_rate": 1.4530006940641819e-06, "loss": 2.3751, "step": 556770 }, { "epoch": 0.97, "learning_rate": 1.452128754137355e-06, "loss": 2.1475, "step": 556780 }, { "epoch": 0.97, "learning_rate": 1.4512568142105282e-06, "loss": 2.2757, "step": 556790 }, { "epoch": 0.97, "learning_rate": 1.4503848742837015e-06, "loss": 2.2821, "step": 556800 }, { "epoch": 0.97, "learning_rate": 1.4495129343568746e-06, "loss": 2.1999, "step": 556810 }, { "epoch": 0.97, "learning_rate": 1.4486409944300478e-06, "loss": 2.3075, "step": 556820 }, { "epoch": 0.97, "learning_rate": 1.4477690545032211e-06, "loss": 2.1464, "step": 556830 }, { "epoch": 0.97, "learning_rate": 1.4468971145763943e-06, "loss": 2.3657, "step": 556840 }, { "epoch": 0.97, "learning_rate": 1.4460251746495674e-06, "loss": 2.2333, "step": 556850 }, { "epoch": 0.97, "learning_rate": 1.4451532347227407e-06, "loss": 2.2439, "step": 556860 }, { "epoch": 0.97, "learning_rate": 1.4442812947959139e-06, "loss": 2.1618, "step": 556870 }, { "epoch": 0.97, "learning_rate": 1.443409354869087e-06, "loss": 2.2677, "step": 556880 }, { "epoch": 0.97, "learning_rate": 1.4425374149422601e-06, "loss": 2.2772, "step": 556890 }, { "epoch": 0.97, "learning_rate": 1.4416654750154335e-06, "loss": 2.2589, "step": 556900 }, { "epoch": 0.97, "learning_rate": 1.4407935350886066e-06, "loss": 2.2198, "step": 556910 }, { "epoch": 0.97, "learning_rate": 1.4399215951617798e-06, "loss": 2.1906, "step": 556920 }, { "epoch": 0.97, "learning_rate": 1.439049655234953e-06, "loss": 2.3355, "step": 556930 }, { "epoch": 0.97, "learning_rate": 1.4381777153081262e-06, "loss": 2.1785, "step": 556940 }, { "epoch": 0.97, "learning_rate": 1.4373057753812994e-06, "loss": 2.2304, "step": 556950 }, { "epoch": 0.97, "learning_rate": 1.4364338354544727e-06, "loss": 2.3393, "step": 556960 }, { "epoch": 0.97, "learning_rate": 1.4355618955276459e-06, "loss": 2.3296, "step": 556970 }, { "epoch": 0.97, "learning_rate": 1.434689955600819e-06, "loss": 2.1528, "step": 556980 }, { "epoch": 0.97, "learning_rate": 1.4338180156739923e-06, "loss": 2.1813, "step": 556990 }, { "epoch": 0.97, "learning_rate": 1.4329460757471655e-06, "loss": 2.2529, "step": 557000 }, { "epoch": 0.97, "learning_rate": 1.4320741358203386e-06, "loss": 2.2411, "step": 557010 }, { "epoch": 0.97, "learning_rate": 1.4312021958935117e-06, "loss": 2.2884, "step": 557020 }, { "epoch": 0.97, "learning_rate": 1.430330255966685e-06, "loss": 2.2115, "step": 557030 }, { "epoch": 0.97, "learning_rate": 1.4294583160398582e-06, "loss": 2.1466, "step": 557040 }, { "epoch": 0.97, "learning_rate": 1.4285863761130314e-06, "loss": 2.3351, "step": 557050 }, { "epoch": 0.97, "learning_rate": 1.4277144361862047e-06, "loss": 2.2066, "step": 557060 }, { "epoch": 0.97, "learning_rate": 1.4268424962593778e-06, "loss": 2.3266, "step": 557070 }, { "epoch": 0.97, "learning_rate": 1.425970556332551e-06, "loss": 2.234, "step": 557080 }, { "epoch": 0.97, "learning_rate": 1.4250986164057243e-06, "loss": 2.2568, "step": 557090 }, { "epoch": 0.97, "learning_rate": 1.4242266764788974e-06, "loss": 2.232, "step": 557100 }, { "epoch": 0.97, "learning_rate": 1.4233547365520706e-06, "loss": 2.335, "step": 557110 }, { "epoch": 0.97, "learning_rate": 1.4224827966252437e-06, "loss": 2.2722, "step": 557120 }, { "epoch": 0.97, "learning_rate": 1.421610856698417e-06, "loss": 2.366, "step": 557130 }, { "epoch": 0.97, "learning_rate": 1.4207389167715902e-06, "loss": 2.2835, "step": 557140 }, { "epoch": 0.97, "learning_rate": 1.4198669768447633e-06, "loss": 2.3118, "step": 557150 }, { "epoch": 0.97, "learning_rate": 1.4189950369179367e-06, "loss": 2.2839, "step": 557160 }, { "epoch": 0.97, "learning_rate": 1.4181230969911098e-06, "loss": 2.3092, "step": 557170 }, { "epoch": 0.97, "learning_rate": 1.417251157064283e-06, "loss": 2.1787, "step": 557180 }, { "epoch": 0.97, "learning_rate": 1.4163792171374563e-06, "loss": 2.271, "step": 557190 }, { "epoch": 0.97, "learning_rate": 1.4155072772106294e-06, "loss": 2.2317, "step": 557200 }, { "epoch": 0.97, "learning_rate": 1.4146353372838026e-06, "loss": 2.2617, "step": 557210 }, { "epoch": 0.97, "learning_rate": 1.4137633973569757e-06, "loss": 2.3213, "step": 557220 }, { "epoch": 0.97, "learning_rate": 1.412891457430149e-06, "loss": 2.2165, "step": 557230 }, { "epoch": 0.97, "learning_rate": 1.4120195175033222e-06, "loss": 2.3584, "step": 557240 }, { "epoch": 0.97, "learning_rate": 1.4111475775764953e-06, "loss": 2.27, "step": 557250 }, { "epoch": 0.97, "learning_rate": 1.4102756376496687e-06, "loss": 2.2048, "step": 557260 }, { "epoch": 0.97, "learning_rate": 1.4094036977228418e-06, "loss": 2.2289, "step": 557270 }, { "epoch": 0.97, "learning_rate": 1.408531757796015e-06, "loss": 2.3524, "step": 557280 }, { "epoch": 0.97, "learning_rate": 1.4076598178691883e-06, "loss": 2.2002, "step": 557290 }, { "epoch": 0.97, "learning_rate": 1.4067878779423614e-06, "loss": 2.2693, "step": 557300 }, { "epoch": 0.97, "learning_rate": 1.4059159380155345e-06, "loss": 2.2165, "step": 557310 }, { "epoch": 0.97, "learning_rate": 1.4050439980887077e-06, "loss": 2.3103, "step": 557320 }, { "epoch": 0.97, "learning_rate": 1.404172058161881e-06, "loss": 2.3465, "step": 557330 }, { "epoch": 0.97, "learning_rate": 1.4033001182350542e-06, "loss": 2.376, "step": 557340 }, { "epoch": 0.97, "learning_rate": 1.4024281783082273e-06, "loss": 2.3299, "step": 557350 }, { "epoch": 0.97, "learning_rate": 1.4015562383814006e-06, "loss": 2.2997, "step": 557360 }, { "epoch": 0.97, "learning_rate": 1.4006842984545738e-06, "loss": 2.2071, "step": 557370 }, { "epoch": 0.97, "learning_rate": 1.399812358527747e-06, "loss": 2.2718, "step": 557380 }, { "epoch": 0.97, "learning_rate": 1.3989404186009203e-06, "loss": 2.2663, "step": 557390 }, { "epoch": 0.97, "learning_rate": 1.3980684786740934e-06, "loss": 2.2225, "step": 557400 }, { "epoch": 0.97, "learning_rate": 1.3971965387472665e-06, "loss": 2.2257, "step": 557410 }, { "epoch": 0.97, "learning_rate": 1.3963245988204397e-06, "loss": 2.1495, "step": 557420 }, { "epoch": 0.97, "learning_rate": 1.395452658893613e-06, "loss": 2.1333, "step": 557430 }, { "epoch": 0.97, "learning_rate": 1.3945807189667861e-06, "loss": 2.2335, "step": 557440 }, { "epoch": 0.97, "learning_rate": 1.3937087790399593e-06, "loss": 2.2179, "step": 557450 }, { "epoch": 0.97, "learning_rate": 1.3928368391131326e-06, "loss": 2.1709, "step": 557460 }, { "epoch": 0.97, "learning_rate": 1.3919648991863058e-06, "loss": 2.2746, "step": 557470 }, { "epoch": 0.97, "learning_rate": 1.3910929592594789e-06, "loss": 2.309, "step": 557480 }, { "epoch": 0.97, "learning_rate": 1.3902210193326522e-06, "loss": 2.3955, "step": 557490 }, { "epoch": 0.97, "learning_rate": 1.3893490794058254e-06, "loss": 2.2406, "step": 557500 }, { "epoch": 0.97, "learning_rate": 1.3884771394789985e-06, "loss": 2.3348, "step": 557510 }, { "epoch": 0.97, "learning_rate": 1.3876051995521716e-06, "loss": 2.196, "step": 557520 }, { "epoch": 0.97, "learning_rate": 1.386733259625345e-06, "loss": 2.1193, "step": 557530 }, { "epoch": 0.97, "learning_rate": 1.3858613196985181e-06, "loss": 2.2508, "step": 557540 }, { "epoch": 0.97, "learning_rate": 1.3849893797716913e-06, "loss": 2.306, "step": 557550 }, { "epoch": 0.97, "learning_rate": 1.3841174398448646e-06, "loss": 2.2178, "step": 557560 }, { "epoch": 0.97, "learning_rate": 1.3832454999180377e-06, "loss": 2.2354, "step": 557570 }, { "epoch": 0.97, "learning_rate": 1.3823735599912109e-06, "loss": 2.3524, "step": 557580 }, { "epoch": 0.97, "learning_rate": 1.3815016200643842e-06, "loss": 2.3315, "step": 557590 }, { "epoch": 0.97, "learning_rate": 1.3806296801375574e-06, "loss": 2.2657, "step": 557600 }, { "epoch": 0.97, "learning_rate": 1.3797577402107305e-06, "loss": 2.2192, "step": 557610 }, { "epoch": 0.97, "learning_rate": 1.3788858002839036e-06, "loss": 2.2569, "step": 557620 }, { "epoch": 0.97, "learning_rate": 1.378013860357077e-06, "loss": 2.2495, "step": 557630 }, { "epoch": 0.97, "learning_rate": 1.3771419204302501e-06, "loss": 2.2579, "step": 557640 }, { "epoch": 0.97, "learning_rate": 1.3762699805034232e-06, "loss": 2.2374, "step": 557650 }, { "epoch": 0.97, "learning_rate": 1.3753980405765966e-06, "loss": 2.2429, "step": 557660 }, { "epoch": 0.97, "learning_rate": 1.3745261006497697e-06, "loss": 2.26, "step": 557670 }, { "epoch": 0.97, "learning_rate": 1.3736541607229429e-06, "loss": 2.3051, "step": 557680 }, { "epoch": 0.97, "learning_rate": 1.3727822207961162e-06, "loss": 2.2358, "step": 557690 }, { "epoch": 0.97, "learning_rate": 1.3719102808692893e-06, "loss": 2.2889, "step": 557700 }, { "epoch": 0.97, "learning_rate": 1.3710383409424625e-06, "loss": 2.1749, "step": 557710 }, { "epoch": 0.97, "learning_rate": 1.3701664010156356e-06, "loss": 2.2625, "step": 557720 }, { "epoch": 0.97, "learning_rate": 1.369294461088809e-06, "loss": 2.2314, "step": 557730 }, { "epoch": 0.97, "learning_rate": 1.368422521161982e-06, "loss": 2.2213, "step": 557740 }, { "epoch": 0.97, "learning_rate": 1.3675505812351552e-06, "loss": 2.2866, "step": 557750 }, { "epoch": 0.97, "learning_rate": 1.3666786413083286e-06, "loss": 2.2699, "step": 557760 }, { "epoch": 0.97, "learning_rate": 1.3658067013815017e-06, "loss": 2.1604, "step": 557770 }, { "epoch": 0.97, "learning_rate": 1.3649347614546748e-06, "loss": 2.2491, "step": 557780 }, { "epoch": 0.97, "learning_rate": 1.3640628215278482e-06, "loss": 2.2856, "step": 557790 }, { "epoch": 0.97, "learning_rate": 1.3631908816010213e-06, "loss": 2.2596, "step": 557800 }, { "epoch": 0.97, "learning_rate": 1.3623189416741945e-06, "loss": 2.2502, "step": 557810 }, { "epoch": 0.97, "learning_rate": 1.3614470017473676e-06, "loss": 2.2107, "step": 557820 }, { "epoch": 0.97, "learning_rate": 1.360575061820541e-06, "loss": 2.2273, "step": 557830 }, { "epoch": 0.97, "learning_rate": 1.359703121893714e-06, "loss": 2.2728, "step": 557840 }, { "epoch": 0.97, "learning_rate": 1.3588311819668872e-06, "loss": 2.2593, "step": 557850 }, { "epoch": 0.97, "learning_rate": 1.3579592420400606e-06, "loss": 2.2579, "step": 557860 }, { "epoch": 0.97, "learning_rate": 1.3570873021132337e-06, "loss": 2.2654, "step": 557870 }, { "epoch": 0.97, "learning_rate": 1.3562153621864068e-06, "loss": 2.1041, "step": 557880 }, { "epoch": 0.97, "learning_rate": 1.3553434222595802e-06, "loss": 2.1499, "step": 557890 }, { "epoch": 0.97, "learning_rate": 1.3544714823327533e-06, "loss": 2.222, "step": 557900 }, { "epoch": 0.97, "learning_rate": 1.3535995424059264e-06, "loss": 2.3645, "step": 557910 }, { "epoch": 0.97, "learning_rate": 1.3527276024790996e-06, "loss": 2.2273, "step": 557920 }, { "epoch": 0.97, "learning_rate": 1.351855662552273e-06, "loss": 2.2721, "step": 557930 }, { "epoch": 0.97, "learning_rate": 1.350983722625446e-06, "loss": 2.2276, "step": 557940 }, { "epoch": 0.97, "learning_rate": 1.3501117826986192e-06, "loss": 2.2702, "step": 557950 }, { "epoch": 0.97, "learning_rate": 1.3492398427717925e-06, "loss": 2.3439, "step": 557960 }, { "epoch": 0.97, "learning_rate": 1.3483679028449657e-06, "loss": 2.311, "step": 557970 }, { "epoch": 0.97, "learning_rate": 1.3474959629181388e-06, "loss": 2.2971, "step": 557980 }, { "epoch": 0.97, "learning_rate": 1.3466240229913121e-06, "loss": 2.2345, "step": 557990 }, { "epoch": 0.97, "learning_rate": 1.3457520830644853e-06, "loss": 2.3805, "step": 558000 }, { "epoch": 0.97, "learning_rate": 1.3448801431376584e-06, "loss": 2.234, "step": 558010 }, { "epoch": 0.97, "learning_rate": 1.3440082032108316e-06, "loss": 2.2137, "step": 558020 }, { "epoch": 0.97, "learning_rate": 1.343136263284005e-06, "loss": 2.32, "step": 558030 }, { "epoch": 0.97, "learning_rate": 1.342264323357178e-06, "loss": 2.1954, "step": 558040 }, { "epoch": 0.97, "learning_rate": 1.3413923834303512e-06, "loss": 2.0258, "step": 558050 }, { "epoch": 0.97, "learning_rate": 1.3405204435035245e-06, "loss": 2.2558, "step": 558060 }, { "epoch": 0.97, "learning_rate": 1.3396485035766976e-06, "loss": 2.1589, "step": 558070 }, { "epoch": 0.97, "learning_rate": 1.3387765636498708e-06, "loss": 2.3309, "step": 558080 }, { "epoch": 0.97, "learning_rate": 1.3379046237230441e-06, "loss": 2.2468, "step": 558090 }, { "epoch": 0.97, "learning_rate": 1.3370326837962173e-06, "loss": 2.2752, "step": 558100 }, { "epoch": 0.97, "learning_rate": 1.3361607438693904e-06, "loss": 2.3213, "step": 558110 }, { "epoch": 0.97, "learning_rate": 1.3352888039425635e-06, "loss": 2.2877, "step": 558120 }, { "epoch": 0.97, "learning_rate": 1.3344168640157369e-06, "loss": 2.2485, "step": 558130 }, { "epoch": 0.97, "learning_rate": 1.33354492408891e-06, "loss": 2.3491, "step": 558140 }, { "epoch": 0.97, "learning_rate": 1.3326729841620831e-06, "loss": 2.2751, "step": 558150 }, { "epoch": 0.97, "learning_rate": 1.3318010442352565e-06, "loss": 2.3038, "step": 558160 }, { "epoch": 0.97, "learning_rate": 1.3309291043084296e-06, "loss": 2.2789, "step": 558170 }, { "epoch": 0.97, "learning_rate": 1.3300571643816028e-06, "loss": 2.184, "step": 558180 }, { "epoch": 0.97, "learning_rate": 1.3291852244547761e-06, "loss": 2.165, "step": 558190 }, { "epoch": 0.97, "learning_rate": 1.3283132845279492e-06, "loss": 2.1944, "step": 558200 }, { "epoch": 0.97, "learning_rate": 1.3274413446011224e-06, "loss": 2.2595, "step": 558210 }, { "epoch": 0.97, "learning_rate": 1.3265694046742955e-06, "loss": 2.2371, "step": 558220 }, { "epoch": 0.97, "learning_rate": 1.3256974647474689e-06, "loss": 2.3085, "step": 558230 }, { "epoch": 0.97, "learning_rate": 1.324825524820642e-06, "loss": 2.2845, "step": 558240 }, { "epoch": 0.97, "learning_rate": 1.3239535848938151e-06, "loss": 2.2287, "step": 558250 }, { "epoch": 0.97, "learning_rate": 1.3230816449669885e-06, "loss": 2.2292, "step": 558260 }, { "epoch": 0.97, "learning_rate": 1.3222097050401616e-06, "loss": 2.323, "step": 558270 }, { "epoch": 0.97, "learning_rate": 1.3213377651133347e-06, "loss": 2.2172, "step": 558280 }, { "epoch": 0.97, "learning_rate": 1.320465825186508e-06, "loss": 2.2229, "step": 558290 }, { "epoch": 0.97, "learning_rate": 1.3195938852596812e-06, "loss": 2.3149, "step": 558300 }, { "epoch": 0.97, "learning_rate": 1.3187219453328544e-06, "loss": 2.2392, "step": 558310 }, { "epoch": 0.97, "learning_rate": 1.3178500054060275e-06, "loss": 2.219, "step": 558320 }, { "epoch": 0.97, "learning_rate": 1.3169780654792008e-06, "loss": 2.2994, "step": 558330 }, { "epoch": 0.97, "learning_rate": 1.316106125552374e-06, "loss": 2.298, "step": 558340 }, { "epoch": 0.97, "learning_rate": 1.3152341856255471e-06, "loss": 2.3215, "step": 558350 }, { "epoch": 0.97, "learning_rate": 1.3143622456987205e-06, "loss": 2.3763, "step": 558360 }, { "epoch": 0.97, "learning_rate": 1.3134903057718936e-06, "loss": 2.3559, "step": 558370 }, { "epoch": 0.97, "learning_rate": 1.3126183658450667e-06, "loss": 2.129, "step": 558380 }, { "epoch": 0.97, "learning_rate": 1.31174642591824e-06, "loss": 2.2144, "step": 558390 }, { "epoch": 0.97, "learning_rate": 1.3108744859914132e-06, "loss": 2.3498, "step": 558400 }, { "epoch": 0.97, "learning_rate": 1.3100025460645863e-06, "loss": 2.2458, "step": 558410 }, { "epoch": 0.97, "learning_rate": 1.3091306061377597e-06, "loss": 2.2619, "step": 558420 }, { "epoch": 0.97, "learning_rate": 1.3082586662109328e-06, "loss": 2.2135, "step": 558430 }, { "epoch": 0.97, "learning_rate": 1.307386726284106e-06, "loss": 2.2637, "step": 558440 }, { "epoch": 0.97, "learning_rate": 1.306514786357279e-06, "loss": 2.279, "step": 558450 }, { "epoch": 0.97, "learning_rate": 1.3056428464304524e-06, "loss": 2.139, "step": 558460 }, { "epoch": 0.97, "learning_rate": 1.3047709065036256e-06, "loss": 2.2944, "step": 558470 }, { "epoch": 0.97, "learning_rate": 1.3038989665767987e-06, "loss": 2.2057, "step": 558480 }, { "epoch": 0.97, "learning_rate": 1.303027026649972e-06, "loss": 2.1446, "step": 558490 }, { "epoch": 0.97, "learning_rate": 1.3021550867231452e-06, "loss": 2.2854, "step": 558500 }, { "epoch": 0.97, "learning_rate": 1.3012831467963183e-06, "loss": 2.1906, "step": 558510 }, { "epoch": 0.97, "learning_rate": 1.3004112068694917e-06, "loss": 2.3106, "step": 558520 }, { "epoch": 0.97, "learning_rate": 1.2995392669426648e-06, "loss": 2.1754, "step": 558530 }, { "epoch": 0.97, "learning_rate": 1.298667327015838e-06, "loss": 2.2834, "step": 558540 }, { "epoch": 0.97, "learning_rate": 1.297795387089011e-06, "loss": 2.3427, "step": 558550 }, { "epoch": 0.97, "learning_rate": 1.2969234471621844e-06, "loss": 2.2798, "step": 558560 }, { "epoch": 0.97, "learning_rate": 1.2960515072353576e-06, "loss": 2.1845, "step": 558570 }, { "epoch": 0.97, "learning_rate": 1.2951795673085307e-06, "loss": 2.2228, "step": 558580 }, { "epoch": 0.97, "learning_rate": 1.294307627381704e-06, "loss": 2.2685, "step": 558590 }, { "epoch": 0.97, "learning_rate": 1.2934356874548772e-06, "loss": 2.203, "step": 558600 }, { "epoch": 0.97, "learning_rate": 1.2925637475280503e-06, "loss": 2.3443, "step": 558610 }, { "epoch": 0.97, "learning_rate": 1.2916918076012237e-06, "loss": 2.1876, "step": 558620 }, { "epoch": 0.97, "learning_rate": 1.2908198676743968e-06, "loss": 2.3354, "step": 558630 }, { "epoch": 0.97, "learning_rate": 1.28994792774757e-06, "loss": 2.2132, "step": 558640 }, { "epoch": 0.97, "learning_rate": 1.289075987820743e-06, "loss": 2.2528, "step": 558650 }, { "epoch": 0.97, "learning_rate": 1.2882040478939164e-06, "loss": 2.2778, "step": 558660 }, { "epoch": 0.97, "learning_rate": 1.2873321079670895e-06, "loss": 2.3244, "step": 558670 }, { "epoch": 0.97, "learning_rate": 1.2864601680402627e-06, "loss": 2.2474, "step": 558680 }, { "epoch": 0.97, "learning_rate": 1.285588228113436e-06, "loss": 2.2185, "step": 558690 }, { "epoch": 0.97, "learning_rate": 1.2847162881866092e-06, "loss": 2.2469, "step": 558700 }, { "epoch": 0.97, "learning_rate": 1.2838443482597823e-06, "loss": 2.2871, "step": 558710 }, { "epoch": 0.97, "learning_rate": 1.2829724083329556e-06, "loss": 2.2921, "step": 558720 }, { "epoch": 0.97, "learning_rate": 1.2821004684061288e-06, "loss": 2.3394, "step": 558730 }, { "epoch": 0.97, "learning_rate": 1.281228528479302e-06, "loss": 2.1689, "step": 558740 }, { "epoch": 0.97, "learning_rate": 1.280356588552475e-06, "loss": 2.1776, "step": 558750 }, { "epoch": 0.97, "learning_rate": 1.2794846486256484e-06, "loss": 2.3054, "step": 558760 }, { "epoch": 0.97, "learning_rate": 1.2786127086988215e-06, "loss": 2.2465, "step": 558770 }, { "epoch": 0.97, "learning_rate": 1.2777407687719947e-06, "loss": 2.2158, "step": 558780 }, { "epoch": 0.97, "learning_rate": 1.276868828845168e-06, "loss": 2.232, "step": 558790 }, { "epoch": 0.97, "learning_rate": 1.2759968889183411e-06, "loss": 2.1998, "step": 558800 }, { "epoch": 0.97, "learning_rate": 1.2751249489915143e-06, "loss": 2.2291, "step": 558810 }, { "epoch": 0.97, "learning_rate": 1.2742530090646876e-06, "loss": 2.2286, "step": 558820 }, { "epoch": 0.97, "learning_rate": 1.2733810691378608e-06, "loss": 2.2935, "step": 558830 }, { "epoch": 0.97, "learning_rate": 1.2725091292110339e-06, "loss": 2.3482, "step": 558840 }, { "epoch": 0.97, "learning_rate": 1.271637189284207e-06, "loss": 2.2398, "step": 558850 }, { "epoch": 0.97, "learning_rate": 1.2707652493573804e-06, "loss": 2.3636, "step": 558860 }, { "epoch": 0.97, "learning_rate": 1.2698933094305535e-06, "loss": 2.2312, "step": 558870 }, { "epoch": 0.97, "learning_rate": 1.2690213695037266e-06, "loss": 2.2623, "step": 558880 }, { "epoch": 0.97, "learning_rate": 1.2681494295769e-06, "loss": 2.2292, "step": 558890 }, { "epoch": 0.97, "learning_rate": 1.2672774896500731e-06, "loss": 2.3562, "step": 558900 }, { "epoch": 0.97, "learning_rate": 1.2664055497232463e-06, "loss": 2.2337, "step": 558910 }, { "epoch": 0.97, "learning_rate": 1.2655336097964196e-06, "loss": 2.2799, "step": 558920 }, { "epoch": 0.97, "learning_rate": 1.2646616698695927e-06, "loss": 2.2665, "step": 558930 }, { "epoch": 0.97, "learning_rate": 1.2637897299427659e-06, "loss": 2.1419, "step": 558940 }, { "epoch": 0.97, "learning_rate": 1.262917790015939e-06, "loss": 2.2718, "step": 558950 }, { "epoch": 0.97, "learning_rate": 1.2620458500891123e-06, "loss": 2.1522, "step": 558960 }, { "epoch": 0.97, "learning_rate": 1.2611739101622855e-06, "loss": 2.1907, "step": 558970 }, { "epoch": 0.97, "learning_rate": 1.2603019702354586e-06, "loss": 2.2259, "step": 558980 }, { "epoch": 0.97, "learning_rate": 1.259430030308632e-06, "loss": 2.2349, "step": 558990 }, { "epoch": 0.97, "learning_rate": 1.258558090381805e-06, "loss": 2.2312, "step": 559000 }, { "epoch": 0.97, "learning_rate": 1.2576861504549782e-06, "loss": 2.3962, "step": 559010 }, { "epoch": 0.97, "learning_rate": 1.2568142105281516e-06, "loss": 2.196, "step": 559020 }, { "epoch": 0.97, "learning_rate": 1.2559422706013247e-06, "loss": 2.2349, "step": 559030 }, { "epoch": 0.97, "learning_rate": 1.2550703306744978e-06, "loss": 2.3159, "step": 559040 }, { "epoch": 0.97, "learning_rate": 1.254198390747671e-06, "loss": 2.2864, "step": 559050 }, { "epoch": 0.97, "learning_rate": 1.2533264508208443e-06, "loss": 2.3125, "step": 559060 }, { "epoch": 0.97, "learning_rate": 1.2524545108940175e-06, "loss": 2.1632, "step": 559070 }, { "epoch": 0.97, "learning_rate": 1.2515825709671906e-06, "loss": 2.1982, "step": 559080 }, { "epoch": 0.97, "learning_rate": 1.250710631040364e-06, "loss": 2.1882, "step": 559090 }, { "epoch": 0.98, "learning_rate": 1.249838691113537e-06, "loss": 2.303, "step": 559100 }, { "epoch": 0.98, "learning_rate": 1.2489667511867102e-06, "loss": 2.3185, "step": 559110 }, { "epoch": 0.98, "learning_rate": 1.2480948112598836e-06, "loss": 2.1983, "step": 559120 }, { "epoch": 0.98, "learning_rate": 1.2472228713330567e-06, "loss": 2.2022, "step": 559130 }, { "epoch": 0.98, "learning_rate": 1.2463509314062298e-06, "loss": 2.3166, "step": 559140 }, { "epoch": 0.98, "learning_rate": 1.245478991479403e-06, "loss": 2.2578, "step": 559150 }, { "epoch": 0.98, "learning_rate": 1.2446070515525763e-06, "loss": 2.3798, "step": 559160 }, { "epoch": 0.98, "learning_rate": 1.2437351116257494e-06, "loss": 2.1052, "step": 559170 }, { "epoch": 0.98, "learning_rate": 1.2428631716989226e-06, "loss": 2.2327, "step": 559180 }, { "epoch": 0.98, "learning_rate": 1.241991231772096e-06, "loss": 2.3314, "step": 559190 }, { "epoch": 0.98, "learning_rate": 1.241119291845269e-06, "loss": 2.2306, "step": 559200 }, { "epoch": 0.98, "learning_rate": 1.2402473519184422e-06, "loss": 2.2913, "step": 559210 }, { "epoch": 0.98, "learning_rate": 1.2393754119916155e-06, "loss": 2.2686, "step": 559220 }, { "epoch": 0.98, "learning_rate": 1.2385034720647887e-06, "loss": 2.358, "step": 559230 }, { "epoch": 0.98, "learning_rate": 1.2376315321379618e-06, "loss": 2.2, "step": 559240 }, { "epoch": 0.98, "learning_rate": 1.236759592211135e-06, "loss": 2.3191, "step": 559250 }, { "epoch": 0.98, "learning_rate": 1.2358876522843083e-06, "loss": 2.2996, "step": 559260 }, { "epoch": 0.98, "learning_rate": 1.2350157123574814e-06, "loss": 2.2346, "step": 559270 }, { "epoch": 0.98, "learning_rate": 1.2341437724306546e-06, "loss": 2.196, "step": 559280 }, { "epoch": 0.98, "learning_rate": 1.233271832503828e-06, "loss": 2.28, "step": 559290 }, { "epoch": 0.98, "learning_rate": 1.232399892577001e-06, "loss": 2.3259, "step": 559300 }, { "epoch": 0.98, "learning_rate": 1.2315279526501742e-06, "loss": 2.3384, "step": 559310 }, { "epoch": 0.98, "learning_rate": 1.2306560127233475e-06, "loss": 2.2386, "step": 559320 }, { "epoch": 0.98, "learning_rate": 1.2297840727965207e-06, "loss": 2.2795, "step": 559330 }, { "epoch": 0.98, "learning_rate": 1.2289121328696938e-06, "loss": 2.2903, "step": 559340 }, { "epoch": 0.98, "learning_rate": 1.228040192942867e-06, "loss": 2.2048, "step": 559350 }, { "epoch": 0.98, "learning_rate": 1.2271682530160403e-06, "loss": 2.2694, "step": 559360 }, { "epoch": 0.98, "learning_rate": 1.2262963130892134e-06, "loss": 2.1487, "step": 559370 }, { "epoch": 0.98, "learning_rate": 1.2254243731623865e-06, "loss": 2.1174, "step": 559380 }, { "epoch": 0.98, "learning_rate": 1.2245524332355599e-06, "loss": 2.2024, "step": 559390 }, { "epoch": 0.98, "learning_rate": 1.223680493308733e-06, "loss": 2.249, "step": 559400 }, { "epoch": 0.98, "learning_rate": 1.2228085533819062e-06, "loss": 2.2771, "step": 559410 }, { "epoch": 0.98, "learning_rate": 1.2219366134550795e-06, "loss": 2.242, "step": 559420 }, { "epoch": 0.98, "learning_rate": 1.2210646735282526e-06, "loss": 2.1684, "step": 559430 }, { "epoch": 0.98, "learning_rate": 1.2201927336014258e-06, "loss": 2.1752, "step": 559440 }, { "epoch": 0.98, "learning_rate": 1.219320793674599e-06, "loss": 2.4073, "step": 559450 }, { "epoch": 0.98, "learning_rate": 1.2184488537477723e-06, "loss": 2.3331, "step": 559460 }, { "epoch": 0.98, "learning_rate": 1.2175769138209454e-06, "loss": 2.1774, "step": 559470 }, { "epoch": 0.98, "learning_rate": 1.2167049738941185e-06, "loss": 2.1561, "step": 559480 }, { "epoch": 0.98, "learning_rate": 1.2158330339672919e-06, "loss": 2.2997, "step": 559490 }, { "epoch": 0.98, "learning_rate": 1.214961094040465e-06, "loss": 2.1782, "step": 559500 }, { "epoch": 0.98, "learning_rate": 1.2140891541136381e-06, "loss": 2.2278, "step": 559510 }, { "epoch": 0.98, "learning_rate": 1.2132172141868115e-06, "loss": 2.333, "step": 559520 }, { "epoch": 0.98, "learning_rate": 1.2123452742599846e-06, "loss": 2.2219, "step": 559530 }, { "epoch": 0.98, "learning_rate": 1.2114733343331578e-06, "loss": 2.1262, "step": 559540 }, { "epoch": 0.98, "learning_rate": 1.2106013944063309e-06, "loss": 2.197, "step": 559550 }, { "epoch": 0.98, "learning_rate": 1.2097294544795042e-06, "loss": 2.2699, "step": 559560 }, { "epoch": 0.98, "learning_rate": 1.2088575145526774e-06, "loss": 2.2473, "step": 559570 }, { "epoch": 0.98, "learning_rate": 1.2079855746258505e-06, "loss": 2.2492, "step": 559580 }, { "epoch": 0.98, "learning_rate": 1.2071136346990239e-06, "loss": 2.2226, "step": 559590 }, { "epoch": 0.98, "learning_rate": 1.206241694772197e-06, "loss": 2.2128, "step": 559600 }, { "epoch": 0.98, "learning_rate": 1.2053697548453701e-06, "loss": 2.2359, "step": 559610 }, { "epoch": 0.98, "learning_rate": 1.2044978149185435e-06, "loss": 2.2815, "step": 559620 }, { "epoch": 0.98, "learning_rate": 1.2036258749917166e-06, "loss": 2.2204, "step": 559630 }, { "epoch": 0.98, "learning_rate": 1.2027539350648897e-06, "loss": 2.1787, "step": 559640 }, { "epoch": 0.98, "learning_rate": 1.2018819951380629e-06, "loss": 2.2499, "step": 559650 }, { "epoch": 0.98, "learning_rate": 1.2010100552112362e-06, "loss": 2.1928, "step": 559660 }, { "epoch": 0.98, "learning_rate": 1.2001381152844094e-06, "loss": 2.3713, "step": 559670 }, { "epoch": 0.98, "learning_rate": 1.1992661753575825e-06, "loss": 2.2505, "step": 559680 }, { "epoch": 0.98, "learning_rate": 1.1983942354307558e-06, "loss": 2.261, "step": 559690 }, { "epoch": 0.98, "learning_rate": 1.197522295503929e-06, "loss": 2.2751, "step": 559700 }, { "epoch": 0.98, "learning_rate": 1.196650355577102e-06, "loss": 2.3133, "step": 559710 }, { "epoch": 0.98, "learning_rate": 1.1957784156502755e-06, "loss": 2.3428, "step": 559720 }, { "epoch": 0.98, "learning_rate": 1.1949064757234486e-06, "loss": 2.1907, "step": 559730 }, { "epoch": 0.98, "learning_rate": 1.1940345357966217e-06, "loss": 2.31, "step": 559740 }, { "epoch": 0.98, "learning_rate": 1.193162595869795e-06, "loss": 2.2414, "step": 559750 }, { "epoch": 0.98, "learning_rate": 1.1922906559429682e-06, "loss": 2.2894, "step": 559760 }, { "epoch": 0.98, "learning_rate": 1.1914187160161413e-06, "loss": 2.3549, "step": 559770 }, { "epoch": 0.98, "learning_rate": 1.1905467760893145e-06, "loss": 2.1604, "step": 559780 }, { "epoch": 0.98, "learning_rate": 1.1896748361624878e-06, "loss": 2.1888, "step": 559790 }, { "epoch": 0.98, "learning_rate": 1.188802896235661e-06, "loss": 2.2956, "step": 559800 }, { "epoch": 0.98, "learning_rate": 1.187930956308834e-06, "loss": 2.2489, "step": 559810 }, { "epoch": 0.98, "learning_rate": 1.1870590163820074e-06, "loss": 2.1996, "step": 559820 }, { "epoch": 0.98, "learning_rate": 1.1861870764551806e-06, "loss": 2.292, "step": 559830 }, { "epoch": 0.98, "learning_rate": 1.1853151365283537e-06, "loss": 2.275, "step": 559840 }, { "epoch": 0.98, "learning_rate": 1.184443196601527e-06, "loss": 2.3384, "step": 559850 }, { "epoch": 0.98, "learning_rate": 1.1835712566747002e-06, "loss": 2.3103, "step": 559860 }, { "epoch": 0.98, "learning_rate": 1.1826993167478733e-06, "loss": 2.2746, "step": 559870 }, { "epoch": 0.98, "learning_rate": 1.1818273768210465e-06, "loss": 2.2354, "step": 559880 }, { "epoch": 0.98, "learning_rate": 1.1809554368942198e-06, "loss": 2.1509, "step": 559890 }, { "epoch": 0.98, "learning_rate": 1.180083496967393e-06, "loss": 2.2359, "step": 559900 }, { "epoch": 0.98, "learning_rate": 1.179211557040566e-06, "loss": 2.2744, "step": 559910 }, { "epoch": 0.98, "learning_rate": 1.1783396171137394e-06, "loss": 2.2434, "step": 559920 }, { "epoch": 0.98, "learning_rate": 1.1774676771869125e-06, "loss": 2.3005, "step": 559930 }, { "epoch": 0.98, "learning_rate": 1.1765957372600857e-06, "loss": 2.1885, "step": 559940 }, { "epoch": 0.98, "learning_rate": 1.175723797333259e-06, "loss": 2.2272, "step": 559950 }, { "epoch": 0.98, "learning_rate": 1.1748518574064322e-06, "loss": 2.2666, "step": 559960 }, { "epoch": 0.98, "learning_rate": 1.1739799174796053e-06, "loss": 2.2408, "step": 559970 }, { "epoch": 0.98, "learning_rate": 1.1731079775527784e-06, "loss": 2.2886, "step": 559980 }, { "epoch": 0.98, "learning_rate": 1.1722360376259518e-06, "loss": 2.1221, "step": 559990 }, { "epoch": 0.98, "learning_rate": 1.171364097699125e-06, "loss": 2.2362, "step": 560000 }, { "epoch": 0.98, "learning_rate": 1.170492157772298e-06, "loss": 2.2836, "step": 560010 }, { "epoch": 0.98, "learning_rate": 1.1696202178454714e-06, "loss": 2.2937, "step": 560020 }, { "epoch": 0.98, "learning_rate": 1.1687482779186445e-06, "loss": 2.2424, "step": 560030 }, { "epoch": 0.98, "learning_rate": 1.1678763379918177e-06, "loss": 2.3813, "step": 560040 }, { "epoch": 0.98, "learning_rate": 1.167004398064991e-06, "loss": 2.1948, "step": 560050 }, { "epoch": 0.98, "learning_rate": 1.1661324581381641e-06, "loss": 2.2482, "step": 560060 }, { "epoch": 0.98, "learning_rate": 1.1652605182113373e-06, "loss": 2.2512, "step": 560070 }, { "epoch": 0.98, "learning_rate": 1.1643885782845104e-06, "loss": 2.3467, "step": 560080 }, { "epoch": 0.98, "learning_rate": 1.1635166383576838e-06, "loss": 2.1642, "step": 560090 }, { "epoch": 0.98, "learning_rate": 1.162644698430857e-06, "loss": 2.2601, "step": 560100 }, { "epoch": 0.98, "learning_rate": 1.16177275850403e-06, "loss": 2.1966, "step": 560110 }, { "epoch": 0.98, "learning_rate": 1.1609008185772034e-06, "loss": 2.1497, "step": 560120 }, { "epoch": 0.98, "learning_rate": 1.1600288786503765e-06, "loss": 2.1988, "step": 560130 }, { "epoch": 0.98, "learning_rate": 1.1591569387235496e-06, "loss": 2.2529, "step": 560140 }, { "epoch": 0.98, "learning_rate": 1.158284998796723e-06, "loss": 2.1327, "step": 560150 }, { "epoch": 0.98, "learning_rate": 1.1574130588698961e-06, "loss": 2.3862, "step": 560160 }, { "epoch": 0.98, "learning_rate": 1.1565411189430693e-06, "loss": 2.2971, "step": 560170 }, { "epoch": 0.98, "learning_rate": 1.1556691790162424e-06, "loss": 2.2394, "step": 560180 }, { "epoch": 0.98, "learning_rate": 1.1547972390894157e-06, "loss": 2.2354, "step": 560190 }, { "epoch": 0.98, "learning_rate": 1.1539252991625889e-06, "loss": 2.1403, "step": 560200 }, { "epoch": 0.98, "learning_rate": 1.153053359235762e-06, "loss": 2.2891, "step": 560210 }, { "epoch": 0.98, "learning_rate": 1.1521814193089354e-06, "loss": 2.2835, "step": 560220 }, { "epoch": 0.98, "learning_rate": 1.1513094793821085e-06, "loss": 2.2729, "step": 560230 }, { "epoch": 0.98, "learning_rate": 1.1504375394552816e-06, "loss": 2.3164, "step": 560240 }, { "epoch": 0.98, "learning_rate": 1.149565599528455e-06, "loss": 2.1026, "step": 560250 }, { "epoch": 0.98, "learning_rate": 1.1486936596016281e-06, "loss": 2.2854, "step": 560260 }, { "epoch": 0.98, "learning_rate": 1.1478217196748012e-06, "loss": 2.2539, "step": 560270 }, { "epoch": 0.98, "learning_rate": 1.1469497797479744e-06, "loss": 2.1666, "step": 560280 }, { "epoch": 0.98, "learning_rate": 1.1460778398211477e-06, "loss": 2.2243, "step": 560290 }, { "epoch": 0.98, "learning_rate": 1.1452058998943209e-06, "loss": 2.3096, "step": 560300 }, { "epoch": 0.98, "learning_rate": 1.144333959967494e-06, "loss": 2.2344, "step": 560310 }, { "epoch": 0.98, "learning_rate": 1.1434620200406673e-06, "loss": 2.1954, "step": 560320 }, { "epoch": 0.98, "learning_rate": 1.1425900801138405e-06, "loss": 2.2445, "step": 560330 }, { "epoch": 0.98, "learning_rate": 1.1417181401870136e-06, "loss": 2.1848, "step": 560340 }, { "epoch": 0.98, "learning_rate": 1.140846200260187e-06, "loss": 2.364, "step": 560350 }, { "epoch": 0.98, "learning_rate": 1.13997426033336e-06, "loss": 2.2378, "step": 560360 }, { "epoch": 0.98, "learning_rate": 1.1391023204065332e-06, "loss": 2.3023, "step": 560370 }, { "epoch": 0.98, "learning_rate": 1.1382303804797064e-06, "loss": 2.2514, "step": 560380 }, { "epoch": 0.98, "learning_rate": 1.1373584405528797e-06, "loss": 2.2346, "step": 560390 }, { "epoch": 0.98, "learning_rate": 1.1364865006260528e-06, "loss": 2.212, "step": 560400 }, { "epoch": 0.98, "learning_rate": 1.135614560699226e-06, "loss": 2.2476, "step": 560410 }, { "epoch": 0.98, "learning_rate": 1.1347426207723993e-06, "loss": 2.2794, "step": 560420 }, { "epoch": 0.98, "learning_rate": 1.1338706808455725e-06, "loss": 2.3437, "step": 560430 }, { "epoch": 0.98, "learning_rate": 1.1329987409187456e-06, "loss": 2.1432, "step": 560440 }, { "epoch": 0.98, "learning_rate": 1.132126800991919e-06, "loss": 2.1399, "step": 560450 }, { "epoch": 0.98, "learning_rate": 1.131254861065092e-06, "loss": 2.2166, "step": 560460 }, { "epoch": 0.98, "learning_rate": 1.1303829211382652e-06, "loss": 2.2856, "step": 560470 }, { "epoch": 0.98, "learning_rate": 1.1295109812114383e-06, "loss": 2.2547, "step": 560480 }, { "epoch": 0.98, "learning_rate": 1.1286390412846117e-06, "loss": 2.278, "step": 560490 }, { "epoch": 0.98, "learning_rate": 1.1277671013577848e-06, "loss": 2.2243, "step": 560500 }, { "epoch": 0.98, "learning_rate": 1.126895161430958e-06, "loss": 2.3362, "step": 560510 }, { "epoch": 0.98, "learning_rate": 1.1260232215041313e-06, "loss": 2.3506, "step": 560520 }, { "epoch": 0.98, "learning_rate": 1.1251512815773044e-06, "loss": 2.2223, "step": 560530 }, { "epoch": 0.98, "learning_rate": 1.1242793416504776e-06, "loss": 2.2848, "step": 560540 }, { "epoch": 0.98, "learning_rate": 1.123407401723651e-06, "loss": 2.2239, "step": 560550 }, { "epoch": 0.98, "learning_rate": 1.122535461796824e-06, "loss": 2.1378, "step": 560560 }, { "epoch": 0.98, "learning_rate": 1.1216635218699972e-06, "loss": 2.3284, "step": 560570 }, { "epoch": 0.98, "learning_rate": 1.1207915819431703e-06, "loss": 2.2218, "step": 560580 }, { "epoch": 0.98, "learning_rate": 1.1199196420163437e-06, "loss": 2.3705, "step": 560590 }, { "epoch": 0.98, "learning_rate": 1.1190477020895168e-06, "loss": 2.2129, "step": 560600 }, { "epoch": 0.98, "learning_rate": 1.11817576216269e-06, "loss": 2.2863, "step": 560610 }, { "epoch": 0.98, "learning_rate": 1.1173038222358633e-06, "loss": 2.3711, "step": 560620 }, { "epoch": 0.98, "learning_rate": 1.1164318823090364e-06, "loss": 2.2838, "step": 560630 }, { "epoch": 0.98, "learning_rate": 1.1155599423822096e-06, "loss": 2.3096, "step": 560640 }, { "epoch": 0.98, "learning_rate": 1.114688002455383e-06, "loss": 2.1327, "step": 560650 }, { "epoch": 0.98, "learning_rate": 1.113816062528556e-06, "loss": 2.1761, "step": 560660 }, { "epoch": 0.98, "learning_rate": 1.1129441226017292e-06, "loss": 2.2696, "step": 560670 }, { "epoch": 0.98, "learning_rate": 1.1120721826749023e-06, "loss": 2.2596, "step": 560680 }, { "epoch": 0.98, "learning_rate": 1.1112002427480757e-06, "loss": 2.1831, "step": 560690 }, { "epoch": 0.98, "learning_rate": 1.1103283028212488e-06, "loss": 2.2795, "step": 560700 }, { "epoch": 0.98, "learning_rate": 1.109456362894422e-06, "loss": 2.2092, "step": 560710 }, { "epoch": 0.98, "learning_rate": 1.1085844229675953e-06, "loss": 2.206, "step": 560720 }, { "epoch": 0.98, "learning_rate": 1.1077124830407684e-06, "loss": 2.32, "step": 560730 }, { "epoch": 0.98, "learning_rate": 1.1068405431139415e-06, "loss": 2.3078, "step": 560740 }, { "epoch": 0.98, "learning_rate": 1.1059686031871149e-06, "loss": 2.342, "step": 560750 }, { "epoch": 0.98, "learning_rate": 1.105096663260288e-06, "loss": 2.2596, "step": 560760 }, { "epoch": 0.98, "learning_rate": 1.1042247233334612e-06, "loss": 2.3602, "step": 560770 }, { "epoch": 0.98, "learning_rate": 1.1033527834066343e-06, "loss": 2.2678, "step": 560780 }, { "epoch": 0.98, "learning_rate": 1.1024808434798076e-06, "loss": 2.2437, "step": 560790 }, { "epoch": 0.98, "learning_rate": 1.1016089035529808e-06, "loss": 2.2969, "step": 560800 }, { "epoch": 0.98, "learning_rate": 1.100736963626154e-06, "loss": 2.1401, "step": 560810 }, { "epoch": 0.98, "learning_rate": 1.0998650236993272e-06, "loss": 2.2128, "step": 560820 }, { "epoch": 0.98, "learning_rate": 1.0989930837725004e-06, "loss": 2.2287, "step": 560830 }, { "epoch": 0.98, "learning_rate": 1.0981211438456735e-06, "loss": 2.1963, "step": 560840 }, { "epoch": 0.98, "learning_rate": 1.0972492039188469e-06, "loss": 2.1909, "step": 560850 }, { "epoch": 0.98, "learning_rate": 1.09637726399202e-06, "loss": 2.3629, "step": 560860 }, { "epoch": 0.98, "learning_rate": 1.0955053240651931e-06, "loss": 2.3116, "step": 560870 }, { "epoch": 0.98, "learning_rate": 1.0946333841383663e-06, "loss": 2.1741, "step": 560880 }, { "epoch": 0.98, "learning_rate": 1.0937614442115396e-06, "loss": 2.1977, "step": 560890 }, { "epoch": 0.98, "learning_rate": 1.0928895042847127e-06, "loss": 2.2809, "step": 560900 }, { "epoch": 0.98, "learning_rate": 1.0920175643578859e-06, "loss": 2.1329, "step": 560910 }, { "epoch": 0.98, "learning_rate": 1.0911456244310592e-06, "loss": 2.3361, "step": 560920 }, { "epoch": 0.98, "learning_rate": 1.0902736845042324e-06, "loss": 2.1677, "step": 560930 }, { "epoch": 0.98, "learning_rate": 1.0894017445774055e-06, "loss": 2.1659, "step": 560940 }, { "epoch": 0.98, "learning_rate": 1.0885298046505788e-06, "loss": 2.2684, "step": 560950 }, { "epoch": 0.98, "learning_rate": 1.087657864723752e-06, "loss": 2.3013, "step": 560960 }, { "epoch": 0.98, "learning_rate": 1.0867859247969251e-06, "loss": 2.3516, "step": 560970 }, { "epoch": 0.98, "learning_rate": 1.0859139848700985e-06, "loss": 2.3725, "step": 560980 }, { "epoch": 0.98, "learning_rate": 1.0850420449432716e-06, "loss": 2.2086, "step": 560990 }, { "epoch": 0.98, "learning_rate": 1.0841701050164447e-06, "loss": 2.3558, "step": 561000 }, { "epoch": 0.98, "learning_rate": 1.0832981650896179e-06, "loss": 2.3488, "step": 561010 }, { "epoch": 0.98, "learning_rate": 1.0824262251627912e-06, "loss": 2.2939, "step": 561020 }, { "epoch": 0.98, "learning_rate": 1.0815542852359643e-06, "loss": 2.1998, "step": 561030 }, { "epoch": 0.98, "learning_rate": 1.0806823453091375e-06, "loss": 2.3013, "step": 561040 }, { "epoch": 0.98, "learning_rate": 1.0798104053823108e-06, "loss": 2.2287, "step": 561050 }, { "epoch": 0.98, "learning_rate": 1.078938465455484e-06, "loss": 2.2175, "step": 561060 }, { "epoch": 0.98, "learning_rate": 1.078066525528657e-06, "loss": 2.279, "step": 561070 }, { "epoch": 0.98, "learning_rate": 1.0771945856018304e-06, "loss": 2.207, "step": 561080 }, { "epoch": 0.98, "learning_rate": 1.0763226456750036e-06, "loss": 2.2057, "step": 561090 }, { "epoch": 0.98, "learning_rate": 1.0754507057481767e-06, "loss": 2.3825, "step": 561100 }, { "epoch": 0.98, "learning_rate": 1.07457876582135e-06, "loss": 2.2906, "step": 561110 }, { "epoch": 0.98, "learning_rate": 1.0737068258945232e-06, "loss": 2.2422, "step": 561120 }, { "epoch": 0.98, "learning_rate": 1.0728348859676963e-06, "loss": 2.2374, "step": 561130 }, { "epoch": 0.98, "learning_rate": 1.0719629460408695e-06, "loss": 2.1227, "step": 561140 }, { "epoch": 0.98, "learning_rate": 1.0710910061140428e-06, "loss": 2.3305, "step": 561150 }, { "epoch": 0.98, "learning_rate": 1.070219066187216e-06, "loss": 2.3062, "step": 561160 }, { "epoch": 0.98, "learning_rate": 1.069347126260389e-06, "loss": 2.375, "step": 561170 }, { "epoch": 0.98, "learning_rate": 1.0684751863335624e-06, "loss": 2.3366, "step": 561180 }, { "epoch": 0.98, "learning_rate": 1.0676032464067356e-06, "loss": 2.1475, "step": 561190 }, { "epoch": 0.98, "learning_rate": 1.0667313064799087e-06, "loss": 2.3217, "step": 561200 }, { "epoch": 0.98, "learning_rate": 1.065859366553082e-06, "loss": 2.1556, "step": 561210 }, { "epoch": 0.98, "learning_rate": 1.0649874266262552e-06, "loss": 2.2612, "step": 561220 }, { "epoch": 0.98, "learning_rate": 1.0641154866994283e-06, "loss": 2.3734, "step": 561230 }, { "epoch": 0.98, "learning_rate": 1.0632435467726017e-06, "loss": 2.2656, "step": 561240 }, { "epoch": 0.98, "learning_rate": 1.0623716068457748e-06, "loss": 2.2837, "step": 561250 }, { "epoch": 0.98, "learning_rate": 1.061499666918948e-06, "loss": 2.315, "step": 561260 }, { "epoch": 0.98, "learning_rate": 1.060627726992121e-06, "loss": 2.1716, "step": 561270 }, { "epoch": 0.98, "learning_rate": 1.0597557870652944e-06, "loss": 2.2645, "step": 561280 }, { "epoch": 0.98, "learning_rate": 1.0588838471384675e-06, "loss": 2.2822, "step": 561290 }, { "epoch": 0.98, "learning_rate": 1.0580119072116407e-06, "loss": 2.3514, "step": 561300 }, { "epoch": 0.98, "learning_rate": 1.057139967284814e-06, "loss": 2.2571, "step": 561310 }, { "epoch": 0.98, "learning_rate": 1.0562680273579872e-06, "loss": 2.2039, "step": 561320 }, { "epoch": 0.98, "learning_rate": 1.0553960874311603e-06, "loss": 2.2091, "step": 561330 }, { "epoch": 0.98, "learning_rate": 1.0545241475043336e-06, "loss": 2.2877, "step": 561340 }, { "epoch": 0.98, "learning_rate": 1.0536522075775068e-06, "loss": 2.2743, "step": 561350 }, { "epoch": 0.98, "learning_rate": 1.05278026765068e-06, "loss": 2.2122, "step": 561360 }, { "epoch": 0.98, "learning_rate": 1.0519083277238533e-06, "loss": 2.2259, "step": 561370 }, { "epoch": 0.98, "learning_rate": 1.0510363877970264e-06, "loss": 2.1938, "step": 561380 }, { "epoch": 0.98, "learning_rate": 1.0501644478701995e-06, "loss": 2.3835, "step": 561390 }, { "epoch": 0.98, "learning_rate": 1.0492925079433727e-06, "loss": 2.235, "step": 561400 }, { "epoch": 0.98, "learning_rate": 1.048420568016546e-06, "loss": 2.191, "step": 561410 }, { "epoch": 0.98, "learning_rate": 1.0475486280897191e-06, "loss": 2.2837, "step": 561420 }, { "epoch": 0.98, "learning_rate": 1.0466766881628923e-06, "loss": 2.2419, "step": 561430 }, { "epoch": 0.98, "learning_rate": 1.0458047482360656e-06, "loss": 2.2102, "step": 561440 }, { "epoch": 0.98, "learning_rate": 1.0449328083092388e-06, "loss": 2.2566, "step": 561450 }, { "epoch": 0.98, "learning_rate": 1.0440608683824119e-06, "loss": 2.2947, "step": 561460 }, { "epoch": 0.98, "learning_rate": 1.0431889284555852e-06, "loss": 2.2382, "step": 561470 }, { "epoch": 0.98, "learning_rate": 1.0423169885287584e-06, "loss": 2.226, "step": 561480 }, { "epoch": 0.98, "learning_rate": 1.0414450486019315e-06, "loss": 2.2959, "step": 561490 }, { "epoch": 0.98, "learning_rate": 1.0405731086751049e-06, "loss": 2.2731, "step": 561500 }, { "epoch": 0.98, "learning_rate": 1.039701168748278e-06, "loss": 2.2655, "step": 561510 }, { "epoch": 0.98, "learning_rate": 1.0388292288214511e-06, "loss": 2.2094, "step": 561520 }, { "epoch": 0.98, "learning_rate": 1.0379572888946243e-06, "loss": 2.2075, "step": 561530 }, { "epoch": 0.98, "learning_rate": 1.0370853489677976e-06, "loss": 2.2398, "step": 561540 }, { "epoch": 0.98, "learning_rate": 1.0362134090409707e-06, "loss": 2.3226, "step": 561550 }, { "epoch": 0.98, "learning_rate": 1.0353414691141439e-06, "loss": 2.2867, "step": 561560 }, { "epoch": 0.98, "learning_rate": 1.0344695291873172e-06, "loss": 2.2684, "step": 561570 }, { "epoch": 0.98, "learning_rate": 1.0335975892604904e-06, "loss": 2.2569, "step": 561580 }, { "epoch": 0.98, "learning_rate": 1.0327256493336635e-06, "loss": 2.2437, "step": 561590 }, { "epoch": 0.98, "learning_rate": 1.0318537094068368e-06, "loss": 2.2257, "step": 561600 }, { "epoch": 0.98, "learning_rate": 1.03098176948001e-06, "loss": 2.2769, "step": 561610 }, { "epoch": 0.98, "learning_rate": 1.030109829553183e-06, "loss": 2.3251, "step": 561620 }, { "epoch": 0.98, "learning_rate": 1.0292378896263564e-06, "loss": 2.3117, "step": 561630 }, { "epoch": 0.98, "learning_rate": 1.0283659496995296e-06, "loss": 2.2348, "step": 561640 }, { "epoch": 0.98, "learning_rate": 1.0274940097727027e-06, "loss": 2.2728, "step": 561650 }, { "epoch": 0.98, "learning_rate": 1.026622069845876e-06, "loss": 2.1051, "step": 561660 }, { "epoch": 0.98, "learning_rate": 1.0257501299190492e-06, "loss": 2.214, "step": 561670 }, { "epoch": 0.98, "learning_rate": 1.0248781899922223e-06, "loss": 2.2584, "step": 561680 }, { "epoch": 0.98, "learning_rate": 1.0240062500653955e-06, "loss": 2.1876, "step": 561690 }, { "epoch": 0.98, "learning_rate": 1.0231343101385688e-06, "loss": 2.2276, "step": 561700 }, { "epoch": 0.98, "learning_rate": 1.022262370211742e-06, "loss": 2.3318, "step": 561710 }, { "epoch": 0.98, "learning_rate": 1.021390430284915e-06, "loss": 2.2341, "step": 561720 }, { "epoch": 0.98, "learning_rate": 1.0205184903580884e-06, "loss": 2.3171, "step": 561730 }, { "epoch": 0.98, "learning_rate": 1.0196465504312616e-06, "loss": 2.2509, "step": 561740 }, { "epoch": 0.98, "learning_rate": 1.0187746105044347e-06, "loss": 2.42, "step": 561750 }, { "epoch": 0.98, "learning_rate": 1.017902670577608e-06, "loss": 2.1528, "step": 561760 }, { "epoch": 0.98, "learning_rate": 1.0170307306507812e-06, "loss": 2.2868, "step": 561770 }, { "epoch": 0.98, "learning_rate": 1.0161587907239543e-06, "loss": 2.3448, "step": 561780 }, { "epoch": 0.98, "learning_rate": 1.0152868507971277e-06, "loss": 2.2158, "step": 561790 }, { "epoch": 0.98, "learning_rate": 1.0144149108703008e-06, "loss": 2.2836, "step": 561800 }, { "epoch": 0.98, "learning_rate": 1.013542970943474e-06, "loss": 2.4156, "step": 561810 }, { "epoch": 0.98, "learning_rate": 1.012671031016647e-06, "loss": 2.2206, "step": 561820 }, { "epoch": 0.98, "learning_rate": 1.0117990910898204e-06, "loss": 2.1765, "step": 561830 }, { "epoch": 0.98, "learning_rate": 1.0109271511629935e-06, "loss": 2.231, "step": 561840 }, { "epoch": 0.98, "learning_rate": 1.0100552112361667e-06, "loss": 2.274, "step": 561850 }, { "epoch": 0.98, "learning_rate": 1.00918327130934e-06, "loss": 2.2393, "step": 561860 }, { "epoch": 0.98, "learning_rate": 1.0083113313825132e-06, "loss": 2.3253, "step": 561870 }, { "epoch": 0.98, "learning_rate": 1.0074393914556863e-06, "loss": 2.1912, "step": 561880 }, { "epoch": 0.98, "learning_rate": 1.0065674515288596e-06, "loss": 2.2858, "step": 561890 }, { "epoch": 0.98, "learning_rate": 1.0056955116020328e-06, "loss": 2.2749, "step": 561900 }, { "epoch": 0.98, "learning_rate": 1.004823571675206e-06, "loss": 2.2418, "step": 561910 }, { "epoch": 0.98, "learning_rate": 1.0039516317483793e-06, "loss": 2.3366, "step": 561920 }, { "epoch": 0.98, "learning_rate": 1.0030796918215524e-06, "loss": 2.2901, "step": 561930 }, { "epoch": 0.98, "learning_rate": 1.0022077518947255e-06, "loss": 2.2997, "step": 561940 }, { "epoch": 0.98, "learning_rate": 1.0013358119678987e-06, "loss": 2.3353, "step": 561950 }, { "epoch": 0.98, "learning_rate": 1.000463872041072e-06, "loss": 2.217, "step": 561960 }, { "epoch": 0.98, "learning_rate": 9.995919321142451e-07, "loss": 2.3019, "step": 561970 }, { "epoch": 0.98, "learning_rate": 9.987199921874183e-07, "loss": 2.2875, "step": 561980 }, { "epoch": 0.98, "learning_rate": 9.978480522605916e-07, "loss": 2.2951, "step": 561990 }, { "epoch": 0.98, "learning_rate": 9.969761123337648e-07, "loss": 2.1514, "step": 562000 }, { "epoch": 0.98, "learning_rate": 9.961041724069379e-07, "loss": 2.264, "step": 562010 }, { "epoch": 0.98, "learning_rate": 9.952322324801112e-07, "loss": 2.2657, "step": 562020 }, { "epoch": 0.98, "learning_rate": 9.943602925532844e-07, "loss": 2.3328, "step": 562030 }, { "epoch": 0.98, "learning_rate": 9.934883526264575e-07, "loss": 2.3698, "step": 562040 }, { "epoch": 0.98, "learning_rate": 9.926164126996309e-07, "loss": 2.2118, "step": 562050 }, { "epoch": 0.98, "learning_rate": 9.91744472772804e-07, "loss": 2.3477, "step": 562060 }, { "epoch": 0.98, "learning_rate": 9.908725328459771e-07, "loss": 2.2331, "step": 562070 }, { "epoch": 0.98, "learning_rate": 9.900005929191503e-07, "loss": 2.3357, "step": 562080 }, { "epoch": 0.98, "learning_rate": 9.891286529923236e-07, "loss": 2.285, "step": 562090 }, { "epoch": 0.98, "learning_rate": 9.882567130654967e-07, "loss": 2.3814, "step": 562100 }, { "epoch": 0.98, "learning_rate": 9.873847731386699e-07, "loss": 2.3199, "step": 562110 }, { "epoch": 0.98, "learning_rate": 9.865128332118432e-07, "loss": 2.1881, "step": 562120 }, { "epoch": 0.98, "learning_rate": 9.856408932850164e-07, "loss": 2.3348, "step": 562130 }, { "epoch": 0.98, "learning_rate": 9.847689533581895e-07, "loss": 2.349, "step": 562140 }, { "epoch": 0.98, "learning_rate": 9.838970134313628e-07, "loss": 2.2428, "step": 562150 }, { "epoch": 0.98, "learning_rate": 9.83025073504536e-07, "loss": 2.2607, "step": 562160 }, { "epoch": 0.98, "learning_rate": 9.821531335777091e-07, "loss": 2.3305, "step": 562170 }, { "epoch": 0.98, "learning_rate": 9.812811936508825e-07, "loss": 2.3528, "step": 562180 }, { "epoch": 0.98, "learning_rate": 9.804092537240556e-07, "loss": 2.3714, "step": 562190 }, { "epoch": 0.98, "learning_rate": 9.795373137972287e-07, "loss": 2.331, "step": 562200 }, { "epoch": 0.98, "learning_rate": 9.786653738704019e-07, "loss": 2.187, "step": 562210 }, { "epoch": 0.98, "learning_rate": 9.777934339435752e-07, "loss": 2.3204, "step": 562220 }, { "epoch": 0.98, "learning_rate": 9.769214940167483e-07, "loss": 2.2534, "step": 562230 }, { "epoch": 0.98, "learning_rate": 9.760495540899215e-07, "loss": 2.1692, "step": 562240 }, { "epoch": 0.98, "learning_rate": 9.751776141630948e-07, "loss": 2.2021, "step": 562250 }, { "epoch": 0.98, "learning_rate": 9.74305674236268e-07, "loss": 2.3338, "step": 562260 }, { "epoch": 0.98, "learning_rate": 9.73433734309441e-07, "loss": 2.1877, "step": 562270 }, { "epoch": 0.98, "learning_rate": 9.725617943826144e-07, "loss": 2.1975, "step": 562280 }, { "epoch": 0.98, "learning_rate": 9.716898544557876e-07, "loss": 2.2767, "step": 562290 }, { "epoch": 0.98, "learning_rate": 9.708179145289607e-07, "loss": 2.2955, "step": 562300 }, { "epoch": 0.98, "learning_rate": 9.699459746021338e-07, "loss": 2.3001, "step": 562310 }, { "epoch": 0.98, "learning_rate": 9.690740346753072e-07, "loss": 2.2813, "step": 562320 }, { "epoch": 0.98, "learning_rate": 9.682020947484803e-07, "loss": 2.2731, "step": 562330 }, { "epoch": 0.98, "learning_rate": 9.673301548216535e-07, "loss": 2.2692, "step": 562340 }, { "epoch": 0.98, "learning_rate": 9.664582148948268e-07, "loss": 2.2259, "step": 562350 }, { "epoch": 0.98, "learning_rate": 9.65586274968e-07, "loss": 2.3122, "step": 562360 }, { "epoch": 0.98, "learning_rate": 9.64714335041173e-07, "loss": 2.3276, "step": 562370 }, { "epoch": 0.98, "learning_rate": 9.638423951143464e-07, "loss": 2.2612, "step": 562380 }, { "epoch": 0.98, "learning_rate": 9.629704551875196e-07, "loss": 2.2987, "step": 562390 }, { "epoch": 0.98, "learning_rate": 9.620985152606927e-07, "loss": 2.2785, "step": 562400 }, { "epoch": 0.98, "learning_rate": 9.612265753338658e-07, "loss": 2.1792, "step": 562410 }, { "epoch": 0.98, "learning_rate": 9.603546354070392e-07, "loss": 2.1427, "step": 562420 }, { "epoch": 0.98, "learning_rate": 9.594826954802123e-07, "loss": 2.2518, "step": 562430 }, { "epoch": 0.98, "learning_rate": 9.586107555533854e-07, "loss": 2.3458, "step": 562440 }, { "epoch": 0.98, "learning_rate": 9.577388156265588e-07, "loss": 2.2893, "step": 562450 }, { "epoch": 0.98, "learning_rate": 9.56866875699732e-07, "loss": 2.2465, "step": 562460 }, { "epoch": 0.98, "learning_rate": 9.55994935772905e-07, "loss": 2.3136, "step": 562470 }, { "epoch": 0.98, "learning_rate": 9.551229958460784e-07, "loss": 2.2978, "step": 562480 }, { "epoch": 0.98, "learning_rate": 9.542510559192515e-07, "loss": 2.3661, "step": 562490 }, { "epoch": 0.98, "learning_rate": 9.533791159924246e-07, "loss": 2.2757, "step": 562500 }, { "epoch": 0.98, "learning_rate": 9.525071760655977e-07, "loss": 2.2476, "step": 562510 }, { "epoch": 0.98, "learning_rate": 9.51635236138771e-07, "loss": 2.2354, "step": 562520 }, { "epoch": 0.98, "learning_rate": 9.507632962119442e-07, "loss": 2.2733, "step": 562530 }, { "epoch": 0.98, "learning_rate": 9.498913562851173e-07, "loss": 2.3437, "step": 562540 }, { "epoch": 0.98, "learning_rate": 9.490194163582907e-07, "loss": 2.2418, "step": 562550 }, { "epoch": 0.98, "learning_rate": 9.481474764314638e-07, "loss": 2.1783, "step": 562560 }, { "epoch": 0.98, "learning_rate": 9.472755365046369e-07, "loss": 2.3158, "step": 562570 }, { "epoch": 0.98, "learning_rate": 9.464035965778103e-07, "loss": 2.2304, "step": 562580 }, { "epoch": 0.98, "learning_rate": 9.455316566509834e-07, "loss": 2.1899, "step": 562590 }, { "epoch": 0.98, "learning_rate": 9.446597167241565e-07, "loss": 2.1701, "step": 562600 }, { "epoch": 0.98, "learning_rate": 9.437877767973299e-07, "loss": 2.2597, "step": 562610 }, { "epoch": 0.98, "learning_rate": 9.42915836870503e-07, "loss": 2.3538, "step": 562620 }, { "epoch": 0.98, "learning_rate": 9.420438969436762e-07, "loss": 2.1842, "step": 562630 }, { "epoch": 0.98, "learning_rate": 9.411719570168493e-07, "loss": 2.1564, "step": 562640 }, { "epoch": 0.98, "learning_rate": 9.403000170900226e-07, "loss": 2.2102, "step": 562650 }, { "epoch": 0.98, "learning_rate": 9.394280771631958e-07, "loss": 2.2827, "step": 562660 }, { "epoch": 0.98, "learning_rate": 9.385561372363689e-07, "loss": 2.2028, "step": 562670 }, { "epoch": 0.98, "learning_rate": 9.376841973095423e-07, "loss": 2.2833, "step": 562680 }, { "epoch": 0.98, "learning_rate": 9.368122573827154e-07, "loss": 2.3622, "step": 562690 }, { "epoch": 0.98, "learning_rate": 9.359403174558885e-07, "loss": 2.2367, "step": 562700 }, { "epoch": 0.98, "learning_rate": 9.350683775290619e-07, "loss": 2.2848, "step": 562710 }, { "epoch": 0.98, "learning_rate": 9.34196437602235e-07, "loss": 2.2458, "step": 562720 }, { "epoch": 0.98, "learning_rate": 9.333244976754081e-07, "loss": 2.2344, "step": 562730 }, { "epoch": 0.98, "learning_rate": 9.324525577485813e-07, "loss": 2.3331, "step": 562740 }, { "epoch": 0.98, "learning_rate": 9.315806178217546e-07, "loss": 2.1674, "step": 562750 }, { "epoch": 0.98, "learning_rate": 9.307086778949278e-07, "loss": 2.2783, "step": 562760 }, { "epoch": 0.98, "learning_rate": 9.298367379681009e-07, "loss": 2.3326, "step": 562770 }, { "epoch": 0.98, "learning_rate": 9.289647980412742e-07, "loss": 2.3818, "step": 562780 }, { "epoch": 0.98, "learning_rate": 9.280928581144474e-07, "loss": 2.2422, "step": 562790 }, { "epoch": 0.98, "learning_rate": 9.272209181876205e-07, "loss": 2.3358, "step": 562800 }, { "epoch": 0.98, "learning_rate": 9.263489782607939e-07, "loss": 2.2369, "step": 562810 }, { "epoch": 0.98, "learning_rate": 9.25477038333967e-07, "loss": 2.2468, "step": 562820 }, { "epoch": 0.98, "learning_rate": 9.246050984071401e-07, "loss": 2.3564, "step": 562830 }, { "epoch": 0.98, "learning_rate": 9.237331584803134e-07, "loss": 2.2635, "step": 562840 }, { "epoch": 0.98, "learning_rate": 9.228612185534866e-07, "loss": 2.31, "step": 562850 }, { "epoch": 0.98, "learning_rate": 9.219892786266597e-07, "loss": 2.1726, "step": 562860 }, { "epoch": 0.98, "learning_rate": 9.211173386998329e-07, "loss": 2.2974, "step": 562870 }, { "epoch": 0.98, "learning_rate": 9.202453987730062e-07, "loss": 2.3372, "step": 562880 }, { "epoch": 0.98, "learning_rate": 9.193734588461794e-07, "loss": 2.1252, "step": 562890 }, { "epoch": 0.98, "learning_rate": 9.185015189193525e-07, "loss": 2.1867, "step": 562900 }, { "epoch": 0.98, "learning_rate": 9.176295789925258e-07, "loss": 2.2259, "step": 562910 }, { "epoch": 0.98, "learning_rate": 9.16757639065699e-07, "loss": 2.2098, "step": 562920 }, { "epoch": 0.98, "learning_rate": 9.158856991388721e-07, "loss": 2.3059, "step": 562930 }, { "epoch": 0.98, "learning_rate": 9.150137592120453e-07, "loss": 2.2977, "step": 562940 }, { "epoch": 0.98, "learning_rate": 9.141418192852186e-07, "loss": 2.2685, "step": 562950 }, { "epoch": 0.98, "learning_rate": 9.132698793583917e-07, "loss": 2.1683, "step": 562960 }, { "epoch": 0.98, "learning_rate": 9.12397939431565e-07, "loss": 2.1839, "step": 562970 }, { "epoch": 0.98, "learning_rate": 9.115259995047382e-07, "loss": 2.2489, "step": 562980 }, { "epoch": 0.98, "learning_rate": 9.106540595779113e-07, "loss": 2.2183, "step": 562990 }, { "epoch": 0.98, "learning_rate": 9.097821196510845e-07, "loss": 2.2668, "step": 563000 }, { "epoch": 0.98, "learning_rate": 9.089101797242578e-07, "loss": 2.2331, "step": 563010 }, { "epoch": 0.98, "learning_rate": 9.08038239797431e-07, "loss": 2.2943, "step": 563020 }, { "epoch": 0.98, "learning_rate": 9.071662998706041e-07, "loss": 2.3451, "step": 563030 }, { "epoch": 0.98, "learning_rate": 9.062943599437773e-07, "loss": 2.168, "step": 563040 }, { "epoch": 0.98, "learning_rate": 9.054224200169506e-07, "loss": 2.253, "step": 563050 }, { "epoch": 0.98, "learning_rate": 9.045504800901237e-07, "loss": 2.2498, "step": 563060 }, { "epoch": 0.98, "learning_rate": 9.036785401632969e-07, "loss": 2.1895, "step": 563070 }, { "epoch": 0.98, "learning_rate": 9.028066002364702e-07, "loss": 2.2042, "step": 563080 }, { "epoch": 0.98, "learning_rate": 9.019346603096433e-07, "loss": 2.3531, "step": 563090 }, { "epoch": 0.98, "learning_rate": 9.010627203828166e-07, "loss": 2.1927, "step": 563100 }, { "epoch": 0.98, "learning_rate": 9.001907804559898e-07, "loss": 2.178, "step": 563110 }, { "epoch": 0.98, "learning_rate": 8.993188405291629e-07, "loss": 2.2787, "step": 563120 }, { "epoch": 0.98, "learning_rate": 8.984469006023361e-07, "loss": 2.3142, "step": 563130 }, { "epoch": 0.98, "learning_rate": 8.975749606755093e-07, "loss": 2.3551, "step": 563140 }, { "epoch": 0.98, "learning_rate": 8.967030207486825e-07, "loss": 2.2375, "step": 563150 }, { "epoch": 0.98, "learning_rate": 8.958310808218557e-07, "loss": 2.3814, "step": 563160 }, { "epoch": 0.98, "learning_rate": 8.949591408950289e-07, "loss": 2.2586, "step": 563170 }, { "epoch": 0.98, "learning_rate": 8.940872009682022e-07, "loss": 2.2952, "step": 563180 }, { "epoch": 0.98, "learning_rate": 8.932152610413753e-07, "loss": 2.2833, "step": 563190 }, { "epoch": 0.98, "learning_rate": 8.923433211145485e-07, "loss": 2.23, "step": 563200 }, { "epoch": 0.98, "learning_rate": 8.914713811877218e-07, "loss": 2.1484, "step": 563210 }, { "epoch": 0.98, "learning_rate": 8.905994412608949e-07, "loss": 2.167, "step": 563220 }, { "epoch": 0.98, "learning_rate": 8.897275013340682e-07, "loss": 2.3548, "step": 563230 }, { "epoch": 0.98, "learning_rate": 8.888555614072413e-07, "loss": 2.2475, "step": 563240 }, { "epoch": 0.98, "learning_rate": 8.879836214804145e-07, "loss": 2.2569, "step": 563250 }, { "epoch": 0.98, "learning_rate": 8.871116815535878e-07, "loss": 2.269, "step": 563260 }, { "epoch": 0.98, "learning_rate": 8.862397416267609e-07, "loss": 2.2654, "step": 563270 }, { "epoch": 0.98, "learning_rate": 8.853678016999341e-07, "loss": 2.3581, "step": 563280 }, { "epoch": 0.98, "learning_rate": 8.844958617731073e-07, "loss": 2.1809, "step": 563290 }, { "epoch": 0.98, "learning_rate": 8.836239218462805e-07, "loss": 2.3118, "step": 563300 }, { "epoch": 0.98, "learning_rate": 8.827519819194538e-07, "loss": 2.2944, "step": 563310 }, { "epoch": 0.98, "learning_rate": 8.818800419926269e-07, "loss": 2.2478, "step": 563320 }, { "epoch": 0.98, "learning_rate": 8.810081020658001e-07, "loss": 2.2749, "step": 563330 }, { "epoch": 0.98, "learning_rate": 8.801361621389733e-07, "loss": 2.2952, "step": 563340 }, { "epoch": 0.98, "learning_rate": 8.792642222121465e-07, "loss": 2.3279, "step": 563350 }, { "epoch": 0.98, "learning_rate": 8.783922822853198e-07, "loss": 2.2535, "step": 563360 }, { "epoch": 0.98, "learning_rate": 8.775203423584929e-07, "loss": 2.3122, "step": 563370 }, { "epoch": 0.98, "learning_rate": 8.766484024316661e-07, "loss": 2.0859, "step": 563380 }, { "epoch": 0.98, "learning_rate": 8.757764625048394e-07, "loss": 2.2589, "step": 563390 }, { "epoch": 0.98, "learning_rate": 8.749045225780125e-07, "loss": 2.2846, "step": 563400 }, { "epoch": 0.98, "learning_rate": 8.740325826511857e-07, "loss": 2.2639, "step": 563410 }, { "epoch": 0.98, "learning_rate": 8.731606427243589e-07, "loss": 2.2425, "step": 563420 }, { "epoch": 0.98, "learning_rate": 8.722887027975321e-07, "loss": 2.3136, "step": 563430 }, { "epoch": 0.98, "learning_rate": 8.714167628707053e-07, "loss": 2.2165, "step": 563440 }, { "epoch": 0.98, "learning_rate": 8.705448229438785e-07, "loss": 2.2748, "step": 563450 }, { "epoch": 0.98, "learning_rate": 8.696728830170517e-07, "loss": 2.3063, "step": 563460 }, { "epoch": 0.98, "learning_rate": 8.688009430902249e-07, "loss": 2.2266, "step": 563470 }, { "epoch": 0.98, "learning_rate": 8.679290031633981e-07, "loss": 2.3787, "step": 563480 }, { "epoch": 0.98, "learning_rate": 8.670570632365713e-07, "loss": 2.2116, "step": 563490 }, { "epoch": 0.98, "learning_rate": 8.661851233097445e-07, "loss": 2.3504, "step": 563500 }, { "epoch": 0.98, "learning_rate": 8.653131833829177e-07, "loss": 2.2168, "step": 563510 }, { "epoch": 0.98, "learning_rate": 8.64441243456091e-07, "loss": 2.1993, "step": 563520 }, { "epoch": 0.98, "learning_rate": 8.635693035292641e-07, "loss": 2.2392, "step": 563530 }, { "epoch": 0.98, "learning_rate": 8.626973636024372e-07, "loss": 2.2469, "step": 563540 }, { "epoch": 0.98, "learning_rate": 8.618254236756105e-07, "loss": 2.2169, "step": 563550 }, { "epoch": 0.98, "learning_rate": 8.609534837487837e-07, "loss": 2.1682, "step": 563560 }, { "epoch": 0.98, "learning_rate": 8.600815438219568e-07, "loss": 2.1782, "step": 563570 }, { "epoch": 0.98, "learning_rate": 8.592096038951301e-07, "loss": 2.2642, "step": 563580 }, { "epoch": 0.98, "learning_rate": 8.583376639683033e-07, "loss": 2.2717, "step": 563590 }, { "epoch": 0.98, "learning_rate": 8.574657240414765e-07, "loss": 2.1521, "step": 563600 }, { "epoch": 0.98, "learning_rate": 8.565937841146497e-07, "loss": 2.2407, "step": 563610 }, { "epoch": 0.98, "learning_rate": 8.557218441878229e-07, "loss": 2.2709, "step": 563620 }, { "epoch": 0.98, "learning_rate": 8.548499042609961e-07, "loss": 2.3894, "step": 563630 }, { "epoch": 0.98, "learning_rate": 8.539779643341692e-07, "loss": 2.2594, "step": 563640 }, { "epoch": 0.98, "learning_rate": 8.531060244073426e-07, "loss": 2.1642, "step": 563650 }, { "epoch": 0.98, "learning_rate": 8.522340844805157e-07, "loss": 2.3587, "step": 563660 }, { "epoch": 0.98, "learning_rate": 8.513621445536888e-07, "loss": 2.1569, "step": 563670 }, { "epoch": 0.98, "learning_rate": 8.504902046268621e-07, "loss": 2.2474, "step": 563680 }, { "epoch": 0.98, "learning_rate": 8.496182647000353e-07, "loss": 2.2394, "step": 563690 }, { "epoch": 0.98, "learning_rate": 8.487463247732084e-07, "loss": 2.3289, "step": 563700 }, { "epoch": 0.98, "learning_rate": 8.478743848463817e-07, "loss": 2.2337, "step": 563710 }, { "epoch": 0.98, "learning_rate": 8.470024449195549e-07, "loss": 2.1952, "step": 563720 }, { "epoch": 0.98, "learning_rate": 8.461305049927281e-07, "loss": 2.1816, "step": 563730 }, { "epoch": 0.98, "learning_rate": 8.452585650659012e-07, "loss": 2.2365, "step": 563740 }, { "epoch": 0.98, "learning_rate": 8.443866251390745e-07, "loss": 2.2146, "step": 563750 }, { "epoch": 0.98, "learning_rate": 8.435146852122477e-07, "loss": 2.2649, "step": 563760 }, { "epoch": 0.98, "learning_rate": 8.426427452854208e-07, "loss": 2.2548, "step": 563770 }, { "epoch": 0.98, "learning_rate": 8.417708053585942e-07, "loss": 2.229, "step": 563780 }, { "epoch": 0.98, "learning_rate": 8.408988654317673e-07, "loss": 2.2489, "step": 563790 }, { "epoch": 0.98, "learning_rate": 8.400269255049404e-07, "loss": 2.1303, "step": 563800 }, { "epoch": 0.98, "learning_rate": 8.391549855781137e-07, "loss": 2.2409, "step": 563810 }, { "epoch": 0.98, "learning_rate": 8.382830456512869e-07, "loss": 2.2933, "step": 563820 }, { "epoch": 0.98, "learning_rate": 8.3741110572446e-07, "loss": 2.3089, "step": 563830 }, { "epoch": 0.98, "learning_rate": 8.365391657976332e-07, "loss": 2.3019, "step": 563840 }, { "epoch": 0.98, "learning_rate": 8.356672258708065e-07, "loss": 2.1981, "step": 563850 }, { "epoch": 0.98, "learning_rate": 8.347952859439797e-07, "loss": 2.199, "step": 563860 }, { "epoch": 0.98, "learning_rate": 8.339233460171528e-07, "loss": 2.355, "step": 563870 }, { "epoch": 0.98, "learning_rate": 8.330514060903261e-07, "loss": 2.2595, "step": 563880 }, { "epoch": 0.98, "learning_rate": 8.321794661634993e-07, "loss": 2.0383, "step": 563890 }, { "epoch": 0.98, "learning_rate": 8.313075262366724e-07, "loss": 2.3561, "step": 563900 }, { "epoch": 0.98, "learning_rate": 8.304355863098458e-07, "loss": 2.2996, "step": 563910 }, { "epoch": 0.98, "learning_rate": 8.295636463830189e-07, "loss": 2.2617, "step": 563920 }, { "epoch": 0.98, "learning_rate": 8.28691706456192e-07, "loss": 2.2765, "step": 563930 }, { "epoch": 0.98, "learning_rate": 8.278197665293653e-07, "loss": 2.2632, "step": 563940 }, { "epoch": 0.98, "learning_rate": 8.269478266025385e-07, "loss": 2.2946, "step": 563950 }, { "epoch": 0.98, "learning_rate": 8.260758866757116e-07, "loss": 2.2306, "step": 563960 }, { "epoch": 0.98, "learning_rate": 8.252039467488848e-07, "loss": 2.3172, "step": 563970 }, { "epoch": 0.98, "learning_rate": 8.243320068220581e-07, "loss": 2.2092, "step": 563980 }, { "epoch": 0.98, "learning_rate": 8.234600668952313e-07, "loss": 2.3072, "step": 563990 }, { "epoch": 0.98, "learning_rate": 8.225881269684044e-07, "loss": 2.1649, "step": 564000 }, { "epoch": 0.98, "learning_rate": 8.217161870415777e-07, "loss": 2.3146, "step": 564010 }, { "epoch": 0.98, "learning_rate": 8.208442471147509e-07, "loss": 2.2742, "step": 564020 }, { "epoch": 0.98, "learning_rate": 8.19972307187924e-07, "loss": 2.2596, "step": 564030 }, { "epoch": 0.98, "learning_rate": 8.191003672610974e-07, "loss": 2.2809, "step": 564040 }, { "epoch": 0.98, "learning_rate": 8.182284273342705e-07, "loss": 2.303, "step": 564050 }, { "epoch": 0.98, "learning_rate": 8.173564874074436e-07, "loss": 2.3044, "step": 564060 }, { "epoch": 0.98, "learning_rate": 8.164845474806168e-07, "loss": 2.2742, "step": 564070 }, { "epoch": 0.98, "learning_rate": 8.156126075537901e-07, "loss": 2.2303, "step": 564080 }, { "epoch": 0.98, "learning_rate": 8.147406676269632e-07, "loss": 2.1893, "step": 564090 }, { "epoch": 0.98, "learning_rate": 8.138687277001364e-07, "loss": 2.2682, "step": 564100 }, { "epoch": 0.98, "learning_rate": 8.129967877733097e-07, "loss": 2.2967, "step": 564110 }, { "epoch": 0.98, "learning_rate": 8.121248478464829e-07, "loss": 2.2862, "step": 564120 }, { "epoch": 0.98, "learning_rate": 8.11252907919656e-07, "loss": 2.2666, "step": 564130 }, { "epoch": 0.98, "learning_rate": 8.103809679928293e-07, "loss": 2.1685, "step": 564140 }, { "epoch": 0.98, "learning_rate": 8.095090280660025e-07, "loss": 2.2236, "step": 564150 }, { "epoch": 0.98, "learning_rate": 8.086370881391756e-07, "loss": 2.319, "step": 564160 }, { "epoch": 0.98, "learning_rate": 8.077651482123487e-07, "loss": 2.2707, "step": 564170 }, { "epoch": 0.98, "learning_rate": 8.068932082855221e-07, "loss": 2.1779, "step": 564180 }, { "epoch": 0.98, "learning_rate": 8.060212683586952e-07, "loss": 2.3288, "step": 564190 }, { "epoch": 0.98, "learning_rate": 8.051493284318684e-07, "loss": 2.2389, "step": 564200 }, { "epoch": 0.98, "learning_rate": 8.042773885050417e-07, "loss": 2.1754, "step": 564210 }, { "epoch": 0.98, "learning_rate": 8.034054485782148e-07, "loss": 2.3098, "step": 564220 }, { "epoch": 0.98, "learning_rate": 8.02533508651388e-07, "loss": 2.3338, "step": 564230 }, { "epoch": 0.98, "learning_rate": 8.016615687245613e-07, "loss": 2.2843, "step": 564240 }, { "epoch": 0.98, "learning_rate": 8.007896287977345e-07, "loss": 2.3562, "step": 564250 }, { "epoch": 0.98, "learning_rate": 7.999176888709076e-07, "loss": 2.204, "step": 564260 }, { "epoch": 0.98, "learning_rate": 7.990457489440807e-07, "loss": 2.1956, "step": 564270 }, { "epoch": 0.98, "learning_rate": 7.981738090172541e-07, "loss": 2.3456, "step": 564280 }, { "epoch": 0.98, "learning_rate": 7.973018690904272e-07, "loss": 2.179, "step": 564290 }, { "epoch": 0.98, "learning_rate": 7.964299291636003e-07, "loss": 2.1896, "step": 564300 }, { "epoch": 0.98, "learning_rate": 7.955579892367737e-07, "loss": 2.3574, "step": 564310 }, { "epoch": 0.98, "learning_rate": 7.946860493099468e-07, "loss": 2.1898, "step": 564320 }, { "epoch": 0.98, "learning_rate": 7.9381410938312e-07, "loss": 2.2799, "step": 564330 }, { "epoch": 0.98, "learning_rate": 7.929421694562933e-07, "loss": 2.2201, "step": 564340 }, { "epoch": 0.98, "learning_rate": 7.920702295294664e-07, "loss": 2.2473, "step": 564350 }, { "epoch": 0.98, "learning_rate": 7.911982896026396e-07, "loss": 2.2674, "step": 564360 }, { "epoch": 0.98, "learning_rate": 7.903263496758127e-07, "loss": 2.3348, "step": 564370 }, { "epoch": 0.98, "learning_rate": 7.89454409748986e-07, "loss": 2.3759, "step": 564380 }, { "epoch": 0.98, "learning_rate": 7.885824698221592e-07, "loss": 2.271, "step": 564390 }, { "epoch": 0.98, "learning_rate": 7.877105298953323e-07, "loss": 2.3301, "step": 564400 }, { "epoch": 0.98, "learning_rate": 7.868385899685057e-07, "loss": 2.357, "step": 564410 }, { "epoch": 0.98, "learning_rate": 7.859666500416788e-07, "loss": 2.2438, "step": 564420 }, { "epoch": 0.98, "learning_rate": 7.850947101148519e-07, "loss": 2.1113, "step": 564430 }, { "epoch": 0.98, "learning_rate": 7.842227701880253e-07, "loss": 2.2355, "step": 564440 }, { "epoch": 0.98, "learning_rate": 7.833508302611984e-07, "loss": 2.236, "step": 564450 }, { "epoch": 0.98, "learning_rate": 7.824788903343715e-07, "loss": 2.3107, "step": 564460 }, { "epoch": 0.98, "learning_rate": 7.816069504075447e-07, "loss": 2.1796, "step": 564470 }, { "epoch": 0.98, "learning_rate": 7.807350104807179e-07, "loss": 2.1674, "step": 564480 }, { "epoch": 0.98, "learning_rate": 7.798630705538912e-07, "loss": 2.2377, "step": 564490 }, { "epoch": 0.98, "learning_rate": 7.789911306270644e-07, "loss": 2.1686, "step": 564500 }, { "epoch": 0.98, "learning_rate": 7.781191907002375e-07, "loss": 2.2091, "step": 564510 }, { "epoch": 0.98, "learning_rate": 7.772472507734108e-07, "loss": 2.2464, "step": 564520 }, { "epoch": 0.98, "learning_rate": 7.763753108465839e-07, "loss": 2.2199, "step": 564530 }, { "epoch": 0.98, "learning_rate": 7.755033709197572e-07, "loss": 2.2362, "step": 564540 }, { "epoch": 0.98, "learning_rate": 7.746314309929304e-07, "loss": 2.2365, "step": 564550 }, { "epoch": 0.98, "learning_rate": 7.737594910661035e-07, "loss": 2.2101, "step": 564560 }, { "epoch": 0.98, "learning_rate": 7.728875511392768e-07, "loss": 2.2937, "step": 564570 }, { "epoch": 0.98, "learning_rate": 7.720156112124499e-07, "loss": 2.2002, "step": 564580 }, { "epoch": 0.98, "learning_rate": 7.711436712856231e-07, "loss": 2.0609, "step": 564590 }, { "epoch": 0.98, "learning_rate": 7.702717313587964e-07, "loss": 2.1932, "step": 564600 }, { "epoch": 0.98, "learning_rate": 7.693997914319695e-07, "loss": 2.3044, "step": 564610 }, { "epoch": 0.98, "learning_rate": 7.685278515051428e-07, "loss": 2.2504, "step": 564620 }, { "epoch": 0.98, "learning_rate": 7.67655911578316e-07, "loss": 2.1779, "step": 564630 }, { "epoch": 0.98, "learning_rate": 7.667839716514891e-07, "loss": 2.1509, "step": 564640 }, { "epoch": 0.98, "learning_rate": 7.659120317246624e-07, "loss": 2.222, "step": 564650 }, { "epoch": 0.98, "learning_rate": 7.650400917978355e-07, "loss": 2.3494, "step": 564660 }, { "epoch": 0.98, "learning_rate": 7.641681518710088e-07, "loss": 2.3317, "step": 564670 }, { "epoch": 0.98, "learning_rate": 7.63296211944182e-07, "loss": 2.3167, "step": 564680 }, { "epoch": 0.98, "learning_rate": 7.624242720173551e-07, "loss": 2.315, "step": 564690 }, { "epoch": 0.98, "learning_rate": 7.615523320905284e-07, "loss": 2.3124, "step": 564700 }, { "epoch": 0.98, "learning_rate": 7.606803921637015e-07, "loss": 2.2515, "step": 564710 }, { "epoch": 0.98, "learning_rate": 7.598084522368747e-07, "loss": 2.3442, "step": 564720 }, { "epoch": 0.98, "learning_rate": 7.58936512310048e-07, "loss": 2.2467, "step": 564730 }, { "epoch": 0.98, "learning_rate": 7.580645723832211e-07, "loss": 2.228, "step": 564740 }, { "epoch": 0.98, "learning_rate": 7.571926324563944e-07, "loss": 2.2962, "step": 564750 }, { "epoch": 0.98, "learning_rate": 7.563206925295675e-07, "loss": 2.333, "step": 564760 }, { "epoch": 0.98, "learning_rate": 7.554487526027407e-07, "loss": 2.2435, "step": 564770 }, { "epoch": 0.98, "learning_rate": 7.54576812675914e-07, "loss": 2.2097, "step": 564780 }, { "epoch": 0.98, "learning_rate": 7.537048727490871e-07, "loss": 2.2659, "step": 564790 }, { "epoch": 0.98, "learning_rate": 7.528329328222604e-07, "loss": 2.2521, "step": 564800 }, { "epoch": 0.98, "learning_rate": 7.519609928954335e-07, "loss": 2.3104, "step": 564810 }, { "epoch": 0.98, "learning_rate": 7.510890529686067e-07, "loss": 2.3152, "step": 564820 }, { "epoch": 0.98, "learning_rate": 7.5021711304178e-07, "loss": 2.2084, "step": 564830 }, { "epoch": 0.99, "learning_rate": 7.493451731149531e-07, "loss": 2.2544, "step": 564840 }, { "epoch": 0.99, "learning_rate": 7.484732331881263e-07, "loss": 2.2766, "step": 564850 }, { "epoch": 0.99, "learning_rate": 7.476012932612995e-07, "loss": 2.3273, "step": 564860 }, { "epoch": 0.99, "learning_rate": 7.467293533344727e-07, "loss": 2.3189, "step": 564870 }, { "epoch": 0.99, "learning_rate": 7.45857413407646e-07, "loss": 2.0952, "step": 564880 }, { "epoch": 0.99, "learning_rate": 7.449854734808191e-07, "loss": 2.1253, "step": 564890 }, { "epoch": 0.99, "learning_rate": 7.441135335539923e-07, "loss": 2.3869, "step": 564900 }, { "epoch": 0.99, "learning_rate": 7.432415936271655e-07, "loss": 2.2481, "step": 564910 }, { "epoch": 0.99, "learning_rate": 7.423696537003387e-07, "loss": 2.1201, "step": 564920 }, { "epoch": 0.99, "learning_rate": 7.41497713773512e-07, "loss": 2.2553, "step": 564930 }, { "epoch": 0.99, "learning_rate": 7.406257738466851e-07, "loss": 2.2527, "step": 564940 }, { "epoch": 0.99, "learning_rate": 7.397538339198583e-07, "loss": 2.2273, "step": 564950 }, { "epoch": 0.99, "learning_rate": 7.388818939930315e-07, "loss": 2.2804, "step": 564960 }, { "epoch": 0.99, "learning_rate": 7.380099540662047e-07, "loss": 2.2636, "step": 564970 }, { "epoch": 0.99, "learning_rate": 7.371380141393779e-07, "loss": 2.2305, "step": 564980 }, { "epoch": 0.99, "learning_rate": 7.362660742125511e-07, "loss": 2.1349, "step": 564990 }, { "epoch": 0.99, "learning_rate": 7.353941342857243e-07, "loss": 2.1725, "step": 565000 }, { "epoch": 0.99, "learning_rate": 7.345221943588974e-07, "loss": 2.3944, "step": 565010 }, { "epoch": 0.99, "learning_rate": 7.336502544320707e-07, "loss": 2.3278, "step": 565020 }, { "epoch": 0.99, "learning_rate": 7.327783145052439e-07, "loss": 2.2342, "step": 565030 }, { "epoch": 0.99, "learning_rate": 7.319063745784171e-07, "loss": 2.2451, "step": 565040 }, { "epoch": 0.99, "learning_rate": 7.310344346515903e-07, "loss": 2.1649, "step": 565050 }, { "epoch": 0.99, "learning_rate": 7.301624947247634e-07, "loss": 2.3163, "step": 565060 }, { "epoch": 0.99, "learning_rate": 7.292905547979367e-07, "loss": 2.3208, "step": 565070 }, { "epoch": 0.99, "learning_rate": 7.284186148711099e-07, "loss": 2.2829, "step": 565080 }, { "epoch": 0.99, "learning_rate": 7.275466749442831e-07, "loss": 2.3568, "step": 565090 }, { "epoch": 0.99, "learning_rate": 7.266747350174563e-07, "loss": 2.2269, "step": 565100 }, { "epoch": 0.99, "learning_rate": 7.258027950906294e-07, "loss": 2.2657, "step": 565110 }, { "epoch": 0.99, "learning_rate": 7.249308551638027e-07, "loss": 2.2955, "step": 565120 }, { "epoch": 0.99, "learning_rate": 7.240589152369759e-07, "loss": 2.2948, "step": 565130 }, { "epoch": 0.99, "learning_rate": 7.23186975310149e-07, "loss": 2.3701, "step": 565140 }, { "epoch": 0.99, "learning_rate": 7.223150353833223e-07, "loss": 2.1348, "step": 565150 }, { "epoch": 0.99, "learning_rate": 7.214430954564954e-07, "loss": 2.1794, "step": 565160 }, { "epoch": 0.99, "learning_rate": 7.205711555296687e-07, "loss": 2.2437, "step": 565170 }, { "epoch": 0.99, "learning_rate": 7.196992156028419e-07, "loss": 2.2745, "step": 565180 }, { "epoch": 0.99, "learning_rate": 7.18827275676015e-07, "loss": 2.3191, "step": 565190 }, { "epoch": 0.99, "learning_rate": 7.179553357491883e-07, "loss": 2.229, "step": 565200 }, { "epoch": 0.99, "learning_rate": 7.170833958223614e-07, "loss": 2.2031, "step": 565210 }, { "epoch": 0.99, "learning_rate": 7.162114558955347e-07, "loss": 2.187, "step": 565220 }, { "epoch": 0.99, "learning_rate": 7.153395159687079e-07, "loss": 2.338, "step": 565230 }, { "epoch": 0.99, "learning_rate": 7.14467576041881e-07, "loss": 2.1543, "step": 565240 }, { "epoch": 0.99, "learning_rate": 7.135956361150543e-07, "loss": 2.2273, "step": 565250 }, { "epoch": 0.99, "learning_rate": 7.127236961882274e-07, "loss": 2.2736, "step": 565260 }, { "epoch": 0.99, "learning_rate": 7.118517562614006e-07, "loss": 2.2796, "step": 565270 }, { "epoch": 0.99, "learning_rate": 7.109798163345739e-07, "loss": 2.2559, "step": 565280 }, { "epoch": 0.99, "learning_rate": 7.10107876407747e-07, "loss": 2.2563, "step": 565290 }, { "epoch": 0.99, "learning_rate": 7.092359364809203e-07, "loss": 2.2775, "step": 565300 }, { "epoch": 0.99, "learning_rate": 7.083639965540934e-07, "loss": 2.2039, "step": 565310 }, { "epoch": 0.99, "learning_rate": 7.074920566272666e-07, "loss": 2.2327, "step": 565320 }, { "epoch": 0.99, "learning_rate": 7.066201167004399e-07, "loss": 2.3388, "step": 565330 }, { "epoch": 0.99, "learning_rate": 7.05748176773613e-07, "loss": 2.2131, "step": 565340 }, { "epoch": 0.99, "learning_rate": 7.048762368467862e-07, "loss": 2.2595, "step": 565350 }, { "epoch": 0.99, "learning_rate": 7.040042969199594e-07, "loss": 2.1787, "step": 565360 }, { "epoch": 0.99, "learning_rate": 7.031323569931326e-07, "loss": 2.2854, "step": 565370 }, { "epoch": 0.99, "learning_rate": 7.022604170663059e-07, "loss": 2.2124, "step": 565380 }, { "epoch": 0.99, "learning_rate": 7.01388477139479e-07, "loss": 2.1589, "step": 565390 }, { "epoch": 0.99, "learning_rate": 7.005165372126522e-07, "loss": 2.2644, "step": 565400 }, { "epoch": 0.99, "learning_rate": 6.996445972858254e-07, "loss": 2.4313, "step": 565410 }, { "epoch": 0.99, "learning_rate": 6.987726573589986e-07, "loss": 2.2437, "step": 565420 }, { "epoch": 0.99, "learning_rate": 6.979007174321719e-07, "loss": 2.2907, "step": 565430 }, { "epoch": 0.99, "learning_rate": 6.97028777505345e-07, "loss": 2.2222, "step": 565440 }, { "epoch": 0.99, "learning_rate": 6.961568375785182e-07, "loss": 2.3191, "step": 565450 }, { "epoch": 0.99, "learning_rate": 6.952848976516914e-07, "loss": 2.1629, "step": 565460 }, { "epoch": 0.99, "learning_rate": 6.944129577248646e-07, "loss": 2.1649, "step": 565470 }, { "epoch": 0.99, "learning_rate": 6.935410177980378e-07, "loss": 2.1814, "step": 565480 }, { "epoch": 0.99, "learning_rate": 6.92669077871211e-07, "loss": 2.1859, "step": 565490 }, { "epoch": 0.99, "learning_rate": 6.917971379443842e-07, "loss": 2.2481, "step": 565500 }, { "epoch": 0.99, "learning_rate": 6.909251980175574e-07, "loss": 2.2751, "step": 565510 }, { "epoch": 0.99, "learning_rate": 6.900532580907306e-07, "loss": 2.1521, "step": 565520 }, { "epoch": 0.99, "learning_rate": 6.891813181639038e-07, "loss": 2.3292, "step": 565530 }, { "epoch": 0.99, "learning_rate": 6.88309378237077e-07, "loss": 2.2744, "step": 565540 }, { "epoch": 0.99, "learning_rate": 6.874374383102502e-07, "loss": 2.311, "step": 565550 }, { "epoch": 0.99, "learning_rate": 6.865654983834233e-07, "loss": 2.3417, "step": 565560 }, { "epoch": 0.99, "learning_rate": 6.856935584565966e-07, "loss": 2.2685, "step": 565570 }, { "epoch": 0.99, "learning_rate": 6.848216185297698e-07, "loss": 2.1714, "step": 565580 }, { "epoch": 0.99, "learning_rate": 6.83949678602943e-07, "loss": 2.2941, "step": 565590 }, { "epoch": 0.99, "learning_rate": 6.830777386761162e-07, "loss": 2.2803, "step": 565600 }, { "epoch": 0.99, "learning_rate": 6.822057987492893e-07, "loss": 2.2903, "step": 565610 }, { "epoch": 0.99, "learning_rate": 6.813338588224626e-07, "loss": 2.246, "step": 565620 }, { "epoch": 0.99, "learning_rate": 6.804619188956358e-07, "loss": 2.3149, "step": 565630 }, { "epoch": 0.99, "learning_rate": 6.79589978968809e-07, "loss": 2.2535, "step": 565640 }, { "epoch": 0.99, "learning_rate": 6.787180390419822e-07, "loss": 2.3071, "step": 565650 }, { "epoch": 0.99, "learning_rate": 6.778460991151553e-07, "loss": 2.1893, "step": 565660 }, { "epoch": 0.99, "learning_rate": 6.769741591883286e-07, "loss": 2.2613, "step": 565670 }, { "epoch": 0.99, "learning_rate": 6.761022192615018e-07, "loss": 2.3175, "step": 565680 }, { "epoch": 0.99, "learning_rate": 6.752302793346749e-07, "loss": 2.2578, "step": 565690 }, { "epoch": 0.99, "learning_rate": 6.743583394078482e-07, "loss": 2.2987, "step": 565700 }, { "epoch": 0.99, "learning_rate": 6.734863994810213e-07, "loss": 2.2943, "step": 565710 }, { "epoch": 0.99, "learning_rate": 6.726144595541946e-07, "loss": 2.3093, "step": 565720 }, { "epoch": 0.99, "learning_rate": 6.717425196273678e-07, "loss": 2.3023, "step": 565730 }, { "epoch": 0.99, "learning_rate": 6.708705797005409e-07, "loss": 2.3029, "step": 565740 }, { "epoch": 0.99, "learning_rate": 6.699986397737142e-07, "loss": 2.2944, "step": 565750 }, { "epoch": 0.99, "learning_rate": 6.691266998468873e-07, "loss": 2.3321, "step": 565760 }, { "epoch": 0.99, "learning_rate": 6.682547599200606e-07, "loss": 2.1969, "step": 565770 }, { "epoch": 0.99, "learning_rate": 6.673828199932338e-07, "loss": 2.2164, "step": 565780 }, { "epoch": 0.99, "learning_rate": 6.665108800664069e-07, "loss": 2.3573, "step": 565790 }, { "epoch": 0.99, "learning_rate": 6.656389401395802e-07, "loss": 2.2565, "step": 565800 }, { "epoch": 0.99, "learning_rate": 6.647670002127533e-07, "loss": 2.0959, "step": 565810 }, { "epoch": 0.99, "learning_rate": 6.638950602859265e-07, "loss": 2.2382, "step": 565820 }, { "epoch": 0.99, "learning_rate": 6.630231203590998e-07, "loss": 2.2548, "step": 565830 }, { "epoch": 0.99, "learning_rate": 6.621511804322729e-07, "loss": 2.3389, "step": 565840 }, { "epoch": 0.99, "learning_rate": 6.612792405054462e-07, "loss": 2.2666, "step": 565850 }, { "epoch": 0.99, "learning_rate": 6.604073005786193e-07, "loss": 2.2959, "step": 565860 }, { "epoch": 0.99, "learning_rate": 6.595353606517925e-07, "loss": 2.0676, "step": 565870 }, { "epoch": 0.99, "learning_rate": 6.586634207249658e-07, "loss": 2.2161, "step": 565880 }, { "epoch": 0.99, "learning_rate": 6.577914807981389e-07, "loss": 2.1892, "step": 565890 }, { "epoch": 0.99, "learning_rate": 6.569195408713121e-07, "loss": 2.2233, "step": 565900 }, { "epoch": 0.99, "learning_rate": 6.560476009444853e-07, "loss": 2.4397, "step": 565910 }, { "epoch": 0.99, "learning_rate": 6.551756610176585e-07, "loss": 2.2185, "step": 565920 }, { "epoch": 0.99, "learning_rate": 6.543037210908318e-07, "loss": 2.2773, "step": 565930 }, { "epoch": 0.99, "learning_rate": 6.534317811640049e-07, "loss": 2.2584, "step": 565940 }, { "epoch": 0.99, "learning_rate": 6.525598412371781e-07, "loss": 2.2271, "step": 565950 }, { "epoch": 0.99, "learning_rate": 6.516879013103513e-07, "loss": 2.3018, "step": 565960 }, { "epoch": 0.99, "learning_rate": 6.508159613835245e-07, "loss": 2.2351, "step": 565970 }, { "epoch": 0.99, "learning_rate": 6.499440214566978e-07, "loss": 2.3005, "step": 565980 }, { "epoch": 0.99, "learning_rate": 6.490720815298709e-07, "loss": 2.304, "step": 565990 }, { "epoch": 0.99, "learning_rate": 6.482001416030441e-07, "loss": 2.2917, "step": 566000 }, { "epoch": 0.99, "learning_rate": 6.473282016762173e-07, "loss": 2.3166, "step": 566010 }, { "epoch": 0.99, "learning_rate": 6.464562617493905e-07, "loss": 2.1891, "step": 566020 }, { "epoch": 0.99, "learning_rate": 6.455843218225637e-07, "loss": 2.2635, "step": 566030 }, { "epoch": 0.99, "learning_rate": 6.447123818957369e-07, "loss": 2.2639, "step": 566040 }, { "epoch": 0.99, "learning_rate": 6.438404419689101e-07, "loss": 2.1587, "step": 566050 }, { "epoch": 0.99, "learning_rate": 6.429685020420834e-07, "loss": 2.3593, "step": 566060 }, { "epoch": 0.99, "learning_rate": 6.420965621152565e-07, "loss": 2.231, "step": 566070 }, { "epoch": 0.99, "learning_rate": 6.412246221884297e-07, "loss": 2.2201, "step": 566080 }, { "epoch": 0.99, "learning_rate": 6.403526822616029e-07, "loss": 2.3107, "step": 566090 }, { "epoch": 0.99, "learning_rate": 6.394807423347761e-07, "loss": 2.0938, "step": 566100 }, { "epoch": 0.99, "learning_rate": 6.386088024079494e-07, "loss": 2.1503, "step": 566110 }, { "epoch": 0.99, "learning_rate": 6.377368624811225e-07, "loss": 2.2791, "step": 566120 }, { "epoch": 0.99, "learning_rate": 6.368649225542957e-07, "loss": 2.2775, "step": 566130 }, { "epoch": 0.99, "learning_rate": 6.359929826274689e-07, "loss": 2.2487, "step": 566140 }, { "epoch": 0.99, "learning_rate": 6.351210427006421e-07, "loss": 2.3185, "step": 566150 }, { "epoch": 0.99, "learning_rate": 6.342491027738153e-07, "loss": 2.3706, "step": 566160 }, { "epoch": 0.99, "learning_rate": 6.333771628469885e-07, "loss": 2.2743, "step": 566170 }, { "epoch": 0.99, "learning_rate": 6.325052229201617e-07, "loss": 2.2395, "step": 566180 }, { "epoch": 0.99, "learning_rate": 6.316332829933349e-07, "loss": 2.151, "step": 566190 }, { "epoch": 0.99, "learning_rate": 6.307613430665081e-07, "loss": 2.266, "step": 566200 }, { "epoch": 0.99, "learning_rate": 6.298894031396813e-07, "loss": 2.1623, "step": 566210 }, { "epoch": 0.99, "learning_rate": 6.290174632128545e-07, "loss": 2.2844, "step": 566220 }, { "epoch": 0.99, "learning_rate": 6.281455232860277e-07, "loss": 2.2503, "step": 566230 }, { "epoch": 0.99, "learning_rate": 6.272735833592008e-07, "loss": 2.3142, "step": 566240 }, { "epoch": 0.99, "learning_rate": 6.264016434323741e-07, "loss": 2.2609, "step": 566250 }, { "epoch": 0.99, "learning_rate": 6.255297035055473e-07, "loss": 2.2132, "step": 566260 }, { "epoch": 0.99, "learning_rate": 6.246577635787205e-07, "loss": 2.2403, "step": 566270 }, { "epoch": 0.99, "learning_rate": 6.237858236518937e-07, "loss": 2.2105, "step": 566280 }, { "epoch": 0.99, "learning_rate": 6.229138837250668e-07, "loss": 2.3248, "step": 566290 }, { "epoch": 0.99, "learning_rate": 6.220419437982401e-07, "loss": 2.2775, "step": 566300 }, { "epoch": 0.99, "learning_rate": 6.211700038714133e-07, "loss": 2.191, "step": 566310 }, { "epoch": 0.99, "learning_rate": 6.202980639445865e-07, "loss": 2.3746, "step": 566320 }, { "epoch": 0.99, "learning_rate": 6.194261240177597e-07, "loss": 2.3063, "step": 566330 }, { "epoch": 0.99, "learning_rate": 6.185541840909328e-07, "loss": 2.242, "step": 566340 }, { "epoch": 0.99, "learning_rate": 6.176822441641061e-07, "loss": 2.3349, "step": 566350 }, { "epoch": 0.99, "learning_rate": 6.168103042372793e-07, "loss": 2.1948, "step": 566360 }, { "epoch": 0.99, "learning_rate": 6.159383643104524e-07, "loss": 2.2015, "step": 566370 }, { "epoch": 0.99, "learning_rate": 6.150664243836257e-07, "loss": 1.924, "step": 566380 }, { "epoch": 0.99, "learning_rate": 6.141944844567988e-07, "loss": 2.2269, "step": 566390 }, { "epoch": 0.99, "learning_rate": 6.133225445299721e-07, "loss": 2.2264, "step": 566400 }, { "epoch": 0.99, "learning_rate": 6.124506046031453e-07, "loss": 2.2052, "step": 566410 }, { "epoch": 0.99, "learning_rate": 6.115786646763184e-07, "loss": 2.2907, "step": 566420 }, { "epoch": 0.99, "learning_rate": 6.107067247494917e-07, "loss": 2.1831, "step": 566430 }, { "epoch": 0.99, "learning_rate": 6.098347848226648e-07, "loss": 2.2179, "step": 566440 }, { "epoch": 0.99, "learning_rate": 6.08962844895838e-07, "loss": 2.2396, "step": 566450 }, { "epoch": 0.99, "learning_rate": 6.080909049690113e-07, "loss": 2.2669, "step": 566460 }, { "epoch": 0.99, "learning_rate": 6.072189650421844e-07, "loss": 2.283, "step": 566470 }, { "epoch": 0.99, "learning_rate": 6.063470251153577e-07, "loss": 2.2969, "step": 566480 }, { "epoch": 0.99, "learning_rate": 6.054750851885308e-07, "loss": 2.29, "step": 566490 }, { "epoch": 0.99, "learning_rate": 6.04603145261704e-07, "loss": 2.1918, "step": 566500 }, { "epoch": 0.99, "learning_rate": 6.037312053348773e-07, "loss": 2.3284, "step": 566510 }, { "epoch": 0.99, "learning_rate": 6.028592654080504e-07, "loss": 2.1954, "step": 566520 }, { "epoch": 0.99, "learning_rate": 6.019873254812237e-07, "loss": 2.1641, "step": 566530 }, { "epoch": 0.99, "learning_rate": 6.011153855543968e-07, "loss": 2.235, "step": 566540 }, { "epoch": 0.99, "learning_rate": 6.0024344562757e-07, "loss": 2.3208, "step": 566550 }, { "epoch": 0.99, "learning_rate": 5.993715057007433e-07, "loss": 2.1548, "step": 566560 }, { "epoch": 0.99, "learning_rate": 5.984995657739164e-07, "loss": 2.2539, "step": 566570 }, { "epoch": 0.99, "learning_rate": 5.976276258470896e-07, "loss": 2.2403, "step": 566580 }, { "epoch": 0.99, "learning_rate": 5.967556859202629e-07, "loss": 2.2822, "step": 566590 }, { "epoch": 0.99, "learning_rate": 5.95883745993436e-07, "loss": 2.1449, "step": 566600 }, { "epoch": 0.99, "learning_rate": 5.950118060666093e-07, "loss": 2.2834, "step": 566610 }, { "epoch": 0.99, "learning_rate": 5.941398661397824e-07, "loss": 2.2029, "step": 566620 }, { "epoch": 0.99, "learning_rate": 5.932679262129556e-07, "loss": 2.1913, "step": 566630 }, { "epoch": 0.99, "learning_rate": 5.923959862861289e-07, "loss": 2.3106, "step": 566640 }, { "epoch": 0.99, "learning_rate": 5.91524046359302e-07, "loss": 2.2313, "step": 566650 }, { "epoch": 0.99, "learning_rate": 5.906521064324753e-07, "loss": 2.3769, "step": 566660 }, { "epoch": 0.99, "learning_rate": 5.897801665056484e-07, "loss": 2.3259, "step": 566670 }, { "epoch": 0.99, "learning_rate": 5.889082265788216e-07, "loss": 2.2012, "step": 566680 }, { "epoch": 0.99, "learning_rate": 5.880362866519949e-07, "loss": 2.3323, "step": 566690 }, { "epoch": 0.99, "learning_rate": 5.87164346725168e-07, "loss": 2.1371, "step": 566700 }, { "epoch": 0.99, "learning_rate": 5.862924067983412e-07, "loss": 2.274, "step": 566710 }, { "epoch": 0.99, "learning_rate": 5.854204668715145e-07, "loss": 2.2591, "step": 566720 }, { "epoch": 0.99, "learning_rate": 5.845485269446876e-07, "loss": 2.2483, "step": 566730 }, { "epoch": 0.99, "learning_rate": 5.836765870178609e-07, "loss": 2.3488, "step": 566740 }, { "epoch": 0.99, "learning_rate": 5.82804647091034e-07, "loss": 2.3975, "step": 566750 }, { "epoch": 0.99, "learning_rate": 5.819327071642072e-07, "loss": 2.2501, "step": 566760 }, { "epoch": 0.99, "learning_rate": 5.810607672373805e-07, "loss": 2.2656, "step": 566770 }, { "epoch": 0.99, "learning_rate": 5.801888273105536e-07, "loss": 2.1918, "step": 566780 }, { "epoch": 0.99, "learning_rate": 5.793168873837268e-07, "loss": 2.1489, "step": 566790 }, { "epoch": 0.99, "learning_rate": 5.784449474569001e-07, "loss": 2.3233, "step": 566800 }, { "epoch": 0.99, "learning_rate": 5.775730075300732e-07, "loss": 2.2854, "step": 566810 }, { "epoch": 0.99, "learning_rate": 5.767010676032465e-07, "loss": 2.4082, "step": 566820 }, { "epoch": 0.99, "learning_rate": 5.758291276764196e-07, "loss": 2.3313, "step": 566830 }, { "epoch": 0.99, "learning_rate": 5.749571877495928e-07, "loss": 2.2422, "step": 566840 }, { "epoch": 0.99, "learning_rate": 5.740852478227661e-07, "loss": 2.2496, "step": 566850 }, { "epoch": 0.99, "learning_rate": 5.732133078959392e-07, "loss": 2.1388, "step": 566860 }, { "epoch": 0.99, "learning_rate": 5.723413679691125e-07, "loss": 2.2519, "step": 566870 }, { "epoch": 0.99, "learning_rate": 5.714694280422856e-07, "loss": 2.2346, "step": 566880 }, { "epoch": 0.99, "learning_rate": 5.705974881154588e-07, "loss": 2.249, "step": 566890 }, { "epoch": 0.99, "learning_rate": 5.697255481886321e-07, "loss": 2.2889, "step": 566900 }, { "epoch": 0.99, "learning_rate": 5.688536082618052e-07, "loss": 2.2548, "step": 566910 }, { "epoch": 0.99, "learning_rate": 5.679816683349784e-07, "loss": 2.1983, "step": 566920 }, { "epoch": 0.99, "learning_rate": 5.671097284081517e-07, "loss": 2.3803, "step": 566930 }, { "epoch": 0.99, "learning_rate": 5.662377884813248e-07, "loss": 2.1307, "step": 566940 }, { "epoch": 0.99, "learning_rate": 5.653658485544981e-07, "loss": 2.2152, "step": 566950 }, { "epoch": 0.99, "learning_rate": 5.644939086276712e-07, "loss": 2.3433, "step": 566960 }, { "epoch": 0.99, "learning_rate": 5.636219687008444e-07, "loss": 2.2037, "step": 566970 }, { "epoch": 0.99, "learning_rate": 5.627500287740177e-07, "loss": 2.2483, "step": 566980 }, { "epoch": 0.99, "learning_rate": 5.618780888471908e-07, "loss": 2.2732, "step": 566990 }, { "epoch": 0.99, "learning_rate": 5.61006148920364e-07, "loss": 2.2291, "step": 567000 }, { "epoch": 0.99, "learning_rate": 5.601342089935372e-07, "loss": 2.2342, "step": 567010 }, { "epoch": 0.99, "learning_rate": 5.592622690667104e-07, "loss": 2.1306, "step": 567020 }, { "epoch": 0.99, "learning_rate": 5.583903291398837e-07, "loss": 2.2656, "step": 567030 }, { "epoch": 0.99, "learning_rate": 5.575183892130568e-07, "loss": 2.245, "step": 567040 }, { "epoch": 0.99, "learning_rate": 5.5664644928623e-07, "loss": 2.218, "step": 567050 }, { "epoch": 0.99, "learning_rate": 5.557745093594033e-07, "loss": 2.2285, "step": 567060 }, { "epoch": 0.99, "learning_rate": 5.549025694325764e-07, "loss": 2.2467, "step": 567070 }, { "epoch": 0.99, "learning_rate": 5.540306295057497e-07, "loss": 2.251, "step": 567080 }, { "epoch": 0.99, "learning_rate": 5.531586895789228e-07, "loss": 2.2466, "step": 567090 }, { "epoch": 0.99, "learning_rate": 5.52286749652096e-07, "loss": 2.244, "step": 567100 }, { "epoch": 0.99, "learning_rate": 5.514148097252693e-07, "loss": 2.2837, "step": 567110 }, { "epoch": 0.99, "learning_rate": 5.505428697984424e-07, "loss": 2.3508, "step": 567120 }, { "epoch": 0.99, "learning_rate": 5.496709298716156e-07, "loss": 2.2921, "step": 567130 }, { "epoch": 0.99, "learning_rate": 5.487989899447888e-07, "loss": 2.2045, "step": 567140 }, { "epoch": 0.99, "learning_rate": 5.47927050017962e-07, "loss": 2.1769, "step": 567150 }, { "epoch": 0.99, "learning_rate": 5.470551100911353e-07, "loss": 2.2698, "step": 567160 }, { "epoch": 0.99, "learning_rate": 5.461831701643084e-07, "loss": 2.2596, "step": 567170 }, { "epoch": 0.99, "learning_rate": 5.453112302374816e-07, "loss": 2.3036, "step": 567180 }, { "epoch": 0.99, "learning_rate": 5.444392903106548e-07, "loss": 2.2852, "step": 567190 }, { "epoch": 0.99, "learning_rate": 5.43567350383828e-07, "loss": 2.3892, "step": 567200 }, { "epoch": 0.99, "learning_rate": 5.426954104570013e-07, "loss": 2.2412, "step": 567210 }, { "epoch": 0.99, "learning_rate": 5.418234705301744e-07, "loss": 2.232, "step": 567220 }, { "epoch": 0.99, "learning_rate": 5.409515306033476e-07, "loss": 2.2865, "step": 567230 }, { "epoch": 0.99, "learning_rate": 5.400795906765208e-07, "loss": 2.2369, "step": 567240 }, { "epoch": 0.99, "learning_rate": 5.39207650749694e-07, "loss": 2.1936, "step": 567250 }, { "epoch": 0.99, "learning_rate": 5.383357108228672e-07, "loss": 2.2252, "step": 567260 }, { "epoch": 0.99, "learning_rate": 5.374637708960404e-07, "loss": 2.214, "step": 567270 }, { "epoch": 0.99, "learning_rate": 5.365918309692136e-07, "loss": 2.2131, "step": 567280 }, { "epoch": 0.99, "learning_rate": 5.357198910423868e-07, "loss": 2.2423, "step": 567290 }, { "epoch": 0.99, "learning_rate": 5.3484795111556e-07, "loss": 2.1948, "step": 567300 }, { "epoch": 0.99, "learning_rate": 5.339760111887332e-07, "loss": 2.2632, "step": 567310 }, { "epoch": 0.99, "learning_rate": 5.331040712619064e-07, "loss": 2.322, "step": 567320 }, { "epoch": 0.99, "learning_rate": 5.322321313350796e-07, "loss": 2.251, "step": 567330 }, { "epoch": 0.99, "learning_rate": 5.313601914082527e-07, "loss": 2.3405, "step": 567340 }, { "epoch": 0.99, "learning_rate": 5.30488251481426e-07, "loss": 2.157, "step": 567350 }, { "epoch": 0.99, "learning_rate": 5.296163115545992e-07, "loss": 2.1394, "step": 567360 }, { "epoch": 0.99, "learning_rate": 5.287443716277724e-07, "loss": 2.2781, "step": 567370 }, { "epoch": 0.99, "learning_rate": 5.278724317009456e-07, "loss": 2.274, "step": 567380 }, { "epoch": 0.99, "learning_rate": 5.270004917741187e-07, "loss": 2.3699, "step": 567390 }, { "epoch": 0.99, "learning_rate": 5.26128551847292e-07, "loss": 2.2243, "step": 567400 }, { "epoch": 0.99, "learning_rate": 5.252566119204652e-07, "loss": 2.2209, "step": 567410 }, { "epoch": 0.99, "learning_rate": 5.243846719936384e-07, "loss": 2.2952, "step": 567420 }, { "epoch": 0.99, "learning_rate": 5.235127320668116e-07, "loss": 2.3311, "step": 567430 }, { "epoch": 0.99, "learning_rate": 5.226407921399848e-07, "loss": 2.2642, "step": 567440 }, { "epoch": 0.99, "learning_rate": 5.21768852213158e-07, "loss": 2.2899, "step": 567450 }, { "epoch": 0.99, "learning_rate": 5.208969122863312e-07, "loss": 2.2738, "step": 567460 }, { "epoch": 0.99, "learning_rate": 5.200249723595043e-07, "loss": 2.1831, "step": 567470 }, { "epoch": 0.99, "learning_rate": 5.191530324326776e-07, "loss": 2.2717, "step": 567480 }, { "epoch": 0.99, "learning_rate": 5.182810925058508e-07, "loss": 2.3013, "step": 567490 }, { "epoch": 0.99, "learning_rate": 5.17409152579024e-07, "loss": 2.1975, "step": 567500 }, { "epoch": 0.99, "learning_rate": 5.165372126521972e-07, "loss": 2.2462, "step": 567510 }, { "epoch": 0.99, "learning_rate": 5.156652727253703e-07, "loss": 2.208, "step": 567520 }, { "epoch": 0.99, "learning_rate": 5.147933327985436e-07, "loss": 2.2867, "step": 567530 }, { "epoch": 0.99, "learning_rate": 5.139213928717168e-07, "loss": 2.1761, "step": 567540 }, { "epoch": 0.99, "learning_rate": 5.1304945294489e-07, "loss": 2.2264, "step": 567550 }, { "epoch": 0.99, "learning_rate": 5.121775130180632e-07, "loss": 2.2636, "step": 567560 }, { "epoch": 0.99, "learning_rate": 5.113055730912363e-07, "loss": 2.2454, "step": 567570 }, { "epoch": 0.99, "learning_rate": 5.104336331644096e-07, "loss": 2.2504, "step": 567580 }, { "epoch": 0.99, "learning_rate": 5.095616932375828e-07, "loss": 2.2308, "step": 567590 }, { "epoch": 0.99, "learning_rate": 5.086897533107559e-07, "loss": 2.3036, "step": 567600 }, { "epoch": 0.99, "learning_rate": 5.078178133839292e-07, "loss": 2.3239, "step": 567610 }, { "epoch": 0.99, "learning_rate": 5.069458734571023e-07, "loss": 2.1471, "step": 567620 }, { "epoch": 0.99, "learning_rate": 5.060739335302756e-07, "loss": 2.2312, "step": 567630 }, { "epoch": 0.99, "learning_rate": 5.052019936034488e-07, "loss": 2.2732, "step": 567640 }, { "epoch": 0.99, "learning_rate": 5.043300536766219e-07, "loss": 2.2422, "step": 567650 }, { "epoch": 0.99, "learning_rate": 5.034581137497952e-07, "loss": 2.2932, "step": 567660 }, { "epoch": 0.99, "learning_rate": 5.025861738229683e-07, "loss": 2.3347, "step": 567670 }, { "epoch": 0.99, "learning_rate": 5.017142338961415e-07, "loss": 2.3001, "step": 567680 }, { "epoch": 0.99, "learning_rate": 5.008422939693148e-07, "loss": 2.4094, "step": 567690 }, { "epoch": 0.99, "learning_rate": 4.999703540424879e-07, "loss": 2.2282, "step": 567700 }, { "epoch": 0.99, "learning_rate": 4.990984141156612e-07, "loss": 2.1282, "step": 567710 }, { "epoch": 0.99, "learning_rate": 4.982264741888343e-07, "loss": 2.3119, "step": 567720 }, { "epoch": 0.99, "learning_rate": 4.973545342620075e-07, "loss": 2.2459, "step": 567730 }, { "epoch": 0.99, "learning_rate": 4.964825943351808e-07, "loss": 2.3325, "step": 567740 }, { "epoch": 0.99, "learning_rate": 4.956106544083539e-07, "loss": 2.2282, "step": 567750 }, { "epoch": 0.99, "learning_rate": 4.947387144815272e-07, "loss": 2.1311, "step": 567760 }, { "epoch": 0.99, "learning_rate": 4.938667745547003e-07, "loss": 2.2202, "step": 567770 }, { "epoch": 0.99, "learning_rate": 4.929948346278735e-07, "loss": 2.2096, "step": 567780 }, { "epoch": 0.99, "learning_rate": 4.921228947010468e-07, "loss": 2.1934, "step": 567790 }, { "epoch": 0.99, "learning_rate": 4.912509547742199e-07, "loss": 2.1147, "step": 567800 }, { "epoch": 0.99, "learning_rate": 4.903790148473931e-07, "loss": 2.375, "step": 567810 }, { "epoch": 0.99, "learning_rate": 4.895070749205663e-07, "loss": 2.344, "step": 567820 }, { "epoch": 0.99, "learning_rate": 4.886351349937395e-07, "loss": 2.3063, "step": 567830 }, { "epoch": 0.99, "learning_rate": 4.877631950669128e-07, "loss": 2.3823, "step": 567840 }, { "epoch": 0.99, "learning_rate": 4.868912551400859e-07, "loss": 2.2679, "step": 567850 }, { "epoch": 0.99, "learning_rate": 4.860193152132591e-07, "loss": 2.2819, "step": 567860 }, { "epoch": 0.99, "learning_rate": 4.851473752864323e-07, "loss": 2.2344, "step": 567870 }, { "epoch": 0.99, "learning_rate": 4.842754353596055e-07, "loss": 2.1929, "step": 567880 }, { "epoch": 0.99, "learning_rate": 4.834034954327788e-07, "loss": 2.3466, "step": 567890 }, { "epoch": 0.99, "learning_rate": 4.825315555059519e-07, "loss": 2.2778, "step": 567900 }, { "epoch": 0.99, "learning_rate": 4.816596155791251e-07, "loss": 2.1532, "step": 567910 }, { "epoch": 0.99, "learning_rate": 4.807876756522983e-07, "loss": 2.3015, "step": 567920 }, { "epoch": 0.99, "learning_rate": 4.799157357254715e-07, "loss": 2.2469, "step": 567930 }, { "epoch": 0.99, "learning_rate": 4.790437957986447e-07, "loss": 2.3165, "step": 567940 }, { "epoch": 0.99, "learning_rate": 4.781718558718179e-07, "loss": 2.1923, "step": 567950 }, { "epoch": 0.99, "learning_rate": 4.772999159449911e-07, "loss": 2.2006, "step": 567960 }, { "epoch": 0.99, "learning_rate": 4.7642797601816425e-07, "loss": 2.1696, "step": 567970 }, { "epoch": 0.99, "learning_rate": 4.755560360913375e-07, "loss": 2.1114, "step": 567980 }, { "epoch": 0.99, "learning_rate": 4.7468409616451073e-07, "loss": 2.2594, "step": 567990 }, { "epoch": 0.99, "learning_rate": 4.7381215623768387e-07, "loss": 2.2817, "step": 568000 }, { "epoch": 0.99, "learning_rate": 4.729402163108571e-07, "loss": 2.1544, "step": 568010 }, { "epoch": 0.99, "learning_rate": 4.7206827638403024e-07, "loss": 2.1606, "step": 568020 }, { "epoch": 0.99, "learning_rate": 4.711963364572035e-07, "loss": 2.2792, "step": 568030 }, { "epoch": 0.99, "learning_rate": 4.703243965303767e-07, "loss": 2.2426, "step": 568040 }, { "epoch": 0.99, "learning_rate": 4.6945245660354986e-07, "loss": 2.2039, "step": 568050 }, { "epoch": 0.99, "learning_rate": 4.685805166767231e-07, "loss": 2.4092, "step": 568060 }, { "epoch": 0.99, "learning_rate": 4.6770857674989623e-07, "loss": 2.3315, "step": 568070 }, { "epoch": 0.99, "learning_rate": 4.668366368230695e-07, "loss": 2.2655, "step": 568080 }, { "epoch": 0.99, "learning_rate": 4.659646968962427e-07, "loss": 2.1789, "step": 568090 }, { "epoch": 0.99, "learning_rate": 4.6509275696941585e-07, "loss": 2.2498, "step": 568100 }, { "epoch": 0.99, "learning_rate": 4.642208170425891e-07, "loss": 2.3675, "step": 568110 }, { "epoch": 0.99, "learning_rate": 4.633488771157622e-07, "loss": 2.25, "step": 568120 }, { "epoch": 0.99, "learning_rate": 4.6247693718893547e-07, "loss": 2.1755, "step": 568130 }, { "epoch": 0.99, "learning_rate": 4.616049972621087e-07, "loss": 2.2111, "step": 568140 }, { "epoch": 0.99, "learning_rate": 4.6073305733528184e-07, "loss": 2.1776, "step": 568150 }, { "epoch": 0.99, "learning_rate": 4.598611174084551e-07, "loss": 2.2407, "step": 568160 }, { "epoch": 0.99, "learning_rate": 4.589891774816282e-07, "loss": 2.113, "step": 568170 }, { "epoch": 0.99, "learning_rate": 4.5811723755480146e-07, "loss": 2.3497, "step": 568180 }, { "epoch": 0.99, "learning_rate": 4.572452976279747e-07, "loss": 2.3144, "step": 568190 }, { "epoch": 0.99, "learning_rate": 4.5637335770114783e-07, "loss": 2.2142, "step": 568200 }, { "epoch": 0.99, "learning_rate": 4.5550141777432107e-07, "loss": 2.1791, "step": 568210 }, { "epoch": 0.99, "learning_rate": 4.546294778474942e-07, "loss": 2.2732, "step": 568220 }, { "epoch": 0.99, "learning_rate": 4.5375753792066745e-07, "loss": 2.3126, "step": 568230 }, { "epoch": 0.99, "learning_rate": 4.528855979938407e-07, "loss": 2.3021, "step": 568240 }, { "epoch": 0.99, "learning_rate": 4.520136580670138e-07, "loss": 2.2609, "step": 568250 }, { "epoch": 0.99, "learning_rate": 4.5114171814018706e-07, "loss": 2.2906, "step": 568260 }, { "epoch": 0.99, "learning_rate": 4.502697782133602e-07, "loss": 2.2645, "step": 568270 }, { "epoch": 0.99, "learning_rate": 4.4939783828653344e-07, "loss": 2.324, "step": 568280 }, { "epoch": 0.99, "learning_rate": 4.485258983597067e-07, "loss": 2.2306, "step": 568290 }, { "epoch": 0.99, "learning_rate": 4.476539584328798e-07, "loss": 2.1467, "step": 568300 }, { "epoch": 0.99, "learning_rate": 4.4678201850605305e-07, "loss": 2.297, "step": 568310 }, { "epoch": 0.99, "learning_rate": 4.459100785792262e-07, "loss": 2.3768, "step": 568320 }, { "epoch": 0.99, "learning_rate": 4.4503813865239943e-07, "loss": 2.2327, "step": 568330 }, { "epoch": 0.99, "learning_rate": 4.4416619872557267e-07, "loss": 2.2578, "step": 568340 }, { "epoch": 0.99, "learning_rate": 4.432942587987458e-07, "loss": 2.3469, "step": 568350 }, { "epoch": 0.99, "learning_rate": 4.4242231887191904e-07, "loss": 2.1666, "step": 568360 }, { "epoch": 0.99, "learning_rate": 4.415503789450922e-07, "loss": 2.3078, "step": 568370 }, { "epoch": 0.99, "learning_rate": 4.406784390182654e-07, "loss": 2.2391, "step": 568380 }, { "epoch": 0.99, "learning_rate": 4.3980649909143866e-07, "loss": 2.3258, "step": 568390 }, { "epoch": 0.99, "learning_rate": 4.389345591646118e-07, "loss": 2.3915, "step": 568400 }, { "epoch": 0.99, "learning_rate": 4.3806261923778504e-07, "loss": 2.1886, "step": 568410 }, { "epoch": 0.99, "learning_rate": 4.3719067931095817e-07, "loss": 2.3464, "step": 568420 }, { "epoch": 0.99, "learning_rate": 4.363187393841314e-07, "loss": 2.2475, "step": 568430 }, { "epoch": 0.99, "learning_rate": 4.3544679945730465e-07, "loss": 2.2958, "step": 568440 }, { "epoch": 0.99, "learning_rate": 4.345748595304778e-07, "loss": 2.2589, "step": 568450 }, { "epoch": 0.99, "learning_rate": 4.33702919603651e-07, "loss": 2.241, "step": 568460 }, { "epoch": 0.99, "learning_rate": 4.3283097967682416e-07, "loss": 2.2717, "step": 568470 }, { "epoch": 0.99, "learning_rate": 4.319590397499974e-07, "loss": 2.2042, "step": 568480 }, { "epoch": 0.99, "learning_rate": 4.3108709982317064e-07, "loss": 2.2261, "step": 568490 }, { "epoch": 0.99, "learning_rate": 4.302151598963438e-07, "loss": 2.2556, "step": 568500 }, { "epoch": 0.99, "learning_rate": 4.29343219969517e-07, "loss": 2.2345, "step": 568510 }, { "epoch": 0.99, "learning_rate": 4.2847128004269015e-07, "loss": 2.3172, "step": 568520 }, { "epoch": 0.99, "learning_rate": 4.275993401158634e-07, "loss": 2.2696, "step": 568530 }, { "epoch": 0.99, "learning_rate": 4.2672740018903663e-07, "loss": 2.2107, "step": 568540 }, { "epoch": 0.99, "learning_rate": 4.2585546026220977e-07, "loss": 2.2489, "step": 568550 }, { "epoch": 0.99, "learning_rate": 4.24983520335383e-07, "loss": 2.1769, "step": 568560 }, { "epoch": 0.99, "learning_rate": 4.2411158040855614e-07, "loss": 2.2242, "step": 568570 }, { "epoch": 0.99, "learning_rate": 4.232396404817294e-07, "loss": 2.3399, "step": 568580 }, { "epoch": 0.99, "learning_rate": 4.223677005549026e-07, "loss": 2.2864, "step": 568590 }, { "epoch": 0.99, "learning_rate": 4.2149576062807576e-07, "loss": 2.284, "step": 568600 }, { "epoch": 0.99, "learning_rate": 4.20623820701249e-07, "loss": 2.2034, "step": 568610 }, { "epoch": 0.99, "learning_rate": 4.1975188077442213e-07, "loss": 2.2895, "step": 568620 }, { "epoch": 0.99, "learning_rate": 4.188799408475954e-07, "loss": 2.2859, "step": 568630 }, { "epoch": 0.99, "learning_rate": 4.180080009207686e-07, "loss": 2.2077, "step": 568640 }, { "epoch": 0.99, "learning_rate": 4.1713606099394175e-07, "loss": 2.2646, "step": 568650 }, { "epoch": 0.99, "learning_rate": 4.16264121067115e-07, "loss": 2.3594, "step": 568660 }, { "epoch": 0.99, "learning_rate": 4.153921811402881e-07, "loss": 2.2671, "step": 568670 }, { "epoch": 0.99, "learning_rate": 4.1452024121346136e-07, "loss": 2.2002, "step": 568680 }, { "epoch": 0.99, "learning_rate": 4.136483012866346e-07, "loss": 2.3326, "step": 568690 }, { "epoch": 0.99, "learning_rate": 4.1277636135980774e-07, "loss": 2.2986, "step": 568700 }, { "epoch": 0.99, "learning_rate": 4.11904421432981e-07, "loss": 2.2526, "step": 568710 }, { "epoch": 0.99, "learning_rate": 4.110324815061541e-07, "loss": 2.233, "step": 568720 }, { "epoch": 0.99, "learning_rate": 4.1016054157932736e-07, "loss": 2.1782, "step": 568730 }, { "epoch": 0.99, "learning_rate": 4.092886016525006e-07, "loss": 2.3242, "step": 568740 }, { "epoch": 0.99, "learning_rate": 4.0841666172567373e-07, "loss": 2.2947, "step": 568750 }, { "epoch": 0.99, "learning_rate": 4.0754472179884697e-07, "loss": 2.2963, "step": 568760 }, { "epoch": 0.99, "learning_rate": 4.066727818720201e-07, "loss": 2.1796, "step": 568770 }, { "epoch": 0.99, "learning_rate": 4.0580084194519335e-07, "loss": 2.1004, "step": 568780 }, { "epoch": 0.99, "learning_rate": 4.049289020183666e-07, "loss": 2.263, "step": 568790 }, { "epoch": 0.99, "learning_rate": 4.040569620915397e-07, "loss": 2.1829, "step": 568800 }, { "epoch": 0.99, "learning_rate": 4.0318502216471296e-07, "loss": 2.2935, "step": 568810 }, { "epoch": 0.99, "learning_rate": 4.023130822378862e-07, "loss": 2.208, "step": 568820 }, { "epoch": 0.99, "learning_rate": 4.0144114231105934e-07, "loss": 2.2732, "step": 568830 }, { "epoch": 0.99, "learning_rate": 4.005692023842326e-07, "loss": 2.1925, "step": 568840 }, { "epoch": 0.99, "learning_rate": 3.996972624574057e-07, "loss": 2.3269, "step": 568850 }, { "epoch": 0.99, "learning_rate": 3.9882532253057895e-07, "loss": 2.1633, "step": 568860 }, { "epoch": 0.99, "learning_rate": 3.979533826037522e-07, "loss": 2.3015, "step": 568870 }, { "epoch": 0.99, "learning_rate": 3.9708144267692533e-07, "loss": 2.2691, "step": 568880 }, { "epoch": 0.99, "learning_rate": 3.9620950275009857e-07, "loss": 2.2864, "step": 568890 }, { "epoch": 0.99, "learning_rate": 3.953375628232717e-07, "loss": 2.228, "step": 568900 }, { "epoch": 0.99, "learning_rate": 3.9446562289644494e-07, "loss": 2.2239, "step": 568910 }, { "epoch": 0.99, "learning_rate": 3.935936829696182e-07, "loss": 2.2473, "step": 568920 }, { "epoch": 0.99, "learning_rate": 3.927217430427913e-07, "loss": 2.2274, "step": 568930 }, { "epoch": 0.99, "learning_rate": 3.9184980311596456e-07, "loss": 2.331, "step": 568940 }, { "epoch": 0.99, "learning_rate": 3.909778631891377e-07, "loss": 2.2807, "step": 568950 }, { "epoch": 0.99, "learning_rate": 3.9010592326231093e-07, "loss": 2.1732, "step": 568960 }, { "epoch": 0.99, "learning_rate": 3.892339833354841e-07, "loss": 2.2017, "step": 568970 }, { "epoch": 0.99, "learning_rate": 3.883620434086573e-07, "loss": 2.2332, "step": 568980 }, { "epoch": 0.99, "learning_rate": 3.874901034818305e-07, "loss": 2.3286, "step": 568990 }, { "epoch": 0.99, "learning_rate": 3.8661816355500374e-07, "loss": 2.2917, "step": 569000 }, { "epoch": 0.99, "learning_rate": 3.857462236281769e-07, "loss": 2.1798, "step": 569010 }, { "epoch": 0.99, "learning_rate": 3.848742837013501e-07, "loss": 2.2473, "step": 569020 }, { "epoch": 0.99, "learning_rate": 3.840023437745233e-07, "loss": 2.2214, "step": 569030 }, { "epoch": 0.99, "learning_rate": 3.831304038476965e-07, "loss": 2.1391, "step": 569040 }, { "epoch": 0.99, "learning_rate": 3.8225846392086973e-07, "loss": 2.3303, "step": 569050 }, { "epoch": 0.99, "learning_rate": 3.813865239940429e-07, "loss": 2.1754, "step": 569060 }, { "epoch": 0.99, "learning_rate": 3.805145840672161e-07, "loss": 2.2982, "step": 569070 }, { "epoch": 0.99, "learning_rate": 3.796426441403893e-07, "loss": 2.3022, "step": 569080 }, { "epoch": 0.99, "learning_rate": 3.787707042135625e-07, "loss": 2.2288, "step": 569090 }, { "epoch": 0.99, "learning_rate": 3.778987642867357e-07, "loss": 2.1857, "step": 569100 }, { "epoch": 0.99, "learning_rate": 3.770268243599089e-07, "loss": 2.2683, "step": 569110 }, { "epoch": 0.99, "learning_rate": 3.761548844330821e-07, "loss": 2.2357, "step": 569120 }, { "epoch": 0.99, "learning_rate": 3.752829445062553e-07, "loss": 2.1678, "step": 569130 }, { "epoch": 0.99, "learning_rate": 3.7441100457942847e-07, "loss": 2.2751, "step": 569140 }, { "epoch": 0.99, "learning_rate": 3.735390646526017e-07, "loss": 2.1905, "step": 569150 }, { "epoch": 0.99, "learning_rate": 3.726671247257749e-07, "loss": 2.3222, "step": 569160 }, { "epoch": 0.99, "learning_rate": 3.717951847989481e-07, "loss": 2.1932, "step": 569170 }, { "epoch": 0.99, "learning_rate": 3.7092324487212127e-07, "loss": 2.3227, "step": 569180 }, { "epoch": 0.99, "learning_rate": 3.700513049452945e-07, "loss": 2.253, "step": 569190 }, { "epoch": 0.99, "learning_rate": 3.691793650184677e-07, "loss": 2.3658, "step": 569200 }, { "epoch": 0.99, "learning_rate": 3.683074250916409e-07, "loss": 2.1946, "step": 569210 }, { "epoch": 0.99, "learning_rate": 3.674354851648141e-07, "loss": 2.3671, "step": 569220 }, { "epoch": 0.99, "learning_rate": 3.6656354523798726e-07, "loss": 2.183, "step": 569230 }, { "epoch": 0.99, "learning_rate": 3.656916053111605e-07, "loss": 2.2535, "step": 569240 }, { "epoch": 0.99, "learning_rate": 3.648196653843337e-07, "loss": 2.2648, "step": 569250 }, { "epoch": 0.99, "learning_rate": 3.639477254575069e-07, "loss": 2.2397, "step": 569260 }, { "epoch": 0.99, "learning_rate": 3.6307578553068007e-07, "loss": 2.399, "step": 569270 }, { "epoch": 0.99, "learning_rate": 3.6220384560385325e-07, "loss": 2.3223, "step": 569280 }, { "epoch": 0.99, "learning_rate": 3.613319056770265e-07, "loss": 2.2022, "step": 569290 }, { "epoch": 0.99, "learning_rate": 3.604599657501997e-07, "loss": 2.3358, "step": 569300 }, { "epoch": 0.99, "learning_rate": 3.5958802582337287e-07, "loss": 2.3096, "step": 569310 }, { "epoch": 0.99, "learning_rate": 3.5871608589654606e-07, "loss": 2.3705, "step": 569320 }, { "epoch": 0.99, "learning_rate": 3.578441459697193e-07, "loss": 2.2649, "step": 569330 }, { "epoch": 0.99, "learning_rate": 3.569722060428925e-07, "loss": 2.266, "step": 569340 }, { "epoch": 0.99, "learning_rate": 3.5610026611606567e-07, "loss": 2.286, "step": 569350 }, { "epoch": 0.99, "learning_rate": 3.5522832618923886e-07, "loss": 2.2132, "step": 569360 }, { "epoch": 0.99, "learning_rate": 3.5435638626241205e-07, "loss": 2.3126, "step": 569370 }, { "epoch": 0.99, "learning_rate": 3.534844463355853e-07, "loss": 2.3538, "step": 569380 }, { "epoch": 0.99, "learning_rate": 3.526125064087585e-07, "loss": 2.2871, "step": 569390 }, { "epoch": 0.99, "learning_rate": 3.5174056648193166e-07, "loss": 2.2556, "step": 569400 }, { "epoch": 0.99, "learning_rate": 3.5086862655510485e-07, "loss": 2.2022, "step": 569410 }, { "epoch": 0.99, "learning_rate": 3.499966866282781e-07, "loss": 2.3677, "step": 569420 }, { "epoch": 0.99, "learning_rate": 3.491247467014513e-07, "loss": 2.3194, "step": 569430 }, { "epoch": 0.99, "learning_rate": 3.4825280677462447e-07, "loss": 2.1762, "step": 569440 }, { "epoch": 0.99, "learning_rate": 3.4738086684779766e-07, "loss": 2.1846, "step": 569450 }, { "epoch": 0.99, "learning_rate": 3.465089269209709e-07, "loss": 2.1851, "step": 569460 }, { "epoch": 0.99, "learning_rate": 3.456369869941441e-07, "loss": 2.3105, "step": 569470 }, { "epoch": 0.99, "learning_rate": 3.4476504706731727e-07, "loss": 2.2982, "step": 569480 }, { "epoch": 0.99, "learning_rate": 3.4389310714049046e-07, "loss": 2.264, "step": 569490 }, { "epoch": 0.99, "learning_rate": 3.430211672136637e-07, "loss": 2.1563, "step": 569500 }, { "epoch": 0.99, "learning_rate": 3.421492272868369e-07, "loss": 2.286, "step": 569510 }, { "epoch": 0.99, "learning_rate": 3.412772873600101e-07, "loss": 2.2276, "step": 569520 }, { "epoch": 0.99, "learning_rate": 3.4040534743318326e-07, "loss": 2.1809, "step": 569530 }, { "epoch": 0.99, "learning_rate": 3.3953340750635645e-07, "loss": 2.2671, "step": 569540 }, { "epoch": 0.99, "learning_rate": 3.386614675795297e-07, "loss": 2.2493, "step": 569550 }, { "epoch": 0.99, "learning_rate": 3.377895276527029e-07, "loss": 2.2679, "step": 569560 }, { "epoch": 0.99, "learning_rate": 3.3691758772587606e-07, "loss": 2.3518, "step": 569570 }, { "epoch": 0.99, "learning_rate": 3.3604564779904925e-07, "loss": 2.1933, "step": 569580 }, { "epoch": 0.99, "learning_rate": 3.351737078722225e-07, "loss": 2.4105, "step": 569590 }, { "epoch": 0.99, "learning_rate": 3.343017679453957e-07, "loss": 2.2636, "step": 569600 }, { "epoch": 0.99, "learning_rate": 3.3342982801856887e-07, "loss": 2.3085, "step": 569610 }, { "epoch": 0.99, "learning_rate": 3.3255788809174206e-07, "loss": 2.3475, "step": 569620 }, { "epoch": 0.99, "learning_rate": 3.3168594816491524e-07, "loss": 2.3363, "step": 569630 }, { "epoch": 0.99, "learning_rate": 3.308140082380885e-07, "loss": 2.3511, "step": 569640 }, { "epoch": 0.99, "learning_rate": 3.2994206831126167e-07, "loss": 2.269, "step": 569650 }, { "epoch": 0.99, "learning_rate": 3.2907012838443486e-07, "loss": 2.2817, "step": 569660 }, { "epoch": 0.99, "learning_rate": 3.2819818845760805e-07, "loss": 2.1899, "step": 569670 }, { "epoch": 0.99, "learning_rate": 3.2732624853078123e-07, "loss": 2.2339, "step": 569680 }, { "epoch": 0.99, "learning_rate": 3.264543086039545e-07, "loss": 2.2488, "step": 569690 }, { "epoch": 0.99, "learning_rate": 3.2558236867712766e-07, "loss": 2.2322, "step": 569700 }, { "epoch": 0.99, "learning_rate": 3.2471042875030085e-07, "loss": 2.1889, "step": 569710 }, { "epoch": 0.99, "learning_rate": 3.2383848882347404e-07, "loss": 2.2424, "step": 569720 }, { "epoch": 0.99, "learning_rate": 3.229665488966472e-07, "loss": 2.2317, "step": 569730 }, { "epoch": 0.99, "learning_rate": 3.2209460896982047e-07, "loss": 2.3667, "step": 569740 }, { "epoch": 0.99, "learning_rate": 3.2122266904299365e-07, "loss": 2.2508, "step": 569750 }, { "epoch": 0.99, "learning_rate": 3.2035072911616684e-07, "loss": 2.2583, "step": 569760 }, { "epoch": 0.99, "learning_rate": 3.1947878918934003e-07, "loss": 2.1606, "step": 569770 }, { "epoch": 0.99, "learning_rate": 3.186068492625132e-07, "loss": 2.2784, "step": 569780 }, { "epoch": 0.99, "learning_rate": 3.1773490933568646e-07, "loss": 2.2699, "step": 569790 }, { "epoch": 0.99, "learning_rate": 3.1686296940885964e-07, "loss": 2.2515, "step": 569800 }, { "epoch": 0.99, "learning_rate": 3.1599102948203283e-07, "loss": 2.3212, "step": 569810 }, { "epoch": 0.99, "learning_rate": 3.15119089555206e-07, "loss": 2.2474, "step": 569820 }, { "epoch": 0.99, "learning_rate": 3.142471496283792e-07, "loss": 2.3037, "step": 569830 }, { "epoch": 0.99, "learning_rate": 3.1337520970155245e-07, "loss": 2.159, "step": 569840 }, { "epoch": 0.99, "learning_rate": 3.1250326977472563e-07, "loss": 2.2192, "step": 569850 }, { "epoch": 0.99, "learning_rate": 3.116313298478988e-07, "loss": 2.2066, "step": 569860 }, { "epoch": 0.99, "learning_rate": 3.10759389921072e-07, "loss": 2.2416, "step": 569870 }, { "epoch": 0.99, "learning_rate": 3.0988744999424525e-07, "loss": 2.2599, "step": 569880 }, { "epoch": 0.99, "learning_rate": 3.0901551006741844e-07, "loss": 2.2891, "step": 569890 }, { "epoch": 0.99, "learning_rate": 3.081435701405916e-07, "loss": 2.2971, "step": 569900 }, { "epoch": 0.99, "learning_rate": 3.072716302137648e-07, "loss": 2.2429, "step": 569910 }, { "epoch": 0.99, "learning_rate": 3.06399690286938e-07, "loss": 2.1869, "step": 569920 }, { "epoch": 0.99, "learning_rate": 3.0552775036011124e-07, "loss": 2.1962, "step": 569930 }, { "epoch": 0.99, "learning_rate": 3.0465581043328443e-07, "loss": 2.242, "step": 569940 }, { "epoch": 0.99, "learning_rate": 3.037838705064576e-07, "loss": 2.3744, "step": 569950 }, { "epoch": 0.99, "learning_rate": 3.029119305796308e-07, "loss": 2.2076, "step": 569960 }, { "epoch": 0.99, "learning_rate": 3.02039990652804e-07, "loss": 2.399, "step": 569970 }, { "epoch": 0.99, "learning_rate": 3.0116805072597723e-07, "loss": 2.1036, "step": 569980 }, { "epoch": 0.99, "learning_rate": 3.002961107991504e-07, "loss": 2.3789, "step": 569990 }, { "epoch": 0.99, "learning_rate": 2.994241708723236e-07, "loss": 2.3943, "step": 570000 }, { "epoch": 0.99, "learning_rate": 2.985522309454968e-07, "loss": 2.2626, "step": 570010 }, { "epoch": 0.99, "learning_rate": 2.9768029101867e-07, "loss": 2.2144, "step": 570020 }, { "epoch": 0.99, "learning_rate": 2.968083510918432e-07, "loss": 2.1759, "step": 570030 }, { "epoch": 0.99, "learning_rate": 2.959364111650164e-07, "loss": 2.3283, "step": 570040 }, { "epoch": 0.99, "learning_rate": 2.950644712381896e-07, "loss": 2.2905, "step": 570050 }, { "epoch": 0.99, "learning_rate": 2.941925313113628e-07, "loss": 2.2766, "step": 570060 }, { "epoch": 0.99, "learning_rate": 2.9332059138453597e-07, "loss": 2.2118, "step": 570070 }, { "epoch": 0.99, "learning_rate": 2.924486514577092e-07, "loss": 2.3283, "step": 570080 }, { "epoch": 0.99, "learning_rate": 2.915767115308824e-07, "loss": 2.3458, "step": 570090 }, { "epoch": 0.99, "learning_rate": 2.907047716040556e-07, "loss": 2.2024, "step": 570100 }, { "epoch": 0.99, "learning_rate": 2.898328316772288e-07, "loss": 2.1396, "step": 570110 }, { "epoch": 0.99, "learning_rate": 2.8896089175040196e-07, "loss": 2.1422, "step": 570120 }, { "epoch": 0.99, "learning_rate": 2.880889518235752e-07, "loss": 2.2124, "step": 570130 }, { "epoch": 0.99, "learning_rate": 2.872170118967484e-07, "loss": 2.2138, "step": 570140 }, { "epoch": 0.99, "learning_rate": 2.863450719699216e-07, "loss": 2.2987, "step": 570150 }, { "epoch": 0.99, "learning_rate": 2.8547313204309477e-07, "loss": 2.3429, "step": 570160 }, { "epoch": 0.99, "learning_rate": 2.8460119211626795e-07, "loss": 2.2576, "step": 570170 }, { "epoch": 0.99, "learning_rate": 2.837292521894412e-07, "loss": 2.3013, "step": 570180 }, { "epoch": 0.99, "learning_rate": 2.828573122626144e-07, "loss": 2.2701, "step": 570190 }, { "epoch": 0.99, "learning_rate": 2.8198537233578757e-07, "loss": 2.2244, "step": 570200 }, { "epoch": 0.99, "learning_rate": 2.8111343240896076e-07, "loss": 2.206, "step": 570210 }, { "epoch": 0.99, "learning_rate": 2.8024149248213395e-07, "loss": 2.3379, "step": 570220 }, { "epoch": 0.99, "learning_rate": 2.793695525553072e-07, "loss": 2.2151, "step": 570230 }, { "epoch": 0.99, "learning_rate": 2.7849761262848037e-07, "loss": 2.166, "step": 570240 }, { "epoch": 0.99, "learning_rate": 2.7762567270165356e-07, "loss": 2.2287, "step": 570250 }, { "epoch": 0.99, "learning_rate": 2.7675373277482675e-07, "loss": 2.277, "step": 570260 }, { "epoch": 0.99, "learning_rate": 2.7588179284799994e-07, "loss": 2.1623, "step": 570270 }, { "epoch": 0.99, "learning_rate": 2.750098529211732e-07, "loss": 2.3518, "step": 570280 }, { "epoch": 0.99, "learning_rate": 2.7413791299434636e-07, "loss": 2.1459, "step": 570290 }, { "epoch": 0.99, "learning_rate": 2.7326597306751955e-07, "loss": 2.2724, "step": 570300 }, { "epoch": 0.99, "learning_rate": 2.7239403314069274e-07, "loss": 2.1716, "step": 570310 }, { "epoch": 0.99, "learning_rate": 2.7152209321386593e-07, "loss": 2.2358, "step": 570320 }, { "epoch": 0.99, "learning_rate": 2.7065015328703917e-07, "loss": 2.1858, "step": 570330 }, { "epoch": 0.99, "learning_rate": 2.6977821336021236e-07, "loss": 2.1741, "step": 570340 }, { "epoch": 0.99, "learning_rate": 2.6890627343338554e-07, "loss": 2.2891, "step": 570350 }, { "epoch": 0.99, "learning_rate": 2.6803433350655873e-07, "loss": 2.3151, "step": 570360 }, { "epoch": 0.99, "learning_rate": 2.671623935797319e-07, "loss": 2.308, "step": 570370 }, { "epoch": 0.99, "learning_rate": 2.6629045365290516e-07, "loss": 2.2182, "step": 570380 }, { "epoch": 0.99, "learning_rate": 2.6541851372607835e-07, "loss": 2.1339, "step": 570390 }, { "epoch": 0.99, "learning_rate": 2.6454657379925153e-07, "loss": 2.2786, "step": 570400 }, { "epoch": 0.99, "learning_rate": 2.636746338724247e-07, "loss": 2.2791, "step": 570410 }, { "epoch": 0.99, "learning_rate": 2.628026939455979e-07, "loss": 2.3565, "step": 570420 }, { "epoch": 0.99, "learning_rate": 2.6193075401877115e-07, "loss": 2.3134, "step": 570430 }, { "epoch": 0.99, "learning_rate": 2.6105881409194434e-07, "loss": 2.2277, "step": 570440 }, { "epoch": 0.99, "learning_rate": 2.601868741651175e-07, "loss": 2.2907, "step": 570450 }, { "epoch": 0.99, "learning_rate": 2.593149342382907e-07, "loss": 2.2832, "step": 570460 }, { "epoch": 0.99, "learning_rate": 2.584429943114639e-07, "loss": 2.1163, "step": 570470 }, { "epoch": 0.99, "learning_rate": 2.5757105438463714e-07, "loss": 2.3437, "step": 570480 }, { "epoch": 0.99, "learning_rate": 2.5669911445781033e-07, "loss": 2.3424, "step": 570490 }, { "epoch": 0.99, "learning_rate": 2.558271745309835e-07, "loss": 2.1433, "step": 570500 }, { "epoch": 0.99, "learning_rate": 2.549552346041567e-07, "loss": 2.2962, "step": 570510 }, { "epoch": 0.99, "learning_rate": 2.540832946773299e-07, "loss": 2.3742, "step": 570520 }, { "epoch": 0.99, "learning_rate": 2.5321135475050313e-07, "loss": 2.2036, "step": 570530 }, { "epoch": 0.99, "learning_rate": 2.523394148236763e-07, "loss": 2.1495, "step": 570540 }, { "epoch": 0.99, "learning_rate": 2.514674748968495e-07, "loss": 2.2853, "step": 570550 }, { "epoch": 0.99, "learning_rate": 2.505955349700227e-07, "loss": 2.2481, "step": 570560 }, { "epoch": 1.0, "learning_rate": 2.4972359504319593e-07, "loss": 2.2966, "step": 570570 }, { "epoch": 1.0, "learning_rate": 2.488516551163691e-07, "loss": 2.2475, "step": 570580 }, { "epoch": 1.0, "learning_rate": 2.479797151895423e-07, "loss": 2.2644, "step": 570590 }, { "epoch": 1.0, "learning_rate": 2.471077752627155e-07, "loss": 2.2854, "step": 570600 }, { "epoch": 1.0, "learning_rate": 2.462358353358887e-07, "loss": 2.3998, "step": 570610 }, { "epoch": 1.0, "learning_rate": 2.453638954090619e-07, "loss": 2.2439, "step": 570620 }, { "epoch": 1.0, "learning_rate": 2.444919554822351e-07, "loss": 2.255, "step": 570630 }, { "epoch": 1.0, "learning_rate": 2.436200155554083e-07, "loss": 2.1877, "step": 570640 }, { "epoch": 1.0, "learning_rate": 2.427480756285815e-07, "loss": 2.3246, "step": 570650 }, { "epoch": 1.0, "learning_rate": 2.418761357017547e-07, "loss": 2.3867, "step": 570660 }, { "epoch": 1.0, "learning_rate": 2.410041957749279e-07, "loss": 2.3208, "step": 570670 }, { "epoch": 1.0, "learning_rate": 2.401322558481011e-07, "loss": 2.2254, "step": 570680 }, { "epoch": 1.0, "learning_rate": 2.392603159212743e-07, "loss": 2.2459, "step": 570690 }, { "epoch": 1.0, "learning_rate": 2.383883759944475e-07, "loss": 2.3352, "step": 570700 }, { "epoch": 1.0, "learning_rate": 2.375164360676207e-07, "loss": 2.1953, "step": 570710 }, { "epoch": 1.0, "learning_rate": 2.366444961407939e-07, "loss": 2.2773, "step": 570720 }, { "epoch": 1.0, "learning_rate": 2.357725562139671e-07, "loss": 2.2529, "step": 570730 }, { "epoch": 1.0, "learning_rate": 2.3490061628714028e-07, "loss": 2.2226, "step": 570740 }, { "epoch": 1.0, "learning_rate": 2.340286763603135e-07, "loss": 2.1657, "step": 570750 }, { "epoch": 1.0, "learning_rate": 2.3315673643348668e-07, "loss": 2.2381, "step": 570760 }, { "epoch": 1.0, "learning_rate": 2.322847965066599e-07, "loss": 2.1947, "step": 570770 }, { "epoch": 1.0, "learning_rate": 2.3141285657983308e-07, "loss": 2.2158, "step": 570780 }, { "epoch": 1.0, "learning_rate": 2.305409166530063e-07, "loss": 2.1701, "step": 570790 }, { "epoch": 1.0, "learning_rate": 2.2966897672617949e-07, "loss": 2.0989, "step": 570800 }, { "epoch": 1.0, "learning_rate": 2.2879703679935267e-07, "loss": 2.3187, "step": 570810 }, { "epoch": 1.0, "learning_rate": 2.279250968725259e-07, "loss": 2.289, "step": 570820 }, { "epoch": 1.0, "learning_rate": 2.270531569456991e-07, "loss": 2.3191, "step": 570830 }, { "epoch": 1.0, "learning_rate": 2.261812170188723e-07, "loss": 2.1839, "step": 570840 }, { "epoch": 1.0, "learning_rate": 2.2530927709204548e-07, "loss": 2.2369, "step": 570850 }, { "epoch": 1.0, "learning_rate": 2.2443733716521866e-07, "loss": 2.2265, "step": 570860 }, { "epoch": 1.0, "learning_rate": 2.235653972383919e-07, "loss": 2.2467, "step": 570870 }, { "epoch": 1.0, "learning_rate": 2.226934573115651e-07, "loss": 2.2648, "step": 570880 }, { "epoch": 1.0, "learning_rate": 2.2182151738473828e-07, "loss": 2.3264, "step": 570890 }, { "epoch": 1.0, "learning_rate": 2.2094957745791147e-07, "loss": 2.3239, "step": 570900 }, { "epoch": 1.0, "learning_rate": 2.2007763753108466e-07, "loss": 2.2935, "step": 570910 }, { "epoch": 1.0, "learning_rate": 2.192056976042579e-07, "loss": 2.2595, "step": 570920 }, { "epoch": 1.0, "learning_rate": 2.1833375767743108e-07, "loss": 2.2326, "step": 570930 }, { "epoch": 1.0, "learning_rate": 2.1746181775060427e-07, "loss": 2.3095, "step": 570940 }, { "epoch": 1.0, "learning_rate": 2.1658987782377746e-07, "loss": 2.236, "step": 570950 }, { "epoch": 1.0, "learning_rate": 2.1571793789695065e-07, "loss": 2.2673, "step": 570960 }, { "epoch": 1.0, "learning_rate": 2.148459979701239e-07, "loss": 2.2999, "step": 570970 }, { "epoch": 1.0, "learning_rate": 2.1397405804329707e-07, "loss": 2.2222, "step": 570980 }, { "epoch": 1.0, "learning_rate": 2.1310211811647026e-07, "loss": 2.1431, "step": 570990 }, { "epoch": 1.0, "learning_rate": 2.1223017818964345e-07, "loss": 2.2585, "step": 571000 }, { "epoch": 1.0, "learning_rate": 2.1135823826281664e-07, "loss": 2.2673, "step": 571010 }, { "epoch": 1.0, "learning_rate": 2.1048629833598988e-07, "loss": 2.2994, "step": 571020 }, { "epoch": 1.0, "learning_rate": 2.0961435840916307e-07, "loss": 2.2457, "step": 571030 }, { "epoch": 1.0, "learning_rate": 2.0874241848233625e-07, "loss": 2.2806, "step": 571040 }, { "epoch": 1.0, "learning_rate": 2.0787047855550944e-07, "loss": 2.2804, "step": 571050 }, { "epoch": 1.0, "learning_rate": 2.0699853862868263e-07, "loss": 2.456, "step": 571060 }, { "epoch": 1.0, "learning_rate": 2.0612659870185587e-07, "loss": 2.2934, "step": 571070 }, { "epoch": 1.0, "learning_rate": 2.0525465877502906e-07, "loss": 2.2359, "step": 571080 }, { "epoch": 1.0, "learning_rate": 2.0438271884820224e-07, "loss": 2.2754, "step": 571090 }, { "epoch": 1.0, "learning_rate": 2.0351077892137543e-07, "loss": 2.3558, "step": 571100 }, { "epoch": 1.0, "learning_rate": 2.0263883899454862e-07, "loss": 2.2218, "step": 571110 }, { "epoch": 1.0, "learning_rate": 2.0176689906772186e-07, "loss": 2.2544, "step": 571120 }, { "epoch": 1.0, "learning_rate": 2.0089495914089505e-07, "loss": 2.2827, "step": 571130 }, { "epoch": 1.0, "learning_rate": 2.0002301921406823e-07, "loss": 2.1714, "step": 571140 }, { "epoch": 1.0, "learning_rate": 1.9915107928724142e-07, "loss": 2.2969, "step": 571150 }, { "epoch": 1.0, "learning_rate": 1.982791393604146e-07, "loss": 2.3732, "step": 571160 }, { "epoch": 1.0, "learning_rate": 1.9740719943358785e-07, "loss": 2.3197, "step": 571170 }, { "epoch": 1.0, "learning_rate": 1.9653525950676104e-07, "loss": 2.281, "step": 571180 }, { "epoch": 1.0, "learning_rate": 1.9566331957993423e-07, "loss": 2.3257, "step": 571190 }, { "epoch": 1.0, "learning_rate": 1.9479137965310744e-07, "loss": 2.2665, "step": 571200 }, { "epoch": 1.0, "learning_rate": 1.9391943972628063e-07, "loss": 2.3043, "step": 571210 }, { "epoch": 1.0, "learning_rate": 1.9304749979945381e-07, "loss": 2.2255, "step": 571220 }, { "epoch": 1.0, "learning_rate": 1.9217555987262703e-07, "loss": 2.1702, "step": 571230 }, { "epoch": 1.0, "learning_rate": 1.9130361994580022e-07, "loss": 2.2863, "step": 571240 }, { "epoch": 1.0, "learning_rate": 1.9043168001897343e-07, "loss": 2.2577, "step": 571250 }, { "epoch": 1.0, "learning_rate": 1.8955974009214662e-07, "loss": 2.2701, "step": 571260 }, { "epoch": 1.0, "learning_rate": 1.886878001653198e-07, "loss": 2.1525, "step": 571270 }, { "epoch": 1.0, "learning_rate": 1.8781586023849302e-07, "loss": 2.1675, "step": 571280 }, { "epoch": 1.0, "learning_rate": 1.869439203116662e-07, "loss": 2.2049, "step": 571290 }, { "epoch": 1.0, "learning_rate": 1.8607198038483942e-07, "loss": 2.264, "step": 571300 }, { "epoch": 1.0, "learning_rate": 1.852000404580126e-07, "loss": 2.3672, "step": 571310 }, { "epoch": 1.0, "learning_rate": 1.843281005311858e-07, "loss": 2.084, "step": 571320 }, { "epoch": 1.0, "learning_rate": 1.83456160604359e-07, "loss": 2.3284, "step": 571330 }, { "epoch": 1.0, "learning_rate": 1.825842206775322e-07, "loss": 2.3041, "step": 571340 }, { "epoch": 1.0, "learning_rate": 1.817122807507054e-07, "loss": 2.2113, "step": 571350 }, { "epoch": 1.0, "learning_rate": 1.808403408238786e-07, "loss": 2.3083, "step": 571360 }, { "epoch": 1.0, "learning_rate": 1.799684008970518e-07, "loss": 2.2247, "step": 571370 }, { "epoch": 1.0, "learning_rate": 1.79096460970225e-07, "loss": 2.2277, "step": 571380 }, { "epoch": 1.0, "learning_rate": 1.782245210433982e-07, "loss": 2.1567, "step": 571390 }, { "epoch": 1.0, "learning_rate": 1.773525811165714e-07, "loss": 2.3178, "step": 571400 }, { "epoch": 1.0, "learning_rate": 1.764806411897446e-07, "loss": 2.226, "step": 571410 }, { "epoch": 1.0, "learning_rate": 1.7560870126291778e-07, "loss": 2.2858, "step": 571420 }, { "epoch": 1.0, "learning_rate": 1.74736761336091e-07, "loss": 2.203, "step": 571430 }, { "epoch": 1.0, "learning_rate": 1.7386482140926418e-07, "loss": 2.2729, "step": 571440 }, { "epoch": 1.0, "learning_rate": 1.729928814824374e-07, "loss": 2.1332, "step": 571450 }, { "epoch": 1.0, "learning_rate": 1.7212094155561058e-07, "loss": 2.2319, "step": 571460 }, { "epoch": 1.0, "learning_rate": 1.712490016287838e-07, "loss": 2.2906, "step": 571470 }, { "epoch": 1.0, "learning_rate": 1.7037706170195698e-07, "loss": 2.1907, "step": 571480 }, { "epoch": 1.0, "learning_rate": 1.6950512177513017e-07, "loss": 2.2036, "step": 571490 }, { "epoch": 1.0, "learning_rate": 1.6863318184830338e-07, "loss": 2.2807, "step": 571500 }, { "epoch": 1.0, "learning_rate": 1.6776124192147657e-07, "loss": 2.3081, "step": 571510 }, { "epoch": 1.0, "learning_rate": 1.6688930199464979e-07, "loss": 2.2331, "step": 571520 }, { "epoch": 1.0, "learning_rate": 1.6601736206782297e-07, "loss": 2.1752, "step": 571530 }, { "epoch": 1.0, "learning_rate": 1.6514542214099616e-07, "loss": 2.3517, "step": 571540 }, { "epoch": 1.0, "learning_rate": 1.6427348221416938e-07, "loss": 2.2649, "step": 571550 }, { "epoch": 1.0, "learning_rate": 1.6340154228734256e-07, "loss": 2.2415, "step": 571560 }, { "epoch": 1.0, "learning_rate": 1.6252960236051578e-07, "loss": 2.2963, "step": 571570 }, { "epoch": 1.0, "learning_rate": 1.6165766243368896e-07, "loss": 2.2559, "step": 571580 }, { "epoch": 1.0, "learning_rate": 1.6078572250686218e-07, "loss": 2.2868, "step": 571590 }, { "epoch": 1.0, "learning_rate": 1.5991378258003537e-07, "loss": 2.1464, "step": 571600 }, { "epoch": 1.0, "learning_rate": 1.5904184265320858e-07, "loss": 2.3577, "step": 571610 }, { "epoch": 1.0, "learning_rate": 1.5816990272638177e-07, "loss": 2.0768, "step": 571620 }, { "epoch": 1.0, "learning_rate": 1.5729796279955498e-07, "loss": 2.2744, "step": 571630 }, { "epoch": 1.0, "learning_rate": 1.5642602287272817e-07, "loss": 2.1728, "step": 571640 }, { "epoch": 1.0, "learning_rate": 1.5555408294590138e-07, "loss": 2.3516, "step": 571650 }, { "epoch": 1.0, "learning_rate": 1.5468214301907457e-07, "loss": 2.2486, "step": 571660 }, { "epoch": 1.0, "learning_rate": 1.5381020309224778e-07, "loss": 2.394, "step": 571670 }, { "epoch": 1.0, "learning_rate": 1.5293826316542097e-07, "loss": 2.1967, "step": 571680 }, { "epoch": 1.0, "learning_rate": 1.5206632323859416e-07, "loss": 2.2046, "step": 571690 }, { "epoch": 1.0, "learning_rate": 1.5119438331176737e-07, "loss": 2.2563, "step": 571700 }, { "epoch": 1.0, "learning_rate": 1.5032244338494056e-07, "loss": 2.293, "step": 571710 }, { "epoch": 1.0, "learning_rate": 1.4945050345811378e-07, "loss": 2.3405, "step": 571720 }, { "epoch": 1.0, "learning_rate": 1.4857856353128696e-07, "loss": 2.2204, "step": 571730 }, { "epoch": 1.0, "learning_rate": 1.4770662360446015e-07, "loss": 2.2555, "step": 571740 }, { "epoch": 1.0, "learning_rate": 1.4683468367763336e-07, "loss": 2.3056, "step": 571750 }, { "epoch": 1.0, "learning_rate": 1.4596274375080655e-07, "loss": 2.2958, "step": 571760 }, { "epoch": 1.0, "learning_rate": 1.4509080382397977e-07, "loss": 2.2775, "step": 571770 }, { "epoch": 1.0, "learning_rate": 1.4421886389715295e-07, "loss": 2.2433, "step": 571780 }, { "epoch": 1.0, "learning_rate": 1.4334692397032617e-07, "loss": 2.2202, "step": 571790 }, { "epoch": 1.0, "learning_rate": 1.4247498404349936e-07, "loss": 2.2256, "step": 571800 }, { "epoch": 1.0, "learning_rate": 1.4160304411667254e-07, "loss": 2.3036, "step": 571810 }, { "epoch": 1.0, "learning_rate": 1.4073110418984576e-07, "loss": 2.2836, "step": 571820 }, { "epoch": 1.0, "learning_rate": 1.3985916426301894e-07, "loss": 2.3317, "step": 571830 }, { "epoch": 1.0, "learning_rate": 1.3898722433619216e-07, "loss": 2.2606, "step": 571840 }, { "epoch": 1.0, "learning_rate": 1.3811528440936535e-07, "loss": 2.2207, "step": 571850 }, { "epoch": 1.0, "learning_rate": 1.3724334448253853e-07, "loss": 2.0733, "step": 571860 }, { "epoch": 1.0, "learning_rate": 1.3637140455571175e-07, "loss": 2.342, "step": 571870 }, { "epoch": 1.0, "learning_rate": 1.3549946462888494e-07, "loss": 2.2708, "step": 571880 }, { "epoch": 1.0, "learning_rate": 1.3462752470205815e-07, "loss": 2.3228, "step": 571890 }, { "epoch": 1.0, "learning_rate": 1.3375558477523134e-07, "loss": 2.2903, "step": 571900 }, { "epoch": 1.0, "learning_rate": 1.3288364484840452e-07, "loss": 2.2413, "step": 571910 }, { "epoch": 1.0, "learning_rate": 1.3201170492157774e-07, "loss": 2.2956, "step": 571920 }, { "epoch": 1.0, "learning_rate": 1.3113976499475093e-07, "loss": 2.2222, "step": 571930 }, { "epoch": 1.0, "learning_rate": 1.3026782506792414e-07, "loss": 2.3066, "step": 571940 }, { "epoch": 1.0, "learning_rate": 1.2939588514109733e-07, "loss": 2.1829, "step": 571950 }, { "epoch": 1.0, "learning_rate": 1.2852394521427052e-07, "loss": 2.1684, "step": 571960 }, { "epoch": 1.0, "learning_rate": 1.2765200528744373e-07, "loss": 2.2244, "step": 571970 }, { "epoch": 1.0, "learning_rate": 1.2678006536061692e-07, "loss": 2.3193, "step": 571980 }, { "epoch": 1.0, "learning_rate": 1.2590812543379013e-07, "loss": 2.3487, "step": 571990 }, { "epoch": 1.0, "learning_rate": 1.2503618550696332e-07, "loss": 2.2199, "step": 572000 }, { "epoch": 1.0, "learning_rate": 1.241642455801365e-07, "loss": 2.3133, "step": 572010 }, { "epoch": 1.0, "learning_rate": 1.2329230565330972e-07, "loss": 2.2798, "step": 572020 }, { "epoch": 1.0, "learning_rate": 1.224203657264829e-07, "loss": 2.2046, "step": 572030 }, { "epoch": 1.0, "learning_rate": 1.2154842579965612e-07, "loss": 2.3744, "step": 572040 }, { "epoch": 1.0, "learning_rate": 1.206764858728293e-07, "loss": 2.4191, "step": 572050 }, { "epoch": 1.0, "learning_rate": 1.198045459460025e-07, "loss": 2.2782, "step": 572060 }, { "epoch": 1.0, "learning_rate": 1.1893260601917571e-07, "loss": 2.2361, "step": 572070 }, { "epoch": 1.0, "learning_rate": 1.180606660923489e-07, "loss": 2.2564, "step": 572080 }, { "epoch": 1.0, "learning_rate": 1.1718872616552211e-07, "loss": 2.3162, "step": 572090 }, { "epoch": 1.0, "learning_rate": 1.163167862386953e-07, "loss": 2.0648, "step": 572100 }, { "epoch": 1.0, "learning_rate": 1.1544484631186849e-07, "loss": 2.2619, "step": 572110 }, { "epoch": 1.0, "learning_rate": 1.145729063850417e-07, "loss": 2.2279, "step": 572120 }, { "epoch": 1.0, "learning_rate": 1.1370096645821489e-07, "loss": 2.2867, "step": 572130 }, { "epoch": 1.0, "learning_rate": 1.128290265313881e-07, "loss": 2.2815, "step": 572140 }, { "epoch": 1.0, "learning_rate": 1.1195708660456129e-07, "loss": 2.2185, "step": 572150 }, { "epoch": 1.0, "learning_rate": 1.110851466777345e-07, "loss": 2.2817, "step": 572160 }, { "epoch": 1.0, "learning_rate": 1.1021320675090769e-07, "loss": 2.3216, "step": 572170 }, { "epoch": 1.0, "learning_rate": 1.0934126682408088e-07, "loss": 2.2245, "step": 572180 }, { "epoch": 1.0, "learning_rate": 1.084693268972541e-07, "loss": 2.1478, "step": 572190 }, { "epoch": 1.0, "learning_rate": 1.0759738697042728e-07, "loss": 2.262, "step": 572200 }, { "epoch": 1.0, "learning_rate": 1.067254470436005e-07, "loss": 2.2436, "step": 572210 }, { "epoch": 1.0, "learning_rate": 1.0585350711677368e-07, "loss": 2.1952, "step": 572220 }, { "epoch": 1.0, "learning_rate": 1.0498156718994688e-07, "loss": 2.1884, "step": 572230 }, { "epoch": 1.0, "learning_rate": 1.0410962726312009e-07, "loss": 2.296, "step": 572240 }, { "epoch": 1.0, "learning_rate": 1.0323768733629329e-07, "loss": 2.4044, "step": 572250 }, { "epoch": 1.0, "learning_rate": 1.0236574740946649e-07, "loss": 2.2555, "step": 572260 }, { "epoch": 1.0, "learning_rate": 1.0149380748263969e-07, "loss": 2.3379, "step": 572270 }, { "epoch": 1.0, "learning_rate": 1.0062186755581288e-07, "loss": 2.2583, "step": 572280 }, { "epoch": 1.0, "learning_rate": 9.974992762898608e-08, "loss": 2.2032, "step": 572290 }, { "epoch": 1.0, "learning_rate": 9.887798770215928e-08, "loss": 2.3011, "step": 572300 }, { "epoch": 1.0, "learning_rate": 9.800604777533248e-08, "loss": 2.2918, "step": 572310 }, { "epoch": 1.0, "learning_rate": 9.713410784850568e-08, "loss": 2.2356, "step": 572320 }, { "epoch": 1.0, "learning_rate": 9.626216792167888e-08, "loss": 2.2875, "step": 572330 }, { "epoch": 1.0, "learning_rate": 9.539022799485208e-08, "loss": 2.2941, "step": 572340 }, { "epoch": 1.0, "learning_rate": 9.451828806802527e-08, "loss": 2.3867, "step": 572350 }, { "epoch": 1.0, "learning_rate": 9.364634814119847e-08, "loss": 2.2459, "step": 572360 }, { "epoch": 1.0, "learning_rate": 9.277440821437167e-08, "loss": 2.2183, "step": 572370 }, { "epoch": 1.0, "learning_rate": 9.190246828754487e-08, "loss": 2.2926, "step": 572380 }, { "epoch": 1.0, "learning_rate": 9.103052836071807e-08, "loss": 2.2461, "step": 572390 }, { "epoch": 1.0, "learning_rate": 9.015858843389126e-08, "loss": 2.172, "step": 572400 }, { "epoch": 1.0, "learning_rate": 8.928664850706446e-08, "loss": 2.2275, "step": 572410 }, { "epoch": 1.0, "learning_rate": 8.841470858023766e-08, "loss": 2.2887, "step": 572420 }, { "epoch": 1.0, "learning_rate": 8.754276865341086e-08, "loss": 2.2779, "step": 572430 }, { "epoch": 1.0, "learning_rate": 8.667082872658406e-08, "loss": 2.3215, "step": 572440 }, { "epoch": 1.0, "learning_rate": 8.579888879975726e-08, "loss": 2.2636, "step": 572450 }, { "epoch": 1.0, "learning_rate": 8.492694887293045e-08, "loss": 2.2799, "step": 572460 }, { "epoch": 1.0, "learning_rate": 8.405500894610365e-08, "loss": 2.346, "step": 572470 }, { "epoch": 1.0, "learning_rate": 8.318306901927685e-08, "loss": 2.231, "step": 572480 }, { "epoch": 1.0, "learning_rate": 8.231112909245005e-08, "loss": 2.2112, "step": 572490 }, { "epoch": 1.0, "learning_rate": 8.143918916562325e-08, "loss": 2.1321, "step": 572500 }, { "epoch": 1.0, "learning_rate": 8.056724923879644e-08, "loss": 2.2999, "step": 572510 }, { "epoch": 1.0, "learning_rate": 7.969530931196964e-08, "loss": 2.2748, "step": 572520 }, { "epoch": 1.0, "learning_rate": 7.882336938514284e-08, "loss": 2.2668, "step": 572530 }, { "epoch": 1.0, "learning_rate": 7.795142945831604e-08, "loss": 2.2804, "step": 572540 }, { "epoch": 1.0, "learning_rate": 7.707948953148924e-08, "loss": 2.1993, "step": 572550 }, { "epoch": 1.0, "learning_rate": 7.620754960466243e-08, "loss": 2.2971, "step": 572560 }, { "epoch": 1.0, "learning_rate": 7.533560967783563e-08, "loss": 2.1637, "step": 572570 }, { "epoch": 1.0, "learning_rate": 7.446366975100883e-08, "loss": 2.1807, "step": 572580 }, { "epoch": 1.0, "learning_rate": 7.359172982418203e-08, "loss": 2.3349, "step": 572590 }, { "epoch": 1.0, "learning_rate": 7.271978989735524e-08, "loss": 2.2716, "step": 572600 }, { "epoch": 1.0, "learning_rate": 7.184784997052844e-08, "loss": 2.2836, "step": 572610 }, { "epoch": 1.0, "learning_rate": 7.097591004370162e-08, "loss": 2.1811, "step": 572620 }, { "epoch": 1.0, "learning_rate": 7.010397011687482e-08, "loss": 2.3288, "step": 572630 }, { "epoch": 1.0, "learning_rate": 6.923203019004803e-08, "loss": 2.263, "step": 572640 }, { "epoch": 1.0, "learning_rate": 6.836009026322123e-08, "loss": 2.3822, "step": 572650 }, { "epoch": 1.0, "learning_rate": 6.748815033639443e-08, "loss": 2.2203, "step": 572660 }, { "epoch": 1.0, "learning_rate": 6.661621040956763e-08, "loss": 2.3216, "step": 572670 }, { "epoch": 1.0, "learning_rate": 6.574427048274083e-08, "loss": 2.3593, "step": 572680 }, { "epoch": 1.0, "learning_rate": 6.487233055591402e-08, "loss": 2.2006, "step": 572690 }, { "epoch": 1.0, "learning_rate": 6.400039062908722e-08, "loss": 2.2267, "step": 572700 }, { "epoch": 1.0, "learning_rate": 6.312845070226042e-08, "loss": 2.3224, "step": 572710 }, { "epoch": 1.0, "learning_rate": 6.225651077543362e-08, "loss": 2.2104, "step": 572720 }, { "epoch": 1.0, "learning_rate": 6.138457084860682e-08, "loss": 2.2341, "step": 572730 }, { "epoch": 1.0, "learning_rate": 6.051263092178002e-08, "loss": 2.2437, "step": 572740 }, { "epoch": 1.0, "learning_rate": 5.964069099495322e-08, "loss": 2.2385, "step": 572750 }, { "epoch": 1.0, "learning_rate": 5.8768751068126415e-08, "loss": 2.1971, "step": 572760 }, { "epoch": 1.0, "learning_rate": 5.7896811141299616e-08, "loss": 2.2889, "step": 572770 }, { "epoch": 1.0, "learning_rate": 5.702487121447281e-08, "loss": 2.2758, "step": 572780 }, { "epoch": 1.0, "learning_rate": 5.6152931287646004e-08, "loss": 2.3389, "step": 572790 }, { "epoch": 1.0, "learning_rate": 5.5280991360819205e-08, "loss": 2.255, "step": 572800 }, { "epoch": 1.0, "learning_rate": 5.4409051433992406e-08, "loss": 2.2077, "step": 572810 }, { "epoch": 1.0, "learning_rate": 5.3537111507165607e-08, "loss": 2.2487, "step": 572820 }, { "epoch": 1.0, "learning_rate": 5.26651715803388e-08, "loss": 2.3189, "step": 572830 }, { "epoch": 1.0, "learning_rate": 5.1793231653512e-08, "loss": 2.1325, "step": 572840 }, { "epoch": 1.0, "learning_rate": 5.09212917266852e-08, "loss": 2.0689, "step": 572850 }, { "epoch": 1.0, "learning_rate": 5.00493517998584e-08, "loss": 2.4129, "step": 572860 }, { "epoch": 1.0, "learning_rate": 4.9177411873031604e-08, "loss": 2.2581, "step": 572870 }, { "epoch": 1.0, "learning_rate": 4.83054719462048e-08, "loss": 2.1987, "step": 572880 }, { "epoch": 1.0, "learning_rate": 4.7433532019378e-08, "loss": 2.2559, "step": 572890 }, { "epoch": 1.0, "learning_rate": 4.656159209255119e-08, "loss": 2.332, "step": 572900 }, { "epoch": 1.0, "learning_rate": 4.5689652165724394e-08, "loss": 2.3371, "step": 572910 }, { "epoch": 1.0, "learning_rate": 4.481771223889759e-08, "loss": 2.1172, "step": 572920 }, { "epoch": 1.0, "learning_rate": 4.394577231207079e-08, "loss": 2.3212, "step": 572930 }, { "epoch": 1.0, "learning_rate": 4.307383238524399e-08, "loss": 2.1773, "step": 572940 }, { "epoch": 1.0, "learning_rate": 4.2201892458417184e-08, "loss": 2.2615, "step": 572950 }, { "epoch": 1.0, "learning_rate": 4.1329952531590385e-08, "loss": 2.3336, "step": 572960 }, { "epoch": 1.0, "learning_rate": 4.045801260476358e-08, "loss": 2.3124, "step": 572970 }, { "epoch": 1.0, "learning_rate": 3.958607267793678e-08, "loss": 2.254, "step": 572980 }, { "epoch": 1.0, "learning_rate": 3.871413275110998e-08, "loss": 2.1415, "step": 572990 }, { "epoch": 1.0, "learning_rate": 3.7842192824283175e-08, "loss": 2.2239, "step": 573000 } ], "max_steps": 573434, "num_train_epochs": 1, "total_flos": 4.504923244855296e+18, "trial_name": null, "trial_params": null }