diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 80.0, - "global_step": 27637760, + "epoch": 90.0, + "global_step": 31092480, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -332536,11 +332536,41575 @@ "eval_samples_per_second": 1313.752, "eval_steps_per_second": 54.74, "step": 27637760 + }, + { + "epoch": 80.0, + "learning_rate": 1.001402284410893e-05, + "loss": 1.8644, + "step": 27638000 + }, + { + "epoch": 80.0, + "learning_rate": 1.0013299196461654e-05, + "loss": 1.8433, + "step": 27638500 + }, + { + "epoch": 80.0, + "learning_rate": 1.0012576996109671e-05, + "loss": 1.871, + "step": 27639000 + }, + { + "epoch": 80.01, + "learning_rate": 1.0011853348462393e-05, + "loss": 1.827, + "step": 27639500 + }, + { + "epoch": 80.01, + "learning_rate": 1.0011129700815117e-05, + "loss": 1.8403, + "step": 27640000 + }, + { + "epoch": 80.01, + "learning_rate": 1.0010406053167841e-05, + "loss": 1.855, + "step": 27640500 + }, + { + "epoch": 80.01, + "learning_rate": 1.0009682405520563e-05, + "loss": 1.8528, + "step": 27641000 + }, + { + "epoch": 80.01, + "learning_rate": 1.0008958757873287e-05, + "loss": 1.8581, + "step": 27641500 + }, + { + "epoch": 80.01, + "learning_rate": 1.0008235110226011e-05, + "loss": 1.8319, + "step": 27642000 + }, + { + "epoch": 80.01, + "learning_rate": 1.0007511462578733e-05, + "loss": 1.8088, + "step": 27642500 + }, + { + "epoch": 80.02, + "learning_rate": 1.0006790709522046e-05, + "loss": 1.8774, + "step": 27643000 + }, + { + "epoch": 80.02, + "learning_rate": 1.000606706187477e-05, + "loss": 1.8237, + "step": 27643500 + }, + { + "epoch": 80.02, + "learning_rate": 1.0005343414227492e-05, + "loss": 1.832, + "step": 27644000 + }, + { + "epoch": 80.02, + "learning_rate": 1.0004619766580216e-05, + "loss": 1.8556, + "step": 27644500 + }, + { + "epoch": 80.02, + "learning_rate": 1.0003896118932938e-05, + "loss": 1.8505, + "step": 27645000 + }, + { + "epoch": 80.02, + "learning_rate": 1.0003172471285662e-05, + "loss": 1.8303, + "step": 27645500 + }, + { + "epoch": 80.02, + "learning_rate": 1.0002448823638386e-05, + "loss": 1.8412, + "step": 27646000 + }, + { + "epoch": 80.03, + "learning_rate": 1.0001725175991108e-05, + "loss": 1.8324, + "step": 27646500 + }, + { + "epoch": 80.03, + "learning_rate": 1.0001001528343832e-05, + "loss": 1.8264, + "step": 27647000 + }, + { + "epoch": 80.03, + "learning_rate": 1.0000277880696554e-05, + "loss": 1.8437, + "step": 27647500 + }, + { + "epoch": 80.03, + "learning_rate": 9.999554233049278e-06, + "loss": 1.8318, + "step": 27648000 + }, + { + "epoch": 80.03, + "learning_rate": 9.998832032697295e-06, + "loss": 1.8657, + "step": 27648500 + }, + { + "epoch": 80.03, + "learning_rate": 9.99810838505002e-06, + "loss": 1.8668, + "step": 27649000 + }, + { + "epoch": 80.03, + "learning_rate": 9.997384737402742e-06, + "loss": 1.8192, + "step": 27649500 + }, + { + "epoch": 80.04, + "learning_rate": 9.996661089755465e-06, + "loss": 1.8476, + "step": 27650000 + }, + { + "epoch": 80.04, + "learning_rate": 9.995938889403483e-06, + "loss": 1.8293, + "step": 27650500 + }, + { + "epoch": 80.04, + "learning_rate": 9.995215241756207e-06, + "loss": 1.8371, + "step": 27651000 + }, + { + "epoch": 80.04, + "learning_rate": 9.99449159410893e-06, + "loss": 1.831, + "step": 27651500 + }, + { + "epoch": 80.04, + "learning_rate": 9.993769393756948e-06, + "loss": 1.8493, + "step": 27652000 + }, + { + "epoch": 80.04, + "learning_rate": 9.99304574610967e-06, + "loss": 1.8303, + "step": 27652500 + }, + { + "epoch": 80.04, + "learning_rate": 9.992322098462394e-06, + "loss": 1.8191, + "step": 27653000 + }, + { + "epoch": 80.05, + "learning_rate": 9.991598450815118e-06, + "loss": 1.8201, + "step": 27653500 + }, + { + "epoch": 80.05, + "learning_rate": 9.99087480316784e-06, + "loss": 1.8283, + "step": 27654000 + }, + { + "epoch": 80.05, + "learning_rate": 9.990151155520564e-06, + "loss": 1.8234, + "step": 27654500 + }, + { + "epoch": 80.05, + "learning_rate": 9.989427507873286e-06, + "loss": 1.8271, + "step": 27655000 + }, + { + "epoch": 80.05, + "learning_rate": 9.98870386022601e-06, + "loss": 1.8273, + "step": 27655500 + }, + { + "epoch": 80.05, + "learning_rate": 9.987980212578734e-06, + "loss": 1.8282, + "step": 27656000 + }, + { + "epoch": 80.05, + "learning_rate": 9.987258012226751e-06, + "loss": 1.8412, + "step": 27656500 + }, + { + "epoch": 80.06, + "learning_rate": 9.986534364579474e-06, + "loss": 1.8249, + "step": 27657000 + }, + { + "epoch": 80.06, + "learning_rate": 9.985810716932198e-06, + "loss": 1.8391, + "step": 27657500 + }, + { + "epoch": 80.06, + "learning_rate": 9.985087069284921e-06, + "loss": 1.8461, + "step": 27658000 + }, + { + "epoch": 80.06, + "learning_rate": 9.984363421637644e-06, + "loss": 1.844, + "step": 27658500 + }, + { + "epoch": 80.06, + "learning_rate": 9.983639773990368e-06, + "loss": 1.8462, + "step": 27659000 + }, + { + "epoch": 80.06, + "learning_rate": 9.98291612634309e-06, + "loss": 1.8083, + "step": 27659500 + }, + { + "epoch": 80.06, + "learning_rate": 9.982193925991109e-06, + "loss": 1.8099, + "step": 27660000 + }, + { + "epoch": 80.07, + "learning_rate": 9.981470278343831e-06, + "loss": 1.8519, + "step": 27660500 + }, + { + "epoch": 80.07, + "learning_rate": 9.98074807799185e-06, + "loss": 1.8394, + "step": 27661000 + }, + { + "epoch": 80.07, + "learning_rate": 9.980024430344572e-06, + "loss": 1.8224, + "step": 27661500 + }, + { + "epoch": 80.07, + "learning_rate": 9.979300782697296e-06, + "loss": 1.8759, + "step": 27662000 + }, + { + "epoch": 80.07, + "learning_rate": 9.978577135050018e-06, + "loss": 1.8483, + "step": 27662500 + }, + { + "epoch": 80.07, + "learning_rate": 9.977853487402742e-06, + "loss": 1.8401, + "step": 27663000 + }, + { + "epoch": 80.07, + "learning_rate": 9.977129839755466e-06, + "loss": 1.8655, + "step": 27663500 + }, + { + "epoch": 80.08, + "learning_rate": 9.976406192108188e-06, + "loss": 1.8436, + "step": 27664000 + }, + { + "epoch": 80.08, + "learning_rate": 9.975682544460912e-06, + "loss": 1.8348, + "step": 27664500 + }, + { + "epoch": 80.08, + "learning_rate": 9.974958896813635e-06, + "loss": 1.8263, + "step": 27665000 + }, + { + "epoch": 80.08, + "learning_rate": 9.974236696461654e-06, + "loss": 1.8617, + "step": 27665500 + }, + { + "epoch": 80.08, + "learning_rate": 9.973515943404966e-06, + "loss": 1.8325, + "step": 27666000 + }, + { + "epoch": 80.08, + "learning_rate": 9.972792295757688e-06, + "loss": 1.8528, + "step": 27666500 + }, + { + "epoch": 80.08, + "learning_rate": 9.972068648110412e-06, + "loss": 1.8486, + "step": 27667000 + }, + { + "epoch": 80.09, + "learning_rate": 9.971345000463136e-06, + "loss": 1.8331, + "step": 27667500 + }, + { + "epoch": 80.09, + "learning_rate": 9.970621352815858e-06, + "loss": 1.8281, + "step": 27668000 + }, + { + "epoch": 80.09, + "learning_rate": 9.969897705168582e-06, + "loss": 1.8552, + "step": 27668500 + }, + { + "epoch": 80.09, + "learning_rate": 9.969174057521304e-06, + "loss": 1.8315, + "step": 27669000 + }, + { + "epoch": 80.09, + "learning_rate": 9.968450409874028e-06, + "loss": 1.8378, + "step": 27669500 + }, + { + "epoch": 80.09, + "learning_rate": 9.96772676222675e-06, + "loss": 1.7938, + "step": 27670000 + }, + { + "epoch": 80.09, + "learning_rate": 9.967003114579474e-06, + "loss": 1.8326, + "step": 27670500 + }, + { + "epoch": 80.1, + "learning_rate": 9.966279466932198e-06, + "loss": 1.8635, + "step": 27671000 + }, + { + "epoch": 80.1, + "learning_rate": 9.96555581928492e-06, + "loss": 1.8402, + "step": 27671500 + }, + { + "epoch": 80.1, + "learning_rate": 9.964832171637644e-06, + "loss": 1.8225, + "step": 27672000 + }, + { + "epoch": 80.1, + "learning_rate": 9.964108523990367e-06, + "loss": 1.8161, + "step": 27672500 + }, + { + "epoch": 80.1, + "learning_rate": 9.96338487634309e-06, + "loss": 1.8316, + "step": 27673000 + }, + { + "epoch": 80.1, + "learning_rate": 9.962661228695813e-06, + "loss": 1.847, + "step": 27673500 + }, + { + "epoch": 80.1, + "learning_rate": 9.961939028343832e-06, + "loss": 1.8424, + "step": 27674000 + }, + { + "epoch": 80.11, + "learning_rate": 9.961215380696556e-06, + "loss": 1.8444, + "step": 27674500 + }, + { + "epoch": 80.11, + "learning_rate": 9.960491733049278e-06, + "loss": 1.8479, + "step": 27675000 + }, + { + "epoch": 80.11, + "learning_rate": 9.959768085402e-06, + "loss": 1.8371, + "step": 27675500 + }, + { + "epoch": 80.11, + "learning_rate": 9.959044437754724e-06, + "loss": 1.8227, + "step": 27676000 + }, + { + "epoch": 80.11, + "learning_rate": 9.958322237402743e-06, + "loss": 1.8427, + "step": 27676500 + }, + { + "epoch": 80.11, + "learning_rate": 9.957598589755465e-06, + "loss": 1.8406, + "step": 27677000 + }, + { + "epoch": 80.12, + "learning_rate": 9.956874942108188e-06, + "loss": 1.8354, + "step": 27677500 + }, + { + "epoch": 80.12, + "learning_rate": 9.956152741756207e-06, + "loss": 1.8422, + "step": 27678000 + }, + { + "epoch": 80.12, + "learning_rate": 9.95542909410893e-06, + "loss": 1.8564, + "step": 27678500 + }, + { + "epoch": 80.12, + "learning_rate": 9.954705446461653e-06, + "loss": 1.8405, + "step": 27679000 + }, + { + "epoch": 80.12, + "learning_rate": 9.953981798814375e-06, + "loss": 1.8881, + "step": 27679500 + }, + { + "epoch": 80.12, + "learning_rate": 9.9532581511671e-06, + "loss": 1.8583, + "step": 27680000 + }, + { + "epoch": 80.12, + "learning_rate": 9.952534503519823e-06, + "loss": 1.8551, + "step": 27680500 + }, + { + "epoch": 80.13, + "learning_rate": 9.951810855872545e-06, + "loss": 1.8598, + "step": 27681000 + }, + { + "epoch": 80.13, + "learning_rate": 9.951087208225269e-06, + "loss": 1.8564, + "step": 27681500 + }, + { + "epoch": 80.13, + "learning_rate": 9.950363560577993e-06, + "loss": 1.833, + "step": 27682000 + }, + { + "epoch": 80.13, + "learning_rate": 9.94964136022601e-06, + "loss": 1.8056, + "step": 27682500 + }, + { + "epoch": 80.13, + "learning_rate": 9.948917712578732e-06, + "loss": 1.8523, + "step": 27683000 + }, + { + "epoch": 80.13, + "learning_rate": 9.948194064931456e-06, + "loss": 1.8411, + "step": 27683500 + }, + { + "epoch": 80.13, + "learning_rate": 9.94747041728418e-06, + "loss": 1.8393, + "step": 27684000 + }, + { + "epoch": 80.14, + "learning_rate": 9.946746769636902e-06, + "loss": 1.8126, + "step": 27684500 + }, + { + "epoch": 80.14, + "learning_rate": 9.94602456928492e-06, + "loss": 1.8354, + "step": 27685000 + }, + { + "epoch": 80.14, + "learning_rate": 9.945302368932939e-06, + "loss": 1.8283, + "step": 27685500 + }, + { + "epoch": 80.14, + "learning_rate": 9.944578721285663e-06, + "loss": 1.8531, + "step": 27686000 + }, + { + "epoch": 80.14, + "learning_rate": 9.943855073638385e-06, + "loss": 1.838, + "step": 27686500 + }, + { + "epoch": 80.14, + "learning_rate": 9.943131425991107e-06, + "loss": 1.8059, + "step": 27687000 + }, + { + "epoch": 80.14, + "learning_rate": 9.942407778343833e-06, + "loss": 1.8481, + "step": 27687500 + }, + { + "epoch": 80.15, + "learning_rate": 9.941684130696555e-06, + "loss": 1.8286, + "step": 27688000 + }, + { + "epoch": 80.15, + "learning_rate": 9.940961930344572e-06, + "loss": 1.8287, + "step": 27688500 + }, + { + "epoch": 80.15, + "learning_rate": 9.940238282697296e-06, + "loss": 1.8459, + "step": 27689000 + }, + { + "epoch": 80.15, + "learning_rate": 9.93951463505002e-06, + "loss": 1.8324, + "step": 27689500 + }, + { + "epoch": 80.15, + "learning_rate": 9.938790987402742e-06, + "loss": 1.8388, + "step": 27690000 + }, + { + "epoch": 80.15, + "learning_rate": 9.938067339755464e-06, + "loss": 1.8392, + "step": 27690500 + }, + { + "epoch": 80.15, + "learning_rate": 9.937343692108188e-06, + "loss": 1.8476, + "step": 27691000 + }, + { + "epoch": 80.16, + "learning_rate": 9.936620044460912e-06, + "loss": 1.8404, + "step": 27691500 + }, + { + "epoch": 80.16, + "learning_rate": 9.935896396813635e-06, + "loss": 1.848, + "step": 27692000 + }, + { + "epoch": 80.16, + "learning_rate": 9.935172749166358e-06, + "loss": 1.8525, + "step": 27692500 + }, + { + "epoch": 80.16, + "learning_rate": 9.934449101519082e-06, + "loss": 1.8608, + "step": 27693000 + }, + { + "epoch": 80.16, + "learning_rate": 9.933725453871805e-06, + "loss": 1.8352, + "step": 27693500 + }, + { + "epoch": 80.16, + "learning_rate": 9.933003253519822e-06, + "loss": 1.8317, + "step": 27694000 + }, + { + "epoch": 80.16, + "learning_rate": 9.932279605872546e-06, + "loss": 1.8476, + "step": 27694500 + }, + { + "epoch": 80.17, + "learning_rate": 9.93155595822527e-06, + "loss": 1.8491, + "step": 27695000 + }, + { + "epoch": 80.17, + "learning_rate": 9.930832310577992e-06, + "loss": 1.8512, + "step": 27695500 + }, + { + "epoch": 80.17, + "learning_rate": 9.93011011022601e-06, + "loss": 1.8225, + "step": 27696000 + }, + { + "epoch": 80.17, + "learning_rate": 9.929387909874026e-06, + "loss": 1.8126, + "step": 27696500 + }, + { + "epoch": 80.17, + "learning_rate": 9.928664262226752e-06, + "loss": 1.8645, + "step": 27697000 + }, + { + "epoch": 80.17, + "learning_rate": 9.927940614579474e-06, + "loss": 1.836, + "step": 27697500 + }, + { + "epoch": 80.17, + "learning_rate": 9.927216966932197e-06, + "loss": 1.8289, + "step": 27698000 + }, + { + "epoch": 80.18, + "learning_rate": 9.926494766580215e-06, + "loss": 1.8454, + "step": 27698500 + }, + { + "epoch": 80.18, + "learning_rate": 9.92577111893294e-06, + "loss": 1.8273, + "step": 27699000 + }, + { + "epoch": 80.18, + "learning_rate": 9.925047471285662e-06, + "loss": 1.8465, + "step": 27699500 + }, + { + "epoch": 80.18, + "learning_rate": 9.924323823638384e-06, + "loss": 1.8584, + "step": 27700000 + }, + { + "epoch": 80.18, + "learning_rate": 9.92360017599111e-06, + "loss": 1.8345, + "step": 27700500 + }, + { + "epoch": 80.18, + "learning_rate": 9.922876528343832e-06, + "loss": 1.848, + "step": 27701000 + }, + { + "epoch": 80.18, + "learning_rate": 9.922152880696554e-06, + "loss": 1.8364, + "step": 27701500 + }, + { + "epoch": 80.19, + "learning_rate": 9.921430680344571e-06, + "loss": 1.8502, + "step": 27702000 + }, + { + "epoch": 80.19, + "learning_rate": 9.920707032697297e-06, + "loss": 1.8316, + "step": 27702500 + }, + { + "epoch": 80.19, + "learning_rate": 9.919983385050019e-06, + "loss": 1.8334, + "step": 27703000 + }, + { + "epoch": 80.19, + "learning_rate": 9.919259737402741e-06, + "loss": 1.8236, + "step": 27703500 + }, + { + "epoch": 80.19, + "learning_rate": 9.918536089755465e-06, + "loss": 1.8082, + "step": 27704000 + }, + { + "epoch": 80.19, + "learning_rate": 9.91781244210819e-06, + "loss": 1.8742, + "step": 27704500 + }, + { + "epoch": 80.19, + "learning_rate": 9.917088794460911e-06, + "loss": 1.8607, + "step": 27705000 + }, + { + "epoch": 80.2, + "learning_rate": 9.916365146813635e-06, + "loss": 1.8531, + "step": 27705500 + }, + { + "epoch": 80.2, + "learning_rate": 9.91564149916636e-06, + "loss": 1.8238, + "step": 27706000 + }, + { + "epoch": 80.2, + "learning_rate": 9.914917851519081e-06, + "loss": 1.8489, + "step": 27706500 + }, + { + "epoch": 80.2, + "learning_rate": 9.914197098462394e-06, + "loss": 1.8319, + "step": 27707000 + }, + { + "epoch": 80.2, + "learning_rate": 9.913473450815116e-06, + "loss": 1.8456, + "step": 27707500 + }, + { + "epoch": 80.2, + "learning_rate": 9.912751250463135e-06, + "loss": 1.8179, + "step": 27708000 + }, + { + "epoch": 80.2, + "learning_rate": 9.912027602815859e-06, + "loss": 1.8676, + "step": 27708500 + }, + { + "epoch": 80.21, + "learning_rate": 9.911303955168581e-06, + "loss": 1.8349, + "step": 27709000 + }, + { + "epoch": 80.21, + "learning_rate": 9.910580307521303e-06, + "loss": 1.8276, + "step": 27709500 + }, + { + "epoch": 80.21, + "learning_rate": 9.909856659874029e-06, + "loss": 1.842, + "step": 27710000 + }, + { + "epoch": 80.21, + "learning_rate": 9.909133012226751e-06, + "loss": 1.8157, + "step": 27710500 + }, + { + "epoch": 80.21, + "learning_rate": 9.908409364579473e-06, + "loss": 1.8286, + "step": 27711000 + }, + { + "epoch": 80.21, + "learning_rate": 9.907685716932199e-06, + "loss": 1.8276, + "step": 27711500 + }, + { + "epoch": 80.21, + "learning_rate": 9.906962069284921e-06, + "loss": 1.8279, + "step": 27712000 + }, + { + "epoch": 80.22, + "learning_rate": 9.906238421637643e-06, + "loss": 1.8344, + "step": 27712500 + }, + { + "epoch": 80.22, + "learning_rate": 9.905514773990367e-06, + "loss": 1.8435, + "step": 27713000 + }, + { + "epoch": 80.22, + "learning_rate": 9.904792573638386e-06, + "loss": 1.8341, + "step": 27713500 + }, + { + "epoch": 80.22, + "learning_rate": 9.904068925991109e-06, + "loss": 1.8589, + "step": 27714000 + }, + { + "epoch": 80.22, + "learning_rate": 9.90334527834383e-06, + "loss": 1.8543, + "step": 27714500 + }, + { + "epoch": 80.22, + "learning_rate": 9.902621630696555e-06, + "loss": 1.8243, + "step": 27715000 + }, + { + "epoch": 80.23, + "learning_rate": 9.901897983049279e-06, + "loss": 1.833, + "step": 27715500 + }, + { + "epoch": 80.23, + "learning_rate": 9.901175782697296e-06, + "loss": 1.8207, + "step": 27716000 + }, + { + "epoch": 80.23, + "learning_rate": 9.900453582345313e-06, + "loss": 1.8528, + "step": 27716500 + }, + { + "epoch": 80.23, + "learning_rate": 9.899729934698037e-06, + "loss": 1.8492, + "step": 27717000 + }, + { + "epoch": 80.23, + "learning_rate": 9.899006287050761e-06, + "loss": 1.8176, + "step": 27717500 + }, + { + "epoch": 80.23, + "learning_rate": 9.898282639403483e-06, + "loss": 1.8301, + "step": 27718000 + }, + { + "epoch": 80.23, + "learning_rate": 9.897558991756206e-06, + "loss": 1.8282, + "step": 27718500 + }, + { + "epoch": 80.24, + "learning_rate": 9.896835344108931e-06, + "loss": 1.8508, + "step": 27719000 + }, + { + "epoch": 80.24, + "learning_rate": 9.896111696461653e-06, + "loss": 1.8552, + "step": 27719500 + }, + { + "epoch": 80.24, + "learning_rate": 9.895388048814376e-06, + "loss": 1.8319, + "step": 27720000 + }, + { + "epoch": 80.24, + "learning_rate": 9.8946644011671e-06, + "loss": 1.8362, + "step": 27720500 + }, + { + "epoch": 80.24, + "learning_rate": 9.893940753519823e-06, + "loss": 1.8694, + "step": 27721000 + }, + { + "epoch": 80.24, + "learning_rate": 9.893217105872546e-06, + "loss": 1.8572, + "step": 27721500 + }, + { + "epoch": 80.24, + "learning_rate": 9.892493458225268e-06, + "loss": 1.8486, + "step": 27722000 + }, + { + "epoch": 80.25, + "learning_rate": 9.891771257873287e-06, + "loss": 1.8383, + "step": 27722500 + }, + { + "epoch": 80.25, + "learning_rate": 9.89104761022601e-06, + "loss": 1.8415, + "step": 27723000 + }, + { + "epoch": 80.25, + "learning_rate": 9.890323962578733e-06, + "loss": 1.8146, + "step": 27723500 + }, + { + "epoch": 80.25, + "learning_rate": 9.889600314931457e-06, + "loss": 1.8331, + "step": 27724000 + }, + { + "epoch": 80.25, + "learning_rate": 9.888876667284181e-06, + "loss": 1.8371, + "step": 27724500 + }, + { + "epoch": 80.25, + "learning_rate": 9.888154466932198e-06, + "loss": 1.8412, + "step": 27725000 + }, + { + "epoch": 80.25, + "learning_rate": 9.887432266580215e-06, + "loss": 1.8402, + "step": 27725500 + }, + { + "epoch": 80.26, + "learning_rate": 9.886708618932938e-06, + "loss": 1.8432, + "step": 27726000 + }, + { + "epoch": 80.26, + "learning_rate": 9.885984971285662e-06, + "loss": 1.8525, + "step": 27726500 + }, + { + "epoch": 80.26, + "learning_rate": 9.885261323638385e-06, + "loss": 1.8552, + "step": 27727000 + }, + { + "epoch": 80.26, + "learning_rate": 9.884537675991108e-06, + "loss": 1.8454, + "step": 27727500 + }, + { + "epoch": 80.26, + "learning_rate": 9.883814028343832e-06, + "loss": 1.8522, + "step": 27728000 + }, + { + "epoch": 80.26, + "learning_rate": 9.883090380696556e-06, + "loss": 1.8556, + "step": 27728500 + }, + { + "epoch": 80.26, + "learning_rate": 9.882366733049278e-06, + "loss": 1.8425, + "step": 27729000 + }, + { + "epoch": 80.27, + "learning_rate": 9.881643085402002e-06, + "loss": 1.8569, + "step": 27729500 + }, + { + "epoch": 80.27, + "learning_rate": 9.880919437754726e-06, + "loss": 1.8493, + "step": 27730000 + }, + { + "epoch": 80.27, + "learning_rate": 9.880195790107448e-06, + "loss": 1.8319, + "step": 27730500 + }, + { + "epoch": 80.27, + "learning_rate": 9.87947214246017e-06, + "loss": 1.8534, + "step": 27731000 + }, + { + "epoch": 80.27, + "learning_rate": 9.878748494812894e-06, + "loss": 1.8218, + "step": 27731500 + }, + { + "epoch": 80.27, + "learning_rate": 9.878024847165618e-06, + "loss": 1.8522, + "step": 27732000 + }, + { + "epoch": 80.27, + "learning_rate": 9.877302646813635e-06, + "loss": 1.8305, + "step": 27732500 + }, + { + "epoch": 80.28, + "learning_rate": 9.876578999166357e-06, + "loss": 1.8361, + "step": 27733000 + }, + { + "epoch": 80.28, + "learning_rate": 9.875856798814376e-06, + "loss": 1.8653, + "step": 27733500 + }, + { + "epoch": 80.28, + "learning_rate": 9.875134598462394e-06, + "loss": 1.8277, + "step": 27734000 + }, + { + "epoch": 80.28, + "learning_rate": 9.874410950815118e-06, + "loss": 1.8207, + "step": 27734500 + }, + { + "epoch": 80.28, + "learning_rate": 9.87368730316784e-06, + "loss": 1.848, + "step": 27735000 + }, + { + "epoch": 80.28, + "learning_rate": 9.872963655520564e-06, + "loss": 1.8562, + "step": 27735500 + }, + { + "epoch": 80.28, + "learning_rate": 9.872240007873288e-06, + "loss": 1.8197, + "step": 27736000 + }, + { + "epoch": 80.29, + "learning_rate": 9.87151636022601e-06, + "loss": 1.838, + "step": 27736500 + }, + { + "epoch": 80.29, + "learning_rate": 9.870792712578734e-06, + "loss": 1.817, + "step": 27737000 + }, + { + "epoch": 80.29, + "learning_rate": 9.870069064931456e-06, + "loss": 1.8602, + "step": 27737500 + }, + { + "epoch": 80.29, + "learning_rate": 9.86934541728418e-06, + "loss": 1.8545, + "step": 27738000 + }, + { + "epoch": 80.29, + "learning_rate": 9.868623216932197e-06, + "loss": 1.8344, + "step": 27738500 + }, + { + "epoch": 80.29, + "learning_rate": 9.867899569284921e-06, + "loss": 1.8583, + "step": 27739000 + }, + { + "epoch": 80.29, + "learning_rate": 9.867175921637645e-06, + "loss": 1.8368, + "step": 27739500 + }, + { + "epoch": 80.3, + "learning_rate": 9.866452273990367e-06, + "loss": 1.8144, + "step": 27740000 + }, + { + "epoch": 80.3, + "learning_rate": 9.86572862634309e-06, + "loss": 1.8418, + "step": 27740500 + }, + { + "epoch": 80.3, + "learning_rate": 9.865004978695813e-06, + "loss": 1.8499, + "step": 27741000 + }, + { + "epoch": 80.3, + "learning_rate": 9.864281331048537e-06, + "loss": 1.8573, + "step": 27741500 + }, + { + "epoch": 80.3, + "learning_rate": 9.86355768340126e-06, + "loss": 1.8552, + "step": 27742000 + }, + { + "epoch": 80.3, + "learning_rate": 9.862835483049279e-06, + "loss": 1.8493, + "step": 27742500 + }, + { + "epoch": 80.3, + "learning_rate": 9.862111835402e-06, + "loss": 1.8315, + "step": 27743000 + }, + { + "epoch": 80.31, + "learning_rate": 9.861388187754725e-06, + "loss": 1.832, + "step": 27743500 + }, + { + "epoch": 80.31, + "learning_rate": 9.860664540107447e-06, + "loss": 1.8466, + "step": 27744000 + }, + { + "epoch": 80.31, + "learning_rate": 9.859940892460171e-06, + "loss": 1.8625, + "step": 27744500 + }, + { + "epoch": 80.31, + "learning_rate": 9.859218692108188e-06, + "loss": 1.8634, + "step": 27745000 + }, + { + "epoch": 80.31, + "learning_rate": 9.858495044460912e-06, + "loss": 1.865, + "step": 27745500 + }, + { + "epoch": 80.31, + "learning_rate": 9.857771396813634e-06, + "loss": 1.8415, + "step": 27746000 + }, + { + "epoch": 80.31, + "learning_rate": 9.857047749166358e-06, + "loss": 1.834, + "step": 27746500 + }, + { + "epoch": 80.32, + "learning_rate": 9.856325548814375e-06, + "loss": 1.8384, + "step": 27747000 + }, + { + "epoch": 80.32, + "learning_rate": 9.8556019011671e-06, + "loss": 1.8221, + "step": 27747500 + }, + { + "epoch": 80.32, + "learning_rate": 9.854878253519823e-06, + "loss": 1.8288, + "step": 27748000 + }, + { + "epoch": 80.32, + "learning_rate": 9.854154605872546e-06, + "loss": 1.8634, + "step": 27748500 + }, + { + "epoch": 80.32, + "learning_rate": 9.85343095822527e-06, + "loss": 1.8581, + "step": 27749000 + }, + { + "epoch": 80.32, + "learning_rate": 9.852707310577992e-06, + "loss": 1.825, + "step": 27749500 + }, + { + "epoch": 80.32, + "learning_rate": 9.85198511022601e-06, + "loss": 1.8421, + "step": 27750000 + }, + { + "epoch": 80.33, + "learning_rate": 9.851261462578733e-06, + "loss": 1.8254, + "step": 27750500 + }, + { + "epoch": 80.33, + "learning_rate": 9.850537814931457e-06, + "loss": 1.8395, + "step": 27751000 + }, + { + "epoch": 80.33, + "learning_rate": 9.849814167284179e-06, + "loss": 1.8505, + "step": 27751500 + }, + { + "epoch": 80.33, + "learning_rate": 9.849090519636903e-06, + "loss": 1.8581, + "step": 27752000 + }, + { + "epoch": 80.33, + "learning_rate": 9.848366871989627e-06, + "loss": 1.8245, + "step": 27752500 + }, + { + "epoch": 80.33, + "learning_rate": 9.847644671637644e-06, + "loss": 1.8591, + "step": 27753000 + }, + { + "epoch": 80.34, + "learning_rate": 9.846921023990366e-06, + "loss": 1.8287, + "step": 27753500 + }, + { + "epoch": 80.34, + "learning_rate": 9.84619737634309e-06, + "loss": 1.8353, + "step": 27754000 + }, + { + "epoch": 80.34, + "learning_rate": 9.845475175991108e-06, + "loss": 1.848, + "step": 27754500 + }, + { + "epoch": 80.34, + "learning_rate": 9.844751528343832e-06, + "loss": 1.8321, + "step": 27755000 + }, + { + "epoch": 80.34, + "learning_rate": 9.844027880696555e-06, + "loss": 1.824, + "step": 27755500 + }, + { + "epoch": 80.34, + "learning_rate": 9.843304233049278e-06, + "loss": 1.8427, + "step": 27756000 + }, + { + "epoch": 80.34, + "learning_rate": 9.842580585402002e-06, + "loss": 1.8296, + "step": 27756500 + }, + { + "epoch": 80.35, + "learning_rate": 9.841858385050019e-06, + "loss": 1.8471, + "step": 27757000 + }, + { + "epoch": 80.35, + "learning_rate": 9.841136184698036e-06, + "loss": 1.8508, + "step": 27757500 + }, + { + "epoch": 80.35, + "learning_rate": 9.84041253705076e-06, + "loss": 1.808, + "step": 27758000 + }, + { + "epoch": 80.35, + "learning_rate": 9.839690336698777e-06, + "loss": 1.8495, + "step": 27758500 + }, + { + "epoch": 80.35, + "learning_rate": 9.838966689051501e-06, + "loss": 1.8316, + "step": 27759000 + }, + { + "epoch": 80.35, + "learning_rate": 9.838243041404223e-06, + "loss": 1.8486, + "step": 27759500 + }, + { + "epoch": 80.35, + "learning_rate": 9.837519393756947e-06, + "loss": 1.8566, + "step": 27760000 + }, + { + "epoch": 80.36, + "learning_rate": 9.836795746109671e-06, + "loss": 1.829, + "step": 27760500 + }, + { + "epoch": 80.36, + "learning_rate": 9.836072098462394e-06, + "loss": 1.8525, + "step": 27761000 + }, + { + "epoch": 80.36, + "learning_rate": 9.835348450815117e-06, + "loss": 1.8342, + "step": 27761500 + }, + { + "epoch": 80.36, + "learning_rate": 9.83462480316784e-06, + "loss": 1.8395, + "step": 27762000 + }, + { + "epoch": 80.36, + "learning_rate": 9.833901155520564e-06, + "loss": 1.8469, + "step": 27762500 + }, + { + "epoch": 80.36, + "learning_rate": 9.833177507873288e-06, + "loss": 1.8406, + "step": 27763000 + }, + { + "epoch": 80.36, + "learning_rate": 9.83245386022601e-06, + "loss": 1.8413, + "step": 27763500 + }, + { + "epoch": 80.37, + "learning_rate": 9.831730212578734e-06, + "loss": 1.8365, + "step": 27764000 + }, + { + "epoch": 80.37, + "learning_rate": 9.831006564931456e-06, + "loss": 1.8251, + "step": 27764500 + }, + { + "epoch": 80.37, + "learning_rate": 9.83028291728418e-06, + "loss": 1.8527, + "step": 27765000 + }, + { + "epoch": 80.37, + "learning_rate": 9.829559269636902e-06, + "loss": 1.8434, + "step": 27765500 + }, + { + "epoch": 80.37, + "learning_rate": 9.828835621989626e-06, + "loss": 1.8452, + "step": 27766000 + }, + { + "epoch": 80.37, + "learning_rate": 9.828113421637645e-06, + "loss": 1.8441, + "step": 27766500 + }, + { + "epoch": 80.37, + "learning_rate": 9.827389773990367e-06, + "loss": 1.8945, + "step": 27767000 + }, + { + "epoch": 80.38, + "learning_rate": 9.826666126343091e-06, + "loss": 1.8237, + "step": 27767500 + }, + { + "epoch": 80.38, + "learning_rate": 9.825942478695813e-06, + "loss": 1.8551, + "step": 27768000 + }, + { + "epoch": 80.38, + "learning_rate": 9.825218831048537e-06, + "loss": 1.8562, + "step": 27768500 + }, + { + "epoch": 80.38, + "learning_rate": 9.82449518340126e-06, + "loss": 1.8369, + "step": 27769000 + }, + { + "epoch": 80.38, + "learning_rate": 9.823771535753983e-06, + "loss": 1.8473, + "step": 27769500 + }, + { + "epoch": 80.38, + "learning_rate": 9.823047888106707e-06, + "loss": 1.8479, + "step": 27770000 + }, + { + "epoch": 80.38, + "learning_rate": 9.822325687754725e-06, + "loss": 1.8459, + "step": 27770500 + }, + { + "epoch": 80.39, + "learning_rate": 9.821602040107447e-06, + "loss": 1.8475, + "step": 27771000 + }, + { + "epoch": 80.39, + "learning_rate": 9.82087839246017e-06, + "loss": 1.8527, + "step": 27771500 + }, + { + "epoch": 80.39, + "learning_rate": 9.820154744812895e-06, + "loss": 1.8347, + "step": 27772000 + }, + { + "epoch": 80.39, + "learning_rate": 9.819431097165617e-06, + "loss": 1.8381, + "step": 27772500 + }, + { + "epoch": 80.39, + "learning_rate": 9.818707449518341e-06, + "loss": 1.8644, + "step": 27773000 + }, + { + "epoch": 80.39, + "learning_rate": 9.817983801871065e-06, + "loss": 1.8709, + "step": 27773500 + }, + { + "epoch": 80.39, + "learning_rate": 9.817261601519082e-06, + "loss": 1.8426, + "step": 27774000 + }, + { + "epoch": 80.4, + "learning_rate": 9.816537953871804e-06, + "loss": 1.8635, + "step": 27774500 + }, + { + "epoch": 80.4, + "learning_rate": 9.815814306224528e-06, + "loss": 1.8244, + "step": 27775000 + }, + { + "epoch": 80.4, + "learning_rate": 9.815092105872545e-06, + "loss": 1.8319, + "step": 27775500 + }, + { + "epoch": 80.4, + "learning_rate": 9.81436845822527e-06, + "loss": 1.8683, + "step": 27776000 + }, + { + "epoch": 80.4, + "learning_rate": 9.813644810577992e-06, + "loss": 1.8195, + "step": 27776500 + }, + { + "epoch": 80.4, + "learning_rate": 9.812921162930716e-06, + "loss": 1.8611, + "step": 27777000 + }, + { + "epoch": 80.4, + "learning_rate": 9.81219751528344e-06, + "loss": 1.8574, + "step": 27777500 + }, + { + "epoch": 80.41, + "learning_rate": 9.811473867636162e-06, + "loss": 1.8549, + "step": 27778000 + }, + { + "epoch": 80.41, + "learning_rate": 9.810750219988884e-06, + "loss": 1.8376, + "step": 27778500 + }, + { + "epoch": 80.41, + "learning_rate": 9.81002657234161e-06, + "loss": 1.8269, + "step": 27779000 + }, + { + "epoch": 80.41, + "learning_rate": 9.809304371989627e-06, + "loss": 1.8703, + "step": 27779500 + }, + { + "epoch": 80.41, + "learning_rate": 9.808580724342349e-06, + "loss": 1.8423, + "step": 27780000 + }, + { + "epoch": 80.41, + "learning_rate": 9.807857076695073e-06, + "loss": 1.8409, + "step": 27780500 + }, + { + "epoch": 80.41, + "learning_rate": 9.807133429047797e-06, + "loss": 1.8481, + "step": 27781000 + }, + { + "epoch": 80.42, + "learning_rate": 9.80640978140052e-06, + "loss": 1.8414, + "step": 27781500 + }, + { + "epoch": 80.42, + "learning_rate": 9.805686133753241e-06, + "loss": 1.8321, + "step": 27782000 + }, + { + "epoch": 80.42, + "learning_rate": 9.80496393340126e-06, + "loss": 1.8099, + "step": 27782500 + }, + { + "epoch": 80.42, + "learning_rate": 9.804241733049278e-06, + "loss": 1.8315, + "step": 27783000 + }, + { + "epoch": 80.42, + "learning_rate": 9.803518085402002e-06, + "loss": 1.8324, + "step": 27783500 + }, + { + "epoch": 80.42, + "learning_rate": 9.802794437754724e-06, + "loss": 1.8374, + "step": 27784000 + }, + { + "epoch": 80.42, + "learning_rate": 9.802070790107448e-06, + "loss": 1.8385, + "step": 27784500 + }, + { + "epoch": 80.43, + "learning_rate": 9.801347142460172e-06, + "loss": 1.8435, + "step": 27785000 + }, + { + "epoch": 80.43, + "learning_rate": 9.800623494812894e-06, + "loss": 1.8505, + "step": 27785500 + }, + { + "epoch": 80.43, + "learning_rate": 9.799899847165616e-06, + "loss": 1.8556, + "step": 27786000 + }, + { + "epoch": 80.43, + "learning_rate": 9.799176199518342e-06, + "loss": 1.8646, + "step": 27786500 + }, + { + "epoch": 80.43, + "learning_rate": 9.798452551871064e-06, + "loss": 1.8454, + "step": 27787000 + }, + { + "epoch": 80.43, + "learning_rate": 9.797728904223786e-06, + "loss": 1.856, + "step": 27787500 + }, + { + "epoch": 80.43, + "learning_rate": 9.79700525657651e-06, + "loss": 1.8189, + "step": 27788000 + }, + { + "epoch": 80.44, + "learning_rate": 9.796283056224529e-06, + "loss": 1.849, + "step": 27788500 + }, + { + "epoch": 80.44, + "learning_rate": 9.795559408577251e-06, + "loss": 1.8597, + "step": 27789000 + }, + { + "epoch": 80.44, + "learning_rate": 9.794835760929973e-06, + "loss": 1.8216, + "step": 27789500 + }, + { + "epoch": 80.44, + "learning_rate": 9.794112113282697e-06, + "loss": 1.8375, + "step": 27790000 + }, + { + "epoch": 80.44, + "learning_rate": 9.793388465635421e-06, + "loss": 1.8473, + "step": 27790500 + }, + { + "epoch": 80.44, + "learning_rate": 9.792664817988144e-06, + "loss": 1.8717, + "step": 27791000 + }, + { + "epoch": 80.45, + "learning_rate": 9.79194261763616e-06, + "loss": 1.8526, + "step": 27791500 + }, + { + "epoch": 80.45, + "learning_rate": 9.791218969988886e-06, + "loss": 1.8298, + "step": 27792000 + }, + { + "epoch": 80.45, + "learning_rate": 9.790495322341609e-06, + "loss": 1.8561, + "step": 27792500 + }, + { + "epoch": 80.45, + "learning_rate": 9.789771674694331e-06, + "loss": 1.8603, + "step": 27793000 + }, + { + "epoch": 80.45, + "learning_rate": 9.789049474342348e-06, + "loss": 1.8815, + "step": 27793500 + }, + { + "epoch": 80.45, + "learning_rate": 9.788325826695074e-06, + "loss": 1.8288, + "step": 27794000 + }, + { + "epoch": 80.45, + "learning_rate": 9.787602179047796e-06, + "loss": 1.8078, + "step": 27794500 + }, + { + "epoch": 80.46, + "learning_rate": 9.786878531400518e-06, + "loss": 1.857, + "step": 27795000 + }, + { + "epoch": 80.46, + "learning_rate": 9.786156331048536e-06, + "loss": 1.8389, + "step": 27795500 + }, + { + "epoch": 80.46, + "learning_rate": 9.785432683401261e-06, + "loss": 1.8533, + "step": 27796000 + }, + { + "epoch": 80.46, + "learning_rate": 9.784709035753983e-06, + "loss": 1.8528, + "step": 27796500 + }, + { + "epoch": 80.46, + "learning_rate": 9.783985388106706e-06, + "loss": 1.8518, + "step": 27797000 + }, + { + "epoch": 80.46, + "learning_rate": 9.783261740459431e-06, + "loss": 1.846, + "step": 27797500 + }, + { + "epoch": 80.46, + "learning_rate": 9.782539540107448e-06, + "loss": 1.825, + "step": 27798000 + }, + { + "epoch": 80.47, + "learning_rate": 9.781817339755466e-06, + "loss": 1.831, + "step": 27798500 + }, + { + "epoch": 80.47, + "learning_rate": 9.781093692108188e-06, + "loss": 1.8337, + "step": 27799000 + }, + { + "epoch": 80.47, + "learning_rate": 9.780370044460912e-06, + "loss": 1.8391, + "step": 27799500 + }, + { + "epoch": 80.47, + "learning_rate": 9.779646396813636e-06, + "loss": 1.8564, + "step": 27800000 + }, + { + "epoch": 80.47, + "learning_rate": 9.778922749166358e-06, + "loss": 1.8565, + "step": 27800500 + }, + { + "epoch": 80.47, + "learning_rate": 9.77819910151908e-06, + "loss": 1.8277, + "step": 27801000 + }, + { + "epoch": 80.47, + "learning_rate": 9.777475453871806e-06, + "loss": 1.8732, + "step": 27801500 + }, + { + "epoch": 80.48, + "learning_rate": 9.776751806224528e-06, + "loss": 1.8395, + "step": 27802000 + }, + { + "epoch": 80.48, + "learning_rate": 9.77602815857725e-06, + "loss": 1.8371, + "step": 27802500 + }, + { + "epoch": 80.48, + "learning_rate": 9.775304510929974e-06, + "loss": 1.8393, + "step": 27803000 + }, + { + "epoch": 80.48, + "learning_rate": 9.774580863282698e-06, + "loss": 1.8429, + "step": 27803500 + }, + { + "epoch": 80.48, + "learning_rate": 9.77385721563542e-06, + "loss": 1.814, + "step": 27804000 + }, + { + "epoch": 80.48, + "learning_rate": 9.773135015283438e-06, + "loss": 1.8395, + "step": 27804500 + }, + { + "epoch": 80.48, + "learning_rate": 9.772411367636163e-06, + "loss": 1.8544, + "step": 27805000 + }, + { + "epoch": 80.49, + "learning_rate": 9.771687719988886e-06, + "loss": 1.862, + "step": 27805500 + }, + { + "epoch": 80.49, + "learning_rate": 9.770964072341608e-06, + "loss": 1.8161, + "step": 27806000 + }, + { + "epoch": 80.49, + "learning_rate": 9.770241871989625e-06, + "loss": 1.8623, + "step": 27806500 + }, + { + "epoch": 80.49, + "learning_rate": 9.76951822434235e-06, + "loss": 1.8479, + "step": 27807000 + }, + { + "epoch": 80.49, + "learning_rate": 9.768794576695073e-06, + "loss": 1.8398, + "step": 27807500 + }, + { + "epoch": 80.49, + "learning_rate": 9.768070929047795e-06, + "loss": 1.8276, + "step": 27808000 + }, + { + "epoch": 80.49, + "learning_rate": 9.767347281400519e-06, + "loss": 1.8601, + "step": 27808500 + }, + { + "epoch": 80.5, + "learning_rate": 9.766625081048538e-06, + "loss": 1.8547, + "step": 27809000 + }, + { + "epoch": 80.5, + "learning_rate": 9.76590143340126e-06, + "loss": 1.8279, + "step": 27809500 + }, + { + "epoch": 80.5, + "learning_rate": 9.765177785753982e-06, + "loss": 1.8481, + "step": 27810000 + }, + { + "epoch": 80.5, + "learning_rate": 9.764454138106708e-06, + "loss": 1.8384, + "step": 27810500 + }, + { + "epoch": 80.5, + "learning_rate": 9.76373049045943e-06, + "loss": 1.8367, + "step": 27811000 + }, + { + "epoch": 80.5, + "learning_rate": 9.763006842812153e-06, + "loss": 1.8433, + "step": 27811500 + }, + { + "epoch": 80.5, + "learning_rate": 9.762283195164876e-06, + "loss": 1.8387, + "step": 27812000 + }, + { + "epoch": 80.51, + "learning_rate": 9.7615595475176e-06, + "loss": 1.8479, + "step": 27812500 + }, + { + "epoch": 80.51, + "learning_rate": 9.760837347165618e-06, + "loss": 1.8372, + "step": 27813000 + }, + { + "epoch": 80.51, + "learning_rate": 9.76011369951834e-06, + "loss": 1.8609, + "step": 27813500 + }, + { + "epoch": 80.51, + "learning_rate": 9.759391499166357e-06, + "loss": 1.8423, + "step": 27814000 + }, + { + "epoch": 80.51, + "learning_rate": 9.758667851519083e-06, + "loss": 1.848, + "step": 27814500 + }, + { + "epoch": 80.51, + "learning_rate": 9.757944203871805e-06, + "loss": 1.8335, + "step": 27815000 + }, + { + "epoch": 80.51, + "learning_rate": 9.757220556224527e-06, + "loss": 1.8353, + "step": 27815500 + }, + { + "epoch": 80.52, + "learning_rate": 9.756496908577251e-06, + "loss": 1.805, + "step": 27816000 + }, + { + "epoch": 80.52, + "learning_rate": 9.755773260929975e-06, + "loss": 1.8468, + "step": 27816500 + }, + { + "epoch": 80.52, + "learning_rate": 9.755049613282697e-06, + "loss": 1.8761, + "step": 27817000 + }, + { + "epoch": 80.52, + "learning_rate": 9.754325965635421e-06, + "loss": 1.8345, + "step": 27817500 + }, + { + "epoch": 80.52, + "learning_rate": 9.753602317988145e-06, + "loss": 1.8353, + "step": 27818000 + }, + { + "epoch": 80.52, + "learning_rate": 9.752880117636162e-06, + "loss": 1.861, + "step": 27818500 + }, + { + "epoch": 80.52, + "learning_rate": 9.752156469988885e-06, + "loss": 1.8225, + "step": 27819000 + }, + { + "epoch": 80.53, + "learning_rate": 9.751432822341609e-06, + "loss": 1.8393, + "step": 27819500 + }, + { + "epoch": 80.53, + "learning_rate": 9.750709174694333e-06, + "loss": 1.8608, + "step": 27820000 + }, + { + "epoch": 80.53, + "learning_rate": 9.74998697434235e-06, + "loss": 1.8313, + "step": 27820500 + }, + { + "epoch": 80.53, + "learning_rate": 9.749263326695072e-06, + "loss": 1.8435, + "step": 27821000 + }, + { + "epoch": 80.53, + "learning_rate": 9.74854112634309e-06, + "loss": 1.8378, + "step": 27821500 + }, + { + "epoch": 80.53, + "learning_rate": 9.747817478695815e-06, + "loss": 1.8375, + "step": 27822000 + }, + { + "epoch": 80.53, + "learning_rate": 9.747093831048537e-06, + "loss": 1.8321, + "step": 27822500 + }, + { + "epoch": 80.54, + "learning_rate": 9.74637018340126e-06, + "loss": 1.8491, + "step": 27823000 + }, + { + "epoch": 80.54, + "learning_rate": 9.745646535753983e-06, + "loss": 1.8582, + "step": 27823500 + }, + { + "epoch": 80.54, + "learning_rate": 9.744924335402002e-06, + "loss": 1.8377, + "step": 27824000 + }, + { + "epoch": 80.54, + "learning_rate": 9.744200687754724e-06, + "loss": 1.8516, + "step": 27824500 + }, + { + "epoch": 80.54, + "learning_rate": 9.743477040107447e-06, + "loss": 1.8329, + "step": 27825000 + }, + { + "epoch": 80.54, + "learning_rate": 9.74275339246017e-06, + "loss": 1.8349, + "step": 27825500 + }, + { + "epoch": 80.54, + "learning_rate": 9.742029744812895e-06, + "loss": 1.859, + "step": 27826000 + }, + { + "epoch": 80.55, + "learning_rate": 9.741307544460912e-06, + "loss": 1.8631, + "step": 27826500 + }, + { + "epoch": 80.55, + "learning_rate": 9.740583896813634e-06, + "loss": 1.8315, + "step": 27827000 + }, + { + "epoch": 80.55, + "learning_rate": 9.73986024916636e-06, + "loss": 1.8301, + "step": 27827500 + }, + { + "epoch": 80.55, + "learning_rate": 9.739136601519082e-06, + "loss": 1.8355, + "step": 27828000 + }, + { + "epoch": 80.55, + "learning_rate": 9.738412953871804e-06, + "loss": 1.8445, + "step": 27828500 + }, + { + "epoch": 80.55, + "learning_rate": 9.737689306224528e-06, + "loss": 1.832, + "step": 27829000 + }, + { + "epoch": 80.56, + "learning_rate": 9.736965658577252e-06, + "loss": 1.863, + "step": 27829500 + }, + { + "epoch": 80.56, + "learning_rate": 9.736242010929974e-06, + "loss": 1.8662, + "step": 27830000 + }, + { + "epoch": 80.56, + "learning_rate": 9.735519810577991e-06, + "loss": 1.8471, + "step": 27830500 + }, + { + "epoch": 80.56, + "learning_rate": 9.734796162930715e-06, + "loss": 1.8388, + "step": 27831000 + }, + { + "epoch": 80.56, + "learning_rate": 9.73407251528344e-06, + "loss": 1.8228, + "step": 27831500 + }, + { + "epoch": 80.56, + "learning_rate": 9.733348867636162e-06, + "loss": 1.842, + "step": 27832000 + }, + { + "epoch": 80.56, + "learning_rate": 9.732625219988885e-06, + "loss": 1.8301, + "step": 27832500 + }, + { + "epoch": 80.57, + "learning_rate": 9.73190157234161e-06, + "loss": 1.8271, + "step": 27833000 + }, + { + "epoch": 80.57, + "learning_rate": 9.731177924694332e-06, + "loss": 1.8585, + "step": 27833500 + }, + { + "epoch": 80.57, + "learning_rate": 9.730454277047056e-06, + "loss": 1.8493, + "step": 27834000 + }, + { + "epoch": 80.57, + "learning_rate": 9.729730629399778e-06, + "loss": 1.8409, + "step": 27834500 + }, + { + "epoch": 80.57, + "learning_rate": 9.729008429047797e-06, + "loss": 1.8448, + "step": 27835000 + }, + { + "epoch": 80.57, + "learning_rate": 9.728284781400519e-06, + "loss": 1.8387, + "step": 27835500 + }, + { + "epoch": 80.57, + "learning_rate": 9.727561133753243e-06, + "loss": 1.8642, + "step": 27836000 + }, + { + "epoch": 80.58, + "learning_rate": 9.726837486105965e-06, + "loss": 1.8401, + "step": 27836500 + }, + { + "epoch": 80.58, + "learning_rate": 9.726113838458689e-06, + "loss": 1.8573, + "step": 27837000 + }, + { + "epoch": 80.58, + "learning_rate": 9.725391638106706e-06, + "loss": 1.8552, + "step": 27837500 + }, + { + "epoch": 80.58, + "learning_rate": 9.72466799045943e-06, + "loss": 1.8386, + "step": 27838000 + }, + { + "epoch": 80.58, + "learning_rate": 9.723944342812154e-06, + "loss": 1.84, + "step": 27838500 + }, + { + "epoch": 80.58, + "learning_rate": 9.723220695164876e-06, + "loss": 1.8594, + "step": 27839000 + }, + { + "epoch": 80.58, + "learning_rate": 9.722497047517599e-06, + "loss": 1.854, + "step": 27839500 + }, + { + "epoch": 80.59, + "learning_rate": 9.721774847165618e-06, + "loss": 1.8628, + "step": 27840000 + }, + { + "epoch": 80.59, + "learning_rate": 9.721051199518341e-06, + "loss": 1.8427, + "step": 27840500 + }, + { + "epoch": 80.59, + "learning_rate": 9.720327551871064e-06, + "loss": 1.857, + "step": 27841000 + }, + { + "epoch": 80.59, + "learning_rate": 9.719603904223788e-06, + "loss": 1.8742, + "step": 27841500 + }, + { + "epoch": 80.59, + "learning_rate": 9.71888025657651e-06, + "loss": 1.8519, + "step": 27842000 + }, + { + "epoch": 80.59, + "learning_rate": 9.718156608929234e-06, + "loss": 1.8522, + "step": 27842500 + }, + { + "epoch": 80.59, + "learning_rate": 9.717434408577251e-06, + "loss": 1.8495, + "step": 27843000 + }, + { + "epoch": 80.6, + "learning_rate": 9.716712208225268e-06, + "loss": 1.8418, + "step": 27843500 + }, + { + "epoch": 80.6, + "learning_rate": 9.715988560577992e-06, + "loss": 1.8508, + "step": 27844000 + }, + { + "epoch": 80.6, + "learning_rate": 9.715264912930716e-06, + "loss": 1.8148, + "step": 27844500 + }, + { + "epoch": 80.6, + "learning_rate": 9.714541265283438e-06, + "loss": 1.8304, + "step": 27845000 + }, + { + "epoch": 80.6, + "learning_rate": 9.713817617636162e-06, + "loss": 1.8672, + "step": 27845500 + }, + { + "epoch": 80.6, + "learning_rate": 9.71309541728418e-06, + "loss": 1.8555, + "step": 27846000 + }, + { + "epoch": 80.6, + "learning_rate": 9.712371769636903e-06, + "loss": 1.836, + "step": 27846500 + }, + { + "epoch": 80.61, + "learning_rate": 9.711648121989626e-06, + "loss": 1.8178, + "step": 27847000 + }, + { + "epoch": 80.61, + "learning_rate": 9.71092447434235e-06, + "loss": 1.8483, + "step": 27847500 + }, + { + "epoch": 80.61, + "learning_rate": 9.710200826695074e-06, + "loss": 1.8455, + "step": 27848000 + }, + { + "epoch": 80.61, + "learning_rate": 9.709477179047796e-06, + "loss": 1.845, + "step": 27848500 + }, + { + "epoch": 80.61, + "learning_rate": 9.70875353140052e-06, + "loss": 1.8742, + "step": 27849000 + }, + { + "epoch": 80.61, + "learning_rate": 9.708029883753242e-06, + "loss": 1.8888, + "step": 27849500 + }, + { + "epoch": 80.61, + "learning_rate": 9.707306236105966e-06, + "loss": 1.8099, + "step": 27850000 + }, + { + "epoch": 80.62, + "learning_rate": 9.706582588458688e-06, + "loss": 1.8458, + "step": 27850500 + }, + { + "epoch": 80.62, + "learning_rate": 9.705858940811412e-06, + "loss": 1.857, + "step": 27851000 + }, + { + "epoch": 80.62, + "learning_rate": 9.705135293164136e-06, + "loss": 1.8217, + "step": 27851500 + }, + { + "epoch": 80.62, + "learning_rate": 9.704414540107448e-06, + "loss": 1.8261, + "step": 27852000 + }, + { + "epoch": 80.62, + "learning_rate": 9.70369089246017e-06, + "loss": 1.8399, + "step": 27852500 + }, + { + "epoch": 80.62, + "learning_rate": 9.702967244812894e-06, + "loss": 1.8326, + "step": 27853000 + }, + { + "epoch": 80.62, + "learning_rate": 9.702243597165617e-06, + "loss": 1.8545, + "step": 27853500 + }, + { + "epoch": 80.63, + "learning_rate": 9.70151994951834e-06, + "loss": 1.8474, + "step": 27854000 + }, + { + "epoch": 80.63, + "learning_rate": 9.700797749166358e-06, + "loss": 1.8733, + "step": 27854500 + }, + { + "epoch": 80.63, + "learning_rate": 9.700074101519082e-06, + "loss": 1.8421, + "step": 27855000 + }, + { + "epoch": 80.63, + "learning_rate": 9.699350453871806e-06, + "loss": 1.8604, + "step": 27855500 + }, + { + "epoch": 80.63, + "learning_rate": 9.698626806224528e-06, + "loss": 1.8269, + "step": 27856000 + }, + { + "epoch": 80.63, + "learning_rate": 9.697903158577252e-06, + "loss": 1.8263, + "step": 27856500 + }, + { + "epoch": 80.63, + "learning_rate": 9.697179510929974e-06, + "loss": 1.8772, + "step": 27857000 + }, + { + "epoch": 80.64, + "learning_rate": 9.696457310577993e-06, + "loss": 1.8339, + "step": 27857500 + }, + { + "epoch": 80.64, + "learning_rate": 9.695733662930715e-06, + "loss": 1.8405, + "step": 27858000 + }, + { + "epoch": 80.64, + "learning_rate": 9.69501001528344e-06, + "loss": 1.8196, + "step": 27858500 + }, + { + "epoch": 80.64, + "learning_rate": 9.694286367636161e-06, + "loss": 1.8334, + "step": 27859000 + }, + { + "epoch": 80.64, + "learning_rate": 9.693562719988885e-06, + "loss": 1.8652, + "step": 27859500 + }, + { + "epoch": 80.64, + "learning_rate": 9.69283907234161e-06, + "loss": 1.8569, + "step": 27860000 + }, + { + "epoch": 80.64, + "learning_rate": 9.692115424694332e-06, + "loss": 1.871, + "step": 27860500 + }, + { + "epoch": 80.65, + "learning_rate": 9.691391777047055e-06, + "loss": 1.8229, + "step": 27861000 + }, + { + "epoch": 80.65, + "learning_rate": 9.690668129399778e-06, + "loss": 1.8458, + "step": 27861500 + }, + { + "epoch": 80.65, + "learning_rate": 9.689945929047797e-06, + "loss": 1.8228, + "step": 27862000 + }, + { + "epoch": 80.65, + "learning_rate": 9.689222281400519e-06, + "loss": 1.8346, + "step": 27862500 + }, + { + "epoch": 80.65, + "learning_rate": 9.688498633753243e-06, + "loss": 1.8272, + "step": 27863000 + }, + { + "epoch": 80.65, + "learning_rate": 9.687774986105965e-06, + "loss": 1.8322, + "step": 27863500 + }, + { + "epoch": 80.65, + "learning_rate": 9.687051338458689e-06, + "loss": 1.8386, + "step": 27864000 + }, + { + "epoch": 80.66, + "learning_rate": 9.686327690811411e-06, + "loss": 1.854, + "step": 27864500 + }, + { + "epoch": 80.66, + "learning_rate": 9.685604043164135e-06, + "loss": 1.8504, + "step": 27865000 + }, + { + "epoch": 80.66, + "learning_rate": 9.684880395516859e-06, + "loss": 1.8243, + "step": 27865500 + }, + { + "epoch": 80.66, + "learning_rate": 9.684158195164876e-06, + "loss": 1.8357, + "step": 27866000 + }, + { + "epoch": 80.66, + "learning_rate": 9.683435994812894e-06, + "loss": 1.8612, + "step": 27866500 + }, + { + "epoch": 80.66, + "learning_rate": 9.682712347165617e-06, + "loss": 1.8434, + "step": 27867000 + }, + { + "epoch": 80.67, + "learning_rate": 9.681988699518341e-06, + "loss": 1.8442, + "step": 27867500 + }, + { + "epoch": 80.67, + "learning_rate": 9.681265051871064e-06, + "loss": 1.8503, + "step": 27868000 + }, + { + "epoch": 80.67, + "learning_rate": 9.680541404223788e-06, + "loss": 1.8459, + "step": 27868500 + }, + { + "epoch": 80.67, + "learning_rate": 9.67981775657651e-06, + "loss": 1.8372, + "step": 27869000 + }, + { + "epoch": 80.67, + "learning_rate": 9.679095556224529e-06, + "loss": 1.8667, + "step": 27869500 + }, + { + "epoch": 80.67, + "learning_rate": 9.678371908577251e-06, + "loss": 1.854, + "step": 27870000 + }, + { + "epoch": 80.67, + "learning_rate": 9.677648260929975e-06, + "loss": 1.8306, + "step": 27870500 + }, + { + "epoch": 80.68, + "learning_rate": 9.676924613282697e-06, + "loss": 1.8346, + "step": 27871000 + }, + { + "epoch": 80.68, + "learning_rate": 9.676200965635421e-06, + "loss": 1.849, + "step": 27871500 + }, + { + "epoch": 80.68, + "learning_rate": 9.675477317988143e-06, + "loss": 1.8433, + "step": 27872000 + }, + { + "epoch": 80.68, + "learning_rate": 9.674753670340867e-06, + "loss": 1.8362, + "step": 27872500 + }, + { + "epoch": 80.68, + "learning_rate": 9.674030022693591e-06, + "loss": 1.8148, + "step": 27873000 + }, + { + "epoch": 80.68, + "learning_rate": 9.673307822341608e-06, + "loss": 1.8349, + "step": 27873500 + }, + { + "epoch": 80.68, + "learning_rate": 9.67258417469433e-06, + "loss": 1.8548, + "step": 27874000 + }, + { + "epoch": 80.69, + "learning_rate": 9.671860527047055e-06, + "loss": 1.8459, + "step": 27874500 + }, + { + "epoch": 80.69, + "learning_rate": 9.671136879399778e-06, + "loss": 1.8239, + "step": 27875000 + }, + { + "epoch": 80.69, + "learning_rate": 9.6704132317525e-06, + "loss": 1.848, + "step": 27875500 + }, + { + "epoch": 80.69, + "learning_rate": 9.669689584105225e-06, + "loss": 1.8668, + "step": 27876000 + }, + { + "epoch": 80.69, + "learning_rate": 9.668965936457949e-06, + "loss": 1.8614, + "step": 27876500 + }, + { + "epoch": 80.69, + "learning_rate": 9.66824228881067e-06, + "loss": 1.8251, + "step": 27877000 + }, + { + "epoch": 80.69, + "learning_rate": 9.667518641163393e-06, + "loss": 1.831, + "step": 27877500 + }, + { + "epoch": 80.7, + "learning_rate": 9.666796440811412e-06, + "loss": 1.8285, + "step": 27878000 + }, + { + "epoch": 80.7, + "learning_rate": 9.666074240459431e-06, + "loss": 1.8403, + "step": 27878500 + }, + { + "epoch": 80.7, + "learning_rate": 9.665350592812153e-06, + "loss": 1.8382, + "step": 27879000 + }, + { + "epoch": 80.7, + "learning_rate": 9.664626945164875e-06, + "loss": 1.8674, + "step": 27879500 + }, + { + "epoch": 80.7, + "learning_rate": 9.6639032975176e-06, + "loss": 1.8351, + "step": 27880000 + }, + { + "epoch": 80.7, + "learning_rate": 9.663179649870323e-06, + "loss": 1.8691, + "step": 27880500 + }, + { + "epoch": 80.7, + "learning_rate": 9.662456002223045e-06, + "loss": 1.8377, + "step": 27881000 + }, + { + "epoch": 80.71, + "learning_rate": 9.66173235457577e-06, + "loss": 1.8467, + "step": 27881500 + }, + { + "epoch": 80.71, + "learning_rate": 9.661008706928493e-06, + "loss": 1.8723, + "step": 27882000 + }, + { + "epoch": 80.71, + "learning_rate": 9.660285059281216e-06, + "loss": 1.8445, + "step": 27882500 + }, + { + "epoch": 80.71, + "learning_rate": 9.659562858929233e-06, + "loss": 1.8601, + "step": 27883000 + }, + { + "epoch": 80.71, + "learning_rate": 9.65884065857725e-06, + "loss": 1.8663, + "step": 27883500 + }, + { + "epoch": 80.71, + "learning_rate": 9.658117010929976e-06, + "loss": 1.8315, + "step": 27884000 + }, + { + "epoch": 80.71, + "learning_rate": 9.657393363282698e-06, + "loss": 1.8589, + "step": 27884500 + }, + { + "epoch": 80.72, + "learning_rate": 9.65666971563542e-06, + "loss": 1.8499, + "step": 27885000 + }, + { + "epoch": 80.72, + "learning_rate": 9.655946067988144e-06, + "loss": 1.8573, + "step": 27885500 + }, + { + "epoch": 80.72, + "learning_rate": 9.655222420340868e-06, + "loss": 1.8716, + "step": 27886000 + }, + { + "epoch": 80.72, + "learning_rate": 9.65449877269359e-06, + "loss": 1.8466, + "step": 27886500 + }, + { + "epoch": 80.72, + "learning_rate": 9.653775125046314e-06, + "loss": 1.8431, + "step": 27887000 + }, + { + "epoch": 80.72, + "learning_rate": 9.653051477399038e-06, + "loss": 1.8492, + "step": 27887500 + }, + { + "epoch": 80.72, + "learning_rate": 9.652329277047055e-06, + "loss": 1.8582, + "step": 27888000 + }, + { + "epoch": 80.73, + "learning_rate": 9.651605629399778e-06, + "loss": 1.8428, + "step": 27888500 + }, + { + "epoch": 80.73, + "learning_rate": 9.650883429047795e-06, + "loss": 1.8542, + "step": 27889000 + }, + { + "epoch": 80.73, + "learning_rate": 9.650159781400519e-06, + "loss": 1.8536, + "step": 27889500 + }, + { + "epoch": 80.73, + "learning_rate": 9.649436133753243e-06, + "loss": 1.8535, + "step": 27890000 + }, + { + "epoch": 80.73, + "learning_rate": 9.648712486105965e-06, + "loss": 1.8466, + "step": 27890500 + }, + { + "epoch": 80.73, + "learning_rate": 9.647991733049277e-06, + "loss": 1.8539, + "step": 27891000 + }, + { + "epoch": 80.73, + "learning_rate": 9.647268085402001e-06, + "loss": 1.8466, + "step": 27891500 + }, + { + "epoch": 80.74, + "learning_rate": 9.646544437754725e-06, + "loss": 1.8618, + "step": 27892000 + }, + { + "epoch": 80.74, + "learning_rate": 9.645820790107447e-06, + "loss": 1.8648, + "step": 27892500 + }, + { + "epoch": 80.74, + "learning_rate": 9.64509714246017e-06, + "loss": 1.8423, + "step": 27893000 + }, + { + "epoch": 80.74, + "learning_rate": 9.644373494812895e-06, + "loss": 1.8682, + "step": 27893500 + }, + { + "epoch": 80.74, + "learning_rate": 9.643651294460912e-06, + "loss": 1.8803, + "step": 27894000 + }, + { + "epoch": 80.74, + "learning_rate": 9.642927646813635e-06, + "loss": 1.8301, + "step": 27894500 + }, + { + "epoch": 80.74, + "learning_rate": 9.642203999166359e-06, + "loss": 1.8815, + "step": 27895000 + }, + { + "epoch": 80.75, + "learning_rate": 9.641480351519082e-06, + "loss": 1.832, + "step": 27895500 + }, + { + "epoch": 80.75, + "learning_rate": 9.640756703871805e-06, + "loss": 1.8724, + "step": 27896000 + }, + { + "epoch": 80.75, + "learning_rate": 9.640033056224527e-06, + "loss": 1.8244, + "step": 27896500 + }, + { + "epoch": 80.75, + "learning_rate": 9.639309408577253e-06, + "loss": 1.8602, + "step": 27897000 + }, + { + "epoch": 80.75, + "learning_rate": 9.638585760929975e-06, + "loss": 1.8623, + "step": 27897500 + }, + { + "epoch": 80.75, + "learning_rate": 9.637862113282697e-06, + "loss": 1.8306, + "step": 27898000 + }, + { + "epoch": 80.75, + "learning_rate": 9.637138465635421e-06, + "loss": 1.8333, + "step": 27898500 + }, + { + "epoch": 80.76, + "learning_rate": 9.63641626528344e-06, + "loss": 1.8691, + "step": 27899000 + }, + { + "epoch": 80.76, + "learning_rate": 9.635692617636162e-06, + "loss": 1.8522, + "step": 27899500 + }, + { + "epoch": 80.76, + "learning_rate": 9.634968969988884e-06, + "loss": 1.8605, + "step": 27900000 + }, + { + "epoch": 80.76, + "learning_rate": 9.634245322341608e-06, + "loss": 1.8485, + "step": 27900500 + }, + { + "epoch": 80.76, + "learning_rate": 9.633521674694332e-06, + "loss": 1.843, + "step": 27901000 + }, + { + "epoch": 80.76, + "learning_rate": 9.632798027047054e-06, + "loss": 1.8381, + "step": 27901500 + }, + { + "epoch": 80.76, + "learning_rate": 9.632074379399778e-06, + "loss": 1.8373, + "step": 27902000 + }, + { + "epoch": 80.77, + "learning_rate": 9.631350731752502e-06, + "loss": 1.8511, + "step": 27902500 + }, + { + "epoch": 80.77, + "learning_rate": 9.630627084105225e-06, + "loss": 1.8615, + "step": 27903000 + }, + { + "epoch": 80.77, + "learning_rate": 9.629904883753242e-06, + "loss": 1.8586, + "step": 27903500 + }, + { + "epoch": 80.77, + "learning_rate": 9.629181236105966e-06, + "loss": 1.8587, + "step": 27904000 + }, + { + "epoch": 80.77, + "learning_rate": 9.62845758845869e-06, + "loss": 1.8511, + "step": 27904500 + }, + { + "epoch": 80.77, + "learning_rate": 9.627733940811412e-06, + "loss": 1.8228, + "step": 27905000 + }, + { + "epoch": 80.77, + "learning_rate": 9.627010293164134e-06, + "loss": 1.8506, + "step": 27905500 + }, + { + "epoch": 80.78, + "learning_rate": 9.62628664551686e-06, + "loss": 1.859, + "step": 27906000 + }, + { + "epoch": 80.78, + "learning_rate": 9.625562997869582e-06, + "loss": 1.845, + "step": 27906500 + }, + { + "epoch": 80.78, + "learning_rate": 9.624839350222304e-06, + "loss": 1.8543, + "step": 27907000 + }, + { + "epoch": 80.78, + "learning_rate": 9.624115702575028e-06, + "loss": 1.8285, + "step": 27907500 + }, + { + "epoch": 80.78, + "learning_rate": 9.623392054927752e-06, + "loss": 1.8575, + "step": 27908000 + }, + { + "epoch": 80.78, + "learning_rate": 9.62266985457577e-06, + "loss": 1.8239, + "step": 27908500 + }, + { + "epoch": 80.79, + "learning_rate": 9.621946206928492e-06, + "loss": 1.8468, + "step": 27909000 + }, + { + "epoch": 80.79, + "learning_rate": 9.621222559281217e-06, + "loss": 1.8545, + "step": 27909500 + }, + { + "epoch": 80.79, + "learning_rate": 9.62050180622453e-06, + "loss": 1.8411, + "step": 27910000 + }, + { + "epoch": 80.79, + "learning_rate": 9.619778158577252e-06, + "loss": 1.8309, + "step": 27910500 + }, + { + "epoch": 80.79, + "learning_rate": 9.619054510929974e-06, + "loss": 1.847, + "step": 27911000 + }, + { + "epoch": 80.79, + "learning_rate": 9.618330863282698e-06, + "loss": 1.8427, + "step": 27911500 + }, + { + "epoch": 80.79, + "learning_rate": 9.617607215635422e-06, + "loss": 1.8534, + "step": 27912000 + }, + { + "epoch": 80.8, + "learning_rate": 9.616883567988144e-06, + "loss": 1.8482, + "step": 27912500 + }, + { + "epoch": 80.8, + "learning_rate": 9.616159920340866e-06, + "loss": 1.8491, + "step": 27913000 + }, + { + "epoch": 80.8, + "learning_rate": 9.615436272693592e-06, + "loss": 1.8375, + "step": 27913500 + }, + { + "epoch": 80.8, + "learning_rate": 9.614712625046314e-06, + "loss": 1.8436, + "step": 27914000 + }, + { + "epoch": 80.8, + "learning_rate": 9.613988977399036e-06, + "loss": 1.8376, + "step": 27914500 + }, + { + "epoch": 80.8, + "learning_rate": 9.61326532975176e-06, + "loss": 1.8415, + "step": 27915000 + }, + { + "epoch": 80.8, + "learning_rate": 9.612541682104484e-06, + "loss": 1.8745, + "step": 27915500 + }, + { + "epoch": 80.81, + "learning_rate": 9.611818034457206e-06, + "loss": 1.8609, + "step": 27916000 + }, + { + "epoch": 80.81, + "learning_rate": 9.61109438680993e-06, + "loss": 1.8515, + "step": 27916500 + }, + { + "epoch": 80.81, + "learning_rate": 9.61037218645795e-06, + "loss": 1.8599, + "step": 27917000 + }, + { + "epoch": 80.81, + "learning_rate": 9.609649986105966e-06, + "loss": 1.8141, + "step": 27917500 + }, + { + "epoch": 80.81, + "learning_rate": 9.608927785753984e-06, + "loss": 1.8491, + "step": 27918000 + }, + { + "epoch": 80.81, + "learning_rate": 9.608204138106706e-06, + "loss": 1.8631, + "step": 27918500 + }, + { + "epoch": 80.81, + "learning_rate": 9.60748049045943e-06, + "loss": 1.8481, + "step": 27919000 + }, + { + "epoch": 80.82, + "learning_rate": 9.606758290107449e-06, + "loss": 1.8571, + "step": 27919500 + }, + { + "epoch": 80.82, + "learning_rate": 9.606034642460171e-06, + "loss": 1.8388, + "step": 27920000 + }, + { + "epoch": 80.82, + "learning_rate": 9.605310994812893e-06, + "loss": 1.838, + "step": 27920500 + }, + { + "epoch": 80.82, + "learning_rate": 9.604587347165617e-06, + "loss": 1.8462, + "step": 27921000 + }, + { + "epoch": 80.82, + "learning_rate": 9.603863699518341e-06, + "loss": 1.8586, + "step": 27921500 + }, + { + "epoch": 80.82, + "learning_rate": 9.603140051871063e-06, + "loss": 1.8373, + "step": 27922000 + }, + { + "epoch": 80.82, + "learning_rate": 9.602416404223787e-06, + "loss": 1.8561, + "step": 27922500 + }, + { + "epoch": 80.83, + "learning_rate": 9.601692756576511e-06, + "loss": 1.8326, + "step": 27923000 + }, + { + "epoch": 80.83, + "learning_rate": 9.600969108929233e-06, + "loss": 1.8378, + "step": 27923500 + }, + { + "epoch": 80.83, + "learning_rate": 9.600245461281956e-06, + "loss": 1.8278, + "step": 27924000 + }, + { + "epoch": 80.83, + "learning_rate": 9.59952181363468e-06, + "loss": 1.8543, + "step": 27924500 + }, + { + "epoch": 80.83, + "learning_rate": 9.598798165987404e-06, + "loss": 1.8488, + "step": 27925000 + }, + { + "epoch": 80.83, + "learning_rate": 9.598074518340126e-06, + "loss": 1.851, + "step": 27925500 + }, + { + "epoch": 80.83, + "learning_rate": 9.59735087069285e-06, + "loss": 1.833, + "step": 27926000 + }, + { + "epoch": 80.84, + "learning_rate": 9.596627223045574e-06, + "loss": 1.828, + "step": 27926500 + }, + { + "epoch": 80.84, + "learning_rate": 9.595903575398296e-06, + "loss": 1.8462, + "step": 27927000 + }, + { + "epoch": 80.84, + "learning_rate": 9.595181375046313e-06, + "loss": 1.8602, + "step": 27927500 + }, + { + "epoch": 80.84, + "learning_rate": 9.594457727399037e-06, + "loss": 1.8557, + "step": 27928000 + }, + { + "epoch": 80.84, + "learning_rate": 9.593734079751761e-06, + "loss": 1.8805, + "step": 27928500 + }, + { + "epoch": 80.84, + "learning_rate": 9.593010432104483e-06, + "loss": 1.8484, + "step": 27929000 + }, + { + "epoch": 80.84, + "learning_rate": 9.592286784457207e-06, + "loss": 1.8488, + "step": 27929500 + }, + { + "epoch": 80.85, + "learning_rate": 9.591564584105224e-06, + "loss": 1.8305, + "step": 27930000 + }, + { + "epoch": 80.85, + "learning_rate": 9.590840936457948e-06, + "loss": 1.8507, + "step": 27930500 + }, + { + "epoch": 80.85, + "learning_rate": 9.59011728881067e-06, + "loss": 1.8689, + "step": 27931000 + }, + { + "epoch": 80.85, + "learning_rate": 9.589393641163395e-06, + "loss": 1.8415, + "step": 27931500 + }, + { + "epoch": 80.85, + "learning_rate": 9.588671440811412e-06, + "loss": 1.8615, + "step": 27932000 + }, + { + "epoch": 80.85, + "learning_rate": 9.587947793164136e-06, + "loss": 1.8329, + "step": 27932500 + }, + { + "epoch": 80.85, + "learning_rate": 9.587224145516858e-06, + "loss": 1.8238, + "step": 27933000 + }, + { + "epoch": 80.86, + "learning_rate": 9.586500497869582e-06, + "loss": 1.8683, + "step": 27933500 + }, + { + "epoch": 80.86, + "learning_rate": 9.585776850222306e-06, + "loss": 1.8459, + "step": 27934000 + }, + { + "epoch": 80.86, + "learning_rate": 9.585054649870323e-06, + "loss": 1.8452, + "step": 27934500 + }, + { + "epoch": 80.86, + "learning_rate": 9.584331002223045e-06, + "loss": 1.8456, + "step": 27935000 + }, + { + "epoch": 80.86, + "learning_rate": 9.58360735457577e-06, + "loss": 1.8432, + "step": 27935500 + }, + { + "epoch": 80.86, + "learning_rate": 9.582883706928493e-06, + "loss": 1.837, + "step": 27936000 + }, + { + "epoch": 80.86, + "learning_rate": 9.582160059281215e-06, + "loss": 1.8622, + "step": 27936500 + }, + { + "epoch": 80.87, + "learning_rate": 9.58143641163394e-06, + "loss": 1.8499, + "step": 27937000 + }, + { + "epoch": 80.87, + "learning_rate": 9.580714211281957e-06, + "loss": 1.8471, + "step": 27937500 + }, + { + "epoch": 80.87, + "learning_rate": 9.57999056363468e-06, + "loss": 1.8596, + "step": 27938000 + }, + { + "epoch": 80.87, + "learning_rate": 9.579268363282698e-06, + "loss": 1.8501, + "step": 27938500 + }, + { + "epoch": 80.87, + "learning_rate": 9.57854471563542e-06, + "loss": 1.8649, + "step": 27939000 + }, + { + "epoch": 80.87, + "learning_rate": 9.577821067988144e-06, + "loss": 1.8399, + "step": 27939500 + }, + { + "epoch": 80.87, + "learning_rate": 9.577097420340868e-06, + "loss": 1.8438, + "step": 27940000 + }, + { + "epoch": 80.88, + "learning_rate": 9.57637377269359e-06, + "loss": 1.8387, + "step": 27940500 + }, + { + "epoch": 80.88, + "learning_rate": 9.575650125046314e-06, + "loss": 1.8661, + "step": 27941000 + }, + { + "epoch": 80.88, + "learning_rate": 9.574926477399038e-06, + "loss": 1.8209, + "step": 27941500 + }, + { + "epoch": 80.88, + "learning_rate": 9.57420282975176e-06, + "loss": 1.8292, + "step": 27942000 + }, + { + "epoch": 80.88, + "learning_rate": 9.573479182104484e-06, + "loss": 1.8229, + "step": 27942500 + }, + { + "epoch": 80.88, + "learning_rate": 9.572755534457206e-06, + "loss": 1.8591, + "step": 27943000 + }, + { + "epoch": 80.88, + "learning_rate": 9.57203188680993e-06, + "loss": 1.8529, + "step": 27943500 + }, + { + "epoch": 80.89, + "learning_rate": 9.571309686457947e-06, + "loss": 1.8315, + "step": 27944000 + }, + { + "epoch": 80.89, + "learning_rate": 9.570587486105965e-06, + "loss": 1.8449, + "step": 27944500 + }, + { + "epoch": 80.89, + "learning_rate": 9.569863838458689e-06, + "loss": 1.8481, + "step": 27945000 + }, + { + "epoch": 80.89, + "learning_rate": 9.569140190811413e-06, + "loss": 1.8462, + "step": 27945500 + }, + { + "epoch": 80.89, + "learning_rate": 9.568416543164135e-06, + "loss": 1.8399, + "step": 27946000 + }, + { + "epoch": 80.89, + "learning_rate": 9.567692895516859e-06, + "loss": 1.8525, + "step": 27946500 + }, + { + "epoch": 80.9, + "learning_rate": 9.566969247869583e-06, + "loss": 1.84, + "step": 27947000 + }, + { + "epoch": 80.9, + "learning_rate": 9.566245600222305e-06, + "loss": 1.8579, + "step": 27947500 + }, + { + "epoch": 80.9, + "learning_rate": 9.565521952575029e-06, + "loss": 1.8431, + "step": 27948000 + }, + { + "epoch": 80.9, + "learning_rate": 9.564798304927751e-06, + "loss": 1.846, + "step": 27948500 + }, + { + "epoch": 80.9, + "learning_rate": 9.564074657280475e-06, + "loss": 1.8423, + "step": 27949000 + }, + { + "epoch": 80.9, + "learning_rate": 9.563352456928492e-06, + "loss": 1.8228, + "step": 27949500 + }, + { + "epoch": 80.9, + "learning_rate": 9.562628809281216e-06, + "loss": 1.8442, + "step": 27950000 + }, + { + "epoch": 80.91, + "learning_rate": 9.561905161633938e-06, + "loss": 1.856, + "step": 27950500 + }, + { + "epoch": 80.91, + "learning_rate": 9.561181513986662e-06, + "loss": 1.8431, + "step": 27951000 + }, + { + "epoch": 80.91, + "learning_rate": 9.560457866339386e-06, + "loss": 1.8479, + "step": 27951500 + }, + { + "epoch": 80.91, + "learning_rate": 9.559735665987403e-06, + "loss": 1.8537, + "step": 27952000 + }, + { + "epoch": 80.91, + "learning_rate": 9.559012018340126e-06, + "loss": 1.8552, + "step": 27952500 + }, + { + "epoch": 80.91, + "learning_rate": 9.55828837069285e-06, + "loss": 1.8389, + "step": 27953000 + }, + { + "epoch": 80.91, + "learning_rate": 9.557564723045574e-06, + "loss": 1.8456, + "step": 27953500 + }, + { + "epoch": 80.92, + "learning_rate": 9.55684252269359e-06, + "loss": 1.8267, + "step": 27954000 + }, + { + "epoch": 80.92, + "learning_rate": 9.556120322341608e-06, + "loss": 1.8282, + "step": 27954500 + }, + { + "epoch": 80.92, + "learning_rate": 9.555396674694332e-06, + "loss": 1.8594, + "step": 27955000 + }, + { + "epoch": 80.92, + "learning_rate": 9.554673027047054e-06, + "loss": 1.8785, + "step": 27955500 + }, + { + "epoch": 80.92, + "learning_rate": 9.553949379399778e-06, + "loss": 1.8757, + "step": 27956000 + }, + { + "epoch": 80.92, + "learning_rate": 9.553225731752502e-06, + "loss": 1.8299, + "step": 27956500 + }, + { + "epoch": 80.92, + "learning_rate": 9.552502084105224e-06, + "loss": 1.8434, + "step": 27957000 + }, + { + "epoch": 80.93, + "learning_rate": 9.551779883753242e-06, + "loss": 1.8436, + "step": 27957500 + }, + { + "epoch": 80.93, + "learning_rate": 9.551056236105965e-06, + "loss": 1.8542, + "step": 27958000 + }, + { + "epoch": 80.93, + "learning_rate": 9.55033258845869e-06, + "loss": 1.8634, + "step": 27958500 + }, + { + "epoch": 80.93, + "learning_rate": 9.549608940811412e-06, + "loss": 1.8504, + "step": 27959000 + }, + { + "epoch": 80.93, + "learning_rate": 9.548885293164136e-06, + "loss": 1.85, + "step": 27959500 + }, + { + "epoch": 80.93, + "learning_rate": 9.548161645516858e-06, + "loss": 1.8499, + "step": 27960000 + }, + { + "epoch": 80.93, + "learning_rate": 9.547437997869582e-06, + "loss": 1.8234, + "step": 27960500 + }, + { + "epoch": 80.94, + "learning_rate": 9.546714350222306e-06, + "loss": 1.8596, + "step": 27961000 + }, + { + "epoch": 80.94, + "learning_rate": 9.545990702575028e-06, + "loss": 1.8349, + "step": 27961500 + }, + { + "epoch": 80.94, + "learning_rate": 9.545268502223045e-06, + "loss": 1.8672, + "step": 27962000 + }, + { + "epoch": 80.94, + "learning_rate": 9.544544854575769e-06, + "loss": 1.8367, + "step": 27962500 + }, + { + "epoch": 80.94, + "learning_rate": 9.543821206928493e-06, + "loss": 1.833, + "step": 27963000 + }, + { + "epoch": 80.94, + "learning_rate": 9.543097559281215e-06, + "loss": 1.8287, + "step": 27963500 + }, + { + "epoch": 80.94, + "learning_rate": 9.542375358929234e-06, + "loss": 1.8454, + "step": 27964000 + }, + { + "epoch": 80.95, + "learning_rate": 9.541651711281956e-06, + "loss": 1.8467, + "step": 27964500 + }, + { + "epoch": 80.95, + "learning_rate": 9.54092806363468e-06, + "loss": 1.8432, + "step": 27965000 + }, + { + "epoch": 80.95, + "learning_rate": 9.540204415987403e-06, + "loss": 1.853, + "step": 27965500 + }, + { + "epoch": 80.95, + "learning_rate": 9.539480768340127e-06, + "loss": 1.8599, + "step": 27966000 + }, + { + "epoch": 80.95, + "learning_rate": 9.53875712069285e-06, + "loss": 1.8262, + "step": 27966500 + }, + { + "epoch": 80.95, + "learning_rate": 9.538033473045573e-06, + "loss": 1.8558, + "step": 27967000 + }, + { + "epoch": 80.95, + "learning_rate": 9.53731127269359e-06, + "loss": 1.8442, + "step": 27967500 + }, + { + "epoch": 80.96, + "learning_rate": 9.536587625046314e-06, + "loss": 1.836, + "step": 27968000 + }, + { + "epoch": 80.96, + "learning_rate": 9.535863977399038e-06, + "loss": 1.8375, + "step": 27968500 + }, + { + "epoch": 80.96, + "learning_rate": 9.53514032975176e-06, + "loss": 1.8443, + "step": 27969000 + }, + { + "epoch": 80.96, + "learning_rate": 9.534416682104484e-06, + "loss": 1.8288, + "step": 27969500 + }, + { + "epoch": 80.96, + "learning_rate": 9.533693034457208e-06, + "loss": 1.8366, + "step": 27970000 + }, + { + "epoch": 80.96, + "learning_rate": 9.53296938680993e-06, + "loss": 1.859, + "step": 27970500 + }, + { + "epoch": 80.96, + "learning_rate": 9.532245739162652e-06, + "loss": 1.8444, + "step": 27971000 + }, + { + "epoch": 80.97, + "learning_rate": 9.531522091515376e-06, + "loss": 1.8493, + "step": 27971500 + }, + { + "epoch": 80.97, + "learning_rate": 9.5307984438681e-06, + "loss": 1.8461, + "step": 27972000 + }, + { + "epoch": 80.97, + "learning_rate": 9.530074796220822e-06, + "loss": 1.8595, + "step": 27972500 + }, + { + "epoch": 80.97, + "learning_rate": 9.529351148573546e-06, + "loss": 1.8667, + "step": 27973000 + }, + { + "epoch": 80.97, + "learning_rate": 9.528628948221564e-06, + "loss": 1.8656, + "step": 27973500 + }, + { + "epoch": 80.97, + "learning_rate": 9.527905300574288e-06, + "loss": 1.8372, + "step": 27974000 + }, + { + "epoch": 80.97, + "learning_rate": 9.527183100222305e-06, + "loss": 1.8724, + "step": 27974500 + }, + { + "epoch": 80.98, + "learning_rate": 9.526459452575029e-06, + "loss": 1.8354, + "step": 27975000 + }, + { + "epoch": 80.98, + "learning_rate": 9.525735804927751e-06, + "loss": 1.8524, + "step": 27975500 + }, + { + "epoch": 80.98, + "learning_rate": 9.525012157280475e-06, + "loss": 1.8496, + "step": 27976000 + }, + { + "epoch": 80.98, + "learning_rate": 9.524288509633197e-06, + "loss": 1.8127, + "step": 27976500 + }, + { + "epoch": 80.98, + "learning_rate": 9.523564861985921e-06, + "loss": 1.8504, + "step": 27977000 + }, + { + "epoch": 80.98, + "learning_rate": 9.522841214338645e-06, + "loss": 1.8636, + "step": 27977500 + }, + { + "epoch": 80.98, + "learning_rate": 9.522117566691367e-06, + "loss": 1.841, + "step": 27978000 + }, + { + "epoch": 80.99, + "learning_rate": 9.521393919044091e-06, + "loss": 1.8518, + "step": 27978500 + }, + { + "epoch": 80.99, + "learning_rate": 9.520671718692108e-06, + "loss": 1.8402, + "step": 27979000 + }, + { + "epoch": 80.99, + "learning_rate": 9.519948071044832e-06, + "loss": 1.842, + "step": 27979500 + }, + { + "epoch": 80.99, + "learning_rate": 9.519224423397555e-06, + "loss": 1.8683, + "step": 27980000 + }, + { + "epoch": 80.99, + "learning_rate": 9.518500775750278e-06, + "loss": 1.8396, + "step": 27980500 + }, + { + "epoch": 80.99, + "learning_rate": 9.517777128103002e-06, + "loss": 1.8664, + "step": 27981000 + }, + { + "epoch": 80.99, + "learning_rate": 9.517053480455725e-06, + "loss": 1.853, + "step": 27981500 + }, + { + "epoch": 81.0, + "learning_rate": 9.516329832808447e-06, + "loss": 1.8603, + "step": 27982000 + }, + { + "epoch": 81.0, + "learning_rate": 9.515607632456466e-06, + "loss": 1.839, + "step": 27982500 + }, + { + "epoch": 81.0, + "learning_rate": 9.51488398480919e-06, + "loss": 1.8393, + "step": 27983000 + }, + { + "epoch": 81.0, + "eval_accuracy": 0.6873256623884321, + "eval_accuracy_mlm": 0.6559826513935384, + "eval_accuracy_nsp": 0.8555109467306468, + "eval_loss": 2.204529047012329, + "eval_runtime": 331.9624, + "eval_samples_per_second": 1314.564, + "eval_steps_per_second": 54.774, + "step": 27983232 + }, + { + "epoch": 81.0, + "learning_rate": 9.514160337161912e-06, + "loss": 1.8289, + "step": 27983500 + }, + { + "epoch": 81.0, + "learning_rate": 9.513436689514634e-06, + "loss": 1.848, + "step": 27984000 + }, + { + "epoch": 81.0, + "learning_rate": 9.51271304186736e-06, + "loss": 1.811, + "step": 27984500 + }, + { + "epoch": 81.01, + "learning_rate": 9.511990841515377e-06, + "loss": 1.8314, + "step": 27985000 + }, + { + "epoch": 81.01, + "learning_rate": 9.5112671938681e-06, + "loss": 1.8233, + "step": 27985500 + }, + { + "epoch": 81.01, + "learning_rate": 9.510543546220823e-06, + "loss": 1.8343, + "step": 27986000 + }, + { + "epoch": 81.01, + "learning_rate": 9.509819898573547e-06, + "loss": 1.8559, + "step": 27986500 + }, + { + "epoch": 81.01, + "learning_rate": 9.509097698221564e-06, + "loss": 1.8376, + "step": 27987000 + }, + { + "epoch": 81.01, + "learning_rate": 9.508374050574287e-06, + "loss": 1.7997, + "step": 27987500 + }, + { + "epoch": 81.01, + "learning_rate": 9.50765040292701e-06, + "loss": 1.8277, + "step": 27988000 + }, + { + "epoch": 81.02, + "learning_rate": 9.506926755279734e-06, + "loss": 1.8183, + "step": 27988500 + }, + { + "epoch": 81.02, + "learning_rate": 9.506204554927752e-06, + "loss": 1.8362, + "step": 27989000 + }, + { + "epoch": 81.02, + "learning_rate": 9.505480907280474e-06, + "loss": 1.8496, + "step": 27989500 + }, + { + "epoch": 81.02, + "learning_rate": 9.504757259633198e-06, + "loss": 1.8604, + "step": 27990000 + }, + { + "epoch": 81.02, + "learning_rate": 9.504033611985922e-06, + "loss": 1.8382, + "step": 27990500 + }, + { + "epoch": 81.02, + "learning_rate": 9.503309964338644e-06, + "loss": 1.8236, + "step": 27991000 + }, + { + "epoch": 81.02, + "learning_rate": 9.502586316691366e-06, + "loss": 1.8519, + "step": 27991500 + }, + { + "epoch": 81.03, + "learning_rate": 9.501862669044092e-06, + "loss": 1.8567, + "step": 27992000 + }, + { + "epoch": 81.03, + "learning_rate": 9.501139021396814e-06, + "loss": 1.8519, + "step": 27992500 + }, + { + "epoch": 81.03, + "learning_rate": 9.500415373749536e-06, + "loss": 1.8376, + "step": 27993000 + }, + { + "epoch": 81.03, + "learning_rate": 9.499693173397554e-06, + "loss": 1.8397, + "step": 27993500 + }, + { + "epoch": 81.03, + "learning_rate": 9.49896952575028e-06, + "loss": 1.8032, + "step": 27994000 + }, + { + "epoch": 81.03, + "learning_rate": 9.498245878103001e-06, + "loss": 1.8208, + "step": 27994500 + }, + { + "epoch": 81.03, + "learning_rate": 9.497522230455724e-06, + "loss": 1.8153, + "step": 27995000 + }, + { + "epoch": 81.04, + "learning_rate": 9.496800030103743e-06, + "loss": 1.8227, + "step": 27995500 + }, + { + "epoch": 81.04, + "learning_rate": 9.496077829751762e-06, + "loss": 1.8619, + "step": 27996000 + }, + { + "epoch": 81.04, + "learning_rate": 9.495354182104484e-06, + "loss": 1.8431, + "step": 27996500 + }, + { + "epoch": 81.04, + "learning_rate": 9.494630534457206e-06, + "loss": 1.8263, + "step": 27997000 + }, + { + "epoch": 81.04, + "learning_rate": 9.49390688680993e-06, + "loss": 1.8264, + "step": 27997500 + }, + { + "epoch": 81.04, + "learning_rate": 9.493183239162654e-06, + "loss": 1.8234, + "step": 27998000 + }, + { + "epoch": 81.04, + "learning_rate": 9.492463933401261e-06, + "loss": 1.8351, + "step": 27998500 + }, + { + "epoch": 81.05, + "learning_rate": 9.491740285753983e-06, + "loss": 1.8437, + "step": 27999000 + }, + { + "epoch": 81.05, + "learning_rate": 9.491016638106706e-06, + "loss": 1.8498, + "step": 27999500 + }, + { + "epoch": 81.05, + "learning_rate": 9.49029299045943e-06, + "loss": 1.8355, + "step": 28000000 + }, + { + "epoch": 81.05, + "learning_rate": 9.489569342812154e-06, + "loss": 1.84, + "step": 28000500 + }, + { + "epoch": 81.05, + "learning_rate": 9.488845695164876e-06, + "loss": 1.8398, + "step": 28001000 + }, + { + "epoch": 81.05, + "learning_rate": 9.4881220475176e-06, + "loss": 1.8394, + "step": 28001500 + }, + { + "epoch": 81.05, + "learning_rate": 9.487399847165619e-06, + "loss": 1.842, + "step": 28002000 + }, + { + "epoch": 81.06, + "learning_rate": 9.486676199518341e-06, + "loss": 1.8563, + "step": 28002500 + }, + { + "epoch": 81.06, + "learning_rate": 9.485952551871063e-06, + "loss": 1.8594, + "step": 28003000 + }, + { + "epoch": 81.06, + "learning_rate": 9.485228904223787e-06, + "loss": 1.8372, + "step": 28003500 + }, + { + "epoch": 81.06, + "learning_rate": 9.484505256576511e-06, + "loss": 1.8357, + "step": 28004000 + }, + { + "epoch": 81.06, + "learning_rate": 9.483781608929233e-06, + "loss": 1.8588, + "step": 28004500 + }, + { + "epoch": 81.06, + "learning_rate": 9.483057961281955e-06, + "loss": 1.8487, + "step": 28005000 + }, + { + "epoch": 81.06, + "learning_rate": 9.482334313634681e-06, + "loss": 1.8661, + "step": 28005500 + }, + { + "epoch": 81.07, + "learning_rate": 9.481612113282698e-06, + "loss": 1.8235, + "step": 28006000 + }, + { + "epoch": 81.07, + "learning_rate": 9.48088846563542e-06, + "loss": 1.8069, + "step": 28006500 + }, + { + "epoch": 81.07, + "learning_rate": 9.480164817988143e-06, + "loss": 1.8556, + "step": 28007000 + }, + { + "epoch": 81.07, + "learning_rate": 9.479441170340868e-06, + "loss": 1.8299, + "step": 28007500 + }, + { + "epoch": 81.07, + "learning_rate": 9.47871752269359e-06, + "loss": 1.8301, + "step": 28008000 + }, + { + "epoch": 81.07, + "learning_rate": 9.477993875046313e-06, + "loss": 1.8214, + "step": 28008500 + }, + { + "epoch": 81.07, + "learning_rate": 9.477270227399038e-06, + "loss": 1.8483, + "step": 28009000 + }, + { + "epoch": 81.08, + "learning_rate": 9.47654657975176e-06, + "loss": 1.8412, + "step": 28009500 + }, + { + "epoch": 81.08, + "learning_rate": 9.475822932104483e-06, + "loss": 1.8414, + "step": 28010000 + }, + { + "epoch": 81.08, + "learning_rate": 9.475099284457207e-06, + "loss": 1.8161, + "step": 28010500 + }, + { + "epoch": 81.08, + "learning_rate": 9.47437563680993e-06, + "loss": 1.8472, + "step": 28011000 + }, + { + "epoch": 81.08, + "learning_rate": 9.473653436457948e-06, + "loss": 1.833, + "step": 28011500 + }, + { + "epoch": 81.08, + "learning_rate": 9.47292978881067e-06, + "loss": 1.8694, + "step": 28012000 + }, + { + "epoch": 81.08, + "learning_rate": 9.472206141163394e-06, + "loss": 1.8293, + "step": 28012500 + }, + { + "epoch": 81.09, + "learning_rate": 9.471482493516118e-06, + "loss": 1.8515, + "step": 28013000 + }, + { + "epoch": 81.09, + "learning_rate": 9.47075884586884e-06, + "loss": 1.8344, + "step": 28013500 + }, + { + "epoch": 81.09, + "learning_rate": 9.470035198221564e-06, + "loss": 1.8182, + "step": 28014000 + }, + { + "epoch": 81.09, + "learning_rate": 9.469311550574288e-06, + "loss": 1.8183, + "step": 28014500 + }, + { + "epoch": 81.09, + "learning_rate": 9.468589350222305e-06, + "loss": 1.8361, + "step": 28015000 + }, + { + "epoch": 81.09, + "learning_rate": 9.467865702575028e-06, + "loss": 1.8372, + "step": 28015500 + }, + { + "epoch": 81.09, + "learning_rate": 9.467142054927752e-06, + "loss": 1.8461, + "step": 28016000 + }, + { + "epoch": 81.1, + "learning_rate": 9.466418407280476e-06, + "loss": 1.8309, + "step": 28016500 + }, + { + "epoch": 81.1, + "learning_rate": 9.465696206928493e-06, + "loss": 1.8554, + "step": 28017000 + }, + { + "epoch": 81.1, + "learning_rate": 9.464972559281215e-06, + "loss": 1.8348, + "step": 28017500 + }, + { + "epoch": 81.1, + "learning_rate": 9.464248911633939e-06, + "loss": 1.8345, + "step": 28018000 + }, + { + "epoch": 81.1, + "learning_rate": 9.463525263986663e-06, + "loss": 1.826, + "step": 28018500 + }, + { + "epoch": 81.1, + "learning_rate": 9.46280306363468e-06, + "loss": 1.8249, + "step": 28019000 + }, + { + "epoch": 81.1, + "learning_rate": 9.462079415987402e-06, + "loss": 1.8342, + "step": 28019500 + }, + { + "epoch": 81.11, + "learning_rate": 9.461355768340126e-06, + "loss": 1.8358, + "step": 28020000 + }, + { + "epoch": 81.11, + "learning_rate": 9.46063212069285e-06, + "loss": 1.8147, + "step": 28020500 + }, + { + "epoch": 81.11, + "learning_rate": 9.459908473045572e-06, + "loss": 1.829, + "step": 28021000 + }, + { + "epoch": 81.11, + "learning_rate": 9.459184825398296e-06, + "loss": 1.8359, + "step": 28021500 + }, + { + "epoch": 81.11, + "learning_rate": 9.458462625046315e-06, + "loss": 1.8706, + "step": 28022000 + }, + { + "epoch": 81.11, + "learning_rate": 9.457738977399038e-06, + "loss": 1.8516, + "step": 28022500 + }, + { + "epoch": 81.12, + "learning_rate": 9.45701532975176e-06, + "loss": 1.8394, + "step": 28023000 + }, + { + "epoch": 81.12, + "learning_rate": 9.456291682104484e-06, + "loss": 1.8269, + "step": 28023500 + }, + { + "epoch": 81.12, + "learning_rate": 9.455569481752503e-06, + "loss": 1.8369, + "step": 28024000 + }, + { + "epoch": 81.12, + "learning_rate": 9.454845834105225e-06, + "loss": 1.8259, + "step": 28024500 + }, + { + "epoch": 81.12, + "learning_rate": 9.454122186457947e-06, + "loss": 1.8331, + "step": 28025000 + }, + { + "epoch": 81.12, + "learning_rate": 9.453398538810671e-06, + "loss": 1.8491, + "step": 28025500 + }, + { + "epoch": 81.12, + "learning_rate": 9.45267633845869e-06, + "loss": 1.8327, + "step": 28026000 + }, + { + "epoch": 81.13, + "learning_rate": 9.451952690811412e-06, + "loss": 1.8324, + "step": 28026500 + }, + { + "epoch": 81.13, + "learning_rate": 9.451229043164134e-06, + "loss": 1.8392, + "step": 28027000 + }, + { + "epoch": 81.13, + "learning_rate": 9.450505395516858e-06, + "loss": 1.8694, + "step": 28027500 + }, + { + "epoch": 81.13, + "learning_rate": 9.449781747869582e-06, + "loss": 1.8403, + "step": 28028000 + }, + { + "epoch": 81.13, + "learning_rate": 9.4490595475176e-06, + "loss": 1.8262, + "step": 28028500 + }, + { + "epoch": 81.13, + "learning_rate": 9.448337347165617e-06, + "loss": 1.8276, + "step": 28029000 + }, + { + "epoch": 81.13, + "learning_rate": 9.44761369951834e-06, + "loss": 1.8106, + "step": 28029500 + }, + { + "epoch": 81.14, + "learning_rate": 9.446890051871065e-06, + "loss": 1.8599, + "step": 28030000 + }, + { + "epoch": 81.14, + "learning_rate": 9.446166404223787e-06, + "loss": 1.8387, + "step": 28030500 + }, + { + "epoch": 81.14, + "learning_rate": 9.44544275657651e-06, + "loss": 1.8438, + "step": 28031000 + }, + { + "epoch": 81.14, + "learning_rate": 9.444719108929235e-06, + "loss": 1.8542, + "step": 28031500 + }, + { + "epoch": 81.14, + "learning_rate": 9.443995461281957e-06, + "loss": 1.8509, + "step": 28032000 + }, + { + "epoch": 81.14, + "learning_rate": 9.44327181363468e-06, + "loss": 1.8455, + "step": 28032500 + }, + { + "epoch": 81.14, + "learning_rate": 9.442548165987403e-06, + "loss": 1.8615, + "step": 28033000 + }, + { + "epoch": 81.15, + "learning_rate": 9.441825965635422e-06, + "loss": 1.832, + "step": 28033500 + }, + { + "epoch": 81.15, + "learning_rate": 9.441102317988144e-06, + "loss": 1.8418, + "step": 28034000 + }, + { + "epoch": 81.15, + "learning_rate": 9.440378670340867e-06, + "loss": 1.8403, + "step": 28034500 + }, + { + "epoch": 81.15, + "learning_rate": 9.43965502269359e-06, + "loss": 1.8572, + "step": 28035000 + }, + { + "epoch": 81.15, + "learning_rate": 9.43893282234161e-06, + "loss": 1.8228, + "step": 28035500 + }, + { + "epoch": 81.15, + "learning_rate": 9.438209174694332e-06, + "loss": 1.8609, + "step": 28036000 + }, + { + "epoch": 81.15, + "learning_rate": 9.437485527047054e-06, + "loss": 1.8482, + "step": 28036500 + }, + { + "epoch": 81.16, + "learning_rate": 9.436761879399778e-06, + "loss": 1.8307, + "step": 28037000 + }, + { + "epoch": 81.16, + "learning_rate": 9.436038231752502e-06, + "loss": 1.8225, + "step": 28037500 + }, + { + "epoch": 81.16, + "learning_rate": 9.435314584105224e-06, + "loss": 1.8357, + "step": 28038000 + }, + { + "epoch": 81.16, + "learning_rate": 9.434590936457948e-06, + "loss": 1.8271, + "step": 28038500 + }, + { + "epoch": 81.16, + "learning_rate": 9.433867288810672e-06, + "loss": 1.8505, + "step": 28039000 + }, + { + "epoch": 81.16, + "learning_rate": 9.433143641163394e-06, + "loss": 1.8122, + "step": 28039500 + }, + { + "epoch": 81.16, + "learning_rate": 9.432419993516118e-06, + "loss": 1.86, + "step": 28040000 + }, + { + "epoch": 81.17, + "learning_rate": 9.43169634586884e-06, + "loss": 1.8237, + "step": 28040500 + }, + { + "epoch": 81.17, + "learning_rate": 9.430972698221564e-06, + "loss": 1.857, + "step": 28041000 + }, + { + "epoch": 81.17, + "learning_rate": 9.430250497869581e-06, + "loss": 1.8401, + "step": 28041500 + }, + { + "epoch": 81.17, + "learning_rate": 9.429526850222305e-06, + "loss": 1.8803, + "step": 28042000 + }, + { + "epoch": 81.17, + "learning_rate": 9.42880320257503e-06, + "loss": 1.8237, + "step": 28042500 + }, + { + "epoch": 81.17, + "learning_rate": 9.428079554927752e-06, + "loss": 1.8372, + "step": 28043000 + }, + { + "epoch": 81.17, + "learning_rate": 9.427355907280474e-06, + "loss": 1.8371, + "step": 28043500 + }, + { + "epoch": 81.18, + "learning_rate": 9.426632259633198e-06, + "loss": 1.8199, + "step": 28044000 + }, + { + "epoch": 81.18, + "learning_rate": 9.425908611985922e-06, + "loss": 1.8087, + "step": 28044500 + }, + { + "epoch": 81.18, + "learning_rate": 9.425184964338644e-06, + "loss": 1.8347, + "step": 28045000 + }, + { + "epoch": 81.18, + "learning_rate": 9.424461316691368e-06, + "loss": 1.8429, + "step": 28045500 + }, + { + "epoch": 81.18, + "learning_rate": 9.423739116339385e-06, + "loss": 1.8317, + "step": 28046000 + }, + { + "epoch": 81.18, + "learning_rate": 9.423015468692109e-06, + "loss": 1.8337, + "step": 28046500 + }, + { + "epoch": 81.18, + "learning_rate": 9.422291821044831e-06, + "loss": 1.8448, + "step": 28047000 + }, + { + "epoch": 81.19, + "learning_rate": 9.42156962069285e-06, + "loss": 1.8472, + "step": 28047500 + }, + { + "epoch": 81.19, + "learning_rate": 9.420845973045572e-06, + "loss": 1.8512, + "step": 28048000 + }, + { + "epoch": 81.19, + "learning_rate": 9.420122325398296e-06, + "loss": 1.8322, + "step": 28048500 + }, + { + "epoch": 81.19, + "learning_rate": 9.419398677751019e-06, + "loss": 1.824, + "step": 28049000 + }, + { + "epoch": 81.19, + "learning_rate": 9.418676477399037e-06, + "loss": 1.8608, + "step": 28049500 + }, + { + "epoch": 81.19, + "learning_rate": 9.41795282975176e-06, + "loss": 1.8263, + "step": 28050000 + }, + { + "epoch": 81.19, + "learning_rate": 9.417230629399779e-06, + "loss": 1.8285, + "step": 28050500 + }, + { + "epoch": 81.2, + "learning_rate": 9.416506981752501e-06, + "loss": 1.8364, + "step": 28051000 + }, + { + "epoch": 81.2, + "learning_rate": 9.415783334105225e-06, + "loss": 1.8554, + "step": 28051500 + }, + { + "epoch": 81.2, + "learning_rate": 9.415059686457949e-06, + "loss": 1.8422, + "step": 28052000 + }, + { + "epoch": 81.2, + "learning_rate": 9.414336038810671e-06, + "loss": 1.8272, + "step": 28052500 + }, + { + "epoch": 81.2, + "learning_rate": 9.413612391163395e-06, + "loss": 1.8391, + "step": 28053000 + }, + { + "epoch": 81.2, + "learning_rate": 9.412888743516117e-06, + "loss": 1.839, + "step": 28053500 + }, + { + "epoch": 81.2, + "learning_rate": 9.412166543164136e-06, + "loss": 1.7969, + "step": 28054000 + }, + { + "epoch": 81.21, + "learning_rate": 9.411442895516858e-06, + "loss": 1.8308, + "step": 28054500 + }, + { + "epoch": 81.21, + "learning_rate": 9.410719247869582e-06, + "loss": 1.8408, + "step": 28055000 + }, + { + "epoch": 81.21, + "learning_rate": 9.409995600222304e-06, + "loss": 1.8399, + "step": 28055500 + }, + { + "epoch": 81.21, + "learning_rate": 9.409271952575028e-06, + "loss": 1.8243, + "step": 28056000 + }, + { + "epoch": 81.21, + "learning_rate": 9.40854830492775e-06, + "loss": 1.8401, + "step": 28056500 + }, + { + "epoch": 81.21, + "learning_rate": 9.407824657280475e-06, + "loss": 1.8363, + "step": 28057000 + }, + { + "epoch": 81.21, + "learning_rate": 9.407102456928492e-06, + "loss": 1.8535, + "step": 28057500 + }, + { + "epoch": 81.22, + "learning_rate": 9.406378809281216e-06, + "loss": 1.873, + "step": 28058000 + }, + { + "epoch": 81.22, + "learning_rate": 9.40565516163394e-06, + "loss": 1.8557, + "step": 28058500 + }, + { + "epoch": 81.22, + "learning_rate": 9.404931513986662e-06, + "loss": 1.8136, + "step": 28059000 + }, + { + "epoch": 81.22, + "learning_rate": 9.404207866339386e-06, + "loss": 1.8438, + "step": 28059500 + }, + { + "epoch": 81.22, + "learning_rate": 9.403484218692108e-06, + "loss": 1.8337, + "step": 28060000 + }, + { + "epoch": 81.22, + "learning_rate": 9.402760571044832e-06, + "loss": 1.843, + "step": 28060500 + }, + { + "epoch": 81.23, + "learning_rate": 9.402036923397554e-06, + "loss": 1.8601, + "step": 28061000 + }, + { + "epoch": 81.23, + "learning_rate": 9.401313275750278e-06, + "loss": 1.858, + "step": 28061500 + }, + { + "epoch": 81.23, + "learning_rate": 9.400589628103002e-06, + "loss": 1.8331, + "step": 28062000 + }, + { + "epoch": 81.23, + "learning_rate": 9.39986742775102e-06, + "loss": 1.8421, + "step": 28062500 + }, + { + "epoch": 81.23, + "learning_rate": 9.399143780103743e-06, + "loss": 1.8214, + "step": 28063000 + }, + { + "epoch": 81.23, + "learning_rate": 9.398420132456465e-06, + "loss": 1.8365, + "step": 28063500 + }, + { + "epoch": 81.23, + "learning_rate": 9.39769648480919e-06, + "loss": 1.8491, + "step": 28064000 + }, + { + "epoch": 81.24, + "learning_rate": 9.396974284457207e-06, + "loss": 1.8582, + "step": 28064500 + }, + { + "epoch": 81.24, + "learning_rate": 9.396252084105224e-06, + "loss": 1.8318, + "step": 28065000 + }, + { + "epoch": 81.24, + "learning_rate": 9.395528436457948e-06, + "loss": 1.8149, + "step": 28065500 + }, + { + "epoch": 81.24, + "learning_rate": 9.394804788810672e-06, + "loss": 1.8139, + "step": 28066000 + }, + { + "epoch": 81.24, + "learning_rate": 9.394082588458689e-06, + "loss": 1.8591, + "step": 28066500 + }, + { + "epoch": 81.24, + "learning_rate": 9.393358940811411e-06, + "loss": 1.8344, + "step": 28067000 + }, + { + "epoch": 81.24, + "learning_rate": 9.392635293164135e-06, + "loss": 1.8256, + "step": 28067500 + }, + { + "epoch": 81.25, + "learning_rate": 9.391911645516859e-06, + "loss": 1.8287, + "step": 28068000 + }, + { + "epoch": 81.25, + "learning_rate": 9.391187997869581e-06, + "loss": 1.808, + "step": 28068500 + }, + { + "epoch": 81.25, + "learning_rate": 9.390464350222305e-06, + "loss": 1.833, + "step": 28069000 + }, + { + "epoch": 81.25, + "learning_rate": 9.38974070257503e-06, + "loss": 1.831, + "step": 28069500 + }, + { + "epoch": 81.25, + "learning_rate": 9.389017054927751e-06, + "loss": 1.8145, + "step": 28070000 + }, + { + "epoch": 81.25, + "learning_rate": 9.388293407280474e-06, + "loss": 1.8608, + "step": 28070500 + }, + { + "epoch": 81.25, + "learning_rate": 9.387569759633198e-06, + "loss": 1.8501, + "step": 28071000 + }, + { + "epoch": 81.26, + "learning_rate": 9.386846111985922e-06, + "loss": 1.8216, + "step": 28071500 + }, + { + "epoch": 81.26, + "learning_rate": 9.386122464338644e-06, + "loss": 1.8326, + "step": 28072000 + }, + { + "epoch": 81.26, + "learning_rate": 9.385398816691368e-06, + "loss": 1.8662, + "step": 28072500 + }, + { + "epoch": 81.26, + "learning_rate": 9.384675169044092e-06, + "loss": 1.8157, + "step": 28073000 + }, + { + "epoch": 81.26, + "learning_rate": 9.383952968692109e-06, + "loss": 1.8315, + "step": 28073500 + }, + { + "epoch": 81.26, + "learning_rate": 9.383230768340126e-06, + "loss": 1.8216, + "step": 28074000 + }, + { + "epoch": 81.26, + "learning_rate": 9.38250712069285e-06, + "loss": 1.828, + "step": 28074500 + }, + { + "epoch": 81.27, + "learning_rate": 9.381783473045572e-06, + "loss": 1.8481, + "step": 28075000 + }, + { + "epoch": 81.27, + "learning_rate": 9.381059825398296e-06, + "loss": 1.8319, + "step": 28075500 + }, + { + "epoch": 81.27, + "learning_rate": 9.380336177751018e-06, + "loss": 1.8398, + "step": 28076000 + }, + { + "epoch": 81.27, + "learning_rate": 9.379612530103742e-06, + "loss": 1.8358, + "step": 28076500 + }, + { + "epoch": 81.27, + "learning_rate": 9.378888882456466e-06, + "loss": 1.8443, + "step": 28077000 + }, + { + "epoch": 81.27, + "learning_rate": 9.378165234809189e-06, + "loss": 1.8221, + "step": 28077500 + }, + { + "epoch": 81.27, + "learning_rate": 9.377441587161912e-06, + "loss": 1.8341, + "step": 28078000 + }, + { + "epoch": 81.28, + "learning_rate": 9.376717939514636e-06, + "loss": 1.8383, + "step": 28078500 + }, + { + "epoch": 81.28, + "learning_rate": 9.375995739162654e-06, + "loss": 1.8397, + "step": 28079000 + }, + { + "epoch": 81.28, + "learning_rate": 9.375272091515376e-06, + "loss": 1.8399, + "step": 28079500 + }, + { + "epoch": 81.28, + "learning_rate": 9.3745484438681e-06, + "loss": 1.8107, + "step": 28080000 + }, + { + "epoch": 81.28, + "learning_rate": 9.373824796220824e-06, + "loss": 1.8307, + "step": 28080500 + }, + { + "epoch": 81.28, + "learning_rate": 9.373101148573546e-06, + "loss": 1.8677, + "step": 28081000 + }, + { + "epoch": 81.28, + "learning_rate": 9.372378948221563e-06, + "loss": 1.8286, + "step": 28081500 + }, + { + "epoch": 81.29, + "learning_rate": 9.371655300574287e-06, + "loss": 1.8202, + "step": 28082000 + }, + { + "epoch": 81.29, + "learning_rate": 9.370931652927011e-06, + "loss": 1.8226, + "step": 28082500 + }, + { + "epoch": 81.29, + "learning_rate": 9.370208005279733e-06, + "loss": 1.8461, + "step": 28083000 + }, + { + "epoch": 81.29, + "learning_rate": 9.369484357632457e-06, + "loss": 1.8176, + "step": 28083500 + }, + { + "epoch": 81.29, + "learning_rate": 9.368762157280474e-06, + "loss": 1.8386, + "step": 28084000 + }, + { + "epoch": 81.29, + "learning_rate": 9.368038509633198e-06, + "loss": 1.8385, + "step": 28084500 + }, + { + "epoch": 81.29, + "learning_rate": 9.36731486198592e-06, + "loss": 1.8218, + "step": 28085000 + }, + { + "epoch": 81.3, + "learning_rate": 9.366591214338645e-06, + "loss": 1.8435, + "step": 28085500 + }, + { + "epoch": 81.3, + "learning_rate": 9.365867566691368e-06, + "loss": 1.8448, + "step": 28086000 + }, + { + "epoch": 81.3, + "learning_rate": 9.36514391904409e-06, + "loss": 1.8555, + "step": 28086500 + }, + { + "epoch": 81.3, + "learning_rate": 9.364420271396813e-06, + "loss": 1.8171, + "step": 28087000 + }, + { + "epoch": 81.3, + "learning_rate": 9.363698071044832e-06, + "loss": 1.8133, + "step": 28087500 + }, + { + "epoch": 81.3, + "learning_rate": 9.362974423397556e-06, + "loss": 1.8265, + "step": 28088000 + }, + { + "epoch": 81.3, + "learning_rate": 9.362250775750278e-06, + "loss": 1.838, + "step": 28088500 + }, + { + "epoch": 81.31, + "learning_rate": 9.361528575398295e-06, + "loss": 1.8439, + "step": 28089000 + }, + { + "epoch": 81.31, + "learning_rate": 9.36080492775102e-06, + "loss": 1.8412, + "step": 28089500 + }, + { + "epoch": 81.31, + "learning_rate": 9.360081280103743e-06, + "loss": 1.865, + "step": 28090000 + }, + { + "epoch": 81.31, + "learning_rate": 9.359357632456465e-06, + "loss": 1.8537, + "step": 28090500 + }, + { + "epoch": 81.31, + "learning_rate": 9.358633984809188e-06, + "loss": 1.8527, + "step": 28091000 + }, + { + "epoch": 81.31, + "learning_rate": 9.357911784457207e-06, + "loss": 1.842, + "step": 28091500 + }, + { + "epoch": 81.31, + "learning_rate": 9.35718813680993e-06, + "loss": 1.823, + "step": 28092000 + }, + { + "epoch": 81.32, + "learning_rate": 9.356464489162653e-06, + "loss": 1.8337, + "step": 28092500 + }, + { + "epoch": 81.32, + "learning_rate": 9.355740841515377e-06, + "loss": 1.8205, + "step": 28093000 + }, + { + "epoch": 81.32, + "learning_rate": 9.3550171938681e-06, + "loss": 1.8276, + "step": 28093500 + }, + { + "epoch": 81.32, + "learning_rate": 9.354293546220823e-06, + "loss": 1.8425, + "step": 28094000 + }, + { + "epoch": 81.32, + "learning_rate": 9.353569898573545e-06, + "loss": 1.8421, + "step": 28094500 + }, + { + "epoch": 81.32, + "learning_rate": 9.352847698221564e-06, + "loss": 1.8273, + "step": 28095000 + }, + { + "epoch": 81.32, + "learning_rate": 9.352124050574288e-06, + "loss": 1.853, + "step": 28095500 + }, + { + "epoch": 81.33, + "learning_rate": 9.35140040292701e-06, + "loss": 1.8452, + "step": 28096000 + }, + { + "epoch": 81.33, + "learning_rate": 9.350676755279732e-06, + "loss": 1.845, + "step": 28096500 + }, + { + "epoch": 81.33, + "learning_rate": 9.349953107632458e-06, + "loss": 1.8544, + "step": 28097000 + }, + { + "epoch": 81.33, + "learning_rate": 9.34922945998518e-06, + "loss": 1.8461, + "step": 28097500 + }, + { + "epoch": 81.33, + "learning_rate": 9.348505812337902e-06, + "loss": 1.8449, + "step": 28098000 + }, + { + "epoch": 81.33, + "learning_rate": 9.347782164690626e-06, + "loss": 1.828, + "step": 28098500 + }, + { + "epoch": 81.34, + "learning_rate": 9.34705851704335e-06, + "loss": 1.8221, + "step": 28099000 + }, + { + "epoch": 81.34, + "learning_rate": 9.346336316691368e-06, + "loss": 1.841, + "step": 28099500 + }, + { + "epoch": 81.34, + "learning_rate": 9.34561266904409e-06, + "loss": 1.8598, + "step": 28100000 + }, + { + "epoch": 81.34, + "learning_rate": 9.344889021396815e-06, + "loss": 1.8421, + "step": 28100500 + }, + { + "epoch": 81.34, + "learning_rate": 9.344165373749538e-06, + "loss": 1.8374, + "step": 28101000 + }, + { + "epoch": 81.34, + "learning_rate": 9.34344172610226e-06, + "loss": 1.8507, + "step": 28101500 + }, + { + "epoch": 81.34, + "learning_rate": 9.342718078454984e-06, + "loss": 1.849, + "step": 28102000 + }, + { + "epoch": 81.35, + "learning_rate": 9.341997325398296e-06, + "loss": 1.8547, + "step": 28102500 + }, + { + "epoch": 81.35, + "learning_rate": 9.34127367775102e-06, + "loss": 1.8373, + "step": 28103000 + }, + { + "epoch": 81.35, + "learning_rate": 9.340550030103742e-06, + "loss": 1.8419, + "step": 28103500 + }, + { + "epoch": 81.35, + "learning_rate": 9.339826382456464e-06, + "loss": 1.808, + "step": 28104000 + }, + { + "epoch": 81.35, + "learning_rate": 9.33910273480919e-06, + "loss": 1.852, + "step": 28104500 + }, + { + "epoch": 81.35, + "learning_rate": 9.338379087161912e-06, + "loss": 1.8363, + "step": 28105000 + }, + { + "epoch": 81.35, + "learning_rate": 9.337655439514635e-06, + "loss": 1.8413, + "step": 28105500 + }, + { + "epoch": 81.36, + "learning_rate": 9.336931791867358e-06, + "loss": 1.8502, + "step": 28106000 + }, + { + "epoch": 81.36, + "learning_rate": 9.336208144220082e-06, + "loss": 1.8622, + "step": 28106500 + }, + { + "epoch": 81.36, + "learning_rate": 9.335484496572805e-06, + "loss": 1.8514, + "step": 28107000 + }, + { + "epoch": 81.36, + "learning_rate": 9.334762296220822e-06, + "loss": 1.8561, + "step": 28107500 + }, + { + "epoch": 81.36, + "learning_rate": 9.334038648573548e-06, + "loss": 1.8254, + "step": 28108000 + }, + { + "epoch": 81.36, + "learning_rate": 9.33331500092627e-06, + "loss": 1.8319, + "step": 28108500 + }, + { + "epoch": 81.36, + "learning_rate": 9.332591353278992e-06, + "loss": 1.8358, + "step": 28109000 + }, + { + "epoch": 81.37, + "learning_rate": 9.331867705631716e-06, + "loss": 1.8403, + "step": 28109500 + }, + { + "epoch": 81.37, + "learning_rate": 9.331145505279735e-06, + "loss": 1.8545, + "step": 28110000 + }, + { + "epoch": 81.37, + "learning_rate": 9.330421857632457e-06, + "loss": 1.8409, + "step": 28110500 + }, + { + "epoch": 81.37, + "learning_rate": 9.329699657280474e-06, + "loss": 1.8493, + "step": 28111000 + }, + { + "epoch": 81.37, + "learning_rate": 9.328976009633197e-06, + "loss": 1.8138, + "step": 28111500 + }, + { + "epoch": 81.37, + "learning_rate": 9.328252361985922e-06, + "loss": 1.8249, + "step": 28112000 + }, + { + "epoch": 81.37, + "learning_rate": 9.327528714338644e-06, + "loss": 1.8348, + "step": 28112500 + }, + { + "epoch": 81.38, + "learning_rate": 9.326805066691367e-06, + "loss": 1.8528, + "step": 28113000 + }, + { + "epoch": 81.38, + "learning_rate": 9.326081419044092e-06, + "loss": 1.8142, + "step": 28113500 + }, + { + "epoch": 81.38, + "learning_rate": 9.325357771396815e-06, + "loss": 1.8553, + "step": 28114000 + }, + { + "epoch": 81.38, + "learning_rate": 9.324634123749537e-06, + "loss": 1.8281, + "step": 28114500 + }, + { + "epoch": 81.38, + "learning_rate": 9.32391047610226e-06, + "loss": 1.855, + "step": 28115000 + }, + { + "epoch": 81.38, + "learning_rate": 9.323186828454985e-06, + "loss": 1.8459, + "step": 28115500 + }, + { + "epoch": 81.38, + "learning_rate": 9.322463180807707e-06, + "loss": 1.8369, + "step": 28116000 + }, + { + "epoch": 81.39, + "learning_rate": 9.321739533160429e-06, + "loss": 1.8505, + "step": 28116500 + }, + { + "epoch": 81.39, + "learning_rate": 9.321015885513155e-06, + "loss": 1.8331, + "step": 28117000 + }, + { + "epoch": 81.39, + "learning_rate": 9.320293685161172e-06, + "loss": 1.8412, + "step": 28117500 + }, + { + "epoch": 81.39, + "learning_rate": 9.31957148480919e-06, + "loss": 1.8537, + "step": 28118000 + }, + { + "epoch": 81.39, + "learning_rate": 9.318849284457206e-06, + "loss": 1.8511, + "step": 28118500 + }, + { + "epoch": 81.39, + "learning_rate": 9.31812563680993e-06, + "loss": 1.8571, + "step": 28119000 + }, + { + "epoch": 81.39, + "learning_rate": 9.317404883753243e-06, + "loss": 1.8292, + "step": 28119500 + }, + { + "epoch": 81.4, + "learning_rate": 9.316681236105967e-06, + "loss": 1.8141, + "step": 28120000 + }, + { + "epoch": 81.4, + "learning_rate": 9.315957588458689e-06, + "loss": 1.8402, + "step": 28120500 + }, + { + "epoch": 81.4, + "learning_rate": 9.315235388106706e-06, + "loss": 1.8458, + "step": 28121000 + }, + { + "epoch": 81.4, + "learning_rate": 9.31451174045943e-06, + "loss": 1.8231, + "step": 28121500 + }, + { + "epoch": 81.4, + "learning_rate": 9.313788092812154e-06, + "loss": 1.8341, + "step": 28122000 + }, + { + "epoch": 81.4, + "learning_rate": 9.313064445164876e-06, + "loss": 1.8655, + "step": 28122500 + }, + { + "epoch": 81.4, + "learning_rate": 9.312340797517598e-06, + "loss": 1.8107, + "step": 28123000 + }, + { + "epoch": 81.41, + "learning_rate": 9.311617149870324e-06, + "loss": 1.8444, + "step": 28123500 + }, + { + "epoch": 81.41, + "learning_rate": 9.310893502223046e-06, + "loss": 1.8062, + "step": 28124000 + }, + { + "epoch": 81.41, + "learning_rate": 9.310169854575768e-06, + "loss": 1.8626, + "step": 28124500 + }, + { + "epoch": 81.41, + "learning_rate": 9.309446206928492e-06, + "loss": 1.8364, + "step": 28125000 + }, + { + "epoch": 81.41, + "learning_rate": 9.308722559281216e-06, + "loss": 1.8458, + "step": 28125500 + }, + { + "epoch": 81.41, + "learning_rate": 9.307998911633939e-06, + "loss": 1.8453, + "step": 28126000 + }, + { + "epoch": 81.41, + "learning_rate": 9.307276711281956e-06, + "loss": 1.8377, + "step": 28126500 + }, + { + "epoch": 81.42, + "learning_rate": 9.30655306363468e-06, + "loss": 1.8458, + "step": 28127000 + }, + { + "epoch": 81.42, + "learning_rate": 9.305829415987404e-06, + "loss": 1.8562, + "step": 28127500 + }, + { + "epoch": 81.42, + "learning_rate": 9.305105768340126e-06, + "loss": 1.8492, + "step": 28128000 + }, + { + "epoch": 81.42, + "learning_rate": 9.30438212069285e-06, + "loss": 1.8516, + "step": 28128500 + }, + { + "epoch": 81.42, + "learning_rate": 9.303658473045574e-06, + "loss": 1.8426, + "step": 28129000 + }, + { + "epoch": 81.42, + "learning_rate": 9.302934825398296e-06, + "loss": 1.8444, + "step": 28129500 + }, + { + "epoch": 81.42, + "learning_rate": 9.302211177751018e-06, + "loss": 1.833, + "step": 28130000 + }, + { + "epoch": 81.43, + "learning_rate": 9.301487530103744e-06, + "loss": 1.821, + "step": 28130500 + }, + { + "epoch": 81.43, + "learning_rate": 9.300765329751761e-06, + "loss": 1.8591, + "step": 28131000 + }, + { + "epoch": 81.43, + "learning_rate": 9.300041682104483e-06, + "loss": 1.8287, + "step": 28131500 + }, + { + "epoch": 81.43, + "learning_rate": 9.299318034457207e-06, + "loss": 1.8434, + "step": 28132000 + }, + { + "epoch": 81.43, + "learning_rate": 9.298594386809931e-06, + "loss": 1.8533, + "step": 28132500 + }, + { + "epoch": 81.43, + "learning_rate": 9.297870739162653e-06, + "loss": 1.8507, + "step": 28133000 + }, + { + "epoch": 81.43, + "learning_rate": 9.297147091515376e-06, + "loss": 1.8176, + "step": 28133500 + }, + { + "epoch": 81.44, + "learning_rate": 9.2964234438681e-06, + "loss": 1.8245, + "step": 28134000 + }, + { + "epoch": 81.44, + "learning_rate": 9.295699796220823e-06, + "loss": 1.8493, + "step": 28134500 + }, + { + "epoch": 81.44, + "learning_rate": 9.294976148573546e-06, + "loss": 1.8209, + "step": 28135000 + }, + { + "epoch": 81.44, + "learning_rate": 9.29425250092627e-06, + "loss": 1.843, + "step": 28135500 + }, + { + "epoch": 81.44, + "learning_rate": 9.293528853278994e-06, + "loss": 1.8293, + "step": 28136000 + }, + { + "epoch": 81.44, + "learning_rate": 9.292805205631716e-06, + "loss": 1.8104, + "step": 28136500 + }, + { + "epoch": 81.45, + "learning_rate": 9.29208155798444e-06, + "loss": 1.8752, + "step": 28137000 + }, + { + "epoch": 81.45, + "learning_rate": 9.291359357632457e-06, + "loss": 1.842, + "step": 28137500 + }, + { + "epoch": 81.45, + "learning_rate": 9.290635709985181e-06, + "loss": 1.8064, + "step": 28138000 + }, + { + "epoch": 81.45, + "learning_rate": 9.289912062337903e-06, + "loss": 1.8358, + "step": 28138500 + }, + { + "epoch": 81.45, + "learning_rate": 9.289188414690627e-06, + "loss": 1.813, + "step": 28139000 + }, + { + "epoch": 81.45, + "learning_rate": 9.28846476704335e-06, + "loss": 1.8388, + "step": 28139500 + }, + { + "epoch": 81.45, + "learning_rate": 9.287741119396073e-06, + "loss": 1.8572, + "step": 28140000 + }, + { + "epoch": 81.46, + "learning_rate": 9.287017471748795e-06, + "loss": 1.8594, + "step": 28140500 + }, + { + "epoch": 81.46, + "learning_rate": 9.28629382410152e-06, + "loss": 1.8446, + "step": 28141000 + }, + { + "epoch": 81.46, + "learning_rate": 9.285571623749538e-06, + "loss": 1.8225, + "step": 28141500 + }, + { + "epoch": 81.46, + "learning_rate": 9.28484797610226e-06, + "loss": 1.8487, + "step": 28142000 + }, + { + "epoch": 81.46, + "learning_rate": 9.284124328454983e-06, + "loss": 1.8234, + "step": 28142500 + }, + { + "epoch": 81.46, + "learning_rate": 9.283402128103002e-06, + "loss": 1.8445, + "step": 28143000 + }, + { + "epoch": 81.46, + "learning_rate": 9.282678480455726e-06, + "loss": 1.84, + "step": 28143500 + }, + { + "epoch": 81.47, + "learning_rate": 9.281954832808448e-06, + "loss": 1.846, + "step": 28144000 + }, + { + "epoch": 81.47, + "learning_rate": 9.281231185161172e-06, + "loss": 1.8189, + "step": 28144500 + }, + { + "epoch": 81.47, + "learning_rate": 9.280507537513894e-06, + "loss": 1.8056, + "step": 28145000 + }, + { + "epoch": 81.47, + "learning_rate": 9.279783889866618e-06, + "loss": 1.8407, + "step": 28145500 + }, + { + "epoch": 81.47, + "learning_rate": 9.279061689514635e-06, + "loss": 1.8207, + "step": 28146000 + }, + { + "epoch": 81.47, + "learning_rate": 9.27833804186736e-06, + "loss": 1.8146, + "step": 28146500 + }, + { + "epoch": 81.47, + "learning_rate": 9.277614394220081e-06, + "loss": 1.8609, + "step": 28147000 + }, + { + "epoch": 81.48, + "learning_rate": 9.276890746572805e-06, + "loss": 1.854, + "step": 28147500 + }, + { + "epoch": 81.48, + "learning_rate": 9.276167098925528e-06, + "loss": 1.8391, + "step": 28148000 + }, + { + "epoch": 81.48, + "learning_rate": 9.275443451278252e-06, + "loss": 1.8447, + "step": 28148500 + }, + { + "epoch": 81.48, + "learning_rate": 9.274719803630975e-06, + "loss": 1.801, + "step": 28149000 + }, + { + "epoch": 81.48, + "learning_rate": 9.273996155983698e-06, + "loss": 1.8323, + "step": 28149500 + }, + { + "epoch": 81.48, + "learning_rate": 9.273272508336422e-06, + "loss": 1.8492, + "step": 28150000 + }, + { + "epoch": 81.48, + "learning_rate": 9.272550307984439e-06, + "loss": 1.8455, + "step": 28150500 + }, + { + "epoch": 81.49, + "learning_rate": 9.271826660337163e-06, + "loss": 1.8406, + "step": 28151000 + }, + { + "epoch": 81.49, + "learning_rate": 9.271103012689885e-06, + "loss": 1.8437, + "step": 28151500 + }, + { + "epoch": 81.49, + "learning_rate": 9.270379365042609e-06, + "loss": 1.8462, + "step": 28152000 + }, + { + "epoch": 81.49, + "learning_rate": 9.269655717395333e-06, + "loss": 1.8382, + "step": 28152500 + }, + { + "epoch": 81.49, + "learning_rate": 9.268932069748055e-06, + "loss": 1.8453, + "step": 28153000 + }, + { + "epoch": 81.49, + "learning_rate": 9.268208422100779e-06, + "loss": 1.8517, + "step": 28153500 + }, + { + "epoch": 81.49, + "learning_rate": 9.267486221748796e-06, + "loss": 1.8559, + "step": 28154000 + }, + { + "epoch": 81.5, + "learning_rate": 9.26676257410152e-06, + "loss": 1.8487, + "step": 28154500 + }, + { + "epoch": 81.5, + "learning_rate": 9.266038926454242e-06, + "loss": 1.8384, + "step": 28155000 + }, + { + "epoch": 81.5, + "learning_rate": 9.265315278806966e-06, + "loss": 1.8456, + "step": 28155500 + }, + { + "epoch": 81.5, + "learning_rate": 9.264591631159689e-06, + "loss": 1.8272, + "step": 28156000 + }, + { + "epoch": 81.5, + "learning_rate": 9.263867983512413e-06, + "loss": 1.8412, + "step": 28156500 + }, + { + "epoch": 81.5, + "learning_rate": 9.263144335865136e-06, + "loss": 1.8219, + "step": 28157000 + }, + { + "epoch": 81.5, + "learning_rate": 9.262422135513154e-06, + "loss": 1.8328, + "step": 28157500 + }, + { + "epoch": 81.51, + "learning_rate": 9.261698487865876e-06, + "loss": 1.8457, + "step": 28158000 + }, + { + "epoch": 81.51, + "learning_rate": 9.2609748402186e-06, + "loss": 1.8367, + "step": 28158500 + }, + { + "epoch": 81.51, + "learning_rate": 9.260251192571324e-06, + "loss": 1.8398, + "step": 28159000 + }, + { + "epoch": 81.51, + "learning_rate": 9.259528992219341e-06, + "loss": 1.8051, + "step": 28159500 + }, + { + "epoch": 81.51, + "learning_rate": 9.258805344572063e-06, + "loss": 1.8597, + "step": 28160000 + }, + { + "epoch": 81.51, + "learning_rate": 9.258081696924787e-06, + "loss": 1.8296, + "step": 28160500 + }, + { + "epoch": 81.51, + "learning_rate": 9.257358049277511e-06, + "loss": 1.8271, + "step": 28161000 + }, + { + "epoch": 81.52, + "learning_rate": 9.256634401630233e-06, + "loss": 1.8257, + "step": 28161500 + }, + { + "epoch": 81.52, + "learning_rate": 9.255910753982957e-06, + "loss": 1.819, + "step": 28162000 + }, + { + "epoch": 81.52, + "learning_rate": 9.255188553630975e-06, + "loss": 1.8156, + "step": 28162500 + }, + { + "epoch": 81.52, + "learning_rate": 9.254464905983698e-06, + "loss": 1.8464, + "step": 28163000 + }, + { + "epoch": 81.52, + "learning_rate": 9.25374125833642e-06, + "loss": 1.804, + "step": 28163500 + }, + { + "epoch": 81.52, + "learning_rate": 9.253017610689145e-06, + "loss": 1.839, + "step": 28164000 + }, + { + "epoch": 81.52, + "learning_rate": 9.252293963041869e-06, + "loss": 1.813, + "step": 28164500 + }, + { + "epoch": 81.53, + "learning_rate": 9.251571762689886e-06, + "loss": 1.8297, + "step": 28165000 + }, + { + "epoch": 81.53, + "learning_rate": 9.250848115042608e-06, + "loss": 1.85, + "step": 28165500 + }, + { + "epoch": 81.53, + "learning_rate": 9.250124467395332e-06, + "loss": 1.8398, + "step": 28166000 + }, + { + "epoch": 81.53, + "learning_rate": 9.249400819748056e-06, + "loss": 1.8291, + "step": 28166500 + }, + { + "epoch": 81.53, + "learning_rate": 9.248677172100778e-06, + "loss": 1.818, + "step": 28167000 + }, + { + "epoch": 81.53, + "learning_rate": 9.247953524453502e-06, + "loss": 1.8427, + "step": 28167500 + }, + { + "epoch": 81.53, + "learning_rate": 9.24723132410152e-06, + "loss": 1.8501, + "step": 28168000 + }, + { + "epoch": 81.54, + "learning_rate": 9.246507676454243e-06, + "loss": 1.8394, + "step": 28168500 + }, + { + "epoch": 81.54, + "learning_rate": 9.245784028806965e-06, + "loss": 1.8247, + "step": 28169000 + }, + { + "epoch": 81.54, + "learning_rate": 9.245061828454983e-06, + "loss": 1.8314, + "step": 28169500 + }, + { + "epoch": 81.54, + "learning_rate": 9.244338180807707e-06, + "loss": 1.8543, + "step": 28170000 + }, + { + "epoch": 81.54, + "learning_rate": 9.24361453316043e-06, + "loss": 1.8381, + "step": 28170500 + }, + { + "epoch": 81.54, + "learning_rate": 9.242890885513153e-06, + "loss": 1.8465, + "step": 28171000 + }, + { + "epoch": 81.54, + "learning_rate": 9.242167237865877e-06, + "loss": 1.7891, + "step": 28171500 + }, + { + "epoch": 81.55, + "learning_rate": 9.2414435902186e-06, + "loss": 1.8432, + "step": 28172000 + }, + { + "epoch": 81.55, + "learning_rate": 9.240719942571323e-06, + "loss": 1.8544, + "step": 28172500 + }, + { + "epoch": 81.55, + "learning_rate": 9.239996294924047e-06, + "loss": 1.8346, + "step": 28173000 + }, + { + "epoch": 81.55, + "learning_rate": 9.239274094572064e-06, + "loss": 1.8611, + "step": 28173500 + }, + { + "epoch": 81.55, + "learning_rate": 9.238551894220081e-06, + "loss": 1.8116, + "step": 28174000 + }, + { + "epoch": 81.55, + "learning_rate": 9.237828246572805e-06, + "loss": 1.8579, + "step": 28174500 + }, + { + "epoch": 81.56, + "learning_rate": 9.237104598925527e-06, + "loss": 1.8842, + "step": 28175000 + }, + { + "epoch": 81.56, + "learning_rate": 9.236380951278251e-06, + "loss": 1.8845, + "step": 28175500 + }, + { + "epoch": 81.56, + "learning_rate": 9.23565875092627e-06, + "loss": 1.8406, + "step": 28176000 + }, + { + "epoch": 81.56, + "learning_rate": 9.234935103278993e-06, + "loss": 1.8472, + "step": 28176500 + }, + { + "epoch": 81.56, + "learning_rate": 9.234211455631715e-06, + "loss": 1.8484, + "step": 28177000 + }, + { + "epoch": 81.56, + "learning_rate": 9.233487807984439e-06, + "loss": 1.8392, + "step": 28177500 + }, + { + "epoch": 81.56, + "learning_rate": 9.232764160337163e-06, + "loss": 1.8614, + "step": 28178000 + }, + { + "epoch": 81.57, + "learning_rate": 9.232040512689885e-06, + "loss": 1.8342, + "step": 28178500 + }, + { + "epoch": 81.57, + "learning_rate": 9.231316865042609e-06, + "loss": 1.8176, + "step": 28179000 + }, + { + "epoch": 81.57, + "learning_rate": 9.230593217395333e-06, + "loss": 1.8639, + "step": 28179500 + }, + { + "epoch": 81.57, + "learning_rate": 9.22987101704335e-06, + "loss": 1.8222, + "step": 28180000 + }, + { + "epoch": 81.57, + "learning_rate": 9.229147369396072e-06, + "loss": 1.8237, + "step": 28180500 + }, + { + "epoch": 81.57, + "learning_rate": 9.228423721748796e-06, + "loss": 1.8528, + "step": 28181000 + }, + { + "epoch": 81.57, + "learning_rate": 9.22770007410152e-06, + "loss": 1.8472, + "step": 28181500 + }, + { + "epoch": 81.58, + "learning_rate": 9.226977873749537e-06, + "loss": 1.8501, + "step": 28182000 + }, + { + "epoch": 81.58, + "learning_rate": 9.226255673397555e-06, + "loss": 1.8426, + "step": 28182500 + }, + { + "epoch": 81.58, + "learning_rate": 9.225532025750279e-06, + "loss": 1.8651, + "step": 28183000 + }, + { + "epoch": 81.58, + "learning_rate": 9.224808378103002e-06, + "loss": 1.841, + "step": 28183500 + }, + { + "epoch": 81.58, + "learning_rate": 9.224084730455725e-06, + "loss": 1.8458, + "step": 28184000 + }, + { + "epoch": 81.58, + "learning_rate": 9.223361082808447e-06, + "loss": 1.8507, + "step": 28184500 + }, + { + "epoch": 81.58, + "learning_rate": 9.222637435161171e-06, + "loss": 1.8845, + "step": 28185000 + }, + { + "epoch": 81.59, + "learning_rate": 9.221913787513895e-06, + "loss": 1.8669, + "step": 28185500 + }, + { + "epoch": 81.59, + "learning_rate": 9.221190139866617e-06, + "loss": 1.8852, + "step": 28186000 + }, + { + "epoch": 81.59, + "learning_rate": 9.220466492219341e-06, + "loss": 1.838, + "step": 28186500 + }, + { + "epoch": 81.59, + "learning_rate": 9.219742844572065e-06, + "loss": 1.8563, + "step": 28187000 + }, + { + "epoch": 81.59, + "learning_rate": 9.219019196924787e-06, + "loss": 1.833, + "step": 28187500 + }, + { + "epoch": 81.59, + "learning_rate": 9.21829554927751e-06, + "loss": 1.8407, + "step": 28188000 + }, + { + "epoch": 81.59, + "learning_rate": 9.217573348925528e-06, + "loss": 1.8688, + "step": 28188500 + }, + { + "epoch": 81.6, + "learning_rate": 9.216849701278252e-06, + "loss": 1.8478, + "step": 28189000 + }, + { + "epoch": 81.6, + "learning_rate": 9.216126053630974e-06, + "loss": 1.8268, + "step": 28189500 + }, + { + "epoch": 81.6, + "learning_rate": 9.215402405983697e-06, + "loss": 1.8135, + "step": 28190000 + }, + { + "epoch": 81.6, + "learning_rate": 9.214680205631716e-06, + "loss": 1.844, + "step": 28190500 + }, + { + "epoch": 81.6, + "learning_rate": 9.21395655798444e-06, + "loss": 1.8467, + "step": 28191000 + }, + { + "epoch": 81.6, + "learning_rate": 9.213232910337162e-06, + "loss": 1.8294, + "step": 28191500 + }, + { + "epoch": 81.6, + "learning_rate": 9.212509262689886e-06, + "loss": 1.8465, + "step": 28192000 + }, + { + "epoch": 81.61, + "learning_rate": 9.211787062337903e-06, + "loss": 1.8117, + "step": 28192500 + }, + { + "epoch": 81.61, + "learning_rate": 9.211063414690627e-06, + "loss": 1.8809, + "step": 28193000 + }, + { + "epoch": 81.61, + "learning_rate": 9.210339767043349e-06, + "loss": 1.8351, + "step": 28193500 + }, + { + "epoch": 81.61, + "learning_rate": 9.209616119396073e-06, + "loss": 1.8212, + "step": 28194000 + }, + { + "epoch": 81.61, + "learning_rate": 9.208893919044092e-06, + "loss": 1.8661, + "step": 28194500 + }, + { + "epoch": 81.61, + "learning_rate": 9.208170271396814e-06, + "loss": 1.8602, + "step": 28195000 + }, + { + "epoch": 81.61, + "learning_rate": 9.207446623749536e-06, + "loss": 1.8325, + "step": 28195500 + }, + { + "epoch": 81.62, + "learning_rate": 9.20672297610226e-06, + "loss": 1.8239, + "step": 28196000 + }, + { + "epoch": 81.62, + "learning_rate": 9.205999328454984e-06, + "loss": 1.8615, + "step": 28196500 + }, + { + "epoch": 81.62, + "learning_rate": 9.205275680807707e-06, + "loss": 1.8186, + "step": 28197000 + }, + { + "epoch": 81.62, + "learning_rate": 9.204552033160429e-06, + "loss": 1.8704, + "step": 28197500 + }, + { + "epoch": 81.62, + "learning_rate": 9.203828385513154e-06, + "loss": 1.8306, + "step": 28198000 + }, + { + "epoch": 81.62, + "learning_rate": 9.203104737865877e-06, + "loss": 1.8617, + "step": 28198500 + }, + { + "epoch": 81.62, + "learning_rate": 9.202382537513894e-06, + "loss": 1.8647, + "step": 28199000 + }, + { + "epoch": 81.63, + "learning_rate": 9.201658889866618e-06, + "loss": 1.8524, + "step": 28199500 + }, + { + "epoch": 81.63, + "learning_rate": 9.200936689514637e-06, + "loss": 1.833, + "step": 28200000 + }, + { + "epoch": 81.63, + "learning_rate": 9.200213041867359e-06, + "loss": 1.8235, + "step": 28200500 + }, + { + "epoch": 81.63, + "learning_rate": 9.199489394220081e-06, + "loss": 1.8369, + "step": 28201000 + }, + { + "epoch": 81.63, + "learning_rate": 9.198765746572805e-06, + "loss": 1.8494, + "step": 28201500 + }, + { + "epoch": 81.63, + "learning_rate": 9.198042098925529e-06, + "loss": 1.8471, + "step": 28202000 + }, + { + "epoch": 81.63, + "learning_rate": 9.197319898573546e-06, + "loss": 1.825, + "step": 28202500 + }, + { + "epoch": 81.64, + "learning_rate": 9.196596250926269e-06, + "loss": 1.8174, + "step": 28203000 + }, + { + "epoch": 81.64, + "learning_rate": 9.195872603278992e-06, + "loss": 1.8413, + "step": 28203500 + }, + { + "epoch": 81.64, + "learning_rate": 9.195148955631716e-06, + "loss": 1.8144, + "step": 28204000 + }, + { + "epoch": 81.64, + "learning_rate": 9.194425307984439e-06, + "loss": 1.8482, + "step": 28204500 + }, + { + "epoch": 81.64, + "learning_rate": 9.193701660337163e-06, + "loss": 1.818, + "step": 28205000 + }, + { + "epoch": 81.64, + "learning_rate": 9.192979459985182e-06, + "loss": 1.8226, + "step": 28205500 + }, + { + "epoch": 81.64, + "learning_rate": 9.192255812337904e-06, + "loss": 1.8428, + "step": 28206000 + }, + { + "epoch": 81.65, + "learning_rate": 9.191532164690626e-06, + "loss": 1.8289, + "step": 28206500 + }, + { + "epoch": 81.65, + "learning_rate": 9.19080851704335e-06, + "loss": 1.8424, + "step": 28207000 + }, + { + "epoch": 81.65, + "learning_rate": 9.190086316691369e-06, + "loss": 1.8268, + "step": 28207500 + }, + { + "epoch": 81.65, + "learning_rate": 9.189362669044091e-06, + "loss": 1.8342, + "step": 28208000 + }, + { + "epoch": 81.65, + "learning_rate": 9.188639021396813e-06, + "loss": 1.8551, + "step": 28208500 + }, + { + "epoch": 81.65, + "learning_rate": 9.187915373749537e-06, + "loss": 1.8604, + "step": 28209000 + }, + { + "epoch": 81.65, + "learning_rate": 9.187191726102261e-06, + "loss": 1.837, + "step": 28209500 + }, + { + "epoch": 81.66, + "learning_rate": 9.186468078454983e-06, + "loss": 1.8357, + "step": 28210000 + }, + { + "epoch": 81.66, + "learning_rate": 9.185744430807706e-06, + "loss": 1.8831, + "step": 28210500 + }, + { + "epoch": 81.66, + "learning_rate": 9.185022230455725e-06, + "loss": 1.8531, + "step": 28211000 + }, + { + "epoch": 81.66, + "learning_rate": 9.184298582808449e-06, + "loss": 1.8323, + "step": 28211500 + }, + { + "epoch": 81.66, + "learning_rate": 9.18357493516117e-06, + "loss": 1.8546, + "step": 28212000 + }, + { + "epoch": 81.66, + "learning_rate": 9.182852734809188e-06, + "loss": 1.8336, + "step": 28212500 + }, + { + "epoch": 81.67, + "learning_rate": 9.182129087161914e-06, + "loss": 1.8387, + "step": 28213000 + }, + { + "epoch": 81.67, + "learning_rate": 9.181406886809931e-06, + "loss": 1.8396, + "step": 28213500 + }, + { + "epoch": 81.67, + "learning_rate": 9.180683239162653e-06, + "loss": 1.8457, + "step": 28214000 + }, + { + "epoch": 81.67, + "learning_rate": 9.179959591515375e-06, + "loss": 1.8573, + "step": 28214500 + }, + { + "epoch": 81.67, + "learning_rate": 9.179235943868101e-06, + "loss": 1.8571, + "step": 28215000 + }, + { + "epoch": 81.67, + "learning_rate": 9.178512296220823e-06, + "loss": 1.8531, + "step": 28215500 + }, + { + "epoch": 81.67, + "learning_rate": 9.177788648573545e-06, + "loss": 1.8433, + "step": 28216000 + }, + { + "epoch": 81.68, + "learning_rate": 9.17706500092627e-06, + "loss": 1.8498, + "step": 28216500 + }, + { + "epoch": 81.68, + "learning_rate": 9.176341353278993e-06, + "loss": 1.8575, + "step": 28217000 + }, + { + "epoch": 81.68, + "learning_rate": 9.175617705631716e-06, + "loss": 1.8393, + "step": 28217500 + }, + { + "epoch": 81.68, + "learning_rate": 9.17489405798444e-06, + "loss": 1.8376, + "step": 28218000 + }, + { + "epoch": 81.68, + "learning_rate": 9.174170410337163e-06, + "loss": 1.8307, + "step": 28218500 + }, + { + "epoch": 81.68, + "learning_rate": 9.173446762689886e-06, + "loss": 1.8105, + "step": 28219000 + }, + { + "epoch": 81.68, + "learning_rate": 9.172723115042608e-06, + "loss": 1.8574, + "step": 28219500 + }, + { + "epoch": 81.69, + "learning_rate": 9.171999467395333e-06, + "loss": 1.8685, + "step": 28220000 + }, + { + "epoch": 81.69, + "learning_rate": 9.171275819748056e-06, + "loss": 1.8458, + "step": 28220500 + }, + { + "epoch": 81.69, + "learning_rate": 9.170552172100778e-06, + "loss": 1.8253, + "step": 28221000 + }, + { + "epoch": 81.69, + "learning_rate": 9.169829971748795e-06, + "loss": 1.8266, + "step": 28221500 + }, + { + "epoch": 81.69, + "learning_rate": 9.16910632410152e-06, + "loss": 1.8485, + "step": 28222000 + }, + { + "epoch": 81.69, + "learning_rate": 9.168382676454243e-06, + "loss": 1.8596, + "step": 28222500 + }, + { + "epoch": 81.69, + "learning_rate": 9.167659028806965e-06, + "loss": 1.8404, + "step": 28223000 + }, + { + "epoch": 81.7, + "learning_rate": 9.16693538115969e-06, + "loss": 1.8501, + "step": 28223500 + }, + { + "epoch": 81.7, + "learning_rate": 9.166211733512413e-06, + "loss": 1.8343, + "step": 28224000 + }, + { + "epoch": 81.7, + "learning_rate": 9.16548953316043e-06, + "loss": 1.8374, + "step": 28224500 + }, + { + "epoch": 81.7, + "learning_rate": 9.164765885513153e-06, + "loss": 1.8215, + "step": 28225000 + }, + { + "epoch": 81.7, + "learning_rate": 9.164042237865877e-06, + "loss": 1.8611, + "step": 28225500 + }, + { + "epoch": 81.7, + "learning_rate": 9.1633185902186e-06, + "loss": 1.8223, + "step": 28226000 + }, + { + "epoch": 81.7, + "learning_rate": 9.162596389866618e-06, + "loss": 1.849, + "step": 28226500 + }, + { + "epoch": 81.71, + "learning_rate": 9.161874189514635e-06, + "loss": 1.834, + "step": 28227000 + }, + { + "epoch": 81.71, + "learning_rate": 9.161150541867359e-06, + "loss": 1.855, + "step": 28227500 + }, + { + "epoch": 81.71, + "learning_rate": 9.160426894220083e-06, + "loss": 1.8247, + "step": 28228000 + }, + { + "epoch": 81.71, + "learning_rate": 9.159703246572805e-06, + "loss": 1.843, + "step": 28228500 + }, + { + "epoch": 81.71, + "learning_rate": 9.158979598925527e-06, + "loss": 1.8368, + "step": 28229000 + }, + { + "epoch": 81.71, + "learning_rate": 9.158255951278253e-06, + "loss": 1.8529, + "step": 28229500 + }, + { + "epoch": 81.71, + "learning_rate": 9.157532303630975e-06, + "loss": 1.8475, + "step": 28230000 + }, + { + "epoch": 81.72, + "learning_rate": 9.156808655983697e-06, + "loss": 1.8216, + "step": 28230500 + }, + { + "epoch": 81.72, + "learning_rate": 9.156085008336421e-06, + "loss": 1.8424, + "step": 28231000 + }, + { + "epoch": 81.72, + "learning_rate": 9.15536280798444e-06, + "loss": 1.8436, + "step": 28231500 + }, + { + "epoch": 81.72, + "learning_rate": 9.154639160337162e-06, + "loss": 1.8152, + "step": 28232000 + }, + { + "epoch": 81.72, + "learning_rate": 9.153915512689885e-06, + "loss": 1.8499, + "step": 28232500 + }, + { + "epoch": 81.72, + "learning_rate": 9.153191865042609e-06, + "loss": 1.8385, + "step": 28233000 + }, + { + "epoch": 81.72, + "learning_rate": 9.152468217395333e-06, + "loss": 1.8582, + "step": 28233500 + }, + { + "epoch": 81.73, + "learning_rate": 9.151744569748055e-06, + "loss": 1.8458, + "step": 28234000 + }, + { + "epoch": 81.73, + "learning_rate": 9.151022369396072e-06, + "loss": 1.8448, + "step": 28234500 + }, + { + "epoch": 81.73, + "learning_rate": 9.150298721748796e-06, + "loss": 1.8612, + "step": 28235000 + }, + { + "epoch": 81.73, + "learning_rate": 9.14957507410152e-06, + "loss": 1.8224, + "step": 28235500 + }, + { + "epoch": 81.73, + "learning_rate": 9.148851426454242e-06, + "loss": 1.8421, + "step": 28236000 + }, + { + "epoch": 81.73, + "learning_rate": 9.148129226102261e-06, + "loss": 1.8394, + "step": 28236500 + }, + { + "epoch": 81.73, + "learning_rate": 9.147405578454983e-06, + "loss": 1.8295, + "step": 28237000 + }, + { + "epoch": 81.74, + "learning_rate": 9.146681930807707e-06, + "loss": 1.8248, + "step": 28237500 + }, + { + "epoch": 81.74, + "learning_rate": 9.14595828316043e-06, + "loss": 1.8375, + "step": 28238000 + }, + { + "epoch": 81.74, + "learning_rate": 9.145236082808448e-06, + "loss": 1.8097, + "step": 28238500 + }, + { + "epoch": 81.74, + "learning_rate": 9.144512435161172e-06, + "loss": 1.8277, + "step": 28239000 + }, + { + "epoch": 81.74, + "learning_rate": 9.143788787513895e-06, + "loss": 1.8477, + "step": 28239500 + }, + { + "epoch": 81.74, + "learning_rate": 9.143065139866617e-06, + "loss": 1.8364, + "step": 28240000 + }, + { + "epoch": 81.74, + "learning_rate": 9.14234149221934e-06, + "loss": 1.8456, + "step": 28240500 + }, + { + "epoch": 81.75, + "learning_rate": 9.141617844572065e-06, + "loss": 1.8398, + "step": 28241000 + }, + { + "epoch": 81.75, + "learning_rate": 9.140894196924787e-06, + "loss": 1.8407, + "step": 28241500 + }, + { + "epoch": 81.75, + "learning_rate": 9.140171996572804e-06, + "loss": 1.8201, + "step": 28242000 + }, + { + "epoch": 81.75, + "learning_rate": 9.139448348925528e-06, + "loss": 1.8519, + "step": 28242500 + }, + { + "epoch": 81.75, + "learning_rate": 9.138724701278252e-06, + "loss": 1.8229, + "step": 28243000 + }, + { + "epoch": 81.75, + "learning_rate": 9.13800250092627e-06, + "loss": 1.8368, + "step": 28243500 + }, + { + "epoch": 81.75, + "learning_rate": 9.137278853278993e-06, + "loss": 1.8494, + "step": 28244000 + }, + { + "epoch": 81.76, + "learning_rate": 9.136555205631715e-06, + "loss": 1.8452, + "step": 28244500 + }, + { + "epoch": 81.76, + "learning_rate": 9.13583155798444e-06, + "loss": 1.8461, + "step": 28245000 + }, + { + "epoch": 81.76, + "learning_rate": 9.135107910337162e-06, + "loss": 1.8437, + "step": 28245500 + }, + { + "epoch": 81.76, + "learning_rate": 9.134384262689886e-06, + "loss": 1.8588, + "step": 28246000 + }, + { + "epoch": 81.76, + "learning_rate": 9.13366061504261e-06, + "loss": 1.859, + "step": 28246500 + }, + { + "epoch": 81.76, + "learning_rate": 9.132936967395332e-06, + "loss": 1.8402, + "step": 28247000 + }, + { + "epoch": 81.76, + "learning_rate": 9.132213319748056e-06, + "loss": 1.8495, + "step": 28247500 + }, + { + "epoch": 81.77, + "learning_rate": 9.131489672100778e-06, + "loss": 1.8333, + "step": 28248000 + }, + { + "epoch": 81.77, + "learning_rate": 9.130767471748797e-06, + "loss": 1.8344, + "step": 28248500 + }, + { + "epoch": 81.77, + "learning_rate": 9.130043824101519e-06, + "loss": 1.8592, + "step": 28249000 + }, + { + "epoch": 81.77, + "learning_rate": 9.129320176454243e-06, + "loss": 1.8427, + "step": 28249500 + }, + { + "epoch": 81.77, + "learning_rate": 9.128596528806967e-06, + "loss": 1.8724, + "step": 28250000 + }, + { + "epoch": 81.77, + "learning_rate": 9.127872881159689e-06, + "loss": 1.8168, + "step": 28250500 + }, + { + "epoch": 81.78, + "learning_rate": 9.127149233512413e-06, + "loss": 1.8514, + "step": 28251000 + }, + { + "epoch": 81.78, + "learning_rate": 9.126425585865135e-06, + "loss": 1.8499, + "step": 28251500 + }, + { + "epoch": 81.78, + "learning_rate": 9.12570193821786e-06, + "loss": 1.8595, + "step": 28252000 + }, + { + "epoch": 81.78, + "learning_rate": 9.124979737865876e-06, + "loss": 1.8542, + "step": 28252500 + }, + { + "epoch": 81.78, + "learning_rate": 9.1242560902186e-06, + "loss": 1.8522, + "step": 28253000 + }, + { + "epoch": 81.78, + "learning_rate": 9.123532442571323e-06, + "loss": 1.8477, + "step": 28253500 + }, + { + "epoch": 81.78, + "learning_rate": 9.122808794924047e-06, + "loss": 1.8469, + "step": 28254000 + }, + { + "epoch": 81.79, + "learning_rate": 9.122086594572064e-06, + "loss": 1.8539, + "step": 28254500 + }, + { + "epoch": 81.79, + "learning_rate": 9.121362946924788e-06, + "loss": 1.8225, + "step": 28255000 + }, + { + "epoch": 81.79, + "learning_rate": 9.12063929927751e-06, + "loss": 1.8169, + "step": 28255500 + }, + { + "epoch": 81.79, + "learning_rate": 9.119917098925529e-06, + "loss": 1.8638, + "step": 28256000 + }, + { + "epoch": 81.79, + "learning_rate": 9.119193451278251e-06, + "loss": 1.8439, + "step": 28256500 + }, + { + "epoch": 81.79, + "learning_rate": 9.118469803630975e-06, + "loss": 1.8486, + "step": 28257000 + }, + { + "epoch": 81.79, + "learning_rate": 9.117746155983697e-06, + "loss": 1.8453, + "step": 28257500 + }, + { + "epoch": 81.8, + "learning_rate": 9.117023955631716e-06, + "loss": 1.8318, + "step": 28258000 + }, + { + "epoch": 81.8, + "learning_rate": 9.116300307984438e-06, + "loss": 1.8458, + "step": 28258500 + }, + { + "epoch": 81.8, + "learning_rate": 9.115576660337162e-06, + "loss": 1.8744, + "step": 28259000 + }, + { + "epoch": 81.8, + "learning_rate": 9.114853012689886e-06, + "loss": 1.84, + "step": 28259500 + }, + { + "epoch": 81.8, + "learning_rate": 9.114129365042609e-06, + "loss": 1.8733, + "step": 28260000 + }, + { + "epoch": 81.8, + "learning_rate": 9.113405717395332e-06, + "loss": 1.8493, + "step": 28260500 + }, + { + "epoch": 81.8, + "learning_rate": 9.112682069748055e-06, + "loss": 1.8247, + "step": 28261000 + }, + { + "epoch": 81.81, + "learning_rate": 9.111958422100779e-06, + "loss": 1.841, + "step": 28261500 + }, + { + "epoch": 81.81, + "learning_rate": 9.111236221748796e-06, + "loss": 1.8351, + "step": 28262000 + }, + { + "epoch": 81.81, + "learning_rate": 9.11051257410152e-06, + "loss": 1.8245, + "step": 28262500 + }, + { + "epoch": 81.81, + "learning_rate": 9.109790373749537e-06, + "loss": 1.854, + "step": 28263000 + }, + { + "epoch": 81.81, + "learning_rate": 9.109066726102261e-06, + "loss": 1.8365, + "step": 28263500 + }, + { + "epoch": 81.81, + "learning_rate": 9.108343078454983e-06, + "loss": 1.8241, + "step": 28264000 + }, + { + "epoch": 81.81, + "learning_rate": 9.107619430807707e-06, + "loss": 1.8312, + "step": 28264500 + }, + { + "epoch": 81.82, + "learning_rate": 9.10689578316043e-06, + "loss": 1.8161, + "step": 28265000 + }, + { + "epoch": 81.82, + "learning_rate": 9.106173582808448e-06, + "loss": 1.8163, + "step": 28265500 + }, + { + "epoch": 81.82, + "learning_rate": 9.10544993516117e-06, + "loss": 1.8412, + "step": 28266000 + }, + { + "epoch": 81.82, + "learning_rate": 9.104726287513894e-06, + "loss": 1.8258, + "step": 28266500 + }, + { + "epoch": 81.82, + "learning_rate": 9.104002639866618e-06, + "loss": 1.8133, + "step": 28267000 + }, + { + "epoch": 81.82, + "learning_rate": 9.10327899221934e-06, + "loss": 1.8419, + "step": 28267500 + }, + { + "epoch": 81.82, + "learning_rate": 9.102555344572065e-06, + "loss": 1.8614, + "step": 28268000 + }, + { + "epoch": 81.83, + "learning_rate": 9.101831696924787e-06, + "loss": 1.8831, + "step": 28268500 + }, + { + "epoch": 81.83, + "learning_rate": 9.10110804927751e-06, + "loss": 1.8581, + "step": 28269000 + }, + { + "epoch": 81.83, + "learning_rate": 9.100385848925528e-06, + "loss": 1.8434, + "step": 28269500 + }, + { + "epoch": 81.83, + "learning_rate": 9.099662201278252e-06, + "loss": 1.8293, + "step": 28270000 + }, + { + "epoch": 81.83, + "learning_rate": 9.098938553630974e-06, + "loss": 1.8377, + "step": 28270500 + }, + { + "epoch": 81.83, + "learning_rate": 9.098214905983698e-06, + "loss": 1.835, + "step": 28271000 + }, + { + "epoch": 81.83, + "learning_rate": 9.097492705631715e-06, + "loss": 1.8247, + "step": 28271500 + }, + { + "epoch": 81.84, + "learning_rate": 9.09676905798444e-06, + "loss": 1.8758, + "step": 28272000 + }, + { + "epoch": 81.84, + "learning_rate": 9.096045410337161e-06, + "loss": 1.8288, + "step": 28272500 + }, + { + "epoch": 81.84, + "learning_rate": 9.095321762689885e-06, + "loss": 1.8545, + "step": 28273000 + }, + { + "epoch": 81.84, + "learning_rate": 9.09459811504261e-06, + "loss": 1.812, + "step": 28273500 + }, + { + "epoch": 81.84, + "learning_rate": 9.093874467395332e-06, + "loss": 1.8057, + "step": 28274000 + }, + { + "epoch": 81.84, + "learning_rate": 9.093150819748055e-06, + "loss": 1.8396, + "step": 28274500 + }, + { + "epoch": 81.84, + "learning_rate": 9.09242717210078e-06, + "loss": 1.8454, + "step": 28275000 + }, + { + "epoch": 81.85, + "learning_rate": 9.091704971748797e-06, + "loss": 1.8462, + "step": 28275500 + }, + { + "epoch": 81.85, + "learning_rate": 9.090981324101519e-06, + "loss": 1.8549, + "step": 28276000 + }, + { + "epoch": 81.85, + "learning_rate": 9.090259123749538e-06, + "loss": 1.817, + "step": 28276500 + }, + { + "epoch": 81.85, + "learning_rate": 9.08953547610226e-06, + "loss": 1.8305, + "step": 28277000 + }, + { + "epoch": 81.85, + "learning_rate": 9.088811828454984e-06, + "loss": 1.8378, + "step": 28277500 + }, + { + "epoch": 81.85, + "learning_rate": 9.088089628103001e-06, + "loss": 1.8404, + "step": 28278000 + }, + { + "epoch": 81.85, + "learning_rate": 9.087365980455725e-06, + "loss": 1.8471, + "step": 28278500 + }, + { + "epoch": 81.86, + "learning_rate": 9.086642332808447e-06, + "loss": 1.852, + "step": 28279000 + }, + { + "epoch": 81.86, + "learning_rate": 9.085918685161171e-06, + "loss": 1.8631, + "step": 28279500 + }, + { + "epoch": 81.86, + "learning_rate": 9.085195037513894e-06, + "loss": 1.8263, + "step": 28280000 + }, + { + "epoch": 81.86, + "learning_rate": 9.084471389866618e-06, + "loss": 1.8387, + "step": 28280500 + }, + { + "epoch": 81.86, + "learning_rate": 9.083747742219341e-06, + "loss": 1.8508, + "step": 28281000 + }, + { + "epoch": 81.86, + "learning_rate": 9.083024094572064e-06, + "loss": 1.8476, + "step": 28281500 + }, + { + "epoch": 81.86, + "learning_rate": 9.082300446924788e-06, + "loss": 1.8646, + "step": 28282000 + }, + { + "epoch": 81.87, + "learning_rate": 9.081578246572805e-06, + "loss": 1.8499, + "step": 28282500 + }, + { + "epoch": 81.87, + "learning_rate": 9.080854598925529e-06, + "loss": 1.8195, + "step": 28283000 + }, + { + "epoch": 81.87, + "learning_rate": 9.080130951278251e-06, + "loss": 1.8526, + "step": 28283500 + }, + { + "epoch": 81.87, + "learning_rate": 9.079407303630975e-06, + "loss": 1.8453, + "step": 28284000 + }, + { + "epoch": 81.87, + "learning_rate": 9.078685103278992e-06, + "loss": 1.8636, + "step": 28284500 + }, + { + "epoch": 81.87, + "learning_rate": 9.077962902927011e-06, + "loss": 1.8507, + "step": 28285000 + }, + { + "epoch": 81.87, + "learning_rate": 9.077239255279733e-06, + "loss": 1.8317, + "step": 28285500 + }, + { + "epoch": 81.88, + "learning_rate": 9.07651705492775e-06, + "loss": 1.833, + "step": 28286000 + }, + { + "epoch": 81.88, + "learning_rate": 9.075793407280475e-06, + "loss": 1.8364, + "step": 28286500 + }, + { + "epoch": 81.88, + "learning_rate": 9.075069759633198e-06, + "loss": 1.8689, + "step": 28287000 + }, + { + "epoch": 81.88, + "learning_rate": 9.07434611198592e-06, + "loss": 1.8443, + "step": 28287500 + }, + { + "epoch": 81.88, + "learning_rate": 9.073622464338645e-06, + "loss": 1.8421, + "step": 28288000 + }, + { + "epoch": 81.88, + "learning_rate": 9.072898816691369e-06, + "loss": 1.8328, + "step": 28288500 + }, + { + "epoch": 81.89, + "learning_rate": 9.07217516904409e-06, + "loss": 1.8662, + "step": 28289000 + }, + { + "epoch": 81.89, + "learning_rate": 9.071451521396813e-06, + "loss": 1.8335, + "step": 28289500 + }, + { + "epoch": 81.89, + "learning_rate": 9.070727873749537e-06, + "loss": 1.8362, + "step": 28290000 + }, + { + "epoch": 81.89, + "learning_rate": 9.070004226102261e-06, + "loss": 1.859, + "step": 28290500 + }, + { + "epoch": 81.89, + "learning_rate": 9.069280578454983e-06, + "loss": 1.8322, + "step": 28291000 + }, + { + "epoch": 81.89, + "learning_rate": 9.068556930807707e-06, + "loss": 1.8448, + "step": 28291500 + }, + { + "epoch": 81.89, + "learning_rate": 9.067834730455724e-06, + "loss": 1.8566, + "step": 28292000 + }, + { + "epoch": 81.9, + "learning_rate": 9.067111082808448e-06, + "loss": 1.861, + "step": 28292500 + }, + { + "epoch": 81.9, + "learning_rate": 9.06638743516117e-06, + "loss": 1.8364, + "step": 28293000 + }, + { + "epoch": 81.9, + "learning_rate": 9.065663787513894e-06, + "loss": 1.8363, + "step": 28293500 + }, + { + "epoch": 81.9, + "learning_rate": 9.064943034457207e-06, + "loss": 1.8552, + "step": 28294000 + }, + { + "epoch": 81.9, + "learning_rate": 9.06421938680993e-06, + "loss": 1.8652, + "step": 28294500 + }, + { + "epoch": 81.9, + "learning_rate": 9.063495739162653e-06, + "loss": 1.8235, + "step": 28295000 + }, + { + "epoch": 81.9, + "learning_rate": 9.062772091515377e-06, + "loss": 1.8231, + "step": 28295500 + }, + { + "epoch": 81.91, + "learning_rate": 9.0620484438681e-06, + "loss": 1.8249, + "step": 28296000 + }, + { + "epoch": 81.91, + "learning_rate": 9.061324796220823e-06, + "loss": 1.8254, + "step": 28296500 + }, + { + "epoch": 81.91, + "learning_rate": 9.060601148573545e-06, + "loss": 1.8485, + "step": 28297000 + }, + { + "epoch": 81.91, + "learning_rate": 9.059877500926269e-06, + "loss": 1.8474, + "step": 28297500 + }, + { + "epoch": 81.91, + "learning_rate": 9.059153853278993e-06, + "loss": 1.8583, + "step": 28298000 + }, + { + "epoch": 81.91, + "learning_rate": 9.05843165292701e-06, + "loss": 1.8187, + "step": 28298500 + }, + { + "epoch": 81.91, + "learning_rate": 9.057708005279732e-06, + "loss": 1.8745, + "step": 28299000 + }, + { + "epoch": 81.92, + "learning_rate": 9.056984357632458e-06, + "loss": 1.8385, + "step": 28299500 + }, + { + "epoch": 81.92, + "learning_rate": 9.05626070998518e-06, + "loss": 1.8598, + "step": 28300000 + }, + { + "epoch": 81.92, + "learning_rate": 9.055537062337903e-06, + "loss": 1.8598, + "step": 28300500 + }, + { + "epoch": 81.92, + "learning_rate": 9.054813414690626e-06, + "loss": 1.8391, + "step": 28301000 + }, + { + "epoch": 81.92, + "learning_rate": 9.05408976704335e-06, + "loss": 1.8207, + "step": 28301500 + }, + { + "epoch": 81.92, + "learning_rate": 9.053367566691368e-06, + "loss": 1.7934, + "step": 28302000 + }, + { + "epoch": 81.92, + "learning_rate": 9.05264391904409e-06, + "loss": 1.8398, + "step": 28302500 + }, + { + "epoch": 81.93, + "learning_rate": 9.051920271396814e-06, + "loss": 1.8313, + "step": 28303000 + }, + { + "epoch": 81.93, + "learning_rate": 9.051196623749538e-06, + "loss": 1.8424, + "step": 28303500 + }, + { + "epoch": 81.93, + "learning_rate": 9.05047297610226e-06, + "loss": 1.8476, + "step": 28304000 + }, + { + "epoch": 81.93, + "learning_rate": 9.049750775750277e-06, + "loss": 1.8426, + "step": 28304500 + }, + { + "epoch": 81.93, + "learning_rate": 9.049028575398296e-06, + "loss": 1.8268, + "step": 28305000 + }, + { + "epoch": 81.93, + "learning_rate": 9.048306375046315e-06, + "loss": 1.8606, + "step": 28305500 + }, + { + "epoch": 81.93, + "learning_rate": 9.047582727399037e-06, + "loss": 1.8323, + "step": 28306000 + }, + { + "epoch": 81.94, + "learning_rate": 9.04685907975176e-06, + "loss": 1.8476, + "step": 28306500 + }, + { + "epoch": 81.94, + "learning_rate": 9.046135432104484e-06, + "loss": 1.8803, + "step": 28307000 + }, + { + "epoch": 81.94, + "learning_rate": 9.045411784457207e-06, + "loss": 1.8487, + "step": 28307500 + }, + { + "epoch": 81.94, + "learning_rate": 9.04468813680993e-06, + "loss": 1.8295, + "step": 28308000 + }, + { + "epoch": 81.94, + "learning_rate": 9.043964489162652e-06, + "loss": 1.8397, + "step": 28308500 + }, + { + "epoch": 81.94, + "learning_rate": 9.043240841515378e-06, + "loss": 1.8517, + "step": 28309000 + }, + { + "epoch": 81.94, + "learning_rate": 9.0425171938681e-06, + "loss": 1.8334, + "step": 28309500 + }, + { + "epoch": 81.95, + "learning_rate": 9.041793546220822e-06, + "loss": 1.8344, + "step": 28310000 + }, + { + "epoch": 81.95, + "learning_rate": 9.041069898573546e-06, + "loss": 1.8168, + "step": 28310500 + }, + { + "epoch": 81.95, + "learning_rate": 9.04034625092627e-06, + "loss": 1.8311, + "step": 28311000 + }, + { + "epoch": 81.95, + "learning_rate": 9.039624050574287e-06, + "loss": 1.8267, + "step": 28311500 + }, + { + "epoch": 81.95, + "learning_rate": 9.03890040292701e-06, + "loss": 1.8478, + "step": 28312000 + }, + { + "epoch": 81.95, + "learning_rate": 9.038176755279735e-06, + "loss": 1.8192, + "step": 28312500 + }, + { + "epoch": 81.95, + "learning_rate": 9.037453107632457e-06, + "loss": 1.8406, + "step": 28313000 + }, + { + "epoch": 81.96, + "learning_rate": 9.03672945998518e-06, + "loss": 1.8313, + "step": 28313500 + }, + { + "epoch": 81.96, + "learning_rate": 9.036005812337903e-06, + "loss": 1.8393, + "step": 28314000 + }, + { + "epoch": 81.96, + "learning_rate": 9.035283611985922e-06, + "loss": 1.8467, + "step": 28314500 + }, + { + "epoch": 81.96, + "learning_rate": 9.034559964338645e-06, + "loss": 1.8231, + "step": 28315000 + }, + { + "epoch": 81.96, + "learning_rate": 9.033836316691367e-06, + "loss": 1.8596, + "step": 28315500 + }, + { + "epoch": 81.96, + "learning_rate": 9.033114116339384e-06, + "loss": 1.8535, + "step": 28316000 + }, + { + "epoch": 81.96, + "learning_rate": 9.03239046869211e-06, + "loss": 1.8333, + "step": 28316500 + }, + { + "epoch": 81.97, + "learning_rate": 9.031666821044832e-06, + "loss": 1.8363, + "step": 28317000 + }, + { + "epoch": 81.97, + "learning_rate": 9.030943173397554e-06, + "loss": 1.8282, + "step": 28317500 + }, + { + "epoch": 81.97, + "learning_rate": 9.03021952575028e-06, + "loss": 1.8366, + "step": 28318000 + }, + { + "epoch": 81.97, + "learning_rate": 9.029495878103002e-06, + "loss": 1.8243, + "step": 28318500 + }, + { + "epoch": 81.97, + "learning_rate": 9.028772230455724e-06, + "loss": 1.8464, + "step": 28319000 + }, + { + "epoch": 81.97, + "learning_rate": 9.028050030103741e-06, + "loss": 1.8424, + "step": 28319500 + }, + { + "epoch": 81.97, + "learning_rate": 9.027326382456467e-06, + "loss": 1.8303, + "step": 28320000 + }, + { + "epoch": 81.98, + "learning_rate": 9.02660273480919e-06, + "loss": 1.8522, + "step": 28320500 + }, + { + "epoch": 81.98, + "learning_rate": 9.025879087161912e-06, + "loss": 1.8399, + "step": 28321000 + }, + { + "epoch": 81.98, + "learning_rate": 9.025155439514635e-06, + "loss": 1.8399, + "step": 28321500 + }, + { + "epoch": 81.98, + "learning_rate": 9.02443179186736e-06, + "loss": 1.8405, + "step": 28322000 + }, + { + "epoch": 81.98, + "learning_rate": 9.023709591515377e-06, + "loss": 1.8386, + "step": 28322500 + }, + { + "epoch": 81.98, + "learning_rate": 9.022985943868099e-06, + "loss": 1.8381, + "step": 28323000 + }, + { + "epoch": 81.98, + "learning_rate": 9.022262296220824e-06, + "loss": 1.839, + "step": 28323500 + }, + { + "epoch": 81.99, + "learning_rate": 9.021538648573547e-06, + "loss": 1.8397, + "step": 28324000 + }, + { + "epoch": 81.99, + "learning_rate": 9.020815000926269e-06, + "loss": 1.8307, + "step": 28324500 + }, + { + "epoch": 81.99, + "learning_rate": 9.020091353278993e-06, + "loss": 1.8392, + "step": 28325000 + }, + { + "epoch": 81.99, + "learning_rate": 9.019367705631717e-06, + "loss": 1.8508, + "step": 28325500 + }, + { + "epoch": 81.99, + "learning_rate": 9.018644057984439e-06, + "loss": 1.8258, + "step": 28326000 + }, + { + "epoch": 81.99, + "learning_rate": 9.017921857632456e-06, + "loss": 1.8354, + "step": 28326500 + }, + { + "epoch": 82.0, + "learning_rate": 9.01719820998518e-06, + "loss": 1.8423, + "step": 28327000 + }, + { + "epoch": 82.0, + "learning_rate": 9.016474562337904e-06, + "loss": 1.8488, + "step": 28327500 + }, + { + "epoch": 82.0, + "learning_rate": 9.015750914690626e-06, + "loss": 1.8605, + "step": 28328000 + }, + { + "epoch": 82.0, + "learning_rate": 9.015027267043349e-06, + "loss": 1.8234, + "step": 28328500 + }, + { + "epoch": 82.0, + "eval_accuracy": 0.6864873525969934, + "eval_accuracy_mlm": 0.6553302541283902, + "eval_accuracy_nsp": 0.8536204186202124, + "eval_loss": 2.1995444297790527, + "eval_runtime": 331.7228, + "eval_samples_per_second": 1315.514, + "eval_steps_per_second": 54.814, + "step": 28328704 + }, + { + "epoch": 82.0, + "learning_rate": 9.014305066691368e-06, + "loss": 1.8094, + "step": 28329000 + }, + { + "epoch": 82.0, + "learning_rate": 9.013581419044091e-06, + "loss": 1.8229, + "step": 28329500 + }, + { + "epoch": 82.0, + "learning_rate": 9.012857771396814e-06, + "loss": 1.8183, + "step": 28330000 + }, + { + "epoch": 82.01, + "learning_rate": 9.012134123749538e-06, + "loss": 1.8287, + "step": 28330500 + }, + { + "epoch": 82.01, + "learning_rate": 9.011410476102262e-06, + "loss": 1.8349, + "step": 28331000 + }, + { + "epoch": 82.01, + "learning_rate": 9.010688275750279e-06, + "loss": 1.8124, + "step": 28331500 + }, + { + "epoch": 82.01, + "learning_rate": 9.009964628103001e-06, + "loss": 1.8298, + "step": 28332000 + }, + { + "epoch": 82.01, + "learning_rate": 9.009240980455725e-06, + "loss": 1.8416, + "step": 28332500 + }, + { + "epoch": 82.01, + "learning_rate": 9.008517332808449e-06, + "loss": 1.826, + "step": 28333000 + }, + { + "epoch": 82.01, + "learning_rate": 9.007793685161171e-06, + "loss": 1.8233, + "step": 28333500 + }, + { + "epoch": 82.02, + "learning_rate": 9.007070037513893e-06, + "loss": 1.8308, + "step": 28334000 + }, + { + "epoch": 82.02, + "learning_rate": 9.006347837161912e-06, + "loss": 1.836, + "step": 28334500 + }, + { + "epoch": 82.02, + "learning_rate": 9.005624189514636e-06, + "loss": 1.8416, + "step": 28335000 + }, + { + "epoch": 82.02, + "learning_rate": 9.004900541867358e-06, + "loss": 1.8328, + "step": 28335500 + }, + { + "epoch": 82.02, + "learning_rate": 9.004176894220082e-06, + "loss": 1.7986, + "step": 28336000 + }, + { + "epoch": 82.02, + "learning_rate": 9.003453246572806e-06, + "loss": 1.8578, + "step": 28336500 + }, + { + "epoch": 82.02, + "learning_rate": 9.002729598925529e-06, + "loss": 1.8195, + "step": 28337000 + }, + { + "epoch": 82.03, + "learning_rate": 9.00200595127825e-06, + "loss": 1.8404, + "step": 28337500 + }, + { + "epoch": 82.03, + "learning_rate": 9.001282303630975e-06, + "loss": 1.8299, + "step": 28338000 + }, + { + "epoch": 82.03, + "learning_rate": 9.000558655983699e-06, + "loss": 1.8384, + "step": 28338500 + }, + { + "epoch": 82.03, + "learning_rate": 8.999836455631716e-06, + "loss": 1.8112, + "step": 28339000 + }, + { + "epoch": 82.03, + "learning_rate": 8.999112807984438e-06, + "loss": 1.8198, + "step": 28339500 + }, + { + "epoch": 82.03, + "learning_rate": 8.998390607632457e-06, + "loss": 1.8368, + "step": 28340000 + }, + { + "epoch": 82.03, + "learning_rate": 8.997666959985181e-06, + "loss": 1.8213, + "step": 28340500 + }, + { + "epoch": 82.04, + "learning_rate": 8.996943312337903e-06, + "loss": 1.8182, + "step": 28341000 + }, + { + "epoch": 82.04, + "learning_rate": 8.996219664690627e-06, + "loss": 1.8516, + "step": 28341500 + }, + { + "epoch": 82.04, + "learning_rate": 8.99549601704335e-06, + "loss": 1.8292, + "step": 28342000 + }, + { + "epoch": 82.04, + "learning_rate": 8.994772369396073e-06, + "loss": 1.8201, + "step": 28342500 + }, + { + "epoch": 82.04, + "learning_rate": 8.994048721748796e-06, + "loss": 1.8461, + "step": 28343000 + }, + { + "epoch": 82.04, + "learning_rate": 8.993326521396815e-06, + "loss": 1.8323, + "step": 28343500 + }, + { + "epoch": 82.04, + "learning_rate": 8.992602873749538e-06, + "loss": 1.855, + "step": 28344000 + }, + { + "epoch": 82.05, + "learning_rate": 8.99187922610226e-06, + "loss": 1.8458, + "step": 28344500 + }, + { + "epoch": 82.05, + "learning_rate": 8.991155578454983e-06, + "loss": 1.8231, + "step": 28345000 + }, + { + "epoch": 82.05, + "learning_rate": 8.990431930807707e-06, + "loss": 1.839, + "step": 28345500 + }, + { + "epoch": 82.05, + "learning_rate": 8.98970828316043e-06, + "loss": 1.8244, + "step": 28346000 + }, + { + "epoch": 82.05, + "learning_rate": 8.988986082808448e-06, + "loss": 1.8344, + "step": 28346500 + }, + { + "epoch": 82.05, + "learning_rate": 8.98826243516117e-06, + "loss": 1.8527, + "step": 28347000 + }, + { + "epoch": 82.05, + "learning_rate": 8.987538787513894e-06, + "loss": 1.7969, + "step": 28347500 + }, + { + "epoch": 82.06, + "learning_rate": 8.986815139866618e-06, + "loss": 1.8122, + "step": 28348000 + }, + { + "epoch": 82.06, + "learning_rate": 8.98609149221934e-06, + "loss": 1.8202, + "step": 28348500 + }, + { + "epoch": 82.06, + "learning_rate": 8.985367844572064e-06, + "loss": 1.8187, + "step": 28349000 + }, + { + "epoch": 82.06, + "learning_rate": 8.984645644220082e-06, + "loss": 1.836, + "step": 28349500 + }, + { + "epoch": 82.06, + "learning_rate": 8.983921996572805e-06, + "loss": 1.8301, + "step": 28350000 + }, + { + "epoch": 82.06, + "learning_rate": 8.983198348925528e-06, + "loss": 1.8055, + "step": 28350500 + }, + { + "epoch": 82.06, + "learning_rate": 8.982474701278252e-06, + "loss": 1.8079, + "step": 28351000 + }, + { + "epoch": 82.07, + "learning_rate": 8.981751053630976e-06, + "loss": 1.8473, + "step": 28351500 + }, + { + "epoch": 82.07, + "learning_rate": 8.981027405983698e-06, + "loss": 1.8246, + "step": 28352000 + }, + { + "epoch": 82.07, + "learning_rate": 8.980303758336422e-06, + "loss": 1.815, + "step": 28352500 + }, + { + "epoch": 82.07, + "learning_rate": 8.979580110689144e-06, + "loss": 1.8351, + "step": 28353000 + }, + { + "epoch": 82.07, + "learning_rate": 8.978856463041868e-06, + "loss": 1.8447, + "step": 28353500 + }, + { + "epoch": 82.07, + "learning_rate": 8.978134262689885e-06, + "loss": 1.8552, + "step": 28354000 + }, + { + "epoch": 82.07, + "learning_rate": 8.977410615042609e-06, + "loss": 1.8334, + "step": 28354500 + }, + { + "epoch": 82.08, + "learning_rate": 8.976686967395333e-06, + "loss": 1.8334, + "step": 28355000 + }, + { + "epoch": 82.08, + "learning_rate": 8.975963319748055e-06, + "loss": 1.8317, + "step": 28355500 + }, + { + "epoch": 82.08, + "learning_rate": 8.975239672100779e-06, + "loss": 1.8226, + "step": 28356000 + }, + { + "epoch": 82.08, + "learning_rate": 8.974516024453501e-06, + "loss": 1.8432, + "step": 28356500 + }, + { + "epoch": 82.08, + "learning_rate": 8.973792376806225e-06, + "loss": 1.8221, + "step": 28357000 + }, + { + "epoch": 82.08, + "learning_rate": 8.973068729158948e-06, + "loss": 1.8267, + "step": 28357500 + }, + { + "epoch": 82.08, + "learning_rate": 8.972346528806966e-06, + "loss": 1.8253, + "step": 28358000 + }, + { + "epoch": 82.09, + "learning_rate": 8.971622881159689e-06, + "loss": 1.8295, + "step": 28358500 + }, + { + "epoch": 82.09, + "learning_rate": 8.970899233512413e-06, + "loss": 1.8403, + "step": 28359000 + }, + { + "epoch": 82.09, + "learning_rate": 8.970175585865135e-06, + "loss": 1.8326, + "step": 28359500 + }, + { + "epoch": 82.09, + "learning_rate": 8.969451938217859e-06, + "loss": 1.8384, + "step": 28360000 + }, + { + "epoch": 82.09, + "learning_rate": 8.968728290570583e-06, + "loss": 1.858, + "step": 28360500 + }, + { + "epoch": 82.09, + "learning_rate": 8.9680060902186e-06, + "loss": 1.82, + "step": 28361000 + }, + { + "epoch": 82.09, + "learning_rate": 8.967282442571324e-06, + "loss": 1.8165, + "step": 28361500 + }, + { + "epoch": 82.1, + "learning_rate": 8.966558794924046e-06, + "loss": 1.821, + "step": 28362000 + }, + { + "epoch": 82.1, + "learning_rate": 8.965836594572063e-06, + "loss": 1.8346, + "step": 28362500 + }, + { + "epoch": 82.1, + "learning_rate": 8.965112946924787e-06, + "loss": 1.8624, + "step": 28363000 + }, + { + "epoch": 82.1, + "learning_rate": 8.964389299277511e-06, + "loss": 1.8395, + "step": 28363500 + }, + { + "epoch": 82.1, + "learning_rate": 8.963665651630233e-06, + "loss": 1.8173, + "step": 28364000 + }, + { + "epoch": 82.1, + "learning_rate": 8.962943451278252e-06, + "loss": 1.8391, + "step": 28364500 + }, + { + "epoch": 82.11, + "learning_rate": 8.962219803630975e-06, + "loss": 1.844, + "step": 28365000 + }, + { + "epoch": 82.11, + "learning_rate": 8.961496155983699e-06, + "loss": 1.805, + "step": 28365500 + }, + { + "epoch": 82.11, + "learning_rate": 8.96077250833642e-06, + "loss": 1.8406, + "step": 28366000 + }, + { + "epoch": 82.11, + "learning_rate": 8.960048860689145e-06, + "loss": 1.8572, + "step": 28366500 + }, + { + "epoch": 82.11, + "learning_rate": 8.959325213041869e-06, + "loss": 1.7849, + "step": 28367000 + }, + { + "epoch": 82.11, + "learning_rate": 8.958601565394591e-06, + "loss": 1.8114, + "step": 28367500 + }, + { + "epoch": 82.11, + "learning_rate": 8.957877917747315e-06, + "loss": 1.8321, + "step": 28368000 + }, + { + "epoch": 82.12, + "learning_rate": 8.957154270100037e-06, + "loss": 1.8642, + "step": 28368500 + }, + { + "epoch": 82.12, + "learning_rate": 8.956430622452761e-06, + "loss": 1.8387, + "step": 28369000 + }, + { + "epoch": 82.12, + "learning_rate": 8.955708422100778e-06, + "loss": 1.8207, + "step": 28369500 + }, + { + "epoch": 82.12, + "learning_rate": 8.954986221748795e-06, + "loss": 1.8472, + "step": 28370000 + }, + { + "epoch": 82.12, + "learning_rate": 8.95426257410152e-06, + "loss": 1.837, + "step": 28370500 + }, + { + "epoch": 82.12, + "learning_rate": 8.953538926454243e-06, + "loss": 1.8185, + "step": 28371000 + }, + { + "epoch": 82.12, + "learning_rate": 8.952815278806966e-06, + "loss": 1.8086, + "step": 28371500 + }, + { + "epoch": 82.13, + "learning_rate": 8.952093078454983e-06, + "loss": 1.7901, + "step": 28372000 + }, + { + "epoch": 82.13, + "learning_rate": 8.951369430807707e-06, + "loss": 1.8642, + "step": 28372500 + }, + { + "epoch": 82.13, + "learning_rate": 8.95064578316043e-06, + "loss": 1.8305, + "step": 28373000 + }, + { + "epoch": 82.13, + "learning_rate": 8.949922135513153e-06, + "loss": 1.7914, + "step": 28373500 + }, + { + "epoch": 82.13, + "learning_rate": 8.949198487865877e-06, + "loss": 1.8168, + "step": 28374000 + }, + { + "epoch": 82.13, + "learning_rate": 8.9484748402186e-06, + "loss": 1.8314, + "step": 28374500 + }, + { + "epoch": 82.13, + "learning_rate": 8.947751192571323e-06, + "loss": 1.8413, + "step": 28375000 + }, + { + "epoch": 82.14, + "learning_rate": 8.947027544924047e-06, + "loss": 1.8614, + "step": 28375500 + }, + { + "epoch": 82.14, + "learning_rate": 8.946303897276769e-06, + "loss": 1.8268, + "step": 28376000 + }, + { + "epoch": 82.14, + "learning_rate": 8.945580249629493e-06, + "loss": 1.8589, + "step": 28376500 + }, + { + "epoch": 82.14, + "learning_rate": 8.944856601982215e-06, + "loss": 1.827, + "step": 28377000 + }, + { + "epoch": 82.14, + "learning_rate": 8.94413295433494e-06, + "loss": 1.8204, + "step": 28377500 + }, + { + "epoch": 82.14, + "learning_rate": 8.943409306687663e-06, + "loss": 1.8419, + "step": 28378000 + }, + { + "epoch": 82.14, + "learning_rate": 8.942685659040385e-06, + "loss": 1.8333, + "step": 28378500 + }, + { + "epoch": 82.15, + "learning_rate": 8.941963458688403e-06, + "loss": 1.8561, + "step": 28379000 + }, + { + "epoch": 82.15, + "learning_rate": 8.941239811041127e-06, + "loss": 1.831, + "step": 28379500 + }, + { + "epoch": 82.15, + "learning_rate": 8.94051616339385e-06, + "loss": 1.8327, + "step": 28380000 + }, + { + "epoch": 82.15, + "learning_rate": 8.939792515746573e-06, + "loss": 1.834, + "step": 28380500 + }, + { + "epoch": 82.15, + "learning_rate": 8.939068868099297e-06, + "loss": 1.8123, + "step": 28381000 + }, + { + "epoch": 82.15, + "learning_rate": 8.93834522045202e-06, + "loss": 1.8428, + "step": 28381500 + }, + { + "epoch": 82.15, + "learning_rate": 8.937621572804743e-06, + "loss": 1.8345, + "step": 28382000 + }, + { + "epoch": 82.16, + "learning_rate": 8.936897925157465e-06, + "loss": 1.8369, + "step": 28382500 + }, + { + "epoch": 82.16, + "learning_rate": 8.936175724805484e-06, + "loss": 1.8383, + "step": 28383000 + }, + { + "epoch": 82.16, + "learning_rate": 8.935452077158208e-06, + "loss": 1.8248, + "step": 28383500 + }, + { + "epoch": 82.16, + "learning_rate": 8.934729876806225e-06, + "loss": 1.8567, + "step": 28384000 + }, + { + "epoch": 82.16, + "learning_rate": 8.934006229158947e-06, + "loss": 1.8266, + "step": 28384500 + }, + { + "epoch": 82.16, + "learning_rate": 8.933282581511671e-06, + "loss": 1.8388, + "step": 28385000 + }, + { + "epoch": 82.16, + "learning_rate": 8.932558933864395e-06, + "loss": 1.8287, + "step": 28385500 + }, + { + "epoch": 82.17, + "learning_rate": 8.931836733512413e-06, + "loss": 1.8435, + "step": 28386000 + }, + { + "epoch": 82.17, + "learning_rate": 8.931113085865135e-06, + "loss": 1.8207, + "step": 28386500 + }, + { + "epoch": 82.17, + "learning_rate": 8.930389438217859e-06, + "loss": 1.8461, + "step": 28387000 + }, + { + "epoch": 82.17, + "learning_rate": 8.929665790570583e-06, + "loss": 1.7996, + "step": 28387500 + }, + { + "epoch": 82.17, + "learning_rate": 8.928942142923305e-06, + "loss": 1.8456, + "step": 28388000 + }, + { + "epoch": 82.17, + "learning_rate": 8.928218495276029e-06, + "loss": 1.8543, + "step": 28388500 + }, + { + "epoch": 82.17, + "learning_rate": 8.927494847628753e-06, + "loss": 1.8454, + "step": 28389000 + }, + { + "epoch": 82.18, + "learning_rate": 8.92677264727677e-06, + "loss": 1.823, + "step": 28389500 + }, + { + "epoch": 82.18, + "learning_rate": 8.926048999629492e-06, + "loss": 1.8412, + "step": 28390000 + }, + { + "epoch": 82.18, + "learning_rate": 8.92532679927751e-06, + "loss": 1.8122, + "step": 28390500 + }, + { + "epoch": 82.18, + "learning_rate": 8.924603151630235e-06, + "loss": 1.8248, + "step": 28391000 + }, + { + "epoch": 82.18, + "learning_rate": 8.923879503982957e-06, + "loss": 1.8535, + "step": 28391500 + }, + { + "epoch": 82.18, + "learning_rate": 8.92315585633568e-06, + "loss": 1.8387, + "step": 28392000 + }, + { + "epoch": 82.18, + "learning_rate": 8.922432208688403e-06, + "loss": 1.795, + "step": 28392500 + }, + { + "epoch": 82.19, + "learning_rate": 8.921708561041127e-06, + "loss": 1.8115, + "step": 28393000 + }, + { + "epoch": 82.19, + "learning_rate": 8.92098491339385e-06, + "loss": 1.847, + "step": 28393500 + }, + { + "epoch": 82.19, + "learning_rate": 8.920262713041867e-06, + "loss": 1.8391, + "step": 28394000 + }, + { + "epoch": 82.19, + "learning_rate": 8.91953906539459e-06, + "loss": 1.8369, + "step": 28394500 + }, + { + "epoch": 82.19, + "learning_rate": 8.918815417747315e-06, + "loss": 1.8382, + "step": 28395000 + }, + { + "epoch": 82.19, + "learning_rate": 8.918091770100037e-06, + "loss": 1.8298, + "step": 28395500 + }, + { + "epoch": 82.19, + "learning_rate": 8.917368122452761e-06, + "loss": 1.8342, + "step": 28396000 + }, + { + "epoch": 82.2, + "learning_rate": 8.916644474805485e-06, + "loss": 1.8396, + "step": 28396500 + }, + { + "epoch": 82.2, + "learning_rate": 8.915920827158207e-06, + "loss": 1.8444, + "step": 28397000 + }, + { + "epoch": 82.2, + "learning_rate": 8.91519717951093e-06, + "loss": 1.861, + "step": 28397500 + }, + { + "epoch": 82.2, + "learning_rate": 8.914474979158948e-06, + "loss": 1.8273, + "step": 28398000 + }, + { + "epoch": 82.2, + "learning_rate": 8.913751331511672e-06, + "loss": 1.8684, + "step": 28398500 + }, + { + "epoch": 82.2, + "learning_rate": 8.913027683864394e-06, + "loss": 1.823, + "step": 28399000 + }, + { + "epoch": 82.2, + "learning_rate": 8.912304036217117e-06, + "loss": 1.8353, + "step": 28399500 + }, + { + "epoch": 82.21, + "learning_rate": 8.911580388569842e-06, + "loss": 1.8388, + "step": 28400000 + }, + { + "epoch": 82.21, + "learning_rate": 8.910856740922564e-06, + "loss": 1.816, + "step": 28400500 + }, + { + "epoch": 82.21, + "learning_rate": 8.910134540570582e-06, + "loss": 1.8367, + "step": 28401000 + }, + { + "epoch": 82.21, + "learning_rate": 8.909410892923304e-06, + "loss": 1.8279, + "step": 28401500 + }, + { + "epoch": 82.21, + "learning_rate": 8.90868724527603e-06, + "loss": 1.8667, + "step": 28402000 + }, + { + "epoch": 82.21, + "learning_rate": 8.907963597628752e-06, + "loss": 1.8386, + "step": 28402500 + }, + { + "epoch": 82.22, + "learning_rate": 8.907239949981474e-06, + "loss": 1.8532, + "step": 28403000 + }, + { + "epoch": 82.22, + "learning_rate": 8.9065163023342e-06, + "loss": 1.8288, + "step": 28403500 + }, + { + "epoch": 82.22, + "learning_rate": 8.905792654686922e-06, + "loss": 1.8295, + "step": 28404000 + }, + { + "epoch": 82.22, + "learning_rate": 8.905069007039644e-06, + "loss": 1.8453, + "step": 28404500 + }, + { + "epoch": 82.22, + "learning_rate": 8.904346806687661e-06, + "loss": 1.8428, + "step": 28405000 + }, + { + "epoch": 82.22, + "learning_rate": 8.903623159040387e-06, + "loss": 1.8148, + "step": 28405500 + }, + { + "epoch": 82.22, + "learning_rate": 8.90289951139311e-06, + "loss": 1.8332, + "step": 28406000 + }, + { + "epoch": 82.23, + "learning_rate": 8.902175863745831e-06, + "loss": 1.8385, + "step": 28406500 + }, + { + "epoch": 82.23, + "learning_rate": 8.901452216098555e-06, + "loss": 1.8151, + "step": 28407000 + }, + { + "epoch": 82.23, + "learning_rate": 8.90072856845128e-06, + "loss": 1.8404, + "step": 28407500 + }, + { + "epoch": 82.23, + "learning_rate": 8.900006368099297e-06, + "loss": 1.8559, + "step": 28408000 + }, + { + "epoch": 82.23, + "learning_rate": 8.899282720452019e-06, + "loss": 1.8132, + "step": 28408500 + }, + { + "epoch": 82.23, + "learning_rate": 8.898559072804743e-06, + "loss": 1.8473, + "step": 28409000 + }, + { + "epoch": 82.23, + "learning_rate": 8.897835425157467e-06, + "loss": 1.8785, + "step": 28409500 + }, + { + "epoch": 82.24, + "learning_rate": 8.897111777510189e-06, + "loss": 1.8185, + "step": 28410000 + }, + { + "epoch": 82.24, + "learning_rate": 8.896389577158206e-06, + "loss": 1.8307, + "step": 28410500 + }, + { + "epoch": 82.24, + "learning_rate": 8.895665929510932e-06, + "loss": 1.8532, + "step": 28411000 + }, + { + "epoch": 82.24, + "learning_rate": 8.894942281863654e-06, + "loss": 1.8308, + "step": 28411500 + }, + { + "epoch": 82.24, + "learning_rate": 8.894218634216376e-06, + "loss": 1.8168, + "step": 28412000 + }, + { + "epoch": 82.24, + "learning_rate": 8.893496433864393e-06, + "loss": 1.7987, + "step": 28412500 + }, + { + "epoch": 82.24, + "learning_rate": 8.892772786217119e-06, + "loss": 1.8425, + "step": 28413000 + }, + { + "epoch": 82.25, + "learning_rate": 8.892049138569841e-06, + "loss": 1.8254, + "step": 28413500 + }, + { + "epoch": 82.25, + "learning_rate": 8.891325490922564e-06, + "loss": 1.8316, + "step": 28414000 + }, + { + "epoch": 82.25, + "learning_rate": 8.89060329057058e-06, + "loss": 1.8516, + "step": 28414500 + }, + { + "epoch": 82.25, + "learning_rate": 8.889879642923306e-06, + "loss": 1.8286, + "step": 28415000 + }, + { + "epoch": 82.25, + "learning_rate": 8.889155995276029e-06, + "loss": 1.8485, + "step": 28415500 + }, + { + "epoch": 82.25, + "learning_rate": 8.888432347628751e-06, + "loss": 1.8349, + "step": 28416000 + }, + { + "epoch": 82.25, + "learning_rate": 8.887708699981477e-06, + "loss": 1.8176, + "step": 28416500 + }, + { + "epoch": 82.26, + "learning_rate": 8.886985052334199e-06, + "loss": 1.8285, + "step": 28417000 + }, + { + "epoch": 82.26, + "learning_rate": 8.886262851982216e-06, + "loss": 1.8561, + "step": 28417500 + }, + { + "epoch": 82.26, + "learning_rate": 8.885539204334938e-06, + "loss": 1.8243, + "step": 28418000 + }, + { + "epoch": 82.26, + "learning_rate": 8.884817003982957e-06, + "loss": 1.8061, + "step": 28418500 + }, + { + "epoch": 82.26, + "learning_rate": 8.884093356335681e-06, + "loss": 1.8296, + "step": 28419000 + }, + { + "epoch": 82.26, + "learning_rate": 8.883369708688403e-06, + "loss": 1.8227, + "step": 28419500 + }, + { + "epoch": 82.26, + "learning_rate": 8.882646061041126e-06, + "loss": 1.8628, + "step": 28420000 + }, + { + "epoch": 82.27, + "learning_rate": 8.881922413393851e-06, + "loss": 1.8153, + "step": 28420500 + }, + { + "epoch": 82.27, + "learning_rate": 8.881198765746573e-06, + "loss": 1.861, + "step": 28421000 + }, + { + "epoch": 82.27, + "learning_rate": 8.880475118099296e-06, + "loss": 1.8325, + "step": 28421500 + }, + { + "epoch": 82.27, + "learning_rate": 8.87975147045202e-06, + "loss": 1.8188, + "step": 28422000 + }, + { + "epoch": 82.27, + "learning_rate": 8.879030717395334e-06, + "loss": 1.8517, + "step": 28422500 + }, + { + "epoch": 82.27, + "learning_rate": 8.878307069748056e-06, + "loss": 1.862, + "step": 28423000 + }, + { + "epoch": 82.27, + "learning_rate": 8.877583422100778e-06, + "loss": 1.8475, + "step": 28423500 + }, + { + "epoch": 82.28, + "learning_rate": 8.876859774453502e-06, + "loss": 1.8272, + "step": 28424000 + }, + { + "epoch": 82.28, + "learning_rate": 8.876136126806226e-06, + "loss": 1.8287, + "step": 28424500 + }, + { + "epoch": 82.28, + "learning_rate": 8.875413926454243e-06, + "loss": 1.8199, + "step": 28425000 + }, + { + "epoch": 82.28, + "learning_rate": 8.874690278806965e-06, + "loss": 1.8448, + "step": 28425500 + }, + { + "epoch": 82.28, + "learning_rate": 8.87396663115969e-06, + "loss": 1.8464, + "step": 28426000 + }, + { + "epoch": 82.28, + "learning_rate": 8.873242983512413e-06, + "loss": 1.8324, + "step": 28426500 + }, + { + "epoch": 82.28, + "learning_rate": 8.872519335865135e-06, + "loss": 1.8519, + "step": 28427000 + }, + { + "epoch": 82.29, + "learning_rate": 8.871795688217858e-06, + "loss": 1.8291, + "step": 28427500 + }, + { + "epoch": 82.29, + "learning_rate": 8.871072040570583e-06, + "loss": 1.8158, + "step": 28428000 + }, + { + "epoch": 82.29, + "learning_rate": 8.8703498402186e-06, + "loss": 1.8545, + "step": 28428500 + }, + { + "epoch": 82.29, + "learning_rate": 8.869626192571323e-06, + "loss": 1.8381, + "step": 28429000 + }, + { + "epoch": 82.29, + "learning_rate": 8.868902544924047e-06, + "loss": 1.8284, + "step": 28429500 + }, + { + "epoch": 82.29, + "learning_rate": 8.86817889727677e-06, + "loss": 1.8352, + "step": 28430000 + }, + { + "epoch": 82.29, + "learning_rate": 8.867455249629493e-06, + "loss": 1.8108, + "step": 28430500 + }, + { + "epoch": 82.3, + "learning_rate": 8.866734496572805e-06, + "loss": 1.802, + "step": 28431000 + }, + { + "epoch": 82.3, + "learning_rate": 8.866010848925527e-06, + "loss": 1.8357, + "step": 28431500 + }, + { + "epoch": 82.3, + "learning_rate": 8.865287201278253e-06, + "loss": 1.8097, + "step": 28432000 + }, + { + "epoch": 82.3, + "learning_rate": 8.86456500092627e-06, + "loss": 1.8341, + "step": 28432500 + }, + { + "epoch": 82.3, + "learning_rate": 8.863841353278992e-06, + "loss": 1.8373, + "step": 28433000 + }, + { + "epoch": 82.3, + "learning_rate": 8.863117705631715e-06, + "loss": 1.8142, + "step": 28433500 + }, + { + "epoch": 82.3, + "learning_rate": 8.86239405798444e-06, + "loss": 1.8618, + "step": 28434000 + }, + { + "epoch": 82.31, + "learning_rate": 8.861671857632458e-06, + "loss": 1.863, + "step": 28434500 + }, + { + "epoch": 82.31, + "learning_rate": 8.86094820998518e-06, + "loss": 1.8519, + "step": 28435000 + }, + { + "epoch": 82.31, + "learning_rate": 8.860224562337904e-06, + "loss": 1.8191, + "step": 28435500 + }, + { + "epoch": 82.31, + "learning_rate": 8.859500914690628e-06, + "loss": 1.8158, + "step": 28436000 + }, + { + "epoch": 82.31, + "learning_rate": 8.85877726704335e-06, + "loss": 1.8041, + "step": 28436500 + }, + { + "epoch": 82.31, + "learning_rate": 8.858053619396072e-06, + "loss": 1.8203, + "step": 28437000 + }, + { + "epoch": 82.31, + "learning_rate": 8.857329971748796e-06, + "loss": 1.8218, + "step": 28437500 + }, + { + "epoch": 82.32, + "learning_rate": 8.85660632410152e-06, + "loss": 1.8511, + "step": 28438000 + }, + { + "epoch": 82.32, + "learning_rate": 8.855882676454242e-06, + "loss": 1.8448, + "step": 28438500 + }, + { + "epoch": 82.32, + "learning_rate": 8.855159028806966e-06, + "loss": 1.8203, + "step": 28439000 + }, + { + "epoch": 82.32, + "learning_rate": 8.85443538115969e-06, + "loss": 1.8408, + "step": 28439500 + }, + { + "epoch": 82.32, + "learning_rate": 8.853711733512412e-06, + "loss": 1.8369, + "step": 28440000 + }, + { + "epoch": 82.32, + "learning_rate": 8.852988085865136e-06, + "loss": 1.8273, + "step": 28440500 + }, + { + "epoch": 82.33, + "learning_rate": 8.852265885513153e-06, + "loss": 1.8336, + "step": 28441000 + }, + { + "epoch": 82.33, + "learning_rate": 8.851542237865877e-06, + "loss": 1.8449, + "step": 28441500 + }, + { + "epoch": 82.33, + "learning_rate": 8.8508185902186e-06, + "loss": 1.8333, + "step": 28442000 + }, + { + "epoch": 82.33, + "learning_rate": 8.850094942571324e-06, + "loss": 1.8448, + "step": 28442500 + }, + { + "epoch": 82.33, + "learning_rate": 8.849371294924047e-06, + "loss": 1.8241, + "step": 28443000 + }, + { + "epoch": 82.33, + "learning_rate": 8.84864764727677e-06, + "loss": 1.8554, + "step": 28443500 + }, + { + "epoch": 82.33, + "learning_rate": 8.847923999629492e-06, + "loss": 1.8122, + "step": 28444000 + }, + { + "epoch": 82.34, + "learning_rate": 8.847200351982216e-06, + "loss": 1.816, + "step": 28444500 + }, + { + "epoch": 82.34, + "learning_rate": 8.84647670433494e-06, + "loss": 1.8308, + "step": 28445000 + }, + { + "epoch": 82.34, + "learning_rate": 8.845753056687662e-06, + "loss": 1.8279, + "step": 28445500 + }, + { + "epoch": 82.34, + "learning_rate": 8.84503085633568e-06, + "loss": 1.8299, + "step": 28446000 + }, + { + "epoch": 82.34, + "learning_rate": 8.844307208688403e-06, + "loss": 1.8352, + "step": 28446500 + }, + { + "epoch": 82.34, + "learning_rate": 8.843583561041127e-06, + "loss": 1.8335, + "step": 28447000 + }, + { + "epoch": 82.34, + "learning_rate": 8.84285991339385e-06, + "loss": 1.8617, + "step": 28447500 + }, + { + "epoch": 82.35, + "learning_rate": 8.842136265746573e-06, + "loss": 1.8576, + "step": 28448000 + }, + { + "epoch": 82.35, + "learning_rate": 8.84141406539459e-06, + "loss": 1.8301, + "step": 28448500 + }, + { + "epoch": 82.35, + "learning_rate": 8.840690417747314e-06, + "loss": 1.8252, + "step": 28449000 + }, + { + "epoch": 82.35, + "learning_rate": 8.839966770100037e-06, + "loss": 1.8283, + "step": 28449500 + }, + { + "epoch": 82.35, + "learning_rate": 8.83924312245276e-06, + "loss": 1.841, + "step": 28450000 + }, + { + "epoch": 82.35, + "learning_rate": 8.838520922100778e-06, + "loss": 1.8472, + "step": 28450500 + }, + { + "epoch": 82.35, + "learning_rate": 8.837797274453502e-06, + "loss": 1.8331, + "step": 28451000 + }, + { + "epoch": 82.36, + "learning_rate": 8.837073626806224e-06, + "loss": 1.8177, + "step": 28451500 + }, + { + "epoch": 82.36, + "learning_rate": 8.836349979158948e-06, + "loss": 1.8439, + "step": 28452000 + }, + { + "epoch": 82.36, + "learning_rate": 8.835626331511672e-06, + "loss": 1.8496, + "step": 28452500 + }, + { + "epoch": 82.36, + "learning_rate": 8.834902683864394e-06, + "loss": 1.8568, + "step": 28453000 + }, + { + "epoch": 82.36, + "learning_rate": 8.834179036217118e-06, + "loss": 1.8262, + "step": 28453500 + }, + { + "epoch": 82.36, + "learning_rate": 8.833456835865135e-06, + "loss": 1.8523, + "step": 28454000 + }, + { + "epoch": 82.36, + "learning_rate": 8.83273318821786e-06, + "loss": 1.8232, + "step": 28454500 + }, + { + "epoch": 82.37, + "learning_rate": 8.832009540570581e-06, + "loss": 1.8563, + "step": 28455000 + }, + { + "epoch": 82.37, + "learning_rate": 8.831285892923305e-06, + "loss": 1.8057, + "step": 28455500 + }, + { + "epoch": 82.37, + "learning_rate": 8.83056224527603e-06, + "loss": 1.8408, + "step": 28456000 + }, + { + "epoch": 82.37, + "learning_rate": 8.829838597628752e-06, + "loss": 1.825, + "step": 28456500 + }, + { + "epoch": 82.37, + "learning_rate": 8.829114949981476e-06, + "loss": 1.8363, + "step": 28457000 + }, + { + "epoch": 82.37, + "learning_rate": 8.828391302334198e-06, + "loss": 1.8466, + "step": 28457500 + }, + { + "epoch": 82.37, + "learning_rate": 8.827669101982217e-06, + "loss": 1.8512, + "step": 28458000 + }, + { + "epoch": 82.38, + "learning_rate": 8.826945454334939e-06, + "loss": 1.8244, + "step": 28458500 + }, + { + "epoch": 82.38, + "learning_rate": 8.826221806687663e-06, + "loss": 1.8511, + "step": 28459000 + }, + { + "epoch": 82.38, + "learning_rate": 8.825498159040385e-06, + "loss": 1.8421, + "step": 28459500 + }, + { + "epoch": 82.38, + "learning_rate": 8.824774511393109e-06, + "loss": 1.8404, + "step": 28460000 + }, + { + "epoch": 82.38, + "learning_rate": 8.824050863745833e-06, + "loss": 1.858, + "step": 28460500 + }, + { + "epoch": 82.38, + "learning_rate": 8.823327216098555e-06, + "loss": 1.8502, + "step": 28461000 + }, + { + "epoch": 82.38, + "learning_rate": 8.822605015746572e-06, + "loss": 1.85, + "step": 28461500 + }, + { + "epoch": 82.39, + "learning_rate": 8.821881368099296e-06, + "loss": 1.8663, + "step": 28462000 + }, + { + "epoch": 82.39, + "learning_rate": 8.82115772045202e-06, + "loss": 1.8598, + "step": 28462500 + }, + { + "epoch": 82.39, + "learning_rate": 8.820434072804743e-06, + "loss": 1.8418, + "step": 28463000 + }, + { + "epoch": 82.39, + "learning_rate": 8.819710425157466e-06, + "loss": 1.8241, + "step": 28463500 + }, + { + "epoch": 82.39, + "learning_rate": 8.818986777510189e-06, + "loss": 1.8538, + "step": 28464000 + }, + { + "epoch": 82.39, + "learning_rate": 8.818263129862913e-06, + "loss": 1.8412, + "step": 28464500 + }, + { + "epoch": 82.39, + "learning_rate": 8.817539482215637e-06, + "loss": 1.8522, + "step": 28465000 + }, + { + "epoch": 82.4, + "learning_rate": 8.816815834568359e-06, + "loss": 1.8372, + "step": 28465500 + }, + { + "epoch": 82.4, + "learning_rate": 8.816093634216378e-06, + "loss": 1.8607, + "step": 28466000 + }, + { + "epoch": 82.4, + "learning_rate": 8.8153699865691e-06, + "loss": 1.8265, + "step": 28466500 + }, + { + "epoch": 82.4, + "learning_rate": 8.814647786217117e-06, + "loss": 1.8275, + "step": 28467000 + }, + { + "epoch": 82.4, + "learning_rate": 8.813924138569841e-06, + "loss": 1.8367, + "step": 28467500 + }, + { + "epoch": 82.4, + "learning_rate": 8.813200490922565e-06, + "loss": 1.8409, + "step": 28468000 + }, + { + "epoch": 82.4, + "learning_rate": 8.812476843275287e-06, + "loss": 1.8286, + "step": 28468500 + }, + { + "epoch": 82.41, + "learning_rate": 8.811753195628011e-06, + "loss": 1.8201, + "step": 28469000 + }, + { + "epoch": 82.41, + "learning_rate": 8.811032442571323e-06, + "loss": 1.8408, + "step": 28469500 + }, + { + "epoch": 82.41, + "learning_rate": 8.810308794924046e-06, + "loss": 1.8568, + "step": 28470000 + }, + { + "epoch": 82.41, + "learning_rate": 8.80958514727677e-06, + "loss": 1.8305, + "step": 28470500 + }, + { + "epoch": 82.41, + "learning_rate": 8.808861499629492e-06, + "loss": 1.8308, + "step": 28471000 + }, + { + "epoch": 82.41, + "learning_rate": 8.808137851982216e-06, + "loss": 1.8349, + "step": 28471500 + }, + { + "epoch": 82.41, + "learning_rate": 8.80741420433494e-06, + "loss": 1.8335, + "step": 28472000 + }, + { + "epoch": 82.42, + "learning_rate": 8.806690556687662e-06, + "loss": 1.846, + "step": 28472500 + }, + { + "epoch": 82.42, + "learning_rate": 8.805966909040386e-06, + "loss": 1.8307, + "step": 28473000 + }, + { + "epoch": 82.42, + "learning_rate": 8.80524326139311e-06, + "loss": 1.8195, + "step": 28473500 + }, + { + "epoch": 82.42, + "learning_rate": 8.804521061041127e-06, + "loss": 1.8118, + "step": 28474000 + }, + { + "epoch": 82.42, + "learning_rate": 8.80379741339385e-06, + "loss": 1.8352, + "step": 28474500 + }, + { + "epoch": 82.42, + "learning_rate": 8.803073765746573e-06, + "loss": 1.8719, + "step": 28475000 + }, + { + "epoch": 82.42, + "learning_rate": 8.802350118099297e-06, + "loss": 1.8515, + "step": 28475500 + }, + { + "epoch": 82.43, + "learning_rate": 8.801627917747314e-06, + "loss": 1.8392, + "step": 28476000 + }, + { + "epoch": 82.43, + "learning_rate": 8.800904270100037e-06, + "loss": 1.8293, + "step": 28476500 + }, + { + "epoch": 82.43, + "learning_rate": 8.80018062245276e-06, + "loss": 1.8371, + "step": 28477000 + }, + { + "epoch": 82.43, + "learning_rate": 8.799456974805484e-06, + "loss": 1.8333, + "step": 28477500 + }, + { + "epoch": 82.43, + "learning_rate": 8.798734774453502e-06, + "loss": 1.8115, + "step": 28478000 + }, + { + "epoch": 82.43, + "learning_rate": 8.798011126806224e-06, + "loss": 1.8524, + "step": 28478500 + }, + { + "epoch": 82.44, + "learning_rate": 8.797287479158948e-06, + "loss": 1.8574, + "step": 28479000 + }, + { + "epoch": 82.44, + "learning_rate": 8.796563831511672e-06, + "loss": 1.8229, + "step": 28479500 + }, + { + "epoch": 82.44, + "learning_rate": 8.795840183864394e-06, + "loss": 1.799, + "step": 28480000 + }, + { + "epoch": 82.44, + "learning_rate": 8.795117983512413e-06, + "loss": 1.8311, + "step": 28480500 + }, + { + "epoch": 82.44, + "learning_rate": 8.794394335865135e-06, + "loss": 1.8428, + "step": 28481000 + }, + { + "epoch": 82.44, + "learning_rate": 8.793670688217859e-06, + "loss": 1.8075, + "step": 28481500 + }, + { + "epoch": 82.44, + "learning_rate": 8.792947040570581e-06, + "loss": 1.8206, + "step": 28482000 + }, + { + "epoch": 82.45, + "learning_rate": 8.792223392923305e-06, + "loss": 1.8424, + "step": 28482500 + }, + { + "epoch": 82.45, + "learning_rate": 8.791501192571323e-06, + "loss": 1.8316, + "step": 28483000 + }, + { + "epoch": 82.45, + "learning_rate": 8.790777544924046e-06, + "loss": 1.8436, + "step": 28483500 + }, + { + "epoch": 82.45, + "learning_rate": 8.790053897276769e-06, + "loss": 1.8273, + "step": 28484000 + }, + { + "epoch": 82.45, + "learning_rate": 8.789331696924788e-06, + "loss": 1.8626, + "step": 28484500 + }, + { + "epoch": 82.45, + "learning_rate": 8.788608049277512e-06, + "loss": 1.8164, + "step": 28485000 + }, + { + "epoch": 82.45, + "learning_rate": 8.787884401630234e-06, + "loss": 1.8555, + "step": 28485500 + }, + { + "epoch": 82.46, + "learning_rate": 8.787160753982956e-06, + "loss": 1.8413, + "step": 28486000 + }, + { + "epoch": 82.46, + "learning_rate": 8.78643710633568e-06, + "loss": 1.8281, + "step": 28486500 + }, + { + "epoch": 82.46, + "learning_rate": 8.785713458688404e-06, + "loss": 1.8542, + "step": 28487000 + }, + { + "epoch": 82.46, + "learning_rate": 8.784989811041126e-06, + "loss": 1.8451, + "step": 28487500 + }, + { + "epoch": 82.46, + "learning_rate": 8.78426616339385e-06, + "loss": 1.8503, + "step": 28488000 + }, + { + "epoch": 82.46, + "learning_rate": 8.783543963041867e-06, + "loss": 1.8154, + "step": 28488500 + }, + { + "epoch": 82.46, + "learning_rate": 8.782820315394591e-06, + "loss": 1.8484, + "step": 28489000 + }, + { + "epoch": 82.47, + "learning_rate": 8.782098115042609e-06, + "loss": 1.8437, + "step": 28489500 + }, + { + "epoch": 82.47, + "learning_rate": 8.781374467395332e-06, + "loss": 1.8479, + "step": 28490000 + }, + { + "epoch": 82.47, + "learning_rate": 8.780650819748056e-06, + "loss": 1.8174, + "step": 28490500 + }, + { + "epoch": 82.47, + "learning_rate": 8.779927172100779e-06, + "loss": 1.8364, + "step": 28491000 + }, + { + "epoch": 82.47, + "learning_rate": 8.779204971748796e-06, + "loss": 1.8256, + "step": 28491500 + }, + { + "epoch": 82.47, + "learning_rate": 8.77848132410152e-06, + "loss": 1.8303, + "step": 28492000 + }, + { + "epoch": 82.47, + "learning_rate": 8.777759123749537e-06, + "loss": 1.8445, + "step": 28492500 + }, + { + "epoch": 82.48, + "learning_rate": 8.777035476102261e-06, + "loss": 1.8442, + "step": 28493000 + }, + { + "epoch": 82.48, + "learning_rate": 8.776311828454983e-06, + "loss": 1.816, + "step": 28493500 + }, + { + "epoch": 82.48, + "learning_rate": 8.775588180807707e-06, + "loss": 1.8397, + "step": 28494000 + }, + { + "epoch": 82.48, + "learning_rate": 8.774864533160431e-06, + "loss": 1.8031, + "step": 28494500 + }, + { + "epoch": 82.48, + "learning_rate": 8.774140885513153e-06, + "loss": 1.8424, + "step": 28495000 + }, + { + "epoch": 82.48, + "learning_rate": 8.773417237865876e-06, + "loss": 1.8462, + "step": 28495500 + }, + { + "epoch": 82.48, + "learning_rate": 8.7726935902186e-06, + "loss": 1.8433, + "step": 28496000 + }, + { + "epoch": 82.49, + "learning_rate": 8.771969942571323e-06, + "loss": 1.8394, + "step": 28496500 + }, + { + "epoch": 82.49, + "learning_rate": 8.771246294924046e-06, + "loss": 1.8478, + "step": 28497000 + }, + { + "epoch": 82.49, + "learning_rate": 8.77052264727677e-06, + "loss": 1.8345, + "step": 28497500 + }, + { + "epoch": 82.49, + "learning_rate": 8.769798999629493e-06, + "loss": 1.8478, + "step": 28498000 + }, + { + "epoch": 82.49, + "learning_rate": 8.769075351982216e-06, + "loss": 1.8205, + "step": 28498500 + }, + { + "epoch": 82.49, + "learning_rate": 8.768353151630233e-06, + "loss": 1.8541, + "step": 28499000 + }, + { + "epoch": 82.49, + "learning_rate": 8.767629503982957e-06, + "loss": 1.8373, + "step": 28499500 + }, + { + "epoch": 82.5, + "learning_rate": 8.76690585633568e-06, + "loss": 1.8243, + "step": 28500000 + }, + { + "epoch": 82.5, + "learning_rate": 8.766183655983698e-06, + "loss": 1.8379, + "step": 28500500 + }, + { + "epoch": 82.5, + "learning_rate": 8.76546000833642e-06, + "loss": 1.8287, + "step": 28501000 + }, + { + "epoch": 82.5, + "learning_rate": 8.764736360689144e-06, + "loss": 1.8368, + "step": 28501500 + }, + { + "epoch": 82.5, + "learning_rate": 8.764012713041868e-06, + "loss": 1.8371, + "step": 28502000 + }, + { + "epoch": 82.5, + "learning_rate": 8.76328906539459e-06, + "loss": 1.8287, + "step": 28502500 + }, + { + "epoch": 82.5, + "learning_rate": 8.762565417747314e-06, + "loss": 1.7944, + "step": 28503000 + }, + { + "epoch": 82.51, + "learning_rate": 8.761841770100038e-06, + "loss": 1.8361, + "step": 28503500 + }, + { + "epoch": 82.51, + "learning_rate": 8.76111812245276e-06, + "loss": 1.8452, + "step": 28504000 + }, + { + "epoch": 82.51, + "learning_rate": 8.760394474805483e-06, + "loss": 1.8374, + "step": 28504500 + }, + { + "epoch": 82.51, + "learning_rate": 8.759672274453502e-06, + "loss": 1.8383, + "step": 28505000 + }, + { + "epoch": 82.51, + "learning_rate": 8.75895007410152e-06, + "loss": 1.8206, + "step": 28505500 + }, + { + "epoch": 82.51, + "learning_rate": 8.758226426454243e-06, + "loss": 1.8102, + "step": 28506000 + }, + { + "epoch": 82.51, + "learning_rate": 8.757502778806965e-06, + "loss": 1.8268, + "step": 28506500 + }, + { + "epoch": 82.52, + "learning_rate": 8.756779131159689e-06, + "loss": 1.8314, + "step": 28507000 + }, + { + "epoch": 82.52, + "learning_rate": 8.756055483512413e-06, + "loss": 1.8186, + "step": 28507500 + }, + { + "epoch": 82.52, + "learning_rate": 8.755331835865135e-06, + "loss": 1.8387, + "step": 28508000 + }, + { + "epoch": 82.52, + "learning_rate": 8.754608188217859e-06, + "loss": 1.7927, + "step": 28508500 + }, + { + "epoch": 82.52, + "learning_rate": 8.753884540570583e-06, + "loss": 1.8516, + "step": 28509000 + }, + { + "epoch": 82.52, + "learning_rate": 8.753160892923305e-06, + "loss": 1.8235, + "step": 28509500 + }, + { + "epoch": 82.52, + "learning_rate": 8.752438692571322e-06, + "loss": 1.8465, + "step": 28510000 + }, + { + "epoch": 82.53, + "learning_rate": 8.751715044924046e-06, + "loss": 1.8421, + "step": 28510500 + }, + { + "epoch": 82.53, + "learning_rate": 8.750992844572065e-06, + "loss": 1.8027, + "step": 28511000 + }, + { + "epoch": 82.53, + "learning_rate": 8.750270644220083e-06, + "loss": 1.8222, + "step": 28511500 + }, + { + "epoch": 82.53, + "learning_rate": 8.749546996572805e-06, + "loss": 1.8179, + "step": 28512000 + }, + { + "epoch": 82.53, + "learning_rate": 8.748823348925527e-06, + "loss": 1.8419, + "step": 28512500 + }, + { + "epoch": 82.53, + "learning_rate": 8.748099701278253e-06, + "loss": 1.8399, + "step": 28513000 + }, + { + "epoch": 82.53, + "learning_rate": 8.747376053630975e-06, + "loss": 1.8485, + "step": 28513500 + }, + { + "epoch": 82.54, + "learning_rate": 8.746652405983697e-06, + "loss": 1.8619, + "step": 28514000 + }, + { + "epoch": 82.54, + "learning_rate": 8.745928758336421e-06, + "loss": 1.8501, + "step": 28514500 + }, + { + "epoch": 82.54, + "learning_rate": 8.745205110689145e-06, + "loss": 1.8676, + "step": 28515000 + }, + { + "epoch": 82.54, + "learning_rate": 8.744481463041867e-06, + "loss": 1.8439, + "step": 28515500 + }, + { + "epoch": 82.54, + "learning_rate": 8.743757815394591e-06, + "loss": 1.8407, + "step": 28516000 + }, + { + "epoch": 82.54, + "learning_rate": 8.74303561504261e-06, + "loss": 1.8367, + "step": 28516500 + }, + { + "epoch": 82.55, + "learning_rate": 8.742311967395332e-06, + "loss": 1.8405, + "step": 28517000 + }, + { + "epoch": 82.55, + "learning_rate": 8.741588319748055e-06, + "loss": 1.8534, + "step": 28517500 + }, + { + "epoch": 82.55, + "learning_rate": 8.740864672100778e-06, + "loss": 1.8075, + "step": 28518000 + }, + { + "epoch": 82.55, + "learning_rate": 8.740141024453502e-06, + "loss": 1.8136, + "step": 28518500 + }, + { + "epoch": 82.55, + "learning_rate": 8.739417376806225e-06, + "loss": 1.8403, + "step": 28519000 + }, + { + "epoch": 82.55, + "learning_rate": 8.738693729158947e-06, + "loss": 1.8307, + "step": 28519500 + }, + { + "epoch": 82.55, + "learning_rate": 8.737971528806966e-06, + "loss": 1.8365, + "step": 28520000 + }, + { + "epoch": 82.56, + "learning_rate": 8.73724788115969e-06, + "loss": 1.8427, + "step": 28520500 + }, + { + "epoch": 82.56, + "learning_rate": 8.736524233512412e-06, + "loss": 1.8349, + "step": 28521000 + }, + { + "epoch": 82.56, + "learning_rate": 8.735800585865136e-06, + "loss": 1.8179, + "step": 28521500 + }, + { + "epoch": 82.56, + "learning_rate": 8.735078385513155e-06, + "loss": 1.8109, + "step": 28522000 + }, + { + "epoch": 82.56, + "learning_rate": 8.734354737865877e-06, + "loss": 1.8189, + "step": 28522500 + }, + { + "epoch": 82.56, + "learning_rate": 8.7336310902186e-06, + "loss": 1.831, + "step": 28523000 + }, + { + "epoch": 82.56, + "learning_rate": 8.732907442571323e-06, + "loss": 1.8366, + "step": 28523500 + }, + { + "epoch": 82.57, + "learning_rate": 8.732183794924047e-06, + "loss": 1.847, + "step": 28524000 + }, + { + "epoch": 82.57, + "learning_rate": 8.73146014727677e-06, + "loss": 1.8394, + "step": 28524500 + }, + { + "epoch": 82.57, + "learning_rate": 8.730736499629492e-06, + "loss": 1.8456, + "step": 28525000 + }, + { + "epoch": 82.57, + "learning_rate": 8.730012851982217e-06, + "loss": 1.816, + "step": 28525500 + }, + { + "epoch": 82.57, + "learning_rate": 8.72928920433494e-06, + "loss": 1.8299, + "step": 28526000 + }, + { + "epoch": 82.57, + "learning_rate": 8.728565556687662e-06, + "loss": 1.8226, + "step": 28526500 + }, + { + "epoch": 82.57, + "learning_rate": 8.727841909040386e-06, + "loss": 1.8227, + "step": 28527000 + }, + { + "epoch": 82.58, + "learning_rate": 8.72711826139311e-06, + "loss": 1.8165, + "step": 28527500 + }, + { + "epoch": 82.58, + "learning_rate": 8.726394613745832e-06, + "loss": 1.8296, + "step": 28528000 + }, + { + "epoch": 82.58, + "learning_rate": 8.725670966098556e-06, + "loss": 1.8183, + "step": 28528500 + }, + { + "epoch": 82.58, + "learning_rate": 8.724948765746573e-06, + "loss": 1.8031, + "step": 28529000 + }, + { + "epoch": 82.58, + "learning_rate": 8.724225118099297e-06, + "loss": 1.8449, + "step": 28529500 + }, + { + "epoch": 82.58, + "learning_rate": 8.72350147045202e-06, + "loss": 1.8395, + "step": 28530000 + }, + { + "epoch": 82.58, + "learning_rate": 8.722777822804743e-06, + "loss": 1.8282, + "step": 28530500 + }, + { + "epoch": 82.59, + "learning_rate": 8.722054175157467e-06, + "loss": 1.8305, + "step": 28531000 + }, + { + "epoch": 82.59, + "learning_rate": 8.72133052751019e-06, + "loss": 1.8281, + "step": 28531500 + }, + { + "epoch": 82.59, + "learning_rate": 8.720606879862911e-06, + "loss": 1.8442, + "step": 28532000 + }, + { + "epoch": 82.59, + "learning_rate": 8.719883232215637e-06, + "loss": 1.8219, + "step": 28532500 + }, + { + "epoch": 82.59, + "learning_rate": 8.719161031863654e-06, + "loss": 1.8231, + "step": 28533000 + }, + { + "epoch": 82.59, + "learning_rate": 8.718437384216377e-06, + "loss": 1.8529, + "step": 28533500 + }, + { + "epoch": 82.59, + "learning_rate": 8.7177137365691e-06, + "loss": 1.8459, + "step": 28534000 + }, + { + "epoch": 82.6, + "learning_rate": 8.716990088921824e-06, + "loss": 1.8044, + "step": 28534500 + }, + { + "epoch": 82.6, + "learning_rate": 8.716266441274547e-06, + "loss": 1.8152, + "step": 28535000 + }, + { + "epoch": 82.6, + "learning_rate": 8.715544240922564e-06, + "loss": 1.8232, + "step": 28535500 + }, + { + "epoch": 82.6, + "learning_rate": 8.714820593275288e-06, + "loss": 1.8242, + "step": 28536000 + }, + { + "epoch": 82.6, + "learning_rate": 8.714098392923305e-06, + "loss": 1.8619, + "step": 28536500 + }, + { + "epoch": 82.6, + "learning_rate": 8.713374745276029e-06, + "loss": 1.8276, + "step": 28537000 + }, + { + "epoch": 82.6, + "learning_rate": 8.712651097628751e-06, + "loss": 1.8454, + "step": 28537500 + }, + { + "epoch": 82.61, + "learning_rate": 8.711927449981475e-06, + "loss": 1.8285, + "step": 28538000 + }, + { + "epoch": 82.61, + "learning_rate": 8.711203802334199e-06, + "loss": 1.8609, + "step": 28538500 + }, + { + "epoch": 82.61, + "learning_rate": 8.710480154686921e-06, + "loss": 1.8231, + "step": 28539000 + }, + { + "epoch": 82.61, + "learning_rate": 8.709756507039645e-06, + "loss": 1.8181, + "step": 28539500 + }, + { + "epoch": 82.61, + "learning_rate": 8.709034306687663e-06, + "loss": 1.8437, + "step": 28540000 + }, + { + "epoch": 82.61, + "learning_rate": 8.708310659040386e-06, + "loss": 1.8545, + "step": 28540500 + }, + { + "epoch": 82.61, + "learning_rate": 8.707587011393109e-06, + "loss": 1.8429, + "step": 28541000 + }, + { + "epoch": 82.62, + "learning_rate": 8.706863363745833e-06, + "loss": 1.8214, + "step": 28541500 + }, + { + "epoch": 82.62, + "learning_rate": 8.706139716098557e-06, + "loss": 1.8128, + "step": 28542000 + }, + { + "epoch": 82.62, + "learning_rate": 8.705416068451279e-06, + "loss": 1.8225, + "step": 28542500 + }, + { + "epoch": 82.62, + "learning_rate": 8.704693868099296e-06, + "loss": 1.8303, + "step": 28543000 + }, + { + "epoch": 82.62, + "learning_rate": 8.70397022045202e-06, + "loss": 1.841, + "step": 28543500 + }, + { + "epoch": 82.62, + "learning_rate": 8.703246572804744e-06, + "loss": 1.8157, + "step": 28544000 + }, + { + "epoch": 82.62, + "learning_rate": 8.702522925157466e-06, + "loss": 1.8306, + "step": 28544500 + }, + { + "epoch": 82.63, + "learning_rate": 8.701799277510188e-06, + "loss": 1.8594, + "step": 28545000 + }, + { + "epoch": 82.63, + "learning_rate": 8.701077077158207e-06, + "loss": 1.8155, + "step": 28545500 + }, + { + "epoch": 82.63, + "learning_rate": 8.700353429510931e-06, + "loss": 1.8173, + "step": 28546000 + }, + { + "epoch": 82.63, + "learning_rate": 8.699629781863653e-06, + "loss": 1.8363, + "step": 28546500 + }, + { + "epoch": 82.63, + "learning_rate": 8.698906134216377e-06, + "loss": 1.8297, + "step": 28547000 + }, + { + "epoch": 82.63, + "learning_rate": 8.6981824865691e-06, + "loss": 1.8253, + "step": 28547500 + }, + { + "epoch": 82.63, + "learning_rate": 8.697458838921824e-06, + "loss": 1.7961, + "step": 28548000 + }, + { + "epoch": 82.64, + "learning_rate": 8.696735191274546e-06, + "loss": 1.8393, + "step": 28548500 + }, + { + "epoch": 82.64, + "learning_rate": 8.69601154362727e-06, + "loss": 1.8364, + "step": 28549000 + }, + { + "epoch": 82.64, + "learning_rate": 8.695289343275287e-06, + "loss": 1.828, + "step": 28549500 + }, + { + "epoch": 82.64, + "learning_rate": 8.694565695628011e-06, + "loss": 1.8518, + "step": 28550000 + }, + { + "epoch": 82.64, + "learning_rate": 8.693842047980733e-06, + "loss": 1.8446, + "step": 28550500 + }, + { + "epoch": 82.64, + "learning_rate": 8.693118400333457e-06, + "loss": 1.8156, + "step": 28551000 + }, + { + "epoch": 82.64, + "learning_rate": 8.692394752686181e-06, + "loss": 1.8251, + "step": 28551500 + }, + { + "epoch": 82.65, + "learning_rate": 8.691671105038903e-06, + "loss": 1.8234, + "step": 28552000 + }, + { + "epoch": 82.65, + "learning_rate": 8.690947457391627e-06, + "loss": 1.8538, + "step": 28552500 + }, + { + "epoch": 82.65, + "learning_rate": 8.690223809744351e-06, + "loss": 1.8602, + "step": 28553000 + }, + { + "epoch": 82.65, + "learning_rate": 8.689500162097073e-06, + "loss": 1.8106, + "step": 28553500 + }, + { + "epoch": 82.65, + "learning_rate": 8.68877796174509e-06, + "loss": 1.8198, + "step": 28554000 + }, + { + "epoch": 82.65, + "learning_rate": 8.688054314097814e-06, + "loss": 1.841, + "step": 28554500 + }, + { + "epoch": 82.66, + "learning_rate": 8.687330666450538e-06, + "loss": 1.823, + "step": 28555000 + }, + { + "epoch": 82.66, + "learning_rate": 8.68660701880326e-06, + "loss": 1.8647, + "step": 28555500 + }, + { + "epoch": 82.66, + "learning_rate": 8.685884818451278e-06, + "loss": 1.8278, + "step": 28556000 + }, + { + "epoch": 82.66, + "learning_rate": 8.685161170804002e-06, + "loss": 1.8142, + "step": 28556500 + }, + { + "epoch": 82.66, + "learning_rate": 8.684437523156726e-06, + "loss": 1.8356, + "step": 28557000 + }, + { + "epoch": 82.66, + "learning_rate": 8.683713875509448e-06, + "loss": 1.8445, + "step": 28557500 + }, + { + "epoch": 82.66, + "learning_rate": 8.682990227862172e-06, + "loss": 1.8275, + "step": 28558000 + }, + { + "epoch": 82.67, + "learning_rate": 8.682266580214894e-06, + "loss": 1.8526, + "step": 28558500 + }, + { + "epoch": 82.67, + "learning_rate": 8.681542932567618e-06, + "loss": 1.8191, + "step": 28559000 + }, + { + "epoch": 82.67, + "learning_rate": 8.680820732215635e-06, + "loss": 1.8141, + "step": 28559500 + }, + { + "epoch": 82.67, + "learning_rate": 8.68009708456836e-06, + "loss": 1.8263, + "step": 28560000 + }, + { + "epoch": 82.67, + "learning_rate": 8.679373436921081e-06, + "loss": 1.8202, + "step": 28560500 + }, + { + "epoch": 82.67, + "learning_rate": 8.678649789273805e-06, + "loss": 1.8357, + "step": 28561000 + }, + { + "epoch": 82.67, + "learning_rate": 8.67792614162653e-06, + "loss": 1.8353, + "step": 28561500 + }, + { + "epoch": 82.68, + "learning_rate": 8.677202493979252e-06, + "loss": 1.8326, + "step": 28562000 + }, + { + "epoch": 82.68, + "learning_rate": 8.676478846331975e-06, + "loss": 1.8387, + "step": 28562500 + }, + { + "epoch": 82.68, + "learning_rate": 8.675755198684698e-06, + "loss": 1.8764, + "step": 28563000 + }, + { + "epoch": 82.68, + "learning_rate": 8.675031551037422e-06, + "loss": 1.8278, + "step": 28563500 + }, + { + "epoch": 82.68, + "learning_rate": 8.674309350685439e-06, + "loss": 1.8182, + "step": 28564000 + }, + { + "epoch": 82.68, + "learning_rate": 8.673585703038163e-06, + "loss": 1.8547, + "step": 28564500 + }, + { + "epoch": 82.68, + "learning_rate": 8.672862055390887e-06, + "loss": 1.8378, + "step": 28565000 + }, + { + "epoch": 82.69, + "learning_rate": 8.672138407743609e-06, + "loss": 1.8561, + "step": 28565500 + }, + { + "epoch": 82.69, + "learning_rate": 8.671416207391626e-06, + "loss": 1.8405, + "step": 28566000 + }, + { + "epoch": 82.69, + "learning_rate": 8.67069255974435e-06, + "loss": 1.8468, + "step": 28566500 + }, + { + "epoch": 82.69, + "learning_rate": 8.669968912097074e-06, + "loss": 1.8021, + "step": 28567000 + }, + { + "epoch": 82.69, + "learning_rate": 8.669245264449796e-06, + "loss": 1.8393, + "step": 28567500 + }, + { + "epoch": 82.69, + "learning_rate": 8.66852161680252e-06, + "loss": 1.8379, + "step": 28568000 + }, + { + "epoch": 82.69, + "learning_rate": 8.667797969155242e-06, + "loss": 1.833, + "step": 28568500 + }, + { + "epoch": 82.7, + "learning_rate": 8.667074321507966e-06, + "loss": 1.8348, + "step": 28569000 + }, + { + "epoch": 82.7, + "learning_rate": 8.666350673860689e-06, + "loss": 1.8372, + "step": 28569500 + }, + { + "epoch": 82.7, + "learning_rate": 8.665627026213413e-06, + "loss": 1.8384, + "step": 28570000 + }, + { + "epoch": 82.7, + "learning_rate": 8.664903378566137e-06, + "loss": 1.8634, + "step": 28570500 + }, + { + "epoch": 82.7, + "learning_rate": 8.664179730918859e-06, + "loss": 1.8345, + "step": 28571000 + }, + { + "epoch": 82.7, + "learning_rate": 8.663456083271583e-06, + "loss": 1.8177, + "step": 28571500 + }, + { + "epoch": 82.7, + "learning_rate": 8.6627338829196e-06, + "loss": 1.8609, + "step": 28572000 + }, + { + "epoch": 82.71, + "learning_rate": 8.662010235272324e-06, + "loss": 1.8058, + "step": 28572500 + }, + { + "epoch": 82.71, + "learning_rate": 8.661288034920341e-06, + "loss": 1.8271, + "step": 28573000 + }, + { + "epoch": 82.71, + "learning_rate": 8.660564387273065e-06, + "loss": 1.8117, + "step": 28573500 + }, + { + "epoch": 82.71, + "learning_rate": 8.659840739625787e-06, + "loss": 1.83, + "step": 28574000 + }, + { + "epoch": 82.71, + "learning_rate": 8.659117091978511e-06, + "loss": 1.8411, + "step": 28574500 + }, + { + "epoch": 82.71, + "learning_rate": 8.658393444331233e-06, + "loss": 1.8127, + "step": 28575000 + }, + { + "epoch": 82.71, + "learning_rate": 8.657669796683957e-06, + "loss": 1.8242, + "step": 28575500 + }, + { + "epoch": 82.72, + "learning_rate": 8.656946149036681e-06, + "loss": 1.8397, + "step": 28576000 + }, + { + "epoch": 82.72, + "learning_rate": 8.656222501389404e-06, + "loss": 1.8536, + "step": 28576500 + }, + { + "epoch": 82.72, + "learning_rate": 8.65550030103742e-06, + "loss": 1.8343, + "step": 28577000 + }, + { + "epoch": 82.72, + "learning_rate": 8.65477810068544e-06, + "loss": 1.8349, + "step": 28577500 + }, + { + "epoch": 82.72, + "learning_rate": 8.654054453038164e-06, + "loss": 1.8332, + "step": 28578000 + }, + { + "epoch": 82.72, + "learning_rate": 8.653330805390886e-06, + "loss": 1.8512, + "step": 28578500 + }, + { + "epoch": 82.72, + "learning_rate": 8.652607157743608e-06, + "loss": 1.8276, + "step": 28579000 + }, + { + "epoch": 82.73, + "learning_rate": 8.651883510096332e-06, + "loss": 1.8184, + "step": 28579500 + }, + { + "epoch": 82.73, + "learning_rate": 8.651159862449056e-06, + "loss": 1.8076, + "step": 28580000 + }, + { + "epoch": 82.73, + "learning_rate": 8.650437662097073e-06, + "loss": 1.8409, + "step": 28580500 + }, + { + "epoch": 82.73, + "learning_rate": 8.649714014449795e-06, + "loss": 1.829, + "step": 28581000 + }, + { + "epoch": 82.73, + "learning_rate": 8.64899036680252e-06, + "loss": 1.8469, + "step": 28581500 + }, + { + "epoch": 82.73, + "learning_rate": 8.648266719155243e-06, + "loss": 1.8227, + "step": 28582000 + }, + { + "epoch": 82.73, + "learning_rate": 8.647543071507966e-06, + "loss": 1.817, + "step": 28582500 + }, + { + "epoch": 82.74, + "learning_rate": 8.64681942386069e-06, + "loss": 1.8392, + "step": 28583000 + }, + { + "epoch": 82.74, + "learning_rate": 8.646095776213413e-06, + "loss": 1.8107, + "step": 28583500 + }, + { + "epoch": 82.74, + "learning_rate": 8.645372128566136e-06, + "loss": 1.7814, + "step": 28584000 + }, + { + "epoch": 82.74, + "learning_rate": 8.644649928214153e-06, + "loss": 1.8493, + "step": 28584500 + }, + { + "epoch": 82.74, + "learning_rate": 8.643926280566877e-06, + "loss": 1.8338, + "step": 28585000 + }, + { + "epoch": 82.74, + "learning_rate": 8.6432026329196e-06, + "loss": 1.8535, + "step": 28585500 + }, + { + "epoch": 82.74, + "learning_rate": 8.642478985272323e-06, + "loss": 1.8096, + "step": 28586000 + }, + { + "epoch": 82.75, + "learning_rate": 8.64175678492034e-06, + "loss": 1.826, + "step": 28586500 + }, + { + "epoch": 82.75, + "learning_rate": 8.641034584568359e-06, + "loss": 1.8317, + "step": 28587000 + }, + { + "epoch": 82.75, + "learning_rate": 8.640310936921083e-06, + "loss": 1.8384, + "step": 28587500 + }, + { + "epoch": 82.75, + "learning_rate": 8.639587289273805e-06, + "loss": 1.8246, + "step": 28588000 + }, + { + "epoch": 82.75, + "learning_rate": 8.638863641626528e-06, + "loss": 1.8007, + "step": 28588500 + }, + { + "epoch": 82.75, + "learning_rate": 8.638139993979253e-06, + "loss": 1.8517, + "step": 28589000 + }, + { + "epoch": 82.75, + "learning_rate": 8.637416346331975e-06, + "loss": 1.8155, + "step": 28589500 + }, + { + "epoch": 82.76, + "learning_rate": 8.636692698684698e-06, + "loss": 1.8151, + "step": 28590000 + }, + { + "epoch": 82.76, + "learning_rate": 8.635970498332715e-06, + "loss": 1.8489, + "step": 28590500 + }, + { + "epoch": 82.76, + "learning_rate": 8.63524685068544e-06, + "loss": 1.8183, + "step": 28591000 + }, + { + "epoch": 82.76, + "learning_rate": 8.634523203038163e-06, + "loss": 1.8485, + "step": 28591500 + }, + { + "epoch": 82.76, + "learning_rate": 8.63380100268618e-06, + "loss": 1.8218, + "step": 28592000 + }, + { + "epoch": 82.76, + "learning_rate": 8.633077355038904e-06, + "loss": 1.8489, + "step": 28592500 + }, + { + "epoch": 82.77, + "learning_rate": 8.632353707391628e-06, + "loss": 1.8492, + "step": 28593000 + }, + { + "epoch": 82.77, + "learning_rate": 8.63163005974435e-06, + "loss": 1.846, + "step": 28593500 + }, + { + "epoch": 82.77, + "learning_rate": 8.630906412097072e-06, + "loss": 1.8208, + "step": 28594000 + }, + { + "epoch": 82.77, + "learning_rate": 8.630182764449796e-06, + "loss": 1.805, + "step": 28594500 + }, + { + "epoch": 82.77, + "learning_rate": 8.62945911680252e-06, + "loss": 1.8336, + "step": 28595000 + }, + { + "epoch": 82.77, + "learning_rate": 8.628735469155242e-06, + "loss": 1.8419, + "step": 28595500 + }, + { + "epoch": 82.77, + "learning_rate": 8.628011821507966e-06, + "loss": 1.8498, + "step": 28596000 + }, + { + "epoch": 82.78, + "learning_rate": 8.62728817386069e-06, + "loss": 1.8157, + "step": 28596500 + }, + { + "epoch": 82.78, + "learning_rate": 8.626564526213412e-06, + "loss": 1.8405, + "step": 28597000 + }, + { + "epoch": 82.78, + "learning_rate": 8.625840878566135e-06, + "loss": 1.8264, + "step": 28597500 + }, + { + "epoch": 82.78, + "learning_rate": 8.62511723091886e-06, + "loss": 1.8258, + "step": 28598000 + }, + { + "epoch": 82.78, + "learning_rate": 8.624393583271583e-06, + "loss": 1.8135, + "step": 28598500 + }, + { + "epoch": 82.78, + "learning_rate": 8.623669935624305e-06, + "loss": 1.8234, + "step": 28599000 + }, + { + "epoch": 82.78, + "learning_rate": 8.622946287977029e-06, + "loss": 1.8132, + "step": 28599500 + }, + { + "epoch": 82.79, + "learning_rate": 8.622224087625048e-06, + "loss": 1.8353, + "step": 28600000 + }, + { + "epoch": 82.79, + "learning_rate": 8.621501887273065e-06, + "loss": 1.8138, + "step": 28600500 + }, + { + "epoch": 82.79, + "learning_rate": 8.620779686921082e-06, + "loss": 1.8512, + "step": 28601000 + }, + { + "epoch": 82.79, + "learning_rate": 8.620056039273804e-06, + "loss": 1.8468, + "step": 28601500 + }, + { + "epoch": 82.79, + "learning_rate": 8.61933239162653e-06, + "loss": 1.8184, + "step": 28602000 + }, + { + "epoch": 82.79, + "learning_rate": 8.618608743979252e-06, + "loss": 1.8447, + "step": 28602500 + }, + { + "epoch": 82.79, + "learning_rate": 8.617885096331974e-06, + "loss": 1.8263, + "step": 28603000 + }, + { + "epoch": 82.8, + "learning_rate": 8.617161448684698e-06, + "loss": 1.8525, + "step": 28603500 + }, + { + "epoch": 82.8, + "learning_rate": 8.616437801037422e-06, + "loss": 1.8223, + "step": 28604000 + }, + { + "epoch": 82.8, + "learning_rate": 8.615714153390145e-06, + "loss": 1.8225, + "step": 28604500 + }, + { + "epoch": 82.8, + "learning_rate": 8.614990505742867e-06, + "loss": 1.8433, + "step": 28605000 + }, + { + "epoch": 82.8, + "learning_rate": 8.614266858095592e-06, + "loss": 1.8558, + "step": 28605500 + }, + { + "epoch": 82.8, + "learning_rate": 8.61354465774361e-06, + "loss": 1.8224, + "step": 28606000 + }, + { + "epoch": 82.8, + "learning_rate": 8.612822457391627e-06, + "loss": 1.7999, + "step": 28606500 + }, + { + "epoch": 82.81, + "learning_rate": 8.61209880974435e-06, + "loss": 1.8387, + "step": 28607000 + }, + { + "epoch": 82.81, + "learning_rate": 8.611375162097075e-06, + "loss": 1.835, + "step": 28607500 + }, + { + "epoch": 82.81, + "learning_rate": 8.610651514449797e-06, + "loss": 1.8355, + "step": 28608000 + }, + { + "epoch": 82.81, + "learning_rate": 8.60992786680252e-06, + "loss": 1.8475, + "step": 28608500 + }, + { + "epoch": 82.81, + "learning_rate": 8.609204219155243e-06, + "loss": 1.7953, + "step": 28609000 + }, + { + "epoch": 82.81, + "learning_rate": 8.608480571507967e-06, + "loss": 1.8406, + "step": 28609500 + }, + { + "epoch": 82.81, + "learning_rate": 8.60775692386069e-06, + "loss": 1.8292, + "step": 28610000 + }, + { + "epoch": 82.82, + "learning_rate": 8.607033276213412e-06, + "loss": 1.8262, + "step": 28610500 + }, + { + "epoch": 82.82, + "learning_rate": 8.606309628566137e-06, + "loss": 1.8027, + "step": 28611000 + }, + { + "epoch": 82.82, + "learning_rate": 8.60558598091886e-06, + "loss": 1.8284, + "step": 28611500 + }, + { + "epoch": 82.82, + "learning_rate": 8.604862333271582e-06, + "loss": 1.8211, + "step": 28612000 + }, + { + "epoch": 82.82, + "learning_rate": 8.604140132919599e-06, + "loss": 1.8249, + "step": 28612500 + }, + { + "epoch": 82.82, + "learning_rate": 8.603417932567618e-06, + "loss": 1.8249, + "step": 28613000 + }, + { + "epoch": 82.82, + "learning_rate": 8.602694284920342e-06, + "loss": 1.8599, + "step": 28613500 + }, + { + "epoch": 82.83, + "learning_rate": 8.601970637273064e-06, + "loss": 1.8334, + "step": 28614000 + }, + { + "epoch": 82.83, + "learning_rate": 8.601246989625788e-06, + "loss": 1.8352, + "step": 28614500 + }, + { + "epoch": 82.83, + "learning_rate": 8.600523341978512e-06, + "loss": 1.8366, + "step": 28615000 + }, + { + "epoch": 82.83, + "learning_rate": 8.599799694331234e-06, + "loss": 1.8307, + "step": 28615500 + }, + { + "epoch": 82.83, + "learning_rate": 8.599077493979251e-06, + "loss": 1.8259, + "step": 28616000 + }, + { + "epoch": 82.83, + "learning_rate": 8.598353846331975e-06, + "loss": 1.8186, + "step": 28616500 + }, + { + "epoch": 82.83, + "learning_rate": 8.5976301986847e-06, + "loss": 1.842, + "step": 28617000 + }, + { + "epoch": 82.84, + "learning_rate": 8.596906551037421e-06, + "loss": 1.8776, + "step": 28617500 + }, + { + "epoch": 82.84, + "learning_rate": 8.596182903390144e-06, + "loss": 1.8266, + "step": 28618000 + }, + { + "epoch": 82.84, + "learning_rate": 8.595460703038163e-06, + "loss": 1.837, + "step": 28618500 + }, + { + "epoch": 82.84, + "learning_rate": 8.594737055390887e-06, + "loss": 1.8385, + "step": 28619000 + }, + { + "epoch": 82.84, + "learning_rate": 8.594013407743609e-06, + "loss": 1.847, + "step": 28619500 + }, + { + "epoch": 82.84, + "learning_rate": 8.593289760096333e-06, + "loss": 1.8257, + "step": 28620000 + }, + { + "epoch": 82.84, + "learning_rate": 8.592566112449057e-06, + "loss": 1.8447, + "step": 28620500 + }, + { + "epoch": 82.85, + "learning_rate": 8.591842464801779e-06, + "loss": 1.8255, + "step": 28621000 + }, + { + "epoch": 82.85, + "learning_rate": 8.591120264449796e-06, + "loss": 1.8462, + "step": 28621500 + }, + { + "epoch": 82.85, + "learning_rate": 8.590398064097813e-06, + "loss": 1.8388, + "step": 28622000 + }, + { + "epoch": 82.85, + "learning_rate": 8.589674416450539e-06, + "loss": 1.8272, + "step": 28622500 + }, + { + "epoch": 82.85, + "learning_rate": 8.588950768803261e-06, + "loss": 1.8246, + "step": 28623000 + }, + { + "epoch": 82.85, + "learning_rate": 8.588227121155983e-06, + "loss": 1.8365, + "step": 28623500 + }, + { + "epoch": 82.85, + "learning_rate": 8.587503473508707e-06, + "loss": 1.8425, + "step": 28624000 + }, + { + "epoch": 82.86, + "learning_rate": 8.586781273156726e-06, + "loss": 1.8485, + "step": 28624500 + }, + { + "epoch": 82.86, + "learning_rate": 8.586057625509449e-06, + "loss": 1.8515, + "step": 28625000 + }, + { + "epoch": 82.86, + "learning_rate": 8.58533397786217e-06, + "loss": 1.8293, + "step": 28625500 + }, + { + "epoch": 82.86, + "learning_rate": 8.584610330214895e-06, + "loss": 1.829, + "step": 28626000 + }, + { + "epoch": 82.86, + "learning_rate": 8.583886682567619e-06, + "loss": 1.8446, + "step": 28626500 + }, + { + "epoch": 82.86, + "learning_rate": 8.583163034920341e-06, + "loss": 1.8433, + "step": 28627000 + }, + { + "epoch": 82.86, + "learning_rate": 8.582439387273065e-06, + "loss": 1.8459, + "step": 28627500 + }, + { + "epoch": 82.87, + "learning_rate": 8.581715739625789e-06, + "loss": 1.8175, + "step": 28628000 + }, + { + "epoch": 82.87, + "learning_rate": 8.580992091978511e-06, + "loss": 1.8567, + "step": 28628500 + }, + { + "epoch": 82.87, + "learning_rate": 8.580268444331233e-06, + "loss": 1.8324, + "step": 28629000 + }, + { + "epoch": 82.87, + "learning_rate": 8.579544796683957e-06, + "loss": 1.8574, + "step": 28629500 + }, + { + "epoch": 82.87, + "learning_rate": 8.578822596331976e-06, + "loss": 1.8423, + "step": 28630000 + }, + { + "epoch": 82.87, + "learning_rate": 8.578098948684698e-06, + "loss": 1.8516, + "step": 28630500 + }, + { + "epoch": 82.88, + "learning_rate": 8.57737530103742e-06, + "loss": 1.848, + "step": 28631000 + }, + { + "epoch": 82.88, + "learning_rate": 8.576651653390146e-06, + "loss": 1.8146, + "step": 28631500 + }, + { + "epoch": 82.88, + "learning_rate": 8.575928005742868e-06, + "loss": 1.8206, + "step": 28632000 + }, + { + "epoch": 82.88, + "learning_rate": 8.57520435809559e-06, + "loss": 1.8331, + "step": 28632500 + }, + { + "epoch": 82.88, + "learning_rate": 8.574480710448315e-06, + "loss": 1.8281, + "step": 28633000 + }, + { + "epoch": 82.88, + "learning_rate": 8.573757062801038e-06, + "loss": 1.8292, + "step": 28633500 + }, + { + "epoch": 82.88, + "learning_rate": 8.573034862449056e-06, + "loss": 1.8128, + "step": 28634000 + }, + { + "epoch": 82.89, + "learning_rate": 8.572311214801778e-06, + "loss": 1.815, + "step": 28634500 + }, + { + "epoch": 82.89, + "learning_rate": 8.571589014449797e-06, + "loss": 1.8465, + "step": 28635000 + }, + { + "epoch": 82.89, + "learning_rate": 8.57086536680252e-06, + "loss": 1.8329, + "step": 28635500 + }, + { + "epoch": 82.89, + "learning_rate": 8.570143166450538e-06, + "loss": 1.8256, + "step": 28636000 + }, + { + "epoch": 82.89, + "learning_rate": 8.56941951880326e-06, + "loss": 1.8357, + "step": 28636500 + }, + { + "epoch": 82.89, + "learning_rate": 8.568697318451278e-06, + "loss": 1.8585, + "step": 28637000 + }, + { + "epoch": 82.89, + "learning_rate": 8.567973670804002e-06, + "loss": 1.8224, + "step": 28637500 + }, + { + "epoch": 82.9, + "learning_rate": 8.567250023156725e-06, + "loss": 1.8496, + "step": 28638000 + }, + { + "epoch": 82.9, + "learning_rate": 8.566526375509448e-06, + "loss": 1.833, + "step": 28638500 + }, + { + "epoch": 82.9, + "learning_rate": 8.565802727862172e-06, + "loss": 1.8468, + "step": 28639000 + }, + { + "epoch": 82.9, + "learning_rate": 8.565079080214896e-06, + "loss": 1.8224, + "step": 28639500 + }, + { + "epoch": 82.9, + "learning_rate": 8.564355432567618e-06, + "loss": 1.8252, + "step": 28640000 + }, + { + "epoch": 82.9, + "learning_rate": 8.563631784920342e-06, + "loss": 1.8406, + "step": 28640500 + }, + { + "epoch": 82.9, + "learning_rate": 8.562908137273066e-06, + "loss": 1.8357, + "step": 28641000 + }, + { + "epoch": 82.91, + "learning_rate": 8.562184489625788e-06, + "loss": 1.8418, + "step": 28641500 + }, + { + "epoch": 82.91, + "learning_rate": 8.56146084197851e-06, + "loss": 1.819, + "step": 28642000 + }, + { + "epoch": 82.91, + "learning_rate": 8.560737194331234e-06, + "loss": 1.8371, + "step": 28642500 + }, + { + "epoch": 82.91, + "learning_rate": 8.560013546683958e-06, + "loss": 1.8451, + "step": 28643000 + }, + { + "epoch": 82.91, + "learning_rate": 8.55928989903668e-06, + "loss": 1.8403, + "step": 28643500 + }, + { + "epoch": 82.91, + "learning_rate": 8.558566251389404e-06, + "loss": 1.8547, + "step": 28644000 + }, + { + "epoch": 82.91, + "learning_rate": 8.557842603742128e-06, + "loss": 1.827, + "step": 28644500 + }, + { + "epoch": 82.92, + "learning_rate": 8.55711895609485e-06, + "loss": 1.8187, + "step": 28645000 + }, + { + "epoch": 82.92, + "learning_rate": 8.556395308447574e-06, + "loss": 1.8223, + "step": 28645500 + }, + { + "epoch": 82.92, + "learning_rate": 8.555673108095591e-06, + "loss": 1.8515, + "step": 28646000 + }, + { + "epoch": 82.92, + "learning_rate": 8.554949460448315e-06, + "loss": 1.837, + "step": 28646500 + }, + { + "epoch": 82.92, + "learning_rate": 8.554225812801038e-06, + "loss": 1.8484, + "step": 28647000 + }, + { + "epoch": 82.92, + "learning_rate": 8.553502165153762e-06, + "loss": 1.8314, + "step": 28647500 + }, + { + "epoch": 82.92, + "learning_rate": 8.552778517506484e-06, + "loss": 1.8596, + "step": 28648000 + }, + { + "epoch": 82.93, + "learning_rate": 8.552056317154503e-06, + "loss": 1.8328, + "step": 28648500 + }, + { + "epoch": 82.93, + "learning_rate": 8.551332669507225e-06, + "loss": 1.8122, + "step": 28649000 + }, + { + "epoch": 82.93, + "learning_rate": 8.550609021859949e-06, + "loss": 1.8714, + "step": 28649500 + }, + { + "epoch": 82.93, + "learning_rate": 8.549885374212671e-06, + "loss": 1.8262, + "step": 28650000 + }, + { + "epoch": 82.93, + "learning_rate": 8.54916317386069e-06, + "loss": 1.8098, + "step": 28650500 + }, + { + "epoch": 82.93, + "learning_rate": 8.548439526213412e-06, + "loss": 1.8402, + "step": 28651000 + }, + { + "epoch": 82.93, + "learning_rate": 8.547715878566136e-06, + "loss": 1.8587, + "step": 28651500 + }, + { + "epoch": 82.94, + "learning_rate": 8.54699223091886e-06, + "loss": 1.8562, + "step": 28652000 + }, + { + "epoch": 82.94, + "learning_rate": 8.546268583271582e-06, + "loss": 1.8377, + "step": 28652500 + }, + { + "epoch": 82.94, + "learning_rate": 8.5455463829196e-06, + "loss": 1.819, + "step": 28653000 + }, + { + "epoch": 82.94, + "learning_rate": 8.544822735272324e-06, + "loss": 1.8415, + "step": 28653500 + }, + { + "epoch": 82.94, + "learning_rate": 8.544099087625047e-06, + "loss": 1.8537, + "step": 28654000 + }, + { + "epoch": 82.94, + "learning_rate": 8.543376887273065e-06, + "loss": 1.8301, + "step": 28654500 + }, + { + "epoch": 82.94, + "learning_rate": 8.542653239625787e-06, + "loss": 1.8421, + "step": 28655000 + }, + { + "epoch": 82.95, + "learning_rate": 8.541929591978511e-06, + "loss": 1.8311, + "step": 28655500 + }, + { + "epoch": 82.95, + "learning_rate": 8.541205944331235e-06, + "loss": 1.8311, + "step": 28656000 + }, + { + "epoch": 82.95, + "learning_rate": 8.540482296683957e-06, + "loss": 1.8402, + "step": 28656500 + }, + { + "epoch": 82.95, + "learning_rate": 8.539758649036681e-06, + "loss": 1.8473, + "step": 28657000 + }, + { + "epoch": 82.95, + "learning_rate": 8.539035001389403e-06, + "loss": 1.8241, + "step": 28657500 + }, + { + "epoch": 82.95, + "learning_rate": 8.538311353742127e-06, + "loss": 1.8271, + "step": 28658000 + }, + { + "epoch": 82.95, + "learning_rate": 8.537587706094851e-06, + "loss": 1.8187, + "step": 28658500 + }, + { + "epoch": 82.96, + "learning_rate": 8.536865505742868e-06, + "loss": 1.8231, + "step": 28659000 + }, + { + "epoch": 82.96, + "learning_rate": 8.53614185809559e-06, + "loss": 1.8409, + "step": 28659500 + }, + { + "epoch": 82.96, + "learning_rate": 8.535418210448314e-06, + "loss": 1.8413, + "step": 28660000 + }, + { + "epoch": 82.96, + "learning_rate": 8.534694562801038e-06, + "loss": 1.8463, + "step": 28660500 + }, + { + "epoch": 82.96, + "learning_rate": 8.53397091515376e-06, + "loss": 1.8611, + "step": 28661000 + }, + { + "epoch": 82.96, + "learning_rate": 8.533247267506485e-06, + "loss": 1.8282, + "step": 28661500 + }, + { + "epoch": 82.96, + "learning_rate": 8.532525067154502e-06, + "loss": 1.7978, + "step": 28662000 + }, + { + "epoch": 82.97, + "learning_rate": 8.531801419507226e-06, + "loss": 1.829, + "step": 28662500 + }, + { + "epoch": 82.97, + "learning_rate": 8.531079219155243e-06, + "loss": 1.8332, + "step": 28663000 + }, + { + "epoch": 82.97, + "learning_rate": 8.530355571507967e-06, + "loss": 1.83, + "step": 28663500 + }, + { + "epoch": 82.97, + "learning_rate": 8.529631923860689e-06, + "loss": 1.8597, + "step": 28664000 + }, + { + "epoch": 82.97, + "learning_rate": 8.528908276213413e-06, + "loss": 1.8296, + "step": 28664500 + }, + { + "epoch": 82.97, + "learning_rate": 8.528184628566135e-06, + "loss": 1.836, + "step": 28665000 + }, + { + "epoch": 82.97, + "learning_rate": 8.52746098091886e-06, + "loss": 1.854, + "step": 28665500 + }, + { + "epoch": 82.98, + "learning_rate": 8.526737333271583e-06, + "loss": 1.8243, + "step": 28666000 + }, + { + "epoch": 82.98, + "learning_rate": 8.526013685624305e-06, + "loss": 1.8226, + "step": 28666500 + }, + { + "epoch": 82.98, + "learning_rate": 8.52529003797703e-06, + "loss": 1.8301, + "step": 28667000 + }, + { + "epoch": 82.98, + "learning_rate": 8.524566390329752e-06, + "loss": 1.8566, + "step": 28667500 + }, + { + "epoch": 82.98, + "learning_rate": 8.523842742682475e-06, + "loss": 1.8444, + "step": 28668000 + }, + { + "epoch": 82.98, + "learning_rate": 8.523119095035198e-06, + "loss": 1.8206, + "step": 28668500 + }, + { + "epoch": 82.99, + "learning_rate": 8.522396894683217e-06, + "loss": 1.8227, + "step": 28669000 + }, + { + "epoch": 82.99, + "learning_rate": 8.52167324703594e-06, + "loss": 1.8123, + "step": 28669500 + }, + { + "epoch": 82.99, + "learning_rate": 8.520951046683958e-06, + "loss": 1.8587, + "step": 28670000 + }, + { + "epoch": 82.99, + "learning_rate": 8.52022739903668e-06, + "loss": 1.8301, + "step": 28670500 + }, + { + "epoch": 82.99, + "learning_rate": 8.519503751389404e-06, + "loss": 1.8423, + "step": 28671000 + }, + { + "epoch": 82.99, + "learning_rate": 8.518780103742128e-06, + "loss": 1.8202, + "step": 28671500 + }, + { + "epoch": 82.99, + "learning_rate": 8.51805645609485e-06, + "loss": 1.8189, + "step": 28672000 + }, + { + "epoch": 83.0, + "learning_rate": 8.517334255742867e-06, + "loss": 1.8269, + "step": 28672500 + }, + { + "epoch": 83.0, + "learning_rate": 8.516610608095591e-06, + "loss": 1.8158, + "step": 28673000 + }, + { + "epoch": 83.0, + "learning_rate": 8.515886960448315e-06, + "loss": 1.8249, + "step": 28673500 + }, + { + "epoch": 83.0, + "learning_rate": 8.515163312801037e-06, + "loss": 1.8303, + "step": 28674000 + }, + { + "epoch": 83.0, + "eval_accuracy": 0.687225884893444, + "eval_accuracy_mlm": 0.6562076438847384, + "eval_accuracy_nsp": 0.8535722960864922, + "eval_loss": 2.1801021099090576, + "eval_runtime": 331.764, + "eval_samples_per_second": 1315.351, + "eval_steps_per_second": 54.807, + "step": 28674176 + }, + { + "epoch": 83.0, + "learning_rate": 8.514439665153761e-06, + "loss": 1.8254, + "step": 28674500 + }, + { + "epoch": 83.0, + "learning_rate": 8.513717464801779e-06, + "loss": 1.8495, + "step": 28675000 + }, + { + "epoch": 83.0, + "learning_rate": 8.512993817154503e-06, + "loss": 1.8164, + "step": 28675500 + }, + { + "epoch": 83.01, + "learning_rate": 8.51227161680252e-06, + "loss": 1.8121, + "step": 28676000 + }, + { + "epoch": 83.01, + "learning_rate": 8.511547969155242e-06, + "loss": 1.8166, + "step": 28676500 + }, + { + "epoch": 83.01, + "learning_rate": 8.510824321507966e-06, + "loss": 1.8246, + "step": 28677000 + }, + { + "epoch": 83.01, + "learning_rate": 8.51010067386069e-06, + "loss": 1.8081, + "step": 28677500 + }, + { + "epoch": 83.01, + "learning_rate": 8.509377026213412e-06, + "loss": 1.7938, + "step": 28678000 + }, + { + "epoch": 83.01, + "learning_rate": 8.508653378566136e-06, + "loss": 1.8412, + "step": 28678500 + }, + { + "epoch": 83.01, + "learning_rate": 8.507931178214153e-06, + "loss": 1.8292, + "step": 28679000 + }, + { + "epoch": 83.02, + "learning_rate": 8.507207530566877e-06, + "loss": 1.8329, + "step": 28679500 + }, + { + "epoch": 83.02, + "learning_rate": 8.506485330214895e-06, + "loss": 1.8243, + "step": 28680000 + }, + { + "epoch": 83.02, + "learning_rate": 8.505761682567618e-06, + "loss": 1.8325, + "step": 28680500 + }, + { + "epoch": 83.02, + "learning_rate": 8.50503803492034e-06, + "loss": 1.8277, + "step": 28681000 + }, + { + "epoch": 83.02, + "learning_rate": 8.504314387273065e-06, + "loss": 1.7974, + "step": 28681500 + }, + { + "epoch": 83.02, + "learning_rate": 8.503590739625787e-06, + "loss": 1.81, + "step": 28682000 + }, + { + "epoch": 83.02, + "learning_rate": 8.50286709197851e-06, + "loss": 1.7936, + "step": 28682500 + }, + { + "epoch": 83.03, + "learning_rate": 8.502143444331235e-06, + "loss": 1.8275, + "step": 28683000 + }, + { + "epoch": 83.03, + "learning_rate": 8.501419796683957e-06, + "loss": 1.8421, + "step": 28683500 + }, + { + "epoch": 83.03, + "learning_rate": 8.500696149036681e-06, + "loss": 1.8323, + "step": 28684000 + }, + { + "epoch": 83.03, + "learning_rate": 8.499972501389405e-06, + "loss": 1.8137, + "step": 28684500 + }, + { + "epoch": 83.03, + "learning_rate": 8.499248853742127e-06, + "loss": 1.8433, + "step": 28685000 + }, + { + "epoch": 83.03, + "learning_rate": 8.49852520609485e-06, + "loss": 1.8188, + "step": 28685500 + }, + { + "epoch": 83.03, + "learning_rate": 8.497801558447573e-06, + "loss": 1.8444, + "step": 28686000 + }, + { + "epoch": 83.04, + "learning_rate": 8.497077910800297e-06, + "loss": 1.7865, + "step": 28686500 + }, + { + "epoch": 83.04, + "learning_rate": 8.49635426315302e-06, + "loss": 1.8267, + "step": 28687000 + }, + { + "epoch": 83.04, + "learning_rate": 8.495632062801037e-06, + "loss": 1.8301, + "step": 28687500 + }, + { + "epoch": 83.04, + "learning_rate": 8.494908415153762e-06, + "loss": 1.8153, + "step": 28688000 + }, + { + "epoch": 83.04, + "learning_rate": 8.494184767506484e-06, + "loss": 1.8184, + "step": 28688500 + }, + { + "epoch": 83.04, + "learning_rate": 8.493461119859207e-06, + "loss": 1.8243, + "step": 28689000 + }, + { + "epoch": 83.04, + "learning_rate": 8.492738919507224e-06, + "loss": 1.8226, + "step": 28689500 + }, + { + "epoch": 83.05, + "learning_rate": 8.49201527185995e-06, + "loss": 1.848, + "step": 28690000 + }, + { + "epoch": 83.05, + "learning_rate": 8.491291624212672e-06, + "loss": 1.8042, + "step": 28690500 + }, + { + "epoch": 83.05, + "learning_rate": 8.490567976565394e-06, + "loss": 1.8137, + "step": 28691000 + }, + { + "epoch": 83.05, + "learning_rate": 8.489845776213413e-06, + "loss": 1.8397, + "step": 28691500 + }, + { + "epoch": 83.05, + "learning_rate": 8.489122128566137e-06, + "loss": 1.8053, + "step": 28692000 + }, + { + "epoch": 83.05, + "learning_rate": 8.488398480918859e-06, + "loss": 1.806, + "step": 28692500 + }, + { + "epoch": 83.05, + "learning_rate": 8.487674833271581e-06, + "loss": 1.8324, + "step": 28693000 + }, + { + "epoch": 83.06, + "learning_rate": 8.486951185624307e-06, + "loss": 1.8516, + "step": 28693500 + }, + { + "epoch": 83.06, + "learning_rate": 8.48622753797703e-06, + "loss": 1.8303, + "step": 28694000 + }, + { + "epoch": 83.06, + "learning_rate": 8.485503890329751e-06, + "loss": 1.8139, + "step": 28694500 + }, + { + "epoch": 83.06, + "learning_rate": 8.484780242682475e-06, + "loss": 1.8336, + "step": 28695000 + }, + { + "epoch": 83.06, + "learning_rate": 8.4840565950352e-06, + "loss": 1.819, + "step": 28695500 + }, + { + "epoch": 83.06, + "learning_rate": 8.483334394683217e-06, + "loss": 1.831, + "step": 28696000 + }, + { + "epoch": 83.06, + "learning_rate": 8.482610747035939e-06, + "loss": 1.8414, + "step": 28696500 + }, + { + "epoch": 83.07, + "learning_rate": 8.481888546683956e-06, + "loss": 1.803, + "step": 28697000 + }, + { + "epoch": 83.07, + "learning_rate": 8.481164899036682e-06, + "loss": 1.8122, + "step": 28697500 + }, + { + "epoch": 83.07, + "learning_rate": 8.480441251389404e-06, + "loss": 1.8398, + "step": 28698000 + }, + { + "epoch": 83.07, + "learning_rate": 8.479717603742126e-06, + "loss": 1.7984, + "step": 28698500 + }, + { + "epoch": 83.07, + "learning_rate": 8.47899395609485e-06, + "loss": 1.8575, + "step": 28699000 + }, + { + "epoch": 83.07, + "learning_rate": 8.478270308447574e-06, + "loss": 1.8223, + "step": 28699500 + }, + { + "epoch": 83.07, + "learning_rate": 8.477546660800296e-06, + "loss": 1.8165, + "step": 28700000 + }, + { + "epoch": 83.08, + "learning_rate": 8.47682301315302e-06, + "loss": 1.8243, + "step": 28700500 + }, + { + "epoch": 83.08, + "learning_rate": 8.476100812801039e-06, + "loss": 1.8006, + "step": 28701000 + }, + { + "epoch": 83.08, + "learning_rate": 8.475377165153761e-06, + "loss": 1.8187, + "step": 28701500 + }, + { + "epoch": 83.08, + "learning_rate": 8.474653517506484e-06, + "loss": 1.8338, + "step": 28702000 + }, + { + "epoch": 83.08, + "learning_rate": 8.473929869859207e-06, + "loss": 1.8302, + "step": 28702500 + }, + { + "epoch": 83.08, + "learning_rate": 8.473206222211931e-06, + "loss": 1.8223, + "step": 28703000 + }, + { + "epoch": 83.08, + "learning_rate": 8.472482574564654e-06, + "loss": 1.7938, + "step": 28703500 + }, + { + "epoch": 83.09, + "learning_rate": 8.471758926917376e-06, + "loss": 1.8182, + "step": 28704000 + }, + { + "epoch": 83.09, + "learning_rate": 8.471036726565395e-06, + "loss": 1.8518, + "step": 28704500 + }, + { + "epoch": 83.09, + "learning_rate": 8.470313078918119e-06, + "loss": 1.82, + "step": 28705000 + }, + { + "epoch": 83.09, + "learning_rate": 8.469589431270841e-06, + "loss": 1.8405, + "step": 28705500 + }, + { + "epoch": 83.09, + "learning_rate": 8.468865783623565e-06, + "loss": 1.8045, + "step": 28706000 + }, + { + "epoch": 83.09, + "learning_rate": 8.468142135976289e-06, + "loss": 1.8214, + "step": 28706500 + }, + { + "epoch": 83.1, + "learning_rate": 8.467418488329011e-06, + "loss": 1.8155, + "step": 28707000 + }, + { + "epoch": 83.1, + "learning_rate": 8.466694840681733e-06, + "loss": 1.8045, + "step": 28707500 + }, + { + "epoch": 83.1, + "learning_rate": 8.465971193034459e-06, + "loss": 1.8159, + "step": 28708000 + }, + { + "epoch": 83.1, + "learning_rate": 8.465248992682476e-06, + "loss": 1.8163, + "step": 28708500 + }, + { + "epoch": 83.1, + "learning_rate": 8.464525345035198e-06, + "loss": 1.8122, + "step": 28709000 + }, + { + "epoch": 83.1, + "learning_rate": 8.46380169738792e-06, + "loss": 1.8337, + "step": 28709500 + }, + { + "epoch": 83.1, + "learning_rate": 8.46307949703594e-06, + "loss": 1.8132, + "step": 28710000 + }, + { + "epoch": 83.11, + "learning_rate": 8.462357296683959e-06, + "loss": 1.8283, + "step": 28710500 + }, + { + "epoch": 83.11, + "learning_rate": 8.46163364903668e-06, + "loss": 1.8366, + "step": 28711000 + }, + { + "epoch": 83.11, + "learning_rate": 8.460910001389403e-06, + "loss": 1.8314, + "step": 28711500 + }, + { + "epoch": 83.11, + "learning_rate": 8.460186353742127e-06, + "loss": 1.8366, + "step": 28712000 + }, + { + "epoch": 83.11, + "learning_rate": 8.45946270609485e-06, + "loss": 1.8068, + "step": 28712500 + }, + { + "epoch": 83.11, + "learning_rate": 8.458739058447573e-06, + "loss": 1.8367, + "step": 28713000 + }, + { + "epoch": 83.11, + "learning_rate": 8.458015410800297e-06, + "loss": 1.8315, + "step": 28713500 + }, + { + "epoch": 83.12, + "learning_rate": 8.457291763153021e-06, + "loss": 1.8191, + "step": 28714000 + }, + { + "epoch": 83.12, + "learning_rate": 8.456568115505743e-06, + "loss": 1.8274, + "step": 28714500 + }, + { + "epoch": 83.12, + "learning_rate": 8.455844467858465e-06, + "loss": 1.807, + "step": 28715000 + }, + { + "epoch": 83.12, + "learning_rate": 8.455122267506484e-06, + "loss": 1.8183, + "step": 28715500 + }, + { + "epoch": 83.12, + "learning_rate": 8.454400067154503e-06, + "loss": 1.8307, + "step": 28716000 + }, + { + "epoch": 83.12, + "learning_rate": 8.453676419507226e-06, + "loss": 1.8307, + "step": 28716500 + }, + { + "epoch": 83.12, + "learning_rate": 8.452952771859948e-06, + "loss": 1.8307, + "step": 28717000 + }, + { + "epoch": 83.13, + "learning_rate": 8.452229124212672e-06, + "loss": 1.8421, + "step": 28717500 + }, + { + "epoch": 83.13, + "learning_rate": 8.451505476565396e-06, + "loss": 1.8123, + "step": 28718000 + }, + { + "epoch": 83.13, + "learning_rate": 8.450781828918118e-06, + "loss": 1.8319, + "step": 28718500 + }, + { + "epoch": 83.13, + "learning_rate": 8.450058181270842e-06, + "loss": 1.8179, + "step": 28719000 + }, + { + "epoch": 83.13, + "learning_rate": 8.449334533623566e-06, + "loss": 1.8224, + "step": 28719500 + }, + { + "epoch": 83.13, + "learning_rate": 8.448610885976288e-06, + "loss": 1.8335, + "step": 28720000 + }, + { + "epoch": 83.13, + "learning_rate": 8.447888685624305e-06, + "loss": 1.8402, + "step": 28720500 + }, + { + "epoch": 83.14, + "learning_rate": 8.447165037977029e-06, + "loss": 1.8365, + "step": 28721000 + }, + { + "epoch": 83.14, + "learning_rate": 8.446441390329753e-06, + "loss": 1.8157, + "step": 28721500 + }, + { + "epoch": 83.14, + "learning_rate": 8.445717742682475e-06, + "loss": 1.8243, + "step": 28722000 + }, + { + "epoch": 83.14, + "learning_rate": 8.444995542330493e-06, + "loss": 1.8181, + "step": 28722500 + }, + { + "epoch": 83.14, + "learning_rate": 8.44427334197851e-06, + "loss": 1.8086, + "step": 28723000 + }, + { + "epoch": 83.14, + "learning_rate": 8.443549694331235e-06, + "loss": 1.8065, + "step": 28723500 + }, + { + "epoch": 83.14, + "learning_rate": 8.442826046683958e-06, + "loss": 1.8283, + "step": 28724000 + }, + { + "epoch": 83.15, + "learning_rate": 8.44210239903668e-06, + "loss": 1.8231, + "step": 28724500 + }, + { + "epoch": 83.15, + "learning_rate": 8.441378751389404e-06, + "loss": 1.7976, + "step": 28725000 + }, + { + "epoch": 83.15, + "learning_rate": 8.440655103742128e-06, + "loss": 1.8206, + "step": 28725500 + }, + { + "epoch": 83.15, + "learning_rate": 8.43993145609485e-06, + "loss": 1.8042, + "step": 28726000 + }, + { + "epoch": 83.15, + "learning_rate": 8.439207808447574e-06, + "loss": 1.8385, + "step": 28726500 + }, + { + "epoch": 83.15, + "learning_rate": 8.438484160800298e-06, + "loss": 1.8249, + "step": 28727000 + }, + { + "epoch": 83.15, + "learning_rate": 8.43776051315302e-06, + "loss": 1.8275, + "step": 28727500 + }, + { + "epoch": 83.16, + "learning_rate": 8.437036865505742e-06, + "loss": 1.8431, + "step": 28728000 + }, + { + "epoch": 83.16, + "learning_rate": 8.436313217858466e-06, + "loss": 1.8389, + "step": 28728500 + }, + { + "epoch": 83.16, + "learning_rate": 8.43558957021119e-06, + "loss": 1.8422, + "step": 28729000 + }, + { + "epoch": 83.16, + "learning_rate": 8.434865922563912e-06, + "loss": 1.8327, + "step": 28729500 + }, + { + "epoch": 83.16, + "learning_rate": 8.434142274916636e-06, + "loss": 1.8088, + "step": 28730000 + }, + { + "epoch": 83.16, + "learning_rate": 8.433420074564655e-06, + "loss": 1.8367, + "step": 28730500 + }, + { + "epoch": 83.16, + "learning_rate": 8.432696426917377e-06, + "loss": 1.8296, + "step": 28731000 + }, + { + "epoch": 83.17, + "learning_rate": 8.4319727792701e-06, + "loss": 1.8361, + "step": 28731500 + }, + { + "epoch": 83.17, + "learning_rate": 8.431249131622824e-06, + "loss": 1.8283, + "step": 28732000 + }, + { + "epoch": 83.17, + "learning_rate": 8.430525483975548e-06, + "loss": 1.841, + "step": 28732500 + }, + { + "epoch": 83.17, + "learning_rate": 8.42980183632827e-06, + "loss": 1.8105, + "step": 28733000 + }, + { + "epoch": 83.17, + "learning_rate": 8.429078188680994e-06, + "loss": 1.8384, + "step": 28733500 + }, + { + "epoch": 83.17, + "learning_rate": 8.428355988329011e-06, + "loss": 1.8336, + "step": 28734000 + }, + { + "epoch": 83.17, + "learning_rate": 8.427632340681735e-06, + "loss": 1.8189, + "step": 28734500 + }, + { + "epoch": 83.18, + "learning_rate": 8.426908693034457e-06, + "loss": 1.836, + "step": 28735000 + }, + { + "epoch": 83.18, + "learning_rate": 8.426185045387181e-06, + "loss": 1.8075, + "step": 28735500 + }, + { + "epoch": 83.18, + "learning_rate": 8.425461397739905e-06, + "loss": 1.8337, + "step": 28736000 + }, + { + "epoch": 83.18, + "learning_rate": 8.424737750092627e-06, + "loss": 1.7994, + "step": 28736500 + }, + { + "epoch": 83.18, + "learning_rate": 8.424015549740644e-06, + "loss": 1.8136, + "step": 28737000 + }, + { + "epoch": 83.18, + "learning_rate": 8.423291902093368e-06, + "loss": 1.7992, + "step": 28737500 + }, + { + "epoch": 83.18, + "learning_rate": 8.422568254446092e-06, + "loss": 1.8304, + "step": 28738000 + }, + { + "epoch": 83.19, + "learning_rate": 8.421844606798815e-06, + "loss": 1.8181, + "step": 28738500 + }, + { + "epoch": 83.19, + "learning_rate": 8.421120959151538e-06, + "loss": 1.8149, + "step": 28739000 + }, + { + "epoch": 83.19, + "learning_rate": 8.42039731150426e-06, + "loss": 1.8088, + "step": 28739500 + }, + { + "epoch": 83.19, + "learning_rate": 8.41967511115228e-06, + "loss": 1.8259, + "step": 28740000 + }, + { + "epoch": 83.19, + "learning_rate": 8.418951463505002e-06, + "loss": 1.838, + "step": 28740500 + }, + { + "epoch": 83.19, + "learning_rate": 8.418227815857726e-06, + "loss": 1.8466, + "step": 28741000 + }, + { + "epoch": 83.19, + "learning_rate": 8.41750416821045e-06, + "loss": 1.8039, + "step": 28741500 + }, + { + "epoch": 83.2, + "learning_rate": 8.416780520563172e-06, + "loss": 1.8311, + "step": 28742000 + }, + { + "epoch": 83.2, + "learning_rate": 8.41605832021119e-06, + "loss": 1.8247, + "step": 28742500 + }, + { + "epoch": 83.2, + "learning_rate": 8.415336119859208e-06, + "loss": 1.8006, + "step": 28743000 + }, + { + "epoch": 83.2, + "learning_rate": 8.41461247221193e-06, + "loss": 1.8308, + "step": 28743500 + }, + { + "epoch": 83.2, + "learning_rate": 8.413888824564654e-06, + "loss": 1.8306, + "step": 28744000 + }, + { + "epoch": 83.2, + "learning_rate": 8.413165176917377e-06, + "loss": 1.8031, + "step": 28744500 + }, + { + "epoch": 83.21, + "learning_rate": 8.4124415292701e-06, + "loss": 1.8131, + "step": 28745000 + }, + { + "epoch": 83.21, + "learning_rate": 8.411717881622824e-06, + "loss": 1.8525, + "step": 28745500 + }, + { + "epoch": 83.21, + "learning_rate": 8.410995681270842e-06, + "loss": 1.8562, + "step": 28746000 + }, + { + "epoch": 83.21, + "learning_rate": 8.410272033623564e-06, + "loss": 1.8366, + "step": 28746500 + }, + { + "epoch": 83.21, + "learning_rate": 8.409548385976288e-06, + "loss": 1.7926, + "step": 28747000 + }, + { + "epoch": 83.21, + "learning_rate": 8.408824738329012e-06, + "loss": 1.8068, + "step": 28747500 + }, + { + "epoch": 83.21, + "learning_rate": 8.408101090681734e-06, + "loss": 1.8556, + "step": 28748000 + }, + { + "epoch": 83.22, + "learning_rate": 8.407377443034458e-06, + "loss": 1.8362, + "step": 28748500 + }, + { + "epoch": 83.22, + "learning_rate": 8.40665379538718e-06, + "loss": 1.8009, + "step": 28749000 + }, + { + "epoch": 83.22, + "learning_rate": 8.405930147739904e-06, + "loss": 1.8361, + "step": 28749500 + }, + { + "epoch": 83.22, + "learning_rate": 8.405206500092628e-06, + "loss": 1.8001, + "step": 28750000 + }, + { + "epoch": 83.22, + "learning_rate": 8.404484299740645e-06, + "loss": 1.8239, + "step": 28750500 + }, + { + "epoch": 83.22, + "learning_rate": 8.40376065209337e-06, + "loss": 1.8227, + "step": 28751000 + }, + { + "epoch": 83.22, + "learning_rate": 8.403037004446091e-06, + "loss": 1.8195, + "step": 28751500 + }, + { + "epoch": 83.23, + "learning_rate": 8.402313356798815e-06, + "loss": 1.8449, + "step": 28752000 + }, + { + "epoch": 83.23, + "learning_rate": 8.401589709151538e-06, + "loss": 1.8322, + "step": 28752500 + }, + { + "epoch": 83.23, + "learning_rate": 8.400866061504262e-06, + "loss": 1.8197, + "step": 28753000 + }, + { + "epoch": 83.23, + "learning_rate": 8.400142413856984e-06, + "loss": 1.861, + "step": 28753500 + }, + { + "epoch": 83.23, + "learning_rate": 8.399420213505003e-06, + "loss": 1.8365, + "step": 28754000 + }, + { + "epoch": 83.23, + "learning_rate": 8.398696565857725e-06, + "loss": 1.8226, + "step": 28754500 + }, + { + "epoch": 83.23, + "learning_rate": 8.397972918210449e-06, + "loss": 1.8119, + "step": 28755000 + }, + { + "epoch": 83.24, + "learning_rate": 8.397249270563173e-06, + "loss": 1.8112, + "step": 28755500 + }, + { + "epoch": 83.24, + "learning_rate": 8.396528517506485e-06, + "loss": 1.8356, + "step": 28756000 + }, + { + "epoch": 83.24, + "learning_rate": 8.395804869859207e-06, + "loss": 1.8347, + "step": 28756500 + }, + { + "epoch": 83.24, + "learning_rate": 8.395081222211931e-06, + "loss": 1.8428, + "step": 28757000 + }, + { + "epoch": 83.24, + "learning_rate": 8.394357574564653e-06, + "loss": 1.8291, + "step": 28757500 + }, + { + "epoch": 83.24, + "learning_rate": 8.393633926917377e-06, + "loss": 1.8306, + "step": 28758000 + }, + { + "epoch": 83.24, + "learning_rate": 8.3929102792701e-06, + "loss": 1.8298, + "step": 28758500 + }, + { + "epoch": 83.25, + "learning_rate": 8.392186631622824e-06, + "loss": 1.8381, + "step": 28759000 + }, + { + "epoch": 83.25, + "learning_rate": 8.391462983975547e-06, + "loss": 1.8123, + "step": 28759500 + }, + { + "epoch": 83.25, + "learning_rate": 8.39073933632827e-06, + "loss": 1.8257, + "step": 28760000 + }, + { + "epoch": 83.25, + "learning_rate": 8.390017135976289e-06, + "loss": 1.85, + "step": 28760500 + }, + { + "epoch": 83.25, + "learning_rate": 8.389293488329011e-06, + "loss": 1.8274, + "step": 28761000 + }, + { + "epoch": 83.25, + "learning_rate": 8.388569840681735e-06, + "loss": 1.8243, + "step": 28761500 + }, + { + "epoch": 83.25, + "learning_rate": 8.387846193034457e-06, + "loss": 1.849, + "step": 28762000 + }, + { + "epoch": 83.26, + "learning_rate": 8.387122545387181e-06, + "loss": 1.8079, + "step": 28762500 + }, + { + "epoch": 83.26, + "learning_rate": 8.386398897739905e-06, + "loss": 1.8406, + "step": 28763000 + }, + { + "epoch": 83.26, + "learning_rate": 8.385675250092627e-06, + "loss": 1.8249, + "step": 28763500 + }, + { + "epoch": 83.26, + "learning_rate": 8.384953049740644e-06, + "loss": 1.8347, + "step": 28764000 + }, + { + "epoch": 83.26, + "learning_rate": 8.384229402093368e-06, + "loss": 1.8125, + "step": 28764500 + }, + { + "epoch": 83.26, + "learning_rate": 8.383505754446092e-06, + "loss": 1.838, + "step": 28765000 + }, + { + "epoch": 83.26, + "learning_rate": 8.382782106798814e-06, + "loss": 1.8367, + "step": 28765500 + }, + { + "epoch": 83.27, + "learning_rate": 8.382059906446832e-06, + "loss": 1.8144, + "step": 28766000 + }, + { + "epoch": 83.27, + "learning_rate": 8.38133770609485e-06, + "loss": 1.813, + "step": 28766500 + }, + { + "epoch": 83.27, + "learning_rate": 8.380614058447573e-06, + "loss": 1.8348, + "step": 28767000 + }, + { + "epoch": 83.27, + "learning_rate": 8.379890410800297e-06, + "loss": 1.8301, + "step": 28767500 + }, + { + "epoch": 83.27, + "learning_rate": 8.379166763153019e-06, + "loss": 1.8282, + "step": 28768000 + }, + { + "epoch": 83.27, + "learning_rate": 8.378443115505743e-06, + "loss": 1.8081, + "step": 28768500 + }, + { + "epoch": 83.27, + "learning_rate": 8.377719467858467e-06, + "loss": 1.8173, + "step": 28769000 + }, + { + "epoch": 83.28, + "learning_rate": 8.376995820211189e-06, + "loss": 1.8356, + "step": 28769500 + }, + { + "epoch": 83.28, + "learning_rate": 8.376272172563913e-06, + "loss": 1.8302, + "step": 28770000 + }, + { + "epoch": 83.28, + "learning_rate": 8.375548524916637e-06, + "loss": 1.8119, + "step": 28770500 + }, + { + "epoch": 83.28, + "learning_rate": 8.37482487726936e-06, + "loss": 1.8298, + "step": 28771000 + }, + { + "epoch": 83.28, + "learning_rate": 8.374101229622083e-06, + "loss": 1.8197, + "step": 28771500 + }, + { + "epoch": 83.28, + "learning_rate": 8.373377581974805e-06, + "loss": 1.8495, + "step": 28772000 + }, + { + "epoch": 83.28, + "learning_rate": 8.372655381622824e-06, + "loss": 1.7945, + "step": 28772500 + }, + { + "epoch": 83.29, + "learning_rate": 8.371933181270842e-06, + "loss": 1.8451, + "step": 28773000 + }, + { + "epoch": 83.29, + "learning_rate": 8.371210980918859e-06, + "loss": 1.8223, + "step": 28773500 + }, + { + "epoch": 83.29, + "learning_rate": 8.370487333271583e-06, + "loss": 1.8307, + "step": 28774000 + }, + { + "epoch": 83.29, + "learning_rate": 8.369763685624307e-06, + "loss": 1.8161, + "step": 28774500 + }, + { + "epoch": 83.29, + "learning_rate": 8.369040037977029e-06, + "loss": 1.829, + "step": 28775000 + }, + { + "epoch": 83.29, + "learning_rate": 8.368316390329751e-06, + "loss": 1.8446, + "step": 28775500 + }, + { + "epoch": 83.29, + "learning_rate": 8.367592742682475e-06, + "loss": 1.8248, + "step": 28776000 + }, + { + "epoch": 83.3, + "learning_rate": 8.366869095035199e-06, + "loss": 1.8326, + "step": 28776500 + }, + { + "epoch": 83.3, + "learning_rate": 8.366146894683216e-06, + "loss": 1.8366, + "step": 28777000 + }, + { + "epoch": 83.3, + "learning_rate": 8.36542324703594e-06, + "loss": 1.8463, + "step": 28777500 + }, + { + "epoch": 83.3, + "learning_rate": 8.364699599388662e-06, + "loss": 1.8301, + "step": 28778000 + }, + { + "epoch": 83.3, + "learning_rate": 8.363975951741386e-06, + "loss": 1.8253, + "step": 28778500 + }, + { + "epoch": 83.3, + "learning_rate": 8.363252304094109e-06, + "loss": 1.836, + "step": 28779000 + }, + { + "epoch": 83.3, + "learning_rate": 8.362528656446832e-06, + "loss": 1.8248, + "step": 28779500 + }, + { + "epoch": 83.31, + "learning_rate": 8.361805008799556e-06, + "loss": 1.8094, + "step": 28780000 + }, + { + "epoch": 83.31, + "learning_rate": 8.361081361152279e-06, + "loss": 1.8224, + "step": 28780500 + }, + { + "epoch": 83.31, + "learning_rate": 8.360357713505003e-06, + "loss": 1.8163, + "step": 28781000 + }, + { + "epoch": 83.31, + "learning_rate": 8.35963551315302e-06, + "loss": 1.8261, + "step": 28781500 + }, + { + "epoch": 83.31, + "learning_rate": 8.358911865505744e-06, + "loss": 1.8349, + "step": 28782000 + }, + { + "epoch": 83.31, + "learning_rate": 8.358188217858466e-06, + "loss": 1.8104, + "step": 28782500 + }, + { + "epoch": 83.32, + "learning_rate": 8.35746457021119e-06, + "loss": 1.8586, + "step": 28783000 + }, + { + "epoch": 83.32, + "learning_rate": 8.356740922563914e-06, + "loss": 1.8259, + "step": 28783500 + }, + { + "epoch": 83.32, + "learning_rate": 8.356018722211931e-06, + "loss": 1.8155, + "step": 28784000 + }, + { + "epoch": 83.32, + "learning_rate": 8.355295074564653e-06, + "loss": 1.8112, + "step": 28784500 + }, + { + "epoch": 83.32, + "learning_rate": 8.354571426917377e-06, + "loss": 1.802, + "step": 28785000 + }, + { + "epoch": 83.32, + "learning_rate": 8.353847779270101e-06, + "loss": 1.8261, + "step": 28785500 + }, + { + "epoch": 83.32, + "learning_rate": 8.353124131622823e-06, + "loss": 1.8077, + "step": 28786000 + }, + { + "epoch": 83.33, + "learning_rate": 8.352403378566136e-06, + "loss": 1.7971, + "step": 28786500 + }, + { + "epoch": 83.33, + "learning_rate": 8.35167973091886e-06, + "loss": 1.8151, + "step": 28787000 + }, + { + "epoch": 83.33, + "learning_rate": 8.350956083271584e-06, + "loss": 1.8239, + "step": 28787500 + }, + { + "epoch": 83.33, + "learning_rate": 8.350232435624306e-06, + "loss": 1.8187, + "step": 28788000 + }, + { + "epoch": 83.33, + "learning_rate": 8.349508787977028e-06, + "loss": 1.8502, + "step": 28788500 + }, + { + "epoch": 83.33, + "learning_rate": 8.348785140329752e-06, + "loss": 1.8255, + "step": 28789000 + }, + { + "epoch": 83.33, + "learning_rate": 8.348061492682476e-06, + "loss": 1.8353, + "step": 28789500 + }, + { + "epoch": 83.34, + "learning_rate": 8.347337845035198e-06, + "loss": 1.8262, + "step": 28790000 + }, + { + "epoch": 83.34, + "learning_rate": 8.346615644683215e-06, + "loss": 1.8205, + "step": 28790500 + }, + { + "epoch": 83.34, + "learning_rate": 8.34589199703594e-06, + "loss": 1.8002, + "step": 28791000 + }, + { + "epoch": 83.34, + "learning_rate": 8.345168349388663e-06, + "loss": 1.8387, + "step": 28791500 + }, + { + "epoch": 83.34, + "learning_rate": 8.344444701741385e-06, + "loss": 1.8057, + "step": 28792000 + }, + { + "epoch": 83.34, + "learning_rate": 8.34372105409411e-06, + "loss": 1.818, + "step": 28792500 + }, + { + "epoch": 83.34, + "learning_rate": 8.342997406446833e-06, + "loss": 1.8135, + "step": 28793000 + }, + { + "epoch": 83.35, + "learning_rate": 8.34227520609485e-06, + "loss": 1.8305, + "step": 28793500 + }, + { + "epoch": 83.35, + "learning_rate": 8.341551558447573e-06, + "loss": 1.7949, + "step": 28794000 + }, + { + "epoch": 83.35, + "learning_rate": 8.340827910800297e-06, + "loss": 1.8449, + "step": 28794500 + }, + { + "epoch": 83.35, + "learning_rate": 8.340105710448316e-06, + "loss": 1.8308, + "step": 28795000 + }, + { + "epoch": 83.35, + "learning_rate": 8.339382062801038e-06, + "loss": 1.8322, + "step": 28795500 + }, + { + "epoch": 83.35, + "learning_rate": 8.33865841515376e-06, + "loss": 1.8268, + "step": 28796000 + }, + { + "epoch": 83.35, + "learning_rate": 8.337934767506484e-06, + "loss": 1.8421, + "step": 28796500 + }, + { + "epoch": 83.36, + "learning_rate": 8.337211119859208e-06, + "loss": 1.8403, + "step": 28797000 + }, + { + "epoch": 83.36, + "learning_rate": 8.33648747221193e-06, + "loss": 1.823, + "step": 28797500 + }, + { + "epoch": 83.36, + "learning_rate": 8.335763824564654e-06, + "loss": 1.8173, + "step": 28798000 + }, + { + "epoch": 83.36, + "learning_rate": 8.335040176917378e-06, + "loss": 1.8309, + "step": 28798500 + }, + { + "epoch": 83.36, + "learning_rate": 8.334317976565395e-06, + "loss": 1.8388, + "step": 28799000 + }, + { + "epoch": 83.36, + "learning_rate": 8.333594328918118e-06, + "loss": 1.831, + "step": 28799500 + }, + { + "epoch": 83.36, + "learning_rate": 8.332870681270841e-06, + "loss": 1.8115, + "step": 28800000 + }, + { + "epoch": 83.37, + "learning_rate": 8.332147033623565e-06, + "loss": 1.819, + "step": 28800500 + }, + { + "epoch": 83.37, + "learning_rate": 8.331423385976288e-06, + "loss": 1.8343, + "step": 28801000 + }, + { + "epoch": 83.37, + "learning_rate": 8.33069973832901e-06, + "loss": 1.8129, + "step": 28801500 + }, + { + "epoch": 83.37, + "learning_rate": 8.329976090681735e-06, + "loss": 1.835, + "step": 28802000 + }, + { + "epoch": 83.37, + "learning_rate": 8.329252443034458e-06, + "loss": 1.8292, + "step": 28802500 + }, + { + "epoch": 83.37, + "learning_rate": 8.328530242682475e-06, + "loss": 1.8259, + "step": 28803000 + }, + { + "epoch": 83.37, + "learning_rate": 8.327806595035197e-06, + "loss": 1.8386, + "step": 28803500 + }, + { + "epoch": 83.38, + "learning_rate": 8.327084394683216e-06, + "loss": 1.853, + "step": 28804000 + }, + { + "epoch": 83.38, + "learning_rate": 8.32636074703594e-06, + "loss": 1.8247, + "step": 28804500 + }, + { + "epoch": 83.38, + "learning_rate": 8.325637099388662e-06, + "loss": 1.8168, + "step": 28805000 + }, + { + "epoch": 83.38, + "learning_rate": 8.324913451741386e-06, + "loss": 1.8183, + "step": 28805500 + }, + { + "epoch": 83.38, + "learning_rate": 8.32418980409411e-06, + "loss": 1.8354, + "step": 28806000 + }, + { + "epoch": 83.38, + "learning_rate": 8.323466156446832e-06, + "loss": 1.8462, + "step": 28806500 + }, + { + "epoch": 83.38, + "learning_rate": 8.32274395609485e-06, + "loss": 1.838, + "step": 28807000 + }, + { + "epoch": 83.39, + "learning_rate": 8.322020308447574e-06, + "loss": 1.8241, + "step": 28807500 + }, + { + "epoch": 83.39, + "learning_rate": 8.321296660800297e-06, + "loss": 1.816, + "step": 28808000 + }, + { + "epoch": 83.39, + "learning_rate": 8.32057301315302e-06, + "loss": 1.8443, + "step": 28808500 + }, + { + "epoch": 83.39, + "learning_rate": 8.319849365505742e-06, + "loss": 1.8436, + "step": 28809000 + }, + { + "epoch": 83.39, + "learning_rate": 8.319125717858468e-06, + "loss": 1.8194, + "step": 28809500 + }, + { + "epoch": 83.39, + "learning_rate": 8.318403517506485e-06, + "loss": 1.8342, + "step": 28810000 + }, + { + "epoch": 83.39, + "learning_rate": 8.317679869859207e-06, + "loss": 1.8208, + "step": 28810500 + }, + { + "epoch": 83.4, + "learning_rate": 8.316957669507224e-06, + "loss": 1.8128, + "step": 28811000 + }, + { + "epoch": 83.4, + "learning_rate": 8.31623402185995e-06, + "loss": 1.8281, + "step": 28811500 + }, + { + "epoch": 83.4, + "learning_rate": 8.315510374212672e-06, + "loss": 1.8153, + "step": 28812000 + }, + { + "epoch": 83.4, + "learning_rate": 8.314786726565394e-06, + "loss": 1.811, + "step": 28812500 + }, + { + "epoch": 83.4, + "learning_rate": 8.314063078918118e-06, + "loss": 1.8122, + "step": 28813000 + }, + { + "epoch": 83.4, + "learning_rate": 8.313339431270842e-06, + "loss": 1.8541, + "step": 28813500 + }, + { + "epoch": 83.4, + "learning_rate": 8.312615783623564e-06, + "loss": 1.8201, + "step": 28814000 + }, + { + "epoch": 83.41, + "learning_rate": 8.311895030566877e-06, + "loss": 1.8314, + "step": 28814500 + }, + { + "epoch": 83.41, + "learning_rate": 8.311171382919599e-06, + "loss": 1.8207, + "step": 28815000 + }, + { + "epoch": 83.41, + "learning_rate": 8.310447735272325e-06, + "loss": 1.8367, + "step": 28815500 + }, + { + "epoch": 83.41, + "learning_rate": 8.309724087625047e-06, + "loss": 1.8416, + "step": 28816000 + }, + { + "epoch": 83.41, + "learning_rate": 8.309000439977769e-06, + "loss": 1.8369, + "step": 28816500 + }, + { + "epoch": 83.41, + "learning_rate": 8.308276792330493e-06, + "loss": 1.8331, + "step": 28817000 + }, + { + "epoch": 83.41, + "learning_rate": 8.307553144683217e-06, + "loss": 1.8272, + "step": 28817500 + }, + { + "epoch": 83.42, + "learning_rate": 8.30682949703594e-06, + "loss": 1.8367, + "step": 28818000 + }, + { + "epoch": 83.42, + "learning_rate": 8.306105849388663e-06, + "loss": 1.8194, + "step": 28818500 + }, + { + "epoch": 83.42, + "learning_rate": 8.305382201741387e-06, + "loss": 1.8357, + "step": 28819000 + }, + { + "epoch": 83.42, + "learning_rate": 8.30465855409411e-06, + "loss": 1.8405, + "step": 28819500 + }, + { + "epoch": 83.42, + "learning_rate": 8.303936353742127e-06, + "loss": 1.8075, + "step": 28820000 + }, + { + "epoch": 83.42, + "learning_rate": 8.30321270609485e-06, + "loss": 1.8165, + "step": 28820500 + }, + { + "epoch": 83.42, + "learning_rate": 8.302489058447574e-06, + "loss": 1.8112, + "step": 28821000 + }, + { + "epoch": 83.43, + "learning_rate": 8.301765410800297e-06, + "loss": 1.8355, + "step": 28821500 + }, + { + "epoch": 83.43, + "learning_rate": 8.301041763153019e-06, + "loss": 1.8112, + "step": 28822000 + }, + { + "epoch": 83.43, + "learning_rate": 8.300318115505744e-06, + "loss": 1.7968, + "step": 28822500 + }, + { + "epoch": 83.43, + "learning_rate": 8.299595915153762e-06, + "loss": 1.8276, + "step": 28823000 + }, + { + "epoch": 83.43, + "learning_rate": 8.298872267506484e-06, + "loss": 1.8221, + "step": 28823500 + }, + { + "epoch": 83.43, + "learning_rate": 8.298148619859208e-06, + "loss": 1.8378, + "step": 28824000 + }, + { + "epoch": 83.44, + "learning_rate": 8.297424972211932e-06, + "loss": 1.8157, + "step": 28824500 + }, + { + "epoch": 83.44, + "learning_rate": 8.296701324564654e-06, + "loss": 1.7994, + "step": 28825000 + }, + { + "epoch": 83.44, + "learning_rate": 8.295977676917376e-06, + "loss": 1.8249, + "step": 28825500 + }, + { + "epoch": 83.44, + "learning_rate": 8.2952540292701e-06, + "loss": 1.7955, + "step": 28826000 + }, + { + "epoch": 83.44, + "learning_rate": 8.294531828918119e-06, + "loss": 1.8157, + "step": 28826500 + }, + { + "epoch": 83.44, + "learning_rate": 8.293808181270841e-06, + "loss": 1.7958, + "step": 28827000 + }, + { + "epoch": 83.44, + "learning_rate": 8.293084533623564e-06, + "loss": 1.8144, + "step": 28827500 + }, + { + "epoch": 83.45, + "learning_rate": 8.292362333271583e-06, + "loss": 1.8252, + "step": 28828000 + }, + { + "epoch": 83.45, + "learning_rate": 8.291638685624306e-06, + "loss": 1.8399, + "step": 28828500 + }, + { + "epoch": 83.45, + "learning_rate": 8.290915037977029e-06, + "loss": 1.8336, + "step": 28829000 + }, + { + "epoch": 83.45, + "learning_rate": 8.290191390329753e-06, + "loss": 1.8193, + "step": 28829500 + }, + { + "epoch": 83.45, + "learning_rate": 8.289467742682477e-06, + "loss": 1.839, + "step": 28830000 + }, + { + "epoch": 83.45, + "learning_rate": 8.288744095035199e-06, + "loss": 1.8552, + "step": 28830500 + }, + { + "epoch": 83.45, + "learning_rate": 8.288020447387921e-06, + "loss": 1.8087, + "step": 28831000 + }, + { + "epoch": 83.46, + "learning_rate": 8.287296799740645e-06, + "loss": 1.8302, + "step": 28831500 + }, + { + "epoch": 83.46, + "learning_rate": 8.286573152093369e-06, + "loss": 1.7973, + "step": 28832000 + }, + { + "epoch": 83.46, + "learning_rate": 8.285849504446091e-06, + "loss": 1.8144, + "step": 28832500 + }, + { + "epoch": 83.46, + "learning_rate": 8.285125856798815e-06, + "loss": 1.8402, + "step": 28833000 + }, + { + "epoch": 83.46, + "learning_rate": 8.284402209151539e-06, + "loss": 1.8143, + "step": 28833500 + }, + { + "epoch": 83.46, + "learning_rate": 8.283678561504261e-06, + "loss": 1.8508, + "step": 28834000 + }, + { + "epoch": 83.46, + "learning_rate": 8.282956361152278e-06, + "loss": 1.8576, + "step": 28834500 + }, + { + "epoch": 83.47, + "learning_rate": 8.282232713505002e-06, + "loss": 1.8521, + "step": 28835000 + }, + { + "epoch": 83.47, + "learning_rate": 8.281509065857726e-06, + "loss": 1.8471, + "step": 28835500 + }, + { + "epoch": 83.47, + "learning_rate": 8.280786865505744e-06, + "loss": 1.8467, + "step": 28836000 + }, + { + "epoch": 83.47, + "learning_rate": 8.280063217858466e-06, + "loss": 1.8143, + "step": 28836500 + }, + { + "epoch": 83.47, + "learning_rate": 8.27933957021119e-06, + "loss": 1.8256, + "step": 28837000 + }, + { + "epoch": 83.47, + "learning_rate": 8.278615922563914e-06, + "loss": 1.8411, + "step": 28837500 + }, + { + "epoch": 83.47, + "learning_rate": 8.277892274916636e-06, + "loss": 1.8224, + "step": 28838000 + }, + { + "epoch": 83.48, + "learning_rate": 8.27716862726936e-06, + "loss": 1.8342, + "step": 28838500 + }, + { + "epoch": 83.48, + "learning_rate": 8.276444979622084e-06, + "loss": 1.8403, + "step": 28839000 + }, + { + "epoch": 83.48, + "learning_rate": 8.275721331974806e-06, + "loss": 1.8142, + "step": 28839500 + }, + { + "epoch": 83.48, + "learning_rate": 8.274997684327528e-06, + "loss": 1.8208, + "step": 28840000 + }, + { + "epoch": 83.48, + "learning_rate": 8.274274036680252e-06, + "loss": 1.8275, + "step": 28840500 + }, + { + "epoch": 83.48, + "learning_rate": 8.273551836328271e-06, + "loss": 1.8426, + "step": 28841000 + }, + { + "epoch": 83.48, + "learning_rate": 8.272828188680993e-06, + "loss": 1.8418, + "step": 28841500 + }, + { + "epoch": 83.49, + "learning_rate": 8.272104541033717e-06, + "loss": 1.8566, + "step": 28842000 + }, + { + "epoch": 83.49, + "learning_rate": 8.27138089338644e-06, + "loss": 1.8223, + "step": 28842500 + }, + { + "epoch": 83.49, + "learning_rate": 8.270657245739163e-06, + "loss": 1.8353, + "step": 28843000 + }, + { + "epoch": 83.49, + "learning_rate": 8.26993504538718e-06, + "loss": 1.8264, + "step": 28843500 + }, + { + "epoch": 83.49, + "learning_rate": 8.269211397739905e-06, + "loss": 1.8095, + "step": 28844000 + }, + { + "epoch": 83.49, + "learning_rate": 8.268487750092627e-06, + "loss": 1.8084, + "step": 28844500 + }, + { + "epoch": 83.49, + "learning_rate": 8.267765549740646e-06, + "loss": 1.8199, + "step": 28845000 + }, + { + "epoch": 83.5, + "learning_rate": 8.267041902093368e-06, + "loss": 1.8022, + "step": 28845500 + }, + { + "epoch": 83.5, + "learning_rate": 8.266319701741385e-06, + "loss": 1.8397, + "step": 28846000 + }, + { + "epoch": 83.5, + "learning_rate": 8.26559605409411e-06, + "loss": 1.8192, + "step": 28846500 + }, + { + "epoch": 83.5, + "learning_rate": 8.264872406446833e-06, + "loss": 1.8018, + "step": 28847000 + }, + { + "epoch": 83.5, + "learning_rate": 8.264148758799555e-06, + "loss": 1.8254, + "step": 28847500 + }, + { + "epoch": 83.5, + "learning_rate": 8.26342511115228e-06, + "loss": 1.8417, + "step": 28848000 + }, + { + "epoch": 83.5, + "learning_rate": 8.262701463505003e-06, + "loss": 1.8113, + "step": 28848500 + }, + { + "epoch": 83.51, + "learning_rate": 8.26197926315302e-06, + "loss": 1.8183, + "step": 28849000 + }, + { + "epoch": 83.51, + "learning_rate": 8.261255615505743e-06, + "loss": 1.8276, + "step": 28849500 + }, + { + "epoch": 83.51, + "learning_rate": 8.260531967858467e-06, + "loss": 1.8191, + "step": 28850000 + }, + { + "epoch": 83.51, + "learning_rate": 8.25980832021119e-06, + "loss": 1.8255, + "step": 28850500 + }, + { + "epoch": 83.51, + "learning_rate": 8.259086119859208e-06, + "loss": 1.8124, + "step": 28851000 + }, + { + "epoch": 83.51, + "learning_rate": 8.25836247221193e-06, + "loss": 1.8569, + "step": 28851500 + }, + { + "epoch": 83.51, + "learning_rate": 8.257638824564654e-06, + "loss": 1.8359, + "step": 28852000 + }, + { + "epoch": 83.52, + "learning_rate": 8.256915176917378e-06, + "loss": 1.8226, + "step": 28852500 + }, + { + "epoch": 83.52, + "learning_rate": 8.2561915292701e-06, + "loss": 1.8458, + "step": 28853000 + }, + { + "epoch": 83.52, + "learning_rate": 8.255467881622824e-06, + "loss": 1.8152, + "step": 28853500 + }, + { + "epoch": 83.52, + "learning_rate": 8.254744233975546e-06, + "loss": 1.8116, + "step": 28854000 + }, + { + "epoch": 83.52, + "learning_rate": 8.25402058632827e-06, + "loss": 1.8134, + "step": 28854500 + }, + { + "epoch": 83.52, + "learning_rate": 8.253296938680994e-06, + "loss": 1.8233, + "step": 28855000 + }, + { + "epoch": 83.52, + "learning_rate": 8.252573291033716e-06, + "loss": 1.8454, + "step": 28855500 + }, + { + "epoch": 83.53, + "learning_rate": 8.25184964338644e-06, + "loss": 1.8223, + "step": 28856000 + }, + { + "epoch": 83.53, + "learning_rate": 8.251125995739162e-06, + "loss": 1.8149, + "step": 28856500 + }, + { + "epoch": 83.53, + "learning_rate": 8.250402348091886e-06, + "loss": 1.8222, + "step": 28857000 + }, + { + "epoch": 83.53, + "learning_rate": 8.249678700444609e-06, + "loss": 1.8363, + "step": 28857500 + }, + { + "epoch": 83.53, + "learning_rate": 8.248955052797333e-06, + "loss": 1.8177, + "step": 28858000 + }, + { + "epoch": 83.53, + "learning_rate": 8.248231405150057e-06, + "loss": 1.8299, + "step": 28858500 + }, + { + "epoch": 83.53, + "learning_rate": 8.247507757502779e-06, + "loss": 1.8311, + "step": 28859000 + }, + { + "epoch": 83.54, + "learning_rate": 8.246784109855503e-06, + "loss": 1.8036, + "step": 28859500 + }, + { + "epoch": 83.54, + "learning_rate": 8.24606190950352e-06, + "loss": 1.8385, + "step": 28860000 + }, + { + "epoch": 83.54, + "learning_rate": 8.245338261856244e-06, + "loss": 1.8164, + "step": 28860500 + }, + { + "epoch": 83.54, + "learning_rate": 8.244614614208966e-06, + "loss": 1.8106, + "step": 28861000 + }, + { + "epoch": 83.54, + "learning_rate": 8.24389096656169e-06, + "loss": 1.833, + "step": 28861500 + }, + { + "epoch": 83.54, + "learning_rate": 8.243167318914414e-06, + "loss": 1.8298, + "step": 28862000 + }, + { + "epoch": 83.55, + "learning_rate": 8.242443671267136e-06, + "loss": 1.8026, + "step": 28862500 + }, + { + "epoch": 83.55, + "learning_rate": 8.241721470915153e-06, + "loss": 1.8131, + "step": 28863000 + }, + { + "epoch": 83.55, + "learning_rate": 8.240997823267877e-06, + "loss": 1.8207, + "step": 28863500 + }, + { + "epoch": 83.55, + "learning_rate": 8.240274175620601e-06, + "loss": 1.8436, + "step": 28864000 + }, + { + "epoch": 83.55, + "learning_rate": 8.239550527973324e-06, + "loss": 1.8199, + "step": 28864500 + }, + { + "epoch": 83.55, + "learning_rate": 8.238826880326047e-06, + "loss": 1.83, + "step": 28865000 + }, + { + "epoch": 83.55, + "learning_rate": 8.238104679974065e-06, + "loss": 1.8337, + "step": 28865500 + }, + { + "epoch": 83.56, + "learning_rate": 8.237381032326789e-06, + "loss": 1.8138, + "step": 28866000 + }, + { + "epoch": 83.56, + "learning_rate": 8.236658831974806e-06, + "loss": 1.8212, + "step": 28866500 + }, + { + "epoch": 83.56, + "learning_rate": 8.235935184327528e-06, + "loss": 1.8386, + "step": 28867000 + }, + { + "epoch": 83.56, + "learning_rate": 8.235211536680252e-06, + "loss": 1.8291, + "step": 28867500 + }, + { + "epoch": 83.56, + "learning_rate": 8.234487889032976e-06, + "loss": 1.8099, + "step": 28868000 + }, + { + "epoch": 83.56, + "learning_rate": 8.233764241385698e-06, + "loss": 1.8138, + "step": 28868500 + }, + { + "epoch": 83.56, + "learning_rate": 8.233040593738422e-06, + "loss": 1.835, + "step": 28869000 + }, + { + "epoch": 83.57, + "learning_rate": 8.232316946091146e-06, + "loss": 1.8366, + "step": 28869500 + }, + { + "epoch": 83.57, + "learning_rate": 8.231594745739163e-06, + "loss": 1.8045, + "step": 28870000 + }, + { + "epoch": 83.57, + "learning_rate": 8.230871098091886e-06, + "loss": 1.8406, + "step": 28870500 + }, + { + "epoch": 83.57, + "learning_rate": 8.23014745044461e-06, + "loss": 1.8256, + "step": 28871000 + }, + { + "epoch": 83.57, + "learning_rate": 8.229423802797333e-06, + "loss": 1.8057, + "step": 28871500 + }, + { + "epoch": 83.57, + "learning_rate": 8.228700155150056e-06, + "loss": 1.8277, + "step": 28872000 + }, + { + "epoch": 83.57, + "learning_rate": 8.22797650750278e-06, + "loss": 1.8133, + "step": 28872500 + }, + { + "epoch": 83.58, + "learning_rate": 8.227252859855503e-06, + "loss": 1.8114, + "step": 28873000 + }, + { + "epoch": 83.58, + "learning_rate": 8.226529212208226e-06, + "loss": 1.8029, + "step": 28873500 + }, + { + "epoch": 83.58, + "learning_rate": 8.225805564560948e-06, + "loss": 1.8352, + "step": 28874000 + }, + { + "epoch": 83.58, + "learning_rate": 8.225083364208967e-06, + "loss": 1.8171, + "step": 28874500 + }, + { + "epoch": 83.58, + "learning_rate": 8.22435971656169e-06, + "loss": 1.8478, + "step": 28875000 + }, + { + "epoch": 83.58, + "learning_rate": 8.223637516209708e-06, + "loss": 1.8568, + "step": 28875500 + }, + { + "epoch": 83.58, + "learning_rate": 8.22291386856243e-06, + "loss": 1.7938, + "step": 28876000 + }, + { + "epoch": 83.59, + "learning_rate": 8.222190220915154e-06, + "loss": 1.8068, + "step": 28876500 + }, + { + "epoch": 83.59, + "learning_rate": 8.221466573267878e-06, + "loss": 1.8431, + "step": 28877000 + }, + { + "epoch": 83.59, + "learning_rate": 8.2207429256206e-06, + "loss": 1.8298, + "step": 28877500 + }, + { + "epoch": 83.59, + "learning_rate": 8.220019277973323e-06, + "loss": 1.8458, + "step": 28878000 + }, + { + "epoch": 83.59, + "learning_rate": 8.219295630326047e-06, + "loss": 1.842, + "step": 28878500 + }, + { + "epoch": 83.59, + "learning_rate": 8.21857198267877e-06, + "loss": 1.8392, + "step": 28879000 + }, + { + "epoch": 83.59, + "learning_rate": 8.217848335031493e-06, + "loss": 1.8292, + "step": 28879500 + }, + { + "epoch": 83.6, + "learning_rate": 8.217126134679512e-06, + "loss": 1.8356, + "step": 28880000 + }, + { + "epoch": 83.6, + "learning_rate": 8.216402487032236e-06, + "loss": 1.8057, + "step": 28880500 + }, + { + "epoch": 83.6, + "learning_rate": 8.215678839384958e-06, + "loss": 1.8142, + "step": 28881000 + }, + { + "epoch": 83.6, + "learning_rate": 8.21495519173768e-06, + "loss": 1.8361, + "step": 28881500 + }, + { + "epoch": 83.6, + "learning_rate": 8.214231544090404e-06, + "loss": 1.8351, + "step": 28882000 + }, + { + "epoch": 83.6, + "learning_rate": 8.213507896443128e-06, + "loss": 1.8314, + "step": 28882500 + }, + { + "epoch": 83.6, + "learning_rate": 8.21278424879585e-06, + "loss": 1.8235, + "step": 28883000 + }, + { + "epoch": 83.61, + "learning_rate": 8.212062048443867e-06, + "loss": 1.8124, + "step": 28883500 + }, + { + "epoch": 83.61, + "learning_rate": 8.211338400796591e-06, + "loss": 1.8158, + "step": 28884000 + }, + { + "epoch": 83.61, + "learning_rate": 8.210614753149315e-06, + "loss": 1.8043, + "step": 28884500 + }, + { + "epoch": 83.61, + "learning_rate": 8.209891105502037e-06, + "loss": 1.8534, + "step": 28885000 + }, + { + "epoch": 83.61, + "learning_rate": 8.209167457854761e-06, + "loss": 1.8139, + "step": 28885500 + }, + { + "epoch": 83.61, + "learning_rate": 8.20844525750278e-06, + "loss": 1.8235, + "step": 28886000 + }, + { + "epoch": 83.61, + "learning_rate": 8.207721609855503e-06, + "loss": 1.8196, + "step": 28886500 + }, + { + "epoch": 83.62, + "learning_rate": 8.206997962208225e-06, + "loss": 1.8198, + "step": 28887000 + }, + { + "epoch": 83.62, + "learning_rate": 8.206274314560949e-06, + "loss": 1.8348, + "step": 28887500 + }, + { + "epoch": 83.62, + "learning_rate": 8.205550666913673e-06, + "loss": 1.8204, + "step": 28888000 + }, + { + "epoch": 83.62, + "learning_rate": 8.204827019266395e-06, + "loss": 1.8461, + "step": 28888500 + }, + { + "epoch": 83.62, + "learning_rate": 8.204103371619117e-06, + "loss": 1.8193, + "step": 28889000 + }, + { + "epoch": 83.62, + "learning_rate": 8.203379723971843e-06, + "loss": 1.8527, + "step": 28889500 + }, + { + "epoch": 83.62, + "learning_rate": 8.20265752361986e-06, + "loss": 1.8107, + "step": 28890000 + }, + { + "epoch": 83.63, + "learning_rate": 8.201933875972582e-06, + "loss": 1.8462, + "step": 28890500 + }, + { + "epoch": 83.63, + "learning_rate": 8.201210228325306e-06, + "loss": 1.8215, + "step": 28891000 + }, + { + "epoch": 83.63, + "learning_rate": 8.20048658067803e-06, + "loss": 1.8338, + "step": 28891500 + }, + { + "epoch": 83.63, + "learning_rate": 8.199764380326047e-06, + "loss": 1.8145, + "step": 28892000 + }, + { + "epoch": 83.63, + "learning_rate": 8.19904073267877e-06, + "loss": 1.8226, + "step": 28892500 + }, + { + "epoch": 83.63, + "learning_rate": 8.198317085031493e-06, + "loss": 1.838, + "step": 28893000 + }, + { + "epoch": 83.63, + "learning_rate": 8.197593437384217e-06, + "loss": 1.8317, + "step": 28893500 + }, + { + "epoch": 83.64, + "learning_rate": 8.19686978973694e-06, + "loss": 1.8192, + "step": 28894000 + }, + { + "epoch": 83.64, + "learning_rate": 8.196146142089662e-06, + "loss": 1.8143, + "step": 28894500 + }, + { + "epoch": 83.64, + "learning_rate": 8.19542394173768e-06, + "loss": 1.8195, + "step": 28895000 + }, + { + "epoch": 83.64, + "learning_rate": 8.1947017413857e-06, + "loss": 1.8432, + "step": 28895500 + }, + { + "epoch": 83.64, + "learning_rate": 8.193978093738422e-06, + "loss": 1.8414, + "step": 28896000 + }, + { + "epoch": 83.64, + "learning_rate": 8.193254446091144e-06, + "loss": 1.8518, + "step": 28896500 + }, + { + "epoch": 83.64, + "learning_rate": 8.192530798443868e-06, + "loss": 1.8295, + "step": 28897000 + }, + { + "epoch": 83.65, + "learning_rate": 8.191807150796592e-06, + "loss": 1.8313, + "step": 28897500 + }, + { + "epoch": 83.65, + "learning_rate": 8.19108495044461e-06, + "loss": 1.8337, + "step": 28898000 + }, + { + "epoch": 83.65, + "learning_rate": 8.190361302797332e-06, + "loss": 1.8242, + "step": 28898500 + }, + { + "epoch": 83.65, + "learning_rate": 8.189637655150057e-06, + "loss": 1.819, + "step": 28899000 + }, + { + "epoch": 83.65, + "learning_rate": 8.18891400750278e-06, + "loss": 1.8323, + "step": 28899500 + }, + { + "epoch": 83.65, + "learning_rate": 8.188190359855502e-06, + "loss": 1.8409, + "step": 28900000 + }, + { + "epoch": 83.66, + "learning_rate": 8.187466712208226e-06, + "loss": 1.8391, + "step": 28900500 + }, + { + "epoch": 83.66, + "learning_rate": 8.18674306456095e-06, + "loss": 1.8579, + "step": 28901000 + }, + { + "epoch": 83.66, + "learning_rate": 8.186019416913672e-06, + "loss": 1.8324, + "step": 28901500 + }, + { + "epoch": 83.66, + "learning_rate": 8.185295769266394e-06, + "loss": 1.8136, + "step": 28902000 + }, + { + "epoch": 83.66, + "learning_rate": 8.184573568914413e-06, + "loss": 1.8346, + "step": 28902500 + }, + { + "epoch": 83.66, + "learning_rate": 8.183849921267137e-06, + "loss": 1.7921, + "step": 28903000 + }, + { + "epoch": 83.66, + "learning_rate": 8.183126273619859e-06, + "loss": 1.8081, + "step": 28903500 + }, + { + "epoch": 83.67, + "learning_rate": 8.182402625972583e-06, + "loss": 1.8258, + "step": 28904000 + }, + { + "epoch": 83.67, + "learning_rate": 8.181678978325307e-06, + "loss": 1.8249, + "step": 28904500 + }, + { + "epoch": 83.67, + "learning_rate": 8.18095533067803e-06, + "loss": 1.8294, + "step": 28905000 + }, + { + "epoch": 83.67, + "learning_rate": 8.180233130326046e-06, + "loss": 1.816, + "step": 28905500 + }, + { + "epoch": 83.67, + "learning_rate": 8.17950948267877e-06, + "loss": 1.8213, + "step": 28906000 + }, + { + "epoch": 83.67, + "learning_rate": 8.178785835031494e-06, + "loss": 1.8545, + "step": 28906500 + }, + { + "epoch": 83.67, + "learning_rate": 8.178062187384217e-06, + "loss": 1.8137, + "step": 28907000 + }, + { + "epoch": 83.68, + "learning_rate": 8.177338539736939e-06, + "loss": 1.8322, + "step": 28907500 + }, + { + "epoch": 83.68, + "learning_rate": 8.176614892089664e-06, + "loss": 1.8167, + "step": 28908000 + }, + { + "epoch": 83.68, + "learning_rate": 8.175892691737682e-06, + "loss": 1.8411, + "step": 28908500 + }, + { + "epoch": 83.68, + "learning_rate": 8.175169044090404e-06, + "loss": 1.8048, + "step": 28909000 + }, + { + "epoch": 83.68, + "learning_rate": 8.174445396443128e-06, + "loss": 1.8285, + "step": 28909500 + }, + { + "epoch": 83.68, + "learning_rate": 8.173721748795852e-06, + "loss": 1.8518, + "step": 28910000 + }, + { + "epoch": 83.68, + "learning_rate": 8.172999548443869e-06, + "loss": 1.8111, + "step": 28910500 + }, + { + "epoch": 83.69, + "learning_rate": 8.172275900796591e-06, + "loss": 1.8222, + "step": 28911000 + }, + { + "epoch": 83.69, + "learning_rate": 8.171552253149315e-06, + "loss": 1.8391, + "step": 28911500 + }, + { + "epoch": 83.69, + "learning_rate": 8.170830052797334e-06, + "loss": 1.8162, + "step": 28912000 + }, + { + "epoch": 83.69, + "learning_rate": 8.170106405150056e-06, + "loss": 1.8264, + "step": 28912500 + }, + { + "epoch": 83.69, + "learning_rate": 8.169382757502779e-06, + "loss": 1.7986, + "step": 28913000 + }, + { + "epoch": 83.69, + "learning_rate": 8.168659109855502e-06, + "loss": 1.8441, + "step": 28913500 + }, + { + "epoch": 83.69, + "learning_rate": 8.167935462208226e-06, + "loss": 1.8024, + "step": 28914000 + }, + { + "epoch": 83.7, + "learning_rate": 8.167211814560949e-06, + "loss": 1.8381, + "step": 28914500 + }, + { + "epoch": 83.7, + "learning_rate": 8.166489614208966e-06, + "loss": 1.8331, + "step": 28915000 + }, + { + "epoch": 83.7, + "learning_rate": 8.16576596656169e-06, + "loss": 1.8446, + "step": 28915500 + }, + { + "epoch": 83.7, + "learning_rate": 8.165042318914414e-06, + "loss": 1.8528, + "step": 28916000 + }, + { + "epoch": 83.7, + "learning_rate": 8.164318671267136e-06, + "loss": 1.8181, + "step": 28916500 + }, + { + "epoch": 83.7, + "learning_rate": 8.16359502361986e-06, + "loss": 1.8185, + "step": 28917000 + }, + { + "epoch": 83.7, + "learning_rate": 8.162871375972584e-06, + "loss": 1.8254, + "step": 28917500 + }, + { + "epoch": 83.71, + "learning_rate": 8.162147728325306e-06, + "loss": 1.8412, + "step": 28918000 + }, + { + "epoch": 83.71, + "learning_rate": 8.161425527973323e-06, + "loss": 1.8276, + "step": 28918500 + }, + { + "epoch": 83.71, + "learning_rate": 8.16070332762134e-06, + "loss": 1.8184, + "step": 28919000 + }, + { + "epoch": 83.71, + "learning_rate": 8.159979679974066e-06, + "loss": 1.8396, + "step": 28919500 + }, + { + "epoch": 83.71, + "learning_rate": 8.159256032326788e-06, + "loss": 1.7902, + "step": 28920000 + }, + { + "epoch": 83.71, + "learning_rate": 8.15853238467951e-06, + "loss": 1.8336, + "step": 28920500 + }, + { + "epoch": 83.71, + "learning_rate": 8.157808737032235e-06, + "loss": 1.8236, + "step": 28921000 + }, + { + "epoch": 83.72, + "learning_rate": 8.157085089384958e-06, + "loss": 1.842, + "step": 28921500 + }, + { + "epoch": 83.72, + "learning_rate": 8.15636144173768e-06, + "loss": 1.8364, + "step": 28922000 + }, + { + "epoch": 83.72, + "learning_rate": 8.155637794090405e-06, + "loss": 1.8129, + "step": 28922500 + }, + { + "epoch": 83.72, + "learning_rate": 8.154914146443129e-06, + "loss": 1.8321, + "step": 28923000 + }, + { + "epoch": 83.72, + "learning_rate": 8.154191946091146e-06, + "loss": 1.8279, + "step": 28923500 + }, + { + "epoch": 83.72, + "learning_rate": 8.153468298443868e-06, + "loss": 1.8326, + "step": 28924000 + }, + { + "epoch": 83.72, + "learning_rate": 8.152744650796592e-06, + "loss": 1.828, + "step": 28924500 + }, + { + "epoch": 83.73, + "learning_rate": 8.152021003149316e-06, + "loss": 1.8348, + "step": 28925000 + }, + { + "epoch": 83.73, + "learning_rate": 8.151297355502038e-06, + "loss": 1.8429, + "step": 28925500 + }, + { + "epoch": 83.73, + "learning_rate": 8.15057370785476e-06, + "loss": 1.8037, + "step": 28926000 + }, + { + "epoch": 83.73, + "learning_rate": 8.149850060207484e-06, + "loss": 1.8138, + "step": 28926500 + }, + { + "epoch": 83.73, + "learning_rate": 8.149127859855503e-06, + "loss": 1.8102, + "step": 28927000 + }, + { + "epoch": 83.73, + "learning_rate": 8.148404212208225e-06, + "loss": 1.8209, + "step": 28927500 + }, + { + "epoch": 83.73, + "learning_rate": 8.14768056456095e-06, + "loss": 1.8388, + "step": 28928000 + }, + { + "epoch": 83.74, + "learning_rate": 8.146956916913673e-06, + "loss": 1.8326, + "step": 28928500 + }, + { + "epoch": 83.74, + "learning_rate": 8.146233269266396e-06, + "loss": 1.8183, + "step": 28929000 + }, + { + "epoch": 83.74, + "learning_rate": 8.145509621619118e-06, + "loss": 1.8171, + "step": 28929500 + }, + { + "epoch": 83.74, + "learning_rate": 8.144785973971842e-06, + "loss": 1.8164, + "step": 28930000 + }, + { + "epoch": 83.74, + "learning_rate": 8.144062326324566e-06, + "loss": 1.8176, + "step": 28930500 + }, + { + "epoch": 83.74, + "learning_rate": 8.143341573267878e-06, + "loss": 1.8211, + "step": 28931000 + }, + { + "epoch": 83.74, + "learning_rate": 8.1426179256206e-06, + "loss": 1.8181, + "step": 28931500 + }, + { + "epoch": 83.75, + "learning_rate": 8.141894277973324e-06, + "loss": 1.8098, + "step": 28932000 + }, + { + "epoch": 83.75, + "learning_rate": 8.141170630326048e-06, + "loss": 1.8437, + "step": 28932500 + }, + { + "epoch": 83.75, + "learning_rate": 8.14044698267877e-06, + "loss": 1.8254, + "step": 28933000 + }, + { + "epoch": 83.75, + "learning_rate": 8.139723335031492e-06, + "loss": 1.8154, + "step": 28933500 + }, + { + "epoch": 83.75, + "learning_rate": 8.138999687384216e-06, + "loss": 1.8376, + "step": 28934000 + }, + { + "epoch": 83.75, + "learning_rate": 8.13827603973694e-06, + "loss": 1.8048, + "step": 28934500 + }, + { + "epoch": 83.75, + "learning_rate": 8.137552392089663e-06, + "loss": 1.8286, + "step": 28935000 + }, + { + "epoch": 83.76, + "learning_rate": 8.136828744442387e-06, + "loss": 1.8495, + "step": 28935500 + }, + { + "epoch": 83.76, + "learning_rate": 8.13610509679511e-06, + "loss": 1.8313, + "step": 28936000 + }, + { + "epoch": 83.76, + "learning_rate": 8.135381449147833e-06, + "loss": 1.8011, + "step": 28936500 + }, + { + "epoch": 83.76, + "learning_rate": 8.134660696091145e-06, + "loss": 1.8255, + "step": 28937000 + }, + { + "epoch": 83.76, + "learning_rate": 8.133937048443869e-06, + "loss": 1.8459, + "step": 28937500 + }, + { + "epoch": 83.76, + "learning_rate": 8.133213400796593e-06, + "loss": 1.8092, + "step": 28938000 + }, + { + "epoch": 83.77, + "learning_rate": 8.132489753149315e-06, + "loss": 1.8357, + "step": 28938500 + }, + { + "epoch": 83.77, + "learning_rate": 8.131766105502037e-06, + "loss": 1.838, + "step": 28939000 + }, + { + "epoch": 83.77, + "learning_rate": 8.131043905150056e-06, + "loss": 1.8221, + "step": 28939500 + }, + { + "epoch": 83.77, + "learning_rate": 8.13032025750278e-06, + "loss": 1.8382, + "step": 28940000 + }, + { + "epoch": 83.77, + "learning_rate": 8.129596609855502e-06, + "loss": 1.8248, + "step": 28940500 + }, + { + "epoch": 83.77, + "learning_rate": 8.128872962208226e-06, + "loss": 1.8379, + "step": 28941000 + }, + { + "epoch": 83.77, + "learning_rate": 8.128149314560949e-06, + "loss": 1.7974, + "step": 28941500 + }, + { + "epoch": 83.78, + "learning_rate": 8.12742856150426e-06, + "loss": 1.8642, + "step": 28942000 + }, + { + "epoch": 83.78, + "learning_rate": 8.126704913856985e-06, + "loss": 1.8268, + "step": 28942500 + }, + { + "epoch": 83.78, + "learning_rate": 8.125981266209707e-06, + "loss": 1.8203, + "step": 28943000 + }, + { + "epoch": 83.78, + "learning_rate": 8.125257618562431e-06, + "loss": 1.8108, + "step": 28943500 + }, + { + "epoch": 83.78, + "learning_rate": 8.124533970915155e-06, + "loss": 1.8111, + "step": 28944000 + }, + { + "epoch": 83.78, + "learning_rate": 8.123810323267877e-06, + "loss": 1.8575, + "step": 28944500 + }, + { + "epoch": 83.78, + "learning_rate": 8.123088122915894e-06, + "loss": 1.8341, + "step": 28945000 + }, + { + "epoch": 83.79, + "learning_rate": 8.122364475268618e-06, + "loss": 1.8046, + "step": 28945500 + }, + { + "epoch": 83.79, + "learning_rate": 8.121640827621342e-06, + "loss": 1.8225, + "step": 28946000 + }, + { + "epoch": 83.79, + "learning_rate": 8.120917179974064e-06, + "loss": 1.8425, + "step": 28946500 + }, + { + "epoch": 83.79, + "learning_rate": 8.120193532326788e-06, + "loss": 1.8105, + "step": 28947000 + }, + { + "epoch": 83.79, + "learning_rate": 8.119469884679512e-06, + "loss": 1.8428, + "step": 28947500 + }, + { + "epoch": 83.79, + "learning_rate": 8.118746237032234e-06, + "loss": 1.8356, + "step": 28948000 + }, + { + "epoch": 83.79, + "learning_rate": 8.118022589384958e-06, + "loss": 1.8165, + "step": 28948500 + }, + { + "epoch": 83.8, + "learning_rate": 8.117300389032976e-06, + "loss": 1.8218, + "step": 28949000 + }, + { + "epoch": 83.8, + "learning_rate": 8.116578188680993e-06, + "loss": 1.8257, + "step": 28949500 + }, + { + "epoch": 83.8, + "learning_rate": 8.115854541033717e-06, + "loss": 1.8004, + "step": 28950000 + }, + { + "epoch": 83.8, + "learning_rate": 8.115130893386439e-06, + "loss": 1.8309, + "step": 28950500 + }, + { + "epoch": 83.8, + "learning_rate": 8.114408693034458e-06, + "loss": 1.8349, + "step": 28951000 + }, + { + "epoch": 83.8, + "learning_rate": 8.11368504538718e-06, + "loss": 1.8377, + "step": 28951500 + }, + { + "epoch": 83.8, + "learning_rate": 8.112961397739904e-06, + "loss": 1.8366, + "step": 28952000 + }, + { + "epoch": 83.81, + "learning_rate": 8.112237750092626e-06, + "loss": 1.8294, + "step": 28952500 + }, + { + "epoch": 83.81, + "learning_rate": 8.11151410244535e-06, + "loss": 1.824, + "step": 28953000 + }, + { + "epoch": 83.81, + "learning_rate": 8.110790454798074e-06, + "loss": 1.8451, + "step": 28953500 + }, + { + "epoch": 83.81, + "learning_rate": 8.110066807150796e-06, + "loss": 1.82, + "step": 28954000 + }, + { + "epoch": 83.81, + "learning_rate": 8.10934315950352e-06, + "loss": 1.799, + "step": 28954500 + }, + { + "epoch": 83.81, + "learning_rate": 8.108619511856244e-06, + "loss": 1.8162, + "step": 28955000 + }, + { + "epoch": 83.81, + "learning_rate": 8.107895864208967e-06, + "loss": 1.8465, + "step": 28955500 + }, + { + "epoch": 83.82, + "learning_rate": 8.10717221656169e-06, + "loss": 1.8423, + "step": 28956000 + }, + { + "epoch": 83.82, + "learning_rate": 8.106448568914413e-06, + "loss": 1.8332, + "step": 28956500 + }, + { + "epoch": 83.82, + "learning_rate": 8.105726368562432e-06, + "loss": 1.8327, + "step": 28957000 + }, + { + "epoch": 83.82, + "learning_rate": 8.105002720915154e-06, + "loss": 1.8391, + "step": 28957500 + }, + { + "epoch": 83.82, + "learning_rate": 8.104279073267878e-06, + "loss": 1.8462, + "step": 28958000 + }, + { + "epoch": 83.82, + "learning_rate": 8.1035554256206e-06, + "loss": 1.8234, + "step": 28958500 + }, + { + "epoch": 83.82, + "learning_rate": 8.102833225268619e-06, + "loss": 1.8208, + "step": 28959000 + }, + { + "epoch": 83.83, + "learning_rate": 8.102109577621341e-06, + "loss": 1.8383, + "step": 28959500 + }, + { + "epoch": 83.83, + "learning_rate": 8.10138737726936e-06, + "loss": 1.842, + "step": 28960000 + }, + { + "epoch": 83.83, + "learning_rate": 8.100663729622082e-06, + "loss": 1.8432, + "step": 28960500 + }, + { + "epoch": 83.83, + "learning_rate": 8.099940081974806e-06, + "loss": 1.8374, + "step": 28961000 + }, + { + "epoch": 83.83, + "learning_rate": 8.099216434327529e-06, + "loss": 1.8324, + "step": 28961500 + }, + { + "epoch": 83.83, + "learning_rate": 8.098492786680253e-06, + "loss": 1.8186, + "step": 28962000 + }, + { + "epoch": 83.83, + "learning_rate": 8.097769139032975e-06, + "loss": 1.8469, + "step": 28962500 + }, + { + "epoch": 83.84, + "learning_rate": 8.097045491385699e-06, + "loss": 1.8448, + "step": 28963000 + }, + { + "epoch": 83.84, + "learning_rate": 8.096321843738423e-06, + "loss": 1.8092, + "step": 28963500 + }, + { + "epoch": 83.84, + "learning_rate": 8.095598196091145e-06, + "loss": 1.8241, + "step": 28964000 + }, + { + "epoch": 83.84, + "learning_rate": 8.094874548443869e-06, + "loss": 1.8218, + "step": 28964500 + }, + { + "epoch": 83.84, + "learning_rate": 8.094150900796591e-06, + "loss": 1.8467, + "step": 28965000 + }, + { + "epoch": 83.84, + "learning_rate": 8.093427253149315e-06, + "loss": 1.8508, + "step": 28965500 + }, + { + "epoch": 83.84, + "learning_rate": 8.092705052797332e-06, + "loss": 1.8471, + "step": 28966000 + }, + { + "epoch": 83.85, + "learning_rate": 8.091981405150056e-06, + "loss": 1.8202, + "step": 28966500 + }, + { + "epoch": 83.85, + "learning_rate": 8.09125775750278e-06, + "loss": 1.85, + "step": 28967000 + }, + { + "epoch": 83.85, + "learning_rate": 8.090534109855502e-06, + "loss": 1.8243, + "step": 28967500 + }, + { + "epoch": 83.85, + "learning_rate": 8.089810462208226e-06, + "loss": 1.826, + "step": 28968000 + }, + { + "epoch": 83.85, + "learning_rate": 8.089086814560948e-06, + "loss": 1.8422, + "step": 28968500 + }, + { + "epoch": 83.85, + "learning_rate": 8.088363166913672e-06, + "loss": 1.8255, + "step": 28969000 + }, + { + "epoch": 83.85, + "learning_rate": 8.087639519266395e-06, + "loss": 1.8569, + "step": 28969500 + }, + { + "epoch": 83.86, + "learning_rate": 8.086917318914414e-06, + "loss": 1.8037, + "step": 28970000 + }, + { + "epoch": 83.86, + "learning_rate": 8.08619511856243e-06, + "loss": 1.8589, + "step": 28970500 + }, + { + "epoch": 83.86, + "learning_rate": 8.085471470915155e-06, + "loss": 1.8252, + "step": 28971000 + }, + { + "epoch": 83.86, + "learning_rate": 8.084747823267877e-06, + "loss": 1.8265, + "step": 28971500 + }, + { + "epoch": 83.86, + "learning_rate": 8.084024175620601e-06, + "loss": 1.8207, + "step": 28972000 + }, + { + "epoch": 83.86, + "learning_rate": 8.083300527973325e-06, + "loss": 1.8148, + "step": 28972500 + }, + { + "epoch": 83.86, + "learning_rate": 8.082578327621342e-06, + "loss": 1.8224, + "step": 28973000 + }, + { + "epoch": 83.87, + "learning_rate": 8.081854679974064e-06, + "loss": 1.8389, + "step": 28973500 + }, + { + "epoch": 83.87, + "learning_rate": 8.081131032326788e-06, + "loss": 1.8339, + "step": 28974000 + }, + { + "epoch": 83.87, + "learning_rate": 8.080407384679512e-06, + "loss": 1.8205, + "step": 28974500 + }, + { + "epoch": 83.87, + "learning_rate": 8.07968518432753e-06, + "loss": 1.8115, + "step": 28975000 + }, + { + "epoch": 83.87, + "learning_rate": 8.078961536680252e-06, + "loss": 1.8407, + "step": 28975500 + }, + { + "epoch": 83.87, + "learning_rate": 8.078237889032976e-06, + "loss": 1.8006, + "step": 28976000 + }, + { + "epoch": 83.88, + "learning_rate": 8.077515688680993e-06, + "loss": 1.8429, + "step": 28976500 + }, + { + "epoch": 83.88, + "learning_rate": 8.076792041033717e-06, + "loss": 1.8381, + "step": 28977000 + }, + { + "epoch": 83.88, + "learning_rate": 8.076068393386439e-06, + "loss": 1.8108, + "step": 28977500 + }, + { + "epoch": 83.88, + "learning_rate": 8.075344745739163e-06, + "loss": 1.8248, + "step": 28978000 + }, + { + "epoch": 83.88, + "learning_rate": 8.074621098091887e-06, + "loss": 1.8218, + "step": 28978500 + }, + { + "epoch": 83.88, + "learning_rate": 8.073897450444609e-06, + "loss": 1.8189, + "step": 28979000 + }, + { + "epoch": 83.88, + "learning_rate": 8.073173802797333e-06, + "loss": 1.8232, + "step": 28979500 + }, + { + "epoch": 83.89, + "learning_rate": 8.072450155150057e-06, + "loss": 1.8231, + "step": 28980000 + }, + { + "epoch": 83.89, + "learning_rate": 8.071726507502779e-06, + "loss": 1.8317, + "step": 28980500 + }, + { + "epoch": 83.89, + "learning_rate": 8.071002859855501e-06, + "loss": 1.8227, + "step": 28981000 + }, + { + "epoch": 83.89, + "learning_rate": 8.07028065950352e-06, + "loss": 1.8214, + "step": 28981500 + }, + { + "epoch": 83.89, + "learning_rate": 8.069557011856244e-06, + "loss": 1.8194, + "step": 28982000 + }, + { + "epoch": 83.89, + "learning_rate": 8.068833364208966e-06, + "loss": 1.8511, + "step": 28982500 + }, + { + "epoch": 83.89, + "learning_rate": 8.068109716561689e-06, + "loss": 1.8182, + "step": 28983000 + }, + { + "epoch": 83.9, + "learning_rate": 8.067386068914413e-06, + "loss": 1.8437, + "step": 28983500 + }, + { + "epoch": 83.9, + "learning_rate": 8.066662421267137e-06, + "loss": 1.8144, + "step": 28984000 + }, + { + "epoch": 83.9, + "learning_rate": 8.065940220915154e-06, + "loss": 1.8406, + "step": 28984500 + }, + { + "epoch": 83.9, + "learning_rate": 8.065216573267878e-06, + "loss": 1.8378, + "step": 28985000 + }, + { + "epoch": 83.9, + "learning_rate": 8.064494372915895e-06, + "loss": 1.8291, + "step": 28985500 + }, + { + "epoch": 83.9, + "learning_rate": 8.063770725268619e-06, + "loss": 1.8337, + "step": 28986000 + }, + { + "epoch": 83.9, + "learning_rate": 8.063047077621341e-06, + "loss": 1.8213, + "step": 28986500 + }, + { + "epoch": 83.91, + "learning_rate": 8.062323429974065e-06, + "loss": 1.8378, + "step": 28987000 + }, + { + "epoch": 83.91, + "learning_rate": 8.061599782326789e-06, + "loss": 1.8213, + "step": 28987500 + }, + { + "epoch": 83.91, + "learning_rate": 8.060876134679511e-06, + "loss": 1.8399, + "step": 28988000 + }, + { + "epoch": 83.91, + "learning_rate": 8.060152487032233e-06, + "loss": 1.8383, + "step": 28988500 + }, + { + "epoch": 83.91, + "learning_rate": 8.059428839384957e-06, + "loss": 1.8351, + "step": 28989000 + }, + { + "epoch": 83.91, + "learning_rate": 8.058705191737681e-06, + "loss": 1.842, + "step": 28989500 + }, + { + "epoch": 83.91, + "learning_rate": 8.057981544090404e-06, + "loss": 1.8346, + "step": 28990000 + }, + { + "epoch": 83.92, + "learning_rate": 8.05725934373842e-06, + "loss": 1.8573, + "step": 28990500 + }, + { + "epoch": 83.92, + "learning_rate": 8.056535696091146e-06, + "loss": 1.8306, + "step": 28991000 + }, + { + "epoch": 83.92, + "learning_rate": 8.055812048443869e-06, + "loss": 1.8347, + "step": 28991500 + }, + { + "epoch": 83.92, + "learning_rate": 8.055088400796591e-06, + "loss": 1.82, + "step": 28992000 + }, + { + "epoch": 83.92, + "learning_rate": 8.054366200444608e-06, + "loss": 1.8472, + "step": 28992500 + }, + { + "epoch": 83.92, + "learning_rate": 8.053642552797334e-06, + "loss": 1.8321, + "step": 28993000 + }, + { + "epoch": 83.92, + "learning_rate": 8.052918905150056e-06, + "loss": 1.8257, + "step": 28993500 + }, + { + "epoch": 83.93, + "learning_rate": 8.052195257502778e-06, + "loss": 1.818, + "step": 28994000 + }, + { + "epoch": 83.93, + "learning_rate": 8.051471609855502e-06, + "loss": 1.8059, + "step": 28994500 + }, + { + "epoch": 83.93, + "learning_rate": 8.050749409503521e-06, + "loss": 1.8469, + "step": 28995000 + }, + { + "epoch": 83.93, + "learning_rate": 8.050025761856243e-06, + "loss": 1.8194, + "step": 28995500 + }, + { + "epoch": 83.93, + "learning_rate": 8.049302114208966e-06, + "loss": 1.8343, + "step": 28996000 + }, + { + "epoch": 83.93, + "learning_rate": 8.048578466561691e-06, + "loss": 1.8011, + "step": 28996500 + }, + { + "epoch": 83.93, + "learning_rate": 8.047854818914413e-06, + "loss": 1.841, + "step": 28997000 + }, + { + "epoch": 83.94, + "learning_rate": 8.047131171267136e-06, + "loss": 1.8182, + "step": 28997500 + }, + { + "epoch": 83.94, + "learning_rate": 8.046408970915153e-06, + "loss": 1.8452, + "step": 28998000 + }, + { + "epoch": 83.94, + "learning_rate": 8.045685323267879e-06, + "loss": 1.852, + "step": 28998500 + }, + { + "epoch": 83.94, + "learning_rate": 8.0449616756206e-06, + "loss": 1.8246, + "step": 28999000 + }, + { + "epoch": 83.94, + "learning_rate": 8.044238027973323e-06, + "loss": 1.8201, + "step": 28999500 + }, + { + "epoch": 83.94, + "learning_rate": 8.043514380326047e-06, + "loss": 1.8356, + "step": 29000000 + }, + { + "epoch": 83.94, + "learning_rate": 8.042790732678771e-06, + "loss": 1.8278, + "step": 29000500 + }, + { + "epoch": 83.95, + "learning_rate": 8.042068532326788e-06, + "loss": 1.8367, + "step": 29001000 + }, + { + "epoch": 83.95, + "learning_rate": 8.04134488467951e-06, + "loss": 1.7993, + "step": 29001500 + }, + { + "epoch": 83.95, + "learning_rate": 8.040621237032234e-06, + "loss": 1.8236, + "step": 29002000 + }, + { + "epoch": 83.95, + "learning_rate": 8.039899036680253e-06, + "loss": 1.7993, + "step": 29002500 + }, + { + "epoch": 83.95, + "learning_rate": 8.039175389032975e-06, + "loss": 1.8634, + "step": 29003000 + }, + { + "epoch": 83.95, + "learning_rate": 8.038451741385698e-06, + "loss": 1.8261, + "step": 29003500 + }, + { + "epoch": 83.95, + "learning_rate": 8.037728093738423e-06, + "loss": 1.832, + "step": 29004000 + }, + { + "epoch": 83.96, + "learning_rate": 8.037004446091146e-06, + "loss": 1.825, + "step": 29004500 + }, + { + "epoch": 83.96, + "learning_rate": 8.036280798443868e-06, + "loss": 1.8507, + "step": 29005000 + }, + { + "epoch": 83.96, + "learning_rate": 8.035557150796592e-06, + "loss": 1.8064, + "step": 29005500 + }, + { + "epoch": 83.96, + "learning_rate": 8.034833503149316e-06, + "loss": 1.826, + "step": 29006000 + }, + { + "epoch": 83.96, + "learning_rate": 8.034109855502038e-06, + "loss": 1.8356, + "step": 29006500 + }, + { + "epoch": 83.96, + "learning_rate": 8.033387655150055e-06, + "loss": 1.8221, + "step": 29007000 + }, + { + "epoch": 83.96, + "learning_rate": 8.032664007502779e-06, + "loss": 1.83, + "step": 29007500 + }, + { + "epoch": 83.97, + "learning_rate": 8.031941807150798e-06, + "loss": 1.8041, + "step": 29008000 + }, + { + "epoch": 83.97, + "learning_rate": 8.03121815950352e-06, + "loss": 1.8383, + "step": 29008500 + }, + { + "epoch": 83.97, + "learning_rate": 8.030494511856242e-06, + "loss": 1.8344, + "step": 29009000 + }, + { + "epoch": 83.97, + "learning_rate": 8.029770864208968e-06, + "loss": 1.8171, + "step": 29009500 + }, + { + "epoch": 83.97, + "learning_rate": 8.02904721656169e-06, + "loss": 1.825, + "step": 29010000 + }, + { + "epoch": 83.97, + "learning_rate": 8.028323568914413e-06, + "loss": 1.8456, + "step": 29010500 + }, + { + "epoch": 83.97, + "learning_rate": 8.027599921267136e-06, + "loss": 1.8305, + "step": 29011000 + }, + { + "epoch": 83.98, + "learning_rate": 8.02687627361986e-06, + "loss": 1.8595, + "step": 29011500 + }, + { + "epoch": 83.98, + "learning_rate": 8.026152625972583e-06, + "loss": 1.851, + "step": 29012000 + }, + { + "epoch": 83.98, + "learning_rate": 8.025428978325305e-06, + "loss": 1.8228, + "step": 29012500 + }, + { + "epoch": 83.98, + "learning_rate": 8.024706777973324e-06, + "loss": 1.8398, + "step": 29013000 + }, + { + "epoch": 83.98, + "learning_rate": 8.023983130326048e-06, + "loss": 1.8326, + "step": 29013500 + }, + { + "epoch": 83.98, + "learning_rate": 8.02325948267877e-06, + "loss": 1.8269, + "step": 29014000 + }, + { + "epoch": 83.99, + "learning_rate": 8.022535835031492e-06, + "loss": 1.8196, + "step": 29014500 + }, + { + "epoch": 83.99, + "learning_rate": 8.021813634679511e-06, + "loss": 1.8159, + "step": 29015000 + }, + { + "epoch": 83.99, + "learning_rate": 8.021089987032235e-06, + "loss": 1.8126, + "step": 29015500 + }, + { + "epoch": 83.99, + "learning_rate": 8.020366339384957e-06, + "loss": 1.8328, + "step": 29016000 + }, + { + "epoch": 83.99, + "learning_rate": 8.019642691737681e-06, + "loss": 1.8244, + "step": 29016500 + }, + { + "epoch": 83.99, + "learning_rate": 8.018919044090405e-06, + "loss": 1.8513, + "step": 29017000 + }, + { + "epoch": 83.99, + "learning_rate": 8.018195396443127e-06, + "loss": 1.8135, + "step": 29017500 + }, + { + "epoch": 84.0, + "learning_rate": 8.01747174879585e-06, + "loss": 1.8204, + "step": 29018000 + }, + { + "epoch": 84.0, + "learning_rate": 8.016749548443869e-06, + "loss": 1.8493, + "step": 29018500 + }, + { + "epoch": 84.0, + "learning_rate": 8.016025900796592e-06, + "loss": 1.8158, + "step": 29019000 + }, + { + "epoch": 84.0, + "learning_rate": 8.01530370044461e-06, + "loss": 1.8117, + "step": 29019500 + }, + { + "epoch": 84.0, + "eval_accuracy": 0.6880829597340532, + "eval_accuracy_mlm": 0.6571719504827696, + "eval_accuracy_nsp": 0.8539916495946249, + "eval_loss": 2.1972768306732178, + "eval_runtime": 331.8951, + "eval_samples_per_second": 1314.831, + "eval_steps_per_second": 54.785, + "step": 29019648 + }, + { + "epoch": 84.0, + "learning_rate": 8.014581500092627e-06, + "loss": 1.833, + "step": 29020000 + }, + { + "epoch": 84.0, + "learning_rate": 8.01385785244535e-06, + "loss": 1.8421, + "step": 29020500 + }, + { + "epoch": 84.0, + "learning_rate": 8.013134204798075e-06, + "loss": 1.8142, + "step": 29021000 + }, + { + "epoch": 84.01, + "learning_rate": 8.012410557150797e-06, + "loss": 1.8187, + "step": 29021500 + }, + { + "epoch": 84.01, + "learning_rate": 8.01168690950352e-06, + "loss": 1.8089, + "step": 29022000 + }, + { + "epoch": 84.01, + "learning_rate": 8.010963261856245e-06, + "loss": 1.834, + "step": 29022500 + }, + { + "epoch": 84.01, + "learning_rate": 8.010239614208967e-06, + "loss": 1.8241, + "step": 29023000 + }, + { + "epoch": 84.01, + "learning_rate": 8.00951596656169e-06, + "loss": 1.8236, + "step": 29023500 + }, + { + "epoch": 84.01, + "learning_rate": 8.008792318914413e-06, + "loss": 1.8181, + "step": 29024000 + }, + { + "epoch": 84.01, + "learning_rate": 8.008068671267137e-06, + "loss": 1.8156, + "step": 29024500 + }, + { + "epoch": 84.02, + "learning_rate": 8.00734502361986e-06, + "loss": 1.7956, + "step": 29025000 + }, + { + "epoch": 84.02, + "learning_rate": 8.006621375972582e-06, + "loss": 1.7979, + "step": 29025500 + }, + { + "epoch": 84.02, + "learning_rate": 8.005897728325307e-06, + "loss": 1.8344, + "step": 29026000 + }, + { + "epoch": 84.02, + "learning_rate": 8.00517408067803e-06, + "loss": 1.8403, + "step": 29026500 + }, + { + "epoch": 84.02, + "learning_rate": 8.004451880326047e-06, + "loss": 1.8157, + "step": 29027000 + }, + { + "epoch": 84.02, + "learning_rate": 8.00372823267877e-06, + "loss": 1.7896, + "step": 29027500 + }, + { + "epoch": 84.02, + "learning_rate": 8.003004585031495e-06, + "loss": 1.8299, + "step": 29028000 + }, + { + "epoch": 84.03, + "learning_rate": 8.002280937384217e-06, + "loss": 1.7937, + "step": 29028500 + }, + { + "epoch": 84.03, + "learning_rate": 8.001558737032234e-06, + "loss": 1.8232, + "step": 29029000 + }, + { + "epoch": 84.03, + "learning_rate": 8.000835089384958e-06, + "loss": 1.8142, + "step": 29029500 + }, + { + "epoch": 84.03, + "learning_rate": 8.000111441737682e-06, + "loss": 1.7983, + "step": 29030000 + }, + { + "epoch": 84.03, + "learning_rate": 7.999387794090404e-06, + "loss": 1.8046, + "step": 29030500 + }, + { + "epoch": 84.03, + "learning_rate": 7.998665593738421e-06, + "loss": 1.8189, + "step": 29031000 + }, + { + "epoch": 84.03, + "learning_rate": 7.997941946091145e-06, + "loss": 1.8289, + "step": 29031500 + }, + { + "epoch": 84.04, + "learning_rate": 7.99721829844387e-06, + "loss": 1.8186, + "step": 29032000 + }, + { + "epoch": 84.04, + "learning_rate": 7.996494650796592e-06, + "loss": 1.79, + "step": 29032500 + }, + { + "epoch": 84.04, + "learning_rate": 7.995771003149314e-06, + "loss": 1.8202, + "step": 29033000 + }, + { + "epoch": 84.04, + "learning_rate": 7.995048802797333e-06, + "loss": 1.8355, + "step": 29033500 + }, + { + "epoch": 84.04, + "learning_rate": 7.994325155150057e-06, + "loss": 1.8257, + "step": 29034000 + }, + { + "epoch": 84.04, + "learning_rate": 7.993601507502779e-06, + "loss": 1.8238, + "step": 29034500 + }, + { + "epoch": 84.04, + "learning_rate": 7.992877859855503e-06, + "loss": 1.8353, + "step": 29035000 + }, + { + "epoch": 84.05, + "learning_rate": 7.992154212208227e-06, + "loss": 1.8184, + "step": 29035500 + }, + { + "epoch": 84.05, + "learning_rate": 7.991430564560949e-06, + "loss": 1.8156, + "step": 29036000 + }, + { + "epoch": 84.05, + "learning_rate": 7.990708364208966e-06, + "loss": 1.8087, + "step": 29036500 + }, + { + "epoch": 84.05, + "learning_rate": 7.98998471656169e-06, + "loss": 1.8263, + "step": 29037000 + }, + { + "epoch": 84.05, + "learning_rate": 7.989261068914414e-06, + "loss": 1.8425, + "step": 29037500 + }, + { + "epoch": 84.05, + "learning_rate": 7.988537421267136e-06, + "loss": 1.8242, + "step": 29038000 + }, + { + "epoch": 84.05, + "learning_rate": 7.987813773619859e-06, + "loss": 1.7974, + "step": 29038500 + }, + { + "epoch": 84.06, + "learning_rate": 7.987091573267878e-06, + "loss": 1.8451, + "step": 29039000 + }, + { + "epoch": 84.06, + "learning_rate": 7.986369372915895e-06, + "loss": 1.8063, + "step": 29039500 + }, + { + "epoch": 84.06, + "learning_rate": 7.985645725268619e-06, + "loss": 1.8118, + "step": 29040000 + }, + { + "epoch": 84.06, + "learning_rate": 7.984922077621341e-06, + "loss": 1.8011, + "step": 29040500 + }, + { + "epoch": 84.06, + "learning_rate": 7.984198429974065e-06, + "loss": 1.8133, + "step": 29041000 + }, + { + "epoch": 84.06, + "learning_rate": 7.983474782326789e-06, + "loss": 1.8263, + "step": 29041500 + }, + { + "epoch": 84.06, + "learning_rate": 7.982751134679511e-06, + "loss": 1.8098, + "step": 29042000 + }, + { + "epoch": 84.07, + "learning_rate": 7.982027487032235e-06, + "loss": 1.8301, + "step": 29042500 + }, + { + "epoch": 84.07, + "learning_rate": 7.981303839384959e-06, + "loss": 1.8457, + "step": 29043000 + }, + { + "epoch": 84.07, + "learning_rate": 7.980580191737681e-06, + "loss": 1.8161, + "step": 29043500 + }, + { + "epoch": 84.07, + "learning_rate": 7.979857991385698e-06, + "loss": 1.8196, + "step": 29044000 + }, + { + "epoch": 84.07, + "learning_rate": 7.979134343738422e-06, + "loss": 1.8073, + "step": 29044500 + }, + { + "epoch": 84.07, + "learning_rate": 7.978410696091146e-06, + "loss": 1.8159, + "step": 29045000 + }, + { + "epoch": 84.07, + "learning_rate": 7.977687048443868e-06, + "loss": 1.8287, + "step": 29045500 + }, + { + "epoch": 84.08, + "learning_rate": 7.976964848091886e-06, + "loss": 1.8159, + "step": 29046000 + }, + { + "epoch": 84.08, + "learning_rate": 7.97624120044461e-06, + "loss": 1.8035, + "step": 29046500 + }, + { + "epoch": 84.08, + "learning_rate": 7.975517552797334e-06, + "loss": 1.8168, + "step": 29047000 + }, + { + "epoch": 84.08, + "learning_rate": 7.97479535244535e-06, + "loss": 1.8053, + "step": 29047500 + }, + { + "epoch": 84.08, + "learning_rate": 7.974071704798073e-06, + "loss": 1.8337, + "step": 29048000 + }, + { + "epoch": 84.08, + "learning_rate": 7.973348057150797e-06, + "loss": 1.8109, + "step": 29048500 + }, + { + "epoch": 84.08, + "learning_rate": 7.972624409503521e-06, + "loss": 1.8292, + "step": 29049000 + }, + { + "epoch": 84.09, + "learning_rate": 7.971900761856243e-06, + "loss": 1.8202, + "step": 29049500 + }, + { + "epoch": 84.09, + "learning_rate": 7.971177114208967e-06, + "loss": 1.8128, + "step": 29050000 + }, + { + "epoch": 84.09, + "learning_rate": 7.97045346656169e-06, + "loss": 1.8209, + "step": 29050500 + }, + { + "epoch": 84.09, + "learning_rate": 7.969729818914413e-06, + "loss": 1.795, + "step": 29051000 + }, + { + "epoch": 84.09, + "learning_rate": 7.969006171267135e-06, + "loss": 1.8093, + "step": 29051500 + }, + { + "epoch": 84.09, + "learning_rate": 7.96828252361986e-06, + "loss": 1.8038, + "step": 29052000 + }, + { + "epoch": 84.1, + "learning_rate": 7.967558875972583e-06, + "loss": 1.8244, + "step": 29052500 + }, + { + "epoch": 84.1, + "learning_rate": 7.966835228325306e-06, + "loss": 1.8071, + "step": 29053000 + }, + { + "epoch": 84.1, + "learning_rate": 7.966113027973324e-06, + "loss": 1.7958, + "step": 29053500 + }, + { + "epoch": 84.1, + "learning_rate": 7.965389380326047e-06, + "loss": 1.8157, + "step": 29054000 + }, + { + "epoch": 84.1, + "learning_rate": 7.96466573267877e-06, + "loss": 1.8529, + "step": 29054500 + }, + { + "epoch": 84.1, + "learning_rate": 7.963942085031493e-06, + "loss": 1.8146, + "step": 29055000 + }, + { + "epoch": 84.1, + "learning_rate": 7.963218437384217e-06, + "loss": 1.8112, + "step": 29055500 + }, + { + "epoch": 84.11, + "learning_rate": 7.96249478973694e-06, + "loss": 1.8217, + "step": 29056000 + }, + { + "epoch": 84.11, + "learning_rate": 7.961772589384958e-06, + "loss": 1.8158, + "step": 29056500 + }, + { + "epoch": 84.11, + "learning_rate": 7.96104894173768e-06, + "loss": 1.7986, + "step": 29057000 + }, + { + "epoch": 84.11, + "learning_rate": 7.960325294090404e-06, + "loss": 1.7896, + "step": 29057500 + }, + { + "epoch": 84.11, + "learning_rate": 7.959603093738421e-06, + "loss": 1.8426, + "step": 29058000 + }, + { + "epoch": 84.11, + "learning_rate": 7.958879446091145e-06, + "loss": 1.8119, + "step": 29058500 + }, + { + "epoch": 84.11, + "learning_rate": 7.95815579844387e-06, + "loss": 1.8128, + "step": 29059000 + }, + { + "epoch": 84.12, + "learning_rate": 7.957432150796591e-06, + "loss": 1.8097, + "step": 29059500 + }, + { + "epoch": 84.12, + "learning_rate": 7.956708503149315e-06, + "loss": 1.8358, + "step": 29060000 + }, + { + "epoch": 84.12, + "learning_rate": 7.955984855502038e-06, + "loss": 1.8049, + "step": 29060500 + }, + { + "epoch": 84.12, + "learning_rate": 7.955261207854762e-06, + "loss": 1.8103, + "step": 29061000 + }, + { + "epoch": 84.12, + "learning_rate": 7.954539007502779e-06, + "loss": 1.8063, + "step": 29061500 + }, + { + "epoch": 84.12, + "learning_rate": 7.953815359855503e-06, + "loss": 1.8149, + "step": 29062000 + }, + { + "epoch": 84.12, + "learning_rate": 7.953091712208225e-06, + "loss": 1.8172, + "step": 29062500 + }, + { + "epoch": 84.13, + "learning_rate": 7.952368064560949e-06, + "loss": 1.8245, + "step": 29063000 + }, + { + "epoch": 84.13, + "learning_rate": 7.951644416913673e-06, + "loss": 1.8322, + "step": 29063500 + }, + { + "epoch": 84.13, + "learning_rate": 7.950920769266395e-06, + "loss": 1.8208, + "step": 29064000 + }, + { + "epoch": 84.13, + "learning_rate": 7.950197121619119e-06, + "loss": 1.7943, + "step": 29064500 + }, + { + "epoch": 84.13, + "learning_rate": 7.949473473971841e-06, + "loss": 1.837, + "step": 29065000 + }, + { + "epoch": 84.13, + "learning_rate": 7.948749826324565e-06, + "loss": 1.8096, + "step": 29065500 + }, + { + "epoch": 84.13, + "learning_rate": 7.948026178677289e-06, + "loss": 1.8613, + "step": 29066000 + }, + { + "epoch": 84.14, + "learning_rate": 7.947302531030011e-06, + "loss": 1.8172, + "step": 29066500 + }, + { + "epoch": 84.14, + "learning_rate": 7.946580330678029e-06, + "loss": 1.8133, + "step": 29067000 + }, + { + "epoch": 84.14, + "learning_rate": 7.945856683030752e-06, + "loss": 1.8353, + "step": 29067500 + }, + { + "epoch": 84.14, + "learning_rate": 7.945133035383476e-06, + "loss": 1.8244, + "step": 29068000 + }, + { + "epoch": 84.14, + "learning_rate": 7.944410835031494e-06, + "loss": 1.8507, + "step": 29068500 + }, + { + "epoch": 84.14, + "learning_rate": 7.943687187384216e-06, + "loss": 1.8056, + "step": 29069000 + }, + { + "epoch": 84.14, + "learning_rate": 7.94296353973694e-06, + "loss": 1.7867, + "step": 29069500 + }, + { + "epoch": 84.15, + "learning_rate": 7.942239892089664e-06, + "loss": 1.8102, + "step": 29070000 + }, + { + "epoch": 84.15, + "learning_rate": 7.941516244442386e-06, + "loss": 1.8037, + "step": 29070500 + }, + { + "epoch": 84.15, + "learning_rate": 7.94079259679511e-06, + "loss": 1.8377, + "step": 29071000 + }, + { + "epoch": 84.15, + "learning_rate": 7.940068949147834e-06, + "loss": 1.7882, + "step": 29071500 + }, + { + "epoch": 84.15, + "learning_rate": 7.939345301500556e-06, + "loss": 1.7936, + "step": 29072000 + }, + { + "epoch": 84.15, + "learning_rate": 7.938621653853278e-06, + "loss": 1.8299, + "step": 29072500 + }, + { + "epoch": 84.15, + "learning_rate": 7.937898006206002e-06, + "loss": 1.8388, + "step": 29073000 + }, + { + "epoch": 84.16, + "learning_rate": 7.937174358558726e-06, + "loss": 1.82, + "step": 29073500 + }, + { + "epoch": 84.16, + "learning_rate": 7.936452158206743e-06, + "loss": 1.8471, + "step": 29074000 + }, + { + "epoch": 84.16, + "learning_rate": 7.935728510559467e-06, + "loss": 1.8045, + "step": 29074500 + }, + { + "epoch": 84.16, + "learning_rate": 7.93500486291219e-06, + "loss": 1.8247, + "step": 29075000 + }, + { + "epoch": 84.16, + "learning_rate": 7.934281215264914e-06, + "loss": 1.8377, + "step": 29075500 + }, + { + "epoch": 84.16, + "learning_rate": 7.93355901491293e-06, + "loss": 1.819, + "step": 29076000 + }, + { + "epoch": 84.16, + "learning_rate": 7.932835367265655e-06, + "loss": 1.8008, + "step": 29076500 + }, + { + "epoch": 84.17, + "learning_rate": 7.932113166913672e-06, + "loss": 1.8022, + "step": 29077000 + }, + { + "epoch": 84.17, + "learning_rate": 7.931389519266396e-06, + "loss": 1.8129, + "step": 29077500 + }, + { + "epoch": 84.17, + "learning_rate": 7.930665871619118e-06, + "loss": 1.8276, + "step": 29078000 + }, + { + "epoch": 84.17, + "learning_rate": 7.929942223971842e-06, + "loss": 1.7854, + "step": 29078500 + }, + { + "epoch": 84.17, + "learning_rate": 7.929218576324566e-06, + "loss": 1.8389, + "step": 29079000 + }, + { + "epoch": 84.17, + "learning_rate": 7.928496375972583e-06, + "loss": 1.8149, + "step": 29079500 + }, + { + "epoch": 84.17, + "learning_rate": 7.927772728325305e-06, + "loss": 1.822, + "step": 29080000 + }, + { + "epoch": 84.18, + "learning_rate": 7.92704908067803e-06, + "loss": 1.8405, + "step": 29080500 + }, + { + "epoch": 84.18, + "learning_rate": 7.926325433030753e-06, + "loss": 1.816, + "step": 29081000 + }, + { + "epoch": 84.18, + "learning_rate": 7.925601785383476e-06, + "loss": 1.7996, + "step": 29081500 + }, + { + "epoch": 84.18, + "learning_rate": 7.924878137736198e-06, + "loss": 1.786, + "step": 29082000 + }, + { + "epoch": 84.18, + "learning_rate": 7.924154490088922e-06, + "loss": 1.8284, + "step": 29082500 + }, + { + "epoch": 84.18, + "learning_rate": 7.923430842441646e-06, + "loss": 1.8129, + "step": 29083000 + }, + { + "epoch": 84.18, + "learning_rate": 7.922707194794368e-06, + "loss": 1.8122, + "step": 29083500 + }, + { + "epoch": 84.19, + "learning_rate": 7.921983547147092e-06, + "loss": 1.8267, + "step": 29084000 + }, + { + "epoch": 84.19, + "learning_rate": 7.921259899499816e-06, + "loss": 1.8092, + "step": 29084500 + }, + { + "epoch": 84.19, + "learning_rate": 7.920536251852538e-06, + "loss": 1.8261, + "step": 29085000 + }, + { + "epoch": 84.19, + "learning_rate": 7.919814051500555e-06, + "loss": 1.7743, + "step": 29085500 + }, + { + "epoch": 84.19, + "learning_rate": 7.919091851148574e-06, + "loss": 1.8171, + "step": 29086000 + }, + { + "epoch": 84.19, + "learning_rate": 7.918368203501298e-06, + "loss": 1.8131, + "step": 29086500 + }, + { + "epoch": 84.19, + "learning_rate": 7.91764455585402e-06, + "loss": 1.8109, + "step": 29087000 + }, + { + "epoch": 84.2, + "learning_rate": 7.916920908206743e-06, + "loss": 1.8242, + "step": 29087500 + }, + { + "epoch": 84.2, + "learning_rate": 7.916197260559466e-06, + "loss": 1.7861, + "step": 29088000 + }, + { + "epoch": 84.2, + "learning_rate": 7.915475060207485e-06, + "loss": 1.8299, + "step": 29088500 + }, + { + "epoch": 84.2, + "learning_rate": 7.914751412560208e-06, + "loss": 1.8302, + "step": 29089000 + }, + { + "epoch": 84.2, + "learning_rate": 7.91402776491293e-06, + "loss": 1.8108, + "step": 29089500 + }, + { + "epoch": 84.2, + "learning_rate": 7.913304117265655e-06, + "loss": 1.8053, + "step": 29090000 + }, + { + "epoch": 84.21, + "learning_rate": 7.912583364208968e-06, + "loss": 1.8233, + "step": 29090500 + }, + { + "epoch": 84.21, + "learning_rate": 7.91185971656169e-06, + "loss": 1.806, + "step": 29091000 + }, + { + "epoch": 84.21, + "learning_rate": 7.911136068914412e-06, + "loss": 1.8353, + "step": 29091500 + }, + { + "epoch": 84.21, + "learning_rate": 7.910412421267136e-06, + "loss": 1.8359, + "step": 29092000 + }, + { + "epoch": 84.21, + "learning_rate": 7.90968877361986e-06, + "loss": 1.8241, + "step": 29092500 + }, + { + "epoch": 84.21, + "learning_rate": 7.908965125972582e-06, + "loss": 1.8222, + "step": 29093000 + }, + { + "epoch": 84.21, + "learning_rate": 7.908241478325306e-06, + "loss": 1.8223, + "step": 29093500 + }, + { + "epoch": 84.22, + "learning_rate": 7.90751783067803e-06, + "loss": 1.8093, + "step": 29094000 + }, + { + "epoch": 84.22, + "learning_rate": 7.906794183030752e-06, + "loss": 1.7983, + "step": 29094500 + }, + { + "epoch": 84.22, + "learning_rate": 7.906070535383475e-06, + "loss": 1.8378, + "step": 29095000 + }, + { + "epoch": 84.22, + "learning_rate": 7.9053468877362e-06, + "loss": 1.8225, + "step": 29095500 + }, + { + "epoch": 84.22, + "learning_rate": 7.904624687384217e-06, + "loss": 1.8165, + "step": 29096000 + }, + { + "epoch": 84.22, + "learning_rate": 7.90390103973694e-06, + "loss": 1.8201, + "step": 29096500 + }, + { + "epoch": 84.22, + "learning_rate": 7.903177392089662e-06, + "loss": 1.8221, + "step": 29097000 + }, + { + "epoch": 84.23, + "learning_rate": 7.902453744442388e-06, + "loss": 1.8279, + "step": 29097500 + }, + { + "epoch": 84.23, + "learning_rate": 7.90173009679511e-06, + "loss": 1.8122, + "step": 29098000 + }, + { + "epoch": 84.23, + "learning_rate": 7.901006449147832e-06, + "loss": 1.817, + "step": 29098500 + }, + { + "epoch": 84.23, + "learning_rate": 7.900282801500556e-06, + "loss": 1.8168, + "step": 29099000 + }, + { + "epoch": 84.23, + "learning_rate": 7.89955915385328e-06, + "loss": 1.8087, + "step": 29099500 + }, + { + "epoch": 84.23, + "learning_rate": 7.898836953501297e-06, + "loss": 1.8326, + "step": 29100000 + }, + { + "epoch": 84.23, + "learning_rate": 7.89811330585402e-06, + "loss": 1.8001, + "step": 29100500 + }, + { + "epoch": 84.24, + "learning_rate": 7.897389658206743e-06, + "loss": 1.7939, + "step": 29101000 + }, + { + "epoch": 84.24, + "learning_rate": 7.896667457854762e-06, + "loss": 1.8373, + "step": 29101500 + }, + { + "epoch": 84.24, + "learning_rate": 7.895943810207484e-06, + "loss": 1.7953, + "step": 29102000 + }, + { + "epoch": 84.24, + "learning_rate": 7.895221609855502e-06, + "loss": 1.8037, + "step": 29102500 + }, + { + "epoch": 84.24, + "learning_rate": 7.894497962208226e-06, + "loss": 1.8302, + "step": 29103000 + }, + { + "epoch": 84.24, + "learning_rate": 7.89377431456095e-06, + "loss": 1.8167, + "step": 29103500 + }, + { + "epoch": 84.24, + "learning_rate": 7.893050666913672e-06, + "loss": 1.811, + "step": 29104000 + }, + { + "epoch": 84.25, + "learning_rate": 7.892327019266394e-06, + "loss": 1.8069, + "step": 29104500 + }, + { + "epoch": 84.25, + "learning_rate": 7.89160337161912e-06, + "loss": 1.8236, + "step": 29105000 + }, + { + "epoch": 84.25, + "learning_rate": 7.890879723971842e-06, + "loss": 1.7918, + "step": 29105500 + }, + { + "epoch": 84.25, + "learning_rate": 7.890156076324564e-06, + "loss": 1.8134, + "step": 29106000 + }, + { + "epoch": 84.25, + "learning_rate": 7.889432428677288e-06, + "loss": 1.8137, + "step": 29106500 + }, + { + "epoch": 84.25, + "learning_rate": 7.888708781030012e-06, + "loss": 1.8067, + "step": 29107000 + }, + { + "epoch": 84.25, + "learning_rate": 7.887985133382734e-06, + "loss": 1.8133, + "step": 29107500 + }, + { + "epoch": 84.26, + "learning_rate": 7.887261485735458e-06, + "loss": 1.8104, + "step": 29108000 + }, + { + "epoch": 84.26, + "learning_rate": 7.88654073267877e-06, + "loss": 1.8148, + "step": 29108500 + }, + { + "epoch": 84.26, + "learning_rate": 7.885817085031494e-06, + "loss": 1.8304, + "step": 29109000 + }, + { + "epoch": 84.26, + "learning_rate": 7.885093437384217e-06, + "loss": 1.8254, + "step": 29109500 + }, + { + "epoch": 84.26, + "learning_rate": 7.884369789736939e-06, + "loss": 1.8168, + "step": 29110000 + }, + { + "epoch": 84.26, + "learning_rate": 7.883646142089664e-06, + "loss": 1.8219, + "step": 29110500 + }, + { + "epoch": 84.26, + "learning_rate": 7.882922494442387e-06, + "loss": 1.8243, + "step": 29111000 + }, + { + "epoch": 84.27, + "learning_rate": 7.882198846795109e-06, + "loss": 1.8226, + "step": 29111500 + }, + { + "epoch": 84.27, + "learning_rate": 7.881475199147833e-06, + "loss": 1.848, + "step": 29112000 + }, + { + "epoch": 84.27, + "learning_rate": 7.880752998795852e-06, + "loss": 1.82, + "step": 29112500 + }, + { + "epoch": 84.27, + "learning_rate": 7.880029351148574e-06, + "loss": 1.8368, + "step": 29113000 + }, + { + "epoch": 84.27, + "learning_rate": 7.879307150796591e-06, + "loss": 1.8191, + "step": 29113500 + }, + { + "epoch": 84.27, + "learning_rate": 7.878583503149315e-06, + "loss": 1.7996, + "step": 29114000 + }, + { + "epoch": 84.27, + "learning_rate": 7.877859855502039e-06, + "loss": 1.8083, + "step": 29114500 + }, + { + "epoch": 84.28, + "learning_rate": 7.877136207854761e-06, + "loss": 1.8128, + "step": 29115000 + }, + { + "epoch": 84.28, + "learning_rate": 7.876412560207484e-06, + "loss": 1.7979, + "step": 29115500 + }, + { + "epoch": 84.28, + "learning_rate": 7.875690359855503e-06, + "loss": 1.8362, + "step": 29116000 + }, + { + "epoch": 84.28, + "learning_rate": 7.874966712208226e-06, + "loss": 1.8133, + "step": 29116500 + }, + { + "epoch": 84.28, + "learning_rate": 7.874243064560949e-06, + "loss": 1.7941, + "step": 29117000 + }, + { + "epoch": 84.28, + "learning_rate": 7.873519416913671e-06, + "loss": 1.812, + "step": 29117500 + }, + { + "epoch": 84.28, + "learning_rate": 7.872795769266397e-06, + "loss": 1.8408, + "step": 29118000 + }, + { + "epoch": 84.29, + "learning_rate": 7.872073568914414e-06, + "loss": 1.816, + "step": 29118500 + }, + { + "epoch": 84.29, + "learning_rate": 7.871349921267136e-06, + "loss": 1.834, + "step": 29119000 + }, + { + "epoch": 84.29, + "learning_rate": 7.870626273619858e-06, + "loss": 1.7816, + "step": 29119500 + }, + { + "epoch": 84.29, + "learning_rate": 7.869902625972584e-06, + "loss": 1.8292, + "step": 29120000 + }, + { + "epoch": 84.29, + "learning_rate": 7.869180425620601e-06, + "loss": 1.7958, + "step": 29120500 + }, + { + "epoch": 84.29, + "learning_rate": 7.868456777973323e-06, + "loss": 1.8309, + "step": 29121000 + }, + { + "epoch": 84.29, + "learning_rate": 7.867733130326047e-06, + "loss": 1.8218, + "step": 29121500 + }, + { + "epoch": 84.3, + "learning_rate": 7.867009482678771e-06, + "loss": 1.8499, + "step": 29122000 + }, + { + "epoch": 84.3, + "learning_rate": 7.866285835031493e-06, + "loss": 1.7968, + "step": 29122500 + }, + { + "epoch": 84.3, + "learning_rate": 7.86556363467951e-06, + "loss": 1.8342, + "step": 29123000 + }, + { + "epoch": 84.3, + "learning_rate": 7.864839987032235e-06, + "loss": 1.8007, + "step": 29123500 + }, + { + "epoch": 84.3, + "learning_rate": 7.864116339384959e-06, + "loss": 1.8153, + "step": 29124000 + }, + { + "epoch": 84.3, + "learning_rate": 7.86339269173768e-06, + "loss": 1.821, + "step": 29124500 + }, + { + "epoch": 84.3, + "learning_rate": 7.862669044090403e-06, + "loss": 1.8205, + "step": 29125000 + }, + { + "epoch": 84.31, + "learning_rate": 7.861946843738422e-06, + "loss": 1.814, + "step": 29125500 + }, + { + "epoch": 84.31, + "learning_rate": 7.861223196091146e-06, + "loss": 1.8111, + "step": 29126000 + }, + { + "epoch": 84.31, + "learning_rate": 7.860499548443868e-06, + "loss": 1.8439, + "step": 29126500 + }, + { + "epoch": 84.31, + "learning_rate": 7.859775900796592e-06, + "loss": 1.8259, + "step": 29127000 + }, + { + "epoch": 84.31, + "learning_rate": 7.859052253149316e-06, + "loss": 1.8094, + "step": 29127500 + }, + { + "epoch": 84.31, + "learning_rate": 7.858328605502038e-06, + "loss": 1.8303, + "step": 29128000 + }, + { + "epoch": 84.32, + "learning_rate": 7.85760495785476e-06, + "loss": 1.8306, + "step": 29128500 + }, + { + "epoch": 84.32, + "learning_rate": 7.85688275750278e-06, + "loss": 1.8125, + "step": 29129000 + }, + { + "epoch": 84.32, + "learning_rate": 7.856159109855503e-06, + "loss": 1.84, + "step": 29129500 + }, + { + "epoch": 84.32, + "learning_rate": 7.855435462208226e-06, + "loss": 1.824, + "step": 29130000 + }, + { + "epoch": 84.32, + "learning_rate": 7.854711814560948e-06, + "loss": 1.8083, + "step": 29130500 + }, + { + "epoch": 84.32, + "learning_rate": 7.853989614208967e-06, + "loss": 1.8408, + "step": 29131000 + }, + { + "epoch": 84.32, + "learning_rate": 7.85326596656169e-06, + "loss": 1.7977, + "step": 29131500 + }, + { + "epoch": 84.33, + "learning_rate": 7.852542318914413e-06, + "loss": 1.8182, + "step": 29132000 + }, + { + "epoch": 84.33, + "learning_rate": 7.851818671267137e-06, + "loss": 1.8367, + "step": 29132500 + }, + { + "epoch": 84.33, + "learning_rate": 7.85109502361986e-06, + "loss": 1.818, + "step": 29133000 + }, + { + "epoch": 84.33, + "learning_rate": 7.850372823267878e-06, + "loss": 1.799, + "step": 29133500 + }, + { + "epoch": 84.33, + "learning_rate": 7.8496491756206e-06, + "loss": 1.8322, + "step": 29134000 + }, + { + "epoch": 84.33, + "learning_rate": 7.848925527973324e-06, + "loss": 1.8194, + "step": 29134500 + }, + { + "epoch": 84.33, + "learning_rate": 7.848201880326048e-06, + "loss": 1.8176, + "step": 29135000 + }, + { + "epoch": 84.34, + "learning_rate": 7.84747823267877e-06, + "loss": 1.8317, + "step": 29135500 + }, + { + "epoch": 84.34, + "learning_rate": 7.846754585031493e-06, + "loss": 1.8235, + "step": 29136000 + }, + { + "epoch": 84.34, + "learning_rate": 7.846032384679512e-06, + "loss": 1.8301, + "step": 29136500 + }, + { + "epoch": 84.34, + "learning_rate": 7.845308737032235e-06, + "loss": 1.8583, + "step": 29137000 + }, + { + "epoch": 84.34, + "learning_rate": 7.844585089384958e-06, + "loss": 1.812, + "step": 29137500 + }, + { + "epoch": 84.34, + "learning_rate": 7.84386144173768e-06, + "loss": 1.8148, + "step": 29138000 + }, + { + "epoch": 84.34, + "learning_rate": 7.843137794090404e-06, + "loss": 1.8121, + "step": 29138500 + }, + { + "epoch": 84.35, + "learning_rate": 7.842414146443128e-06, + "loss": 1.8269, + "step": 29139000 + }, + { + "epoch": 84.35, + "learning_rate": 7.841691946091145e-06, + "loss": 1.8222, + "step": 29139500 + }, + { + "epoch": 84.35, + "learning_rate": 7.840968298443869e-06, + "loss": 1.825, + "step": 29140000 + }, + { + "epoch": 84.35, + "learning_rate": 7.840246098091886e-06, + "loss": 1.839, + "step": 29140500 + }, + { + "epoch": 84.35, + "learning_rate": 7.83952245044461e-06, + "loss": 1.8135, + "step": 29141000 + }, + { + "epoch": 84.35, + "learning_rate": 7.838798802797332e-06, + "loss": 1.8147, + "step": 29141500 + }, + { + "epoch": 84.35, + "learning_rate": 7.838075155150056e-06, + "loss": 1.8077, + "step": 29142000 + }, + { + "epoch": 84.36, + "learning_rate": 7.83735150750278e-06, + "loss": 1.8291, + "step": 29142500 + }, + { + "epoch": 84.36, + "learning_rate": 7.836627859855502e-06, + "loss": 1.7929, + "step": 29143000 + }, + { + "epoch": 84.36, + "learning_rate": 7.835904212208225e-06, + "loss": 1.8359, + "step": 29143500 + }, + { + "epoch": 84.36, + "learning_rate": 7.835180564560949e-06, + "loss": 1.8215, + "step": 29144000 + }, + { + "epoch": 84.36, + "learning_rate": 7.834458364208968e-06, + "loss": 1.8359, + "step": 29144500 + }, + { + "epoch": 84.36, + "learning_rate": 7.83373471656169e-06, + "loss": 1.8113, + "step": 29145000 + }, + { + "epoch": 84.36, + "learning_rate": 7.833011068914414e-06, + "loss": 1.8297, + "step": 29145500 + }, + { + "epoch": 84.37, + "learning_rate": 7.832287421267136e-06, + "loss": 1.7915, + "step": 29146000 + }, + { + "epoch": 84.37, + "learning_rate": 7.83156377361986e-06, + "loss": 1.8324, + "step": 29146500 + }, + { + "epoch": 84.37, + "learning_rate": 7.830840125972582e-06, + "loss": 1.8113, + "step": 29147000 + }, + { + "epoch": 84.37, + "learning_rate": 7.830116478325306e-06, + "loss": 1.8459, + "step": 29147500 + }, + { + "epoch": 84.37, + "learning_rate": 7.82939283067803e-06, + "loss": 1.8136, + "step": 29148000 + }, + { + "epoch": 84.37, + "learning_rate": 7.828669183030752e-06, + "loss": 1.8229, + "step": 29148500 + }, + { + "epoch": 84.37, + "learning_rate": 7.82794698267877e-06, + "loss": 1.8305, + "step": 29149000 + }, + { + "epoch": 84.38, + "learning_rate": 7.827223335031493e-06, + "loss": 1.8326, + "step": 29149500 + }, + { + "epoch": 84.38, + "learning_rate": 7.826499687384217e-06, + "loss": 1.8212, + "step": 29150000 + }, + { + "epoch": 84.38, + "learning_rate": 7.82577603973694e-06, + "loss": 1.822, + "step": 29150500 + }, + { + "epoch": 84.38, + "learning_rate": 7.825052392089663e-06, + "loss": 1.8205, + "step": 29151000 + }, + { + "epoch": 84.38, + "learning_rate": 7.82433019173768e-06, + "loss": 1.8183, + "step": 29151500 + }, + { + "epoch": 84.38, + "learning_rate": 7.823606544090405e-06, + "loss": 1.793, + "step": 29152000 + }, + { + "epoch": 84.38, + "learning_rate": 7.822882896443127e-06, + "loss": 1.8091, + "step": 29152500 + }, + { + "epoch": 84.39, + "learning_rate": 7.82215924879585e-06, + "loss": 1.814, + "step": 29153000 + }, + { + "epoch": 84.39, + "learning_rate": 7.821435601148575e-06, + "loss": 1.8331, + "step": 29153500 + }, + { + "epoch": 84.39, + "learning_rate": 7.820713400796592e-06, + "loss": 1.8322, + "step": 29154000 + }, + { + "epoch": 84.39, + "learning_rate": 7.819989753149314e-06, + "loss": 1.8286, + "step": 29154500 + }, + { + "epoch": 84.39, + "learning_rate": 7.819266105502038e-06, + "loss": 1.829, + "step": 29155000 + }, + { + "epoch": 84.39, + "learning_rate": 7.818542457854762e-06, + "loss": 1.8059, + "step": 29155500 + }, + { + "epoch": 84.39, + "learning_rate": 7.81782025750278e-06, + "loss": 1.843, + "step": 29156000 + }, + { + "epoch": 84.4, + "learning_rate": 7.817096609855502e-06, + "loss": 1.8278, + "step": 29156500 + }, + { + "epoch": 84.4, + "learning_rate": 7.816372962208225e-06, + "loss": 1.8285, + "step": 29157000 + }, + { + "epoch": 84.4, + "learning_rate": 7.81564931456095e-06, + "loss": 1.8546, + "step": 29157500 + }, + { + "epoch": 84.4, + "learning_rate": 7.814925666913672e-06, + "loss": 1.7881, + "step": 29158000 + }, + { + "epoch": 84.4, + "learning_rate": 7.81420346656169e-06, + "loss": 1.8323, + "step": 29158500 + }, + { + "epoch": 84.4, + "learning_rate": 7.813479818914413e-06, + "loss": 1.8288, + "step": 29159000 + }, + { + "epoch": 84.4, + "learning_rate": 7.812756171267137e-06, + "loss": 1.8224, + "step": 29159500 + }, + { + "epoch": 84.41, + "learning_rate": 7.812032523619859e-06, + "loss": 1.8234, + "step": 29160000 + }, + { + "epoch": 84.41, + "learning_rate": 7.811308875972583e-06, + "loss": 1.8382, + "step": 29160500 + }, + { + "epoch": 84.41, + "learning_rate": 7.810585228325307e-06, + "loss": 1.8311, + "step": 29161000 + }, + { + "epoch": 84.41, + "learning_rate": 7.809861580678029e-06, + "loss": 1.8303, + "step": 29161500 + }, + { + "epoch": 84.41, + "learning_rate": 7.809137933030753e-06, + "loss": 1.8269, + "step": 29162000 + }, + { + "epoch": 84.41, + "learning_rate": 7.80841573267877e-06, + "loss": 1.8171, + "step": 29162500 + }, + { + "epoch": 84.41, + "learning_rate": 7.807693532326787e-06, + "loss": 1.8042, + "step": 29163000 + }, + { + "epoch": 84.42, + "learning_rate": 7.806969884679511e-06, + "loss": 1.8243, + "step": 29163500 + }, + { + "epoch": 84.42, + "learning_rate": 7.806246237032235e-06, + "loss": 1.8191, + "step": 29164000 + }, + { + "epoch": 84.42, + "learning_rate": 7.805524036680253e-06, + "loss": 1.8425, + "step": 29164500 + }, + { + "epoch": 84.42, + "learning_rate": 7.804800389032975e-06, + "loss": 1.8137, + "step": 29165000 + }, + { + "epoch": 84.42, + "learning_rate": 7.804076741385699e-06, + "loss": 1.8261, + "step": 29165500 + }, + { + "epoch": 84.42, + "learning_rate": 7.803353093738423e-06, + "loss": 1.8078, + "step": 29166000 + }, + { + "epoch": 84.43, + "learning_rate": 7.802629446091145e-06, + "loss": 1.8151, + "step": 29166500 + }, + { + "epoch": 84.43, + "learning_rate": 7.801905798443869e-06, + "loss": 1.8128, + "step": 29167000 + }, + { + "epoch": 84.43, + "learning_rate": 7.801182150796591e-06, + "loss": 1.8359, + "step": 29167500 + }, + { + "epoch": 84.43, + "learning_rate": 7.800458503149315e-06, + "loss": 1.8248, + "step": 29168000 + }, + { + "epoch": 84.43, + "learning_rate": 7.799734855502037e-06, + "loss": 1.8165, + "step": 29168500 + }, + { + "epoch": 84.43, + "learning_rate": 7.799012655150056e-06, + "loss": 1.8281, + "step": 29169000 + }, + { + "epoch": 84.43, + "learning_rate": 7.798289007502778e-06, + "loss": 1.8276, + "step": 29169500 + }, + { + "epoch": 84.44, + "learning_rate": 7.797565359855502e-06, + "loss": 1.8328, + "step": 29170000 + }, + { + "epoch": 84.44, + "learning_rate": 7.796841712208226e-06, + "loss": 1.8137, + "step": 29170500 + }, + { + "epoch": 84.44, + "learning_rate": 7.796118064560948e-06, + "loss": 1.8474, + "step": 29171000 + }, + { + "epoch": 84.44, + "learning_rate": 7.795394416913672e-06, + "loss": 1.8255, + "step": 29171500 + }, + { + "epoch": 84.44, + "learning_rate": 7.794670769266395e-06, + "loss": 1.8386, + "step": 29172000 + }, + { + "epoch": 84.44, + "learning_rate": 7.793948568914414e-06, + "loss": 1.8241, + "step": 29172500 + }, + { + "epoch": 84.44, + "learning_rate": 7.793224921267136e-06, + "loss": 1.8366, + "step": 29173000 + }, + { + "epoch": 84.45, + "learning_rate": 7.79250127361986e-06, + "loss": 1.8281, + "step": 29173500 + }, + { + "epoch": 84.45, + "learning_rate": 7.791777625972582e-06, + "loss": 1.8147, + "step": 29174000 + }, + { + "epoch": 84.45, + "learning_rate": 7.791053978325306e-06, + "loss": 1.8152, + "step": 29174500 + }, + { + "epoch": 84.45, + "learning_rate": 7.79033033067803e-06, + "loss": 1.8098, + "step": 29175000 + }, + { + "epoch": 84.45, + "learning_rate": 7.789608130326047e-06, + "loss": 1.8357, + "step": 29175500 + }, + { + "epoch": 84.45, + "learning_rate": 7.78888448267877e-06, + "loss": 1.7985, + "step": 29176000 + }, + { + "epoch": 84.45, + "learning_rate": 7.788160835031493e-06, + "loss": 1.832, + "step": 29176500 + }, + { + "epoch": 84.46, + "learning_rate": 7.787437187384217e-06, + "loss": 1.8163, + "step": 29177000 + }, + { + "epoch": 84.46, + "learning_rate": 7.786714987032234e-06, + "loss": 1.8465, + "step": 29177500 + }, + { + "epoch": 84.46, + "learning_rate": 7.785991339384958e-06, + "loss": 1.8223, + "step": 29178000 + }, + { + "epoch": 84.46, + "learning_rate": 7.78526769173768e-06, + "loss": 1.8197, + "step": 29178500 + }, + { + "epoch": 84.46, + "learning_rate": 7.7845454913857e-06, + "loss": 1.8327, + "step": 29179000 + }, + { + "epoch": 84.46, + "learning_rate": 7.783823291033717e-06, + "loss": 1.8212, + "step": 29179500 + }, + { + "epoch": 84.46, + "learning_rate": 7.783099643386439e-06, + "loss": 1.8055, + "step": 29180000 + }, + { + "epoch": 84.47, + "learning_rate": 7.782375995739163e-06, + "loss": 1.8028, + "step": 29180500 + }, + { + "epoch": 84.47, + "learning_rate": 7.781652348091887e-06, + "loss": 1.8178, + "step": 29181000 + }, + { + "epoch": 84.47, + "learning_rate": 7.780928700444609e-06, + "loss": 1.8404, + "step": 29181500 + }, + { + "epoch": 84.47, + "learning_rate": 7.780205052797333e-06, + "loss": 1.8069, + "step": 29182000 + }, + { + "epoch": 84.47, + "learning_rate": 7.779481405150057e-06, + "loss": 1.822, + "step": 29182500 + }, + { + "epoch": 84.47, + "learning_rate": 7.77875775750278e-06, + "loss": 1.8174, + "step": 29183000 + }, + { + "epoch": 84.47, + "learning_rate": 7.778034109855501e-06, + "loss": 1.8279, + "step": 29183500 + }, + { + "epoch": 84.48, + "learning_rate": 7.777310462208225e-06, + "loss": 1.848, + "step": 29184000 + }, + { + "epoch": 84.48, + "learning_rate": 7.77658681456095e-06, + "loss": 1.8192, + "step": 29184500 + }, + { + "epoch": 84.48, + "learning_rate": 7.775863166913672e-06, + "loss": 1.8231, + "step": 29185000 + }, + { + "epoch": 84.48, + "learning_rate": 7.775140966561689e-06, + "loss": 1.8278, + "step": 29185500 + }, + { + "epoch": 84.48, + "learning_rate": 7.774417318914413e-06, + "loss": 1.8415, + "step": 29186000 + }, + { + "epoch": 84.48, + "learning_rate": 7.773693671267137e-06, + "loss": 1.8072, + "step": 29186500 + }, + { + "epoch": 84.48, + "learning_rate": 7.772970023619859e-06, + "loss": 1.8159, + "step": 29187000 + }, + { + "epoch": 84.49, + "learning_rate": 7.772246375972583e-06, + "loss": 1.8504, + "step": 29187500 + }, + { + "epoch": 84.49, + "learning_rate": 7.771522728325307e-06, + "loss": 1.8139, + "step": 29188000 + }, + { + "epoch": 84.49, + "learning_rate": 7.770800527973324e-06, + "loss": 1.7824, + "step": 29188500 + }, + { + "epoch": 84.49, + "learning_rate": 7.770076880326046e-06, + "loss": 1.8395, + "step": 29189000 + }, + { + "epoch": 84.49, + "learning_rate": 7.76935323267877e-06, + "loss": 1.8084, + "step": 29189500 + }, + { + "epoch": 84.49, + "learning_rate": 7.768629585031494e-06, + "loss": 1.8212, + "step": 29190000 + }, + { + "epoch": 84.49, + "learning_rate": 7.767905937384216e-06, + "loss": 1.7961, + "step": 29190500 + }, + { + "epoch": 84.5, + "learning_rate": 7.76718228973694e-06, + "loss": 1.834, + "step": 29191000 + }, + { + "epoch": 84.5, + "learning_rate": 7.766458642089664e-06, + "loss": 1.8063, + "step": 29191500 + }, + { + "epoch": 84.5, + "learning_rate": 7.765734994442386e-06, + "loss": 1.8445, + "step": 29192000 + }, + { + "epoch": 84.5, + "learning_rate": 7.765011346795109e-06, + "loss": 1.8149, + "step": 29192500 + }, + { + "epoch": 84.5, + "learning_rate": 7.764287699147833e-06, + "loss": 1.8362, + "step": 29193000 + }, + { + "epoch": 84.5, + "learning_rate": 7.763565498795851e-06, + "loss": 1.8091, + "step": 29193500 + }, + { + "epoch": 84.5, + "learning_rate": 7.762841851148574e-06, + "loss": 1.8186, + "step": 29194000 + }, + { + "epoch": 84.51, + "learning_rate": 7.762118203501296e-06, + "loss": 1.8077, + "step": 29194500 + }, + { + "epoch": 84.51, + "learning_rate": 7.761394555854022e-06, + "loss": 1.8433, + "step": 29195000 + }, + { + "epoch": 84.51, + "learning_rate": 7.760670908206744e-06, + "loss": 1.8217, + "step": 29195500 + }, + { + "epoch": 84.51, + "learning_rate": 7.759947260559466e-06, + "loss": 1.8142, + "step": 29196000 + }, + { + "epoch": 84.51, + "learning_rate": 7.75922361291219e-06, + "loss": 1.8165, + "step": 29196500 + }, + { + "epoch": 84.51, + "learning_rate": 7.758501412560209e-06, + "loss": 1.8181, + "step": 29197000 + }, + { + "epoch": 84.51, + "learning_rate": 7.757779212208226e-06, + "loss": 1.8155, + "step": 29197500 + }, + { + "epoch": 84.52, + "learning_rate": 7.757055564560948e-06, + "loss": 1.8263, + "step": 29198000 + }, + { + "epoch": 84.52, + "learning_rate": 7.756331916913672e-06, + "loss": 1.8061, + "step": 29198500 + }, + { + "epoch": 84.52, + "learning_rate": 7.755608269266396e-06, + "loss": 1.8346, + "step": 29199000 + }, + { + "epoch": 84.52, + "learning_rate": 7.754884621619118e-06, + "loss": 1.8518, + "step": 29199500 + }, + { + "epoch": 84.52, + "learning_rate": 7.75416097397184e-06, + "loss": 1.8204, + "step": 29200000 + }, + { + "epoch": 84.52, + "learning_rate": 7.753437326324565e-06, + "loss": 1.8538, + "step": 29200500 + }, + { + "epoch": 84.52, + "learning_rate": 7.752715125972584e-06, + "loss": 1.8271, + "step": 29201000 + }, + { + "epoch": 84.53, + "learning_rate": 7.751991478325306e-06, + "loss": 1.786, + "step": 29201500 + }, + { + "epoch": 84.53, + "learning_rate": 7.751267830678028e-06, + "loss": 1.811, + "step": 29202000 + }, + { + "epoch": 84.53, + "learning_rate": 7.750544183030754e-06, + "loss": 1.8003, + "step": 29202500 + }, + { + "epoch": 84.53, + "learning_rate": 7.749820535383476e-06, + "loss": 1.8391, + "step": 29203000 + }, + { + "epoch": 84.53, + "learning_rate": 7.749096887736198e-06, + "loss": 1.8234, + "step": 29203500 + }, + { + "epoch": 84.53, + "learning_rate": 7.748373240088922e-06, + "loss": 1.8291, + "step": 29204000 + }, + { + "epoch": 84.54, + "learning_rate": 7.747649592441646e-06, + "loss": 1.833, + "step": 29204500 + }, + { + "epoch": 84.54, + "learning_rate": 7.746927392089663e-06, + "loss": 1.84, + "step": 29205000 + }, + { + "epoch": 84.54, + "learning_rate": 7.746203744442385e-06, + "loss": 1.8181, + "step": 29205500 + }, + { + "epoch": 84.54, + "learning_rate": 7.74548009679511e-06, + "loss": 1.8282, + "step": 29206000 + }, + { + "epoch": 84.54, + "learning_rate": 7.744756449147833e-06, + "loss": 1.8034, + "step": 29206500 + }, + { + "epoch": 84.54, + "learning_rate": 7.744032801500556e-06, + "loss": 1.8447, + "step": 29207000 + }, + { + "epoch": 84.54, + "learning_rate": 7.743310601148573e-06, + "loss": 1.8269, + "step": 29207500 + }, + { + "epoch": 84.55, + "learning_rate": 7.742586953501298e-06, + "loss": 1.8233, + "step": 29208000 + }, + { + "epoch": 84.55, + "learning_rate": 7.74186330585402e-06, + "loss": 1.817, + "step": 29208500 + }, + { + "epoch": 84.55, + "learning_rate": 7.741139658206743e-06, + "loss": 1.8204, + "step": 29209000 + }, + { + "epoch": 84.55, + "learning_rate": 7.74041745785476e-06, + "loss": 1.8364, + "step": 29209500 + }, + { + "epoch": 84.55, + "learning_rate": 7.739693810207486e-06, + "loss": 1.7921, + "step": 29210000 + }, + { + "epoch": 84.55, + "learning_rate": 7.738970162560208e-06, + "loss": 1.8485, + "step": 29210500 + }, + { + "epoch": 84.55, + "learning_rate": 7.73824651491293e-06, + "loss": 1.8265, + "step": 29211000 + }, + { + "epoch": 84.56, + "learning_rate": 7.737522867265654e-06, + "loss": 1.8271, + "step": 29211500 + }, + { + "epoch": 84.56, + "learning_rate": 7.736800666913673e-06, + "loss": 1.8352, + "step": 29212000 + }, + { + "epoch": 84.56, + "learning_rate": 7.736077019266395e-06, + "loss": 1.8136, + "step": 29212500 + }, + { + "epoch": 84.56, + "learning_rate": 7.735353371619118e-06, + "loss": 1.8383, + "step": 29213000 + }, + { + "epoch": 84.56, + "learning_rate": 7.734629723971843e-06, + "loss": 1.8125, + "step": 29213500 + }, + { + "epoch": 84.56, + "learning_rate": 7.733906076324565e-06, + "loss": 1.8322, + "step": 29214000 + }, + { + "epoch": 84.56, + "learning_rate": 7.733183875972583e-06, + "loss": 1.828, + "step": 29214500 + }, + { + "epoch": 84.57, + "learning_rate": 7.732460228325305e-06, + "loss": 1.8233, + "step": 29215000 + }, + { + "epoch": 84.57, + "learning_rate": 7.73173658067803e-06, + "loss": 1.8301, + "step": 29215500 + }, + { + "epoch": 84.57, + "learning_rate": 7.731012933030753e-06, + "loss": 1.8432, + "step": 29216000 + }, + { + "epoch": 84.57, + "learning_rate": 7.730289285383475e-06, + "loss": 1.8482, + "step": 29216500 + }, + { + "epoch": 84.57, + "learning_rate": 7.729565637736199e-06, + "loss": 1.8298, + "step": 29217000 + }, + { + "epoch": 84.57, + "learning_rate": 7.728843437384218e-06, + "loss": 1.8585, + "step": 29217500 + }, + { + "epoch": 84.57, + "learning_rate": 7.728121237032235e-06, + "loss": 1.8561, + "step": 29218000 + }, + { + "epoch": 84.58, + "learning_rate": 7.727397589384957e-06, + "loss": 1.8041, + "step": 29218500 + }, + { + "epoch": 84.58, + "learning_rate": 7.72667394173768e-06, + "loss": 1.8322, + "step": 29219000 + }, + { + "epoch": 84.58, + "learning_rate": 7.725950294090405e-06, + "loss": 1.8121, + "step": 29219500 + }, + { + "epoch": 84.58, + "learning_rate": 7.725228093738422e-06, + "loss": 1.8242, + "step": 29220000 + }, + { + "epoch": 84.58, + "learning_rate": 7.724504446091145e-06, + "loss": 1.8242, + "step": 29220500 + }, + { + "epoch": 84.58, + "learning_rate": 7.723780798443869e-06, + "loss": 1.8104, + "step": 29221000 + }, + { + "epoch": 84.58, + "learning_rate": 7.723057150796593e-06, + "loss": 1.8215, + "step": 29221500 + }, + { + "epoch": 84.59, + "learning_rate": 7.722333503149315e-06, + "loss": 1.8197, + "step": 29222000 + }, + { + "epoch": 84.59, + "learning_rate": 7.721609855502037e-06, + "loss": 1.8121, + "step": 29222500 + }, + { + "epoch": 84.59, + "learning_rate": 7.720886207854763e-06, + "loss": 1.8561, + "step": 29223000 + }, + { + "epoch": 84.59, + "learning_rate": 7.720162560207485e-06, + "loss": 1.8033, + "step": 29223500 + }, + { + "epoch": 84.59, + "learning_rate": 7.719438912560207e-06, + "loss": 1.8424, + "step": 29224000 + }, + { + "epoch": 84.59, + "learning_rate": 7.718716712208224e-06, + "loss": 1.8088, + "step": 29224500 + }, + { + "epoch": 84.59, + "learning_rate": 7.717994511856243e-06, + "loss": 1.8149, + "step": 29225000 + }, + { + "epoch": 84.6, + "learning_rate": 7.717272311504262e-06, + "loss": 1.8243, + "step": 29225500 + }, + { + "epoch": 84.6, + "learning_rate": 7.716548663856984e-06, + "loss": 1.8461, + "step": 29226000 + }, + { + "epoch": 84.6, + "learning_rate": 7.715825016209707e-06, + "loss": 1.8361, + "step": 29226500 + }, + { + "epoch": 84.6, + "learning_rate": 7.715101368562432e-06, + "loss": 1.8211, + "step": 29227000 + }, + { + "epoch": 84.6, + "learning_rate": 7.714377720915155e-06, + "loss": 1.8281, + "step": 29227500 + }, + { + "epoch": 84.6, + "learning_rate": 7.713654073267877e-06, + "loss": 1.8182, + "step": 29228000 + }, + { + "epoch": 84.6, + "learning_rate": 7.7129304256206e-06, + "loss": 1.8266, + "step": 29228500 + }, + { + "epoch": 84.61, + "learning_rate": 7.712206777973325e-06, + "loss": 1.8366, + "step": 29229000 + }, + { + "epoch": 84.61, + "learning_rate": 7.711484577621342e-06, + "loss": 1.8279, + "step": 29229500 + }, + { + "epoch": 84.61, + "learning_rate": 7.710760929974064e-06, + "loss": 1.8505, + "step": 29230000 + }, + { + "epoch": 84.61, + "learning_rate": 7.710037282326788e-06, + "loss": 1.8142, + "step": 29230500 + }, + { + "epoch": 84.61, + "learning_rate": 7.709313634679512e-06, + "loss": 1.8213, + "step": 29231000 + }, + { + "epoch": 84.61, + "learning_rate": 7.708589987032234e-06, + "loss": 1.8358, + "step": 29231500 + }, + { + "epoch": 84.61, + "learning_rate": 7.707866339384958e-06, + "loss": 1.8623, + "step": 29232000 + }, + { + "epoch": 84.62, + "learning_rate": 7.707142691737682e-06, + "loss": 1.8453, + "step": 29232500 + }, + { + "epoch": 84.62, + "learning_rate": 7.706419044090404e-06, + "loss": 1.7991, + "step": 29233000 + }, + { + "epoch": 84.62, + "learning_rate": 7.705695396443127e-06, + "loss": 1.8315, + "step": 29233500 + }, + { + "epoch": 84.62, + "learning_rate": 7.70497174879585e-06, + "loss": 1.8272, + "step": 29234000 + }, + { + "epoch": 84.62, + "learning_rate": 7.704248101148574e-06, + "loss": 1.8159, + "step": 29234500 + }, + { + "epoch": 84.62, + "learning_rate": 7.703524453501297e-06, + "loss": 1.8092, + "step": 29235000 + }, + { + "epoch": 84.62, + "learning_rate": 7.70280080585402e-06, + "loss": 1.8299, + "step": 29235500 + }, + { + "epoch": 84.63, + "learning_rate": 7.702078605502038e-06, + "loss": 1.8387, + "step": 29236000 + }, + { + "epoch": 84.63, + "learning_rate": 7.701354957854762e-06, + "loss": 1.871, + "step": 29236500 + }, + { + "epoch": 84.63, + "learning_rate": 7.700631310207484e-06, + "loss": 1.8289, + "step": 29237000 + }, + { + "epoch": 84.63, + "learning_rate": 7.699907662560208e-06, + "loss": 1.8126, + "step": 29237500 + }, + { + "epoch": 84.63, + "learning_rate": 7.699184014912932e-06, + "loss": 1.827, + "step": 29238000 + }, + { + "epoch": 84.63, + "learning_rate": 7.698460367265654e-06, + "loss": 1.8427, + "step": 29238500 + }, + { + "epoch": 84.63, + "learning_rate": 7.697736719618378e-06, + "loss": 1.806, + "step": 29239000 + }, + { + "epoch": 84.64, + "learning_rate": 7.697013071971102e-06, + "loss": 1.8305, + "step": 29239500 + }, + { + "epoch": 84.64, + "learning_rate": 7.69629087161912e-06, + "loss": 1.8037, + "step": 29240000 + }, + { + "epoch": 84.64, + "learning_rate": 7.695567223971841e-06, + "loss": 1.7975, + "step": 29240500 + }, + { + "epoch": 84.64, + "learning_rate": 7.694846470915154e-06, + "loss": 1.8386, + "step": 29241000 + }, + { + "epoch": 84.64, + "learning_rate": 7.694122823267878e-06, + "loss": 1.8063, + "step": 29241500 + }, + { + "epoch": 84.64, + "learning_rate": 7.693399175620602e-06, + "loss": 1.7979, + "step": 29242000 + }, + { + "epoch": 84.65, + "learning_rate": 7.692675527973324e-06, + "loss": 1.8127, + "step": 29242500 + }, + { + "epoch": 84.65, + "learning_rate": 7.691951880326046e-06, + "loss": 1.8153, + "step": 29243000 + }, + { + "epoch": 84.65, + "learning_rate": 7.69122823267877e-06, + "loss": 1.8214, + "step": 29243500 + }, + { + "epoch": 84.65, + "learning_rate": 7.690504585031494e-06, + "loss": 1.8272, + "step": 29244000 + }, + { + "epoch": 84.65, + "learning_rate": 7.689780937384216e-06, + "loss": 1.8219, + "step": 29244500 + }, + { + "epoch": 84.65, + "learning_rate": 7.689058737032235e-06, + "loss": 1.8272, + "step": 29245000 + }, + { + "epoch": 84.65, + "learning_rate": 7.688335089384959e-06, + "loss": 1.8479, + "step": 29245500 + }, + { + "epoch": 84.66, + "learning_rate": 7.687611441737681e-06, + "loss": 1.8487, + "step": 29246000 + }, + { + "epoch": 84.66, + "learning_rate": 7.686887794090403e-06, + "loss": 1.8267, + "step": 29246500 + }, + { + "epoch": 84.66, + "learning_rate": 7.686164146443127e-06, + "loss": 1.8073, + "step": 29247000 + }, + { + "epoch": 84.66, + "learning_rate": 7.685440498795851e-06, + "loss": 1.8273, + "step": 29247500 + }, + { + "epoch": 84.66, + "learning_rate": 7.684716851148574e-06, + "loss": 1.8574, + "step": 29248000 + }, + { + "epoch": 84.66, + "learning_rate": 7.683993203501297e-06, + "loss": 1.8032, + "step": 29248500 + }, + { + "epoch": 84.66, + "learning_rate": 7.683271003149315e-06, + "loss": 1.8217, + "step": 29249000 + }, + { + "epoch": 84.67, + "learning_rate": 7.682547355502039e-06, + "loss": 1.8175, + "step": 29249500 + }, + { + "epoch": 84.67, + "learning_rate": 7.681825155150056e-06, + "loss": 1.8106, + "step": 29250000 + }, + { + "epoch": 84.67, + "learning_rate": 7.68110150750278e-06, + "loss": 1.7981, + "step": 29250500 + }, + { + "epoch": 84.67, + "learning_rate": 7.680379307150797e-06, + "loss": 1.8341, + "step": 29251000 + }, + { + "epoch": 84.67, + "learning_rate": 7.679655659503521e-06, + "loss": 1.8391, + "step": 29251500 + }, + { + "epoch": 84.67, + "learning_rate": 7.678932011856243e-06, + "loss": 1.8136, + "step": 29252000 + }, + { + "epoch": 84.67, + "learning_rate": 7.678208364208967e-06, + "loss": 1.82, + "step": 29252500 + }, + { + "epoch": 84.68, + "learning_rate": 7.677486163856984e-06, + "loss": 1.8341, + "step": 29253000 + }, + { + "epoch": 84.68, + "learning_rate": 7.676762516209708e-06, + "loss": 1.8002, + "step": 29253500 + }, + { + "epoch": 84.68, + "learning_rate": 7.67603886856243e-06, + "loss": 1.8595, + "step": 29254000 + }, + { + "epoch": 84.68, + "learning_rate": 7.675315220915154e-06, + "loss": 1.81, + "step": 29254500 + }, + { + "epoch": 84.68, + "learning_rate": 7.674591573267878e-06, + "loss": 1.7963, + "step": 29255000 + }, + { + "epoch": 84.68, + "learning_rate": 7.6738679256206e-06, + "loss": 1.8266, + "step": 29255500 + }, + { + "epoch": 84.68, + "learning_rate": 7.673144277973323e-06, + "loss": 1.8315, + "step": 29256000 + }, + { + "epoch": 84.69, + "learning_rate": 7.672420630326047e-06, + "loss": 1.8189, + "step": 29256500 + }, + { + "epoch": 84.69, + "learning_rate": 7.67169698267877e-06, + "loss": 1.8372, + "step": 29257000 + }, + { + "epoch": 84.69, + "learning_rate": 7.670973335031493e-06, + "loss": 1.8386, + "step": 29257500 + }, + { + "epoch": 84.69, + "learning_rate": 7.670249687384217e-06, + "loss": 1.8245, + "step": 29258000 + }, + { + "epoch": 84.69, + "learning_rate": 7.66952603973694e-06, + "loss": 1.828, + "step": 29258500 + }, + { + "epoch": 84.69, + "learning_rate": 7.668803839384958e-06, + "loss": 1.8017, + "step": 29259000 + }, + { + "epoch": 84.69, + "learning_rate": 7.668081639032975e-06, + "loss": 1.8005, + "step": 29259500 + }, + { + "epoch": 84.7, + "learning_rate": 7.6673579913857e-06, + "loss": 1.8156, + "step": 29260000 + }, + { + "epoch": 84.7, + "learning_rate": 7.666634343738421e-06, + "loss": 1.8186, + "step": 29260500 + }, + { + "epoch": 84.7, + "learning_rate": 7.665910696091145e-06, + "loss": 1.8255, + "step": 29261000 + }, + { + "epoch": 84.7, + "learning_rate": 7.665187048443868e-06, + "loss": 1.7977, + "step": 29261500 + }, + { + "epoch": 84.7, + "learning_rate": 7.664463400796592e-06, + "loss": 1.8167, + "step": 29262000 + }, + { + "epoch": 84.7, + "learning_rate": 7.663741200444609e-06, + "loss": 1.8199, + "step": 29262500 + }, + { + "epoch": 84.7, + "learning_rate": 7.663017552797333e-06, + "loss": 1.8223, + "step": 29263000 + }, + { + "epoch": 84.71, + "learning_rate": 7.662293905150057e-06, + "loss": 1.8269, + "step": 29263500 + }, + { + "epoch": 84.71, + "learning_rate": 7.661571704798074e-06, + "loss": 1.806, + "step": 29264000 + }, + { + "epoch": 84.71, + "learning_rate": 7.660848057150798e-06, + "loss": 1.8191, + "step": 29264500 + }, + { + "epoch": 84.71, + "learning_rate": 7.66012440950352e-06, + "loss": 1.8106, + "step": 29265000 + }, + { + "epoch": 84.71, + "learning_rate": 7.659400761856244e-06, + "loss": 1.8385, + "step": 29265500 + }, + { + "epoch": 84.71, + "learning_rate": 7.658678561504261e-06, + "loss": 1.8143, + "step": 29266000 + }, + { + "epoch": 84.71, + "learning_rate": 7.657954913856985e-06, + "loss": 1.793, + "step": 29266500 + }, + { + "epoch": 84.72, + "learning_rate": 7.657231266209707e-06, + "loss": 1.8201, + "step": 29267000 + }, + { + "epoch": 84.72, + "learning_rate": 7.656507618562431e-06, + "loss": 1.8259, + "step": 29267500 + }, + { + "epoch": 84.72, + "learning_rate": 7.655783970915154e-06, + "loss": 1.8215, + "step": 29268000 + }, + { + "epoch": 84.72, + "learning_rate": 7.655060323267878e-06, + "loss": 1.8272, + "step": 29268500 + }, + { + "epoch": 84.72, + "learning_rate": 7.6543366756206e-06, + "loss": 1.8317, + "step": 29269000 + }, + { + "epoch": 84.72, + "learning_rate": 7.653613027973324e-06, + "loss": 1.841, + "step": 29269500 + }, + { + "epoch": 84.72, + "learning_rate": 7.652889380326048e-06, + "loss": 1.8171, + "step": 29270000 + }, + { + "epoch": 84.73, + "learning_rate": 7.65216573267877e-06, + "loss": 1.8262, + "step": 29270500 + }, + { + "epoch": 84.73, + "learning_rate": 7.651443532326789e-06, + "loss": 1.8319, + "step": 29271000 + }, + { + "epoch": 84.73, + "learning_rate": 7.650721331974806e-06, + "loss": 1.8117, + "step": 29271500 + }, + { + "epoch": 84.73, + "learning_rate": 7.649997684327528e-06, + "loss": 1.8237, + "step": 29272000 + }, + { + "epoch": 84.73, + "learning_rate": 7.649274036680252e-06, + "loss": 1.8273, + "step": 29272500 + }, + { + "epoch": 84.73, + "learning_rate": 7.648550389032976e-06, + "loss": 1.8363, + "step": 29273000 + }, + { + "epoch": 84.73, + "learning_rate": 7.647826741385698e-06, + "loss": 1.8375, + "step": 29273500 + }, + { + "epoch": 84.74, + "learning_rate": 7.647103093738422e-06, + "loss": 1.8232, + "step": 29274000 + }, + { + "epoch": 84.74, + "learning_rate": 7.646379446091145e-06, + "loss": 1.8189, + "step": 29274500 + }, + { + "epoch": 84.74, + "learning_rate": 7.645655798443868e-06, + "loss": 1.8423, + "step": 29275000 + }, + { + "epoch": 84.74, + "learning_rate": 7.644933598091886e-06, + "loss": 1.8232, + "step": 29275500 + }, + { + "epoch": 84.74, + "learning_rate": 7.64420995044461e-06, + "loss": 1.8277, + "step": 29276000 + }, + { + "epoch": 84.74, + "learning_rate": 7.643486302797334e-06, + "loss": 1.8022, + "step": 29276500 + }, + { + "epoch": 84.74, + "learning_rate": 7.642762655150056e-06, + "loss": 1.8035, + "step": 29277000 + }, + { + "epoch": 84.75, + "learning_rate": 7.64203900750278e-06, + "loss": 1.8501, + "step": 29277500 + }, + { + "epoch": 84.75, + "learning_rate": 7.641315359855502e-06, + "loss": 1.8232, + "step": 29278000 + }, + { + "epoch": 84.75, + "learning_rate": 7.640594606798814e-06, + "loss": 1.8131, + "step": 29278500 + }, + { + "epoch": 84.75, + "learning_rate": 7.639870959151538e-06, + "loss": 1.828, + "step": 29279000 + }, + { + "epoch": 84.75, + "learning_rate": 7.63914731150426e-06, + "loss": 1.8332, + "step": 29279500 + }, + { + "epoch": 84.75, + "learning_rate": 7.638423663856984e-06, + "loss": 1.8343, + "step": 29280000 + }, + { + "epoch": 84.76, + "learning_rate": 7.637700016209708e-06, + "loss": 1.8334, + "step": 29280500 + }, + { + "epoch": 84.76, + "learning_rate": 7.63697636856243e-06, + "loss": 1.82, + "step": 29281000 + }, + { + "epoch": 84.76, + "learning_rate": 7.636252720915154e-06, + "loss": 1.8198, + "step": 29281500 + }, + { + "epoch": 84.76, + "learning_rate": 7.635529073267878e-06, + "loss": 1.8298, + "step": 29282000 + }, + { + "epoch": 84.76, + "learning_rate": 7.634806872915896e-06, + "loss": 1.8418, + "step": 29282500 + }, + { + "epoch": 84.76, + "learning_rate": 7.634084672563913e-06, + "loss": 1.8542, + "step": 29283000 + }, + { + "epoch": 84.76, + "learning_rate": 7.633361024916637e-06, + "loss": 1.8269, + "step": 29283500 + }, + { + "epoch": 84.77, + "learning_rate": 7.632637377269359e-06, + "loss": 1.8633, + "step": 29284000 + }, + { + "epoch": 84.77, + "learning_rate": 7.631913729622083e-06, + "loss": 1.8108, + "step": 29284500 + }, + { + "epoch": 84.77, + "learning_rate": 7.631190081974805e-06, + "loss": 1.8127, + "step": 29285000 + }, + { + "epoch": 84.77, + "learning_rate": 7.630466434327529e-06, + "loss": 1.8271, + "step": 29285500 + }, + { + "epoch": 84.77, + "learning_rate": 7.629742786680253e-06, + "loss": 1.8562, + "step": 29286000 + }, + { + "epoch": 84.77, + "learning_rate": 7.629019139032975e-06, + "loss": 1.8253, + "step": 29286500 + }, + { + "epoch": 84.77, + "learning_rate": 7.628295491385699e-06, + "loss": 1.8374, + "step": 29287000 + }, + { + "epoch": 84.78, + "learning_rate": 7.627573291033717e-06, + "loss": 1.8113, + "step": 29287500 + }, + { + "epoch": 84.78, + "learning_rate": 7.6268496433864395e-06, + "loss": 1.8171, + "step": 29288000 + }, + { + "epoch": 84.78, + "learning_rate": 7.6261259957391625e-06, + "loss": 1.851, + "step": 29288500 + }, + { + "epoch": 84.78, + "learning_rate": 7.6254023480918865e-06, + "loss": 1.8268, + "step": 29289000 + }, + { + "epoch": 84.78, + "learning_rate": 7.6246787004446096e-06, + "loss": 1.8049, + "step": 29289500 + }, + { + "epoch": 84.78, + "learning_rate": 7.623956500092627e-06, + "loss": 1.8095, + "step": 29290000 + }, + { + "epoch": 84.78, + "learning_rate": 7.62323285244535e-06, + "loss": 1.8019, + "step": 29290500 + }, + { + "epoch": 84.79, + "learning_rate": 7.622509204798074e-06, + "loss": 1.8253, + "step": 29291000 + }, + { + "epoch": 84.79, + "learning_rate": 7.621785557150797e-06, + "loss": 1.8327, + "step": 29291500 + }, + { + "epoch": 84.79, + "learning_rate": 7.62106190950352e-06, + "loss": 1.817, + "step": 29292000 + }, + { + "epoch": 84.79, + "learning_rate": 7.620339709151537e-06, + "loss": 1.8123, + "step": 29292500 + }, + { + "epoch": 84.79, + "learning_rate": 7.619616061504262e-06, + "loss": 1.8011, + "step": 29293000 + }, + { + "epoch": 84.79, + "learning_rate": 7.618892413856984e-06, + "loss": 1.8252, + "step": 29293500 + }, + { + "epoch": 84.79, + "learning_rate": 7.618168766209707e-06, + "loss": 1.8153, + "step": 29294000 + }, + { + "epoch": 84.8, + "learning_rate": 7.6174465658577246e-06, + "loss": 1.8532, + "step": 29294500 + }, + { + "epoch": 84.8, + "learning_rate": 7.616722918210449e-06, + "loss": 1.7922, + "step": 29295000 + }, + { + "epoch": 84.8, + "learning_rate": 7.6159992705631716e-06, + "loss": 1.8177, + "step": 29295500 + }, + { + "epoch": 84.8, + "learning_rate": 7.615275622915895e-06, + "loss": 1.8176, + "step": 29296000 + }, + { + "epoch": 84.8, + "learning_rate": 7.614551975268619e-06, + "loss": 1.8443, + "step": 29296500 + }, + { + "epoch": 84.8, + "learning_rate": 7.613828327621342e-06, + "loss": 1.8137, + "step": 29297000 + }, + { + "epoch": 84.8, + "learning_rate": 7.61310612726936e-06, + "loss": 1.8122, + "step": 29297500 + }, + { + "epoch": 84.81, + "learning_rate": 7.612382479622082e-06, + "loss": 1.8151, + "step": 29298000 + }, + { + "epoch": 84.81, + "learning_rate": 7.6116602792701e-06, + "loss": 1.8338, + "step": 29298500 + }, + { + "epoch": 84.81, + "learning_rate": 7.610936631622824e-06, + "loss": 1.8218, + "step": 29299000 + }, + { + "epoch": 84.81, + "learning_rate": 7.610212983975547e-06, + "loss": 1.8038, + "step": 29299500 + }, + { + "epoch": 84.81, + "learning_rate": 7.609489336328269e-06, + "loss": 1.8173, + "step": 29300000 + }, + { + "epoch": 84.81, + "learning_rate": 7.608765688680994e-06, + "loss": 1.8502, + "step": 29300500 + }, + { + "epoch": 84.81, + "learning_rate": 7.608042041033716e-06, + "loss": 1.8228, + "step": 29301000 + }, + { + "epoch": 84.82, + "learning_rate": 7.607318393386439e-06, + "loss": 1.8427, + "step": 29301500 + }, + { + "epoch": 84.82, + "learning_rate": 7.606594745739163e-06, + "loss": 1.8015, + "step": 29302000 + }, + { + "epoch": 84.82, + "learning_rate": 7.6058710980918864e-06, + "loss": 1.8021, + "step": 29302500 + }, + { + "epoch": 84.82, + "learning_rate": 7.6051474504446095e-06, + "loss": 1.8139, + "step": 29303000 + }, + { + "epoch": 84.82, + "learning_rate": 7.604425250092627e-06, + "loss": 1.8322, + "step": 29303500 + }, + { + "epoch": 84.82, + "learning_rate": 7.6037016024453515e-06, + "loss": 1.8041, + "step": 29304000 + }, + { + "epoch": 84.82, + "learning_rate": 7.602977954798074e-06, + "loss": 1.8178, + "step": 29304500 + }, + { + "epoch": 84.83, + "learning_rate": 7.602254307150797e-06, + "loss": 1.8123, + "step": 29305000 + }, + { + "epoch": 84.83, + "learning_rate": 7.601532106798814e-06, + "loss": 1.8283, + "step": 29305500 + }, + { + "epoch": 84.83, + "learning_rate": 7.600808459151539e-06, + "loss": 1.8532, + "step": 29306000 + }, + { + "epoch": 84.83, + "learning_rate": 7.600084811504261e-06, + "loss": 1.8219, + "step": 29306500 + }, + { + "epoch": 84.83, + "learning_rate": 7.599361163856984e-06, + "loss": 1.8496, + "step": 29307000 + }, + { + "epoch": 84.83, + "learning_rate": 7.598637516209707e-06, + "loss": 1.7974, + "step": 29307500 + }, + { + "epoch": 84.83, + "learning_rate": 7.597913868562431e-06, + "loss": 1.8445, + "step": 29308000 + }, + { + "epoch": 84.84, + "learning_rate": 7.597190220915154e-06, + "loss": 1.8341, + "step": 29308500 + }, + { + "epoch": 84.84, + "learning_rate": 7.5964665732678765e-06, + "loss": 1.7889, + "step": 29309000 + }, + { + "epoch": 84.84, + "learning_rate": 7.595742925620601e-06, + "loss": 1.8195, + "step": 29309500 + }, + { + "epoch": 84.84, + "learning_rate": 7.5950207252686185e-06, + "loss": 1.8328, + "step": 29310000 + }, + { + "epoch": 84.84, + "learning_rate": 7.594297077621342e-06, + "loss": 1.8185, + "step": 29310500 + }, + { + "epoch": 84.84, + "learning_rate": 7.593574877269359e-06, + "loss": 1.8046, + "step": 29311000 + }, + { + "epoch": 84.84, + "learning_rate": 7.592851229622084e-06, + "loss": 1.83, + "step": 29311500 + }, + { + "epoch": 84.85, + "learning_rate": 7.592127581974806e-06, + "loss": 1.8248, + "step": 29312000 + }, + { + "epoch": 84.85, + "learning_rate": 7.591403934327529e-06, + "loss": 1.8357, + "step": 29312500 + }, + { + "epoch": 84.85, + "learning_rate": 7.590680286680252e-06, + "loss": 1.8083, + "step": 29313000 + }, + { + "epoch": 84.85, + "learning_rate": 7.589958086328271e-06, + "loss": 1.8002, + "step": 29313500 + }, + { + "epoch": 84.85, + "learning_rate": 7.589234438680993e-06, + "loss": 1.814, + "step": 29314000 + }, + { + "epoch": 84.85, + "learning_rate": 7.588510791033716e-06, + "loss": 1.7825, + "step": 29314500 + }, + { + "epoch": 84.85, + "learning_rate": 7.587787143386439e-06, + "loss": 1.8282, + "step": 29315000 + }, + { + "epoch": 84.86, + "learning_rate": 7.587064943034458e-06, + "loss": 1.8848, + "step": 29315500 + }, + { + "epoch": 84.86, + "learning_rate": 7.586341295387181e-06, + "loss": 1.8334, + "step": 29316000 + }, + { + "epoch": 84.86, + "learning_rate": 7.585617647739904e-06, + "loss": 1.8289, + "step": 29316500 + }, + { + "epoch": 84.86, + "learning_rate": 7.584894000092627e-06, + "loss": 1.8118, + "step": 29317000 + }, + { + "epoch": 84.86, + "learning_rate": 7.584170352445351e-06, + "loss": 1.8372, + "step": 29317500 + }, + { + "epoch": 84.86, + "learning_rate": 7.583446704798074e-06, + "loss": 1.7997, + "step": 29318000 + }, + { + "epoch": 84.87, + "learning_rate": 7.582723057150797e-06, + "loss": 1.8088, + "step": 29318500 + }, + { + "epoch": 84.87, + "learning_rate": 7.581999409503521e-06, + "loss": 1.8175, + "step": 29319000 + }, + { + "epoch": 84.87, + "learning_rate": 7.581275761856244e-06, + "loss": 1.8289, + "step": 29319500 + }, + { + "epoch": 84.87, + "learning_rate": 7.580553561504261e-06, + "loss": 1.8459, + "step": 29320000 + }, + { + "epoch": 84.87, + "learning_rate": 7.579829913856984e-06, + "loss": 1.7984, + "step": 29320500 + }, + { + "epoch": 84.87, + "learning_rate": 7.579106266209708e-06, + "loss": 1.8319, + "step": 29321000 + }, + { + "epoch": 84.87, + "learning_rate": 7.578382618562431e-06, + "loss": 1.8084, + "step": 29321500 + }, + { + "epoch": 84.88, + "learning_rate": 7.577660418210448e-06, + "loss": 1.8325, + "step": 29322000 + }, + { + "epoch": 84.88, + "learning_rate": 7.5769367705631715e-06, + "loss": 1.8184, + "step": 29322500 + }, + { + "epoch": 84.88, + "learning_rate": 7.576213122915895e-06, + "loss": 1.8088, + "step": 29323000 + }, + { + "epoch": 84.88, + "learning_rate": 7.5754894752686185e-06, + "loss": 1.8291, + "step": 29323500 + }, + { + "epoch": 84.88, + "learning_rate": 7.5747658276213416e-06, + "loss": 1.8144, + "step": 29324000 + }, + { + "epoch": 84.88, + "learning_rate": 7.5740421799740655e-06, + "loss": 1.8423, + "step": 29324500 + }, + { + "epoch": 84.88, + "learning_rate": 7.5733185323267886e-06, + "loss": 1.8151, + "step": 29325000 + }, + { + "epoch": 84.89, + "learning_rate": 7.572594884679511e-06, + "loss": 1.8248, + "step": 29325500 + }, + { + "epoch": 84.89, + "learning_rate": 7.571872684327529e-06, + "loss": 1.8201, + "step": 29326000 + }, + { + "epoch": 84.89, + "learning_rate": 7.571149036680253e-06, + "loss": 1.8229, + "step": 29326500 + }, + { + "epoch": 84.89, + "learning_rate": 7.570425389032976e-06, + "loss": 1.8146, + "step": 29327000 + }, + { + "epoch": 84.89, + "learning_rate": 7.569701741385698e-06, + "loss": 1.83, + "step": 29327500 + }, + { + "epoch": 84.89, + "learning_rate": 7.568979541033716e-06, + "loss": 1.8171, + "step": 29328000 + }, + { + "epoch": 84.89, + "learning_rate": 7.56825589338644e-06, + "loss": 1.7998, + "step": 29328500 + }, + { + "epoch": 84.9, + "learning_rate": 7.567532245739163e-06, + "loss": 1.7945, + "step": 29329000 + }, + { + "epoch": 84.9, + "learning_rate": 7.566808598091886e-06, + "loss": 1.8038, + "step": 29329500 + }, + { + "epoch": 84.9, + "learning_rate": 7.5660849504446086e-06, + "loss": 1.8233, + "step": 29330000 + }, + { + "epoch": 84.9, + "learning_rate": 7.5653627500926275e-06, + "loss": 1.8069, + "step": 29330500 + }, + { + "epoch": 84.9, + "learning_rate": 7.564639102445351e-06, + "loss": 1.7961, + "step": 29331000 + }, + { + "epoch": 84.9, + "learning_rate": 7.563915454798074e-06, + "loss": 1.8026, + "step": 29331500 + }, + { + "epoch": 84.9, + "learning_rate": 7.563191807150798e-06, + "loss": 1.8146, + "step": 29332000 + }, + { + "epoch": 84.91, + "learning_rate": 7.562468159503521e-06, + "loss": 1.8605, + "step": 29332500 + }, + { + "epoch": 84.91, + "learning_rate": 7.561744511856243e-06, + "loss": 1.8249, + "step": 29333000 + }, + { + "epoch": 84.91, + "learning_rate": 7.561020864208966e-06, + "loss": 1.8226, + "step": 29333500 + }, + { + "epoch": 84.91, + "learning_rate": 7.56029721656169e-06, + "loss": 1.8238, + "step": 29334000 + }, + { + "epoch": 84.91, + "learning_rate": 7.559575016209708e-06, + "loss": 1.8341, + "step": 29334500 + }, + { + "epoch": 84.91, + "learning_rate": 7.558851368562431e-06, + "loss": 1.8206, + "step": 29335000 + }, + { + "epoch": 84.91, + "learning_rate": 7.558127720915153e-06, + "loss": 1.8295, + "step": 29335500 + }, + { + "epoch": 84.92, + "learning_rate": 7.557404073267878e-06, + "loss": 1.7973, + "step": 29336000 + }, + { + "epoch": 84.92, + "learning_rate": 7.5566804256206e-06, + "loss": 1.8149, + "step": 29336500 + }, + { + "epoch": 84.92, + "learning_rate": 7.5559582252686184e-06, + "loss": 1.8196, + "step": 29337000 + }, + { + "epoch": 84.92, + "learning_rate": 7.555234577621341e-06, + "loss": 1.8167, + "step": 29337500 + }, + { + "epoch": 84.92, + "learning_rate": 7.5545109299740654e-06, + "loss": 1.7899, + "step": 29338000 + }, + { + "epoch": 84.92, + "learning_rate": 7.553787282326788e-06, + "loss": 1.8071, + "step": 29338500 + }, + { + "epoch": 84.92, + "learning_rate": 7.553063634679511e-06, + "loss": 1.8094, + "step": 29339000 + }, + { + "epoch": 84.93, + "learning_rate": 7.552339987032235e-06, + "loss": 1.7853, + "step": 29339500 + }, + { + "epoch": 84.93, + "learning_rate": 7.551617786680253e-06, + "loss": 1.8053, + "step": 29340000 + }, + { + "epoch": 84.93, + "learning_rate": 7.550894139032976e-06, + "loss": 1.8471, + "step": 29340500 + }, + { + "epoch": 84.93, + "learning_rate": 7.550171938680993e-06, + "loss": 1.8304, + "step": 29341000 + }, + { + "epoch": 84.93, + "learning_rate": 7.549448291033717e-06, + "loss": 1.8371, + "step": 29341500 + }, + { + "epoch": 84.93, + "learning_rate": 7.54872464338644e-06, + "loss": 1.8137, + "step": 29342000 + }, + { + "epoch": 84.93, + "learning_rate": 7.548000995739163e-06, + "loss": 1.8125, + "step": 29342500 + }, + { + "epoch": 84.94, + "learning_rate": 7.547277348091885e-06, + "loss": 1.8112, + "step": 29343000 + }, + { + "epoch": 84.94, + "learning_rate": 7.54655370044461e-06, + "loss": 1.7889, + "step": 29343500 + }, + { + "epoch": 84.94, + "learning_rate": 7.5458300527973324e-06, + "loss": 1.8164, + "step": 29344000 + }, + { + "epoch": 84.94, + "learning_rate": 7.5451064051500555e-06, + "loss": 1.829, + "step": 29344500 + }, + { + "epoch": 84.94, + "learning_rate": 7.5443827575027794e-06, + "loss": 1.8108, + "step": 29345000 + }, + { + "epoch": 84.94, + "learning_rate": 7.5436591098555025e-06, + "loss": 1.8138, + "step": 29345500 + }, + { + "epoch": 84.94, + "learning_rate": 7.542935462208226e-06, + "loss": 1.8252, + "step": 29346000 + }, + { + "epoch": 84.95, + "learning_rate": 7.542213261856243e-06, + "loss": 1.8213, + "step": 29346500 + }, + { + "epoch": 84.95, + "learning_rate": 7.541489614208968e-06, + "loss": 1.8217, + "step": 29347000 + }, + { + "epoch": 84.95, + "learning_rate": 7.54076596656169e-06, + "loss": 1.8483, + "step": 29347500 + }, + { + "epoch": 84.95, + "learning_rate": 7.540042318914413e-06, + "loss": 1.8394, + "step": 29348000 + }, + { + "epoch": 84.95, + "learning_rate": 7.539318671267136e-06, + "loss": 1.8231, + "step": 29348500 + }, + { + "epoch": 84.95, + "learning_rate": 7.538596470915155e-06, + "loss": 1.8196, + "step": 29349000 + }, + { + "epoch": 84.95, + "learning_rate": 7.537872823267877e-06, + "loss": 1.8159, + "step": 29349500 + }, + { + "epoch": 84.96, + "learning_rate": 7.5371491756206e-06, + "loss": 1.8034, + "step": 29350000 + }, + { + "epoch": 84.96, + "learning_rate": 7.536425527973323e-06, + "loss": 1.8236, + "step": 29350500 + }, + { + "epoch": 84.96, + "learning_rate": 7.535703327621342e-06, + "loss": 1.8094, + "step": 29351000 + }, + { + "epoch": 84.96, + "learning_rate": 7.5349796799740645e-06, + "loss": 1.8445, + "step": 29351500 + }, + { + "epoch": 84.96, + "learning_rate": 7.534256032326788e-06, + "loss": 1.7982, + "step": 29352000 + }, + { + "epoch": 84.96, + "learning_rate": 7.533533831974805e-06, + "loss": 1.823, + "step": 29352500 + }, + { + "epoch": 84.96, + "learning_rate": 7.53281018432753e-06, + "loss": 1.8223, + "step": 29353000 + }, + { + "epoch": 84.97, + "learning_rate": 7.532086536680253e-06, + "loss": 1.8225, + "step": 29353500 + }, + { + "epoch": 84.97, + "learning_rate": 7.531362889032975e-06, + "loss": 1.8303, + "step": 29354000 + }, + { + "epoch": 84.97, + "learning_rate": 7.5306392413857e-06, + "loss": 1.8214, + "step": 29354500 + }, + { + "epoch": 84.97, + "learning_rate": 7.529915593738422e-06, + "loss": 1.8319, + "step": 29355000 + }, + { + "epoch": 84.97, + "learning_rate": 7.52919339338644e-06, + "loss": 1.8083, + "step": 29355500 + }, + { + "epoch": 84.97, + "learning_rate": 7.528469745739162e-06, + "loss": 1.8144, + "step": 29356000 + }, + { + "epoch": 84.98, + "learning_rate": 7.527746098091887e-06, + "loss": 1.7986, + "step": 29356500 + }, + { + "epoch": 84.98, + "learning_rate": 7.527022450444609e-06, + "loss": 1.8313, + "step": 29357000 + }, + { + "epoch": 84.98, + "learning_rate": 7.526298802797332e-06, + "loss": 1.8424, + "step": 29357500 + }, + { + "epoch": 84.98, + "learning_rate": 7.5255751551500555e-06, + "loss": 1.8297, + "step": 29358000 + }, + { + "epoch": 84.98, + "learning_rate": 7.524851507502779e-06, + "loss": 1.8413, + "step": 29358500 + }, + { + "epoch": 84.98, + "learning_rate": 7.524129307150797e-06, + "loss": 1.8378, + "step": 29359000 + }, + { + "epoch": 84.98, + "learning_rate": 7.52340565950352e-06, + "loss": 1.8011, + "step": 29359500 + }, + { + "epoch": 84.99, + "learning_rate": 7.5226820118562445e-06, + "loss": 1.8068, + "step": 29360000 + }, + { + "epoch": 84.99, + "learning_rate": 7.521959811504262e-06, + "loss": 1.8668, + "step": 29360500 + }, + { + "epoch": 84.99, + "learning_rate": 7.521236163856985e-06, + "loss": 1.8227, + "step": 29361000 + }, + { + "epoch": 84.99, + "learning_rate": 7.520512516209707e-06, + "loss": 1.815, + "step": 29361500 + }, + { + "epoch": 84.99, + "learning_rate": 7.519788868562432e-06, + "loss": 1.8104, + "step": 29362000 + }, + { + "epoch": 84.99, + "learning_rate": 7.519065220915154e-06, + "loss": 1.8364, + "step": 29362500 + }, + { + "epoch": 84.99, + "learning_rate": 7.518341573267877e-06, + "loss": 1.813, + "step": 29363000 + }, + { + "epoch": 85.0, + "learning_rate": 7.5176179256206e-06, + "loss": 1.8539, + "step": 29363500 + }, + { + "epoch": 85.0, + "learning_rate": 7.516894277973324e-06, + "loss": 1.8499, + "step": 29364000 + }, + { + "epoch": 85.0, + "learning_rate": 7.516170630326047e-06, + "loss": 1.8189, + "step": 29364500 + }, + { + "epoch": 85.0, + "learning_rate": 7.51544698267877e-06, + "loss": 1.8014, + "step": 29365000 + }, + { + "epoch": 85.0, + "eval_accuracy": 0.6880164121352734, + "eval_accuracy_mlm": 0.6568216000283631, + "eval_accuracy_nsp": 0.8553665791294863, + "eval_loss": 2.2023632526397705, + "eval_runtime": 331.6134, + "eval_samples_per_second": 1315.948, + "eval_steps_per_second": 54.832, + "step": 29365120 + }, + { + "epoch": 85.0, + "learning_rate": 7.514723335031494e-06, + "loss": 1.8343, + "step": 29365500 + }, + { + "epoch": 85.0, + "learning_rate": 7.5140025819748065e-06, + "loss": 1.8123, + "step": 29366000 + }, + { + "epoch": 85.0, + "learning_rate": 7.51327893432753e-06, + "loss": 1.8284, + "step": 29366500 + }, + { + "epoch": 85.01, + "learning_rate": 7.512555286680252e-06, + "loss": 1.7882, + "step": 29367000 + }, + { + "epoch": 85.01, + "learning_rate": 7.511831639032975e-06, + "loss": 1.7784, + "step": 29367500 + }, + { + "epoch": 85.01, + "learning_rate": 7.511107991385699e-06, + "loss": 1.8092, + "step": 29368000 + }, + { + "epoch": 85.01, + "learning_rate": 7.510384343738422e-06, + "loss": 1.8391, + "step": 29368500 + }, + { + "epoch": 85.01, + "learning_rate": 7.509660696091145e-06, + "loss": 1.8096, + "step": 29369000 + }, + { + "epoch": 85.01, + "learning_rate": 7.508937048443869e-06, + "loss": 1.7975, + "step": 29369500 + }, + { + "epoch": 85.01, + "learning_rate": 7.508213400796592e-06, + "loss": 1.8003, + "step": 29370000 + }, + { + "epoch": 85.02, + "learning_rate": 7.507489753149314e-06, + "loss": 1.7968, + "step": 29370500 + }, + { + "epoch": 85.02, + "learning_rate": 7.506766105502037e-06, + "loss": 1.7995, + "step": 29371000 + }, + { + "epoch": 85.02, + "learning_rate": 7.506042457854762e-06, + "loss": 1.8169, + "step": 29371500 + }, + { + "epoch": 85.02, + "learning_rate": 7.505318810207484e-06, + "loss": 1.8182, + "step": 29372000 + }, + { + "epoch": 85.02, + "learning_rate": 7.504595162560207e-06, + "loss": 1.822, + "step": 29372500 + }, + { + "epoch": 85.02, + "learning_rate": 7.503872962208226e-06, + "loss": 1.8308, + "step": 29373000 + }, + { + "epoch": 85.02, + "learning_rate": 7.5031493145609494e-06, + "loss": 1.8135, + "step": 29373500 + }, + { + "epoch": 85.03, + "learning_rate": 7.502427114208967e-06, + "loss": 1.8089, + "step": 29374000 + }, + { + "epoch": 85.03, + "learning_rate": 7.50170346656169e-06, + "loss": 1.7905, + "step": 29374500 + }, + { + "epoch": 85.03, + "learning_rate": 7.500979818914414e-06, + "loss": 1.8199, + "step": 29375000 + }, + { + "epoch": 85.03, + "learning_rate": 7.500256171267137e-06, + "loss": 1.8124, + "step": 29375500 + }, + { + "epoch": 85.03, + "learning_rate": 7.499532523619859e-06, + "loss": 1.8014, + "step": 29376000 + }, + { + "epoch": 85.03, + "learning_rate": 7.498808875972582e-06, + "loss": 1.8236, + "step": 29376500 + }, + { + "epoch": 85.03, + "learning_rate": 7.498085228325306e-06, + "loss": 1.8074, + "step": 29377000 + }, + { + "epoch": 85.04, + "learning_rate": 7.497361580678029e-06, + "loss": 1.7947, + "step": 29377500 + }, + { + "epoch": 85.04, + "learning_rate": 7.496637933030752e-06, + "loss": 1.7856, + "step": 29378000 + }, + { + "epoch": 85.04, + "learning_rate": 7.495914285383476e-06, + "loss": 1.7997, + "step": 29378500 + }, + { + "epoch": 85.04, + "learning_rate": 7.495190637736199e-06, + "loss": 1.7985, + "step": 29379000 + }, + { + "epoch": 85.04, + "learning_rate": 7.494466990088922e-06, + "loss": 1.7922, + "step": 29379500 + }, + { + "epoch": 85.04, + "learning_rate": 7.4937433424416445e-06, + "loss": 1.7872, + "step": 29380000 + }, + { + "epoch": 85.04, + "learning_rate": 7.4930225893849584e-06, + "loss": 1.7991, + "step": 29380500 + }, + { + "epoch": 85.05, + "learning_rate": 7.492300389032976e-06, + "loss": 1.8179, + "step": 29381000 + }, + { + "epoch": 85.05, + "learning_rate": 7.491578188680994e-06, + "loss": 1.7883, + "step": 29381500 + }, + { + "epoch": 85.05, + "learning_rate": 7.490854541033716e-06, + "loss": 1.8012, + "step": 29382000 + }, + { + "epoch": 85.05, + "learning_rate": 7.490130893386439e-06, + "loss": 1.8042, + "step": 29382500 + }, + { + "epoch": 85.05, + "learning_rate": 7.489407245739163e-06, + "loss": 1.831, + "step": 29383000 + }, + { + "epoch": 85.05, + "learning_rate": 7.488683598091886e-06, + "loss": 1.7931, + "step": 29383500 + }, + { + "epoch": 85.05, + "learning_rate": 7.487959950444609e-06, + "loss": 1.817, + "step": 29384000 + }, + { + "epoch": 85.06, + "learning_rate": 7.487236302797333e-06, + "loss": 1.7861, + "step": 29384500 + }, + { + "epoch": 85.06, + "learning_rate": 7.486512655150056e-06, + "loss": 1.805, + "step": 29385000 + }, + { + "epoch": 85.06, + "learning_rate": 7.485789007502779e-06, + "loss": 1.8087, + "step": 29385500 + }, + { + "epoch": 85.06, + "learning_rate": 7.4850668071507965e-06, + "loss": 1.8216, + "step": 29386000 + }, + { + "epoch": 85.06, + "learning_rate": 7.4843431595035205e-06, + "loss": 1.7959, + "step": 29386500 + }, + { + "epoch": 85.06, + "learning_rate": 7.4836195118562435e-06, + "loss": 1.8292, + "step": 29387000 + }, + { + "epoch": 85.06, + "learning_rate": 7.482895864208967e-06, + "loss": 1.8095, + "step": 29387500 + }, + { + "epoch": 85.07, + "learning_rate": 7.482172216561689e-06, + "loss": 1.7998, + "step": 29388000 + }, + { + "epoch": 85.07, + "learning_rate": 7.481448568914414e-06, + "loss": 1.804, + "step": 29388500 + }, + { + "epoch": 85.07, + "learning_rate": 7.480726368562431e-06, + "loss": 1.8325, + "step": 29389000 + }, + { + "epoch": 85.07, + "learning_rate": 7.480002720915154e-06, + "loss": 1.8157, + "step": 29389500 + }, + { + "epoch": 85.07, + "learning_rate": 7.479279073267878e-06, + "loss": 1.8044, + "step": 29390000 + }, + { + "epoch": 85.07, + "learning_rate": 7.478555425620601e-06, + "loss": 1.8099, + "step": 29390500 + }, + { + "epoch": 85.07, + "learning_rate": 7.477831777973324e-06, + "loss": 1.8019, + "step": 29391000 + }, + { + "epoch": 85.08, + "learning_rate": 7.477108130326046e-06, + "loss": 1.8161, + "step": 29391500 + }, + { + "epoch": 85.08, + "learning_rate": 7.476384482678771e-06, + "loss": 1.8199, + "step": 29392000 + }, + { + "epoch": 85.08, + "learning_rate": 7.475660835031493e-06, + "loss": 1.7713, + "step": 29392500 + }, + { + "epoch": 85.08, + "learning_rate": 7.474937187384216e-06, + "loss": 1.7959, + "step": 29393000 + }, + { + "epoch": 85.08, + "learning_rate": 7.474214987032234e-06, + "loss": 1.8143, + "step": 29393500 + }, + { + "epoch": 85.08, + "learning_rate": 7.473494233975546e-06, + "loss": 1.805, + "step": 29394000 + }, + { + "epoch": 85.09, + "learning_rate": 7.472770586328271e-06, + "loss": 1.8213, + "step": 29394500 + }, + { + "epoch": 85.09, + "learning_rate": 7.472046938680993e-06, + "loss": 1.8171, + "step": 29395000 + }, + { + "epoch": 85.09, + "learning_rate": 7.471323291033716e-06, + "loss": 1.8002, + "step": 29395500 + }, + { + "epoch": 85.09, + "learning_rate": 7.47059964338644e-06, + "loss": 1.8093, + "step": 29396000 + }, + { + "epoch": 85.09, + "learning_rate": 7.469875995739163e-06, + "loss": 1.8306, + "step": 29396500 + }, + { + "epoch": 85.09, + "learning_rate": 7.469152348091886e-06, + "loss": 1.7977, + "step": 29397000 + }, + { + "epoch": 85.09, + "learning_rate": 7.468428700444609e-06, + "loss": 1.8182, + "step": 29397500 + }, + { + "epoch": 85.1, + "learning_rate": 7.467705052797333e-06, + "loss": 1.8069, + "step": 29398000 + }, + { + "epoch": 85.1, + "learning_rate": 7.466981405150056e-06, + "loss": 1.827, + "step": 29398500 + }, + { + "epoch": 85.1, + "learning_rate": 7.466257757502778e-06, + "loss": 1.801, + "step": 29399000 + }, + { + "epoch": 85.1, + "learning_rate": 7.465534109855503e-06, + "loss": 1.802, + "step": 29399500 + }, + { + "epoch": 85.1, + "learning_rate": 7.464810462208225e-06, + "loss": 1.7935, + "step": 29400000 + }, + { + "epoch": 85.1, + "learning_rate": 7.4640868145609485e-06, + "loss": 1.8154, + "step": 29400500 + }, + { + "epoch": 85.1, + "learning_rate": 7.463364614208966e-06, + "loss": 1.8111, + "step": 29401000 + }, + { + "epoch": 85.11, + "learning_rate": 7.4626409665616905e-06, + "loss": 1.8172, + "step": 29401500 + }, + { + "epoch": 85.11, + "learning_rate": 7.461917318914413e-06, + "loss": 1.8075, + "step": 29402000 + }, + { + "epoch": 85.11, + "learning_rate": 7.461193671267136e-06, + "loss": 1.8172, + "step": 29402500 + }, + { + "epoch": 85.11, + "learning_rate": 7.460470023619861e-06, + "loss": 1.8161, + "step": 29403000 + }, + { + "epoch": 85.11, + "learning_rate": 7.459746375972583e-06, + "loss": 1.8142, + "step": 29403500 + }, + { + "epoch": 85.11, + "learning_rate": 7.459022728325306e-06, + "loss": 1.8451, + "step": 29404000 + }, + { + "epoch": 85.11, + "learning_rate": 7.458299080678029e-06, + "loss": 1.7921, + "step": 29404500 + }, + { + "epoch": 85.12, + "learning_rate": 7.457576880326048e-06, + "loss": 1.8408, + "step": 29405000 + }, + { + "epoch": 85.12, + "learning_rate": 7.45685323267877e-06, + "loss": 1.7977, + "step": 29405500 + }, + { + "epoch": 85.12, + "learning_rate": 7.456129585031493e-06, + "loss": 1.8178, + "step": 29406000 + }, + { + "epoch": 85.12, + "learning_rate": 7.455405937384216e-06, + "loss": 1.8175, + "step": 29406500 + }, + { + "epoch": 85.12, + "learning_rate": 7.454683737032235e-06, + "loss": 1.8103, + "step": 29407000 + }, + { + "epoch": 85.12, + "learning_rate": 7.4539600893849575e-06, + "loss": 1.8051, + "step": 29407500 + }, + { + "epoch": 85.12, + "learning_rate": 7.453236441737681e-06, + "loss": 1.8154, + "step": 29408000 + }, + { + "epoch": 85.13, + "learning_rate": 7.452512794090404e-06, + "loss": 1.8123, + "step": 29408500 + }, + { + "epoch": 85.13, + "learning_rate": 7.451789146443128e-06, + "loss": 1.8057, + "step": 29409000 + }, + { + "epoch": 85.13, + "learning_rate": 7.45106839338644e-06, + "loss": 1.8153, + "step": 29409500 + }, + { + "epoch": 85.13, + "learning_rate": 7.450344745739163e-06, + "loss": 1.85, + "step": 29410000 + }, + { + "epoch": 85.13, + "learning_rate": 7.449621098091886e-06, + "loss": 1.8069, + "step": 29410500 + }, + { + "epoch": 85.13, + "learning_rate": 7.44889745044461e-06, + "loss": 1.8025, + "step": 29411000 + }, + { + "epoch": 85.13, + "learning_rate": 7.448173802797333e-06, + "loss": 1.7944, + "step": 29411500 + }, + { + "epoch": 85.14, + "learning_rate": 7.447450155150055e-06, + "loss": 1.8368, + "step": 29412000 + }, + { + "epoch": 85.14, + "learning_rate": 7.44672650750278e-06, + "loss": 1.7979, + "step": 29412500 + }, + { + "epoch": 85.14, + "learning_rate": 7.446002859855502e-06, + "loss": 1.8101, + "step": 29413000 + }, + { + "epoch": 85.14, + "learning_rate": 7.44528065950352e-06, + "loss": 1.8154, + "step": 29413500 + }, + { + "epoch": 85.14, + "learning_rate": 7.444557011856243e-06, + "loss": 1.829, + "step": 29414000 + }, + { + "epoch": 85.14, + "learning_rate": 7.443833364208967e-06, + "loss": 1.7983, + "step": 29414500 + }, + { + "epoch": 85.14, + "learning_rate": 7.4431097165616904e-06, + "loss": 1.794, + "step": 29415000 + }, + { + "epoch": 85.15, + "learning_rate": 7.442386068914413e-06, + "loss": 1.8181, + "step": 29415500 + }, + { + "epoch": 85.15, + "learning_rate": 7.441663868562431e-06, + "loss": 1.8119, + "step": 29416000 + }, + { + "epoch": 85.15, + "learning_rate": 7.440940220915155e-06, + "loss": 1.8354, + "step": 29416500 + }, + { + "epoch": 85.15, + "learning_rate": 7.440216573267878e-06, + "loss": 1.8006, + "step": 29417000 + }, + { + "epoch": 85.15, + "learning_rate": 7.4394929256206e-06, + "loss": 1.7893, + "step": 29417500 + }, + { + "epoch": 85.15, + "learning_rate": 7.438770725268618e-06, + "loss": 1.8167, + "step": 29418000 + }, + { + "epoch": 85.15, + "learning_rate": 7.438047077621342e-06, + "loss": 1.809, + "step": 29418500 + }, + { + "epoch": 85.16, + "learning_rate": 7.437324877269359e-06, + "loss": 1.7953, + "step": 29419000 + }, + { + "epoch": 85.16, + "learning_rate": 7.436601229622082e-06, + "loss": 1.8119, + "step": 29419500 + }, + { + "epoch": 85.16, + "learning_rate": 7.4358775819748055e-06, + "loss": 1.8307, + "step": 29420000 + }, + { + "epoch": 85.16, + "learning_rate": 7.435153934327529e-06, + "loss": 1.8, + "step": 29420500 + }, + { + "epoch": 85.16, + "learning_rate": 7.4344302866802525e-06, + "loss": 1.8198, + "step": 29421000 + }, + { + "epoch": 85.16, + "learning_rate": 7.4337066390329755e-06, + "loss": 1.8089, + "step": 29421500 + }, + { + "epoch": 85.16, + "learning_rate": 7.4329829913856995e-06, + "loss": 1.831, + "step": 29422000 + }, + { + "epoch": 85.17, + "learning_rate": 7.4322593437384226e-06, + "loss": 1.8217, + "step": 29422500 + }, + { + "epoch": 85.17, + "learning_rate": 7.431535696091145e-06, + "loss": 1.8175, + "step": 29423000 + }, + { + "epoch": 85.17, + "learning_rate": 7.430812048443868e-06, + "loss": 1.8064, + "step": 29423500 + }, + { + "epoch": 85.17, + "learning_rate": 7.430089848091887e-06, + "loss": 1.8073, + "step": 29424000 + }, + { + "epoch": 85.17, + "learning_rate": 7.42936620044461e-06, + "loss": 1.8103, + "step": 29424500 + }, + { + "epoch": 85.17, + "learning_rate": 7.428642552797332e-06, + "loss": 1.8039, + "step": 29425000 + }, + { + "epoch": 85.17, + "learning_rate": 7.427918905150055e-06, + "loss": 1.7891, + "step": 29425500 + }, + { + "epoch": 85.18, + "learning_rate": 7.427195257502779e-06, + "loss": 1.8317, + "step": 29426000 + }, + { + "epoch": 85.18, + "learning_rate": 7.426471609855502e-06, + "loss": 1.8016, + "step": 29426500 + }, + { + "epoch": 85.18, + "learning_rate": 7.4257494095035195e-06, + "loss": 1.7983, + "step": 29427000 + }, + { + "epoch": 85.18, + "learning_rate": 7.425025761856244e-06, + "loss": 1.8215, + "step": 29427500 + }, + { + "epoch": 85.18, + "learning_rate": 7.424302114208967e-06, + "loss": 1.8157, + "step": 29428000 + }, + { + "epoch": 85.18, + "learning_rate": 7.4235784665616896e-06, + "loss": 1.818, + "step": 29428500 + }, + { + "epoch": 85.18, + "learning_rate": 7.422856266209708e-06, + "loss": 1.7939, + "step": 29429000 + }, + { + "epoch": 85.19, + "learning_rate": 7.4221326185624316e-06, + "loss": 1.818, + "step": 29429500 + }, + { + "epoch": 85.19, + "learning_rate": 7.421410418210449e-06, + "loss": 1.795, + "step": 29430000 + }, + { + "epoch": 85.19, + "learning_rate": 7.420686770563172e-06, + "loss": 1.8453, + "step": 29430500 + }, + { + "epoch": 85.19, + "learning_rate": 7.419963122915895e-06, + "loss": 1.7924, + "step": 29431000 + }, + { + "epoch": 85.19, + "learning_rate": 7.419239475268619e-06, + "loss": 1.8136, + "step": 29431500 + }, + { + "epoch": 85.19, + "learning_rate": 7.418515827621342e-06, + "loss": 1.8025, + "step": 29432000 + }, + { + "epoch": 85.2, + "learning_rate": 7.417792179974064e-06, + "loss": 1.828, + "step": 29432500 + }, + { + "epoch": 85.2, + "learning_rate": 7.417069979622082e-06, + "loss": 1.8178, + "step": 29433000 + }, + { + "epoch": 85.2, + "learning_rate": 7.416346331974806e-06, + "loss": 1.7906, + "step": 29433500 + }, + { + "epoch": 85.2, + "learning_rate": 7.415622684327529e-06, + "loss": 1.8221, + "step": 29434000 + }, + { + "epoch": 85.2, + "learning_rate": 7.414899036680252e-06, + "loss": 1.8277, + "step": 29434500 + }, + { + "epoch": 85.2, + "learning_rate": 7.414175389032975e-06, + "loss": 1.83, + "step": 29435000 + }, + { + "epoch": 85.2, + "learning_rate": 7.413451741385699e-06, + "loss": 1.7964, + "step": 29435500 + }, + { + "epoch": 85.21, + "learning_rate": 7.412728093738422e-06, + "loss": 1.817, + "step": 29436000 + }, + { + "epoch": 85.21, + "learning_rate": 7.412004446091145e-06, + "loss": 1.8139, + "step": 29436500 + }, + { + "epoch": 85.21, + "learning_rate": 7.411280798443869e-06, + "loss": 1.8222, + "step": 29437000 + }, + { + "epoch": 85.21, + "learning_rate": 7.410557150796592e-06, + "loss": 1.8024, + "step": 29437500 + }, + { + "epoch": 85.21, + "learning_rate": 7.409833503149315e-06, + "loss": 1.8135, + "step": 29438000 + }, + { + "epoch": 85.21, + "learning_rate": 7.409109855502037e-06, + "loss": 1.7896, + "step": 29438500 + }, + { + "epoch": 85.21, + "learning_rate": 7.408386207854762e-06, + "loss": 1.8223, + "step": 29439000 + }, + { + "epoch": 85.22, + "learning_rate": 7.407666902093368e-06, + "loss": 1.8089, + "step": 29439500 + }, + { + "epoch": 85.22, + "learning_rate": 7.406943254446091e-06, + "loss": 1.8215, + "step": 29440000 + }, + { + "epoch": 85.22, + "learning_rate": 7.4062196067988144e-06, + "loss": 1.8203, + "step": 29440500 + }, + { + "epoch": 85.22, + "learning_rate": 7.405495959151538e-06, + "loss": 1.809, + "step": 29441000 + }, + { + "epoch": 85.22, + "learning_rate": 7.4047723115042614e-06, + "loss": 1.8145, + "step": 29441500 + }, + { + "epoch": 85.22, + "learning_rate": 7.4040486638569845e-06, + "loss": 1.8107, + "step": 29442000 + }, + { + "epoch": 85.22, + "learning_rate": 7.403325016209707e-06, + "loss": 1.8143, + "step": 29442500 + }, + { + "epoch": 85.23, + "learning_rate": 7.4026013685624315e-06, + "loss": 1.7909, + "step": 29443000 + }, + { + "epoch": 85.23, + "learning_rate": 7.401877720915154e-06, + "loss": 1.8128, + "step": 29443500 + }, + { + "epoch": 85.23, + "learning_rate": 7.401155520563172e-06, + "loss": 1.8394, + "step": 29444000 + }, + { + "epoch": 85.23, + "learning_rate": 7.400433320211189e-06, + "loss": 1.8011, + "step": 29444500 + }, + { + "epoch": 85.23, + "learning_rate": 7.399709672563913e-06, + "loss": 1.8345, + "step": 29445000 + }, + { + "epoch": 85.23, + "learning_rate": 7.398986024916636e-06, + "loss": 1.8197, + "step": 29445500 + }, + { + "epoch": 85.23, + "learning_rate": 7.398262377269359e-06, + "loss": 1.8072, + "step": 29446000 + }, + { + "epoch": 85.24, + "learning_rate": 7.397538729622083e-06, + "loss": 1.7898, + "step": 29446500 + }, + { + "epoch": 85.24, + "learning_rate": 7.396815081974806e-06, + "loss": 1.8047, + "step": 29447000 + }, + { + "epoch": 85.24, + "learning_rate": 7.396091434327529e-06, + "loss": 1.7934, + "step": 29447500 + }, + { + "epoch": 85.24, + "learning_rate": 7.3953677866802515e-06, + "loss": 1.8257, + "step": 29448000 + }, + { + "epoch": 85.24, + "learning_rate": 7.394644139032976e-06, + "loss": 1.808, + "step": 29448500 + }, + { + "epoch": 85.24, + "learning_rate": 7.3939219386809935e-06, + "loss": 1.8222, + "step": 29449000 + }, + { + "epoch": 85.24, + "learning_rate": 7.393199738329011e-06, + "loss": 1.82, + "step": 29449500 + }, + { + "epoch": 85.25, + "learning_rate": 7.392476090681734e-06, + "loss": 1.815, + "step": 29450000 + }, + { + "epoch": 85.25, + "learning_rate": 7.391752443034458e-06, + "loss": 1.8292, + "step": 29450500 + }, + { + "epoch": 85.25, + "learning_rate": 7.391028795387181e-06, + "loss": 1.823, + "step": 29451000 + }, + { + "epoch": 85.25, + "learning_rate": 7.390305147739904e-06, + "loss": 1.809, + "step": 29451500 + }, + { + "epoch": 85.25, + "learning_rate": 7.389581500092627e-06, + "loss": 1.8231, + "step": 29452000 + }, + { + "epoch": 85.25, + "learning_rate": 7.388857852445351e-06, + "loss": 1.812, + "step": 29452500 + }, + { + "epoch": 85.25, + "learning_rate": 7.388134204798074e-06, + "loss": 1.8117, + "step": 29453000 + }, + { + "epoch": 85.26, + "learning_rate": 7.387412004446091e-06, + "loss": 1.8214, + "step": 29453500 + }, + { + "epoch": 85.26, + "learning_rate": 7.386688356798814e-06, + "loss": 1.8085, + "step": 29454000 + }, + { + "epoch": 85.26, + "learning_rate": 7.385964709151538e-06, + "loss": 1.8439, + "step": 29454500 + }, + { + "epoch": 85.26, + "learning_rate": 7.385241061504261e-06, + "loss": 1.8117, + "step": 29455000 + }, + { + "epoch": 85.26, + "learning_rate": 7.384517413856984e-06, + "loss": 1.7961, + "step": 29455500 + }, + { + "epoch": 85.26, + "learning_rate": 7.383793766209708e-06, + "loss": 1.8002, + "step": 29456000 + }, + { + "epoch": 85.26, + "learning_rate": 7.383070118562431e-06, + "loss": 1.805, + "step": 29456500 + }, + { + "epoch": 85.27, + "learning_rate": 7.382346470915154e-06, + "loss": 1.8211, + "step": 29457000 + }, + { + "epoch": 85.27, + "learning_rate": 7.381624270563171e-06, + "loss": 1.8387, + "step": 29457500 + }, + { + "epoch": 85.27, + "learning_rate": 7.380900622915896e-06, + "loss": 1.7936, + "step": 29458000 + }, + { + "epoch": 85.27, + "learning_rate": 7.380176975268619e-06, + "loss": 1.8544, + "step": 29458500 + }, + { + "epoch": 85.27, + "learning_rate": 7.379453327621341e-06, + "loss": 1.8093, + "step": 29459000 + }, + { + "epoch": 85.27, + "learning_rate": 7.378729679974066e-06, + "loss": 1.7719, + "step": 29459500 + }, + { + "epoch": 85.27, + "learning_rate": 7.378007479622083e-06, + "loss": 1.8185, + "step": 29460000 + }, + { + "epoch": 85.28, + "learning_rate": 7.377283831974806e-06, + "loss": 1.8164, + "step": 29460500 + }, + { + "epoch": 85.28, + "learning_rate": 7.376561631622823e-06, + "loss": 1.7956, + "step": 29461000 + }, + { + "epoch": 85.28, + "learning_rate": 7.3758379839755465e-06, + "loss": 1.8328, + "step": 29461500 + }, + { + "epoch": 85.28, + "learning_rate": 7.37511433632827e-06, + "loss": 1.7834, + "step": 29462000 + }, + { + "epoch": 85.28, + "learning_rate": 7.3743906886809935e-06, + "loss": 1.8093, + "step": 29462500 + }, + { + "epoch": 85.28, + "learning_rate": 7.373667041033716e-06, + "loss": 1.8159, + "step": 29463000 + }, + { + "epoch": 85.28, + "learning_rate": 7.3729433933864405e-06, + "loss": 1.8107, + "step": 29463500 + }, + { + "epoch": 85.29, + "learning_rate": 7.372219745739163e-06, + "loss": 1.8166, + "step": 29464000 + }, + { + "epoch": 85.29, + "learning_rate": 7.371496098091886e-06, + "loss": 1.8245, + "step": 29464500 + }, + { + "epoch": 85.29, + "learning_rate": 7.370772450444609e-06, + "loss": 1.8027, + "step": 29465000 + }, + { + "epoch": 85.29, + "learning_rate": 7.370048802797333e-06, + "loss": 1.8003, + "step": 29465500 + }, + { + "epoch": 85.29, + "learning_rate": 7.369326602445351e-06, + "loss": 1.8233, + "step": 29466000 + }, + { + "epoch": 85.29, + "learning_rate": 7.368602954798073e-06, + "loss": 1.8282, + "step": 29466500 + }, + { + "epoch": 85.29, + "learning_rate": 7.367879307150798e-06, + "loss": 1.8009, + "step": 29467000 + }, + { + "epoch": 85.3, + "learning_rate": 7.36715565950352e-06, + "loss": 1.8141, + "step": 29467500 + }, + { + "epoch": 85.3, + "learning_rate": 7.366432011856243e-06, + "loss": 1.8042, + "step": 29468000 + }, + { + "epoch": 85.3, + "learning_rate": 7.3657098115042605e-06, + "loss": 1.8368, + "step": 29468500 + }, + { + "epoch": 85.3, + "learning_rate": 7.364986163856985e-06, + "loss": 1.8155, + "step": 29469000 + }, + { + "epoch": 85.3, + "learning_rate": 7.3642625162097075e-06, + "loss": 1.7819, + "step": 29469500 + }, + { + "epoch": 85.3, + "learning_rate": 7.3635388685624306e-06, + "loss": 1.8412, + "step": 29470000 + }, + { + "epoch": 85.31, + "learning_rate": 7.362815220915154e-06, + "loss": 1.8094, + "step": 29470500 + }, + { + "epoch": 85.31, + "learning_rate": 7.362091573267878e-06, + "loss": 1.7764, + "step": 29471000 + }, + { + "epoch": 85.31, + "learning_rate": 7.361367925620601e-06, + "loss": 1.8049, + "step": 29471500 + }, + { + "epoch": 85.31, + "learning_rate": 7.360644277973324e-06, + "loss": 1.8087, + "step": 29472000 + }, + { + "epoch": 85.31, + "learning_rate": 7.359920630326048e-06, + "loss": 1.8234, + "step": 29472500 + }, + { + "epoch": 85.31, + "learning_rate": 7.359198429974065e-06, + "loss": 1.8154, + "step": 29473000 + }, + { + "epoch": 85.31, + "learning_rate": 7.358474782326788e-06, + "loss": 1.8275, + "step": 29473500 + }, + { + "epoch": 85.32, + "learning_rate": 7.357751134679511e-06, + "loss": 1.8046, + "step": 29474000 + }, + { + "epoch": 85.32, + "learning_rate": 7.357027487032235e-06, + "loss": 1.7998, + "step": 29474500 + }, + { + "epoch": 85.32, + "learning_rate": 7.356303839384958e-06, + "loss": 1.8173, + "step": 29475000 + }, + { + "epoch": 85.32, + "learning_rate": 7.355581639032975e-06, + "loss": 1.839, + "step": 29475500 + }, + { + "epoch": 85.32, + "learning_rate": 7.354859438680993e-06, + "loss": 1.8025, + "step": 29476000 + }, + { + "epoch": 85.32, + "learning_rate": 7.354135791033717e-06, + "loss": 1.8103, + "step": 29476500 + }, + { + "epoch": 85.32, + "learning_rate": 7.3534121433864404e-06, + "loss": 1.8313, + "step": 29477000 + }, + { + "epoch": 85.33, + "learning_rate": 7.352688495739163e-06, + "loss": 1.8168, + "step": 29477500 + }, + { + "epoch": 85.33, + "learning_rate": 7.351964848091886e-06, + "loss": 1.811, + "step": 29478000 + }, + { + "epoch": 85.33, + "learning_rate": 7.35124120044461e-06, + "loss": 1.7918, + "step": 29478500 + }, + { + "epoch": 85.33, + "learning_rate": 7.350517552797333e-06, + "loss": 1.8032, + "step": 29479000 + }, + { + "epoch": 85.33, + "learning_rate": 7.349793905150056e-06, + "loss": 1.8505, + "step": 29479500 + }, + { + "epoch": 85.33, + "learning_rate": 7.34907025750278e-06, + "loss": 1.7942, + "step": 29480000 + }, + { + "epoch": 85.33, + "learning_rate": 7.348346609855503e-06, + "loss": 1.8179, + "step": 29480500 + }, + { + "epoch": 85.34, + "learning_rate": 7.34762440950352e-06, + "loss": 1.8134, + "step": 29481000 + }, + { + "epoch": 85.34, + "learning_rate": 7.346900761856243e-06, + "loss": 1.7972, + "step": 29481500 + }, + { + "epoch": 85.34, + "learning_rate": 7.3461785615042604e-06, + "loss": 1.8265, + "step": 29482000 + }, + { + "epoch": 85.34, + "learning_rate": 7.345456361152279e-06, + "loss": 1.8336, + "step": 29482500 + }, + { + "epoch": 85.34, + "learning_rate": 7.3447327135050025e-06, + "loss": 1.8228, + "step": 29483000 + }, + { + "epoch": 85.34, + "learning_rate": 7.3440090658577255e-06, + "loss": 1.8014, + "step": 29483500 + }, + { + "epoch": 85.34, + "learning_rate": 7.3432854182104495e-06, + "loss": 1.7873, + "step": 29484000 + }, + { + "epoch": 85.35, + "learning_rate": 7.3425617705631725e-06, + "loss": 1.8224, + "step": 29484500 + }, + { + "epoch": 85.35, + "learning_rate": 7.341838122915895e-06, + "loss": 1.8172, + "step": 29485000 + }, + { + "epoch": 85.35, + "learning_rate": 7.341114475268618e-06, + "loss": 1.8174, + "step": 29485500 + }, + { + "epoch": 85.35, + "learning_rate": 7.340390827621342e-06, + "loss": 1.8329, + "step": 29486000 + }, + { + "epoch": 85.35, + "learning_rate": 7.339667179974065e-06, + "loss": 1.8069, + "step": 29486500 + }, + { + "epoch": 85.35, + "learning_rate": 7.338943532326788e-06, + "loss": 1.7879, + "step": 29487000 + }, + { + "epoch": 85.35, + "learning_rate": 7.338219884679512e-06, + "loss": 1.8339, + "step": 29487500 + }, + { + "epoch": 85.36, + "learning_rate": 7.337496237032235e-06, + "loss": 1.7967, + "step": 29488000 + }, + { + "epoch": 85.36, + "learning_rate": 7.336774036680252e-06, + "loss": 1.7989, + "step": 29488500 + }, + { + "epoch": 85.36, + "learning_rate": 7.336050389032975e-06, + "loss": 1.8246, + "step": 29489000 + }, + { + "epoch": 85.36, + "learning_rate": 7.335326741385699e-06, + "loss": 1.8039, + "step": 29489500 + }, + { + "epoch": 85.36, + "learning_rate": 7.334603093738422e-06, + "loss": 1.8219, + "step": 29490000 + }, + { + "epoch": 85.36, + "learning_rate": 7.3338808933864395e-06, + "loss": 1.8139, + "step": 29490500 + }, + { + "epoch": 85.36, + "learning_rate": 7.333157245739163e-06, + "loss": 1.8107, + "step": 29491000 + }, + { + "epoch": 85.37, + "learning_rate": 7.3324335980918866e-06, + "loss": 1.8152, + "step": 29491500 + }, + { + "epoch": 85.37, + "learning_rate": 7.33170995044461e-06, + "loss": 1.8087, + "step": 29492000 + }, + { + "epoch": 85.37, + "learning_rate": 7.330986302797333e-06, + "loss": 1.8078, + "step": 29492500 + }, + { + "epoch": 85.37, + "learning_rate": 7.33026410244535e-06, + "loss": 1.8262, + "step": 29493000 + }, + { + "epoch": 85.37, + "learning_rate": 7.329540454798074e-06, + "loss": 1.8242, + "step": 29493500 + }, + { + "epoch": 85.37, + "learning_rate": 7.328816807150797e-06, + "loss": 1.8116, + "step": 29494000 + }, + { + "epoch": 85.37, + "learning_rate": 7.32809315950352e-06, + "loss": 1.7742, + "step": 29494500 + }, + { + "epoch": 85.38, + "learning_rate": 7.327370959151537e-06, + "loss": 1.8185, + "step": 29495000 + }, + { + "epoch": 85.38, + "learning_rate": 7.326647311504261e-06, + "loss": 1.8181, + "step": 29495500 + }, + { + "epoch": 85.38, + "learning_rate": 7.325923663856984e-06, + "loss": 1.8083, + "step": 29496000 + }, + { + "epoch": 85.38, + "learning_rate": 7.325200016209707e-06, + "loss": 1.8335, + "step": 29496500 + }, + { + "epoch": 85.38, + "learning_rate": 7.324476368562431e-06, + "loss": 1.8224, + "step": 29497000 + }, + { + "epoch": 85.38, + "learning_rate": 7.323752720915154e-06, + "loss": 1.8385, + "step": 29497500 + }, + { + "epoch": 85.38, + "learning_rate": 7.323030520563172e-06, + "loss": 1.8061, + "step": 29498000 + }, + { + "epoch": 85.39, + "learning_rate": 7.322306872915895e-06, + "loss": 1.8145, + "step": 29498500 + }, + { + "epoch": 85.39, + "learning_rate": 7.321583225268619e-06, + "loss": 1.8325, + "step": 29499000 + }, + { + "epoch": 85.39, + "learning_rate": 7.320859577621342e-06, + "loss": 1.8178, + "step": 29499500 + }, + { + "epoch": 85.39, + "learning_rate": 7.320137377269359e-06, + "loss": 1.809, + "step": 29500000 + }, + { + "epoch": 85.39, + "learning_rate": 7.319413729622082e-06, + "loss": 1.796, + "step": 29500500 + }, + { + "epoch": 85.39, + "learning_rate": 7.318691529270099e-06, + "loss": 1.8261, + "step": 29501000 + }, + { + "epoch": 85.39, + "learning_rate": 7.317967881622824e-06, + "loss": 1.8323, + "step": 29501500 + }, + { + "epoch": 85.4, + "learning_rate": 7.317244233975547e-06, + "loss": 1.8177, + "step": 29502000 + }, + { + "epoch": 85.4, + "learning_rate": 7.316520586328269e-06, + "loss": 1.7953, + "step": 29502500 + }, + { + "epoch": 85.4, + "learning_rate": 7.315796938680994e-06, + "loss": 1.8202, + "step": 29503000 + }, + { + "epoch": 85.4, + "learning_rate": 7.315073291033716e-06, + "loss": 1.8476, + "step": 29503500 + }, + { + "epoch": 85.4, + "learning_rate": 7.3143496433864395e-06, + "loss": 1.8035, + "step": 29504000 + }, + { + "epoch": 85.4, + "learning_rate": 7.313627443034457e-06, + "loss": 1.8288, + "step": 29504500 + }, + { + "epoch": 85.4, + "learning_rate": 7.3129037953871815e-06, + "loss": 1.8022, + "step": 29505000 + }, + { + "epoch": 85.41, + "learning_rate": 7.312180147739904e-06, + "loss": 1.8193, + "step": 29505500 + }, + { + "epoch": 85.41, + "learning_rate": 7.311456500092627e-06, + "loss": 1.8123, + "step": 29506000 + }, + { + "epoch": 85.41, + "learning_rate": 7.310732852445351e-06, + "loss": 1.8232, + "step": 29506500 + }, + { + "epoch": 85.41, + "learning_rate": 7.310009204798074e-06, + "loss": 1.8324, + "step": 29507000 + }, + { + "epoch": 85.41, + "learning_rate": 7.309285557150797e-06, + "loss": 1.8387, + "step": 29507500 + }, + { + "epoch": 85.41, + "learning_rate": 7.30856190950352e-06, + "loss": 1.7981, + "step": 29508000 + }, + { + "epoch": 85.42, + "learning_rate": 7.307838261856244e-06, + "loss": 1.8019, + "step": 29508500 + }, + { + "epoch": 85.42, + "learning_rate": 7.307114614208967e-06, + "loss": 1.822, + "step": 29509000 + }, + { + "epoch": 85.42, + "learning_rate": 7.306392413856984e-06, + "loss": 1.8114, + "step": 29509500 + }, + { + "epoch": 85.42, + "learning_rate": 7.305668766209707e-06, + "loss": 1.8218, + "step": 29510000 + }, + { + "epoch": 85.42, + "learning_rate": 7.304945118562431e-06, + "loss": 1.8075, + "step": 29510500 + }, + { + "epoch": 85.42, + "learning_rate": 7.304221470915154e-06, + "loss": 1.8095, + "step": 29511000 + }, + { + "epoch": 85.42, + "learning_rate": 7.303499270563172e-06, + "loss": 1.8068, + "step": 29511500 + }, + { + "epoch": 85.43, + "learning_rate": 7.302775622915895e-06, + "loss": 1.7787, + "step": 29512000 + }, + { + "epoch": 85.43, + "learning_rate": 7.302051975268619e-06, + "loss": 1.8149, + "step": 29512500 + }, + { + "epoch": 85.43, + "learning_rate": 7.301328327621342e-06, + "loss": 1.8022, + "step": 29513000 + }, + { + "epoch": 85.43, + "learning_rate": 7.300604679974064e-06, + "loss": 1.8113, + "step": 29513500 + }, + { + "epoch": 85.43, + "learning_rate": 7.299881032326789e-06, + "loss": 1.806, + "step": 29514000 + }, + { + "epoch": 85.43, + "learning_rate": 7.299157384679512e-06, + "loss": 1.795, + "step": 29514500 + }, + { + "epoch": 85.43, + "learning_rate": 7.298433737032234e-06, + "loss": 1.8412, + "step": 29515000 + }, + { + "epoch": 85.44, + "learning_rate": 7.297711536680252e-06, + "loss": 1.8284, + "step": 29515500 + }, + { + "epoch": 85.44, + "learning_rate": 7.296987889032976e-06, + "loss": 1.8341, + "step": 29516000 + }, + { + "epoch": 85.44, + "learning_rate": 7.296264241385699e-06, + "loss": 1.8261, + "step": 29516500 + }, + { + "epoch": 85.44, + "learning_rate": 7.295540593738421e-06, + "loss": 1.8122, + "step": 29517000 + }, + { + "epoch": 85.44, + "learning_rate": 7.294816946091146e-06, + "loss": 1.7986, + "step": 29517500 + }, + { + "epoch": 85.44, + "learning_rate": 7.294094745739163e-06, + "loss": 1.7994, + "step": 29518000 + }, + { + "epoch": 85.44, + "learning_rate": 7.2933710980918865e-06, + "loss": 1.8206, + "step": 29518500 + }, + { + "epoch": 85.45, + "learning_rate": 7.292647450444609e-06, + "loss": 1.8209, + "step": 29519000 + }, + { + "epoch": 85.45, + "learning_rate": 7.291925250092627e-06, + "loss": 1.8279, + "step": 29519500 + }, + { + "epoch": 85.45, + "learning_rate": 7.291201602445351e-06, + "loss": 1.8047, + "step": 29520000 + }, + { + "epoch": 85.45, + "learning_rate": 7.290480849388663e-06, + "loss": 1.822, + "step": 29520500 + }, + { + "epoch": 85.45, + "learning_rate": 7.289757201741386e-06, + "loss": 1.8241, + "step": 29521000 + }, + { + "epoch": 85.45, + "learning_rate": 7.289033554094109e-06, + "loss": 1.8201, + "step": 29521500 + }, + { + "epoch": 85.45, + "learning_rate": 7.288309906446833e-06, + "loss": 1.8068, + "step": 29522000 + }, + { + "epoch": 85.46, + "learning_rate": 7.287586258799556e-06, + "loss": 1.8042, + "step": 29522500 + }, + { + "epoch": 85.46, + "learning_rate": 7.286862611152278e-06, + "loss": 1.807, + "step": 29523000 + }, + { + "epoch": 85.46, + "learning_rate": 7.286138963505003e-06, + "loss": 1.818, + "step": 29523500 + }, + { + "epoch": 85.46, + "learning_rate": 7.285415315857725e-06, + "loss": 1.808, + "step": 29524000 + }, + { + "epoch": 85.46, + "learning_rate": 7.2846931155057435e-06, + "loss": 1.8425, + "step": 29524500 + }, + { + "epoch": 85.46, + "learning_rate": 7.283969467858466e-06, + "loss": 1.8036, + "step": 29525000 + }, + { + "epoch": 85.46, + "learning_rate": 7.2832458202111905e-06, + "loss": 1.7906, + "step": 29525500 + }, + { + "epoch": 85.47, + "learning_rate": 7.282522172563913e-06, + "loss": 1.835, + "step": 29526000 + }, + { + "epoch": 85.47, + "learning_rate": 7.281798524916636e-06, + "loss": 1.7935, + "step": 29526500 + }, + { + "epoch": 85.47, + "learning_rate": 7.281076324564654e-06, + "loss": 1.8343, + "step": 29527000 + }, + { + "epoch": 85.47, + "learning_rate": 7.280352676917378e-06, + "loss": 1.8296, + "step": 29527500 + }, + { + "epoch": 85.47, + "learning_rate": 7.279629029270101e-06, + "loss": 1.8518, + "step": 29528000 + }, + { + "epoch": 85.47, + "learning_rate": 7.278905381622823e-06, + "loss": 1.8182, + "step": 29528500 + }, + { + "epoch": 85.47, + "learning_rate": 7.278181733975546e-06, + "loss": 1.8231, + "step": 29529000 + }, + { + "epoch": 85.48, + "learning_rate": 7.277459533623565e-06, + "loss": 1.7998, + "step": 29529500 + }, + { + "epoch": 85.48, + "learning_rate": 7.276735885976288e-06, + "loss": 1.7942, + "step": 29530000 + }, + { + "epoch": 85.48, + "learning_rate": 7.2760122383290105e-06, + "loss": 1.8349, + "step": 29530500 + }, + { + "epoch": 85.48, + "learning_rate": 7.275288590681735e-06, + "loss": 1.8076, + "step": 29531000 + }, + { + "epoch": 85.48, + "learning_rate": 7.2745649430344575e-06, + "loss": 1.7918, + "step": 29531500 + }, + { + "epoch": 85.48, + "learning_rate": 7.2738412953871806e-06, + "loss": 1.8411, + "step": 29532000 + }, + { + "epoch": 85.48, + "learning_rate": 7.273117647739904e-06, + "loss": 1.8253, + "step": 29532500 + }, + { + "epoch": 85.49, + "learning_rate": 7.272394000092628e-06, + "loss": 1.8548, + "step": 29533000 + }, + { + "epoch": 85.49, + "learning_rate": 7.271671799740646e-06, + "loss": 1.833, + "step": 29533500 + }, + { + "epoch": 85.49, + "learning_rate": 7.270948152093368e-06, + "loss": 1.8118, + "step": 29534000 + }, + { + "epoch": 85.49, + "learning_rate": 7.270224504446091e-06, + "loss": 1.8082, + "step": 29534500 + }, + { + "epoch": 85.49, + "learning_rate": 7.269500856798815e-06, + "loss": 1.8259, + "step": 29535000 + }, + { + "epoch": 85.49, + "learning_rate": 7.268777209151538e-06, + "loss": 1.8024, + "step": 29535500 + }, + { + "epoch": 85.49, + "learning_rate": 7.268053561504261e-06, + "loss": 1.82, + "step": 29536000 + }, + { + "epoch": 85.5, + "learning_rate": 7.267329913856985e-06, + "loss": 1.8318, + "step": 29536500 + }, + { + "epoch": 85.5, + "learning_rate": 7.266607713505002e-06, + "loss": 1.8075, + "step": 29537000 + }, + { + "epoch": 85.5, + "learning_rate": 7.265884065857725e-06, + "loss": 1.8049, + "step": 29537500 + }, + { + "epoch": 85.5, + "learning_rate": 7.265160418210448e-06, + "loss": 1.839, + "step": 29538000 + }, + { + "epoch": 85.5, + "learning_rate": 7.264436770563172e-06, + "loss": 1.8072, + "step": 29538500 + }, + { + "epoch": 85.5, + "learning_rate": 7.263713122915895e-06, + "loss": 1.8111, + "step": 29539000 + }, + { + "epoch": 85.5, + "learning_rate": 7.2629894752686185e-06, + "loss": 1.843, + "step": 29539500 + }, + { + "epoch": 85.51, + "learning_rate": 7.262265827621341e-06, + "loss": 1.8209, + "step": 29540000 + }, + { + "epoch": 85.51, + "learning_rate": 7.2615421799740655e-06, + "loss": 1.8067, + "step": 29540500 + }, + { + "epoch": 85.51, + "learning_rate": 7.260819979622083e-06, + "loss": 1.86, + "step": 29541000 + }, + { + "epoch": 85.51, + "learning_rate": 7.260096331974806e-06, + "loss": 1.8124, + "step": 29541500 + }, + { + "epoch": 85.51, + "learning_rate": 7.259372684327528e-06, + "loss": 1.8304, + "step": 29542000 + }, + { + "epoch": 85.51, + "learning_rate": 7.258649036680253e-06, + "loss": 1.8042, + "step": 29542500 + }, + { + "epoch": 85.51, + "learning_rate": 7.257925389032975e-06, + "loss": 1.8072, + "step": 29543000 + }, + { + "epoch": 85.52, + "learning_rate": 7.257201741385698e-06, + "loss": 1.7948, + "step": 29543500 + }, + { + "epoch": 85.52, + "learning_rate": 7.256478093738422e-06, + "loss": 1.7957, + "step": 29544000 + }, + { + "epoch": 85.52, + "learning_rate": 7.255754446091145e-06, + "loss": 1.81, + "step": 29544500 + }, + { + "epoch": 85.52, + "learning_rate": 7.255032245739163e-06, + "loss": 1.8174, + "step": 29545000 + }, + { + "epoch": 85.52, + "learning_rate": 7.2543085980918855e-06, + "loss": 1.8252, + "step": 29545500 + }, + { + "epoch": 85.52, + "learning_rate": 7.25358495044461e-06, + "loss": 1.7982, + "step": 29546000 + }, + { + "epoch": 85.53, + "learning_rate": 7.2528613027973325e-06, + "loss": 1.8269, + "step": 29546500 + }, + { + "epoch": 85.53, + "learning_rate": 7.252137655150056e-06, + "loss": 1.8092, + "step": 29547000 + }, + { + "epoch": 85.53, + "learning_rate": 7.2514140075027795e-06, + "loss": 1.8291, + "step": 29547500 + }, + { + "epoch": 85.53, + "learning_rate": 7.250691807150798e-06, + "loss": 1.8082, + "step": 29548000 + }, + { + "epoch": 85.53, + "learning_rate": 7.24996815950352e-06, + "loss": 1.8201, + "step": 29548500 + }, + { + "epoch": 85.53, + "learning_rate": 7.249244511856243e-06, + "loss": 1.8044, + "step": 29549000 + }, + { + "epoch": 85.53, + "learning_rate": 7.248520864208967e-06, + "loss": 1.8375, + "step": 29549500 + }, + { + "epoch": 85.54, + "learning_rate": 7.24779721656169e-06, + "loss": 1.8352, + "step": 29550000 + }, + { + "epoch": 85.54, + "learning_rate": 7.247076463505002e-06, + "loss": 1.8121, + "step": 29550500 + }, + { + "epoch": 85.54, + "learning_rate": 7.246352815857725e-06, + "loss": 1.8492, + "step": 29551000 + }, + { + "epoch": 85.54, + "learning_rate": 7.245629168210449e-06, + "loss": 1.798, + "step": 29551500 + }, + { + "epoch": 85.54, + "learning_rate": 7.244906967858467e-06, + "loss": 1.806, + "step": 29552000 + }, + { + "epoch": 85.54, + "learning_rate": 7.2441833202111895e-06, + "loss": 1.7815, + "step": 29552500 + }, + { + "epoch": 85.54, + "learning_rate": 7.243459672563913e-06, + "loss": 1.821, + "step": 29553000 + }, + { + "epoch": 85.55, + "learning_rate": 7.2427360249166365e-06, + "loss": 1.8158, + "step": 29553500 + }, + { + "epoch": 85.55, + "learning_rate": 7.24201237726936e-06, + "loss": 1.8058, + "step": 29554000 + }, + { + "epoch": 85.55, + "learning_rate": 7.241288729622083e-06, + "loss": 1.8249, + "step": 29554500 + }, + { + "epoch": 85.55, + "learning_rate": 7.240565081974805e-06, + "loss": 1.8154, + "step": 29555000 + }, + { + "epoch": 85.55, + "learning_rate": 7.23984143432753e-06, + "loss": 1.8132, + "step": 29555500 + }, + { + "epoch": 85.55, + "learning_rate": 7.239117786680252e-06, + "loss": 1.8276, + "step": 29556000 + }, + { + "epoch": 85.55, + "learning_rate": 7.238394139032975e-06, + "loss": 1.8171, + "step": 29556500 + }, + { + "epoch": 85.56, + "learning_rate": 7.237670491385699e-06, + "loss": 1.804, + "step": 29557000 + }, + { + "epoch": 85.56, + "learning_rate": 7.236946843738422e-06, + "loss": 1.8301, + "step": 29557500 + }, + { + "epoch": 85.56, + "learning_rate": 7.236223196091145e-06, + "loss": 1.7991, + "step": 29558000 + }, + { + "epoch": 85.56, + "learning_rate": 7.235499548443868e-06, + "loss": 1.8128, + "step": 29558500 + }, + { + "epoch": 85.56, + "learning_rate": 7.234777348091887e-06, + "loss": 1.7934, + "step": 29559000 + }, + { + "epoch": 85.56, + "learning_rate": 7.234053700444609e-06, + "loss": 1.7979, + "step": 29559500 + }, + { + "epoch": 85.56, + "learning_rate": 7.2333300527973325e-06, + "loss": 1.8125, + "step": 29560000 + }, + { + "epoch": 85.57, + "learning_rate": 7.2326064051500555e-06, + "loss": 1.8544, + "step": 29560500 + }, + { + "epoch": 85.57, + "learning_rate": 7.2318842047980745e-06, + "loss": 1.8219, + "step": 29561000 + }, + { + "epoch": 85.57, + "learning_rate": 7.231160557150797e-06, + "loss": 1.8144, + "step": 29561500 + }, + { + "epoch": 85.57, + "learning_rate": 7.23043690950352e-06, + "loss": 1.8203, + "step": 29562000 + }, + { + "epoch": 85.57, + "learning_rate": 7.229713261856244e-06, + "loss": 1.8189, + "step": 29562500 + }, + { + "epoch": 85.57, + "learning_rate": 7.228989614208967e-06, + "loss": 1.8041, + "step": 29563000 + }, + { + "epoch": 85.57, + "learning_rate": 7.22826596656169e-06, + "loss": 1.8104, + "step": 29563500 + }, + { + "epoch": 85.58, + "learning_rate": 7.227543766209707e-06, + "loss": 1.7978, + "step": 29564000 + }, + { + "epoch": 85.58, + "learning_rate": 7.226820118562432e-06, + "loss": 1.8047, + "step": 29564500 + }, + { + "epoch": 85.58, + "learning_rate": 7.226096470915154e-06, + "loss": 1.8078, + "step": 29565000 + }, + { + "epoch": 85.58, + "learning_rate": 7.225374270563172e-06, + "loss": 1.8322, + "step": 29565500 + }, + { + "epoch": 85.58, + "learning_rate": 7.2246506229158945e-06, + "loss": 1.805, + "step": 29566000 + }, + { + "epoch": 85.58, + "learning_rate": 7.223926975268619e-06, + "loss": 1.817, + "step": 29566500 + }, + { + "epoch": 85.58, + "learning_rate": 7.2232033276213415e-06, + "loss": 1.8272, + "step": 29567000 + }, + { + "epoch": 85.59, + "learning_rate": 7.2224796799740646e-06, + "loss": 1.8039, + "step": 29567500 + }, + { + "epoch": 85.59, + "learning_rate": 7.221757479622082e-06, + "loss": 1.7826, + "step": 29568000 + }, + { + "epoch": 85.59, + "learning_rate": 7.221033831974807e-06, + "loss": 1.8137, + "step": 29568500 + }, + { + "epoch": 85.59, + "learning_rate": 7.220310184327529e-06, + "loss": 1.8121, + "step": 29569000 + }, + { + "epoch": 85.59, + "learning_rate": 7.219586536680252e-06, + "loss": 1.8385, + "step": 29569500 + }, + { + "epoch": 85.59, + "learning_rate": 7.218862889032975e-06, + "loss": 1.8089, + "step": 29570000 + }, + { + "epoch": 85.59, + "learning_rate": 7.218140688680994e-06, + "loss": 1.8102, + "step": 29570500 + }, + { + "epoch": 85.6, + "learning_rate": 7.217417041033717e-06, + "loss": 1.8276, + "step": 29571000 + }, + { + "epoch": 85.6, + "learning_rate": 7.216693393386439e-06, + "loss": 1.8373, + "step": 29571500 + }, + { + "epoch": 85.6, + "learning_rate": 7.215969745739164e-06, + "loss": 1.8201, + "step": 29572000 + }, + { + "epoch": 85.6, + "learning_rate": 7.215246098091886e-06, + "loss": 1.8177, + "step": 29572500 + }, + { + "epoch": 85.6, + "learning_rate": 7.214522450444609e-06, + "loss": 1.8013, + "step": 29573000 + }, + { + "epoch": 85.6, + "learning_rate": 7.213798802797332e-06, + "loss": 1.7819, + "step": 29573500 + }, + { + "epoch": 85.6, + "learning_rate": 7.213075155150056e-06, + "loss": 1.8307, + "step": 29574000 + }, + { + "epoch": 85.61, + "learning_rate": 7.212351507502779e-06, + "loss": 1.7874, + "step": 29574500 + }, + { + "epoch": 85.61, + "learning_rate": 7.211629307150797e-06, + "loss": 1.8194, + "step": 29575000 + }, + { + "epoch": 85.61, + "learning_rate": 7.21090565950352e-06, + "loss": 1.8334, + "step": 29575500 + }, + { + "epoch": 85.61, + "learning_rate": 7.210182011856244e-06, + "loss": 1.8259, + "step": 29576000 + }, + { + "epoch": 85.61, + "learning_rate": 7.209458364208967e-06, + "loss": 1.8054, + "step": 29576500 + }, + { + "epoch": 85.61, + "learning_rate": 7.20873471656169e-06, + "loss": 1.8422, + "step": 29577000 + }, + { + "epoch": 85.61, + "learning_rate": 7.208012516209707e-06, + "loss": 1.8571, + "step": 29577500 + }, + { + "epoch": 85.62, + "learning_rate": 7.207288868562431e-06, + "loss": 1.8044, + "step": 29578000 + }, + { + "epoch": 85.62, + "learning_rate": 7.206566668210449e-06, + "loss": 1.8173, + "step": 29578500 + }, + { + "epoch": 85.62, + "learning_rate": 7.205843020563171e-06, + "loss": 1.8222, + "step": 29579000 + }, + { + "epoch": 85.62, + "learning_rate": 7.205119372915894e-06, + "loss": 1.8344, + "step": 29579500 + }, + { + "epoch": 85.62, + "learning_rate": 7.204395725268618e-06, + "loss": 1.8099, + "step": 29580000 + }, + { + "epoch": 85.62, + "learning_rate": 7.2036720776213414e-06, + "loss": 1.8269, + "step": 29580500 + }, + { + "epoch": 85.62, + "learning_rate": 7.2029484299740645e-06, + "loss": 1.8147, + "step": 29581000 + }, + { + "epoch": 85.63, + "learning_rate": 7.2022247823267884e-06, + "loss": 1.8063, + "step": 29581500 + }, + { + "epoch": 85.63, + "learning_rate": 7.2015011346795115e-06, + "loss": 1.8199, + "step": 29582000 + }, + { + "epoch": 85.63, + "learning_rate": 7.200778934327529e-06, + "loss": 1.8048, + "step": 29582500 + }, + { + "epoch": 85.63, + "learning_rate": 7.200055286680252e-06, + "loss": 1.8181, + "step": 29583000 + }, + { + "epoch": 85.63, + "learning_rate": 7.199331639032976e-06, + "loss": 1.7908, + "step": 29583500 + }, + { + "epoch": 85.63, + "learning_rate": 7.198607991385699e-06, + "loss": 1.7858, + "step": 29584000 + }, + { + "epoch": 85.64, + "learning_rate": 7.197884343738422e-06, + "loss": 1.8285, + "step": 29584500 + }, + { + "epoch": 85.64, + "learning_rate": 7.197162143386439e-06, + "loss": 1.8263, + "step": 29585000 + }, + { + "epoch": 85.64, + "learning_rate": 7.196438495739163e-06, + "loss": 1.8024, + "step": 29585500 + }, + { + "epoch": 85.64, + "learning_rate": 7.195714848091886e-06, + "loss": 1.7999, + "step": 29586000 + }, + { + "epoch": 85.64, + "learning_rate": 7.194991200444609e-06, + "loss": 1.8091, + "step": 29586500 + }, + { + "epoch": 85.64, + "learning_rate": 7.194267552797333e-06, + "loss": 1.8055, + "step": 29587000 + }, + { + "epoch": 85.64, + "learning_rate": 7.193543905150056e-06, + "loss": 1.81, + "step": 29587500 + }, + { + "epoch": 85.65, + "learning_rate": 7.1928217047980735e-06, + "loss": 1.8205, + "step": 29588000 + }, + { + "epoch": 85.65, + "learning_rate": 7.192099504446092e-06, + "loss": 1.8074, + "step": 29588500 + }, + { + "epoch": 85.65, + "learning_rate": 7.191375856798814e-06, + "loss": 1.8208, + "step": 29589000 + }, + { + "epoch": 85.65, + "learning_rate": 7.190652209151539e-06, + "loss": 1.8069, + "step": 29589500 + }, + { + "epoch": 85.65, + "learning_rate": 7.189928561504261e-06, + "loss": 1.8024, + "step": 29590000 + }, + { + "epoch": 85.65, + "learning_rate": 7.189204913856984e-06, + "loss": 1.8165, + "step": 29590500 + }, + { + "epoch": 85.65, + "learning_rate": 7.188481266209708e-06, + "loss": 1.8357, + "step": 29591000 + }, + { + "epoch": 85.66, + "learning_rate": 7.187757618562431e-06, + "loss": 1.8239, + "step": 29591500 + }, + { + "epoch": 85.66, + "learning_rate": 7.187033970915154e-06, + "loss": 1.8038, + "step": 29592000 + }, + { + "epoch": 85.66, + "learning_rate": 7.186310323267878e-06, + "loss": 1.815, + "step": 29592500 + }, + { + "epoch": 85.66, + "learning_rate": 7.185586675620601e-06, + "loss": 1.8059, + "step": 29593000 + }, + { + "epoch": 85.66, + "learning_rate": 7.184863027973323e-06, + "loss": 1.8053, + "step": 29593500 + }, + { + "epoch": 85.66, + "learning_rate": 7.184140827621341e-06, + "loss": 1.8204, + "step": 29594000 + }, + { + "epoch": 85.66, + "learning_rate": 7.183417179974065e-06, + "loss": 1.8182, + "step": 29594500 + }, + { + "epoch": 85.67, + "learning_rate": 7.182694979622083e-06, + "loss": 1.8368, + "step": 29595000 + }, + { + "epoch": 85.67, + "learning_rate": 7.181972779270101e-06, + "loss": 1.7967, + "step": 29595500 + }, + { + "epoch": 85.67, + "learning_rate": 7.181249131622824e-06, + "loss": 1.8115, + "step": 29596000 + }, + { + "epoch": 85.67, + "learning_rate": 7.180525483975546e-06, + "loss": 1.8404, + "step": 29596500 + }, + { + "epoch": 85.67, + "learning_rate": 7.179801836328271e-06, + "loss": 1.8221, + "step": 29597000 + }, + { + "epoch": 85.67, + "learning_rate": 7.179078188680993e-06, + "loss": 1.8358, + "step": 29597500 + }, + { + "epoch": 85.67, + "learning_rate": 7.178354541033716e-06, + "loss": 1.8101, + "step": 29598000 + }, + { + "epoch": 85.68, + "learning_rate": 7.17763089338644e-06, + "loss": 1.7923, + "step": 29598500 + }, + { + "epoch": 85.68, + "learning_rate": 7.176907245739163e-06, + "loss": 1.8161, + "step": 29599000 + }, + { + "epoch": 85.68, + "learning_rate": 7.176183598091886e-06, + "loss": 1.8168, + "step": 29599500 + }, + { + "epoch": 85.68, + "learning_rate": 7.175459950444608e-06, + "loss": 1.8542, + "step": 29600000 + }, + { + "epoch": 85.68, + "learning_rate": 7.174739197387922e-06, + "loss": 1.8186, + "step": 29600500 + }, + { + "epoch": 85.68, + "learning_rate": 7.174015549740645e-06, + "loss": 1.8059, + "step": 29601000 + }, + { + "epoch": 85.68, + "learning_rate": 7.1732919020933685e-06, + "loss": 1.8265, + "step": 29601500 + }, + { + "epoch": 85.69, + "learning_rate": 7.172568254446091e-06, + "loss": 1.8076, + "step": 29602000 + }, + { + "epoch": 85.69, + "learning_rate": 7.1718446067988155e-06, + "loss": 1.831, + "step": 29602500 + }, + { + "epoch": 85.69, + "learning_rate": 7.171120959151538e-06, + "loss": 1.8225, + "step": 29603000 + }, + { + "epoch": 85.69, + "learning_rate": 7.170397311504261e-06, + "loss": 1.8151, + "step": 29603500 + }, + { + "epoch": 85.69, + "learning_rate": 7.169673663856985e-06, + "loss": 1.8152, + "step": 29604000 + }, + { + "epoch": 85.69, + "learning_rate": 7.168950016209708e-06, + "loss": 1.8164, + "step": 29604500 + }, + { + "epoch": 85.69, + "learning_rate": 7.168226368562431e-06, + "loss": 1.7987, + "step": 29605000 + }, + { + "epoch": 85.7, + "learning_rate": 7.167502720915153e-06, + "loss": 1.7922, + "step": 29605500 + }, + { + "epoch": 85.7, + "learning_rate": 7.166779073267878e-06, + "loss": 1.8333, + "step": 29606000 + }, + { + "epoch": 85.7, + "learning_rate": 7.1660554256206e-06, + "loss": 1.8024, + "step": 29606500 + }, + { + "epoch": 85.7, + "learning_rate": 7.165333225268618e-06, + "loss": 1.8052, + "step": 29607000 + }, + { + "epoch": 85.7, + "learning_rate": 7.164609577621341e-06, + "loss": 1.8249, + "step": 29607500 + }, + { + "epoch": 85.7, + "learning_rate": 7.163885929974065e-06, + "loss": 1.8403, + "step": 29608000 + }, + { + "epoch": 85.7, + "learning_rate": 7.163162282326788e-06, + "loss": 1.8221, + "step": 29608500 + }, + { + "epoch": 85.71, + "learning_rate": 7.1624386346795106e-06, + "loss": 1.7836, + "step": 29609000 + }, + { + "epoch": 85.71, + "learning_rate": 7.161716434327529e-06, + "loss": 1.8174, + "step": 29609500 + }, + { + "epoch": 85.71, + "learning_rate": 7.160992786680253e-06, + "loss": 1.8151, + "step": 29610000 + }, + { + "epoch": 85.71, + "learning_rate": 7.16027058632827e-06, + "loss": 1.7995, + "step": 29610500 + }, + { + "epoch": 85.71, + "learning_rate": 7.159546938680993e-06, + "loss": 1.8053, + "step": 29611000 + }, + { + "epoch": 85.71, + "learning_rate": 7.158823291033717e-06, + "loss": 1.8129, + "step": 29611500 + }, + { + "epoch": 85.71, + "learning_rate": 7.15809964338644e-06, + "loss": 1.8026, + "step": 29612000 + }, + { + "epoch": 85.72, + "learning_rate": 7.157375995739163e-06, + "loss": 1.8135, + "step": 29612500 + }, + { + "epoch": 85.72, + "learning_rate": 7.156652348091886e-06, + "loss": 1.8086, + "step": 29613000 + }, + { + "epoch": 85.72, + "learning_rate": 7.15592870044461e-06, + "loss": 1.7954, + "step": 29613500 + }, + { + "epoch": 85.72, + "learning_rate": 7.155205052797333e-06, + "loss": 1.8314, + "step": 29614000 + }, + { + "epoch": 85.72, + "learning_rate": 7.154481405150055e-06, + "loss": 1.8128, + "step": 29614500 + }, + { + "epoch": 85.72, + "learning_rate": 7.1537592047980734e-06, + "loss": 1.8218, + "step": 29615000 + }, + { + "epoch": 85.72, + "learning_rate": 7.153035557150797e-06, + "loss": 1.7991, + "step": 29615500 + }, + { + "epoch": 85.73, + "learning_rate": 7.1523119095035204e-06, + "loss": 1.8102, + "step": 29616000 + }, + { + "epoch": 85.73, + "learning_rate": 7.151589709151538e-06, + "loss": 1.8248, + "step": 29616500 + }, + { + "epoch": 85.73, + "learning_rate": 7.150866061504261e-06, + "loss": 1.8068, + "step": 29617000 + }, + { + "epoch": 85.73, + "learning_rate": 7.150142413856985e-06, + "loss": 1.7997, + "step": 29617500 + }, + { + "epoch": 85.73, + "learning_rate": 7.149418766209708e-06, + "loss": 1.8076, + "step": 29618000 + }, + { + "epoch": 85.73, + "learning_rate": 7.148696565857725e-06, + "loss": 1.8304, + "step": 29618500 + }, + { + "epoch": 85.73, + "learning_rate": 7.147972918210449e-06, + "loss": 1.8005, + "step": 29619000 + }, + { + "epoch": 85.74, + "learning_rate": 7.147249270563172e-06, + "loss": 1.8306, + "step": 29619500 + }, + { + "epoch": 85.74, + "learning_rate": 7.146525622915895e-06, + "loss": 1.8096, + "step": 29620000 + }, + { + "epoch": 85.74, + "learning_rate": 7.145801975268618e-06, + "loss": 1.8093, + "step": 29620500 + }, + { + "epoch": 85.74, + "learning_rate": 7.145078327621342e-06, + "loss": 1.8276, + "step": 29621000 + }, + { + "epoch": 85.74, + "learning_rate": 7.144356127269359e-06, + "loss": 1.8128, + "step": 29621500 + }, + { + "epoch": 85.74, + "learning_rate": 7.1436324796220825e-06, + "loss": 1.8016, + "step": 29622000 + }, + { + "epoch": 85.75, + "learning_rate": 7.1429088319748055e-06, + "loss": 1.8253, + "step": 29622500 + }, + { + "epoch": 85.75, + "learning_rate": 7.1421851843275295e-06, + "loss": 1.8142, + "step": 29623000 + }, + { + "epoch": 85.75, + "learning_rate": 7.1414615366802525e-06, + "loss": 1.8015, + "step": 29623500 + }, + { + "epoch": 85.75, + "learning_rate": 7.140737889032975e-06, + "loss": 1.8453, + "step": 29624000 + }, + { + "epoch": 85.75, + "learning_rate": 7.1400142413856996e-06, + "loss": 1.8206, + "step": 29624500 + }, + { + "epoch": 85.75, + "learning_rate": 7.139292041033717e-06, + "loss": 1.8323, + "step": 29625000 + }, + { + "epoch": 85.75, + "learning_rate": 7.13856839338644e-06, + "loss": 1.8086, + "step": 29625500 + }, + { + "epoch": 85.76, + "learning_rate": 7.137844745739163e-06, + "loss": 1.8492, + "step": 29626000 + }, + { + "epoch": 85.76, + "learning_rate": 7.137121098091887e-06, + "loss": 1.7921, + "step": 29626500 + }, + { + "epoch": 85.76, + "learning_rate": 7.13639745044461e-06, + "loss": 1.8132, + "step": 29627000 + }, + { + "epoch": 85.76, + "learning_rate": 7.135673802797332e-06, + "loss": 1.8338, + "step": 29627500 + }, + { + "epoch": 85.76, + "learning_rate": 7.134950155150055e-06, + "loss": 1.8008, + "step": 29628000 + }, + { + "epoch": 85.76, + "learning_rate": 7.134226507502779e-06, + "loss": 1.8223, + "step": 29628500 + }, + { + "epoch": 85.76, + "learning_rate": 7.133502859855502e-06, + "loss": 1.8013, + "step": 29629000 + }, + { + "epoch": 85.77, + "learning_rate": 7.132779212208225e-06, + "loss": 1.7769, + "step": 29629500 + }, + { + "epoch": 85.77, + "learning_rate": 7.132055564560949e-06, + "loss": 1.8131, + "step": 29630000 + }, + { + "epoch": 85.77, + "learning_rate": 7.131331916913672e-06, + "loss": 1.8474, + "step": 29630500 + }, + { + "epoch": 85.77, + "learning_rate": 7.13060971656169e-06, + "loss": 1.8278, + "step": 29631000 + }, + { + "epoch": 85.77, + "learning_rate": 7.129886068914413e-06, + "loss": 1.829, + "step": 29631500 + }, + { + "epoch": 85.77, + "learning_rate": 7.129162421267137e-06, + "loss": 1.7918, + "step": 29632000 + }, + { + "epoch": 85.77, + "learning_rate": 7.12843877361986e-06, + "loss": 1.8141, + "step": 29632500 + }, + { + "epoch": 85.78, + "learning_rate": 7.127716573267877e-06, + "loss": 1.7849, + "step": 29633000 + }, + { + "epoch": 85.78, + "learning_rate": 7.126994372915895e-06, + "loss": 1.831, + "step": 29633500 + }, + { + "epoch": 85.78, + "learning_rate": 7.126270725268619e-06, + "loss": 1.8048, + "step": 29634000 + }, + { + "epoch": 85.78, + "learning_rate": 7.125547077621342e-06, + "loss": 1.8106, + "step": 29634500 + }, + { + "epoch": 85.78, + "learning_rate": 7.124823429974064e-06, + "loss": 1.8055, + "step": 29635000 + }, + { + "epoch": 85.78, + "learning_rate": 7.124099782326787e-06, + "loss": 1.7954, + "step": 29635500 + }, + { + "epoch": 85.78, + "learning_rate": 7.123376134679511e-06, + "loss": 1.8082, + "step": 29636000 + }, + { + "epoch": 85.79, + "learning_rate": 7.122652487032234e-06, + "loss": 1.7923, + "step": 29636500 + }, + { + "epoch": 85.79, + "learning_rate": 7.121930286680252e-06, + "loss": 1.8231, + "step": 29637000 + }, + { + "epoch": 85.79, + "learning_rate": 7.121206639032975e-06, + "loss": 1.8192, + "step": 29637500 + }, + { + "epoch": 85.79, + "learning_rate": 7.1204829913856995e-06, + "loss": 1.8068, + "step": 29638000 + }, + { + "epoch": 85.79, + "learning_rate": 7.119759343738422e-06, + "loss": 1.807, + "step": 29638500 + }, + { + "epoch": 85.79, + "learning_rate": 7.11903714338644e-06, + "loss": 1.7766, + "step": 29639000 + }, + { + "epoch": 85.79, + "learning_rate": 7.118313495739164e-06, + "loss": 1.8065, + "step": 29639500 + }, + { + "epoch": 85.8, + "learning_rate": 7.117589848091887e-06, + "loss": 1.8175, + "step": 29640000 + }, + { + "epoch": 85.8, + "learning_rate": 7.116866200444609e-06, + "loss": 1.7879, + "step": 29640500 + }, + { + "epoch": 85.8, + "learning_rate": 7.116144000092627e-06, + "loss": 1.8108, + "step": 29641000 + }, + { + "epoch": 85.8, + "learning_rate": 7.115420352445351e-06, + "loss": 1.8236, + "step": 29641500 + }, + { + "epoch": 85.8, + "learning_rate": 7.114696704798074e-06, + "loss": 1.7955, + "step": 29642000 + }, + { + "epoch": 85.8, + "learning_rate": 7.113973057150796e-06, + "loss": 1.8124, + "step": 29642500 + }, + { + "epoch": 85.8, + "learning_rate": 7.1132494095035195e-06, + "loss": 1.821, + "step": 29643000 + }, + { + "epoch": 85.81, + "learning_rate": 7.1125272091515384e-06, + "loss": 1.8074, + "step": 29643500 + }, + { + "epoch": 85.81, + "learning_rate": 7.1118035615042615e-06, + "loss": 1.8385, + "step": 29644000 + }, + { + "epoch": 85.81, + "learning_rate": 7.111079913856985e-06, + "loss": 1.803, + "step": 29644500 + }, + { + "epoch": 85.81, + "learning_rate": 7.110356266209707e-06, + "loss": 1.8247, + "step": 29645000 + }, + { + "epoch": 85.81, + "learning_rate": 7.109632618562432e-06, + "loss": 1.8097, + "step": 29645500 + }, + { + "epoch": 85.81, + "learning_rate": 7.108908970915154e-06, + "loss": 1.8128, + "step": 29646000 + }, + { + "epoch": 85.81, + "learning_rate": 7.108185323267877e-06, + "loss": 1.817, + "step": 29646500 + }, + { + "epoch": 85.82, + "learning_rate": 7.107461675620601e-06, + "loss": 1.8081, + "step": 29647000 + }, + { + "epoch": 85.82, + "learning_rate": 7.106739475268619e-06, + "loss": 1.8241, + "step": 29647500 + }, + { + "epoch": 85.82, + "learning_rate": 7.106015827621341e-06, + "loss": 1.8232, + "step": 29648000 + }, + { + "epoch": 85.82, + "learning_rate": 7.105292179974064e-06, + "loss": 1.8123, + "step": 29648500 + }, + { + "epoch": 85.82, + "learning_rate": 7.104568532326788e-06, + "loss": 1.8007, + "step": 29649000 + }, + { + "epoch": 85.82, + "learning_rate": 7.103846331974806e-06, + "loss": 1.8193, + "step": 29649500 + }, + { + "epoch": 85.82, + "learning_rate": 7.1031226843275285e-06, + "loss": 1.8123, + "step": 29650000 + }, + { + "epoch": 85.83, + "learning_rate": 7.102400483975547e-06, + "loss": 1.8203, + "step": 29650500 + }, + { + "epoch": 85.83, + "learning_rate": 7.1016768363282705e-06, + "loss": 1.801, + "step": 29651000 + }, + { + "epoch": 85.83, + "learning_rate": 7.100953188680994e-06, + "loss": 1.8418, + "step": 29651500 + }, + { + "epoch": 85.83, + "learning_rate": 7.100229541033717e-06, + "loss": 1.7934, + "step": 29652000 + }, + { + "epoch": 85.83, + "learning_rate": 7.099505893386439e-06, + "loss": 1.7956, + "step": 29652500 + }, + { + "epoch": 85.83, + "learning_rate": 7.098785140329751e-06, + "loss": 1.8027, + "step": 29653000 + }, + { + "epoch": 85.83, + "learning_rate": 7.098061492682476e-06, + "loss": 1.8238, + "step": 29653500 + }, + { + "epoch": 85.84, + "learning_rate": 7.097337845035198e-06, + "loss": 1.8305, + "step": 29654000 + }, + { + "epoch": 85.84, + "learning_rate": 7.096614197387921e-06, + "loss": 1.7944, + "step": 29654500 + }, + { + "epoch": 85.84, + "learning_rate": 7.095890549740645e-06, + "loss": 1.7939, + "step": 29655000 + }, + { + "epoch": 85.84, + "learning_rate": 7.095166902093368e-06, + "loss": 1.8169, + "step": 29655500 + }, + { + "epoch": 85.84, + "learning_rate": 7.094443254446091e-06, + "loss": 1.81, + "step": 29656000 + }, + { + "epoch": 85.84, + "learning_rate": 7.0937196067988145e-06, + "loss": 1.821, + "step": 29656500 + }, + { + "epoch": 85.84, + "learning_rate": 7.092995959151538e-06, + "loss": 1.8091, + "step": 29657000 + }, + { + "epoch": 85.85, + "learning_rate": 7.0922723115042615e-06, + "loss": 1.8233, + "step": 29657500 + }, + { + "epoch": 85.85, + "learning_rate": 7.091548663856984e-06, + "loss": 1.8329, + "step": 29658000 + }, + { + "epoch": 85.85, + "learning_rate": 7.0908250162097085e-06, + "loss": 1.8263, + "step": 29658500 + }, + { + "epoch": 85.85, + "learning_rate": 7.090102815857726e-06, + "loss": 1.8129, + "step": 29659000 + }, + { + "epoch": 85.85, + "learning_rate": 7.089379168210449e-06, + "loss": 1.7994, + "step": 29659500 + }, + { + "epoch": 85.85, + "learning_rate": 7.088655520563171e-06, + "loss": 1.8096, + "step": 29660000 + }, + { + "epoch": 85.86, + "learning_rate": 7.087931872915896e-06, + "loss": 1.8112, + "step": 29660500 + }, + { + "epoch": 85.86, + "learning_rate": 7.087208225268618e-06, + "loss": 1.8121, + "step": 29661000 + }, + { + "epoch": 85.86, + "learning_rate": 7.086486024916636e-06, + "loss": 1.8305, + "step": 29661500 + }, + { + "epoch": 85.86, + "learning_rate": 7.085762377269358e-06, + "loss": 1.8024, + "step": 29662000 + }, + { + "epoch": 85.86, + "learning_rate": 7.085038729622083e-06, + "loss": 1.8217, + "step": 29662500 + }, + { + "epoch": 85.86, + "learning_rate": 7.084315081974806e-06, + "loss": 1.7958, + "step": 29663000 + }, + { + "epoch": 85.86, + "learning_rate": 7.0835914343275285e-06, + "loss": 1.817, + "step": 29663500 + }, + { + "epoch": 85.87, + "learning_rate": 7.082867786680253e-06, + "loss": 1.7998, + "step": 29664000 + }, + { + "epoch": 85.87, + "learning_rate": 7.0821455863282705e-06, + "loss": 1.8058, + "step": 29664500 + }, + { + "epoch": 85.87, + "learning_rate": 7.0814219386809936e-06, + "loss": 1.8142, + "step": 29665000 + }, + { + "epoch": 85.87, + "learning_rate": 7.080698291033716e-06, + "loss": 1.7899, + "step": 29665500 + }, + { + "epoch": 85.87, + "learning_rate": 7.0799746433864406e-06, + "loss": 1.8122, + "step": 29666000 + }, + { + "epoch": 85.87, + "learning_rate": 7.079250995739163e-06, + "loss": 1.8138, + "step": 29666500 + }, + { + "epoch": 85.87, + "learning_rate": 7.078527348091886e-06, + "loss": 1.8058, + "step": 29667000 + }, + { + "epoch": 85.88, + "learning_rate": 7.077803700444609e-06, + "loss": 1.8106, + "step": 29667500 + }, + { + "epoch": 85.88, + "learning_rate": 7.077080052797333e-06, + "loss": 1.8015, + "step": 29668000 + }, + { + "epoch": 85.88, + "learning_rate": 7.07635785244535e-06, + "loss": 1.8213, + "step": 29668500 + }, + { + "epoch": 85.88, + "learning_rate": 7.075634204798073e-06, + "loss": 1.8454, + "step": 29669000 + }, + { + "epoch": 85.88, + "learning_rate": 7.074910557150798e-06, + "loss": 1.8116, + "step": 29669500 + }, + { + "epoch": 85.88, + "learning_rate": 7.07418690950352e-06, + "loss": 1.8019, + "step": 29670000 + }, + { + "epoch": 85.88, + "learning_rate": 7.073464709151538e-06, + "loss": 1.8057, + "step": 29670500 + }, + { + "epoch": 85.89, + "learning_rate": 7.072742508799556e-06, + "loss": 1.8446, + "step": 29671000 + }, + { + "epoch": 85.89, + "learning_rate": 7.072020308447573e-06, + "loss": 1.8203, + "step": 29671500 + }, + { + "epoch": 85.89, + "learning_rate": 7.071296660800298e-06, + "loss": 1.8158, + "step": 29672000 + }, + { + "epoch": 85.89, + "learning_rate": 7.07057301315302e-06, + "loss": 1.823, + "step": 29672500 + }, + { + "epoch": 85.89, + "learning_rate": 7.069849365505743e-06, + "loss": 1.808, + "step": 29673000 + }, + { + "epoch": 85.89, + "learning_rate": 7.069125717858466e-06, + "loss": 1.8111, + "step": 29673500 + }, + { + "epoch": 85.89, + "learning_rate": 7.06840207021119e-06, + "loss": 1.824, + "step": 29674000 + }, + { + "epoch": 85.9, + "learning_rate": 7.067678422563913e-06, + "loss": 1.7828, + "step": 29674500 + }, + { + "epoch": 85.9, + "learning_rate": 7.066954774916635e-06, + "loss": 1.829, + "step": 29675000 + }, + { + "epoch": 85.9, + "learning_rate": 7.066232574564654e-06, + "loss": 1.8159, + "step": 29675500 + }, + { + "epoch": 85.9, + "learning_rate": 7.065508926917377e-06, + "loss": 1.8433, + "step": 29676000 + }, + { + "epoch": 85.9, + "learning_rate": 7.0647852792701e-06, + "loss": 1.8166, + "step": 29676500 + }, + { + "epoch": 85.9, + "learning_rate": 7.0640616316228234e-06, + "loss": 1.8298, + "step": 29677000 + }, + { + "epoch": 85.9, + "learning_rate": 7.063337983975547e-06, + "loss": 1.7998, + "step": 29677500 + }, + { + "epoch": 85.91, + "learning_rate": 7.062615783623565e-06, + "loss": 1.8396, + "step": 29678000 + }, + { + "epoch": 85.91, + "learning_rate": 7.061892135976288e-06, + "loss": 1.8131, + "step": 29678500 + }, + { + "epoch": 85.91, + "learning_rate": 7.061168488329011e-06, + "loss": 1.7934, + "step": 29679000 + }, + { + "epoch": 85.91, + "learning_rate": 7.060444840681735e-06, + "loss": 1.8106, + "step": 29679500 + }, + { + "epoch": 85.91, + "learning_rate": 7.059721193034458e-06, + "loss": 1.8208, + "step": 29680000 + }, + { + "epoch": 85.91, + "learning_rate": 7.05899754538718e-06, + "loss": 1.8378, + "step": 29680500 + }, + { + "epoch": 85.91, + "learning_rate": 7.058273897739905e-06, + "loss": 1.8091, + "step": 29681000 + }, + { + "epoch": 85.92, + "learning_rate": 7.057550250092627e-06, + "loss": 1.7957, + "step": 29681500 + }, + { + "epoch": 85.92, + "learning_rate": 7.05682949703594e-06, + "loss": 1.8082, + "step": 29682000 + }, + { + "epoch": 85.92, + "learning_rate": 7.056105849388662e-06, + "loss": 1.8343, + "step": 29682500 + }, + { + "epoch": 85.92, + "learning_rate": 7.0553822017413854e-06, + "loss": 1.8202, + "step": 29683000 + }, + { + "epoch": 85.92, + "learning_rate": 7.054658554094109e-06, + "loss": 1.7903, + "step": 29683500 + }, + { + "epoch": 85.92, + "learning_rate": 7.0539349064468324e-06, + "loss": 1.8242, + "step": 29684000 + }, + { + "epoch": 85.92, + "learning_rate": 7.0532112587995555e-06, + "loss": 1.7962, + "step": 29684500 + }, + { + "epoch": 85.93, + "learning_rate": 7.0524890584475745e-06, + "loss": 1.8026, + "step": 29685000 + }, + { + "epoch": 85.93, + "learning_rate": 7.051766858095592e-06, + "loss": 1.7886, + "step": 29685500 + }, + { + "epoch": 85.93, + "learning_rate": 7.051043210448315e-06, + "loss": 1.8119, + "step": 29686000 + }, + { + "epoch": 85.93, + "learning_rate": 7.050319562801037e-06, + "loss": 1.8018, + "step": 29686500 + }, + { + "epoch": 85.93, + "learning_rate": 7.049595915153762e-06, + "loss": 1.7875, + "step": 29687000 + }, + { + "epoch": 85.93, + "learning_rate": 7.048872267506484e-06, + "loss": 1.8333, + "step": 29687500 + }, + { + "epoch": 85.93, + "learning_rate": 7.048148619859207e-06, + "loss": 1.8068, + "step": 29688000 + }, + { + "epoch": 85.94, + "learning_rate": 7.04742497221193e-06, + "loss": 1.8118, + "step": 29688500 + }, + { + "epoch": 85.94, + "learning_rate": 7.046701324564654e-06, + "loss": 1.8259, + "step": 29689000 + }, + { + "epoch": 85.94, + "learning_rate": 7.045977676917377e-06, + "loss": 1.8196, + "step": 29689500 + }, + { + "epoch": 85.94, + "learning_rate": 7.0452540292701e-06, + "loss": 1.8092, + "step": 29690000 + }, + { + "epoch": 85.94, + "learning_rate": 7.044530381622824e-06, + "loss": 1.8165, + "step": 29690500 + }, + { + "epoch": 85.94, + "learning_rate": 7.043806733975547e-06, + "loss": 1.8074, + "step": 29691000 + }, + { + "epoch": 85.94, + "learning_rate": 7.0430845336235646e-06, + "loss": 1.8085, + "step": 29691500 + }, + { + "epoch": 85.95, + "learning_rate": 7.042360885976288e-06, + "loss": 1.7995, + "step": 29692000 + }, + { + "epoch": 85.95, + "learning_rate": 7.0416372383290116e-06, + "loss": 1.8559, + "step": 29692500 + }, + { + "epoch": 85.95, + "learning_rate": 7.040915037977029e-06, + "loss": 1.7842, + "step": 29693000 + }, + { + "epoch": 85.95, + "learning_rate": 7.040191390329752e-06, + "loss": 1.832, + "step": 29693500 + }, + { + "epoch": 85.95, + "learning_rate": 7.039467742682475e-06, + "loss": 1.8214, + "step": 29694000 + }, + { + "epoch": 85.95, + "learning_rate": 7.038744095035199e-06, + "loss": 1.8163, + "step": 29694500 + }, + { + "epoch": 85.95, + "learning_rate": 7.038020447387922e-06, + "loss": 1.7967, + "step": 29695000 + }, + { + "epoch": 85.96, + "learning_rate": 7.037296799740645e-06, + "loss": 1.8295, + "step": 29695500 + }, + { + "epoch": 85.96, + "learning_rate": 7.036574599388662e-06, + "loss": 1.8278, + "step": 29696000 + }, + { + "epoch": 85.96, + "learning_rate": 7.035850951741386e-06, + "loss": 1.8399, + "step": 29696500 + }, + { + "epoch": 85.96, + "learning_rate": 7.035127304094109e-06, + "loss": 1.818, + "step": 29697000 + }, + { + "epoch": 85.96, + "learning_rate": 7.034403656446832e-06, + "loss": 1.8296, + "step": 29697500 + }, + { + "epoch": 85.96, + "learning_rate": 7.033680008799556e-06, + "loss": 1.8171, + "step": 29698000 + }, + { + "epoch": 85.96, + "learning_rate": 7.032956361152279e-06, + "loss": 1.8105, + "step": 29698500 + }, + { + "epoch": 85.97, + "learning_rate": 7.032232713505002e-06, + "loss": 1.8188, + "step": 29699000 + }, + { + "epoch": 85.97, + "learning_rate": 7.031509065857725e-06, + "loss": 1.828, + "step": 29699500 + }, + { + "epoch": 85.97, + "learning_rate": 7.030785418210449e-06, + "loss": 1.8288, + "step": 29700000 + }, + { + "epoch": 85.97, + "learning_rate": 7.030063217858467e-06, + "loss": 1.8409, + "step": 29700500 + }, + { + "epoch": 85.97, + "learning_rate": 7.02933957021119e-06, + "loss": 1.8009, + "step": 29701000 + }, + { + "epoch": 85.97, + "learning_rate": 7.028615922563912e-06, + "loss": 1.7998, + "step": 29701500 + }, + { + "epoch": 85.98, + "learning_rate": 7.027892274916637e-06, + "loss": 1.7893, + "step": 29702000 + }, + { + "epoch": 85.98, + "learning_rate": 7.027171521859949e-06, + "loss": 1.8123, + "step": 29702500 + }, + { + "epoch": 85.98, + "learning_rate": 7.026447874212671e-06, + "loss": 1.7961, + "step": 29703000 + }, + { + "epoch": 85.98, + "learning_rate": 7.025724226565394e-06, + "loss": 1.8147, + "step": 29703500 + }, + { + "epoch": 85.98, + "learning_rate": 7.025000578918118e-06, + "loss": 1.8074, + "step": 29704000 + }, + { + "epoch": 85.98, + "learning_rate": 7.0242783785661364e-06, + "loss": 1.8356, + "step": 29704500 + }, + { + "epoch": 85.98, + "learning_rate": 7.023556178214154e-06, + "loss": 1.8284, + "step": 29705000 + }, + { + "epoch": 85.99, + "learning_rate": 7.022832530566877e-06, + "loss": 1.8202, + "step": 29705500 + }, + { + "epoch": 85.99, + "learning_rate": 7.022108882919601e-06, + "loss": 1.8051, + "step": 29706000 + }, + { + "epoch": 85.99, + "learning_rate": 7.021385235272324e-06, + "loss": 1.8213, + "step": 29706500 + }, + { + "epoch": 85.99, + "learning_rate": 7.020661587625047e-06, + "loss": 1.7744, + "step": 29707000 + }, + { + "epoch": 85.99, + "learning_rate": 7.019937939977769e-06, + "loss": 1.8404, + "step": 29707500 + }, + { + "epoch": 85.99, + "learning_rate": 7.019214292330494e-06, + "loss": 1.8147, + "step": 29708000 + }, + { + "epoch": 85.99, + "learning_rate": 7.018492091978511e-06, + "loss": 1.8006, + "step": 29708500 + }, + { + "epoch": 86.0, + "learning_rate": 7.017768444331234e-06, + "loss": 1.812, + "step": 29709000 + }, + { + "epoch": 86.0, + "learning_rate": 7.0170447966839564e-06, + "loss": 1.8255, + "step": 29709500 + }, + { + "epoch": 86.0, + "learning_rate": 7.016321149036681e-06, + "loss": 1.8123, + "step": 29710000 + }, + { + "epoch": 86.0, + "learning_rate": 7.0155989486846985e-06, + "loss": 1.8029, + "step": 29710500 + }, + { + "epoch": 86.0, + "eval_accuracy": 0.6887171585544973, + "eval_accuracy_mlm": 0.6578651829440271, + "eval_accuracy_nsp": 0.8541566411388083, + "eval_loss": 2.1977808475494385, + "eval_runtime": 331.6135, + "eval_samples_per_second": 1315.947, + "eval_steps_per_second": 54.832, + "step": 29710592 + }, + { + "epoch": 86.0, + "learning_rate": 7.0148753010374215e-06, + "loss": 1.7942, + "step": 29711000 + }, + { + "epoch": 86.0, + "learning_rate": 7.0141516533901455e-06, + "loss": 1.7909, + "step": 29711500 + }, + { + "epoch": 86.0, + "learning_rate": 7.0134280057428685e-06, + "loss": 1.8082, + "step": 29712000 + }, + { + "epoch": 86.01, + "learning_rate": 7.012705805390886e-06, + "loss": 1.8063, + "step": 29712500 + }, + { + "epoch": 86.01, + "learning_rate": 7.011982157743609e-06, + "loss": 1.8065, + "step": 29713000 + }, + { + "epoch": 86.01, + "learning_rate": 7.011258510096333e-06, + "loss": 1.8123, + "step": 29713500 + }, + { + "epoch": 86.01, + "learning_rate": 7.010536309744351e-06, + "loss": 1.7888, + "step": 29714000 + }, + { + "epoch": 86.01, + "learning_rate": 7.009812662097073e-06, + "loss": 1.8073, + "step": 29714500 + }, + { + "epoch": 86.01, + "learning_rate": 7.009089014449796e-06, + "loss": 1.818, + "step": 29715000 + }, + { + "epoch": 86.01, + "learning_rate": 7.00836536680252e-06, + "loss": 1.8077, + "step": 29715500 + }, + { + "epoch": 86.02, + "learning_rate": 7.007641719155243e-06, + "loss": 1.8252, + "step": 29716000 + }, + { + "epoch": 86.02, + "learning_rate": 7.006918071507966e-06, + "loss": 1.7972, + "step": 29716500 + }, + { + "epoch": 86.02, + "learning_rate": 7.0061944238606885e-06, + "loss": 1.8308, + "step": 29717000 + }, + { + "epoch": 86.02, + "learning_rate": 7.005470776213413e-06, + "loss": 1.8159, + "step": 29717500 + }, + { + "epoch": 86.02, + "learning_rate": 7.0047471285661355e-06, + "loss": 1.8374, + "step": 29718000 + }, + { + "epoch": 86.02, + "learning_rate": 7.004023480918859e-06, + "loss": 1.7852, + "step": 29718500 + }, + { + "epoch": 86.02, + "learning_rate": 7.0032998332715825e-06, + "loss": 1.7811, + "step": 29719000 + }, + { + "epoch": 86.03, + "learning_rate": 7.002576185624306e-06, + "loss": 1.821, + "step": 29719500 + }, + { + "epoch": 86.03, + "learning_rate": 7.001853985272324e-06, + "loss": 1.8059, + "step": 29720000 + }, + { + "epoch": 86.03, + "learning_rate": 7.001130337625046e-06, + "loss": 1.7965, + "step": 29720500 + }, + { + "epoch": 86.03, + "learning_rate": 7.000406689977771e-06, + "loss": 1.8121, + "step": 29721000 + }, + { + "epoch": 86.03, + "learning_rate": 6.999683042330493e-06, + "loss": 1.7983, + "step": 29721500 + }, + { + "epoch": 86.03, + "learning_rate": 6.998959394683216e-06, + "loss": 1.8039, + "step": 29722000 + }, + { + "epoch": 86.03, + "learning_rate": 6.998237194331233e-06, + "loss": 1.796, + "step": 29722500 + }, + { + "epoch": 86.04, + "learning_rate": 6.997513546683958e-06, + "loss": 1.8091, + "step": 29723000 + }, + { + "epoch": 86.04, + "learning_rate": 6.99678989903668e-06, + "loss": 1.7802, + "step": 29723500 + }, + { + "epoch": 86.04, + "learning_rate": 6.996066251389403e-06, + "loss": 1.7894, + "step": 29724000 + }, + { + "epoch": 86.04, + "learning_rate": 6.995345498332716e-06, + "loss": 1.8035, + "step": 29724500 + }, + { + "epoch": 86.04, + "learning_rate": 6.99462185068544e-06, + "loss": 1.8062, + "step": 29725000 + }, + { + "epoch": 86.04, + "learning_rate": 6.993898203038163e-06, + "loss": 1.8306, + "step": 29725500 + }, + { + "epoch": 86.04, + "learning_rate": 6.993174555390886e-06, + "loss": 1.8104, + "step": 29726000 + }, + { + "epoch": 86.05, + "learning_rate": 6.992450907743609e-06, + "loss": 1.8223, + "step": 29726500 + }, + { + "epoch": 86.05, + "learning_rate": 6.991727260096333e-06, + "loss": 1.818, + "step": 29727000 + }, + { + "epoch": 86.05, + "learning_rate": 6.99100505974435e-06, + "loss": 1.8039, + "step": 29727500 + }, + { + "epoch": 86.05, + "learning_rate": 6.990281412097073e-06, + "loss": 1.8326, + "step": 29728000 + }, + { + "epoch": 86.05, + "learning_rate": 6.989557764449796e-06, + "loss": 1.7934, + "step": 29728500 + }, + { + "epoch": 86.05, + "learning_rate": 6.98883411680252e-06, + "loss": 1.7882, + "step": 29729000 + }, + { + "epoch": 86.05, + "learning_rate": 6.988110469155243e-06, + "loss": 1.7989, + "step": 29729500 + }, + { + "epoch": 86.06, + "learning_rate": 6.987386821507965e-06, + "loss": 1.777, + "step": 29730000 + }, + { + "epoch": 86.06, + "learning_rate": 6.986664621155984e-06, + "loss": 1.785, + "step": 29730500 + }, + { + "epoch": 86.06, + "learning_rate": 6.985940973508707e-06, + "loss": 1.8132, + "step": 29731000 + }, + { + "epoch": 86.06, + "learning_rate": 6.9852173258614305e-06, + "loss": 1.8205, + "step": 29731500 + }, + { + "epoch": 86.06, + "learning_rate": 6.984493678214154e-06, + "loss": 1.791, + "step": 29732000 + }, + { + "epoch": 86.06, + "learning_rate": 6.9837700305668775e-06, + "loss": 1.8254, + "step": 29732500 + }, + { + "epoch": 86.06, + "learning_rate": 6.983046382919601e-06, + "loss": 1.8278, + "step": 29733000 + }, + { + "epoch": 86.07, + "learning_rate": 6.982322735272323e-06, + "loss": 1.8181, + "step": 29733500 + }, + { + "epoch": 86.07, + "learning_rate": 6.981599087625048e-06, + "loss": 1.7845, + "step": 29734000 + }, + { + "epoch": 86.07, + "learning_rate": 6.98087543997777e-06, + "loss": 1.7865, + "step": 29734500 + }, + { + "epoch": 86.07, + "learning_rate": 6.980151792330493e-06, + "loss": 1.7887, + "step": 29735000 + }, + { + "epoch": 86.07, + "learning_rate": 6.97942959197851e-06, + "loss": 1.8078, + "step": 29735500 + }, + { + "epoch": 86.07, + "learning_rate": 6.978707391626528e-06, + "loss": 1.8032, + "step": 29736000 + }, + { + "epoch": 86.07, + "learning_rate": 6.977983743979252e-06, + "loss": 1.7904, + "step": 29736500 + }, + { + "epoch": 86.08, + "learning_rate": 6.9772615436272694e-06, + "loss": 1.7678, + "step": 29737000 + }, + { + "epoch": 86.08, + "learning_rate": 6.9765378959799925e-06, + "loss": 1.8355, + "step": 29737500 + }, + { + "epoch": 86.08, + "learning_rate": 6.975814248332716e-06, + "loss": 1.795, + "step": 29738000 + }, + { + "epoch": 86.08, + "learning_rate": 6.9750906006854395e-06, + "loss": 1.82, + "step": 29738500 + }, + { + "epoch": 86.08, + "learning_rate": 6.974366953038163e-06, + "loss": 1.8277, + "step": 29739000 + }, + { + "epoch": 86.08, + "learning_rate": 6.973643305390886e-06, + "loss": 1.8009, + "step": 29739500 + }, + { + "epoch": 86.09, + "learning_rate": 6.97291965774361e-06, + "loss": 1.8162, + "step": 29740000 + }, + { + "epoch": 86.09, + "learning_rate": 6.972196010096333e-06, + "loss": 1.8026, + "step": 29740500 + }, + { + "epoch": 86.09, + "learning_rate": 6.971472362449055e-06, + "loss": 1.8045, + "step": 29741000 + }, + { + "epoch": 86.09, + "learning_rate": 6.97074871480178e-06, + "loss": 1.829, + "step": 29741500 + }, + { + "epoch": 86.09, + "learning_rate": 6.970025067154502e-06, + "loss": 1.8101, + "step": 29742000 + }, + { + "epoch": 86.09, + "learning_rate": 6.969301419507225e-06, + "loss": 1.8071, + "step": 29742500 + }, + { + "epoch": 86.09, + "learning_rate": 6.968579219155242e-06, + "loss": 1.8088, + "step": 29743000 + }, + { + "epoch": 86.1, + "learning_rate": 6.967855571507967e-06, + "loss": 1.8201, + "step": 29743500 + }, + { + "epoch": 86.1, + "learning_rate": 6.967133371155984e-06, + "loss": 1.7804, + "step": 29744000 + }, + { + "epoch": 86.1, + "learning_rate": 6.966409723508707e-06, + "loss": 1.8005, + "step": 29744500 + }, + { + "epoch": 86.1, + "learning_rate": 6.9656860758614305e-06, + "loss": 1.796, + "step": 29745000 + }, + { + "epoch": 86.1, + "learning_rate": 6.964962428214154e-06, + "loss": 1.8071, + "step": 29745500 + }, + { + "epoch": 86.1, + "learning_rate": 6.9642387805668775e-06, + "loss": 1.8156, + "step": 29746000 + }, + { + "epoch": 86.1, + "learning_rate": 6.9635151329196e-06, + "loss": 1.8132, + "step": 29746500 + }, + { + "epoch": 86.11, + "learning_rate": 6.962792932567618e-06, + "loss": 1.7883, + "step": 29747000 + }, + { + "epoch": 86.11, + "learning_rate": 6.962069284920342e-06, + "loss": 1.8145, + "step": 29747500 + }, + { + "epoch": 86.11, + "learning_rate": 6.961345637273065e-06, + "loss": 1.8117, + "step": 29748000 + }, + { + "epoch": 86.11, + "learning_rate": 6.960621989625787e-06, + "loss": 1.8144, + "step": 29748500 + }, + { + "epoch": 86.11, + "learning_rate": 6.95989834197851e-06, + "loss": 1.8038, + "step": 29749000 + }, + { + "epoch": 86.11, + "learning_rate": 6.959174694331234e-06, + "loss": 1.8127, + "step": 29749500 + }, + { + "epoch": 86.11, + "learning_rate": 6.958451046683957e-06, + "loss": 1.7943, + "step": 29750000 + }, + { + "epoch": 86.12, + "learning_rate": 6.95772739903668e-06, + "loss": 1.8107, + "step": 29750500 + }, + { + "epoch": 86.12, + "learning_rate": 6.957003751389404e-06, + "loss": 1.7924, + "step": 29751000 + }, + { + "epoch": 86.12, + "learning_rate": 6.956280103742127e-06, + "loss": 1.8092, + "step": 29751500 + }, + { + "epoch": 86.12, + "learning_rate": 6.9555579033901445e-06, + "loss": 1.81, + "step": 29752000 + }, + { + "epoch": 86.12, + "learning_rate": 6.9548357030381626e-06, + "loss": 1.809, + "step": 29752500 + }, + { + "epoch": 86.12, + "learning_rate": 6.9541120553908865e-06, + "loss": 1.781, + "step": 29753000 + }, + { + "epoch": 86.12, + "learning_rate": 6.9533884077436096e-06, + "loss": 1.8043, + "step": 29753500 + }, + { + "epoch": 86.13, + "learning_rate": 6.952664760096332e-06, + "loss": 1.7764, + "step": 29754000 + }, + { + "epoch": 86.13, + "learning_rate": 6.951941112449055e-06, + "loss": 1.8324, + "step": 29754500 + }, + { + "epoch": 86.13, + "learning_rate": 6.951217464801779e-06, + "loss": 1.7951, + "step": 29755000 + }, + { + "epoch": 86.13, + "learning_rate": 6.950493817154502e-06, + "loss": 1.8059, + "step": 29755500 + }, + { + "epoch": 86.13, + "learning_rate": 6.949770169507225e-06, + "loss": 1.8034, + "step": 29756000 + }, + { + "epoch": 86.13, + "learning_rate": 6.949046521859949e-06, + "loss": 1.8039, + "step": 29756500 + }, + { + "epoch": 86.13, + "learning_rate": 6.948322874212672e-06, + "loss": 1.8332, + "step": 29757000 + }, + { + "epoch": 86.14, + "learning_rate": 6.947599226565395e-06, + "loss": 1.8153, + "step": 29757500 + }, + { + "epoch": 86.14, + "learning_rate": 6.946877026213412e-06, + "loss": 1.7899, + "step": 29758000 + }, + { + "epoch": 86.14, + "learning_rate": 6.946153378566136e-06, + "loss": 1.8233, + "step": 29758500 + }, + { + "epoch": 86.14, + "learning_rate": 6.945431178214154e-06, + "loss": 1.7933, + "step": 29759000 + }, + { + "epoch": 86.14, + "learning_rate": 6.9447075305668766e-06, + "loss": 1.8211, + "step": 29759500 + }, + { + "epoch": 86.14, + "learning_rate": 6.9439838829196e-06, + "loss": 1.8031, + "step": 29760000 + }, + { + "epoch": 86.14, + "learning_rate": 6.9432602352723236e-06, + "loss": 1.8123, + "step": 29760500 + }, + { + "epoch": 86.15, + "learning_rate": 6.942536587625047e-06, + "loss": 1.8119, + "step": 29761000 + }, + { + "epoch": 86.15, + "learning_rate": 6.94181293997777e-06, + "loss": 1.8341, + "step": 29761500 + }, + { + "epoch": 86.15, + "learning_rate": 6.941089292330494e-06, + "loss": 1.8165, + "step": 29762000 + }, + { + "epoch": 86.15, + "learning_rate": 6.940365644683217e-06, + "loss": 1.833, + "step": 29762500 + }, + { + "epoch": 86.15, + "learning_rate": 6.93964199703594e-06, + "loss": 1.8097, + "step": 29763000 + }, + { + "epoch": 86.15, + "learning_rate": 6.938919796683957e-06, + "loss": 1.8034, + "step": 29763500 + }, + { + "epoch": 86.15, + "learning_rate": 6.938196149036681e-06, + "loss": 1.8095, + "step": 29764000 + }, + { + "epoch": 86.16, + "learning_rate": 6.937472501389404e-06, + "loss": 1.8142, + "step": 29764500 + }, + { + "epoch": 86.16, + "learning_rate": 6.936748853742127e-06, + "loss": 1.7937, + "step": 29765000 + }, + { + "epoch": 86.16, + "learning_rate": 6.936026653390144e-06, + "loss": 1.8075, + "step": 29765500 + }, + { + "epoch": 86.16, + "learning_rate": 6.935303005742868e-06, + "loss": 1.7978, + "step": 29766000 + }, + { + "epoch": 86.16, + "learning_rate": 6.934579358095591e-06, + "loss": 1.82, + "step": 29766500 + }, + { + "epoch": 86.16, + "learning_rate": 6.9338557104483145e-06, + "loss": 1.757, + "step": 29767000 + }, + { + "epoch": 86.16, + "learning_rate": 6.933133510096332e-06, + "loss": 1.8271, + "step": 29767500 + }, + { + "epoch": 86.17, + "learning_rate": 6.932409862449056e-06, + "loss": 1.8089, + "step": 29768000 + }, + { + "epoch": 86.17, + "learning_rate": 6.931686214801779e-06, + "loss": 1.7651, + "step": 29768500 + }, + { + "epoch": 86.17, + "learning_rate": 6.930962567154502e-06, + "loss": 1.8187, + "step": 29769000 + }, + { + "epoch": 86.17, + "learning_rate": 6.930238919507225e-06, + "loss": 1.8107, + "step": 29769500 + }, + { + "epoch": 86.17, + "learning_rate": 6.929515271859949e-06, + "loss": 1.7893, + "step": 29770000 + }, + { + "epoch": 86.17, + "learning_rate": 6.928791624212672e-06, + "loss": 1.7851, + "step": 29770500 + }, + { + "epoch": 86.17, + "learning_rate": 6.928067976565394e-06, + "loss": 1.8108, + "step": 29771000 + }, + { + "epoch": 86.18, + "learning_rate": 6.927345776213413e-06, + "loss": 1.8118, + "step": 29771500 + }, + { + "epoch": 86.18, + "learning_rate": 6.926622128566136e-06, + "loss": 1.8219, + "step": 29772000 + }, + { + "epoch": 86.18, + "learning_rate": 6.925898480918859e-06, + "loss": 1.818, + "step": 29772500 + }, + { + "epoch": 86.18, + "learning_rate": 6.9251748332715815e-06, + "loss": 1.8062, + "step": 29773000 + }, + { + "epoch": 86.18, + "learning_rate": 6.924451185624306e-06, + "loss": 1.8163, + "step": 29773500 + }, + { + "epoch": 86.18, + "learning_rate": 6.9237275379770285e-06, + "loss": 1.8117, + "step": 29774000 + }, + { + "epoch": 86.18, + "learning_rate": 6.923003890329752e-06, + "loss": 1.8094, + "step": 29774500 + }, + { + "epoch": 86.19, + "learning_rate": 6.922280242682476e-06, + "loss": 1.8207, + "step": 29775000 + }, + { + "epoch": 86.19, + "learning_rate": 6.921558042330494e-06, + "loss": 1.7925, + "step": 29775500 + }, + { + "epoch": 86.19, + "learning_rate": 6.920835841978511e-06, + "loss": 1.8096, + "step": 29776000 + }, + { + "epoch": 86.19, + "learning_rate": 6.920112194331234e-06, + "loss": 1.8236, + "step": 29776500 + }, + { + "epoch": 86.19, + "learning_rate": 6.919389993979251e-06, + "loss": 1.8176, + "step": 29777000 + }, + { + "epoch": 86.19, + "learning_rate": 6.918666346331976e-06, + "loss": 1.7865, + "step": 29777500 + }, + { + "epoch": 86.2, + "learning_rate": 6.917942698684698e-06, + "loss": 1.8203, + "step": 29778000 + }, + { + "epoch": 86.2, + "learning_rate": 6.917219051037421e-06, + "loss": 1.8084, + "step": 29778500 + }, + { + "epoch": 86.2, + "learning_rate": 6.916495403390145e-06, + "loss": 1.8126, + "step": 29779000 + }, + { + "epoch": 86.2, + "learning_rate": 6.915771755742868e-06, + "loss": 1.8022, + "step": 29779500 + }, + { + "epoch": 86.2, + "learning_rate": 6.915048108095591e-06, + "loss": 1.7627, + "step": 29780000 + }, + { + "epoch": 86.2, + "learning_rate": 6.914324460448314e-06, + "loss": 1.8059, + "step": 29780500 + }, + { + "epoch": 86.2, + "learning_rate": 6.9136022600963325e-06, + "loss": 1.8046, + "step": 29781000 + }, + { + "epoch": 86.21, + "learning_rate": 6.912878612449056e-06, + "loss": 1.7891, + "step": 29781500 + }, + { + "epoch": 86.21, + "learning_rate": 6.912156412097074e-06, + "loss": 1.7927, + "step": 29782000 + }, + { + "epoch": 86.21, + "learning_rate": 6.911432764449796e-06, + "loss": 1.8031, + "step": 29782500 + }, + { + "epoch": 86.21, + "learning_rate": 6.910709116802521e-06, + "loss": 1.8083, + "step": 29783000 + }, + { + "epoch": 86.21, + "learning_rate": 6.909985469155243e-06, + "loss": 1.8047, + "step": 29783500 + }, + { + "epoch": 86.21, + "learning_rate": 6.909261821507966e-06, + "loss": 1.8085, + "step": 29784000 + }, + { + "epoch": 86.21, + "learning_rate": 6.908538173860689e-06, + "loss": 1.7981, + "step": 29784500 + }, + { + "epoch": 86.22, + "learning_rate": 6.907814526213413e-06, + "loss": 1.8112, + "step": 29785000 + }, + { + "epoch": 86.22, + "learning_rate": 6.907090878566136e-06, + "loss": 1.7989, + "step": 29785500 + }, + { + "epoch": 86.22, + "learning_rate": 6.906370125509448e-06, + "loss": 1.7878, + "step": 29786000 + }, + { + "epoch": 86.22, + "learning_rate": 6.905646477862171e-06, + "loss": 1.8176, + "step": 29786500 + }, + { + "epoch": 86.22, + "learning_rate": 6.904922830214895e-06, + "loss": 1.7928, + "step": 29787000 + }, + { + "epoch": 86.22, + "learning_rate": 6.904199182567618e-06, + "loss": 1.798, + "step": 29787500 + }, + { + "epoch": 86.22, + "learning_rate": 6.903475534920341e-06, + "loss": 1.8519, + "step": 29788000 + }, + { + "epoch": 86.23, + "learning_rate": 6.9027518872730655e-06, + "loss": 1.7654, + "step": 29788500 + }, + { + "epoch": 86.23, + "learning_rate": 6.902028239625788e-06, + "loss": 1.8099, + "step": 29789000 + }, + { + "epoch": 86.23, + "learning_rate": 6.901304591978511e-06, + "loss": 1.7896, + "step": 29789500 + }, + { + "epoch": 86.23, + "learning_rate": 6.900580944331234e-06, + "loss": 1.8094, + "step": 29790000 + }, + { + "epoch": 86.23, + "learning_rate": 6.899858743979253e-06, + "loss": 1.7939, + "step": 29790500 + }, + { + "epoch": 86.23, + "learning_rate": 6.899135096331975e-06, + "loss": 1.8004, + "step": 29791000 + }, + { + "epoch": 86.23, + "learning_rate": 6.898411448684698e-06, + "loss": 1.8175, + "step": 29791500 + }, + { + "epoch": 86.24, + "learning_rate": 6.897687801037421e-06, + "loss": 1.7847, + "step": 29792000 + }, + { + "epoch": 86.24, + "learning_rate": 6.896964153390145e-06, + "loss": 1.787, + "step": 29792500 + }, + { + "epoch": 86.24, + "learning_rate": 6.896240505742868e-06, + "loss": 1.8156, + "step": 29793000 + }, + { + "epoch": 86.24, + "learning_rate": 6.8955183053908855e-06, + "loss": 1.8159, + "step": 29793500 + }, + { + "epoch": 86.24, + "learning_rate": 6.8947946577436086e-06, + "loss": 1.7934, + "step": 29794000 + }, + { + "epoch": 86.24, + "learning_rate": 6.8940710100963325e-06, + "loss": 1.8045, + "step": 29794500 + }, + { + "epoch": 86.24, + "learning_rate": 6.8933473624490556e-06, + "loss": 1.8087, + "step": 29795000 + }, + { + "epoch": 86.25, + "learning_rate": 6.892625162097073e-06, + "loss": 1.791, + "step": 29795500 + }, + { + "epoch": 86.25, + "learning_rate": 6.891901514449796e-06, + "loss": 1.8146, + "step": 29796000 + }, + { + "epoch": 86.25, + "learning_rate": 6.89117786680252e-06, + "loss": 1.8239, + "step": 29796500 + }, + { + "epoch": 86.25, + "learning_rate": 6.890454219155243e-06, + "loss": 1.7856, + "step": 29797000 + }, + { + "epoch": 86.25, + "learning_rate": 6.889730571507966e-06, + "loss": 1.8293, + "step": 29797500 + }, + { + "epoch": 86.25, + "learning_rate": 6.88900692386069e-06, + "loss": 1.8236, + "step": 29798000 + }, + { + "epoch": 86.25, + "learning_rate": 6.888283276213413e-06, + "loss": 1.7856, + "step": 29798500 + }, + { + "epoch": 86.26, + "learning_rate": 6.887559628566135e-06, + "loss": 1.794, + "step": 29799000 + }, + { + "epoch": 86.26, + "learning_rate": 6.8868388755094475e-06, + "loss": 1.8041, + "step": 29799500 + }, + { + "epoch": 86.26, + "learning_rate": 6.886115227862172e-06, + "loss": 1.8215, + "step": 29800000 + }, + { + "epoch": 86.26, + "learning_rate": 6.885391580214895e-06, + "loss": 1.8109, + "step": 29800500 + }, + { + "epoch": 86.26, + "learning_rate": 6.884667932567618e-06, + "loss": 1.797, + "step": 29801000 + }, + { + "epoch": 86.26, + "learning_rate": 6.883944284920341e-06, + "loss": 1.8307, + "step": 29801500 + }, + { + "epoch": 86.26, + "learning_rate": 6.88322208456836e-06, + "loss": 1.8059, + "step": 29802000 + }, + { + "epoch": 86.27, + "learning_rate": 6.882499884216377e-06, + "loss": 1.8079, + "step": 29802500 + }, + { + "epoch": 86.27, + "learning_rate": 6.8817762365691e-06, + "loss": 1.788, + "step": 29803000 + }, + { + "epoch": 86.27, + "learning_rate": 6.881052588921823e-06, + "loss": 1.8097, + "step": 29803500 + }, + { + "epoch": 86.27, + "learning_rate": 6.880328941274547e-06, + "loss": 1.7836, + "step": 29804000 + }, + { + "epoch": 86.27, + "learning_rate": 6.87960529362727e-06, + "loss": 1.7991, + "step": 29804500 + }, + { + "epoch": 86.27, + "learning_rate": 6.878881645979992e-06, + "loss": 1.8143, + "step": 29805000 + }, + { + "epoch": 86.27, + "learning_rate": 6.878157998332715e-06, + "loss": 1.7954, + "step": 29805500 + }, + { + "epoch": 86.28, + "learning_rate": 6.877434350685439e-06, + "loss": 1.7959, + "step": 29806000 + }, + { + "epoch": 86.28, + "learning_rate": 6.876710703038162e-06, + "loss": 1.8276, + "step": 29806500 + }, + { + "epoch": 86.28, + "learning_rate": 6.8759870553908854e-06, + "loss": 1.8175, + "step": 29807000 + }, + { + "epoch": 86.28, + "learning_rate": 6.875263407743609e-06, + "loss": 1.7861, + "step": 29807500 + }, + { + "epoch": 86.28, + "learning_rate": 6.8745397600963324e-06, + "loss": 1.8043, + "step": 29808000 + }, + { + "epoch": 86.28, + "learning_rate": 6.8738161124490555e-06, + "loss": 1.7998, + "step": 29808500 + }, + { + "epoch": 86.28, + "learning_rate": 6.873093912097073e-06, + "loss": 1.8135, + "step": 29809000 + }, + { + "epoch": 86.29, + "learning_rate": 6.872370264449797e-06, + "loss": 1.7984, + "step": 29809500 + }, + { + "epoch": 86.29, + "learning_rate": 6.87164661680252e-06, + "loss": 1.815, + "step": 29810000 + }, + { + "epoch": 86.29, + "learning_rate": 6.870922969155243e-06, + "loss": 1.811, + "step": 29810500 + }, + { + "epoch": 86.29, + "learning_rate": 6.870199321507967e-06, + "loss": 1.8192, + "step": 29811000 + }, + { + "epoch": 86.29, + "learning_rate": 6.86947567386069e-06, + "loss": 1.8312, + "step": 29811500 + }, + { + "epoch": 86.29, + "learning_rate": 6.868752026213412e-06, + "loss": 1.8217, + "step": 29812000 + }, + { + "epoch": 86.29, + "learning_rate": 6.868028378566135e-06, + "loss": 1.8298, + "step": 29812500 + }, + { + "epoch": 86.3, + "learning_rate": 6.8673076255094474e-06, + "loss": 1.7917, + "step": 29813000 + }, + { + "epoch": 86.3, + "learning_rate": 6.866583977862172e-06, + "loss": 1.8095, + "step": 29813500 + }, + { + "epoch": 86.3, + "learning_rate": 6.8658603302148945e-06, + "loss": 1.7854, + "step": 29814000 + }, + { + "epoch": 86.3, + "learning_rate": 6.8651366825676175e-06, + "loss": 1.8135, + "step": 29814500 + }, + { + "epoch": 86.3, + "learning_rate": 6.8644130349203415e-06, + "loss": 1.7928, + "step": 29815000 + }, + { + "epoch": 86.3, + "learning_rate": 6.8636893872730645e-06, + "loss": 1.821, + "step": 29815500 + }, + { + "epoch": 86.31, + "learning_rate": 6.862965739625788e-06, + "loss": 1.7969, + "step": 29816000 + }, + { + "epoch": 86.31, + "learning_rate": 6.862243539273805e-06, + "loss": 1.8349, + "step": 29816500 + }, + { + "epoch": 86.31, + "learning_rate": 6.861519891626529e-06, + "loss": 1.7915, + "step": 29817000 + }, + { + "epoch": 86.31, + "learning_rate": 6.860796243979252e-06, + "loss": 1.7765, + "step": 29817500 + }, + { + "epoch": 86.31, + "learning_rate": 6.860072596331975e-06, + "loss": 1.8081, + "step": 29818000 + }, + { + "epoch": 86.31, + "learning_rate": 6.859348948684699e-06, + "loss": 1.8366, + "step": 29818500 + }, + { + "epoch": 86.31, + "learning_rate": 6.858626748332717e-06, + "loss": 1.8021, + "step": 29819000 + }, + { + "epoch": 86.32, + "learning_rate": 6.857904547980734e-06, + "loss": 1.7975, + "step": 29819500 + }, + { + "epoch": 86.32, + "learning_rate": 6.857180900333457e-06, + "loss": 1.8394, + "step": 29820000 + }, + { + "epoch": 86.32, + "learning_rate": 6.8564572526861795e-06, + "loss": 1.8023, + "step": 29820500 + }, + { + "epoch": 86.32, + "learning_rate": 6.855733605038904e-06, + "loss": 1.7921, + "step": 29821000 + }, + { + "epoch": 86.32, + "learning_rate": 6.8550099573916266e-06, + "loss": 1.795, + "step": 29821500 + }, + { + "epoch": 86.32, + "learning_rate": 6.85428630974435e-06, + "loss": 1.808, + "step": 29822000 + }, + { + "epoch": 86.32, + "learning_rate": 6.8535626620970736e-06, + "loss": 1.7871, + "step": 29822500 + }, + { + "epoch": 86.33, + "learning_rate": 6.852839014449797e-06, + "loss": 1.8114, + "step": 29823000 + }, + { + "epoch": 86.33, + "learning_rate": 6.85211536680252e-06, + "loss": 1.8029, + "step": 29823500 + }, + { + "epoch": 86.33, + "learning_rate": 6.851393166450537e-06, + "loss": 1.7708, + "step": 29824000 + }, + { + "epoch": 86.33, + "learning_rate": 6.850669518803261e-06, + "loss": 1.812, + "step": 29824500 + }, + { + "epoch": 86.33, + "learning_rate": 6.849945871155984e-06, + "loss": 1.8269, + "step": 29825000 + }, + { + "epoch": 86.33, + "learning_rate": 6.849222223508707e-06, + "loss": 1.7907, + "step": 29825500 + }, + { + "epoch": 86.33, + "learning_rate": 6.848500023156724e-06, + "loss": 1.7909, + "step": 29826000 + }, + { + "epoch": 86.34, + "learning_rate": 6.847776375509449e-06, + "loss": 1.8143, + "step": 29826500 + }, + { + "epoch": 86.34, + "learning_rate": 6.847052727862171e-06, + "loss": 1.8055, + "step": 29827000 + }, + { + "epoch": 86.34, + "learning_rate": 6.846329080214894e-06, + "loss": 1.8128, + "step": 29827500 + }, + { + "epoch": 86.34, + "learning_rate": 6.845605432567618e-06, + "loss": 1.7995, + "step": 29828000 + }, + { + "epoch": 86.34, + "learning_rate": 6.8448832322156364e-06, + "loss": 1.7957, + "step": 29828500 + }, + { + "epoch": 86.34, + "learning_rate": 6.844159584568359e-06, + "loss": 1.8045, + "step": 29829000 + }, + { + "epoch": 86.34, + "learning_rate": 6.843435936921082e-06, + "loss": 1.7986, + "step": 29829500 + }, + { + "epoch": 86.35, + "learning_rate": 6.842712289273806e-06, + "loss": 1.8055, + "step": 29830000 + }, + { + "epoch": 86.35, + "learning_rate": 6.841988641626529e-06, + "loss": 1.8119, + "step": 29830500 + }, + { + "epoch": 86.35, + "learning_rate": 6.841266441274546e-06, + "loss": 1.8108, + "step": 29831000 + }, + { + "epoch": 86.35, + "learning_rate": 6.840542793627269e-06, + "loss": 1.7868, + "step": 29831500 + }, + { + "epoch": 86.35, + "learning_rate": 6.839819145979994e-06, + "loss": 1.7819, + "step": 29832000 + }, + { + "epoch": 86.35, + "learning_rate": 6.839095498332716e-06, + "loss": 1.8316, + "step": 29832500 + }, + { + "epoch": 86.35, + "learning_rate": 6.838371850685439e-06, + "loss": 1.7978, + "step": 29833000 + }, + { + "epoch": 86.36, + "learning_rate": 6.837648203038162e-06, + "loss": 1.8445, + "step": 29833500 + }, + { + "epoch": 86.36, + "learning_rate": 6.836924555390886e-06, + "loss": 1.8006, + "step": 29834000 + }, + { + "epoch": 86.36, + "learning_rate": 6.836200907743609e-06, + "loss": 1.8312, + "step": 29834500 + }, + { + "epoch": 86.36, + "learning_rate": 6.8354787073916265e-06, + "loss": 1.7943, + "step": 29835000 + }, + { + "epoch": 86.36, + "learning_rate": 6.8347550597443504e-06, + "loss": 1.8034, + "step": 29835500 + }, + { + "epoch": 86.36, + "learning_rate": 6.8340314120970735e-06, + "loss": 1.8128, + "step": 29836000 + }, + { + "epoch": 86.36, + "learning_rate": 6.833307764449797e-06, + "loss": 1.7845, + "step": 29836500 + }, + { + "epoch": 86.37, + "learning_rate": 6.83258411680252e-06, + "loss": 1.8214, + "step": 29837000 + }, + { + "epoch": 86.37, + "learning_rate": 6.831861916450538e-06, + "loss": 1.8175, + "step": 29837500 + }, + { + "epoch": 86.37, + "learning_rate": 6.831138268803261e-06, + "loss": 1.7928, + "step": 29838000 + }, + { + "epoch": 86.37, + "learning_rate": 6.830416068451279e-06, + "loss": 1.8184, + "step": 29838500 + }, + { + "epoch": 86.37, + "learning_rate": 6.829692420804001e-06, + "loss": 1.789, + "step": 29839000 + }, + { + "epoch": 86.37, + "learning_rate": 6.828968773156726e-06, + "loss": 1.8178, + "step": 29839500 + }, + { + "epoch": 86.37, + "learning_rate": 6.828245125509448e-06, + "loss": 1.8102, + "step": 29840000 + }, + { + "epoch": 86.38, + "learning_rate": 6.827521477862171e-06, + "loss": 1.7935, + "step": 29840500 + }, + { + "epoch": 86.38, + "learning_rate": 6.826797830214894e-06, + "loss": 1.8093, + "step": 29841000 + }, + { + "epoch": 86.38, + "learning_rate": 6.826074182567618e-06, + "loss": 1.8121, + "step": 29841500 + }, + { + "epoch": 86.38, + "learning_rate": 6.825350534920341e-06, + "loss": 1.8207, + "step": 29842000 + }, + { + "epoch": 86.38, + "learning_rate": 6.824629781863654e-06, + "loss": 1.8032, + "step": 29842500 + }, + { + "epoch": 86.38, + "learning_rate": 6.823906134216376e-06, + "loss": 1.8011, + "step": 29843000 + }, + { + "epoch": 86.38, + "learning_rate": 6.823182486569101e-06, + "loss": 1.8326, + "step": 29843500 + }, + { + "epoch": 86.39, + "learning_rate": 6.822458838921824e-06, + "loss": 1.822, + "step": 29844000 + }, + { + "epoch": 86.39, + "learning_rate": 6.821735191274546e-06, + "loss": 1.8237, + "step": 29844500 + }, + { + "epoch": 86.39, + "learning_rate": 6.821012990922564e-06, + "loss": 1.8125, + "step": 29845000 + }, + { + "epoch": 86.39, + "learning_rate": 6.820289343275288e-06, + "loss": 1.802, + "step": 29845500 + }, + { + "epoch": 86.39, + "learning_rate": 6.819565695628011e-06, + "loss": 1.7967, + "step": 29846000 + }, + { + "epoch": 86.39, + "learning_rate": 6.818842047980733e-06, + "loss": 1.7995, + "step": 29846500 + }, + { + "epoch": 86.39, + "learning_rate": 6.818119847628751e-06, + "loss": 1.8095, + "step": 29847000 + }, + { + "epoch": 86.4, + "learning_rate": 6.817396199981475e-06, + "loss": 1.8265, + "step": 29847500 + }, + { + "epoch": 86.4, + "learning_rate": 6.816672552334198e-06, + "loss": 1.7769, + "step": 29848000 + }, + { + "epoch": 86.4, + "learning_rate": 6.815948904686921e-06, + "loss": 1.7864, + "step": 29848500 + }, + { + "epoch": 86.4, + "learning_rate": 6.815225257039645e-06, + "loss": 1.7968, + "step": 29849000 + }, + { + "epoch": 86.4, + "learning_rate": 6.814501609392368e-06, + "loss": 1.8187, + "step": 29849500 + }, + { + "epoch": 86.4, + "learning_rate": 6.813777961745091e-06, + "loss": 1.7943, + "step": 29850000 + }, + { + "epoch": 86.4, + "learning_rate": 6.813054314097814e-06, + "loss": 1.8311, + "step": 29850500 + }, + { + "epoch": 86.41, + "learning_rate": 6.812330666450538e-06, + "loss": 1.7921, + "step": 29851000 + }, + { + "epoch": 86.41, + "learning_rate": 6.811608466098556e-06, + "loss": 1.8337, + "step": 29851500 + }, + { + "epoch": 86.41, + "learning_rate": 6.810884818451278e-06, + "loss": 1.7949, + "step": 29852000 + }, + { + "epoch": 86.41, + "learning_rate": 6.810161170804001e-06, + "loss": 1.813, + "step": 29852500 + }, + { + "epoch": 86.41, + "learning_rate": 6.809437523156725e-06, + "loss": 1.7746, + "step": 29853000 + }, + { + "epoch": 86.41, + "learning_rate": 6.808715322804743e-06, + "loss": 1.7975, + "step": 29853500 + }, + { + "epoch": 86.42, + "learning_rate": 6.80799312245276e-06, + "loss": 1.8237, + "step": 29854000 + }, + { + "epoch": 86.42, + "learning_rate": 6.8072694748054835e-06, + "loss": 1.8037, + "step": 29854500 + }, + { + "epoch": 86.42, + "learning_rate": 6.806545827158207e-06, + "loss": 1.8153, + "step": 29855000 + }, + { + "epoch": 86.42, + "learning_rate": 6.8058221795109305e-06, + "loss": 1.7892, + "step": 29855500 + }, + { + "epoch": 86.42, + "learning_rate": 6.805098531863653e-06, + "loss": 1.8273, + "step": 29856000 + }, + { + "epoch": 86.42, + "learning_rate": 6.8043748842163775e-06, + "loss": 1.8331, + "step": 29856500 + }, + { + "epoch": 86.42, + "learning_rate": 6.803651236569101e-06, + "loss": 1.8193, + "step": 29857000 + }, + { + "epoch": 86.43, + "learning_rate": 6.802927588921823e-06, + "loss": 1.8437, + "step": 29857500 + }, + { + "epoch": 86.43, + "learning_rate": 6.802203941274546e-06, + "loss": 1.8086, + "step": 29858000 + }, + { + "epoch": 86.43, + "learning_rate": 6.80148029362727e-06, + "loss": 1.8325, + "step": 29858500 + }, + { + "epoch": 86.43, + "learning_rate": 6.800756645979993e-06, + "loss": 1.7911, + "step": 29859000 + }, + { + "epoch": 86.43, + "learning_rate": 6.800032998332716e-06, + "loss": 1.8359, + "step": 29859500 + }, + { + "epoch": 86.43, + "learning_rate": 6.79930935068544e-06, + "loss": 1.8307, + "step": 29860000 + }, + { + "epoch": 86.43, + "learning_rate": 6.798585703038163e-06, + "loss": 1.813, + "step": 29860500 + }, + { + "epoch": 86.44, + "learning_rate": 6.797862055390885e-06, + "loss": 1.8099, + "step": 29861000 + }, + { + "epoch": 86.44, + "learning_rate": 6.797139855038903e-06, + "loss": 1.8023, + "step": 29861500 + }, + { + "epoch": 86.44, + "learning_rate": 6.796416207391627e-06, + "loss": 1.8077, + "step": 29862000 + }, + { + "epoch": 86.44, + "learning_rate": 6.795694007039645e-06, + "loss": 1.8272, + "step": 29862500 + }, + { + "epoch": 86.44, + "learning_rate": 6.794970359392368e-06, + "loss": 1.8002, + "step": 29863000 + }, + { + "epoch": 86.44, + "learning_rate": 6.794246711745091e-06, + "loss": 1.8133, + "step": 29863500 + }, + { + "epoch": 86.44, + "learning_rate": 6.793523064097815e-06, + "loss": 1.825, + "step": 29864000 + }, + { + "epoch": 86.45, + "learning_rate": 6.792799416450538e-06, + "loss": 1.795, + "step": 29864500 + }, + { + "epoch": 86.45, + "learning_rate": 6.792075768803261e-06, + "loss": 1.8125, + "step": 29865000 + }, + { + "epoch": 86.45, + "learning_rate": 6.791353568451278e-06, + "loss": 1.816, + "step": 29865500 + }, + { + "epoch": 86.45, + "learning_rate": 6.790629920804002e-06, + "loss": 1.8272, + "step": 29866000 + }, + { + "epoch": 86.45, + "learning_rate": 6.789906273156725e-06, + "loss": 1.8044, + "step": 29866500 + }, + { + "epoch": 86.45, + "learning_rate": 6.789184072804742e-06, + "loss": 1.8104, + "step": 29867000 + }, + { + "epoch": 86.45, + "learning_rate": 6.788460425157465e-06, + "loss": 1.8036, + "step": 29867500 + }, + { + "epoch": 86.46, + "learning_rate": 6.787736777510189e-06, + "loss": 1.8056, + "step": 29868000 + }, + { + "epoch": 86.46, + "learning_rate": 6.787013129862912e-06, + "loss": 1.8417, + "step": 29868500 + }, + { + "epoch": 86.46, + "learning_rate": 6.7862894822156354e-06, + "loss": 1.8231, + "step": 29869000 + }, + { + "epoch": 86.46, + "learning_rate": 6.785565834568359e-06, + "loss": 1.8104, + "step": 29869500 + }, + { + "epoch": 86.46, + "learning_rate": 6.7848421869210824e-06, + "loss": 1.7812, + "step": 29870000 + }, + { + "epoch": 86.46, + "learning_rate": 6.7841199865691e-06, + "loss": 1.8048, + "step": 29870500 + }, + { + "epoch": 86.46, + "learning_rate": 6.783396338921823e-06, + "loss": 1.8066, + "step": 29871000 + }, + { + "epoch": 86.47, + "learning_rate": 6.782672691274547e-06, + "loss": 1.8158, + "step": 29871500 + }, + { + "epoch": 86.47, + "learning_rate": 6.78194904362727e-06, + "loss": 1.7987, + "step": 29872000 + }, + { + "epoch": 86.47, + "learning_rate": 6.781225395979993e-06, + "loss": 1.8062, + "step": 29872500 + }, + { + "epoch": 86.47, + "learning_rate": 6.780501748332715e-06, + "loss": 1.789, + "step": 29873000 + }, + { + "epoch": 86.47, + "learning_rate": 6.77977810068544e-06, + "loss": 1.8114, + "step": 29873500 + }, + { + "epoch": 86.47, + "learning_rate": 6.779054453038162e-06, + "loss": 1.7924, + "step": 29874000 + }, + { + "epoch": 86.47, + "learning_rate": 6.778330805390885e-06, + "loss": 1.8158, + "step": 29874500 + }, + { + "epoch": 86.48, + "learning_rate": 6.77760715774361e-06, + "loss": 1.8238, + "step": 29875000 + }, + { + "epoch": 86.48, + "learning_rate": 6.776884957391627e-06, + "loss": 1.8316, + "step": 29875500 + }, + { + "epoch": 86.48, + "learning_rate": 6.77616130974435e-06, + "loss": 1.7889, + "step": 29876000 + }, + { + "epoch": 86.48, + "learning_rate": 6.7754376620970725e-06, + "loss": 1.8144, + "step": 29876500 + }, + { + "epoch": 86.48, + "learning_rate": 6.774714014449797e-06, + "loss": 1.7953, + "step": 29877000 + }, + { + "epoch": 86.48, + "learning_rate": 6.7739903668025195e-06, + "loss": 1.7803, + "step": 29877500 + }, + { + "epoch": 86.48, + "learning_rate": 6.773266719155243e-06, + "loss": 1.8174, + "step": 29878000 + }, + { + "epoch": 86.49, + "learning_rate": 6.7725430715079665e-06, + "loss": 1.7986, + "step": 29878500 + }, + { + "epoch": 86.49, + "learning_rate": 6.77181942386069e-06, + "loss": 1.8107, + "step": 29879000 + }, + { + "epoch": 86.49, + "learning_rate": 6.771097223508707e-06, + "loss": 1.7875, + "step": 29879500 + }, + { + "epoch": 86.49, + "learning_rate": 6.77037357586143e-06, + "loss": 1.8079, + "step": 29880000 + }, + { + "epoch": 86.49, + "learning_rate": 6.769649928214154e-06, + "loss": 1.8216, + "step": 29880500 + }, + { + "epoch": 86.49, + "learning_rate": 6.768926280566877e-06, + "loss": 1.8209, + "step": 29881000 + }, + { + "epoch": 86.49, + "learning_rate": 6.7682026329196e-06, + "loss": 1.795, + "step": 29881500 + }, + { + "epoch": 86.5, + "learning_rate": 6.767480432567617e-06, + "loss": 1.83, + "step": 29882000 + }, + { + "epoch": 86.5, + "learning_rate": 6.766756784920342e-06, + "loss": 1.7991, + "step": 29882500 + }, + { + "epoch": 86.5, + "learning_rate": 6.766033137273064e-06, + "loss": 1.7896, + "step": 29883000 + }, + { + "epoch": 86.5, + "learning_rate": 6.765309489625787e-06, + "loss": 1.8229, + "step": 29883500 + }, + { + "epoch": 86.5, + "learning_rate": 6.7645858419785104e-06, + "loss": 1.815, + "step": 29884000 + }, + { + "epoch": 86.5, + "learning_rate": 6.763863641626529e-06, + "loss": 1.838, + "step": 29884500 + }, + { + "epoch": 86.5, + "learning_rate": 6.763141441274547e-06, + "loss": 1.8147, + "step": 29885000 + }, + { + "epoch": 86.51, + "learning_rate": 6.76241779362727e-06, + "loss": 1.8001, + "step": 29885500 + }, + { + "epoch": 86.51, + "learning_rate": 6.761694145979992e-06, + "loss": 1.8085, + "step": 29886000 + }, + { + "epoch": 86.51, + "learning_rate": 6.760970498332717e-06, + "loss": 1.8005, + "step": 29886500 + }, + { + "epoch": 86.51, + "learning_rate": 6.76024685068544e-06, + "loss": 1.8292, + "step": 29887000 + }, + { + "epoch": 86.51, + "learning_rate": 6.759523203038162e-06, + "loss": 1.8282, + "step": 29887500 + }, + { + "epoch": 86.51, + "learning_rate": 6.758799555390887e-06, + "loss": 1.8021, + "step": 29888000 + }, + { + "epoch": 86.51, + "learning_rate": 6.758075907743609e-06, + "loss": 1.8121, + "step": 29888500 + }, + { + "epoch": 86.52, + "learning_rate": 6.757352260096332e-06, + "loss": 1.825, + "step": 29889000 + }, + { + "epoch": 86.52, + "learning_rate": 6.756630059744349e-06, + "loss": 1.7995, + "step": 29889500 + }, + { + "epoch": 86.52, + "learning_rate": 6.755906412097074e-06, + "loss": 1.8154, + "step": 29890000 + }, + { + "epoch": 86.52, + "learning_rate": 6.755184211745091e-06, + "loss": 1.8154, + "step": 29890500 + }, + { + "epoch": 86.52, + "learning_rate": 6.7544605640978145e-06, + "loss": 1.8169, + "step": 29891000 + }, + { + "epoch": 86.52, + "learning_rate": 6.753736916450537e-06, + "loss": 1.8122, + "step": 29891500 + }, + { + "epoch": 86.53, + "learning_rate": 6.7530132688032615e-06, + "loss": 1.7977, + "step": 29892000 + }, + { + "epoch": 86.53, + "learning_rate": 6.752289621155984e-06, + "loss": 1.8163, + "step": 29892500 + }, + { + "epoch": 86.53, + "learning_rate": 6.751565973508707e-06, + "loss": 1.7756, + "step": 29893000 + }, + { + "epoch": 86.53, + "learning_rate": 6.750842325861432e-06, + "loss": 1.7799, + "step": 29893500 + }, + { + "epoch": 86.53, + "learning_rate": 6.750118678214154e-06, + "loss": 1.8228, + "step": 29894000 + }, + { + "epoch": 86.53, + "learning_rate": 6.749396477862172e-06, + "loss": 1.8082, + "step": 29894500 + }, + { + "epoch": 86.53, + "learning_rate": 6.748674277510189e-06, + "loss": 1.7961, + "step": 29895000 + }, + { + "epoch": 86.54, + "learning_rate": 6.747950629862912e-06, + "loss": 1.8145, + "step": 29895500 + }, + { + "epoch": 86.54, + "learning_rate": 6.747226982215636e-06, + "loss": 1.8172, + "step": 29896000 + }, + { + "epoch": 86.54, + "learning_rate": 6.746503334568359e-06, + "loss": 1.7858, + "step": 29896500 + }, + { + "epoch": 86.54, + "learning_rate": 6.7457796869210815e-06, + "loss": 1.8121, + "step": 29897000 + }, + { + "epoch": 86.54, + "learning_rate": 6.745056039273806e-06, + "loss": 1.7836, + "step": 29897500 + }, + { + "epoch": 86.54, + "learning_rate": 6.7443323916265285e-06, + "loss": 1.7921, + "step": 29898000 + }, + { + "epoch": 86.54, + "learning_rate": 6.7436087439792516e-06, + "loss": 1.8267, + "step": 29898500 + }, + { + "epoch": 86.55, + "learning_rate": 6.742886543627269e-06, + "loss": 1.7937, + "step": 29899000 + }, + { + "epoch": 86.55, + "learning_rate": 6.742162895979994e-06, + "loss": 1.7905, + "step": 29899500 + }, + { + "epoch": 86.55, + "learning_rate": 6.741440695628011e-06, + "loss": 1.7735, + "step": 29900000 + }, + { + "epoch": 86.55, + "learning_rate": 6.740717047980734e-06, + "loss": 1.8119, + "step": 29900500 + }, + { + "epoch": 86.55, + "learning_rate": 6.739993400333457e-06, + "loss": 1.8253, + "step": 29901000 + }, + { + "epoch": 86.55, + "learning_rate": 6.739269752686181e-06, + "loss": 1.8052, + "step": 29901500 + }, + { + "epoch": 86.55, + "learning_rate": 6.738546105038904e-06, + "loss": 1.8062, + "step": 29902000 + }, + { + "epoch": 86.56, + "learning_rate": 6.737822457391626e-06, + "loss": 1.805, + "step": 29902500 + }, + { + "epoch": 86.56, + "learning_rate": 6.737098809744351e-06, + "loss": 1.799, + "step": 29903000 + }, + { + "epoch": 86.56, + "learning_rate": 6.736375162097073e-06, + "loss": 1.8083, + "step": 29903500 + }, + { + "epoch": 86.56, + "learning_rate": 6.735651514449796e-06, + "loss": 1.8151, + "step": 29904000 + }, + { + "epoch": 86.56, + "learning_rate": 6.734927866802519e-06, + "loss": 1.7974, + "step": 29904500 + }, + { + "epoch": 86.56, + "learning_rate": 6.734205666450538e-06, + "loss": 1.8088, + "step": 29905000 + }, + { + "epoch": 86.56, + "learning_rate": 6.733482018803261e-06, + "loss": 1.8159, + "step": 29905500 + }, + { + "epoch": 86.57, + "learning_rate": 6.732758371155984e-06, + "loss": 1.785, + "step": 29906000 + }, + { + "epoch": 86.57, + "learning_rate": 6.732034723508707e-06, + "loss": 1.7927, + "step": 29906500 + }, + { + "epoch": 86.57, + "learning_rate": 6.731311075861431e-06, + "loss": 1.8074, + "step": 29907000 + }, + { + "epoch": 86.57, + "learning_rate": 6.730587428214154e-06, + "loss": 1.8039, + "step": 29907500 + }, + { + "epoch": 86.57, + "learning_rate": 6.729866675157466e-06, + "loss": 1.8067, + "step": 29908000 + }, + { + "epoch": 86.57, + "learning_rate": 6.729143027510189e-06, + "loss": 1.8141, + "step": 29908500 + }, + { + "epoch": 86.57, + "learning_rate": 6.728419379862913e-06, + "loss": 1.8083, + "step": 29909000 + }, + { + "epoch": 86.58, + "learning_rate": 6.727695732215636e-06, + "loss": 1.7784, + "step": 29909500 + }, + { + "epoch": 86.58, + "learning_rate": 6.726972084568358e-06, + "loss": 1.8316, + "step": 29910000 + }, + { + "epoch": 86.58, + "learning_rate": 6.7262484369210814e-06, + "loss": 1.8186, + "step": 29910500 + }, + { + "epoch": 86.58, + "learning_rate": 6.725524789273805e-06, + "loss": 1.7813, + "step": 29911000 + }, + { + "epoch": 86.58, + "learning_rate": 6.7248011416265284e-06, + "loss": 1.7994, + "step": 29911500 + }, + { + "epoch": 86.58, + "learning_rate": 6.7240774939792515e-06, + "loss": 1.8025, + "step": 29912000 + }, + { + "epoch": 86.58, + "learning_rate": 6.7233552936272705e-06, + "loss": 1.8096, + "step": 29912500 + }, + { + "epoch": 86.59, + "learning_rate": 6.7226316459799935e-06, + "loss": 1.8413, + "step": 29913000 + }, + { + "epoch": 86.59, + "learning_rate": 6.721907998332716e-06, + "loss": 1.8226, + "step": 29913500 + }, + { + "epoch": 86.59, + "learning_rate": 6.721184350685439e-06, + "loss": 1.8148, + "step": 29914000 + }, + { + "epoch": 86.59, + "learning_rate": 6.720460703038163e-06, + "loss": 1.8021, + "step": 29914500 + }, + { + "epoch": 86.59, + "learning_rate": 6.719738502686181e-06, + "loss": 1.8284, + "step": 29915000 + }, + { + "epoch": 86.59, + "learning_rate": 6.719014855038903e-06, + "loss": 1.7991, + "step": 29915500 + }, + { + "epoch": 86.59, + "learning_rate": 6.718291207391626e-06, + "loss": 1.7827, + "step": 29916000 + }, + { + "epoch": 86.6, + "learning_rate": 6.71756755974435e-06, + "loss": 1.7843, + "step": 29916500 + }, + { + "epoch": 86.6, + "learning_rate": 6.716843912097073e-06, + "loss": 1.8041, + "step": 29917000 + }, + { + "epoch": 86.6, + "learning_rate": 6.7161217117450905e-06, + "loss": 1.7988, + "step": 29917500 + }, + { + "epoch": 86.6, + "learning_rate": 6.7153995113931086e-06, + "loss": 1.8287, + "step": 29918000 + }, + { + "epoch": 86.6, + "learning_rate": 6.7146758637458325e-06, + "loss": 1.8156, + "step": 29918500 + }, + { + "epoch": 86.6, + "learning_rate": 6.7139522160985556e-06, + "loss": 1.7967, + "step": 29919000 + }, + { + "epoch": 86.6, + "learning_rate": 6.713228568451279e-06, + "loss": 1.8212, + "step": 29919500 + }, + { + "epoch": 86.61, + "learning_rate": 6.712506368099296e-06, + "loss": 1.8126, + "step": 29920000 + }, + { + "epoch": 86.61, + "learning_rate": 6.71178272045202e-06, + "loss": 1.7994, + "step": 29920500 + }, + { + "epoch": 86.61, + "learning_rate": 6.711059072804743e-06, + "loss": 1.7849, + "step": 29921000 + }, + { + "epoch": 86.61, + "learning_rate": 6.710335425157466e-06, + "loss": 1.8113, + "step": 29921500 + }, + { + "epoch": 86.61, + "learning_rate": 6.70961177751019e-06, + "loss": 1.8252, + "step": 29922000 + }, + { + "epoch": 86.61, + "learning_rate": 6.708888129862913e-06, + "loss": 1.8114, + "step": 29922500 + }, + { + "epoch": 86.61, + "learning_rate": 6.708164482215635e-06, + "loss": 1.8008, + "step": 29923000 + }, + { + "epoch": 86.62, + "learning_rate": 6.707440834568358e-06, + "loss": 1.8106, + "step": 29923500 + }, + { + "epoch": 86.62, + "learning_rate": 6.706717186921082e-06, + "loss": 1.8122, + "step": 29924000 + }, + { + "epoch": 86.62, + "learning_rate": 6.705993539273805e-06, + "loss": 1.7963, + "step": 29924500 + }, + { + "epoch": 86.62, + "learning_rate": 6.705271338921823e-06, + "loss": 1.8098, + "step": 29925000 + }, + { + "epoch": 86.62, + "learning_rate": 6.704547691274546e-06, + "loss": 1.7944, + "step": 29925500 + }, + { + "epoch": 86.62, + "learning_rate": 6.70382404362727e-06, + "loss": 1.8149, + "step": 29926000 + }, + { + "epoch": 86.62, + "learning_rate": 6.703100395979993e-06, + "loss": 1.793, + "step": 29926500 + }, + { + "epoch": 86.63, + "learning_rate": 6.702376748332716e-06, + "loss": 1.7886, + "step": 29927000 + }, + { + "epoch": 86.63, + "learning_rate": 6.701655995276028e-06, + "loss": 1.8079, + "step": 29927500 + }, + { + "epoch": 86.63, + "learning_rate": 6.700932347628752e-06, + "loss": 1.8061, + "step": 29928000 + }, + { + "epoch": 86.63, + "learning_rate": 6.700208699981475e-06, + "loss": 1.8068, + "step": 29928500 + }, + { + "epoch": 86.63, + "learning_rate": 6.699485052334198e-06, + "loss": 1.7873, + "step": 29929000 + }, + { + "epoch": 86.63, + "learning_rate": 6.698761404686922e-06, + "loss": 1.8184, + "step": 29929500 + }, + { + "epoch": 86.64, + "learning_rate": 6.698037757039645e-06, + "loss": 1.8363, + "step": 29930000 + }, + { + "epoch": 86.64, + "learning_rate": 6.697314109392368e-06, + "loss": 1.8307, + "step": 29930500 + }, + { + "epoch": 86.64, + "learning_rate": 6.69659046174509e-06, + "loss": 1.8157, + "step": 29931000 + }, + { + "epoch": 86.64, + "learning_rate": 6.695868261393109e-06, + "loss": 1.8168, + "step": 29931500 + }, + { + "epoch": 86.64, + "learning_rate": 6.6951446137458324e-06, + "loss": 1.7983, + "step": 29932000 + }, + { + "epoch": 86.64, + "learning_rate": 6.6944209660985555e-06, + "loss": 1.7923, + "step": 29932500 + }, + { + "epoch": 86.64, + "learning_rate": 6.693697318451278e-06, + "loss": 1.8385, + "step": 29933000 + }, + { + "epoch": 86.65, + "learning_rate": 6.692975118099297e-06, + "loss": 1.8269, + "step": 29933500 + }, + { + "epoch": 86.65, + "learning_rate": 6.69225147045202e-06, + "loss": 1.7897, + "step": 29934000 + }, + { + "epoch": 86.65, + "learning_rate": 6.691527822804743e-06, + "loss": 1.81, + "step": 29934500 + }, + { + "epoch": 86.65, + "learning_rate": 6.690804175157465e-06, + "loss": 1.8119, + "step": 29935000 + }, + { + "epoch": 86.65, + "learning_rate": 6.69008052751019e-06, + "loss": 1.7996, + "step": 29935500 + }, + { + "epoch": 86.65, + "learning_rate": 6.689358327158207e-06, + "loss": 1.7904, + "step": 29936000 + }, + { + "epoch": 86.65, + "learning_rate": 6.68863467951093e-06, + "loss": 1.806, + "step": 29936500 + }, + { + "epoch": 86.66, + "learning_rate": 6.687911031863653e-06, + "loss": 1.8117, + "step": 29937000 + }, + { + "epoch": 86.66, + "learning_rate": 6.687187384216377e-06, + "loss": 1.7923, + "step": 29937500 + }, + { + "epoch": 86.66, + "learning_rate": 6.6864637365691e-06, + "loss": 1.8179, + "step": 29938000 + }, + { + "epoch": 86.66, + "learning_rate": 6.6857400889218225e-06, + "loss": 1.7966, + "step": 29938500 + }, + { + "epoch": 86.66, + "learning_rate": 6.685016441274547e-06, + "loss": 1.7935, + "step": 29939000 + }, + { + "epoch": 86.66, + "learning_rate": 6.6842927936272695e-06, + "loss": 1.8116, + "step": 29939500 + }, + { + "epoch": 86.66, + "learning_rate": 6.683569145979993e-06, + "loss": 1.8065, + "step": 29940000 + }, + { + "epoch": 86.67, + "learning_rate": 6.682845498332716e-06, + "loss": 1.8147, + "step": 29940500 + }, + { + "epoch": 86.67, + "learning_rate": 6.68212185068544e-06, + "loss": 1.8148, + "step": 29941000 + }, + { + "epoch": 86.67, + "learning_rate": 6.681398203038163e-06, + "loss": 1.8076, + "step": 29941500 + }, + { + "epoch": 86.67, + "learning_rate": 6.68067600268618e-06, + "loss": 1.8123, + "step": 29942000 + }, + { + "epoch": 86.67, + "learning_rate": 6.679953802334197e-06, + "loss": 1.785, + "step": 29942500 + }, + { + "epoch": 86.67, + "learning_rate": 6.679231601982216e-06, + "loss": 1.8179, + "step": 29943000 + }, + { + "epoch": 86.67, + "learning_rate": 6.678507954334939e-06, + "loss": 1.8158, + "step": 29943500 + }, + { + "epoch": 86.68, + "learning_rate": 6.677784306687662e-06, + "loss": 1.802, + "step": 29944000 + }, + { + "epoch": 86.68, + "learning_rate": 6.677060659040385e-06, + "loss": 1.8043, + "step": 29944500 + }, + { + "epoch": 86.68, + "learning_rate": 6.676337011393109e-06, + "loss": 1.811, + "step": 29945000 + }, + { + "epoch": 86.68, + "learning_rate": 6.675613363745832e-06, + "loss": 1.7992, + "step": 29945500 + }, + { + "epoch": 86.68, + "learning_rate": 6.674889716098555e-06, + "loss": 1.8119, + "step": 29946000 + }, + { + "epoch": 86.68, + "learning_rate": 6.674166068451279e-06, + "loss": 1.7955, + "step": 29946500 + }, + { + "epoch": 86.68, + "learning_rate": 6.673442420804002e-06, + "loss": 1.8074, + "step": 29947000 + }, + { + "epoch": 86.69, + "learning_rate": 6.67272022045202e-06, + "loss": 1.7968, + "step": 29947500 + }, + { + "epoch": 86.69, + "learning_rate": 6.671996572804742e-06, + "loss": 1.783, + "step": 29948000 + }, + { + "epoch": 86.69, + "learning_rate": 6.671274372452761e-06, + "loss": 1.7843, + "step": 29948500 + }, + { + "epoch": 86.69, + "learning_rate": 6.670550724805484e-06, + "loss": 1.804, + "step": 29949000 + }, + { + "epoch": 86.69, + "learning_rate": 6.669827077158207e-06, + "loss": 1.799, + "step": 29949500 + }, + { + "epoch": 86.69, + "learning_rate": 6.66910342951093e-06, + "loss": 1.8334, + "step": 29950000 + }, + { + "epoch": 86.69, + "learning_rate": 6.668379781863654e-06, + "loss": 1.7898, + "step": 29950500 + }, + { + "epoch": 86.7, + "learning_rate": 6.667656134216377e-06, + "loss": 1.7964, + "step": 29951000 + }, + { + "epoch": 86.7, + "learning_rate": 6.666932486569099e-06, + "loss": 1.8334, + "step": 29951500 + }, + { + "epoch": 86.7, + "learning_rate": 6.666208838921824e-06, + "loss": 1.8103, + "step": 29952000 + }, + { + "epoch": 86.7, + "learning_rate": 6.665485191274546e-06, + "loss": 1.8052, + "step": 29952500 + }, + { + "epoch": 86.7, + "learning_rate": 6.6647629909225645e-06, + "loss": 1.7852, + "step": 29953000 + }, + { + "epoch": 86.7, + "learning_rate": 6.664039343275287e-06, + "loss": 1.8155, + "step": 29953500 + }, + { + "epoch": 86.7, + "learning_rate": 6.6633156956280115e-06, + "loss": 1.8041, + "step": 29954000 + }, + { + "epoch": 86.71, + "learning_rate": 6.662592047980734e-06, + "loss": 1.7877, + "step": 29954500 + }, + { + "epoch": 86.71, + "learning_rate": 6.661868400333457e-06, + "loss": 1.7974, + "step": 29955000 + }, + { + "epoch": 86.71, + "learning_rate": 6.66114475268618e-06, + "loss": 1.8468, + "step": 29955500 + }, + { + "epoch": 86.71, + "learning_rate": 6.660422552334199e-06, + "loss": 1.8045, + "step": 29956000 + }, + { + "epoch": 86.71, + "learning_rate": 6.659700351982216e-06, + "loss": 1.8258, + "step": 29956500 + }, + { + "epoch": 86.71, + "learning_rate": 6.658976704334939e-06, + "loss": 1.8164, + "step": 29957000 + }, + { + "epoch": 86.71, + "learning_rate": 6.658253056687662e-06, + "loss": 1.8145, + "step": 29957500 + }, + { + "epoch": 86.72, + "learning_rate": 6.657529409040386e-06, + "loss": 1.8167, + "step": 29958000 + }, + { + "epoch": 86.72, + "learning_rate": 6.656805761393109e-06, + "loss": 1.818, + "step": 29958500 + }, + { + "epoch": 86.72, + "learning_rate": 6.6560821137458315e-06, + "loss": 1.8135, + "step": 29959000 + }, + { + "epoch": 86.72, + "learning_rate": 6.655358466098556e-06, + "loss": 1.8195, + "step": 29959500 + }, + { + "epoch": 86.72, + "learning_rate": 6.6546348184512785e-06, + "loss": 1.8148, + "step": 29960000 + }, + { + "epoch": 86.72, + "learning_rate": 6.6539111708040016e-06, + "loss": 1.8047, + "step": 29960500 + }, + { + "epoch": 86.72, + "learning_rate": 6.653188970452019e-06, + "loss": 1.8386, + "step": 29961000 + }, + { + "epoch": 86.73, + "learning_rate": 6.652465322804744e-06, + "loss": 1.8289, + "step": 29961500 + }, + { + "epoch": 86.73, + "learning_rate": 6.651741675157467e-06, + "loss": 1.8005, + "step": 29962000 + }, + { + "epoch": 86.73, + "learning_rate": 6.651018027510189e-06, + "loss": 1.8171, + "step": 29962500 + }, + { + "epoch": 86.73, + "learning_rate": 6.650294379862912e-06, + "loss": 1.7933, + "step": 29963000 + }, + { + "epoch": 86.73, + "learning_rate": 6.649570732215636e-06, + "loss": 1.7961, + "step": 29963500 + }, + { + "epoch": 86.73, + "learning_rate": 6.648848531863654e-06, + "loss": 1.8021, + "step": 29964000 + }, + { + "epoch": 86.73, + "learning_rate": 6.648124884216376e-06, + "loss": 1.825, + "step": 29964500 + }, + { + "epoch": 86.74, + "learning_rate": 6.647401236569099e-06, + "loss": 1.8038, + "step": 29965000 + }, + { + "epoch": 86.74, + "learning_rate": 6.646677588921823e-06, + "loss": 1.7941, + "step": 29965500 + }, + { + "epoch": 86.74, + "learning_rate": 6.645953941274546e-06, + "loss": 1.8318, + "step": 29966000 + }, + { + "epoch": 86.74, + "learning_rate": 6.645230293627269e-06, + "loss": 1.8136, + "step": 29966500 + }, + { + "epoch": 86.74, + "learning_rate": 6.644509540570582e-06, + "loss": 1.8013, + "step": 29967000 + }, + { + "epoch": 86.74, + "learning_rate": 6.643785892923306e-06, + "loss": 1.787, + "step": 29967500 + }, + { + "epoch": 86.75, + "learning_rate": 6.643062245276029e-06, + "loss": 1.8029, + "step": 29968000 + }, + { + "epoch": 86.75, + "learning_rate": 6.642338597628752e-06, + "loss": 1.8033, + "step": 29968500 + }, + { + "epoch": 86.75, + "learning_rate": 6.641614949981476e-06, + "loss": 1.792, + "step": 29969000 + }, + { + "epoch": 86.75, + "learning_rate": 6.640891302334199e-06, + "loss": 1.8013, + "step": 29969500 + }, + { + "epoch": 86.75, + "learning_rate": 6.640169101982216e-06, + "loss": 1.8276, + "step": 29970000 + }, + { + "epoch": 86.75, + "learning_rate": 6.639446901630233e-06, + "loss": 1.7905, + "step": 29970500 + }, + { + "epoch": 86.75, + "learning_rate": 6.638723253982956e-06, + "loss": 1.8152, + "step": 29971000 + }, + { + "epoch": 86.76, + "learning_rate": 6.63799960633568e-06, + "loss": 1.8306, + "step": 29971500 + }, + { + "epoch": 86.76, + "learning_rate": 6.637275958688403e-06, + "loss": 1.8156, + "step": 29972000 + }, + { + "epoch": 86.76, + "learning_rate": 6.6365523110411264e-06, + "loss": 1.7857, + "step": 29972500 + }, + { + "epoch": 86.76, + "learning_rate": 6.63582866339385e-06, + "loss": 1.8184, + "step": 29973000 + }, + { + "epoch": 86.76, + "learning_rate": 6.6351050157465735e-06, + "loss": 1.8101, + "step": 29973500 + }, + { + "epoch": 86.76, + "learning_rate": 6.6343813680992965e-06, + "loss": 1.792, + "step": 29974000 + }, + { + "epoch": 86.76, + "learning_rate": 6.633657720452019e-06, + "loss": 1.8222, + "step": 29974500 + }, + { + "epoch": 86.77, + "learning_rate": 6.6329340728047435e-06, + "loss": 1.795, + "step": 29975000 + }, + { + "epoch": 86.77, + "learning_rate": 6.632210425157466e-06, + "loss": 1.8394, + "step": 29975500 + }, + { + "epoch": 86.77, + "learning_rate": 6.631486777510189e-06, + "loss": 1.8049, + "step": 29976000 + }, + { + "epoch": 86.77, + "learning_rate": 6.630763129862913e-06, + "loss": 1.7809, + "step": 29976500 + }, + { + "epoch": 86.77, + "learning_rate": 6.630040929510931e-06, + "loss": 1.8096, + "step": 29977000 + }, + { + "epoch": 86.77, + "learning_rate": 6.629317281863653e-06, + "loss": 1.7851, + "step": 29977500 + }, + { + "epoch": 86.77, + "learning_rate": 6.628593634216376e-06, + "loss": 1.7994, + "step": 29978000 + }, + { + "epoch": 86.78, + "learning_rate": 6.6278699865691e-06, + "loss": 1.807, + "step": 29978500 + }, + { + "epoch": 86.78, + "learning_rate": 6.627147786217118e-06, + "loss": 1.7975, + "step": 29979000 + }, + { + "epoch": 86.78, + "learning_rate": 6.6264255858651355e-06, + "loss": 1.8024, + "step": 29979500 + }, + { + "epoch": 86.78, + "learning_rate": 6.6257019382178585e-06, + "loss": 1.8017, + "step": 29980000 + }, + { + "epoch": 86.78, + "learning_rate": 6.6249782905705825e-06, + "loss": 1.8096, + "step": 29980500 + }, + { + "epoch": 86.78, + "learning_rate": 6.6242546429233056e-06, + "loss": 1.8005, + "step": 29981000 + }, + { + "epoch": 86.78, + "learning_rate": 6.623530995276029e-06, + "loss": 1.8274, + "step": 29981500 + }, + { + "epoch": 86.79, + "learning_rate": 6.622808794924046e-06, + "loss": 1.818, + "step": 29982000 + }, + { + "epoch": 86.79, + "learning_rate": 6.62208514727677e-06, + "loss": 1.8187, + "step": 29982500 + }, + { + "epoch": 86.79, + "learning_rate": 6.621361499629493e-06, + "loss": 1.8091, + "step": 29983000 + }, + { + "epoch": 86.79, + "learning_rate": 6.620637851982216e-06, + "loss": 1.8219, + "step": 29983500 + }, + { + "epoch": 86.79, + "learning_rate": 6.619914204334938e-06, + "loss": 1.8212, + "step": 29984000 + }, + { + "epoch": 86.79, + "learning_rate": 6.619190556687663e-06, + "loss": 1.7989, + "step": 29984500 + }, + { + "epoch": 86.79, + "learning_rate": 6.618466909040385e-06, + "loss": 1.8167, + "step": 29985000 + }, + { + "epoch": 86.8, + "learning_rate": 6.617744708688403e-06, + "loss": 1.7991, + "step": 29985500 + }, + { + "epoch": 86.8, + "learning_rate": 6.617021061041127e-06, + "loss": 1.8201, + "step": 29986000 + }, + { + "epoch": 86.8, + "learning_rate": 6.61629741339385e-06, + "loss": 1.816, + "step": 29986500 + }, + { + "epoch": 86.8, + "learning_rate": 6.615573765746573e-06, + "loss": 1.8332, + "step": 29987000 + }, + { + "epoch": 86.8, + "learning_rate": 6.614850118099296e-06, + "loss": 1.8142, + "step": 29987500 + }, + { + "epoch": 86.8, + "learning_rate": 6.614127917747315e-06, + "loss": 1.822, + "step": 29988000 + }, + { + "epoch": 86.8, + "learning_rate": 6.613404270100038e-06, + "loss": 1.8019, + "step": 29988500 + }, + { + "epoch": 86.81, + "learning_rate": 6.612680622452761e-06, + "loss": 1.8028, + "step": 29989000 + }, + { + "epoch": 86.81, + "learning_rate": 6.611956974805483e-06, + "loss": 1.7925, + "step": 29989500 + }, + { + "epoch": 86.81, + "learning_rate": 6.611233327158208e-06, + "loss": 1.7889, + "step": 29990000 + }, + { + "epoch": 86.81, + "learning_rate": 6.61050967951093e-06, + "loss": 1.814, + "step": 29990500 + }, + { + "epoch": 86.81, + "learning_rate": 6.609786031863653e-06, + "loss": 1.8052, + "step": 29991000 + }, + { + "epoch": 86.81, + "learning_rate": 6.609062384216377e-06, + "loss": 1.8086, + "step": 29991500 + }, + { + "epoch": 86.81, + "learning_rate": 6.6083387365691e-06, + "loss": 1.8225, + "step": 29992000 + }, + { + "epoch": 86.82, + "learning_rate": 6.607616536217117e-06, + "loss": 1.8225, + "step": 29992500 + }, + { + "epoch": 86.82, + "learning_rate": 6.60689288856984e-06, + "loss": 1.7744, + "step": 29993000 + }, + { + "epoch": 86.82, + "learning_rate": 6.606169240922565e-06, + "loss": 1.8262, + "step": 29993500 + }, + { + "epoch": 86.82, + "learning_rate": 6.605445593275287e-06, + "loss": 1.7938, + "step": 29994000 + }, + { + "epoch": 86.82, + "learning_rate": 6.6047219456280105e-06, + "loss": 1.7931, + "step": 29994500 + }, + { + "epoch": 86.82, + "learning_rate": 6.6039982979807336e-06, + "loss": 1.8074, + "step": 29995000 + }, + { + "epoch": 86.82, + "learning_rate": 6.6032760976287525e-06, + "loss": 1.8451, + "step": 29995500 + }, + { + "epoch": 86.83, + "learning_rate": 6.602552449981475e-06, + "loss": 1.8105, + "step": 29996000 + }, + { + "epoch": 86.83, + "learning_rate": 6.601828802334198e-06, + "loss": 1.7916, + "step": 29996500 + }, + { + "epoch": 86.83, + "learning_rate": 6.601105154686922e-06, + "loss": 1.7984, + "step": 29997000 + }, + { + "epoch": 86.83, + "learning_rate": 6.60038295433494e-06, + "loss": 1.7943, + "step": 29997500 + }, + { + "epoch": 86.83, + "learning_rate": 6.599659306687662e-06, + "loss": 1.8114, + "step": 29998000 + }, + { + "epoch": 86.83, + "learning_rate": 6.598935659040385e-06, + "loss": 1.7875, + "step": 29998500 + }, + { + "epoch": 86.83, + "learning_rate": 6.598212011393109e-06, + "loss": 1.8235, + "step": 29999000 + }, + { + "epoch": 86.84, + "learning_rate": 6.597488363745832e-06, + "loss": 1.8103, + "step": 29999500 + }, + { + "epoch": 86.84, + "learning_rate": 6.59676616339385e-06, + "loss": 1.8069, + "step": 30000000 + }, + { + "epoch": 86.84, + "learning_rate": 6.5960425157465725e-06, + "loss": 1.8024, + "step": 30000500 + }, + { + "epoch": 86.84, + "learning_rate": 6.595318868099297e-06, + "loss": 1.8211, + "step": 30001000 + }, + { + "epoch": 86.84, + "learning_rate": 6.5945952204520195e-06, + "loss": 1.7743, + "step": 30001500 + }, + { + "epoch": 86.84, + "learning_rate": 6.593873020100038e-06, + "loss": 1.7974, + "step": 30002000 + }, + { + "epoch": 86.84, + "learning_rate": 6.59314937245276e-06, + "loss": 1.7989, + "step": 30002500 + }, + { + "epoch": 86.85, + "learning_rate": 6.592425724805485e-06, + "loss": 1.8222, + "step": 30003000 + }, + { + "epoch": 86.85, + "learning_rate": 6.591702077158207e-06, + "loss": 1.8143, + "step": 30003500 + }, + { + "epoch": 86.85, + "learning_rate": 6.59097842951093e-06, + "loss": 1.781, + "step": 30004000 + }, + { + "epoch": 86.85, + "learning_rate": 6.590254781863653e-06, + "loss": 1.8252, + "step": 30004500 + }, + { + "epoch": 86.85, + "learning_rate": 6.589532581511672e-06, + "loss": 1.8309, + "step": 30005000 + }, + { + "epoch": 86.85, + "learning_rate": 6.588810381159689e-06, + "loss": 1.8055, + "step": 30005500 + }, + { + "epoch": 86.86, + "learning_rate": 6.588086733512412e-06, + "loss": 1.8173, + "step": 30006000 + }, + { + "epoch": 86.86, + "learning_rate": 6.5873645331604295e-06, + "loss": 1.8616, + "step": 30006500 + }, + { + "epoch": 86.86, + "learning_rate": 6.586640885513154e-06, + "loss": 1.7874, + "step": 30007000 + }, + { + "epoch": 86.86, + "learning_rate": 6.5859172378658765e-06, + "loss": 1.7936, + "step": 30007500 + }, + { + "epoch": 86.86, + "learning_rate": 6.5851935902186e-06, + "loss": 1.7917, + "step": 30008000 + }, + { + "epoch": 86.86, + "learning_rate": 6.584469942571323e-06, + "loss": 1.8293, + "step": 30008500 + }, + { + "epoch": 86.86, + "learning_rate": 6.583746294924047e-06, + "loss": 1.8149, + "step": 30009000 + }, + { + "epoch": 86.87, + "learning_rate": 6.58302264727677e-06, + "loss": 1.7915, + "step": 30009500 + }, + { + "epoch": 86.87, + "learning_rate": 6.582298999629492e-06, + "loss": 1.7981, + "step": 30010000 + }, + { + "epoch": 86.87, + "learning_rate": 6.581575351982217e-06, + "loss": 1.8037, + "step": 30010500 + }, + { + "epoch": 86.87, + "learning_rate": 6.580851704334939e-06, + "loss": 1.8024, + "step": 30011000 + }, + { + "epoch": 86.87, + "learning_rate": 6.580128056687662e-06, + "loss": 1.7933, + "step": 30011500 + }, + { + "epoch": 86.87, + "learning_rate": 6.579404409040385e-06, + "loss": 1.811, + "step": 30012000 + }, + { + "epoch": 86.87, + "learning_rate": 6.578682208688404e-06, + "loss": 1.8179, + "step": 30012500 + }, + { + "epoch": 86.88, + "learning_rate": 6.577958561041127e-06, + "loss": 1.7737, + "step": 30013000 + }, + { + "epoch": 86.88, + "learning_rate": 6.577236360689144e-06, + "loss": 1.8013, + "step": 30013500 + }, + { + "epoch": 86.88, + "learning_rate": 6.5765127130418675e-06, + "loss": 1.8067, + "step": 30014000 + }, + { + "epoch": 86.88, + "learning_rate": 6.575789065394591e-06, + "loss": 1.8279, + "step": 30014500 + }, + { + "epoch": 86.88, + "learning_rate": 6.5750654177473145e-06, + "loss": 1.8118, + "step": 30015000 + }, + { + "epoch": 86.88, + "learning_rate": 6.574341770100037e-06, + "loss": 1.8106, + "step": 30015500 + }, + { + "epoch": 86.88, + "learning_rate": 6.5736181224527615e-06, + "loss": 1.8111, + "step": 30016000 + }, + { + "epoch": 86.89, + "learning_rate": 6.572894474805484e-06, + "loss": 1.8063, + "step": 30016500 + }, + { + "epoch": 86.89, + "learning_rate": 6.572170827158207e-06, + "loss": 1.822, + "step": 30017000 + }, + { + "epoch": 86.89, + "learning_rate": 6.57144717951093e-06, + "loss": 1.8151, + "step": 30017500 + }, + { + "epoch": 86.89, + "learning_rate": 6.570723531863654e-06, + "loss": 1.7945, + "step": 30018000 + }, + { + "epoch": 86.89, + "learning_rate": 6.569999884216377e-06, + "loss": 1.7892, + "step": 30018500 + }, + { + "epoch": 86.89, + "learning_rate": 6.569277683864394e-06, + "loss": 1.7787, + "step": 30019000 + }, + { + "epoch": 86.89, + "learning_rate": 6.568554036217117e-06, + "loss": 1.7872, + "step": 30019500 + }, + { + "epoch": 86.9, + "learning_rate": 6.567830388569841e-06, + "loss": 1.8148, + "step": 30020000 + }, + { + "epoch": 86.9, + "learning_rate": 6.567106740922564e-06, + "loss": 1.8204, + "step": 30020500 + }, + { + "epoch": 86.9, + "learning_rate": 6.5663845405705815e-06, + "loss": 1.7992, + "step": 30021000 + }, + { + "epoch": 86.9, + "learning_rate": 6.5656608929233046e-06, + "loss": 1.7898, + "step": 30021500 + }, + { + "epoch": 86.9, + "learning_rate": 6.5649372452760285e-06, + "loss": 1.8133, + "step": 30022000 + }, + { + "epoch": 86.9, + "learning_rate": 6.5642135976287516e-06, + "loss": 1.8168, + "step": 30022500 + }, + { + "epoch": 86.9, + "learning_rate": 6.563491397276769e-06, + "loss": 1.8093, + "step": 30023000 + }, + { + "epoch": 86.91, + "learning_rate": 6.562767749629492e-06, + "loss": 1.8076, + "step": 30023500 + }, + { + "epoch": 86.91, + "learning_rate": 6.562044101982217e-06, + "loss": 1.805, + "step": 30024000 + }, + { + "epoch": 86.91, + "learning_rate": 6.561320454334939e-06, + "loss": 1.8228, + "step": 30024500 + }, + { + "epoch": 86.91, + "learning_rate": 6.560596806687662e-06, + "loss": 1.8236, + "step": 30025000 + }, + { + "epoch": 86.91, + "learning_rate": 6.559873159040386e-06, + "loss": 1.7984, + "step": 30025500 + }, + { + "epoch": 86.91, + "learning_rate": 6.559150958688404e-06, + "loss": 1.8144, + "step": 30026000 + }, + { + "epoch": 86.91, + "learning_rate": 6.558427311041126e-06, + "loss": 1.8399, + "step": 30026500 + }, + { + "epoch": 86.92, + "learning_rate": 6.557703663393849e-06, + "loss": 1.8146, + "step": 30027000 + }, + { + "epoch": 86.92, + "learning_rate": 6.556980015746573e-06, + "loss": 1.8259, + "step": 30027500 + }, + { + "epoch": 86.92, + "learning_rate": 6.556257815394591e-06, + "loss": 1.8174, + "step": 30028000 + }, + { + "epoch": 86.92, + "learning_rate": 6.555534167747314e-06, + "loss": 1.825, + "step": 30028500 + }, + { + "epoch": 86.92, + "learning_rate": 6.554810520100037e-06, + "loss": 1.8218, + "step": 30029000 + }, + { + "epoch": 86.92, + "learning_rate": 6.554086872452761e-06, + "loss": 1.8361, + "step": 30029500 + }, + { + "epoch": 86.92, + "learning_rate": 6.553363224805484e-06, + "loss": 1.7923, + "step": 30030000 + }, + { + "epoch": 86.93, + "learning_rate": 6.552641024453502e-06, + "loss": 1.804, + "step": 30030500 + }, + { + "epoch": 86.93, + "learning_rate": 6.551917376806224e-06, + "loss": 1.807, + "step": 30031000 + }, + { + "epoch": 86.93, + "learning_rate": 6.551193729158949e-06, + "loss": 1.8177, + "step": 30031500 + }, + { + "epoch": 86.93, + "learning_rate": 6.550470081511671e-06, + "loss": 1.8226, + "step": 30032000 + }, + { + "epoch": 86.93, + "learning_rate": 6.549747881159689e-06, + "loss": 1.823, + "step": 30032500 + }, + { + "epoch": 86.93, + "learning_rate": 6.549024233512413e-06, + "loss": 1.8143, + "step": 30033000 + }, + { + "epoch": 86.93, + "learning_rate": 6.54830203316043e-06, + "loss": 1.8031, + "step": 30033500 + }, + { + "epoch": 86.94, + "learning_rate": 6.547578385513153e-06, + "loss": 1.7879, + "step": 30034000 + }, + { + "epoch": 86.94, + "learning_rate": 6.5468547378658764e-06, + "loss": 1.804, + "step": 30034500 + }, + { + "epoch": 86.94, + "learning_rate": 6.5461310902186e-06, + "loss": 1.8127, + "step": 30035000 + }, + { + "epoch": 86.94, + "learning_rate": 6.5454074425713234e-06, + "loss": 1.8242, + "step": 30035500 + }, + { + "epoch": 86.94, + "learning_rate": 6.544683794924046e-06, + "loss": 1.8213, + "step": 30036000 + }, + { + "epoch": 86.94, + "learning_rate": 6.543960147276769e-06, + "loss": 1.7922, + "step": 30036500 + }, + { + "epoch": 86.94, + "learning_rate": 6.543237946924788e-06, + "loss": 1.7875, + "step": 30037000 + }, + { + "epoch": 86.95, + "learning_rate": 6.542514299277511e-06, + "loss": 1.8077, + "step": 30037500 + }, + { + "epoch": 86.95, + "learning_rate": 6.541790651630234e-06, + "loss": 1.8171, + "step": 30038000 + }, + { + "epoch": 86.95, + "learning_rate": 6.541067003982956e-06, + "loss": 1.8112, + "step": 30038500 + }, + { + "epoch": 86.95, + "learning_rate": 6.540343356335681e-06, + "loss": 1.8158, + "step": 30039000 + }, + { + "epoch": 86.95, + "learning_rate": 6.539619708688403e-06, + "loss": 1.8263, + "step": 30039500 + }, + { + "epoch": 86.95, + "learning_rate": 6.538896061041126e-06, + "loss": 1.7942, + "step": 30040000 + }, + { + "epoch": 86.95, + "learning_rate": 6.53817241339385e-06, + "loss": 1.8185, + "step": 30040500 + }, + { + "epoch": 86.96, + "learning_rate": 6.537450213041868e-06, + "loss": 1.8064, + "step": 30041000 + }, + { + "epoch": 86.96, + "learning_rate": 6.5367265653945904e-06, + "loss": 1.7902, + "step": 30041500 + }, + { + "epoch": 86.96, + "learning_rate": 6.5360029177473135e-06, + "loss": 1.8164, + "step": 30042000 + }, + { + "epoch": 86.96, + "learning_rate": 6.5352792701000375e-06, + "loss": 1.828, + "step": 30042500 + }, + { + "epoch": 86.96, + "learning_rate": 6.5345556224527605e-06, + "loss": 1.7964, + "step": 30043000 + }, + { + "epoch": 86.96, + "learning_rate": 6.533831974805484e-06, + "loss": 1.8194, + "step": 30043500 + }, + { + "epoch": 86.97, + "learning_rate": 6.533108327158207e-06, + "loss": 1.7874, + "step": 30044000 + }, + { + "epoch": 86.97, + "learning_rate": 6.532384679510931e-06, + "loss": 1.7989, + "step": 30044500 + }, + { + "epoch": 86.97, + "learning_rate": 6.531661031863654e-06, + "loss": 1.8051, + "step": 30045000 + }, + { + "epoch": 86.97, + "learning_rate": 6.530938831511671e-06, + "loss": 1.8054, + "step": 30045500 + }, + { + "epoch": 86.97, + "learning_rate": 6.530216631159688e-06, + "loss": 1.8082, + "step": 30046000 + }, + { + "epoch": 86.97, + "learning_rate": 6.529492983512413e-06, + "loss": 1.8469, + "step": 30046500 + }, + { + "epoch": 86.97, + "learning_rate": 6.52877078316043e-06, + "loss": 1.8226, + "step": 30047000 + }, + { + "epoch": 86.98, + "learning_rate": 6.528047135513153e-06, + "loss": 1.8128, + "step": 30047500 + }, + { + "epoch": 86.98, + "learning_rate": 6.5273234878658755e-06, + "loss": 1.8214, + "step": 30048000 + }, + { + "epoch": 86.98, + "learning_rate": 6.5265998402186e-06, + "loss": 1.8181, + "step": 30048500 + }, + { + "epoch": 86.98, + "learning_rate": 6.525876192571323e-06, + "loss": 1.8005, + "step": 30049000 + }, + { + "epoch": 86.98, + "learning_rate": 6.525152544924046e-06, + "loss": 1.8257, + "step": 30049500 + }, + { + "epoch": 86.98, + "learning_rate": 6.52442889727677e-06, + "loss": 1.8179, + "step": 30050000 + }, + { + "epoch": 86.98, + "learning_rate": 6.523705249629493e-06, + "loss": 1.8104, + "step": 30050500 + }, + { + "epoch": 86.99, + "learning_rate": 6.522981601982216e-06, + "loss": 1.8257, + "step": 30051000 + }, + { + "epoch": 86.99, + "learning_rate": 6.522259401630233e-06, + "loss": 1.7972, + "step": 30051500 + }, + { + "epoch": 86.99, + "learning_rate": 6.521535753982958e-06, + "loss": 1.8029, + "step": 30052000 + }, + { + "epoch": 86.99, + "learning_rate": 6.52081210633568e-06, + "loss": 1.8107, + "step": 30052500 + }, + { + "epoch": 86.99, + "learning_rate": 6.520088458688403e-06, + "loss": 1.7675, + "step": 30053000 + }, + { + "epoch": 86.99, + "learning_rate": 6.51936625833642e-06, + "loss": 1.8362, + "step": 30053500 + }, + { + "epoch": 86.99, + "learning_rate": 6.518642610689145e-06, + "loss": 1.8298, + "step": 30054000 + }, + { + "epoch": 87.0, + "learning_rate": 6.517918963041867e-06, + "loss": 1.8141, + "step": 30054500 + }, + { + "epoch": 87.0, + "learning_rate": 6.517196762689885e-06, + "loss": 1.7949, + "step": 30055000 + }, + { + "epoch": 87.0, + "learning_rate": 6.5164731150426085e-06, + "loss": 1.8136, + "step": 30055500 + }, + { + "epoch": 87.0, + "learning_rate": 6.515749467395332e-06, + "loss": 1.8164, + "step": 30056000 + }, + { + "epoch": 87.0, + "eval_accuracy": 0.6891758386419078, + "eval_accuracy_mlm": 0.6582064760563344, + "eval_accuracy_nsp": 0.8552474185697982, + "eval_loss": 2.1924755573272705, + "eval_runtime": 331.6095, + "eval_samples_per_second": 1315.964, + "eval_steps_per_second": 54.833, + "step": 30056064 + }, + { + "epoch": 87.0, + "learning_rate": 6.5150258197480555e-06, + "loss": 1.7942, + "step": 30056500 + }, + { + "epoch": 87.0, + "learning_rate": 6.514303619396073e-06, + "loss": 1.7978, + "step": 30057000 + }, + { + "epoch": 87.0, + "learning_rate": 6.513579971748796e-06, + "loss": 1.7773, + "step": 30057500 + }, + { + "epoch": 87.01, + "learning_rate": 6.51285632410152e-06, + "loss": 1.802, + "step": 30058000 + }, + { + "epoch": 87.01, + "learning_rate": 6.512132676454243e-06, + "loss": 1.8097, + "step": 30058500 + }, + { + "epoch": 87.01, + "learning_rate": 6.511409028806965e-06, + "loss": 1.8013, + "step": 30059000 + }, + { + "epoch": 87.01, + "learning_rate": 6.51068538115969e-06, + "loss": 1.8092, + "step": 30059500 + }, + { + "epoch": 87.01, + "learning_rate": 6.509961733512412e-06, + "loss": 1.824, + "step": 30060000 + }, + { + "epoch": 87.01, + "learning_rate": 6.509238085865135e-06, + "loss": 1.8, + "step": 30060500 + }, + { + "epoch": 87.01, + "learning_rate": 6.508514438217858e-06, + "loss": 1.7946, + "step": 30061000 + }, + { + "epoch": 87.02, + "learning_rate": 6.507790790570582e-06, + "loss": 1.8039, + "step": 30061500 + }, + { + "epoch": 87.02, + "learning_rate": 6.507067142923305e-06, + "loss": 1.8098, + "step": 30062000 + }, + { + "epoch": 87.02, + "learning_rate": 6.506343495276028e-06, + "loss": 1.8167, + "step": 30062500 + }, + { + "epoch": 87.02, + "learning_rate": 6.505621294924047e-06, + "loss": 1.7944, + "step": 30063000 + }, + { + "epoch": 87.02, + "learning_rate": 6.5048976472767695e-06, + "loss": 1.7646, + "step": 30063500 + }, + { + "epoch": 87.02, + "learning_rate": 6.504173999629493e-06, + "loss": 1.812, + "step": 30064000 + }, + { + "epoch": 87.02, + "learning_rate": 6.503450351982216e-06, + "loss": 1.7998, + "step": 30064500 + }, + { + "epoch": 87.03, + "learning_rate": 6.502728151630235e-06, + "loss": 1.792, + "step": 30065000 + }, + { + "epoch": 87.03, + "learning_rate": 6.502004503982957e-06, + "loss": 1.8077, + "step": 30065500 + }, + { + "epoch": 87.03, + "learning_rate": 6.50128085633568e-06, + "loss": 1.7947, + "step": 30066000 + }, + { + "epoch": 87.03, + "learning_rate": 6.500557208688403e-06, + "loss": 1.7911, + "step": 30066500 + }, + { + "epoch": 87.03, + "learning_rate": 6.499833561041127e-06, + "loss": 1.8124, + "step": 30067000 + }, + { + "epoch": 87.03, + "learning_rate": 6.49910991339385e-06, + "loss": 1.8009, + "step": 30067500 + }, + { + "epoch": 87.03, + "learning_rate": 6.498386265746573e-06, + "loss": 1.813, + "step": 30068000 + }, + { + "epoch": 87.04, + "learning_rate": 6.497662618099297e-06, + "loss": 1.8096, + "step": 30068500 + }, + { + "epoch": 87.04, + "learning_rate": 6.496940417747314e-06, + "loss": 1.8371, + "step": 30069000 + }, + { + "epoch": 87.04, + "learning_rate": 6.496216770100037e-06, + "loss": 1.7751, + "step": 30069500 + }, + { + "epoch": 87.04, + "learning_rate": 6.4954931224527604e-06, + "loss": 1.8177, + "step": 30070000 + }, + { + "epoch": 87.04, + "learning_rate": 6.494769474805484e-06, + "loss": 1.784, + "step": 30070500 + }, + { + "epoch": 87.04, + "learning_rate": 6.4940458271582074e-06, + "loss": 1.7932, + "step": 30071000 + }, + { + "epoch": 87.04, + "learning_rate": 6.49332217951093e-06, + "loss": 1.7751, + "step": 30071500 + }, + { + "epoch": 87.05, + "learning_rate": 6.492599979158948e-06, + "loss": 1.8265, + "step": 30072000 + }, + { + "epoch": 87.05, + "learning_rate": 6.491876331511672e-06, + "loss": 1.8097, + "step": 30072500 + }, + { + "epoch": 87.05, + "learning_rate": 6.491152683864395e-06, + "loss": 1.7939, + "step": 30073000 + }, + { + "epoch": 87.05, + "learning_rate": 6.490429036217118e-06, + "loss": 1.7805, + "step": 30073500 + }, + { + "epoch": 87.05, + "learning_rate": 6.489705388569842e-06, + "loss": 1.784, + "step": 30074000 + }, + { + "epoch": 87.05, + "learning_rate": 6.488981740922565e-06, + "loss": 1.7833, + "step": 30074500 + }, + { + "epoch": 87.05, + "learning_rate": 6.488259540570582e-06, + "loss": 1.804, + "step": 30075000 + }, + { + "epoch": 87.06, + "learning_rate": 6.487535892923305e-06, + "loss": 1.7886, + "step": 30075500 + }, + { + "epoch": 87.06, + "learning_rate": 6.486812245276029e-06, + "loss": 1.7812, + "step": 30076000 + }, + { + "epoch": 87.06, + "learning_rate": 6.486088597628752e-06, + "loss": 1.8028, + "step": 30076500 + }, + { + "epoch": 87.06, + "learning_rate": 6.4853649499814744e-06, + "loss": 1.8244, + "step": 30077000 + }, + { + "epoch": 87.06, + "learning_rate": 6.4846427496294925e-06, + "loss": 1.8163, + "step": 30077500 + }, + { + "epoch": 87.06, + "learning_rate": 6.4839191019822165e-06, + "loss": 1.7895, + "step": 30078000 + }, + { + "epoch": 87.06, + "learning_rate": 6.4831954543349395e-06, + "loss": 1.82, + "step": 30078500 + }, + { + "epoch": 87.07, + "learning_rate": 6.482471806687662e-06, + "loss": 1.7831, + "step": 30079000 + }, + { + "epoch": 87.07, + "learning_rate": 6.48174960633568e-06, + "loss": 1.7943, + "step": 30079500 + }, + { + "epoch": 87.07, + "learning_rate": 6.481025958688404e-06, + "loss": 1.7992, + "step": 30080000 + }, + { + "epoch": 87.07, + "learning_rate": 6.480302311041127e-06, + "loss": 1.8005, + "step": 30080500 + }, + { + "epoch": 87.07, + "learning_rate": 6.47957866339385e-06, + "loss": 1.8163, + "step": 30081000 + }, + { + "epoch": 87.07, + "learning_rate": 6.478855015746572e-06, + "loss": 1.8188, + "step": 30081500 + }, + { + "epoch": 87.08, + "learning_rate": 6.478132815394591e-06, + "loss": 1.8054, + "step": 30082000 + }, + { + "epoch": 87.08, + "learning_rate": 6.477410615042609e-06, + "loss": 1.8262, + "step": 30082500 + }, + { + "epoch": 87.08, + "learning_rate": 6.4766869673953315e-06, + "loss": 1.8111, + "step": 30083000 + }, + { + "epoch": 87.08, + "learning_rate": 6.4759633197480546e-06, + "loss": 1.7927, + "step": 30083500 + }, + { + "epoch": 87.08, + "learning_rate": 6.4752396721007785e-06, + "loss": 1.8114, + "step": 30084000 + }, + { + "epoch": 87.08, + "learning_rate": 6.4745160244535016e-06, + "loss": 1.8165, + "step": 30084500 + }, + { + "epoch": 87.08, + "learning_rate": 6.473792376806225e-06, + "loss": 1.771, + "step": 30085000 + }, + { + "epoch": 87.09, + "learning_rate": 6.4730687291589486e-06, + "loss": 1.7927, + "step": 30085500 + }, + { + "epoch": 87.09, + "learning_rate": 6.472345081511672e-06, + "loss": 1.8014, + "step": 30086000 + }, + { + "epoch": 87.09, + "learning_rate": 6.471622881159689e-06, + "loss": 1.8011, + "step": 30086500 + }, + { + "epoch": 87.09, + "learning_rate": 6.470899233512412e-06, + "loss": 1.7978, + "step": 30087000 + }, + { + "epoch": 87.09, + "learning_rate": 6.470175585865136e-06, + "loss": 1.7782, + "step": 30087500 + }, + { + "epoch": 87.09, + "learning_rate": 6.469451938217859e-06, + "loss": 1.8051, + "step": 30088000 + }, + { + "epoch": 87.09, + "learning_rate": 6.468728290570582e-06, + "loss": 1.8114, + "step": 30088500 + }, + { + "epoch": 87.1, + "learning_rate": 6.468006090218599e-06, + "loss": 1.8095, + "step": 30089000 + }, + { + "epoch": 87.1, + "learning_rate": 6.467282442571323e-06, + "loss": 1.8022, + "step": 30089500 + }, + { + "epoch": 87.1, + "learning_rate": 6.466558794924046e-06, + "loss": 1.8082, + "step": 30090000 + }, + { + "epoch": 87.1, + "learning_rate": 6.4658365945720636e-06, + "loss": 1.7866, + "step": 30090500 + }, + { + "epoch": 87.1, + "learning_rate": 6.465112946924787e-06, + "loss": 1.8139, + "step": 30091000 + }, + { + "epoch": 87.1, + "learning_rate": 6.464389299277511e-06, + "loss": 1.8034, + "step": 30091500 + }, + { + "epoch": 87.1, + "learning_rate": 6.463665651630234e-06, + "loss": 1.81, + "step": 30092000 + }, + { + "epoch": 87.11, + "learning_rate": 6.462942003982957e-06, + "loss": 1.8135, + "step": 30092500 + }, + { + "epoch": 87.11, + "learning_rate": 6.462218356335681e-06, + "loss": 1.7939, + "step": 30093000 + }, + { + "epoch": 87.11, + "learning_rate": 6.461494708688404e-06, + "loss": 1.7994, + "step": 30093500 + }, + { + "epoch": 87.11, + "learning_rate": 6.460771061041127e-06, + "loss": 1.778, + "step": 30094000 + }, + { + "epoch": 87.11, + "learning_rate": 6.460047413393849e-06, + "loss": 1.7698, + "step": 30094500 + }, + { + "epoch": 87.11, + "learning_rate": 6.459325213041868e-06, + "loss": 1.7963, + "step": 30095000 + }, + { + "epoch": 87.11, + "learning_rate": 6.458601565394591e-06, + "loss": 1.7621, + "step": 30095500 + }, + { + "epoch": 87.12, + "learning_rate": 6.457879365042608e-06, + "loss": 1.8181, + "step": 30096000 + }, + { + "epoch": 87.12, + "learning_rate": 6.457155717395331e-06, + "loss": 1.808, + "step": 30096500 + }, + { + "epoch": 87.12, + "learning_rate": 6.456432069748055e-06, + "loss": 1.7986, + "step": 30097000 + }, + { + "epoch": 87.12, + "learning_rate": 6.4557084221007784e-06, + "loss": 1.7825, + "step": 30097500 + }, + { + "epoch": 87.12, + "learning_rate": 6.4549847744535015e-06, + "loss": 1.7975, + "step": 30098000 + }, + { + "epoch": 87.12, + "learning_rate": 6.454261126806225e-06, + "loss": 1.7896, + "step": 30098500 + }, + { + "epoch": 87.12, + "learning_rate": 6.4535374791589485e-06, + "loss": 1.7861, + "step": 30099000 + }, + { + "epoch": 87.13, + "learning_rate": 6.452815278806966e-06, + "loss": 1.8178, + "step": 30099500 + }, + { + "epoch": 87.13, + "learning_rate": 6.452091631159689e-06, + "loss": 1.7814, + "step": 30100000 + }, + { + "epoch": 87.13, + "learning_rate": 6.451367983512413e-06, + "loss": 1.8026, + "step": 30100500 + }, + { + "epoch": 87.13, + "learning_rate": 6.450644335865136e-06, + "loss": 1.8063, + "step": 30101000 + }, + { + "epoch": 87.13, + "learning_rate": 6.449920688217859e-06, + "loss": 1.7804, + "step": 30101500 + }, + { + "epoch": 87.13, + "learning_rate": 6.449197040570581e-06, + "loss": 1.8241, + "step": 30102000 + }, + { + "epoch": 87.13, + "learning_rate": 6.448473392923306e-06, + "loss": 1.7836, + "step": 30102500 + }, + { + "epoch": 87.14, + "learning_rate": 6.447749745276028e-06, + "loss": 1.7849, + "step": 30103000 + }, + { + "epoch": 87.14, + "learning_rate": 6.447026097628751e-06, + "loss": 1.7974, + "step": 30103500 + }, + { + "epoch": 87.14, + "learning_rate": 6.4463038972767685e-06, + "loss": 1.7953, + "step": 30104000 + }, + { + "epoch": 87.14, + "learning_rate": 6.445580249629493e-06, + "loss": 1.803, + "step": 30104500 + }, + { + "epoch": 87.14, + "learning_rate": 6.444856601982216e-06, + "loss": 1.8166, + "step": 30105000 + }, + { + "epoch": 87.14, + "learning_rate": 6.444132954334939e-06, + "loss": 1.8076, + "step": 30105500 + }, + { + "epoch": 87.14, + "learning_rate": 6.443409306687663e-06, + "loss": 1.7865, + "step": 30106000 + }, + { + "epoch": 87.15, + "learning_rate": 6.442687106335681e-06, + "loss": 1.8056, + "step": 30106500 + }, + { + "epoch": 87.15, + "learning_rate": 6.441963458688404e-06, + "loss": 1.7844, + "step": 30107000 + }, + { + "epoch": 87.15, + "learning_rate": 6.441239811041126e-06, + "loss": 1.8162, + "step": 30107500 + }, + { + "epoch": 87.15, + "learning_rate": 6.440517610689144e-06, + "loss": 1.7847, + "step": 30108000 + }, + { + "epoch": 87.15, + "learning_rate": 6.439793963041868e-06, + "loss": 1.7984, + "step": 30108500 + }, + { + "epoch": 87.15, + "learning_rate": 6.439070315394591e-06, + "loss": 1.8149, + "step": 30109000 + }, + { + "epoch": 87.15, + "learning_rate": 6.438346667747313e-06, + "loss": 1.7943, + "step": 30109500 + }, + { + "epoch": 87.16, + "learning_rate": 6.437623020100038e-06, + "loss": 1.7988, + "step": 30110000 + }, + { + "epoch": 87.16, + "learning_rate": 6.43689937245276e-06, + "loss": 1.7816, + "step": 30110500 + }, + { + "epoch": 87.16, + "learning_rate": 6.436175724805483e-06, + "loss": 1.8047, + "step": 30111000 + }, + { + "epoch": 87.16, + "learning_rate": 6.4354520771582064e-06, + "loss": 1.8152, + "step": 30111500 + }, + { + "epoch": 87.16, + "learning_rate": 6.43472842951093e-06, + "loss": 1.8119, + "step": 30112000 + }, + { + "epoch": 87.16, + "learning_rate": 6.434007676454243e-06, + "loss": 1.8216, + "step": 30112500 + }, + { + "epoch": 87.16, + "learning_rate": 6.433284028806966e-06, + "loss": 1.8085, + "step": 30113000 + }, + { + "epoch": 87.17, + "learning_rate": 6.432560381159689e-06, + "loss": 1.8099, + "step": 30113500 + }, + { + "epoch": 87.17, + "learning_rate": 6.431836733512413e-06, + "loss": 1.8064, + "step": 30114000 + }, + { + "epoch": 87.17, + "learning_rate": 6.431113085865136e-06, + "loss": 1.805, + "step": 30114500 + }, + { + "epoch": 87.17, + "learning_rate": 6.430389438217858e-06, + "loss": 1.8126, + "step": 30115000 + }, + { + "epoch": 87.17, + "learning_rate": 6.429667237865876e-06, + "loss": 1.806, + "step": 30115500 + }, + { + "epoch": 87.17, + "learning_rate": 6.4289435902186e-06, + "loss": 1.826, + "step": 30116000 + }, + { + "epoch": 87.17, + "learning_rate": 6.428221389866617e-06, + "loss": 1.7846, + "step": 30116500 + }, + { + "epoch": 87.18, + "learning_rate": 6.42749774221934e-06, + "loss": 1.8013, + "step": 30117000 + }, + { + "epoch": 87.18, + "learning_rate": 6.4267740945720635e-06, + "loss": 1.8039, + "step": 30117500 + }, + { + "epoch": 87.18, + "learning_rate": 6.426050446924787e-06, + "loss": 1.8032, + "step": 30118000 + }, + { + "epoch": 87.18, + "learning_rate": 6.4253267992775105e-06, + "loss": 1.7812, + "step": 30118500 + }, + { + "epoch": 87.18, + "learning_rate": 6.4246031516302336e-06, + "loss": 1.8051, + "step": 30119000 + }, + { + "epoch": 87.18, + "learning_rate": 6.4238795039829575e-06, + "loss": 1.7567, + "step": 30119500 + }, + { + "epoch": 87.19, + "learning_rate": 6.4231558563356806e-06, + "loss": 1.7968, + "step": 30120000 + }, + { + "epoch": 87.19, + "learning_rate": 6.422432208688403e-06, + "loss": 1.7963, + "step": 30120500 + }, + { + "epoch": 87.19, + "learning_rate": 6.4217085610411276e-06, + "loss": 1.7791, + "step": 30121000 + }, + { + "epoch": 87.19, + "learning_rate": 6.42098491339385e-06, + "loss": 1.7951, + "step": 30121500 + }, + { + "epoch": 87.19, + "learning_rate": 6.420261265746573e-06, + "loss": 1.7817, + "step": 30122000 + }, + { + "epoch": 87.19, + "learning_rate": 6.419537618099296e-06, + "loss": 1.7905, + "step": 30122500 + }, + { + "epoch": 87.19, + "learning_rate": 6.41881397045202e-06, + "loss": 1.8043, + "step": 30123000 + }, + { + "epoch": 87.2, + "learning_rate": 6.418091770100038e-06, + "loss": 1.8145, + "step": 30123500 + }, + { + "epoch": 87.2, + "learning_rate": 6.41736812245276e-06, + "loss": 1.8053, + "step": 30124000 + }, + { + "epoch": 87.2, + "learning_rate": 6.416644474805483e-06, + "loss": 1.825, + "step": 30124500 + }, + { + "epoch": 87.2, + "learning_rate": 6.415920827158207e-06, + "loss": 1.8062, + "step": 30125000 + }, + { + "epoch": 87.2, + "learning_rate": 6.41519717951093e-06, + "loss": 1.7965, + "step": 30125500 + }, + { + "epoch": 87.2, + "learning_rate": 6.414473531863653e-06, + "loss": 1.7963, + "step": 30126000 + }, + { + "epoch": 87.2, + "learning_rate": 6.413751331511671e-06, + "loss": 1.8085, + "step": 30126500 + }, + { + "epoch": 87.21, + "learning_rate": 6.4130276838643946e-06, + "loss": 1.7808, + "step": 30127000 + }, + { + "epoch": 87.21, + "learning_rate": 6.412304036217118e-06, + "loss": 1.7919, + "step": 30127500 + }, + { + "epoch": 87.21, + "learning_rate": 6.411580388569841e-06, + "loss": 1.8029, + "step": 30128000 + }, + { + "epoch": 87.21, + "learning_rate": 6.410856740922565e-06, + "loss": 1.8085, + "step": 30128500 + }, + { + "epoch": 87.21, + "learning_rate": 6.410133093275288e-06, + "loss": 1.8137, + "step": 30129000 + }, + { + "epoch": 87.21, + "learning_rate": 6.409409445628011e-06, + "loss": 1.7976, + "step": 30129500 + }, + { + "epoch": 87.21, + "learning_rate": 6.408685797980733e-06, + "loss": 1.8095, + "step": 30130000 + }, + { + "epoch": 87.22, + "learning_rate": 6.407963597628752e-06, + "loss": 1.7932, + "step": 30130500 + }, + { + "epoch": 87.22, + "learning_rate": 6.40724139727677e-06, + "loss": 1.8056, + "step": 30131000 + }, + { + "epoch": 87.22, + "learning_rate": 6.406517749629492e-06, + "loss": 1.821, + "step": 30131500 + }, + { + "epoch": 87.22, + "learning_rate": 6.405794101982215e-06, + "loss": 1.7971, + "step": 30132000 + }, + { + "epoch": 87.22, + "learning_rate": 6.405070454334939e-06, + "loss": 1.8057, + "step": 30132500 + }, + { + "epoch": 87.22, + "learning_rate": 6.4043482539829574e-06, + "loss": 1.7888, + "step": 30133000 + }, + { + "epoch": 87.22, + "learning_rate": 6.40362460633568e-06, + "loss": 1.7913, + "step": 30133500 + }, + { + "epoch": 87.23, + "learning_rate": 6.402900958688403e-06, + "loss": 1.8207, + "step": 30134000 + }, + { + "epoch": 87.23, + "learning_rate": 6.402177311041127e-06, + "loss": 1.7701, + "step": 30134500 + }, + { + "epoch": 87.23, + "learning_rate": 6.40145366339385e-06, + "loss": 1.8047, + "step": 30135000 + }, + { + "epoch": 87.23, + "learning_rate": 6.400730015746573e-06, + "loss": 1.8044, + "step": 30135500 + }, + { + "epoch": 87.23, + "learning_rate": 6.400006368099297e-06, + "loss": 1.7673, + "step": 30136000 + }, + { + "epoch": 87.23, + "learning_rate": 6.39928272045202e-06, + "loss": 1.8202, + "step": 30136500 + }, + { + "epoch": 87.23, + "learning_rate": 6.398559072804743e-06, + "loss": 1.796, + "step": 30137000 + }, + { + "epoch": 87.24, + "learning_rate": 6.397835425157465e-06, + "loss": 1.8184, + "step": 30137500 + }, + { + "epoch": 87.24, + "learning_rate": 6.397113224805484e-06, + "loss": 1.8206, + "step": 30138000 + }, + { + "epoch": 87.24, + "learning_rate": 6.396391024453502e-06, + "loss": 1.8303, + "step": 30138500 + }, + { + "epoch": 87.24, + "learning_rate": 6.3956673768062244e-06, + "loss": 1.8135, + "step": 30139000 + }, + { + "epoch": 87.24, + "learning_rate": 6.3949437291589475e-06, + "loss": 1.7973, + "step": 30139500 + }, + { + "epoch": 87.24, + "learning_rate": 6.3942200815116714e-06, + "loss": 1.8085, + "step": 30140000 + }, + { + "epoch": 87.24, + "learning_rate": 6.3934964338643945e-06, + "loss": 1.7961, + "step": 30140500 + }, + { + "epoch": 87.25, + "learning_rate": 6.392772786217118e-06, + "loss": 1.7932, + "step": 30141000 + }, + { + "epoch": 87.25, + "learning_rate": 6.392050585865135e-06, + "loss": 1.7879, + "step": 30141500 + }, + { + "epoch": 87.25, + "learning_rate": 6.39132693821786e-06, + "loss": 1.7904, + "step": 30142000 + }, + { + "epoch": 87.25, + "learning_rate": 6.390603290570582e-06, + "loss": 1.8028, + "step": 30142500 + }, + { + "epoch": 87.25, + "learning_rate": 6.389879642923305e-06, + "loss": 1.8187, + "step": 30143000 + }, + { + "epoch": 87.25, + "learning_rate": 6.389155995276029e-06, + "loss": 1.8192, + "step": 30143500 + }, + { + "epoch": 87.25, + "learning_rate": 6.388432347628752e-06, + "loss": 1.7982, + "step": 30144000 + }, + { + "epoch": 87.26, + "learning_rate": 6.387708699981475e-06, + "loss": 1.8216, + "step": 30144500 + }, + { + "epoch": 87.26, + "learning_rate": 6.386985052334197e-06, + "loss": 1.8142, + "step": 30145000 + }, + { + "epoch": 87.26, + "learning_rate": 6.386262851982216e-06, + "loss": 1.8081, + "step": 30145500 + }, + { + "epoch": 87.26, + "learning_rate": 6.385539204334939e-06, + "loss": 1.7903, + "step": 30146000 + }, + { + "epoch": 87.26, + "learning_rate": 6.384815556687662e-06, + "loss": 1.7799, + "step": 30146500 + }, + { + "epoch": 87.26, + "learning_rate": 6.384091909040385e-06, + "loss": 1.7961, + "step": 30147000 + }, + { + "epoch": 87.26, + "learning_rate": 6.383368261393109e-06, + "loss": 1.8214, + "step": 30147500 + }, + { + "epoch": 87.27, + "learning_rate": 6.382646061041127e-06, + "loss": 1.8114, + "step": 30148000 + }, + { + "epoch": 87.27, + "learning_rate": 6.38192241339385e-06, + "loss": 1.7829, + "step": 30148500 + }, + { + "epoch": 87.27, + "learning_rate": 6.381198765746573e-06, + "loss": 1.7947, + "step": 30149000 + }, + { + "epoch": 87.27, + "learning_rate": 6.380475118099297e-06, + "loss": 1.8002, + "step": 30149500 + }, + { + "epoch": 87.27, + "learning_rate": 6.379752917747314e-06, + "loss": 1.8119, + "step": 30150000 + }, + { + "epoch": 87.27, + "learning_rate": 6.379029270100037e-06, + "loss": 1.7976, + "step": 30150500 + }, + { + "epoch": 87.27, + "learning_rate": 6.378305622452761e-06, + "loss": 1.7986, + "step": 30151000 + }, + { + "epoch": 87.28, + "learning_rate": 6.377581974805484e-06, + "loss": 1.8091, + "step": 30151500 + }, + { + "epoch": 87.28, + "learning_rate": 6.376859774453501e-06, + "loss": 1.8053, + "step": 30152000 + }, + { + "epoch": 87.28, + "learning_rate": 6.376136126806224e-06, + "loss": 1.797, + "step": 30152500 + }, + { + "epoch": 87.28, + "learning_rate": 6.375412479158948e-06, + "loss": 1.8053, + "step": 30153000 + }, + { + "epoch": 87.28, + "learning_rate": 6.374688831511671e-06, + "loss": 1.8214, + "step": 30153500 + }, + { + "epoch": 87.28, + "learning_rate": 6.3739651838643945e-06, + "loss": 1.809, + "step": 30154000 + }, + { + "epoch": 87.28, + "learning_rate": 6.3732415362171176e-06, + "loss": 1.805, + "step": 30154500 + }, + { + "epoch": 87.29, + "learning_rate": 6.3725178885698415e-06, + "loss": 1.821, + "step": 30155000 + }, + { + "epoch": 87.29, + "learning_rate": 6.371795688217859e-06, + "loss": 1.7991, + "step": 30155500 + }, + { + "epoch": 87.29, + "learning_rate": 6.371072040570582e-06, + "loss": 1.8064, + "step": 30156000 + }, + { + "epoch": 87.29, + "learning_rate": 6.370348392923305e-06, + "loss": 1.8036, + "step": 30156500 + }, + { + "epoch": 87.29, + "learning_rate": 6.369624745276029e-06, + "loss": 1.8084, + "step": 30157000 + }, + { + "epoch": 87.29, + "learning_rate": 6.368901097628752e-06, + "loss": 1.7806, + "step": 30157500 + }, + { + "epoch": 87.3, + "learning_rate": 6.368177449981474e-06, + "loss": 1.8066, + "step": 30158000 + }, + { + "epoch": 87.3, + "learning_rate": 6.367453802334199e-06, + "loss": 1.8131, + "step": 30158500 + }, + { + "epoch": 87.3, + "learning_rate": 6.366730154686921e-06, + "loss": 1.8234, + "step": 30159000 + }, + { + "epoch": 87.3, + "learning_rate": 6.366007954334939e-06, + "loss": 1.7805, + "step": 30159500 + }, + { + "epoch": 87.3, + "learning_rate": 6.365284306687662e-06, + "loss": 1.8078, + "step": 30160000 + }, + { + "epoch": 87.3, + "learning_rate": 6.364560659040386e-06, + "loss": 1.8057, + "step": 30160500 + }, + { + "epoch": 87.3, + "learning_rate": 6.363837011393109e-06, + "loss": 1.803, + "step": 30161000 + }, + { + "epoch": 87.31, + "learning_rate": 6.3631148110411266e-06, + "loss": 1.8045, + "step": 30161500 + }, + { + "epoch": 87.31, + "learning_rate": 6.36239116339385e-06, + "loss": 1.7997, + "step": 30162000 + }, + { + "epoch": 87.31, + "learning_rate": 6.361667515746574e-06, + "loss": 1.8171, + "step": 30162500 + }, + { + "epoch": 87.31, + "learning_rate": 6.360943868099297e-06, + "loss": 1.7937, + "step": 30163000 + }, + { + "epoch": 87.31, + "learning_rate": 6.360220220452019e-06, + "loss": 1.7924, + "step": 30163500 + }, + { + "epoch": 87.31, + "learning_rate": 6.359498020100037e-06, + "loss": 1.7917, + "step": 30164000 + }, + { + "epoch": 87.31, + "learning_rate": 6.358774372452761e-06, + "loss": 1.7664, + "step": 30164500 + }, + { + "epoch": 87.32, + "learning_rate": 6.358050724805484e-06, + "loss": 1.8219, + "step": 30165000 + }, + { + "epoch": 87.32, + "learning_rate": 6.357327077158206e-06, + "loss": 1.7897, + "step": 30165500 + }, + { + "epoch": 87.32, + "learning_rate": 6.356603429510931e-06, + "loss": 1.8061, + "step": 30166000 + }, + { + "epoch": 87.32, + "learning_rate": 6.355879781863654e-06, + "loss": 1.7816, + "step": 30166500 + }, + { + "epoch": 87.32, + "learning_rate": 6.355156134216376e-06, + "loss": 1.8024, + "step": 30167000 + }, + { + "epoch": 87.32, + "learning_rate": 6.354433933864394e-06, + "loss": 1.815, + "step": 30167500 + }, + { + "epoch": 87.32, + "learning_rate": 6.353710286217118e-06, + "loss": 1.8152, + "step": 30168000 + }, + { + "epoch": 87.33, + "learning_rate": 6.3529866385698414e-06, + "loss": 1.7977, + "step": 30168500 + }, + { + "epoch": 87.33, + "learning_rate": 6.352262990922564e-06, + "loss": 1.8263, + "step": 30169000 + }, + { + "epoch": 87.33, + "learning_rate": 6.351539343275287e-06, + "loss": 1.8041, + "step": 30169500 + }, + { + "epoch": 87.33, + "learning_rate": 6.350817142923306e-06, + "loss": 1.8, + "step": 30170000 + }, + { + "epoch": 87.33, + "learning_rate": 6.350093495276029e-06, + "loss": 1.8197, + "step": 30170500 + }, + { + "epoch": 87.33, + "learning_rate": 6.349369847628751e-06, + "loss": 1.8002, + "step": 30171000 + }, + { + "epoch": 87.33, + "learning_rate": 6.348646199981476e-06, + "loss": 1.8198, + "step": 30171500 + }, + { + "epoch": 87.34, + "learning_rate": 6.347922552334198e-06, + "loss": 1.8136, + "step": 30172000 + }, + { + "epoch": 87.34, + "learning_rate": 6.347198904686921e-06, + "loss": 1.8065, + "step": 30172500 + }, + { + "epoch": 87.34, + "learning_rate": 6.346476704334939e-06, + "loss": 1.8219, + "step": 30173000 + }, + { + "epoch": 87.34, + "learning_rate": 6.345753056687663e-06, + "loss": 1.7967, + "step": 30173500 + }, + { + "epoch": 87.34, + "learning_rate": 6.345029409040386e-06, + "loss": 1.8055, + "step": 30174000 + }, + { + "epoch": 87.34, + "learning_rate": 6.3443057613931084e-06, + "loss": 1.8063, + "step": 30174500 + }, + { + "epoch": 87.34, + "learning_rate": 6.3435821137458315e-06, + "loss": 1.7994, + "step": 30175000 + }, + { + "epoch": 87.35, + "learning_rate": 6.3428584660985554e-06, + "loss": 1.8032, + "step": 30175500 + }, + { + "epoch": 87.35, + "learning_rate": 6.3421348184512785e-06, + "loss": 1.7804, + "step": 30176000 + }, + { + "epoch": 87.35, + "learning_rate": 6.341411170804002e-06, + "loss": 1.8112, + "step": 30176500 + }, + { + "epoch": 87.35, + "learning_rate": 6.3406875231567255e-06, + "loss": 1.7997, + "step": 30177000 + }, + { + "epoch": 87.35, + "learning_rate": 6.339965322804743e-06, + "loss": 1.832, + "step": 30177500 + }, + { + "epoch": 87.35, + "learning_rate": 6.339241675157466e-06, + "loss": 1.8308, + "step": 30178000 + }, + { + "epoch": 87.35, + "learning_rate": 6.338518027510189e-06, + "loss": 1.7964, + "step": 30178500 + }, + { + "epoch": 87.36, + "learning_rate": 6.337794379862913e-06, + "loss": 1.7909, + "step": 30179000 + }, + { + "epoch": 87.36, + "learning_rate": 6.337070732215636e-06, + "loss": 1.7993, + "step": 30179500 + }, + { + "epoch": 87.36, + "learning_rate": 6.336348531863653e-06, + "loss": 1.7907, + "step": 30180000 + }, + { + "epoch": 87.36, + "learning_rate": 6.335624884216376e-06, + "loss": 1.8099, + "step": 30180500 + }, + { + "epoch": 87.36, + "learning_rate": 6.334902683864395e-06, + "loss": 1.7976, + "step": 30181000 + }, + { + "epoch": 87.36, + "learning_rate": 6.334179036217118e-06, + "loss": 1.7845, + "step": 30181500 + }, + { + "epoch": 87.36, + "learning_rate": 6.3334553885698405e-06, + "loss": 1.7865, + "step": 30182000 + }, + { + "epoch": 87.37, + "learning_rate": 6.332731740922564e-06, + "loss": 1.78, + "step": 30182500 + }, + { + "epoch": 87.37, + "learning_rate": 6.3320080932752875e-06, + "loss": 1.809, + "step": 30183000 + }, + { + "epoch": 87.37, + "learning_rate": 6.331284445628011e-06, + "loss": 1.8027, + "step": 30183500 + }, + { + "epoch": 87.37, + "learning_rate": 6.330560797980734e-06, + "loss": 1.8136, + "step": 30184000 + }, + { + "epoch": 87.37, + "learning_rate": 6.329837150333458e-06, + "loss": 1.8066, + "step": 30184500 + }, + { + "epoch": 87.37, + "learning_rate": 6.329114949981476e-06, + "loss": 1.8096, + "step": 30185000 + }, + { + "epoch": 87.37, + "learning_rate": 6.328391302334198e-06, + "loss": 1.7982, + "step": 30185500 + }, + { + "epoch": 87.38, + "learning_rate": 6.327667654686921e-06, + "loss": 1.7995, + "step": 30186000 + }, + { + "epoch": 87.38, + "learning_rate": 6.326944007039645e-06, + "loss": 1.8262, + "step": 30186500 + }, + { + "epoch": 87.38, + "learning_rate": 6.326220359392368e-06, + "loss": 1.8341, + "step": 30187000 + }, + { + "epoch": 87.38, + "learning_rate": 6.325498159040385e-06, + "loss": 1.8289, + "step": 30187500 + }, + { + "epoch": 87.38, + "learning_rate": 6.324774511393108e-06, + "loss": 1.7882, + "step": 30188000 + }, + { + "epoch": 87.38, + "learning_rate": 6.324050863745832e-06, + "loss": 1.7845, + "step": 30188500 + }, + { + "epoch": 87.38, + "learning_rate": 6.323327216098555e-06, + "loss": 1.792, + "step": 30189000 + }, + { + "epoch": 87.39, + "learning_rate": 6.322605015746573e-06, + "loss": 1.7988, + "step": 30189500 + }, + { + "epoch": 87.39, + "learning_rate": 6.321881368099296e-06, + "loss": 1.7861, + "step": 30190000 + }, + { + "epoch": 87.39, + "learning_rate": 6.32115772045202e-06, + "loss": 1.7919, + "step": 30190500 + }, + { + "epoch": 87.39, + "learning_rate": 6.320434072804743e-06, + "loss": 1.773, + "step": 30191000 + }, + { + "epoch": 87.39, + "learning_rate": 6.319710425157466e-06, + "loss": 1.8235, + "step": 30191500 + }, + { + "epoch": 87.39, + "learning_rate": 6.318988224805483e-06, + "loss": 1.8032, + "step": 30192000 + }, + { + "epoch": 87.39, + "learning_rate": 6.318264577158208e-06, + "loss": 1.7988, + "step": 30192500 + }, + { + "epoch": 87.4, + "learning_rate": 6.31754092951093e-06, + "loss": 1.8049, + "step": 30193000 + }, + { + "epoch": 87.4, + "learning_rate": 6.316817281863653e-06, + "loss": 1.8019, + "step": 30193500 + }, + { + "epoch": 87.4, + "learning_rate": 6.316093634216377e-06, + "loss": 1.8073, + "step": 30194000 + }, + { + "epoch": 87.4, + "learning_rate": 6.315371433864395e-06, + "loss": 1.7871, + "step": 30194500 + }, + { + "epoch": 87.4, + "learning_rate": 6.314647786217117e-06, + "loss": 1.7935, + "step": 30195000 + }, + { + "epoch": 87.4, + "learning_rate": 6.3139241385698405e-06, + "loss": 1.8103, + "step": 30195500 + }, + { + "epoch": 87.41, + "learning_rate": 6.313200490922564e-06, + "loss": 1.8133, + "step": 30196000 + }, + { + "epoch": 87.41, + "learning_rate": 6.3124782905705825e-06, + "loss": 1.7978, + "step": 30196500 + }, + { + "epoch": 87.41, + "learning_rate": 6.311754642923305e-06, + "loss": 1.818, + "step": 30197000 + }, + { + "epoch": 87.41, + "learning_rate": 6.311030995276028e-06, + "loss": 1.7671, + "step": 30197500 + }, + { + "epoch": 87.41, + "learning_rate": 6.310307347628753e-06, + "loss": 1.8327, + "step": 30198000 + }, + { + "epoch": 87.41, + "learning_rate": 6.309583699981475e-06, + "loss": 1.797, + "step": 30198500 + }, + { + "epoch": 87.41, + "learning_rate": 6.308860052334198e-06, + "loss": 1.8155, + "step": 30199000 + }, + { + "epoch": 87.42, + "learning_rate": 6.308136404686922e-06, + "loss": 1.8201, + "step": 30199500 + }, + { + "epoch": 87.42, + "learning_rate": 6.307412757039645e-06, + "loss": 1.8219, + "step": 30200000 + }, + { + "epoch": 87.42, + "learning_rate": 6.306689109392368e-06, + "loss": 1.8307, + "step": 30200500 + }, + { + "epoch": 87.42, + "learning_rate": 6.30596546174509e-06, + "loss": 1.7679, + "step": 30201000 + }, + { + "epoch": 87.42, + "learning_rate": 6.305241814097815e-06, + "loss": 1.8427, + "step": 30201500 + }, + { + "epoch": 87.42, + "learning_rate": 6.304518166450537e-06, + "loss": 1.812, + "step": 30202000 + }, + { + "epoch": 87.42, + "learning_rate": 6.303795966098555e-06, + "loss": 1.789, + "step": 30202500 + }, + { + "epoch": 87.43, + "learning_rate": 6.303072318451278e-06, + "loss": 1.7973, + "step": 30203000 + }, + { + "epoch": 87.43, + "learning_rate": 6.302348670804002e-06, + "loss": 1.7926, + "step": 30203500 + }, + { + "epoch": 87.43, + "learning_rate": 6.301625023156725e-06, + "loss": 1.8234, + "step": 30204000 + }, + { + "epoch": 87.43, + "learning_rate": 6.300901375509448e-06, + "loss": 1.8286, + "step": 30204500 + }, + { + "epoch": 87.43, + "learning_rate": 6.3001777278621724e-06, + "loss": 1.8108, + "step": 30205000 + }, + { + "epoch": 87.43, + "learning_rate": 6.299454080214895e-06, + "loss": 1.8179, + "step": 30205500 + }, + { + "epoch": 87.43, + "learning_rate": 6.298731879862913e-06, + "loss": 1.7846, + "step": 30206000 + }, + { + "epoch": 87.44, + "learning_rate": 6.298008232215635e-06, + "loss": 1.8125, + "step": 30206500 + }, + { + "epoch": 87.44, + "learning_rate": 6.297286031863653e-06, + "loss": 1.8201, + "step": 30207000 + }, + { + "epoch": 87.44, + "learning_rate": 6.296562384216377e-06, + "loss": 1.8194, + "step": 30207500 + }, + { + "epoch": 87.44, + "learning_rate": 6.2958387365691e-06, + "loss": 1.8119, + "step": 30208000 + }, + { + "epoch": 87.44, + "learning_rate": 6.295115088921822e-06, + "loss": 1.7976, + "step": 30208500 + }, + { + "epoch": 87.44, + "learning_rate": 6.294391441274547e-06, + "loss": 1.8062, + "step": 30209000 + }, + { + "epoch": 87.44, + "learning_rate": 6.29366779362727e-06, + "loss": 1.8361, + "step": 30209500 + }, + { + "epoch": 87.45, + "learning_rate": 6.292944145979992e-06, + "loss": 1.8214, + "step": 30210000 + }, + { + "epoch": 87.45, + "learning_rate": 6.2922204983327155e-06, + "loss": 1.787, + "step": 30210500 + }, + { + "epoch": 87.45, + "learning_rate": 6.2914968506854394e-06, + "loss": 1.8001, + "step": 30211000 + }, + { + "epoch": 87.45, + "learning_rate": 6.2907732030381625e-06, + "loss": 1.7697, + "step": 30211500 + }, + { + "epoch": 87.45, + "learning_rate": 6.29005100268618e-06, + "loss": 1.7771, + "step": 30212000 + }, + { + "epoch": 87.45, + "learning_rate": 6.2893273550389045e-06, + "loss": 1.8292, + "step": 30212500 + }, + { + "epoch": 87.45, + "learning_rate": 6.288605154686922e-06, + "loss": 1.8192, + "step": 30213000 + }, + { + "epoch": 87.46, + "learning_rate": 6.287882954334939e-06, + "loss": 1.8023, + "step": 30213500 + }, + { + "epoch": 87.46, + "learning_rate": 6.287159306687662e-06, + "loss": 1.7866, + "step": 30214000 + }, + { + "epoch": 87.46, + "learning_rate": 6.286435659040385e-06, + "loss": 1.802, + "step": 30214500 + }, + { + "epoch": 87.46, + "learning_rate": 6.285712011393109e-06, + "loss": 1.8047, + "step": 30215000 + }, + { + "epoch": 87.46, + "learning_rate": 6.284989811041126e-06, + "loss": 1.792, + "step": 30215500 + }, + { + "epoch": 87.46, + "learning_rate": 6.2842661633938495e-06, + "loss": 1.8145, + "step": 30216000 + }, + { + "epoch": 87.46, + "learning_rate": 6.2835425157465725e-06, + "loss": 1.8035, + "step": 30216500 + }, + { + "epoch": 87.47, + "learning_rate": 6.2828188680992965e-06, + "loss": 1.7781, + "step": 30217000 + }, + { + "epoch": 87.47, + "learning_rate": 6.2820952204520195e-06, + "loss": 1.7895, + "step": 30217500 + }, + { + "epoch": 87.47, + "learning_rate": 6.281371572804743e-06, + "loss": 1.788, + "step": 30218000 + }, + { + "epoch": 87.47, + "learning_rate": 6.2806479251574665e-06, + "loss": 1.7845, + "step": 30218500 + }, + { + "epoch": 87.47, + "learning_rate": 6.27992427751019e-06, + "loss": 1.8075, + "step": 30219000 + }, + { + "epoch": 87.47, + "learning_rate": 6.279200629862912e-06, + "loss": 1.8072, + "step": 30219500 + }, + { + "epoch": 87.47, + "learning_rate": 6.278476982215637e-06, + "loss": 1.7774, + "step": 30220000 + }, + { + "epoch": 87.48, + "learning_rate": 6.277753334568359e-06, + "loss": 1.8201, + "step": 30220500 + }, + { + "epoch": 87.48, + "learning_rate": 6.277029686921082e-06, + "loss": 1.7974, + "step": 30221000 + }, + { + "epoch": 87.48, + "learning_rate": 6.276306039273805e-06, + "loss": 1.7822, + "step": 30221500 + }, + { + "epoch": 87.48, + "learning_rate": 6.275583838921824e-06, + "loss": 1.7863, + "step": 30222000 + }, + { + "epoch": 87.48, + "learning_rate": 6.274860191274547e-06, + "loss": 1.7855, + "step": 30222500 + }, + { + "epoch": 87.48, + "learning_rate": 6.274136543627269e-06, + "loss": 1.7848, + "step": 30223000 + }, + { + "epoch": 87.48, + "learning_rate": 6.273412895979992e-06, + "loss": 1.779, + "step": 30223500 + }, + { + "epoch": 87.49, + "learning_rate": 6.272689248332716e-06, + "loss": 1.8421, + "step": 30224000 + }, + { + "epoch": 87.49, + "learning_rate": 6.271965600685439e-06, + "loss": 1.7868, + "step": 30224500 + }, + { + "epoch": 87.49, + "learning_rate": 6.2712419530381625e-06, + "loss": 1.7889, + "step": 30225000 + }, + { + "epoch": 87.49, + "learning_rate": 6.270518305390886e-06, + "loss": 1.7887, + "step": 30225500 + }, + { + "epoch": 87.49, + "learning_rate": 6.2697946577436095e-06, + "loss": 1.8139, + "step": 30226000 + }, + { + "epoch": 87.49, + "learning_rate": 6.269072457391627e-06, + "loss": 1.7902, + "step": 30226500 + }, + { + "epoch": 87.49, + "learning_rate": 6.26834880974435e-06, + "loss": 1.8232, + "step": 30227000 + }, + { + "epoch": 87.5, + "learning_rate": 6.267625162097074e-06, + "loss": 1.8035, + "step": 30227500 + }, + { + "epoch": 87.5, + "learning_rate": 6.266901514449797e-06, + "loss": 1.8256, + "step": 30228000 + }, + { + "epoch": 87.5, + "learning_rate": 6.26617786680252e-06, + "loss": 1.7876, + "step": 30228500 + }, + { + "epoch": 87.5, + "learning_rate": 6.265455666450537e-06, + "loss": 1.7931, + "step": 30229000 + }, + { + "epoch": 87.5, + "learning_rate": 6.264732018803261e-06, + "loss": 1.7742, + "step": 30229500 + }, + { + "epoch": 87.5, + "learning_rate": 6.264008371155984e-06, + "loss": 1.8072, + "step": 30230000 + }, + { + "epoch": 87.5, + "learning_rate": 6.263286170804001e-06, + "loss": 1.8129, + "step": 30230500 + }, + { + "epoch": 87.51, + "learning_rate": 6.2625625231567245e-06, + "loss": 1.7912, + "step": 30231000 + }, + { + "epoch": 87.51, + "learning_rate": 6.261838875509448e-06, + "loss": 1.7931, + "step": 30231500 + }, + { + "epoch": 87.51, + "learning_rate": 6.2611152278621715e-06, + "loss": 1.8052, + "step": 30232000 + }, + { + "epoch": 87.51, + "learning_rate": 6.2603915802148946e-06, + "loss": 1.7949, + "step": 30232500 + }, + { + "epoch": 87.51, + "learning_rate": 6.2596679325676185e-06, + "loss": 1.7755, + "step": 30233000 + }, + { + "epoch": 87.51, + "learning_rate": 6.2589442849203416e-06, + "loss": 1.8078, + "step": 30233500 + }, + { + "epoch": 87.52, + "learning_rate": 6.258220637273065e-06, + "loss": 1.7919, + "step": 30234000 + }, + { + "epoch": 87.52, + "learning_rate": 6.257496989625787e-06, + "loss": 1.804, + "step": 30234500 + }, + { + "epoch": 87.52, + "learning_rate": 6.256773341978512e-06, + "loss": 1.8148, + "step": 30235000 + }, + { + "epoch": 87.52, + "learning_rate": 6.256051141626529e-06, + "loss": 1.8164, + "step": 30235500 + }, + { + "epoch": 87.52, + "learning_rate": 6.255328941274546e-06, + "loss": 1.7746, + "step": 30236000 + }, + { + "epoch": 87.52, + "learning_rate": 6.254605293627269e-06, + "loss": 1.8127, + "step": 30236500 + }, + { + "epoch": 87.52, + "learning_rate": 6.253881645979993e-06, + "loss": 1.8101, + "step": 30237000 + }, + { + "epoch": 87.53, + "learning_rate": 6.253157998332716e-06, + "loss": 1.8048, + "step": 30237500 + }, + { + "epoch": 87.53, + "learning_rate": 6.252434350685439e-06, + "loss": 1.7994, + "step": 30238000 + }, + { + "epoch": 87.53, + "learning_rate": 6.2517107030381616e-06, + "loss": 1.7999, + "step": 30238500 + }, + { + "epoch": 87.53, + "learning_rate": 6.250987055390886e-06, + "loss": 1.7997, + "step": 30239000 + }, + { + "epoch": 87.53, + "learning_rate": 6.2502634077436086e-06, + "loss": 1.788, + "step": 30239500 + }, + { + "epoch": 87.53, + "learning_rate": 6.2495397600963325e-06, + "loss": 1.8106, + "step": 30240000 + }, + { + "epoch": 87.53, + "learning_rate": 6.24881755974435e-06, + "loss": 1.7983, + "step": 30240500 + }, + { + "epoch": 87.54, + "learning_rate": 6.248093912097074e-06, + "loss": 1.82, + "step": 30241000 + }, + { + "epoch": 87.54, + "learning_rate": 6.247370264449797e-06, + "loss": 1.7744, + "step": 30241500 + }, + { + "epoch": 87.54, + "learning_rate": 6.24664661680252e-06, + "loss": 1.8322, + "step": 30242000 + }, + { + "epoch": 87.54, + "learning_rate": 6.245922969155243e-06, + "loss": 1.7948, + "step": 30242500 + }, + { + "epoch": 87.54, + "learning_rate": 6.245200768803261e-06, + "loss": 1.8033, + "step": 30243000 + }, + { + "epoch": 87.54, + "learning_rate": 6.244477121155984e-06, + "loss": 1.8007, + "step": 30243500 + }, + { + "epoch": 87.54, + "learning_rate": 6.243753473508707e-06, + "loss": 1.8112, + "step": 30244000 + }, + { + "epoch": 87.55, + "learning_rate": 6.24302982586143e-06, + "loss": 1.8124, + "step": 30244500 + }, + { + "epoch": 87.55, + "learning_rate": 6.242306178214153e-06, + "loss": 1.8152, + "step": 30245000 + }, + { + "epoch": 87.55, + "learning_rate": 6.2415839778621714e-06, + "loss": 1.8145, + "step": 30245500 + }, + { + "epoch": 87.55, + "learning_rate": 6.2408603302148945e-06, + "loss": 1.807, + "step": 30246000 + }, + { + "epoch": 87.55, + "learning_rate": 6.240136682567618e-06, + "loss": 1.7901, + "step": 30246500 + }, + { + "epoch": 87.55, + "learning_rate": 6.2394130349203415e-06, + "loss": 1.8013, + "step": 30247000 + }, + { + "epoch": 87.55, + "learning_rate": 6.238690834568359e-06, + "loss": 1.8184, + "step": 30247500 + }, + { + "epoch": 87.56, + "learning_rate": 6.237967186921082e-06, + "loss": 1.7942, + "step": 30248000 + }, + { + "epoch": 87.56, + "learning_rate": 6.237243539273806e-06, + "loss": 1.8087, + "step": 30248500 + }, + { + "epoch": 87.56, + "learning_rate": 6.236519891626529e-06, + "loss": 1.8118, + "step": 30249000 + }, + { + "epoch": 87.56, + "learning_rate": 6.235796243979252e-06, + "loss": 1.8043, + "step": 30249500 + }, + { + "epoch": 87.56, + "learning_rate": 6.235072596331975e-06, + "loss": 1.7781, + "step": 30250000 + }, + { + "epoch": 87.56, + "learning_rate": 6.234348948684698e-06, + "loss": 1.8014, + "step": 30250500 + }, + { + "epoch": 87.56, + "learning_rate": 6.233625301037421e-06, + "loss": 1.7901, + "step": 30251000 + }, + { + "epoch": 87.57, + "learning_rate": 6.232903100685439e-06, + "loss": 1.8068, + "step": 30251500 + }, + { + "epoch": 87.57, + "learning_rate": 6.232180900333457e-06, + "loss": 1.7881, + "step": 30252000 + }, + { + "epoch": 87.57, + "learning_rate": 6.2314572526861805e-06, + "loss": 1.7986, + "step": 30252500 + }, + { + "epoch": 87.57, + "learning_rate": 6.2307336050389035e-06, + "loss": 1.7873, + "step": 30253000 + }, + { + "epoch": 87.57, + "learning_rate": 6.230011404686922e-06, + "loss": 1.787, + "step": 30253500 + }, + { + "epoch": 87.57, + "learning_rate": 6.229287757039645e-06, + "loss": 1.7831, + "step": 30254000 + }, + { + "epoch": 87.57, + "learning_rate": 6.228564109392368e-06, + "loss": 1.8214, + "step": 30254500 + }, + { + "epoch": 87.58, + "learning_rate": 6.227840461745091e-06, + "loss": 1.8054, + "step": 30255000 + }, + { + "epoch": 87.58, + "learning_rate": 6.227116814097814e-06, + "loss": 1.8027, + "step": 30255500 + }, + { + "epoch": 87.58, + "learning_rate": 6.226393166450537e-06, + "loss": 1.7996, + "step": 30256000 + }, + { + "epoch": 87.58, + "learning_rate": 6.225669518803261e-06, + "loss": 1.7939, + "step": 30256500 + }, + { + "epoch": 87.58, + "learning_rate": 6.224945871155984e-06, + "loss": 1.7868, + "step": 30257000 + }, + { + "epoch": 87.58, + "learning_rate": 6.224223670804002e-06, + "loss": 1.8099, + "step": 30257500 + }, + { + "epoch": 87.58, + "learning_rate": 6.223500023156725e-06, + "loss": 1.7935, + "step": 30258000 + }, + { + "epoch": 87.59, + "learning_rate": 6.222776375509448e-06, + "loss": 1.8291, + "step": 30258500 + }, + { + "epoch": 87.59, + "learning_rate": 6.222052727862171e-06, + "loss": 1.7893, + "step": 30259000 + }, + { + "epoch": 87.59, + "learning_rate": 6.2213290802148945e-06, + "loss": 1.8155, + "step": 30259500 + }, + { + "epoch": 87.59, + "learning_rate": 6.220605432567618e-06, + "loss": 1.7982, + "step": 30260000 + }, + { + "epoch": 87.59, + "learning_rate": 6.219883232215636e-06, + "loss": 1.8104, + "step": 30260500 + }, + { + "epoch": 87.59, + "learning_rate": 6.219159584568359e-06, + "loss": 1.791, + "step": 30261000 + }, + { + "epoch": 87.59, + "learning_rate": 6.218435936921082e-06, + "loss": 1.8047, + "step": 30261500 + }, + { + "epoch": 87.6, + "learning_rate": 6.217712289273806e-06, + "loss": 1.8027, + "step": 30262000 + }, + { + "epoch": 87.6, + "learning_rate": 6.216990088921823e-06, + "loss": 1.8204, + "step": 30262500 + }, + { + "epoch": 87.6, + "learning_rate": 6.216266441274547e-06, + "loss": 1.7988, + "step": 30263000 + }, + { + "epoch": 87.6, + "learning_rate": 6.215542793627269e-06, + "loss": 1.7696, + "step": 30263500 + }, + { + "epoch": 87.6, + "learning_rate": 6.214819145979993e-06, + "loss": 1.8257, + "step": 30264000 + }, + { + "epoch": 87.6, + "learning_rate": 6.214095498332716e-06, + "loss": 1.8288, + "step": 30264500 + }, + { + "epoch": 87.6, + "learning_rate": 6.213371850685439e-06, + "loss": 1.7992, + "step": 30265000 + }, + { + "epoch": 87.61, + "learning_rate": 6.212648203038163e-06, + "loss": 1.8051, + "step": 30265500 + }, + { + "epoch": 87.61, + "learning_rate": 6.211924555390885e-06, + "loss": 1.8011, + "step": 30266000 + }, + { + "epoch": 87.61, + "learning_rate": 6.2112023550389035e-06, + "loss": 1.7942, + "step": 30266500 + }, + { + "epoch": 87.61, + "learning_rate": 6.2104787073916266e-06, + "loss": 1.7952, + "step": 30267000 + }, + { + "epoch": 87.61, + "learning_rate": 6.2097550597443505e-06, + "loss": 1.8084, + "step": 30267500 + }, + { + "epoch": 87.61, + "learning_rate": 6.209031412097073e-06, + "loss": 1.8111, + "step": 30268000 + }, + { + "epoch": 87.61, + "learning_rate": 6.208307764449797e-06, + "loss": 1.8183, + "step": 30268500 + }, + { + "epoch": 87.62, + "learning_rate": 6.20758411680252e-06, + "loss": 1.8003, + "step": 30269000 + }, + { + "epoch": 87.62, + "learning_rate": 6.206860469155243e-06, + "loss": 1.7824, + "step": 30269500 + }, + { + "epoch": 87.62, + "learning_rate": 6.206136821507967e-06, + "loss": 1.8481, + "step": 30270000 + }, + { + "epoch": 87.62, + "learning_rate": 6.205413173860689e-06, + "loss": 1.8196, + "step": 30270500 + }, + { + "epoch": 87.62, + "learning_rate": 6.204690973508707e-06, + "loss": 1.7942, + "step": 30271000 + }, + { + "epoch": 87.62, + "learning_rate": 6.20396732586143e-06, + "loss": 1.8084, + "step": 30271500 + }, + { + "epoch": 87.63, + "learning_rate": 6.203243678214154e-06, + "loss": 1.792, + "step": 30272000 + }, + { + "epoch": 87.63, + "learning_rate": 6.202520030566876e-06, + "loss": 1.8108, + "step": 30272500 + }, + { + "epoch": 87.63, + "learning_rate": 6.201797830214895e-06, + "loss": 1.8326, + "step": 30273000 + }, + { + "epoch": 87.63, + "learning_rate": 6.2010741825676175e-06, + "loss": 1.7913, + "step": 30273500 + }, + { + "epoch": 87.63, + "learning_rate": 6.200350534920341e-06, + "loss": 1.8285, + "step": 30274000 + }, + { + "epoch": 87.63, + "learning_rate": 6.1996268872730645e-06, + "loss": 1.7915, + "step": 30274500 + }, + { + "epoch": 87.63, + "learning_rate": 6.1989032396257876e-06, + "loss": 1.8038, + "step": 30275000 + }, + { + "epoch": 87.64, + "learning_rate": 6.1981795919785115e-06, + "loss": 1.8088, + "step": 30275500 + }, + { + "epoch": 87.64, + "learning_rate": 6.197455944331234e-06, + "loss": 1.825, + "step": 30276000 + }, + { + "epoch": 87.64, + "learning_rate": 6.196732296683958e-06, + "loss": 1.8138, + "step": 30276500 + }, + { + "epoch": 87.64, + "learning_rate": 6.196008649036681e-06, + "loss": 1.7977, + "step": 30277000 + }, + { + "epoch": 87.64, + "learning_rate": 6.195285001389404e-06, + "loss": 1.7981, + "step": 30277500 + }, + { + "epoch": 87.64, + "learning_rate": 6.194561353742127e-06, + "loss": 1.8187, + "step": 30278000 + }, + { + "epoch": 87.64, + "learning_rate": 6.19383770609485e-06, + "loss": 1.8151, + "step": 30278500 + }, + { + "epoch": 87.65, + "learning_rate": 6.193115505742868e-06, + "loss": 1.7886, + "step": 30279000 + }, + { + "epoch": 87.65, + "learning_rate": 6.192393305390886e-06, + "loss": 1.8159, + "step": 30279500 + }, + { + "epoch": 87.65, + "learning_rate": 6.191669657743608e-06, + "loss": 1.7888, + "step": 30280000 + }, + { + "epoch": 87.65, + "learning_rate": 6.190946010096332e-06, + "loss": 1.7859, + "step": 30280500 + }, + { + "epoch": 87.65, + "learning_rate": 6.190222362449055e-06, + "loss": 1.813, + "step": 30281000 + }, + { + "epoch": 87.65, + "learning_rate": 6.1894987148017785e-06, + "loss": 1.8152, + "step": 30281500 + }, + { + "epoch": 87.65, + "learning_rate": 6.1887750671545024e-06, + "loss": 1.8192, + "step": 30282000 + }, + { + "epoch": 87.66, + "learning_rate": 6.18805286680252e-06, + "loss": 1.8089, + "step": 30282500 + }, + { + "epoch": 87.66, + "learning_rate": 6.187329219155244e-06, + "loss": 1.8024, + "step": 30283000 + }, + { + "epoch": 87.66, + "learning_rate": 6.186605571507966e-06, + "loss": 1.8163, + "step": 30283500 + }, + { + "epoch": 87.66, + "learning_rate": 6.18588192386069e-06, + "loss": 1.8286, + "step": 30284000 + }, + { + "epoch": 87.66, + "learning_rate": 6.185159723508707e-06, + "loss": 1.8119, + "step": 30284500 + }, + { + "epoch": 87.66, + "learning_rate": 6.184436075861431e-06, + "loss": 1.8395, + "step": 30285000 + }, + { + "epoch": 87.66, + "learning_rate": 6.183712428214153e-06, + "loss": 1.8102, + "step": 30285500 + }, + { + "epoch": 87.67, + "learning_rate": 6.182988780566877e-06, + "loss": 1.7888, + "step": 30286000 + }, + { + "epoch": 87.67, + "learning_rate": 6.1822651329196e-06, + "loss": 1.7864, + "step": 30286500 + }, + { + "epoch": 87.67, + "learning_rate": 6.181541485272323e-06, + "loss": 1.8107, + "step": 30287000 + }, + { + "epoch": 87.67, + "learning_rate": 6.180817837625046e-06, + "loss": 1.8415, + "step": 30287500 + }, + { + "epoch": 87.67, + "learning_rate": 6.1800970845683595e-06, + "loss": 1.8061, + "step": 30288000 + }, + { + "epoch": 87.67, + "learning_rate": 6.179373436921082e-06, + "loss": 1.8241, + "step": 30288500 + }, + { + "epoch": 87.67, + "learning_rate": 6.178649789273806e-06, + "loss": 1.7866, + "step": 30289000 + }, + { + "epoch": 87.68, + "learning_rate": 6.177926141626529e-06, + "loss": 1.8047, + "step": 30289500 + }, + { + "epoch": 87.68, + "learning_rate": 6.177202493979252e-06, + "loss": 1.781, + "step": 30290000 + }, + { + "epoch": 87.68, + "learning_rate": 6.176478846331975e-06, + "loss": 1.7939, + "step": 30290500 + }, + { + "epoch": 87.68, + "learning_rate": 6.175755198684698e-06, + "loss": 1.8146, + "step": 30291000 + }, + { + "epoch": 87.68, + "learning_rate": 6.175031551037422e-06, + "loss": 1.8085, + "step": 30291500 + }, + { + "epoch": 87.68, + "learning_rate": 6.174307903390145e-06, + "loss": 1.7927, + "step": 30292000 + }, + { + "epoch": 87.68, + "learning_rate": 6.173585703038163e-06, + "loss": 1.7804, + "step": 30292500 + }, + { + "epoch": 87.69, + "learning_rate": 6.172862055390886e-06, + "loss": 1.8121, + "step": 30293000 + }, + { + "epoch": 87.69, + "learning_rate": 6.172138407743609e-06, + "loss": 1.778, + "step": 30293500 + }, + { + "epoch": 87.69, + "learning_rate": 6.1714162073916265e-06, + "loss": 1.8211, + "step": 30294000 + }, + { + "epoch": 87.69, + "learning_rate": 6.17069255974435e-06, + "loss": 1.8262, + "step": 30294500 + }, + { + "epoch": 87.69, + "learning_rate": 6.1699689120970735e-06, + "loss": 1.81, + "step": 30295000 + }, + { + "epoch": 87.69, + "learning_rate": 6.1692452644497965e-06, + "loss": 1.8006, + "step": 30295500 + }, + { + "epoch": 87.69, + "learning_rate": 6.168523064097814e-06, + "loss": 1.8077, + "step": 30296000 + }, + { + "epoch": 87.7, + "learning_rate": 6.167799416450538e-06, + "loss": 1.8484, + "step": 30296500 + }, + { + "epoch": 87.7, + "learning_rate": 6.167075768803261e-06, + "loss": 1.8034, + "step": 30297000 + }, + { + "epoch": 87.7, + "learning_rate": 6.166352121155984e-06, + "loss": 1.8062, + "step": 30297500 + }, + { + "epoch": 87.7, + "learning_rate": 6.165628473508707e-06, + "loss": 1.8073, + "step": 30298000 + }, + { + "epoch": 87.7, + "learning_rate": 6.16490482586143e-06, + "loss": 1.8007, + "step": 30298500 + }, + { + "epoch": 87.7, + "learning_rate": 6.164181178214154e-06, + "loss": 1.7938, + "step": 30299000 + }, + { + "epoch": 87.7, + "learning_rate": 6.163457530566877e-06, + "loss": 1.7881, + "step": 30299500 + }, + { + "epoch": 87.71, + "learning_rate": 6.1627338829196e-06, + "loss": 1.7954, + "step": 30300000 + }, + { + "epoch": 87.71, + "learning_rate": 6.162011682567618e-06, + "loss": 1.7975, + "step": 30300500 + }, + { + "epoch": 87.71, + "learning_rate": 6.161288034920341e-06, + "loss": 1.7792, + "step": 30301000 + }, + { + "epoch": 87.71, + "learning_rate": 6.160564387273064e-06, + "loss": 1.8014, + "step": 30301500 + }, + { + "epoch": 87.71, + "learning_rate": 6.1598407396257875e-06, + "loss": 1.7969, + "step": 30302000 + }, + { + "epoch": 87.71, + "learning_rate": 6.1591185392738056e-06, + "loss": 1.8206, + "step": 30302500 + }, + { + "epoch": 87.71, + "learning_rate": 6.158394891626529e-06, + "loss": 1.8145, + "step": 30303000 + }, + { + "epoch": 87.72, + "learning_rate": 6.157671243979252e-06, + "loss": 1.796, + "step": 30303500 + }, + { + "epoch": 87.72, + "learning_rate": 6.156947596331975e-06, + "loss": 1.7824, + "step": 30304000 + }, + { + "epoch": 87.72, + "learning_rate": 6.156225395979993e-06, + "loss": 1.7885, + "step": 30304500 + }, + { + "epoch": 87.72, + "learning_rate": 6.155501748332716e-06, + "loss": 1.8066, + "step": 30305000 + }, + { + "epoch": 87.72, + "learning_rate": 6.154778100685439e-06, + "loss": 1.8116, + "step": 30305500 + }, + { + "epoch": 87.72, + "learning_rate": 6.154054453038163e-06, + "loss": 1.7917, + "step": 30306000 + }, + { + "epoch": 87.72, + "learning_rate": 6.153330805390886e-06, + "loss": 1.8043, + "step": 30306500 + }, + { + "epoch": 87.73, + "learning_rate": 6.152608605038903e-06, + "loss": 1.8262, + "step": 30307000 + }, + { + "epoch": 87.73, + "learning_rate": 6.151884957391626e-06, + "loss": 1.8376, + "step": 30307500 + }, + { + "epoch": 87.73, + "learning_rate": 6.15116130974435e-06, + "loss": 1.8143, + "step": 30308000 + }, + { + "epoch": 87.73, + "learning_rate": 6.150437662097073e-06, + "loss": 1.83, + "step": 30308500 + }, + { + "epoch": 87.73, + "learning_rate": 6.1497154617450915e-06, + "loss": 1.8029, + "step": 30309000 + }, + { + "epoch": 87.73, + "learning_rate": 6.148991814097815e-06, + "loss": 1.8025, + "step": 30309500 + }, + { + "epoch": 87.74, + "learning_rate": 6.148268166450538e-06, + "loss": 1.8054, + "step": 30310000 + }, + { + "epoch": 87.74, + "learning_rate": 6.147544518803261e-06, + "loss": 1.789, + "step": 30310500 + }, + { + "epoch": 87.74, + "learning_rate": 6.146820871155984e-06, + "loss": 1.8201, + "step": 30311000 + }, + { + "epoch": 87.74, + "learning_rate": 6.146098670804002e-06, + "loss": 1.8292, + "step": 30311500 + }, + { + "epoch": 87.74, + "learning_rate": 6.145375023156725e-06, + "loss": 1.7879, + "step": 30312000 + }, + { + "epoch": 87.74, + "learning_rate": 6.144651375509448e-06, + "loss": 1.8368, + "step": 30312500 + }, + { + "epoch": 87.74, + "learning_rate": 6.14393062245276e-06, + "loss": 1.7833, + "step": 30313000 + }, + { + "epoch": 87.75, + "learning_rate": 6.1432069748054834e-06, + "loss": 1.8123, + "step": 30313500 + }, + { + "epoch": 87.75, + "learning_rate": 6.142483327158207e-06, + "loss": 1.7887, + "step": 30314000 + }, + { + "epoch": 87.75, + "learning_rate": 6.1417596795109304e-06, + "loss": 1.7951, + "step": 30314500 + }, + { + "epoch": 87.75, + "learning_rate": 6.1410360318636535e-06, + "loss": 1.801, + "step": 30315000 + }, + { + "epoch": 87.75, + "learning_rate": 6.140312384216377e-06, + "loss": 1.7933, + "step": 30315500 + }, + { + "epoch": 87.75, + "learning_rate": 6.139590183864395e-06, + "loss": 1.7822, + "step": 30316000 + }, + { + "epoch": 87.75, + "learning_rate": 6.138866536217118e-06, + "loss": 1.8122, + "step": 30316500 + }, + { + "epoch": 87.76, + "learning_rate": 6.138142888569841e-06, + "loss": 1.8093, + "step": 30317000 + }, + { + "epoch": 87.76, + "learning_rate": 6.137419240922564e-06, + "loss": 1.7799, + "step": 30317500 + }, + { + "epoch": 87.76, + "learning_rate": 6.136695593275287e-06, + "loss": 1.8101, + "step": 30318000 + }, + { + "epoch": 87.76, + "learning_rate": 6.135971945628011e-06, + "loss": 1.8023, + "step": 30318500 + }, + { + "epoch": 87.76, + "learning_rate": 6.135248297980734e-06, + "loss": 1.8235, + "step": 30319000 + }, + { + "epoch": 87.76, + "learning_rate": 6.134524650333457e-06, + "loss": 1.7778, + "step": 30319500 + }, + { + "epoch": 87.76, + "learning_rate": 6.133802449981474e-06, + "loss": 1.7874, + "step": 30320000 + }, + { + "epoch": 87.77, + "learning_rate": 6.1330802496294925e-06, + "loss": 1.8329, + "step": 30320500 + }, + { + "epoch": 87.77, + "learning_rate": 6.1323566019822155e-06, + "loss": 1.8202, + "step": 30321000 + }, + { + "epoch": 87.77, + "learning_rate": 6.1316329543349395e-06, + "loss": 1.809, + "step": 30321500 + }, + { + "epoch": 87.77, + "learning_rate": 6.1309093066876625e-06, + "loss": 1.8252, + "step": 30322000 + }, + { + "epoch": 87.77, + "learning_rate": 6.130185659040386e-06, + "loss": 1.8245, + "step": 30322500 + }, + { + "epoch": 87.77, + "learning_rate": 6.129462011393109e-06, + "loss": 1.7971, + "step": 30323000 + }, + { + "epoch": 87.77, + "learning_rate": 6.128738363745832e-06, + "loss": 1.8086, + "step": 30323500 + }, + { + "epoch": 87.78, + "learning_rate": 6.128014716098556e-06, + "loss": 1.8166, + "step": 30324000 + }, + { + "epoch": 87.78, + "learning_rate": 6.127292515746573e-06, + "loss": 1.8172, + "step": 30324500 + }, + { + "epoch": 87.78, + "learning_rate": 6.126568868099297e-06, + "loss": 1.7865, + "step": 30325000 + }, + { + "epoch": 87.78, + "learning_rate": 6.125845220452019e-06, + "loss": 1.7965, + "step": 30325500 + }, + { + "epoch": 87.78, + "learning_rate": 6.125121572804743e-06, + "loss": 1.7606, + "step": 30326000 + }, + { + "epoch": 87.78, + "learning_rate": 6.124397925157465e-06, + "loss": 1.82, + "step": 30326500 + }, + { + "epoch": 87.78, + "learning_rate": 6.123674277510189e-06, + "loss": 1.8018, + "step": 30327000 + }, + { + "epoch": 87.79, + "learning_rate": 6.122950629862913e-06, + "loss": 1.7833, + "step": 30327500 + }, + { + "epoch": 87.79, + "learning_rate": 6.122226982215635e-06, + "loss": 1.7893, + "step": 30328000 + }, + { + "epoch": 87.79, + "learning_rate": 6.1215047818636535e-06, + "loss": 1.8163, + "step": 30328500 + }, + { + "epoch": 87.79, + "learning_rate": 6.1207811342163766e-06, + "loss": 1.8034, + "step": 30329000 + }, + { + "epoch": 87.79, + "learning_rate": 6.1200574865691005e-06, + "loss": 1.7886, + "step": 30329500 + }, + { + "epoch": 87.79, + "learning_rate": 6.119333838921823e-06, + "loss": 1.8242, + "step": 30330000 + }, + { + "epoch": 87.79, + "learning_rate": 6.118610191274547e-06, + "loss": 1.808, + "step": 30330500 + }, + { + "epoch": 87.8, + "learning_rate": 6.11788654362727e-06, + "loss": 1.8018, + "step": 30331000 + }, + { + "epoch": 87.8, + "learning_rate": 6.117162895979993e-06, + "loss": 1.8008, + "step": 30331500 + }, + { + "epoch": 87.8, + "learning_rate": 6.116439248332717e-06, + "loss": 1.8218, + "step": 30332000 + }, + { + "epoch": 87.8, + "learning_rate": 6.115715600685439e-06, + "loss": 1.8011, + "step": 30332500 + }, + { + "epoch": 87.8, + "learning_rate": 6.114991953038163e-06, + "loss": 1.8045, + "step": 30333000 + }, + { + "epoch": 87.8, + "learning_rate": 6.11426975268618e-06, + "loss": 1.8117, + "step": 30333500 + }, + { + "epoch": 87.8, + "learning_rate": 6.113546105038904e-06, + "loss": 1.7937, + "step": 30334000 + }, + { + "epoch": 87.81, + "learning_rate": 6.112822457391626e-06, + "loss": 1.7971, + "step": 30334500 + }, + { + "epoch": 87.81, + "learning_rate": 6.11209880974435e-06, + "loss": 1.822, + "step": 30335000 + }, + { + "epoch": 87.81, + "learning_rate": 6.111375162097073e-06, + "loss": 1.8005, + "step": 30335500 + }, + { + "epoch": 87.81, + "learning_rate": 6.110651514449796e-06, + "loss": 1.7807, + "step": 30336000 + }, + { + "epoch": 87.81, + "learning_rate": 6.10992786680252e-06, + "loss": 1.7935, + "step": 30336500 + }, + { + "epoch": 87.81, + "learning_rate": 6.1092056664505376e-06, + "loss": 1.8101, + "step": 30337000 + }, + { + "epoch": 87.81, + "learning_rate": 6.108482018803261e-06, + "loss": 1.8069, + "step": 30337500 + }, + { + "epoch": 87.82, + "learning_rate": 6.107758371155984e-06, + "loss": 1.8005, + "step": 30338000 + }, + { + "epoch": 87.82, + "learning_rate": 6.107034723508708e-06, + "loss": 1.7802, + "step": 30338500 + }, + { + "epoch": 87.82, + "learning_rate": 6.10631107586143e-06, + "loss": 1.7936, + "step": 30339000 + }, + { + "epoch": 87.82, + "learning_rate": 6.105587428214154e-06, + "loss": 1.8109, + "step": 30339500 + }, + { + "epoch": 87.82, + "learning_rate": 6.104865227862171e-06, + "loss": 1.8208, + "step": 30340000 + }, + { + "epoch": 87.82, + "learning_rate": 6.104141580214895e-06, + "loss": 1.808, + "step": 30340500 + }, + { + "epoch": 87.82, + "learning_rate": 6.103417932567618e-06, + "loss": 1.7879, + "step": 30341000 + }, + { + "epoch": 87.83, + "learning_rate": 6.102695732215636e-06, + "loss": 1.8012, + "step": 30341500 + }, + { + "epoch": 87.83, + "learning_rate": 6.101972084568358e-06, + "loss": 1.7942, + "step": 30342000 + }, + { + "epoch": 87.83, + "learning_rate": 6.101248436921082e-06, + "loss": 1.7853, + "step": 30342500 + }, + { + "epoch": 87.83, + "learning_rate": 6.100524789273805e-06, + "loss": 1.8081, + "step": 30343000 + }, + { + "epoch": 87.83, + "learning_rate": 6.0998011416265285e-06, + "loss": 1.7937, + "step": 30343500 + }, + { + "epoch": 87.83, + "learning_rate": 6.0990774939792524e-06, + "loss": 1.8354, + "step": 30344000 + }, + { + "epoch": 87.83, + "learning_rate": 6.098353846331975e-06, + "loss": 1.8411, + "step": 30344500 + }, + { + "epoch": 87.84, + "learning_rate": 6.097630198684699e-06, + "loss": 1.814, + "step": 30345000 + }, + { + "epoch": 87.84, + "learning_rate": 6.096907998332716e-06, + "loss": 1.8185, + "step": 30345500 + }, + { + "epoch": 87.84, + "learning_rate": 6.09618435068544e-06, + "loss": 1.824, + "step": 30346000 + }, + { + "epoch": 87.84, + "learning_rate": 6.095460703038163e-06, + "loss": 1.81, + "step": 30346500 + }, + { + "epoch": 87.84, + "learning_rate": 6.09473850268618e-06, + "loss": 1.7795, + "step": 30347000 + }, + { + "epoch": 87.84, + "learning_rate": 6.094014855038903e-06, + "loss": 1.8017, + "step": 30347500 + }, + { + "epoch": 87.85, + "learning_rate": 6.093291207391627e-06, + "loss": 1.8047, + "step": 30348000 + }, + { + "epoch": 87.85, + "learning_rate": 6.09256755974435e-06, + "loss": 1.7845, + "step": 30348500 + }, + { + "epoch": 87.85, + "learning_rate": 6.091843912097073e-06, + "loss": 1.783, + "step": 30349000 + }, + { + "epoch": 87.85, + "learning_rate": 6.091120264449796e-06, + "loss": 1.8551, + "step": 30349500 + }, + { + "epoch": 87.85, + "learning_rate": 6.090396616802519e-06, + "loss": 1.8221, + "step": 30350000 + }, + { + "epoch": 87.85, + "learning_rate": 6.089672969155243e-06, + "loss": 1.8116, + "step": 30350500 + }, + { + "epoch": 87.85, + "learning_rate": 6.088950768803261e-06, + "loss": 1.805, + "step": 30351000 + }, + { + "epoch": 87.86, + "learning_rate": 6.088227121155984e-06, + "loss": 1.8205, + "step": 30351500 + }, + { + "epoch": 87.86, + "learning_rate": 6.087503473508708e-06, + "loss": 1.7777, + "step": 30352000 + }, + { + "epoch": 87.86, + "learning_rate": 6.086779825861431e-06, + "loss": 1.8189, + "step": 30352500 + }, + { + "epoch": 87.86, + "learning_rate": 6.086056178214154e-06, + "loss": 1.8367, + "step": 30353000 + }, + { + "epoch": 87.86, + "learning_rate": 6.085332530566877e-06, + "loss": 1.7773, + "step": 30353500 + }, + { + "epoch": 87.86, + "learning_rate": 6.0846088829196e-06, + "loss": 1.7906, + "step": 30354000 + }, + { + "epoch": 87.86, + "learning_rate": 6.083885235272323e-06, + "loss": 1.8052, + "step": 30354500 + }, + { + "epoch": 87.87, + "learning_rate": 6.083163034920341e-06, + "loss": 1.7921, + "step": 30355000 + }, + { + "epoch": 87.87, + "learning_rate": 6.082440834568359e-06, + "loss": 1.801, + "step": 30355500 + }, + { + "epoch": 87.87, + "learning_rate": 6.081717186921082e-06, + "loss": 1.8096, + "step": 30356000 + }, + { + "epoch": 87.87, + "learning_rate": 6.080993539273805e-06, + "loss": 1.7988, + "step": 30356500 + }, + { + "epoch": 87.87, + "learning_rate": 6.0802698916265284e-06, + "loss": 1.8225, + "step": 30357000 + }, + { + "epoch": 87.87, + "learning_rate": 6.0795476912745465e-06, + "loss": 1.7895, + "step": 30357500 + }, + { + "epoch": 87.87, + "learning_rate": 6.07882404362727e-06, + "loss": 1.7848, + "step": 30358000 + }, + { + "epoch": 87.88, + "learning_rate": 6.078100395979993e-06, + "loss": 1.798, + "step": 30358500 + }, + { + "epoch": 87.88, + "learning_rate": 6.077376748332716e-06, + "loss": 1.7983, + "step": 30359000 + }, + { + "epoch": 87.88, + "learning_rate": 6.07665310068544e-06, + "loss": 1.8082, + "step": 30359500 + }, + { + "epoch": 87.88, + "learning_rate": 6.075930900333457e-06, + "loss": 1.8115, + "step": 30360000 + }, + { + "epoch": 87.88, + "learning_rate": 6.07520725268618e-06, + "loss": 1.8223, + "step": 30360500 + }, + { + "epoch": 87.88, + "learning_rate": 6.074483605038903e-06, + "loss": 1.7817, + "step": 30361000 + }, + { + "epoch": 87.88, + "learning_rate": 6.073759957391627e-06, + "loss": 1.799, + "step": 30361500 + }, + { + "epoch": 87.89, + "learning_rate": 6.07303630974435e-06, + "loss": 1.8017, + "step": 30362000 + }, + { + "epoch": 87.89, + "learning_rate": 6.072312662097073e-06, + "loss": 1.787, + "step": 30362500 + }, + { + "epoch": 87.89, + "learning_rate": 6.071590461745091e-06, + "loss": 1.8127, + "step": 30363000 + }, + { + "epoch": 87.89, + "learning_rate": 6.070866814097814e-06, + "loss": 1.8122, + "step": 30363500 + }, + { + "epoch": 87.89, + "learning_rate": 6.0701431664505375e-06, + "loss": 1.7999, + "step": 30364000 + }, + { + "epoch": 87.89, + "learning_rate": 6.0694195188032605e-06, + "loss": 1.771, + "step": 30364500 + }, + { + "epoch": 87.89, + "learning_rate": 6.0686958711559845e-06, + "loss": 1.807, + "step": 30365000 + }, + { + "epoch": 87.9, + "learning_rate": 6.067973670804002e-06, + "loss": 1.8332, + "step": 30365500 + }, + { + "epoch": 87.9, + "learning_rate": 6.067250023156725e-06, + "loss": 1.813, + "step": 30366000 + }, + { + "epoch": 87.9, + "learning_rate": 6.066526375509448e-06, + "loss": 1.79, + "step": 30366500 + }, + { + "epoch": 87.9, + "learning_rate": 6.065802727862172e-06, + "loss": 1.7811, + "step": 30367000 + }, + { + "epoch": 87.9, + "learning_rate": 6.065080527510189e-06, + "loss": 1.7942, + "step": 30367500 + }, + { + "epoch": 87.9, + "learning_rate": 6.064356879862913e-06, + "loss": 1.7968, + "step": 30368000 + }, + { + "epoch": 87.9, + "learning_rate": 6.06363467951093e-06, + "loss": 1.8252, + "step": 30368500 + }, + { + "epoch": 87.91, + "learning_rate": 6.062911031863653e-06, + "loss": 1.8047, + "step": 30369000 + }, + { + "epoch": 87.91, + "learning_rate": 6.062187384216376e-06, + "loss": 1.8033, + "step": 30369500 + }, + { + "epoch": 87.91, + "learning_rate": 6.0614637365691e-06, + "loss": 1.7802, + "step": 30370000 + }, + { + "epoch": 87.91, + "learning_rate": 6.0607400889218226e-06, + "loss": 1.8013, + "step": 30370500 + }, + { + "epoch": 87.91, + "learning_rate": 6.0600164412745465e-06, + "loss": 1.813, + "step": 30371000 + }, + { + "epoch": 87.91, + "learning_rate": 6.0592927936272696e-06, + "loss": 1.8179, + "step": 30371500 + }, + { + "epoch": 87.91, + "learning_rate": 6.058570593275288e-06, + "loss": 1.7924, + "step": 30372000 + }, + { + "epoch": 87.92, + "learning_rate": 6.057846945628011e-06, + "loss": 1.7919, + "step": 30372500 + }, + { + "epoch": 87.92, + "learning_rate": 6.057123297980734e-06, + "loss": 1.8113, + "step": 30373000 + }, + { + "epoch": 87.92, + "learning_rate": 6.056399650333457e-06, + "loss": 1.7964, + "step": 30373500 + }, + { + "epoch": 87.92, + "learning_rate": 6.05567600268618e-06, + "loss": 1.7899, + "step": 30374000 + }, + { + "epoch": 87.92, + "learning_rate": 6.054952355038904e-06, + "loss": 1.7886, + "step": 30374500 + }, + { + "epoch": 87.92, + "learning_rate": 6.054230154686921e-06, + "loss": 1.7847, + "step": 30375000 + }, + { + "epoch": 87.92, + "learning_rate": 6.053506507039645e-06, + "loss": 1.8198, + "step": 30375500 + }, + { + "epoch": 87.93, + "learning_rate": 6.052782859392367e-06, + "loss": 1.7856, + "step": 30376000 + }, + { + "epoch": 87.93, + "learning_rate": 6.052059211745091e-06, + "loss": 1.8375, + "step": 30376500 + }, + { + "epoch": 87.93, + "learning_rate": 6.051335564097814e-06, + "loss": 1.8027, + "step": 30377000 + }, + { + "epoch": 87.93, + "learning_rate": 6.0506133637458324e-06, + "loss": 1.8211, + "step": 30377500 + }, + { + "epoch": 87.93, + "learning_rate": 6.049889716098555e-06, + "loss": 1.8212, + "step": 30378000 + }, + { + "epoch": 87.93, + "learning_rate": 6.049166068451279e-06, + "loss": 1.8265, + "step": 30378500 + }, + { + "epoch": 87.93, + "learning_rate": 6.048442420804002e-06, + "loss": 1.814, + "step": 30379000 + }, + { + "epoch": 87.94, + "learning_rate": 6.047718773156725e-06, + "loss": 1.8134, + "step": 30379500 + }, + { + "epoch": 87.94, + "learning_rate": 6.046995125509449e-06, + "loss": 1.8094, + "step": 30380000 + }, + { + "epoch": 87.94, + "learning_rate": 6.046271477862171e-06, + "loss": 1.8136, + "step": 30380500 + }, + { + "epoch": 87.94, + "learning_rate": 6.045547830214895e-06, + "loss": 1.8045, + "step": 30381000 + }, + { + "epoch": 87.94, + "learning_rate": 6.044824182567618e-06, + "loss": 1.788, + "step": 30381500 + }, + { + "epoch": 87.94, + "learning_rate": 6.044101982215636e-06, + "loss": 1.8157, + "step": 30382000 + }, + { + "epoch": 87.94, + "learning_rate": 6.043378334568358e-06, + "loss": 1.7997, + "step": 30382500 + }, + { + "epoch": 87.95, + "learning_rate": 6.042654686921082e-06, + "loss": 1.7934, + "step": 30383000 + }, + { + "epoch": 87.95, + "learning_rate": 6.041931039273806e-06, + "loss": 1.8065, + "step": 30383500 + }, + { + "epoch": 87.95, + "learning_rate": 6.041208838921823e-06, + "loss": 1.7962, + "step": 30384000 + }, + { + "epoch": 87.95, + "learning_rate": 6.0404851912745464e-06, + "loss": 1.7836, + "step": 30384500 + }, + { + "epoch": 87.95, + "learning_rate": 6.0397615436272695e-06, + "loss": 1.8014, + "step": 30385000 + }, + { + "epoch": 87.95, + "learning_rate": 6.0390378959799934e-06, + "loss": 1.8538, + "step": 30385500 + }, + { + "epoch": 87.96, + "learning_rate": 6.038314248332716e-06, + "loss": 1.8265, + "step": 30386000 + }, + { + "epoch": 87.96, + "learning_rate": 6.037592047980735e-06, + "loss": 1.8033, + "step": 30386500 + }, + { + "epoch": 87.96, + "learning_rate": 6.036868400333457e-06, + "loss": 1.8128, + "step": 30387000 + }, + { + "epoch": 87.96, + "learning_rate": 6.036144752686181e-06, + "loss": 1.7938, + "step": 30387500 + }, + { + "epoch": 87.96, + "learning_rate": 6.035421105038903e-06, + "loss": 1.7861, + "step": 30388000 + }, + { + "epoch": 87.96, + "learning_rate": 6.034697457391627e-06, + "loss": 1.801, + "step": 30388500 + }, + { + "epoch": 87.96, + "learning_rate": 6.033975257039644e-06, + "loss": 1.8133, + "step": 30389000 + }, + { + "epoch": 87.97, + "learning_rate": 6.033251609392368e-06, + "loss": 1.7965, + "step": 30389500 + }, + { + "epoch": 87.97, + "learning_rate": 6.032529409040385e-06, + "loss": 1.7968, + "step": 30390000 + }, + { + "epoch": 87.97, + "learning_rate": 6.031805761393109e-06, + "loss": 1.8012, + "step": 30390500 + }, + { + "epoch": 87.97, + "learning_rate": 6.0310821137458315e-06, + "loss": 1.7915, + "step": 30391000 + }, + { + "epoch": 87.97, + "learning_rate": 6.0303584660985555e-06, + "loss": 1.8328, + "step": 30391500 + }, + { + "epoch": 87.97, + "learning_rate": 6.0296348184512785e-06, + "loss": 1.7838, + "step": 30392000 + }, + { + "epoch": 87.97, + "learning_rate": 6.028912618099297e-06, + "loss": 1.8231, + "step": 30392500 + }, + { + "epoch": 87.98, + "learning_rate": 6.02818897045202e-06, + "loss": 1.808, + "step": 30393000 + }, + { + "epoch": 87.98, + "learning_rate": 6.027465322804743e-06, + "loss": 1.7991, + "step": 30393500 + }, + { + "epoch": 87.98, + "learning_rate": 6.026741675157466e-06, + "loss": 1.7757, + "step": 30394000 + }, + { + "epoch": 87.98, + "learning_rate": 6.026018027510189e-06, + "loss": 1.7893, + "step": 30394500 + }, + { + "epoch": 87.98, + "learning_rate": 6.025294379862913e-06, + "loss": 1.8197, + "step": 30395000 + }, + { + "epoch": 87.98, + "learning_rate": 6.024570732215636e-06, + "loss": 1.8207, + "step": 30395500 + }, + { + "epoch": 87.98, + "learning_rate": 6.023847084568359e-06, + "loss": 1.8053, + "step": 30396000 + }, + { + "epoch": 87.99, + "learning_rate": 6.023123436921082e-06, + "loss": 1.8117, + "step": 30396500 + }, + { + "epoch": 87.99, + "learning_rate": 6.0224012365691e-06, + "loss": 1.8445, + "step": 30397000 + }, + { + "epoch": 87.99, + "learning_rate": 6.021677588921823e-06, + "loss": 1.8305, + "step": 30397500 + }, + { + "epoch": 87.99, + "learning_rate": 6.020953941274546e-06, + "loss": 1.8192, + "step": 30398000 + }, + { + "epoch": 87.99, + "learning_rate": 6.0202302936272695e-06, + "loss": 1.7993, + "step": 30398500 + }, + { + "epoch": 87.99, + "learning_rate": 6.0195066459799925e-06, + "loss": 1.8001, + "step": 30399000 + }, + { + "epoch": 87.99, + "learning_rate": 6.018784445628011e-06, + "loss": 1.8175, + "step": 30399500 + }, + { + "epoch": 88.0, + "learning_rate": 6.018060797980734e-06, + "loss": 1.8197, + "step": 30400000 + }, + { + "epoch": 88.0, + "learning_rate": 6.017337150333458e-06, + "loss": 1.8015, + "step": 30400500 + }, + { + "epoch": 88.0, + "learning_rate": 6.01661350268618e-06, + "loss": 1.8118, + "step": 30401000 + }, + { + "epoch": 88.0, + "learning_rate": 6.015889855038904e-06, + "loss": 1.8174, + "step": 30401500 + }, + { + "epoch": 88.0, + "eval_accuracy": 0.6895304195333495, + "eval_accuracy_mlm": 0.6585697473221408, + "eval_accuracy_nsp": 0.8556759382748301, + "eval_loss": 2.19228458404541, + "eval_runtime": 331.5315, + "eval_samples_per_second": 1316.273, + "eval_steps_per_second": 54.845, + "step": 30401536 + }, + { + "epoch": 88.0, + "learning_rate": 6.015166207391627e-06, + "loss": 1.7828, + "step": 30402000 + }, + { + "epoch": 88.0, + "learning_rate": 6.01444255974435e-06, + "loss": 1.8051, + "step": 30402500 + }, + { + "epoch": 88.0, + "learning_rate": 6.013718912097073e-06, + "loss": 1.7942, + "step": 30403000 + }, + { + "epoch": 88.01, + "learning_rate": 6.012996711745091e-06, + "loss": 1.7773, + "step": 30403500 + }, + { + "epoch": 88.01, + "learning_rate": 6.012273064097814e-06, + "loss": 1.8229, + "step": 30404000 + }, + { + "epoch": 88.01, + "learning_rate": 6.011550863745832e-06, + "loss": 1.7776, + "step": 30404500 + }, + { + "epoch": 88.01, + "learning_rate": 6.010827216098555e-06, + "loss": 1.7976, + "step": 30405000 + }, + { + "epoch": 88.01, + "learning_rate": 6.0101035684512785e-06, + "loss": 1.7747, + "step": 30405500 + }, + { + "epoch": 88.01, + "learning_rate": 6.0093799208040016e-06, + "loss": 1.7868, + "step": 30406000 + }, + { + "epoch": 88.01, + "learning_rate": 6.008656273156725e-06, + "loss": 1.814, + "step": 30406500 + }, + { + "epoch": 88.02, + "learning_rate": 6.007932625509449e-06, + "loss": 1.8139, + "step": 30407000 + }, + { + "epoch": 88.02, + "learning_rate": 6.007208977862172e-06, + "loss": 1.8089, + "step": 30407500 + }, + { + "epoch": 88.02, + "learning_rate": 6.006485330214895e-06, + "loss": 1.784, + "step": 30408000 + }, + { + "epoch": 88.02, + "learning_rate": 6.005761682567618e-06, + "loss": 1.8031, + "step": 30408500 + }, + { + "epoch": 88.02, + "learning_rate": 6.005039482215636e-06, + "loss": 1.7948, + "step": 30409000 + }, + { + "epoch": 88.02, + "learning_rate": 6.004315834568359e-06, + "loss": 1.8045, + "step": 30409500 + }, + { + "epoch": 88.02, + "learning_rate": 6.003592186921082e-06, + "loss": 1.8102, + "step": 30410000 + }, + { + "epoch": 88.03, + "learning_rate": 6.002868539273805e-06, + "loss": 1.8069, + "step": 30410500 + }, + { + "epoch": 88.03, + "learning_rate": 6.002144891626529e-06, + "loss": 1.8042, + "step": 30411000 + }, + { + "epoch": 88.03, + "learning_rate": 6.001422691274546e-06, + "loss": 1.7965, + "step": 30411500 + }, + { + "epoch": 88.03, + "learning_rate": 6.000699043627269e-06, + "loss": 1.7951, + "step": 30412000 + }, + { + "epoch": 88.03, + "learning_rate": 5.9999753959799925e-06, + "loss": 1.8128, + "step": 30412500 + }, + { + "epoch": 88.03, + "learning_rate": 5.9992517483327164e-06, + "loss": 1.7922, + "step": 30413000 + }, + { + "epoch": 88.03, + "learning_rate": 5.998529547980734e-06, + "loss": 1.7716, + "step": 30413500 + }, + { + "epoch": 88.04, + "learning_rate": 5.997805900333458e-06, + "loss": 1.7963, + "step": 30414000 + }, + { + "epoch": 88.04, + "learning_rate": 5.99708225268618e-06, + "loss": 1.7643, + "step": 30414500 + }, + { + "epoch": 88.04, + "learning_rate": 5.996358605038904e-06, + "loss": 1.7882, + "step": 30415000 + }, + { + "epoch": 88.04, + "learning_rate": 5.995634957391627e-06, + "loss": 1.8161, + "step": 30415500 + }, + { + "epoch": 88.04, + "learning_rate": 5.99491130974435e-06, + "loss": 1.8081, + "step": 30416000 + }, + { + "epoch": 88.04, + "learning_rate": 5.994189109392368e-06, + "loss": 1.7984, + "step": 30416500 + }, + { + "epoch": 88.04, + "learning_rate": 5.993465461745091e-06, + "loss": 1.7962, + "step": 30417000 + }, + { + "epoch": 88.05, + "learning_rate": 5.992741814097814e-06, + "loss": 1.8108, + "step": 30417500 + }, + { + "epoch": 88.05, + "learning_rate": 5.992019613745832e-06, + "loss": 1.8049, + "step": 30418000 + }, + { + "epoch": 88.05, + "learning_rate": 5.991295966098555e-06, + "loss": 1.7987, + "step": 30418500 + }, + { + "epoch": 88.05, + "learning_rate": 5.9905723184512784e-06, + "loss": 1.7897, + "step": 30419000 + }, + { + "epoch": 88.05, + "learning_rate": 5.9898486708040015e-06, + "loss": 1.807, + "step": 30419500 + }, + { + "epoch": 88.05, + "learning_rate": 5.989125023156725e-06, + "loss": 1.7927, + "step": 30420000 + }, + { + "epoch": 88.05, + "learning_rate": 5.9884013755094485e-06, + "loss": 1.7873, + "step": 30420500 + }, + { + "epoch": 88.06, + "learning_rate": 5.987677727862172e-06, + "loss": 1.8116, + "step": 30421000 + }, + { + "epoch": 88.06, + "learning_rate": 5.98695552751019e-06, + "loss": 1.7961, + "step": 30421500 + }, + { + "epoch": 88.06, + "learning_rate": 5.986231879862912e-06, + "loss": 1.7925, + "step": 30422000 + }, + { + "epoch": 88.06, + "learning_rate": 5.985508232215636e-06, + "loss": 1.793, + "step": 30422500 + }, + { + "epoch": 88.06, + "learning_rate": 5.984784584568359e-06, + "loss": 1.8137, + "step": 30423000 + }, + { + "epoch": 88.06, + "learning_rate": 5.984060936921082e-06, + "loss": 1.7935, + "step": 30423500 + }, + { + "epoch": 88.07, + "learning_rate": 5.983337289273806e-06, + "loss": 1.7991, + "step": 30424000 + }, + { + "epoch": 88.07, + "learning_rate": 5.982613641626528e-06, + "loss": 1.8143, + "step": 30424500 + }, + { + "epoch": 88.07, + "learning_rate": 5.981889993979252e-06, + "loss": 1.8027, + "step": 30425000 + }, + { + "epoch": 88.07, + "learning_rate": 5.981166346331974e-06, + "loss": 1.7724, + "step": 30425500 + }, + { + "epoch": 88.07, + "learning_rate": 5.980442698684698e-06, + "loss": 1.7676, + "step": 30426000 + }, + { + "epoch": 88.07, + "learning_rate": 5.9797204983327155e-06, + "loss": 1.8116, + "step": 30426500 + }, + { + "epoch": 88.07, + "learning_rate": 5.9789968506854395e-06, + "loss": 1.7833, + "step": 30427000 + }, + { + "epoch": 88.08, + "learning_rate": 5.9782732030381625e-06, + "loss": 1.7977, + "step": 30427500 + }, + { + "epoch": 88.08, + "learning_rate": 5.977549555390886e-06, + "loss": 1.7916, + "step": 30428000 + }, + { + "epoch": 88.08, + "learning_rate": 5.976827355038903e-06, + "loss": 1.8014, + "step": 30428500 + }, + { + "epoch": 88.08, + "learning_rate": 5.976103707391627e-06, + "loss": 1.83, + "step": 30429000 + }, + { + "epoch": 88.08, + "learning_rate": 5.975380059744351e-06, + "loss": 1.8077, + "step": 30429500 + }, + { + "epoch": 88.08, + "learning_rate": 5.974656412097073e-06, + "loss": 1.7749, + "step": 30430000 + }, + { + "epoch": 88.08, + "learning_rate": 5.973932764449797e-06, + "loss": 1.7812, + "step": 30430500 + }, + { + "epoch": 88.09, + "learning_rate": 5.973209116802519e-06, + "loss": 1.7976, + "step": 30431000 + }, + { + "epoch": 88.09, + "learning_rate": 5.972486916450538e-06, + "loss": 1.7747, + "step": 30431500 + }, + { + "epoch": 88.09, + "learning_rate": 5.97176326880326e-06, + "loss": 1.8143, + "step": 30432000 + }, + { + "epoch": 88.09, + "learning_rate": 5.971039621155984e-06, + "loss": 1.7982, + "step": 30432500 + }, + { + "epoch": 88.09, + "learning_rate": 5.970315973508707e-06, + "loss": 1.7945, + "step": 30433000 + }, + { + "epoch": 88.09, + "learning_rate": 5.96959232586143e-06, + "loss": 1.8086, + "step": 30433500 + }, + { + "epoch": 88.09, + "learning_rate": 5.968868678214154e-06, + "loss": 1.7928, + "step": 30434000 + }, + { + "epoch": 88.1, + "learning_rate": 5.9681450305668765e-06, + "loss": 1.7999, + "step": 30434500 + }, + { + "epoch": 88.1, + "learning_rate": 5.9674213829196005e-06, + "loss": 1.7898, + "step": 30435000 + }, + { + "epoch": 88.1, + "learning_rate": 5.9666977352723235e-06, + "loss": 1.7882, + "step": 30435500 + }, + { + "epoch": 88.1, + "learning_rate": 5.965975534920342e-06, + "loss": 1.7919, + "step": 30436000 + }, + { + "epoch": 88.1, + "learning_rate": 5.965251887273064e-06, + "loss": 1.8039, + "step": 30436500 + }, + { + "epoch": 88.1, + "learning_rate": 5.964528239625788e-06, + "loss": 1.7843, + "step": 30437000 + }, + { + "epoch": 88.1, + "learning_rate": 5.963804591978511e-06, + "loss": 1.8095, + "step": 30437500 + }, + { + "epoch": 88.11, + "learning_rate": 5.963080944331234e-06, + "loss": 1.7916, + "step": 30438000 + }, + { + "epoch": 88.11, + "learning_rate": 5.962357296683958e-06, + "loss": 1.8031, + "step": 30438500 + }, + { + "epoch": 88.11, + "learning_rate": 5.96163364903668e-06, + "loss": 1.7913, + "step": 30439000 + }, + { + "epoch": 88.11, + "learning_rate": 5.960912895979992e-06, + "loss": 1.8051, + "step": 30439500 + }, + { + "epoch": 88.11, + "learning_rate": 5.960189248332716e-06, + "loss": 1.8163, + "step": 30440000 + }, + { + "epoch": 88.11, + "learning_rate": 5.959465600685439e-06, + "loss": 1.7899, + "step": 30440500 + }, + { + "epoch": 88.11, + "learning_rate": 5.9587419530381625e-06, + "loss": 1.7971, + "step": 30441000 + }, + { + "epoch": 88.12, + "learning_rate": 5.95801975268618e-06, + "loss": 1.7875, + "step": 30441500 + }, + { + "epoch": 88.12, + "learning_rate": 5.957296105038904e-06, + "loss": 1.8326, + "step": 30442000 + }, + { + "epoch": 88.12, + "learning_rate": 5.956572457391627e-06, + "loss": 1.7952, + "step": 30442500 + }, + { + "epoch": 88.12, + "learning_rate": 5.95584880974435e-06, + "loss": 1.8008, + "step": 30443000 + }, + { + "epoch": 88.12, + "learning_rate": 5.955125162097074e-06, + "loss": 1.7865, + "step": 30443500 + }, + { + "epoch": 88.12, + "learning_rate": 5.954401514449796e-06, + "loss": 1.7737, + "step": 30444000 + }, + { + "epoch": 88.12, + "learning_rate": 5.95367786680252e-06, + "loss": 1.7704, + "step": 30444500 + }, + { + "epoch": 88.13, + "learning_rate": 5.952954219155243e-06, + "loss": 1.7945, + "step": 30445000 + }, + { + "epoch": 88.13, + "learning_rate": 5.952230571507966e-06, + "loss": 1.7947, + "step": 30445500 + }, + { + "epoch": 88.13, + "learning_rate": 5.951506923860689e-06, + "loss": 1.7832, + "step": 30446000 + }, + { + "epoch": 88.13, + "learning_rate": 5.950783276213412e-06, + "loss": 1.7762, + "step": 30446500 + }, + { + "epoch": 88.13, + "learning_rate": 5.950059628566136e-06, + "loss": 1.7859, + "step": 30447000 + }, + { + "epoch": 88.13, + "learning_rate": 5.949337428214153e-06, + "loss": 1.7986, + "step": 30447500 + }, + { + "epoch": 88.13, + "learning_rate": 5.948613780566877e-06, + "loss": 1.7904, + "step": 30448000 + }, + { + "epoch": 88.14, + "learning_rate": 5.9478901329196e-06, + "loss": 1.7841, + "step": 30448500 + }, + { + "epoch": 88.14, + "learning_rate": 5.9471664852723235e-06, + "loss": 1.8216, + "step": 30449000 + }, + { + "epoch": 88.14, + "learning_rate": 5.946442837625047e-06, + "loss": 1.8043, + "step": 30449500 + }, + { + "epoch": 88.14, + "learning_rate": 5.94571918997777e-06, + "loss": 1.7937, + "step": 30450000 + }, + { + "epoch": 88.14, + "learning_rate": 5.944996989625788e-06, + "loss": 1.8016, + "step": 30450500 + }, + { + "epoch": 88.14, + "learning_rate": 5.944273341978511e-06, + "loss": 1.789, + "step": 30451000 + }, + { + "epoch": 88.14, + "learning_rate": 5.943549694331234e-06, + "loss": 1.8098, + "step": 30451500 + }, + { + "epoch": 88.15, + "learning_rate": 5.942826046683957e-06, + "loss": 1.8036, + "step": 30452000 + }, + { + "epoch": 88.15, + "learning_rate": 5.942103846331975e-06, + "loss": 1.7985, + "step": 30452500 + }, + { + "epoch": 88.15, + "learning_rate": 5.941380198684698e-06, + "loss": 1.7904, + "step": 30453000 + }, + { + "epoch": 88.15, + "learning_rate": 5.940656551037421e-06, + "loss": 1.8183, + "step": 30453500 + }, + { + "epoch": 88.15, + "learning_rate": 5.939934350685439e-06, + "loss": 1.7926, + "step": 30454000 + }, + { + "epoch": 88.15, + "learning_rate": 5.9392107030381624e-06, + "loss": 1.8195, + "step": 30454500 + }, + { + "epoch": 88.15, + "learning_rate": 5.9384870553908855e-06, + "loss": 1.7919, + "step": 30455000 + }, + { + "epoch": 88.16, + "learning_rate": 5.9377634077436094e-06, + "loss": 1.8101, + "step": 30455500 + }, + { + "epoch": 88.16, + "learning_rate": 5.9370397600963325e-06, + "loss": 1.7962, + "step": 30456000 + }, + { + "epoch": 88.16, + "learning_rate": 5.936316112449056e-06, + "loss": 1.7993, + "step": 30456500 + }, + { + "epoch": 88.16, + "learning_rate": 5.935592464801779e-06, + "loss": 1.8125, + "step": 30457000 + }, + { + "epoch": 88.16, + "learning_rate": 5.934868817154502e-06, + "loss": 1.8227, + "step": 30457500 + }, + { + "epoch": 88.16, + "learning_rate": 5.934145169507225e-06, + "loss": 1.8021, + "step": 30458000 + }, + { + "epoch": 88.16, + "learning_rate": 5.933424416450537e-06, + "loss": 1.7845, + "step": 30458500 + }, + { + "epoch": 88.17, + "learning_rate": 5.932700768803261e-06, + "loss": 1.8058, + "step": 30459000 + }, + { + "epoch": 88.17, + "learning_rate": 5.931977121155984e-06, + "loss": 1.7734, + "step": 30459500 + }, + { + "epoch": 88.17, + "learning_rate": 5.931253473508707e-06, + "loss": 1.7917, + "step": 30460000 + }, + { + "epoch": 88.17, + "learning_rate": 5.93052982586143e-06, + "loss": 1.7869, + "step": 30460500 + }, + { + "epoch": 88.17, + "learning_rate": 5.929806178214153e-06, + "loss": 1.7936, + "step": 30461000 + }, + { + "epoch": 88.17, + "learning_rate": 5.929082530566877e-06, + "loss": 1.7954, + "step": 30461500 + }, + { + "epoch": 88.18, + "learning_rate": 5.9283588829196e-06, + "loss": 1.8046, + "step": 30462000 + }, + { + "epoch": 88.18, + "learning_rate": 5.9276352352723234e-06, + "loss": 1.7865, + "step": 30462500 + }, + { + "epoch": 88.18, + "learning_rate": 5.926913034920341e-06, + "loss": 1.8044, + "step": 30463000 + }, + { + "epoch": 88.18, + "learning_rate": 5.926189387273065e-06, + "loss": 1.7957, + "step": 30463500 + }, + { + "epoch": 88.18, + "learning_rate": 5.925465739625788e-06, + "loss": 1.806, + "step": 30464000 + }, + { + "epoch": 88.18, + "learning_rate": 5.924742091978511e-06, + "loss": 1.761, + "step": 30464500 + }, + { + "epoch": 88.18, + "learning_rate": 5.924018444331234e-06, + "loss": 1.7853, + "step": 30465000 + }, + { + "epoch": 88.19, + "learning_rate": 5.923294796683957e-06, + "loss": 1.7893, + "step": 30465500 + }, + { + "epoch": 88.19, + "learning_rate": 5.922571149036681e-06, + "loss": 1.8024, + "step": 30466000 + }, + { + "epoch": 88.19, + "learning_rate": 5.921848948684698e-06, + "loss": 1.8064, + "step": 30466500 + }, + { + "epoch": 88.19, + "learning_rate": 5.921125301037422e-06, + "loss": 1.7948, + "step": 30467000 + }, + { + "epoch": 88.19, + "learning_rate": 5.920401653390144e-06, + "loss": 1.7929, + "step": 30467500 + }, + { + "epoch": 88.19, + "learning_rate": 5.919679453038162e-06, + "loss": 1.8239, + "step": 30468000 + }, + { + "epoch": 88.19, + "learning_rate": 5.9189558053908855e-06, + "loss": 1.7995, + "step": 30468500 + }, + { + "epoch": 88.2, + "learning_rate": 5.918232157743609e-06, + "loss": 1.7685, + "step": 30469000 + }, + { + "epoch": 88.2, + "learning_rate": 5.917508510096332e-06, + "loss": 1.7717, + "step": 30469500 + }, + { + "epoch": 88.2, + "learning_rate": 5.9167848624490556e-06, + "loss": 1.7931, + "step": 30470000 + }, + { + "epoch": 88.2, + "learning_rate": 5.916062662097073e-06, + "loss": 1.7937, + "step": 30470500 + }, + { + "epoch": 88.2, + "learning_rate": 5.915339014449797e-06, + "loss": 1.8039, + "step": 30471000 + }, + { + "epoch": 88.2, + "learning_rate": 5.91461536680252e-06, + "loss": 1.781, + "step": 30471500 + }, + { + "epoch": 88.2, + "learning_rate": 5.913891719155243e-06, + "loss": 1.7908, + "step": 30472000 + }, + { + "epoch": 88.21, + "learning_rate": 5.913168071507967e-06, + "loss": 1.8089, + "step": 30472500 + }, + { + "epoch": 88.21, + "learning_rate": 5.912444423860689e-06, + "loss": 1.78, + "step": 30473000 + }, + { + "epoch": 88.21, + "learning_rate": 5.911720776213413e-06, + "loss": 1.8056, + "step": 30473500 + }, + { + "epoch": 88.21, + "learning_rate": 5.91099857586143e-06, + "loss": 1.7759, + "step": 30474000 + }, + { + "epoch": 88.21, + "learning_rate": 5.910274928214154e-06, + "loss": 1.7987, + "step": 30474500 + }, + { + "epoch": 88.21, + "learning_rate": 5.909551280566876e-06, + "loss": 1.801, + "step": 30475000 + }, + { + "epoch": 88.21, + "learning_rate": 5.9088276329196e-06, + "loss": 1.7958, + "step": 30475500 + }, + { + "epoch": 88.22, + "learning_rate": 5.908103985272323e-06, + "loss": 1.8216, + "step": 30476000 + }, + { + "epoch": 88.22, + "learning_rate": 5.9073803376250465e-06, + "loss": 1.7725, + "step": 30476500 + }, + { + "epoch": 88.22, + "learning_rate": 5.90665668997777e-06, + "loss": 1.8116, + "step": 30477000 + }, + { + "epoch": 88.22, + "learning_rate": 5.905933042330493e-06, + "loss": 1.8049, + "step": 30477500 + }, + { + "epoch": 88.22, + "learning_rate": 5.9052093946832166e-06, + "loss": 1.7965, + "step": 30478000 + }, + { + "epoch": 88.22, + "learning_rate": 5.90448574703594e-06, + "loss": 1.7807, + "step": 30478500 + }, + { + "epoch": 88.22, + "learning_rate": 5.903763546683958e-06, + "loss": 1.7824, + "step": 30479000 + }, + { + "epoch": 88.23, + "learning_rate": 5.90303989903668e-06, + "loss": 1.8166, + "step": 30479500 + }, + { + "epoch": 88.23, + "learning_rate": 5.902316251389404e-06, + "loss": 1.819, + "step": 30480000 + }, + { + "epoch": 88.23, + "learning_rate": 5.901592603742127e-06, + "loss": 1.8134, + "step": 30480500 + }, + { + "epoch": 88.23, + "learning_rate": 5.900870403390145e-06, + "loss": 1.8047, + "step": 30481000 + }, + { + "epoch": 88.23, + "learning_rate": 5.900148203038162e-06, + "loss": 1.797, + "step": 30481500 + }, + { + "epoch": 88.23, + "learning_rate": 5.899424555390886e-06, + "loss": 1.7951, + "step": 30482000 + }, + { + "epoch": 88.23, + "learning_rate": 5.8987009077436085e-06, + "loss": 1.8067, + "step": 30482500 + }, + { + "epoch": 88.24, + "learning_rate": 5.897977260096332e-06, + "loss": 1.7667, + "step": 30483000 + }, + { + "epoch": 88.24, + "learning_rate": 5.8972536124490555e-06, + "loss": 1.7984, + "step": 30483500 + }, + { + "epoch": 88.24, + "learning_rate": 5.896529964801779e-06, + "loss": 1.8005, + "step": 30484000 + }, + { + "epoch": 88.24, + "learning_rate": 5.8958063171545025e-06, + "loss": 1.7932, + "step": 30484500 + }, + { + "epoch": 88.24, + "learning_rate": 5.895082669507225e-06, + "loss": 1.8218, + "step": 30485000 + }, + { + "epoch": 88.24, + "learning_rate": 5.894359021859949e-06, + "loss": 1.7707, + "step": 30485500 + }, + { + "epoch": 88.24, + "learning_rate": 5.893638268803261e-06, + "loss": 1.7944, + "step": 30486000 + }, + { + "epoch": 88.25, + "learning_rate": 5.892914621155984e-06, + "loss": 1.787, + "step": 30486500 + }, + { + "epoch": 88.25, + "learning_rate": 5.892190973508707e-06, + "loss": 1.7645, + "step": 30487000 + }, + { + "epoch": 88.25, + "learning_rate": 5.891467325861431e-06, + "loss": 1.8216, + "step": 30487500 + }, + { + "epoch": 88.25, + "learning_rate": 5.890743678214153e-06, + "loss": 1.8031, + "step": 30488000 + }, + { + "epoch": 88.25, + "learning_rate": 5.890020030566877e-06, + "loss": 1.7803, + "step": 30488500 + }, + { + "epoch": 88.25, + "learning_rate": 5.8892963829196e-06, + "loss": 1.8041, + "step": 30489000 + }, + { + "epoch": 88.25, + "learning_rate": 5.888572735272323e-06, + "loss": 1.809, + "step": 30489500 + }, + { + "epoch": 88.26, + "learning_rate": 5.8878490876250464e-06, + "loss": 1.7937, + "step": 30490000 + }, + { + "epoch": 88.26, + "learning_rate": 5.8871268872730645e-06, + "loss": 1.8074, + "step": 30490500 + }, + { + "epoch": 88.26, + "learning_rate": 5.886403239625788e-06, + "loss": 1.8059, + "step": 30491000 + }, + { + "epoch": 88.26, + "learning_rate": 5.885679591978511e-06, + "loss": 1.8065, + "step": 30491500 + }, + { + "epoch": 88.26, + "learning_rate": 5.884955944331235e-06, + "loss": 1.791, + "step": 30492000 + }, + { + "epoch": 88.26, + "learning_rate": 5.884232296683957e-06, + "loss": 1.7771, + "step": 30492500 + }, + { + "epoch": 88.26, + "learning_rate": 5.883508649036681e-06, + "loss": 1.7607, + "step": 30493000 + }, + { + "epoch": 88.27, + "learning_rate": 5.882785001389404e-06, + "loss": 1.8009, + "step": 30493500 + }, + { + "epoch": 88.27, + "learning_rate": 5.882061353742127e-06, + "loss": 1.8088, + "step": 30494000 + }, + { + "epoch": 88.27, + "learning_rate": 5.881340600685439e-06, + "loss": 1.787, + "step": 30494500 + }, + { + "epoch": 88.27, + "learning_rate": 5.880618400333457e-06, + "loss": 1.8066, + "step": 30495000 + }, + { + "epoch": 88.27, + "learning_rate": 5.87989475268618e-06, + "loss": 1.826, + "step": 30495500 + }, + { + "epoch": 88.27, + "learning_rate": 5.8791711050389035e-06, + "loss": 1.7951, + "step": 30496000 + }, + { + "epoch": 88.27, + "learning_rate": 5.8784474573916265e-06, + "loss": 1.7615, + "step": 30496500 + }, + { + "epoch": 88.28, + "learning_rate": 5.8777238097443505e-06, + "loss": 1.796, + "step": 30497000 + }, + { + "epoch": 88.28, + "learning_rate": 5.8770001620970735e-06, + "loss": 1.7909, + "step": 30497500 + }, + { + "epoch": 88.28, + "learning_rate": 5.876276514449797e-06, + "loss": 1.7993, + "step": 30498000 + }, + { + "epoch": 88.28, + "learning_rate": 5.87555286680252e-06, + "loss": 1.8003, + "step": 30498500 + }, + { + "epoch": 88.28, + "learning_rate": 5.874829219155243e-06, + "loss": 1.7862, + "step": 30499000 + }, + { + "epoch": 88.28, + "learning_rate": 5.874105571507967e-06, + "loss": 1.8091, + "step": 30499500 + }, + { + "epoch": 88.29, + "learning_rate": 5.873383371155984e-06, + "loss": 1.7802, + "step": 30500000 + }, + { + "epoch": 88.29, + "learning_rate": 5.872659723508707e-06, + "loss": 1.7893, + "step": 30500500 + }, + { + "epoch": 88.29, + "learning_rate": 5.87193607586143e-06, + "loss": 1.7929, + "step": 30501000 + }, + { + "epoch": 88.29, + "learning_rate": 5.871212428214154e-06, + "loss": 1.787, + "step": 30501500 + }, + { + "epoch": 88.29, + "learning_rate": 5.870488780566877e-06, + "loss": 1.7897, + "step": 30502000 + }, + { + "epoch": 88.29, + "learning_rate": 5.869766580214895e-06, + "loss": 1.7646, + "step": 30502500 + }, + { + "epoch": 88.29, + "learning_rate": 5.8690429325676175e-06, + "loss": 1.7968, + "step": 30503000 + }, + { + "epoch": 88.3, + "learning_rate": 5.868319284920341e-06, + "loss": 1.7717, + "step": 30503500 + }, + { + "epoch": 88.3, + "learning_rate": 5.8675956372730645e-06, + "loss": 1.7926, + "step": 30504000 + }, + { + "epoch": 88.3, + "learning_rate": 5.8668734369210826e-06, + "loss": 1.8215, + "step": 30504500 + }, + { + "epoch": 88.3, + "learning_rate": 5.866149789273806e-06, + "loss": 1.7872, + "step": 30505000 + }, + { + "epoch": 88.3, + "learning_rate": 5.865427588921823e-06, + "loss": 1.7965, + "step": 30505500 + }, + { + "epoch": 88.3, + "learning_rate": 5.864703941274546e-06, + "loss": 1.8042, + "step": 30506000 + }, + { + "epoch": 88.3, + "learning_rate": 5.86398029362727e-06, + "loss": 1.7988, + "step": 30506500 + }, + { + "epoch": 88.31, + "learning_rate": 5.863256645979993e-06, + "loss": 1.789, + "step": 30507000 + }, + { + "epoch": 88.31, + "learning_rate": 5.862534445628011e-06, + "loss": 1.7999, + "step": 30507500 + }, + { + "epoch": 88.31, + "learning_rate": 5.861810797980734e-06, + "loss": 1.796, + "step": 30508000 + }, + { + "epoch": 88.31, + "learning_rate": 5.861087150333457e-06, + "loss": 1.8069, + "step": 30508500 + }, + { + "epoch": 88.31, + "learning_rate": 5.86036350268618e-06, + "loss": 1.8078, + "step": 30509000 + }, + { + "epoch": 88.31, + "learning_rate": 5.859639855038903e-06, + "loss": 1.8179, + "step": 30509500 + }, + { + "epoch": 88.31, + "learning_rate": 5.8589162073916265e-06, + "loss": 1.8214, + "step": 30510000 + }, + { + "epoch": 88.32, + "learning_rate": 5.858194007039645e-06, + "loss": 1.7939, + "step": 30510500 + }, + { + "epoch": 88.32, + "learning_rate": 5.857470359392368e-06, + "loss": 1.8212, + "step": 30511000 + }, + { + "epoch": 88.32, + "learning_rate": 5.856748159040386e-06, + "loss": 1.7974, + "step": 30511500 + }, + { + "epoch": 88.32, + "learning_rate": 5.856024511393109e-06, + "loss": 1.7786, + "step": 30512000 + }, + { + "epoch": 88.32, + "learning_rate": 5.855300863745832e-06, + "loss": 1.7805, + "step": 30512500 + }, + { + "epoch": 88.32, + "learning_rate": 5.854577216098555e-06, + "loss": 1.8287, + "step": 30513000 + }, + { + "epoch": 88.32, + "learning_rate": 5.853853568451279e-06, + "loss": 1.8035, + "step": 30513500 + }, + { + "epoch": 88.33, + "learning_rate": 5.853129920804002e-06, + "loss": 1.8053, + "step": 30514000 + }, + { + "epoch": 88.33, + "learning_rate": 5.852406273156725e-06, + "loss": 1.7787, + "step": 30514500 + }, + { + "epoch": 88.33, + "learning_rate": 5.851682625509448e-06, + "loss": 1.8216, + "step": 30515000 + }, + { + "epoch": 88.33, + "learning_rate": 5.850958977862171e-06, + "loss": 1.7876, + "step": 30515500 + }, + { + "epoch": 88.33, + "learning_rate": 5.850235330214895e-06, + "loss": 1.7932, + "step": 30516000 + }, + { + "epoch": 88.33, + "learning_rate": 5.849511682567617e-06, + "loss": 1.8006, + "step": 30516500 + }, + { + "epoch": 88.33, + "learning_rate": 5.848788034920341e-06, + "loss": 1.7855, + "step": 30517000 + }, + { + "epoch": 88.34, + "learning_rate": 5.848065834568359e-06, + "loss": 1.8047, + "step": 30517500 + }, + { + "epoch": 88.34, + "learning_rate": 5.8473421869210825e-06, + "loss": 1.8066, + "step": 30518000 + }, + { + "epoch": 88.34, + "learning_rate": 5.8466199865691e-06, + "loss": 1.7927, + "step": 30518500 + }, + { + "epoch": 88.34, + "learning_rate": 5.845896338921823e-06, + "loss": 1.8135, + "step": 30519000 + }, + { + "epoch": 88.34, + "learning_rate": 5.845172691274546e-06, + "loss": 1.7896, + "step": 30519500 + }, + { + "epoch": 88.34, + "learning_rate": 5.84444904362727e-06, + "loss": 1.8155, + "step": 30520000 + }, + { + "epoch": 88.34, + "learning_rate": 5.843725395979993e-06, + "loss": 1.8091, + "step": 30520500 + }, + { + "epoch": 88.35, + "learning_rate": 5.843001748332716e-06, + "loss": 1.7804, + "step": 30521000 + }, + { + "epoch": 88.35, + "learning_rate": 5.842278100685439e-06, + "loss": 1.7947, + "step": 30521500 + }, + { + "epoch": 88.35, + "learning_rate": 5.841554453038162e-06, + "loss": 1.8149, + "step": 30522000 + }, + { + "epoch": 88.35, + "learning_rate": 5.840830805390886e-06, + "loss": 1.7913, + "step": 30522500 + }, + { + "epoch": 88.35, + "learning_rate": 5.840108605038903e-06, + "loss": 1.7925, + "step": 30523000 + }, + { + "epoch": 88.35, + "learning_rate": 5.839384957391627e-06, + "loss": 1.8261, + "step": 30523500 + }, + { + "epoch": 88.35, + "learning_rate": 5.8386613097443495e-06, + "loss": 1.8179, + "step": 30524000 + }, + { + "epoch": 88.36, + "learning_rate": 5.8379376620970734e-06, + "loss": 1.8032, + "step": 30524500 + }, + { + "epoch": 88.36, + "learning_rate": 5.8372140144497965e-06, + "loss": 1.8074, + "step": 30525000 + }, + { + "epoch": 88.36, + "learning_rate": 5.83649036680252e-06, + "loss": 1.8047, + "step": 30525500 + }, + { + "epoch": 88.36, + "learning_rate": 5.8357667191552435e-06, + "loss": 1.7959, + "step": 30526000 + }, + { + "epoch": 88.36, + "learning_rate": 5.835043071507966e-06, + "loss": 1.7787, + "step": 30526500 + }, + { + "epoch": 88.36, + "learning_rate": 5.834320871155984e-06, + "loss": 1.8167, + "step": 30527000 + }, + { + "epoch": 88.36, + "learning_rate": 5.833598670804002e-06, + "loss": 1.7976, + "step": 30527500 + }, + { + "epoch": 88.37, + "learning_rate": 5.832875023156725e-06, + "loss": 1.8056, + "step": 30528000 + }, + { + "epoch": 88.37, + "learning_rate": 5.832152822804743e-06, + "loss": 1.7904, + "step": 30528500 + }, + { + "epoch": 88.37, + "learning_rate": 5.831429175157465e-06, + "loss": 1.8035, + "step": 30529000 + }, + { + "epoch": 88.37, + "learning_rate": 5.830705527510189e-06, + "loss": 1.8028, + "step": 30529500 + }, + { + "epoch": 88.37, + "learning_rate": 5.829981879862912e-06, + "loss": 1.7872, + "step": 30530000 + }, + { + "epoch": 88.37, + "learning_rate": 5.8292582322156355e-06, + "loss": 1.8124, + "step": 30530500 + }, + { + "epoch": 88.37, + "learning_rate": 5.8285360318636536e-06, + "loss": 1.7837, + "step": 30531000 + }, + { + "epoch": 88.38, + "learning_rate": 5.827812384216377e-06, + "loss": 1.8078, + "step": 30531500 + }, + { + "epoch": 88.38, + "learning_rate": 5.8270887365691006e-06, + "loss": 1.781, + "step": 30532000 + }, + { + "epoch": 88.38, + "learning_rate": 5.826365088921823e-06, + "loss": 1.8164, + "step": 30532500 + }, + { + "epoch": 88.38, + "learning_rate": 5.825642888569841e-06, + "loss": 1.8059, + "step": 30533000 + }, + { + "epoch": 88.38, + "learning_rate": 5.824919240922564e-06, + "loss": 1.8209, + "step": 30533500 + }, + { + "epoch": 88.38, + "learning_rate": 5.824195593275288e-06, + "loss": 1.8062, + "step": 30534000 + }, + { + "epoch": 88.38, + "learning_rate": 5.82347194562801e-06, + "loss": 1.8165, + "step": 30534500 + }, + { + "epoch": 88.39, + "learning_rate": 5.822748297980734e-06, + "loss": 1.7915, + "step": 30535000 + }, + { + "epoch": 88.39, + "learning_rate": 5.822024650333457e-06, + "loss": 1.7967, + "step": 30535500 + }, + { + "epoch": 88.39, + "learning_rate": 5.82130100268618e-06, + "loss": 1.8127, + "step": 30536000 + }, + { + "epoch": 88.39, + "learning_rate": 5.8205788023341975e-06, + "loss": 1.8175, + "step": 30536500 + }, + { + "epoch": 88.39, + "learning_rate": 5.819855154686921e-06, + "loss": 1.8063, + "step": 30537000 + }, + { + "epoch": 88.39, + "learning_rate": 5.8191315070396445e-06, + "loss": 1.7862, + "step": 30537500 + }, + { + "epoch": 88.4, + "learning_rate": 5.8184078593923676e-06, + "loss": 1.7875, + "step": 30538000 + }, + { + "epoch": 88.4, + "learning_rate": 5.8176842117450915e-06, + "loss": 1.8045, + "step": 30538500 + }, + { + "epoch": 88.4, + "learning_rate": 5.816960564097814e-06, + "loss": 1.8076, + "step": 30539000 + }, + { + "epoch": 88.4, + "learning_rate": 5.816236916450538e-06, + "loss": 1.7934, + "step": 30539500 + }, + { + "epoch": 88.4, + "learning_rate": 5.815514716098555e-06, + "loss": 1.7587, + "step": 30540000 + }, + { + "epoch": 88.4, + "learning_rate": 5.814791068451279e-06, + "loss": 1.7992, + "step": 30540500 + }, + { + "epoch": 88.4, + "learning_rate": 5.814067420804002e-06, + "loss": 1.7927, + "step": 30541000 + }, + { + "epoch": 88.41, + "learning_rate": 5.813343773156725e-06, + "loss": 1.7865, + "step": 30541500 + }, + { + "epoch": 88.41, + "learning_rate": 5.812620125509449e-06, + "loss": 1.7981, + "step": 30542000 + }, + { + "epoch": 88.41, + "learning_rate": 5.811896477862171e-06, + "loss": 1.767, + "step": 30542500 + }, + { + "epoch": 88.41, + "learning_rate": 5.811172830214895e-06, + "loss": 1.8072, + "step": 30543000 + }, + { + "epoch": 88.41, + "learning_rate": 5.810449182567617e-06, + "loss": 1.8144, + "step": 30543500 + }, + { + "epoch": 88.41, + "learning_rate": 5.809725534920341e-06, + "loss": 1.7955, + "step": 30544000 + }, + { + "epoch": 88.41, + "learning_rate": 5.8090033345683585e-06, + "loss": 1.8078, + "step": 30544500 + }, + { + "epoch": 88.42, + "learning_rate": 5.808279686921082e-06, + "loss": 1.7954, + "step": 30545000 + }, + { + "epoch": 88.42, + "learning_rate": 5.8075560392738055e-06, + "loss": 1.8099, + "step": 30545500 + }, + { + "epoch": 88.42, + "learning_rate": 5.8068323916265286e-06, + "loss": 1.7723, + "step": 30546000 + }, + { + "epoch": 88.42, + "learning_rate": 5.806110191274546e-06, + "loss": 1.7996, + "step": 30546500 + }, + { + "epoch": 88.42, + "learning_rate": 5.80538654362727e-06, + "loss": 1.7909, + "step": 30547000 + }, + { + "epoch": 88.42, + "learning_rate": 5.804662895979993e-06, + "loss": 1.7803, + "step": 30547500 + }, + { + "epoch": 88.42, + "learning_rate": 5.803939248332716e-06, + "loss": 1.7988, + "step": 30548000 + }, + { + "epoch": 88.43, + "learning_rate": 5.803217047980734e-06, + "loss": 1.8111, + "step": 30548500 + }, + { + "epoch": 88.43, + "learning_rate": 5.802493400333457e-06, + "loss": 1.845, + "step": 30549000 + }, + { + "epoch": 88.43, + "learning_rate": 5.80176975268618e-06, + "loss": 1.799, + "step": 30549500 + }, + { + "epoch": 88.43, + "learning_rate": 5.801047552334198e-06, + "loss": 1.7847, + "step": 30550000 + }, + { + "epoch": 88.43, + "learning_rate": 5.800323904686921e-06, + "loss": 1.7963, + "step": 30550500 + }, + { + "epoch": 88.43, + "learning_rate": 5.7996017043349394e-06, + "loss": 1.7788, + "step": 30551000 + }, + { + "epoch": 88.43, + "learning_rate": 5.7988780566876625e-06, + "loss": 1.787, + "step": 30551500 + }, + { + "epoch": 88.44, + "learning_rate": 5.798154409040386e-06, + "loss": 1.8023, + "step": 30552000 + }, + { + "epoch": 88.44, + "learning_rate": 5.797430761393109e-06, + "loss": 1.7791, + "step": 30552500 + }, + { + "epoch": 88.44, + "learning_rate": 5.796707113745832e-06, + "loss": 1.7656, + "step": 30553000 + }, + { + "epoch": 88.44, + "learning_rate": 5.795983466098556e-06, + "loss": 1.8062, + "step": 30553500 + }, + { + "epoch": 88.44, + "learning_rate": 5.795259818451279e-06, + "loss": 1.7969, + "step": 30554000 + }, + { + "epoch": 88.44, + "learning_rate": 5.794536170804002e-06, + "loss": 1.808, + "step": 30554500 + }, + { + "epoch": 88.44, + "learning_rate": 5.793812523156725e-06, + "loss": 1.7952, + "step": 30555000 + }, + { + "epoch": 88.45, + "learning_rate": 5.793088875509448e-06, + "loss": 1.7875, + "step": 30555500 + }, + { + "epoch": 88.45, + "learning_rate": 5.792365227862172e-06, + "loss": 1.8081, + "step": 30556000 + }, + { + "epoch": 88.45, + "learning_rate": 5.791641580214895e-06, + "loss": 1.7952, + "step": 30556500 + }, + { + "epoch": 88.45, + "learning_rate": 5.790917932567618e-06, + "loss": 1.8256, + "step": 30557000 + }, + { + "epoch": 88.45, + "learning_rate": 5.790195732215635e-06, + "loss": 1.8108, + "step": 30557500 + }, + { + "epoch": 88.45, + "learning_rate": 5.789472084568359e-06, + "loss": 1.8136, + "step": 30558000 + }, + { + "epoch": 88.45, + "learning_rate": 5.788748436921082e-06, + "loss": 1.7987, + "step": 30558500 + }, + { + "epoch": 88.46, + "learning_rate": 5.7880247892738054e-06, + "loss": 1.8137, + "step": 30559000 + }, + { + "epoch": 88.46, + "learning_rate": 5.7873011416265285e-06, + "loss": 1.784, + "step": 30559500 + }, + { + "epoch": 88.46, + "learning_rate": 5.786577493979252e-06, + "loss": 1.7938, + "step": 30560000 + }, + { + "epoch": 88.46, + "learning_rate": 5.785853846331975e-06, + "loss": 1.7766, + "step": 30560500 + }, + { + "epoch": 88.46, + "learning_rate": 5.785130198684699e-06, + "loss": 1.8036, + "step": 30561000 + }, + { + "epoch": 88.46, + "learning_rate": 5.784407998332716e-06, + "loss": 1.8154, + "step": 30561500 + }, + { + "epoch": 88.46, + "learning_rate": 5.783684350685439e-06, + "loss": 1.79, + "step": 30562000 + }, + { + "epoch": 88.47, + "learning_rate": 5.782960703038163e-06, + "loss": 1.8366, + "step": 30562500 + }, + { + "epoch": 88.47, + "learning_rate": 5.782237055390886e-06, + "loss": 1.7906, + "step": 30563000 + }, + { + "epoch": 88.47, + "learning_rate": 5.781513407743609e-06, + "loss": 1.8271, + "step": 30563500 + }, + { + "epoch": 88.47, + "learning_rate": 5.780789760096332e-06, + "loss": 1.7874, + "step": 30564000 + }, + { + "epoch": 88.47, + "learning_rate": 5.780066112449055e-06, + "loss": 1.7872, + "step": 30564500 + }, + { + "epoch": 88.47, + "learning_rate": 5.779343912097073e-06, + "loss": 1.7749, + "step": 30565000 + }, + { + "epoch": 88.47, + "learning_rate": 5.778620264449796e-06, + "loss": 1.7937, + "step": 30565500 + }, + { + "epoch": 88.48, + "learning_rate": 5.7778966168025194e-06, + "loss": 1.7967, + "step": 30566000 + }, + { + "epoch": 88.48, + "learning_rate": 5.777172969155243e-06, + "loss": 1.8344, + "step": 30566500 + }, + { + "epoch": 88.48, + "learning_rate": 5.7764493215079665e-06, + "loss": 1.8455, + "step": 30567000 + }, + { + "epoch": 88.48, + "learning_rate": 5.7757256738606895e-06, + "loss": 1.7935, + "step": 30567500 + }, + { + "epoch": 88.48, + "learning_rate": 5.775002026213413e-06, + "loss": 1.7972, + "step": 30568000 + }, + { + "epoch": 88.48, + "learning_rate": 5.774279825861431e-06, + "loss": 1.8104, + "step": 30568500 + }, + { + "epoch": 88.48, + "learning_rate": 5.773556178214154e-06, + "loss": 1.7951, + "step": 30569000 + }, + { + "epoch": 88.49, + "learning_rate": 5.772832530566877e-06, + "loss": 1.8129, + "step": 30569500 + }, + { + "epoch": 88.49, + "learning_rate": 5.7721088829196e-06, + "loss": 1.7829, + "step": 30570000 + }, + { + "epoch": 88.49, + "learning_rate": 5.771385235272323e-06, + "loss": 1.7921, + "step": 30570500 + }, + { + "epoch": 88.49, + "learning_rate": 5.770661587625047e-06, + "loss": 1.7865, + "step": 30571000 + }, + { + "epoch": 88.49, + "learning_rate": 5.769937939977769e-06, + "loss": 1.8043, + "step": 30571500 + }, + { + "epoch": 88.49, + "learning_rate": 5.769215739625788e-06, + "loss": 1.7848, + "step": 30572000 + }, + { + "epoch": 88.49, + "learning_rate": 5.76849209197851e-06, + "loss": 1.7881, + "step": 30572500 + }, + { + "epoch": 88.5, + "learning_rate": 5.7677698916265285e-06, + "loss": 1.7996, + "step": 30573000 + }, + { + "epoch": 88.5, + "learning_rate": 5.7670462439792516e-06, + "loss": 1.806, + "step": 30573500 + }, + { + "epoch": 88.5, + "learning_rate": 5.7663225963319755e-06, + "loss": 1.7993, + "step": 30574000 + }, + { + "epoch": 88.5, + "learning_rate": 5.765598948684698e-06, + "loss": 1.7858, + "step": 30574500 + }, + { + "epoch": 88.5, + "learning_rate": 5.764875301037422e-06, + "loss": 1.8234, + "step": 30575000 + }, + { + "epoch": 88.5, + "learning_rate": 5.764153100685439e-06, + "loss": 1.7955, + "step": 30575500 + }, + { + "epoch": 88.51, + "learning_rate": 5.763429453038163e-06, + "loss": 1.8184, + "step": 30576000 + }, + { + "epoch": 88.51, + "learning_rate": 5.762705805390886e-06, + "loss": 1.7851, + "step": 30576500 + }, + { + "epoch": 88.51, + "learning_rate": 5.761982157743609e-06, + "loss": 1.8044, + "step": 30577000 + }, + { + "epoch": 88.51, + "learning_rate": 5.761258510096332e-06, + "loss": 1.7937, + "step": 30577500 + }, + { + "epoch": 88.51, + "learning_rate": 5.760534862449055e-06, + "loss": 1.8083, + "step": 30578000 + }, + { + "epoch": 88.51, + "learning_rate": 5.759811214801779e-06, + "loss": 1.8035, + "step": 30578500 + }, + { + "epoch": 88.51, + "learning_rate": 5.759087567154501e-06, + "loss": 1.7949, + "step": 30579000 + }, + { + "epoch": 88.52, + "learning_rate": 5.758363919507225e-06, + "loss": 1.781, + "step": 30579500 + }, + { + "epoch": 88.52, + "learning_rate": 5.757640271859948e-06, + "loss": 1.8086, + "step": 30580000 + }, + { + "epoch": 88.52, + "learning_rate": 5.756918071507966e-06, + "loss": 1.7872, + "step": 30580500 + }, + { + "epoch": 88.52, + "learning_rate": 5.7561944238606895e-06, + "loss": 1.8084, + "step": 30581000 + }, + { + "epoch": 88.52, + "learning_rate": 5.7554707762134126e-06, + "loss": 1.7698, + "step": 30581500 + }, + { + "epoch": 88.52, + "learning_rate": 5.7547471285661365e-06, + "loss": 1.7891, + "step": 30582000 + }, + { + "epoch": 88.52, + "learning_rate": 5.754023480918859e-06, + "loss": 1.8125, + "step": 30582500 + }, + { + "epoch": 88.53, + "learning_rate": 5.753299833271583e-06, + "loss": 1.8073, + "step": 30583000 + }, + { + "epoch": 88.53, + "learning_rate": 5.752576185624305e-06, + "loss": 1.8188, + "step": 30583500 + }, + { + "epoch": 88.53, + "learning_rate": 5.751852537977029e-06, + "loss": 1.8043, + "step": 30584000 + }, + { + "epoch": 88.53, + "learning_rate": 5.751130337625046e-06, + "loss": 1.7481, + "step": 30584500 + }, + { + "epoch": 88.53, + "learning_rate": 5.75040668997777e-06, + "loss": 1.7868, + "step": 30585000 + }, + { + "epoch": 88.53, + "learning_rate": 5.749683042330493e-06, + "loss": 1.8074, + "step": 30585500 + }, + { + "epoch": 88.53, + "learning_rate": 5.748959394683216e-06, + "loss": 1.8052, + "step": 30586000 + }, + { + "epoch": 88.54, + "learning_rate": 5.748237194331233e-06, + "loss": 1.7869, + "step": 30586500 + }, + { + "epoch": 88.54, + "learning_rate": 5.747513546683957e-06, + "loss": 1.7691, + "step": 30587000 + }, + { + "epoch": 88.54, + "learning_rate": 5.746789899036681e-06, + "loss": 1.7841, + "step": 30587500 + }, + { + "epoch": 88.54, + "learning_rate": 5.7460662513894035e-06, + "loss": 1.8123, + "step": 30588000 + }, + { + "epoch": 88.54, + "learning_rate": 5.745342603742127e-06, + "loss": 1.8023, + "step": 30588500 + }, + { + "epoch": 88.54, + "learning_rate": 5.74461895609485e-06, + "loss": 1.8017, + "step": 30589000 + }, + { + "epoch": 88.54, + "learning_rate": 5.743895308447574e-06, + "loss": 1.8052, + "step": 30589500 + }, + { + "epoch": 88.55, + "learning_rate": 5.743171660800297e-06, + "loss": 1.8131, + "step": 30590000 + }, + { + "epoch": 88.55, + "learning_rate": 5.742449460448315e-06, + "loss": 1.8127, + "step": 30590500 + }, + { + "epoch": 88.55, + "learning_rate": 5.741725812801038e-06, + "loss": 1.7768, + "step": 30591000 + }, + { + "epoch": 88.55, + "learning_rate": 5.741002165153761e-06, + "loss": 1.8007, + "step": 30591500 + }, + { + "epoch": 88.55, + "learning_rate": 5.740278517506484e-06, + "loss": 1.7681, + "step": 30592000 + }, + { + "epoch": 88.55, + "learning_rate": 5.739554869859207e-06, + "loss": 1.7879, + "step": 30592500 + }, + { + "epoch": 88.55, + "learning_rate": 5.738831222211931e-06, + "loss": 1.7933, + "step": 30593000 + }, + { + "epoch": 88.56, + "learning_rate": 5.738107574564654e-06, + "loss": 1.8162, + "step": 30593500 + }, + { + "epoch": 88.56, + "learning_rate": 5.737383926917377e-06, + "loss": 1.8053, + "step": 30594000 + }, + { + "epoch": 88.56, + "learning_rate": 5.736661726565394e-06, + "loss": 1.7822, + "step": 30594500 + }, + { + "epoch": 88.56, + "learning_rate": 5.735938078918118e-06, + "loss": 1.8124, + "step": 30595000 + }, + { + "epoch": 88.56, + "learning_rate": 5.7352144312708414e-06, + "loss": 1.7946, + "step": 30595500 + }, + { + "epoch": 88.56, + "learning_rate": 5.734493678214154e-06, + "loss": 1.7864, + "step": 30596000 + }, + { + "epoch": 88.56, + "learning_rate": 5.733770030566877e-06, + "loss": 1.8049, + "step": 30596500 + }, + { + "epoch": 88.57, + "learning_rate": 5.733046382919601e-06, + "loss": 1.8, + "step": 30597000 + }, + { + "epoch": 88.57, + "learning_rate": 5.732322735272323e-06, + "loss": 1.7835, + "step": 30597500 + }, + { + "epoch": 88.57, + "learning_rate": 5.731599087625047e-06, + "loss": 1.8105, + "step": 30598000 + }, + { + "epoch": 88.57, + "learning_rate": 5.73087543997777e-06, + "loss": 1.7788, + "step": 30598500 + }, + { + "epoch": 88.57, + "learning_rate": 5.730151792330493e-06, + "loss": 1.8118, + "step": 30599000 + }, + { + "epoch": 88.57, + "learning_rate": 5.729428144683216e-06, + "loss": 1.808, + "step": 30599500 + }, + { + "epoch": 88.57, + "learning_rate": 5.728704497035939e-06, + "loss": 1.807, + "step": 30600000 + }, + { + "epoch": 88.58, + "learning_rate": 5.727982296683957e-06, + "loss": 1.792, + "step": 30600500 + }, + { + "epoch": 88.58, + "learning_rate": 5.72725864903668e-06, + "loss": 1.7641, + "step": 30601000 + }, + { + "epoch": 88.58, + "learning_rate": 5.726535001389404e-06, + "loss": 1.7987, + "step": 30601500 + }, + { + "epoch": 88.58, + "learning_rate": 5.7258113537421265e-06, + "loss": 1.7995, + "step": 30602000 + }, + { + "epoch": 88.58, + "learning_rate": 5.7250877060948505e-06, + "loss": 1.7754, + "step": 30602500 + }, + { + "epoch": 88.58, + "learning_rate": 5.724365505742868e-06, + "loss": 1.8005, + "step": 30603000 + }, + { + "epoch": 88.58, + "learning_rate": 5.723641858095592e-06, + "loss": 1.8045, + "step": 30603500 + }, + { + "epoch": 88.59, + "learning_rate": 5.722918210448315e-06, + "loss": 1.7898, + "step": 30604000 + }, + { + "epoch": 88.59, + "learning_rate": 5.722194562801038e-06, + "loss": 1.8106, + "step": 30604500 + }, + { + "epoch": 88.59, + "learning_rate": 5.721470915153761e-06, + "loss": 1.7897, + "step": 30605000 + }, + { + "epoch": 88.59, + "learning_rate": 5.720748714801779e-06, + "loss": 1.7669, + "step": 30605500 + }, + { + "epoch": 88.59, + "learning_rate": 5.720025067154502e-06, + "loss": 1.7809, + "step": 30606000 + }, + { + "epoch": 88.59, + "learning_rate": 5.71930286680252e-06, + "loss": 1.7752, + "step": 30606500 + }, + { + "epoch": 88.59, + "learning_rate": 5.718580666450537e-06, + "loss": 1.8162, + "step": 30607000 + }, + { + "epoch": 88.6, + "learning_rate": 5.7178570188032605e-06, + "loss": 1.8137, + "step": 30607500 + }, + { + "epoch": 88.6, + "learning_rate": 5.7171348184512786e-06, + "loss": 1.7916, + "step": 30608000 + }, + { + "epoch": 88.6, + "learning_rate": 5.716411170804002e-06, + "loss": 1.8012, + "step": 30608500 + }, + { + "epoch": 88.6, + "learning_rate": 5.715687523156725e-06, + "loss": 1.7725, + "step": 30609000 + }, + { + "epoch": 88.6, + "learning_rate": 5.714963875509449e-06, + "loss": 1.7854, + "step": 30609500 + }, + { + "epoch": 88.6, + "learning_rate": 5.714240227862172e-06, + "loss": 1.7898, + "step": 30610000 + }, + { + "epoch": 88.6, + "learning_rate": 5.713516580214895e-06, + "loss": 1.7682, + "step": 30610500 + }, + { + "epoch": 88.61, + "learning_rate": 5.712792932567618e-06, + "loss": 1.8085, + "step": 30611000 + }, + { + "epoch": 88.61, + "learning_rate": 5.712069284920341e-06, + "loss": 1.7981, + "step": 30611500 + }, + { + "epoch": 88.61, + "learning_rate": 5.711345637273064e-06, + "loss": 1.8207, + "step": 30612000 + }, + { + "epoch": 88.61, + "learning_rate": 5.710621989625788e-06, + "loss": 1.7783, + "step": 30612500 + }, + { + "epoch": 88.61, + "learning_rate": 5.709898341978511e-06, + "loss": 1.8069, + "step": 30613000 + }, + { + "epoch": 88.61, + "learning_rate": 5.709174694331234e-06, + "loss": 1.7969, + "step": 30613500 + }, + { + "epoch": 88.61, + "learning_rate": 5.708451046683957e-06, + "loss": 1.8241, + "step": 30614000 + }, + { + "epoch": 88.62, + "learning_rate": 5.70772739903668e-06, + "loss": 1.8198, + "step": 30614500 + }, + { + "epoch": 88.62, + "learning_rate": 5.707003751389404e-06, + "loss": 1.8067, + "step": 30615000 + }, + { + "epoch": 88.62, + "learning_rate": 5.7062801037421265e-06, + "loss": 1.8086, + "step": 30615500 + }, + { + "epoch": 88.62, + "learning_rate": 5.70555645609485e-06, + "loss": 1.7782, + "step": 30616000 + }, + { + "epoch": 88.62, + "learning_rate": 5.704834255742868e-06, + "loss": 1.8019, + "step": 30616500 + }, + { + "epoch": 88.62, + "learning_rate": 5.7041106080955916e-06, + "loss": 1.7863, + "step": 30617000 + }, + { + "epoch": 88.63, + "learning_rate": 5.703386960448315e-06, + "loss": 1.8029, + "step": 30617500 + }, + { + "epoch": 88.63, + "learning_rate": 5.702663312801038e-06, + "loss": 1.803, + "step": 30618000 + }, + { + "epoch": 88.63, + "learning_rate": 5.701941112449055e-06, + "loss": 1.8282, + "step": 30618500 + }, + { + "epoch": 88.63, + "learning_rate": 5.701217464801779e-06, + "loss": 1.7977, + "step": 30619000 + }, + { + "epoch": 88.63, + "learning_rate": 5.700493817154502e-06, + "loss": 1.8013, + "step": 30619500 + }, + { + "epoch": 88.63, + "learning_rate": 5.699770169507225e-06, + "loss": 1.7682, + "step": 30620000 + }, + { + "epoch": 88.63, + "learning_rate": 5.699047969155243e-06, + "loss": 1.8183, + "step": 30620500 + }, + { + "epoch": 88.64, + "learning_rate": 5.698324321507966e-06, + "loss": 1.805, + "step": 30621000 + }, + { + "epoch": 88.64, + "learning_rate": 5.6976021211559835e-06, + "loss": 1.7903, + "step": 30621500 + }, + { + "epoch": 88.64, + "learning_rate": 5.6968784735087074e-06, + "loss": 1.7912, + "step": 30622000 + }, + { + "epoch": 88.64, + "learning_rate": 5.6961548258614305e-06, + "loss": 1.8305, + "step": 30622500 + }, + { + "epoch": 88.64, + "learning_rate": 5.695431178214154e-06, + "loss": 1.8131, + "step": 30623000 + }, + { + "epoch": 88.64, + "learning_rate": 5.694707530566877e-06, + "loss": 1.7775, + "step": 30623500 + }, + { + "epoch": 88.64, + "learning_rate": 5.6939838829196e-06, + "loss": 1.7761, + "step": 30624000 + }, + { + "epoch": 88.65, + "learning_rate": 5.693260235272324e-06, + "loss": 1.7865, + "step": 30624500 + }, + { + "epoch": 88.65, + "learning_rate": 5.692536587625046e-06, + "loss": 1.8031, + "step": 30625000 + }, + { + "epoch": 88.65, + "learning_rate": 5.69181293997777e-06, + "loss": 1.7714, + "step": 30625500 + }, + { + "epoch": 88.65, + "learning_rate": 5.691089292330493e-06, + "loss": 1.7814, + "step": 30626000 + }, + { + "epoch": 88.65, + "learning_rate": 5.690365644683216e-06, + "loss": 1.8006, + "step": 30626500 + }, + { + "epoch": 88.65, + "learning_rate": 5.68964199703594e-06, + "loss": 1.8309, + "step": 30627000 + }, + { + "epoch": 88.65, + "learning_rate": 5.688919796683957e-06, + "loss": 1.7916, + "step": 30627500 + }, + { + "epoch": 88.66, + "learning_rate": 5.688196149036681e-06, + "loss": 1.8033, + "step": 30628000 + }, + { + "epoch": 88.66, + "learning_rate": 5.687472501389403e-06, + "loss": 1.793, + "step": 30628500 + }, + { + "epoch": 88.66, + "learning_rate": 5.686748853742127e-06, + "loss": 1.779, + "step": 30629000 + }, + { + "epoch": 88.66, + "learning_rate": 5.6860252060948495e-06, + "loss": 1.7958, + "step": 30629500 + }, + { + "epoch": 88.66, + "learning_rate": 5.6853015584475734e-06, + "loss": 1.7868, + "step": 30630000 + }, + { + "epoch": 88.66, + "learning_rate": 5.684579358095591e-06, + "loss": 1.7896, + "step": 30630500 + }, + { + "epoch": 88.66, + "learning_rate": 5.683855710448315e-06, + "loss": 1.7954, + "step": 30631000 + }, + { + "epoch": 88.67, + "learning_rate": 5.683132062801038e-06, + "loss": 1.7954, + "step": 30631500 + }, + { + "epoch": 88.67, + "learning_rate": 5.682408415153761e-06, + "loss": 1.8205, + "step": 30632000 + }, + { + "epoch": 88.67, + "learning_rate": 5.681684767506485e-06, + "loss": 1.811, + "step": 30632500 + }, + { + "epoch": 88.67, + "learning_rate": 5.680961119859207e-06, + "loss": 1.8114, + "step": 30633000 + }, + { + "epoch": 88.67, + "learning_rate": 5.680237472211931e-06, + "loss": 1.8298, + "step": 30633500 + }, + { + "epoch": 88.67, + "learning_rate": 5.679513824564654e-06, + "loss": 1.813, + "step": 30634000 + }, + { + "epoch": 88.67, + "learning_rate": 5.678791624212672e-06, + "loss": 1.7879, + "step": 30634500 + }, + { + "epoch": 88.68, + "learning_rate": 5.678067976565394e-06, + "loss": 1.8003, + "step": 30635000 + }, + { + "epoch": 88.68, + "learning_rate": 5.677344328918118e-06, + "loss": 1.7795, + "step": 30635500 + }, + { + "epoch": 88.68, + "learning_rate": 5.676620681270841e-06, + "loss": 1.8235, + "step": 30636000 + }, + { + "epoch": 88.68, + "learning_rate": 5.675897033623564e-06, + "loss": 1.8343, + "step": 30636500 + }, + { + "epoch": 88.68, + "learning_rate": 5.675173385976288e-06, + "loss": 1.7961, + "step": 30637000 + }, + { + "epoch": 88.68, + "learning_rate": 5.6744497383290105e-06, + "loss": 1.8055, + "step": 30637500 + }, + { + "epoch": 88.68, + "learning_rate": 5.6737275379770295e-06, + "loss": 1.8124, + "step": 30638000 + }, + { + "epoch": 88.69, + "learning_rate": 5.673003890329752e-06, + "loss": 1.789, + "step": 30638500 + }, + { + "epoch": 88.69, + "learning_rate": 5.672280242682476e-06, + "loss": 1.7971, + "step": 30639000 + }, + { + "epoch": 88.69, + "learning_rate": 5.671556595035199e-06, + "loss": 1.8077, + "step": 30639500 + }, + { + "epoch": 88.69, + "learning_rate": 5.670834394683217e-06, + "loss": 1.7789, + "step": 30640000 + }, + { + "epoch": 88.69, + "learning_rate": 5.670110747035939e-06, + "loss": 1.7791, + "step": 30640500 + }, + { + "epoch": 88.69, + "learning_rate": 5.669387099388663e-06, + "loss": 1.786, + "step": 30641000 + }, + { + "epoch": 88.69, + "learning_rate": 5.668663451741386e-06, + "loss": 1.7833, + "step": 30641500 + }, + { + "epoch": 88.7, + "learning_rate": 5.667939804094109e-06, + "loss": 1.8115, + "step": 30642000 + }, + { + "epoch": 88.7, + "learning_rate": 5.667216156446833e-06, + "loss": 1.823, + "step": 30642500 + }, + { + "epoch": 88.7, + "learning_rate": 5.666492508799555e-06, + "loss": 1.8087, + "step": 30643000 + }, + { + "epoch": 88.7, + "learning_rate": 5.665768861152279e-06, + "loss": 1.7957, + "step": 30643500 + }, + { + "epoch": 88.7, + "learning_rate": 5.6650466608002965e-06, + "loss": 1.7878, + "step": 30644000 + }, + { + "epoch": 88.7, + "learning_rate": 5.66432301315302e-06, + "loss": 1.7832, + "step": 30644500 + }, + { + "epoch": 88.7, + "learning_rate": 5.663600812801038e-06, + "loss": 1.8199, + "step": 30645000 + }, + { + "epoch": 88.71, + "learning_rate": 5.6628771651537616e-06, + "loss": 1.797, + "step": 30645500 + }, + { + "epoch": 88.71, + "learning_rate": 5.662153517506484e-06, + "loss": 1.7934, + "step": 30646000 + }, + { + "epoch": 88.71, + "learning_rate": 5.661429869859208e-06, + "loss": 1.7852, + "step": 30646500 + }, + { + "epoch": 88.71, + "learning_rate": 5.660706222211931e-06, + "loss": 1.7912, + "step": 30647000 + }, + { + "epoch": 88.71, + "learning_rate": 5.659984021859949e-06, + "loss": 1.7813, + "step": 30647500 + }, + { + "epoch": 88.71, + "learning_rate": 5.659260374212671e-06, + "loss": 1.7826, + "step": 30648000 + }, + { + "epoch": 88.71, + "learning_rate": 5.658536726565395e-06, + "loss": 1.8113, + "step": 30648500 + }, + { + "epoch": 88.72, + "learning_rate": 5.657813078918118e-06, + "loss": 1.7862, + "step": 30649000 + }, + { + "epoch": 88.72, + "learning_rate": 5.657089431270841e-06, + "loss": 1.7931, + "step": 30649500 + }, + { + "epoch": 88.72, + "learning_rate": 5.656365783623564e-06, + "loss": 1.7944, + "step": 30650000 + }, + { + "epoch": 88.72, + "learning_rate": 5.655642135976287e-06, + "loss": 1.7972, + "step": 30650500 + }, + { + "epoch": 88.72, + "learning_rate": 5.654918488329011e-06, + "loss": 1.8354, + "step": 30651000 + }, + { + "epoch": 88.72, + "learning_rate": 5.654194840681734e-06, + "loss": 1.8296, + "step": 30651500 + }, + { + "epoch": 88.72, + "learning_rate": 5.6534711930344575e-06, + "loss": 1.8018, + "step": 30652000 + }, + { + "epoch": 88.73, + "learning_rate": 5.6527475453871806e-06, + "loss": 1.7842, + "step": 30652500 + }, + { + "epoch": 88.73, + "learning_rate": 5.652023897739904e-06, + "loss": 1.7879, + "step": 30653000 + }, + { + "epoch": 88.73, + "learning_rate": 5.651301697387922e-06, + "loss": 1.7964, + "step": 30653500 + }, + { + "epoch": 88.73, + "learning_rate": 5.65057949703594e-06, + "loss": 1.7833, + "step": 30654000 + }, + { + "epoch": 88.73, + "learning_rate": 5.649855849388663e-06, + "loss": 1.7797, + "step": 30654500 + }, + { + "epoch": 88.73, + "learning_rate": 5.649132201741386e-06, + "loss": 1.7853, + "step": 30655000 + }, + { + "epoch": 88.74, + "learning_rate": 5.648410001389404e-06, + "loss": 1.816, + "step": 30655500 + }, + { + "epoch": 88.74, + "learning_rate": 5.647686353742127e-06, + "loss": 1.7918, + "step": 30656000 + }, + { + "epoch": 88.74, + "learning_rate": 5.64696270609485e-06, + "loss": 1.8024, + "step": 30656500 + }, + { + "epoch": 88.74, + "learning_rate": 5.646239058447573e-06, + "loss": 1.8383, + "step": 30657000 + }, + { + "epoch": 88.74, + "learning_rate": 5.645515410800296e-06, + "loss": 1.7849, + "step": 30657500 + }, + { + "epoch": 88.74, + "learning_rate": 5.64479176315302e-06, + "loss": 1.7806, + "step": 30658000 + }, + { + "epoch": 88.74, + "learning_rate": 5.644068115505743e-06, + "loss": 1.7767, + "step": 30658500 + }, + { + "epoch": 88.75, + "learning_rate": 5.643345915153761e-06, + "loss": 1.8079, + "step": 30659000 + }, + { + "epoch": 88.75, + "learning_rate": 5.642622267506484e-06, + "loss": 1.8202, + "step": 30659500 + }, + { + "epoch": 88.75, + "learning_rate": 5.641898619859208e-06, + "loss": 1.8004, + "step": 30660000 + }, + { + "epoch": 88.75, + "learning_rate": 5.641174972211931e-06, + "loss": 1.7922, + "step": 30660500 + }, + { + "epoch": 88.75, + "learning_rate": 5.640451324564654e-06, + "loss": 1.7893, + "step": 30661000 + }, + { + "epoch": 88.75, + "learning_rate": 5.639727676917377e-06, + "loss": 1.7877, + "step": 30661500 + }, + { + "epoch": 88.75, + "learning_rate": 5.639005476565395e-06, + "loss": 1.8066, + "step": 30662000 + }, + { + "epoch": 88.76, + "learning_rate": 5.638281828918118e-06, + "loss": 1.7778, + "step": 30662500 + }, + { + "epoch": 88.76, + "learning_rate": 5.637558181270841e-06, + "loss": 1.81, + "step": 30663000 + }, + { + "epoch": 88.76, + "learning_rate": 5.636834533623564e-06, + "loss": 1.7979, + "step": 30663500 + }, + { + "epoch": 88.76, + "learning_rate": 5.636110885976287e-06, + "loss": 1.8129, + "step": 30664000 + }, + { + "epoch": 88.76, + "learning_rate": 5.6353886856243054e-06, + "loss": 1.8271, + "step": 30664500 + }, + { + "epoch": 88.76, + "learning_rate": 5.6346650379770285e-06, + "loss": 1.8082, + "step": 30665000 + }, + { + "epoch": 88.76, + "learning_rate": 5.6339413903297524e-06, + "loss": 1.7953, + "step": 30665500 + }, + { + "epoch": 88.77, + "learning_rate": 5.6332177426824755e-06, + "loss": 1.7943, + "step": 30666000 + }, + { + "epoch": 88.77, + "learning_rate": 5.632494095035199e-06, + "loss": 1.8298, + "step": 30666500 + }, + { + "epoch": 88.77, + "learning_rate": 5.631770447387922e-06, + "loss": 1.8113, + "step": 30667000 + }, + { + "epoch": 88.77, + "learning_rate": 5.631046799740645e-06, + "loss": 1.8061, + "step": 30667500 + }, + { + "epoch": 88.77, + "learning_rate": 5.630323152093369e-06, + "loss": 1.8041, + "step": 30668000 + }, + { + "epoch": 88.77, + "learning_rate": 5.629599504446091e-06, + "loss": 1.7945, + "step": 30668500 + }, + { + "epoch": 88.77, + "learning_rate": 5.628875856798815e-06, + "loss": 1.7936, + "step": 30669000 + }, + { + "epoch": 88.78, + "learning_rate": 5.628152209151538e-06, + "loss": 1.8096, + "step": 30669500 + }, + { + "epoch": 88.78, + "learning_rate": 5.627430008799556e-06, + "loss": 1.8121, + "step": 30670000 + }, + { + "epoch": 88.78, + "learning_rate": 5.626706361152278e-06, + "loss": 1.8047, + "step": 30670500 + }, + { + "epoch": 88.78, + "learning_rate": 5.625982713505002e-06, + "loss": 1.7901, + "step": 30671000 + }, + { + "epoch": 88.78, + "learning_rate": 5.625259065857725e-06, + "loss": 1.8314, + "step": 30671500 + }, + { + "epoch": 88.78, + "learning_rate": 5.624536865505743e-06, + "loss": 1.8086, + "step": 30672000 + }, + { + "epoch": 88.78, + "learning_rate": 5.6238132178584664e-06, + "loss": 1.81, + "step": 30672500 + }, + { + "epoch": 88.79, + "learning_rate": 5.6230895702111895e-06, + "loss": 1.7877, + "step": 30673000 + }, + { + "epoch": 88.79, + "learning_rate": 5.6223659225639135e-06, + "loss": 1.7968, + "step": 30673500 + }, + { + "epoch": 88.79, + "learning_rate": 5.621642274916636e-06, + "loss": 1.792, + "step": 30674000 + }, + { + "epoch": 88.79, + "learning_rate": 5.620920074564654e-06, + "loss": 1.7781, + "step": 30674500 + }, + { + "epoch": 88.79, + "learning_rate": 5.620196426917377e-06, + "loss": 1.7894, + "step": 30675000 + }, + { + "epoch": 88.79, + "learning_rate": 5.619472779270101e-06, + "loss": 1.7805, + "step": 30675500 + }, + { + "epoch": 88.79, + "learning_rate": 5.618749131622823e-06, + "loss": 1.8162, + "step": 30676000 + }, + { + "epoch": 88.8, + "learning_rate": 5.618025483975547e-06, + "loss": 1.7985, + "step": 30676500 + }, + { + "epoch": 88.8, + "learning_rate": 5.61730183632827e-06, + "loss": 1.831, + "step": 30677000 + }, + { + "epoch": 88.8, + "learning_rate": 5.616579635976288e-06, + "loss": 1.7804, + "step": 30677500 + }, + { + "epoch": 88.8, + "learning_rate": 5.61585598832901e-06, + "loss": 1.8018, + "step": 30678000 + }, + { + "epoch": 88.8, + "learning_rate": 5.615132340681734e-06, + "loss": 1.793, + "step": 30678500 + }, + { + "epoch": 88.8, + "learning_rate": 5.614408693034457e-06, + "loss": 1.8014, + "step": 30679000 + }, + { + "epoch": 88.8, + "learning_rate": 5.6136864926824755e-06, + "loss": 1.8108, + "step": 30679500 + }, + { + "epoch": 88.81, + "learning_rate": 5.6129628450351985e-06, + "loss": 1.7938, + "step": 30680000 + }, + { + "epoch": 88.81, + "learning_rate": 5.612239197387922e-06, + "loss": 1.797, + "step": 30680500 + }, + { + "epoch": 88.81, + "learning_rate": 5.6115155497406456e-06, + "loss": 1.7892, + "step": 30681000 + }, + { + "epoch": 88.81, + "learning_rate": 5.610791902093368e-06, + "loss": 1.8063, + "step": 30681500 + }, + { + "epoch": 88.81, + "learning_rate": 5.610069701741386e-06, + "loss": 1.7641, + "step": 30682000 + }, + { + "epoch": 88.81, + "learning_rate": 5.609346054094109e-06, + "loss": 1.7891, + "step": 30682500 + }, + { + "epoch": 88.81, + "learning_rate": 5.608622406446833e-06, + "loss": 1.7897, + "step": 30683000 + }, + { + "epoch": 88.82, + "learning_rate": 5.607898758799555e-06, + "loss": 1.7908, + "step": 30683500 + }, + { + "epoch": 88.82, + "learning_rate": 5.607175111152279e-06, + "loss": 1.8167, + "step": 30684000 + }, + { + "epoch": 88.82, + "learning_rate": 5.606451463505002e-06, + "loss": 1.7911, + "step": 30684500 + }, + { + "epoch": 88.82, + "learning_rate": 5.605727815857725e-06, + "loss": 1.7907, + "step": 30685000 + }, + { + "epoch": 88.82, + "learning_rate": 5.605004168210449e-06, + "loss": 1.7749, + "step": 30685500 + }, + { + "epoch": 88.82, + "learning_rate": 5.604281967858466e-06, + "loss": 1.8016, + "step": 30686000 + }, + { + "epoch": 88.82, + "learning_rate": 5.60355832021119e-06, + "loss": 1.7762, + "step": 30686500 + }, + { + "epoch": 88.83, + "learning_rate": 5.6028346725639126e-06, + "loss": 1.7863, + "step": 30687000 + }, + { + "epoch": 88.83, + "learning_rate": 5.602112472211931e-06, + "loss": 1.8204, + "step": 30687500 + }, + { + "epoch": 88.83, + "learning_rate": 5.601388824564654e-06, + "loss": 1.8093, + "step": 30688000 + }, + { + "epoch": 88.83, + "learning_rate": 5.600665176917378e-06, + "loss": 1.7907, + "step": 30688500 + }, + { + "epoch": 88.83, + "learning_rate": 5.5999415292701e-06, + "loss": 1.7873, + "step": 30689000 + }, + { + "epoch": 88.83, + "learning_rate": 5.599217881622824e-06, + "loss": 1.7766, + "step": 30689500 + }, + { + "epoch": 88.83, + "learning_rate": 5.598494233975547e-06, + "loss": 1.8062, + "step": 30690000 + }, + { + "epoch": 88.84, + "learning_rate": 5.59777058632827e-06, + "loss": 1.8027, + "step": 30690500 + }, + { + "epoch": 88.84, + "learning_rate": 5.597046938680993e-06, + "loss": 1.8039, + "step": 30691000 + }, + { + "epoch": 88.84, + "learning_rate": 5.596323291033716e-06, + "loss": 1.795, + "step": 30691500 + }, + { + "epoch": 88.84, + "learning_rate": 5.59559964338644e-06, + "loss": 1.8143, + "step": 30692000 + }, + { + "epoch": 88.84, + "learning_rate": 5.594875995739163e-06, + "loss": 1.7956, + "step": 30692500 + }, + { + "epoch": 88.84, + "learning_rate": 5.594153795387181e-06, + "loss": 1.7918, + "step": 30693000 + }, + { + "epoch": 88.85, + "learning_rate": 5.5934315950351985e-06, + "loss": 1.7997, + "step": 30693500 + }, + { + "epoch": 88.85, + "learning_rate": 5.5927079473879216e-06, + "loss": 1.777, + "step": 30694000 + }, + { + "epoch": 88.85, + "learning_rate": 5.591984299740645e-06, + "loss": 1.833, + "step": 30694500 + }, + { + "epoch": 88.85, + "learning_rate": 5.591260652093369e-06, + "loss": 1.8051, + "step": 30695000 + }, + { + "epoch": 88.85, + "learning_rate": 5.590537004446092e-06, + "loss": 1.8037, + "step": 30695500 + }, + { + "epoch": 88.85, + "learning_rate": 5.589813356798815e-06, + "loss": 1.7909, + "step": 30696000 + }, + { + "epoch": 88.85, + "learning_rate": 5.589089709151538e-06, + "loss": 1.7984, + "step": 30696500 + }, + { + "epoch": 88.86, + "learning_rate": 5.588366061504261e-06, + "loss": 1.8042, + "step": 30697000 + }, + { + "epoch": 88.86, + "learning_rate": 5.587642413856985e-06, + "loss": 1.8021, + "step": 30697500 + }, + { + "epoch": 88.86, + "learning_rate": 5.586920213505002e-06, + "loss": 1.7887, + "step": 30698000 + }, + { + "epoch": 88.86, + "learning_rate": 5.586196565857725e-06, + "loss": 1.7873, + "step": 30698500 + }, + { + "epoch": 88.86, + "learning_rate": 5.585472918210448e-06, + "loss": 1.8064, + "step": 30699000 + }, + { + "epoch": 88.86, + "learning_rate": 5.584749270563172e-06, + "loss": 1.7902, + "step": 30699500 + }, + { + "epoch": 88.86, + "learning_rate": 5.584025622915895e-06, + "loss": 1.8006, + "step": 30700000 + }, + { + "epoch": 88.87, + "learning_rate": 5.583303422563913e-06, + "loss": 1.7635, + "step": 30700500 + }, + { + "epoch": 88.87, + "learning_rate": 5.582579774916636e-06, + "loss": 1.8105, + "step": 30701000 + }, + { + "epoch": 88.87, + "learning_rate": 5.5818561272693595e-06, + "loss": 1.8069, + "step": 30701500 + }, + { + "epoch": 88.87, + "learning_rate": 5.581132479622083e-06, + "loss": 1.7985, + "step": 30702000 + }, + { + "epoch": 88.87, + "learning_rate": 5.580408831974806e-06, + "loss": 1.8187, + "step": 30702500 + }, + { + "epoch": 88.87, + "learning_rate": 5.579686631622824e-06, + "loss": 1.8041, + "step": 30703000 + }, + { + "epoch": 88.87, + "learning_rate": 5.578962983975547e-06, + "loss": 1.7908, + "step": 30703500 + }, + { + "epoch": 88.88, + "learning_rate": 5.57823933632827e-06, + "loss": 1.7976, + "step": 30704000 + }, + { + "epoch": 88.88, + "learning_rate": 5.577515688680993e-06, + "loss": 1.7835, + "step": 30704500 + }, + { + "epoch": 88.88, + "learning_rate": 5.576792041033716e-06, + "loss": 1.7911, + "step": 30705000 + }, + { + "epoch": 88.88, + "learning_rate": 5.57606839338644e-06, + "loss": 1.8084, + "step": 30705500 + }, + { + "epoch": 88.88, + "learning_rate": 5.575344745739163e-06, + "loss": 1.8149, + "step": 30706000 + }, + { + "epoch": 88.88, + "learning_rate": 5.57462254538718e-06, + "loss": 1.7834, + "step": 30706500 + }, + { + "epoch": 88.88, + "learning_rate": 5.573898897739904e-06, + "loss": 1.774, + "step": 30707000 + }, + { + "epoch": 88.89, + "learning_rate": 5.573175250092627e-06, + "loss": 1.7932, + "step": 30707500 + }, + { + "epoch": 88.89, + "learning_rate": 5.5724516024453504e-06, + "loss": 1.8095, + "step": 30708000 + }, + { + "epoch": 88.89, + "learning_rate": 5.5717279547980735e-06, + "loss": 1.7979, + "step": 30708500 + }, + { + "epoch": 88.89, + "learning_rate": 5.571005754446092e-06, + "loss": 1.8277, + "step": 30709000 + }, + { + "epoch": 88.89, + "learning_rate": 5.570282106798815e-06, + "loss": 1.8034, + "step": 30709500 + }, + { + "epoch": 88.89, + "learning_rate": 5.569558459151538e-06, + "loss": 1.8037, + "step": 30710000 + }, + { + "epoch": 88.89, + "learning_rate": 5.568834811504261e-06, + "loss": 1.7848, + "step": 30710500 + }, + { + "epoch": 88.9, + "learning_rate": 5.568111163856985e-06, + "loss": 1.8218, + "step": 30711000 + }, + { + "epoch": 88.9, + "learning_rate": 5.567387516209707e-06, + "loss": 1.8063, + "step": 30711500 + }, + { + "epoch": 88.9, + "learning_rate": 5.566663868562431e-06, + "loss": 1.7922, + "step": 30712000 + }, + { + "epoch": 88.9, + "learning_rate": 5.565940220915154e-06, + "loss": 1.8251, + "step": 30712500 + }, + { + "epoch": 88.9, + "learning_rate": 5.565218020563172e-06, + "loss": 1.7845, + "step": 30713000 + }, + { + "epoch": 88.9, + "learning_rate": 5.564495820211189e-06, + "loss": 1.7928, + "step": 30713500 + }, + { + "epoch": 88.9, + "learning_rate": 5.5637736198592075e-06, + "loss": 1.7906, + "step": 30714000 + }, + { + "epoch": 88.91, + "learning_rate": 5.5630499722119305e-06, + "loss": 1.799, + "step": 30714500 + }, + { + "epoch": 88.91, + "learning_rate": 5.562326324564654e-06, + "loss": 1.7983, + "step": 30715000 + }, + { + "epoch": 88.91, + "learning_rate": 5.561602676917377e-06, + "loss": 1.7958, + "step": 30715500 + }, + { + "epoch": 88.91, + "learning_rate": 5.560879029270101e-06, + "loss": 1.8031, + "step": 30716000 + }, + { + "epoch": 88.91, + "learning_rate": 5.560155381622824e-06, + "loss": 1.8298, + "step": 30716500 + }, + { + "epoch": 88.91, + "learning_rate": 5.559431733975547e-06, + "loss": 1.7925, + "step": 30717000 + }, + { + "epoch": 88.91, + "learning_rate": 5.558709533623564e-06, + "loss": 1.7972, + "step": 30717500 + }, + { + "epoch": 88.92, + "learning_rate": 5.557985885976288e-06, + "loss": 1.7824, + "step": 30718000 + }, + { + "epoch": 88.92, + "learning_rate": 5.557262238329011e-06, + "loss": 1.8053, + "step": 30718500 + }, + { + "epoch": 88.92, + "learning_rate": 5.556538590681734e-06, + "loss": 1.7924, + "step": 30719000 + }, + { + "epoch": 88.92, + "learning_rate": 5.555814943034457e-06, + "loss": 1.8079, + "step": 30719500 + }, + { + "epoch": 88.92, + "learning_rate": 5.55509129538718e-06, + "loss": 1.7759, + "step": 30720000 + }, + { + "epoch": 88.92, + "learning_rate": 5.554367647739904e-06, + "loss": 1.7941, + "step": 30720500 + }, + { + "epoch": 88.92, + "learning_rate": 5.553644000092627e-06, + "loss": 1.8203, + "step": 30721000 + }, + { + "epoch": 88.93, + "learning_rate": 5.55292035244535e-06, + "loss": 1.8101, + "step": 30721500 + }, + { + "epoch": 88.93, + "learning_rate": 5.5521967047980735e-06, + "loss": 1.7978, + "step": 30722000 + }, + { + "epoch": 88.93, + "learning_rate": 5.5514745044460916e-06, + "loss": 1.8237, + "step": 30722500 + }, + { + "epoch": 88.93, + "learning_rate": 5.550750856798815e-06, + "loss": 1.8012, + "step": 30723000 + }, + { + "epoch": 88.93, + "learning_rate": 5.550027209151538e-06, + "loss": 1.8024, + "step": 30723500 + }, + { + "epoch": 88.93, + "learning_rate": 5.549303561504262e-06, + "loss": 1.7896, + "step": 30724000 + }, + { + "epoch": 88.93, + "learning_rate": 5.548579913856984e-06, + "loss": 1.7697, + "step": 30724500 + }, + { + "epoch": 88.94, + "learning_rate": 5.547856266209708e-06, + "loss": 1.8178, + "step": 30725000 + }, + { + "epoch": 88.94, + "learning_rate": 5.547134065857725e-06, + "loss": 1.8021, + "step": 30725500 + }, + { + "epoch": 88.94, + "learning_rate": 5.546410418210449e-06, + "loss": 1.8111, + "step": 30726000 + }, + { + "epoch": 88.94, + "learning_rate": 5.545686770563171e-06, + "loss": 1.7917, + "step": 30726500 + }, + { + "epoch": 88.94, + "learning_rate": 5.544963122915895e-06, + "loss": 1.8032, + "step": 30727000 + }, + { + "epoch": 88.94, + "learning_rate": 5.544240922563912e-06, + "loss": 1.8122, + "step": 30727500 + }, + { + "epoch": 88.94, + "learning_rate": 5.543517274916636e-06, + "loss": 1.7707, + "step": 30728000 + }, + { + "epoch": 88.95, + "learning_rate": 5.542795074564654e-06, + "loss": 1.8128, + "step": 30728500 + }, + { + "epoch": 88.95, + "learning_rate": 5.5420714269173775e-06, + "loss": 1.7955, + "step": 30729000 + }, + { + "epoch": 88.95, + "learning_rate": 5.5413477792701e-06, + "loss": 1.8046, + "step": 30729500 + }, + { + "epoch": 88.95, + "learning_rate": 5.540624131622824e-06, + "loss": 1.8012, + "step": 30730000 + }, + { + "epoch": 88.95, + "learning_rate": 5.539900483975547e-06, + "loss": 1.7883, + "step": 30730500 + }, + { + "epoch": 88.95, + "learning_rate": 5.53917683632827e-06, + "loss": 1.775, + "step": 30731000 + }, + { + "epoch": 88.96, + "learning_rate": 5.538453188680994e-06, + "loss": 1.8022, + "step": 30731500 + }, + { + "epoch": 88.96, + "learning_rate": 5.537729541033716e-06, + "loss": 1.7962, + "step": 30732000 + }, + { + "epoch": 88.96, + "learning_rate": 5.537007340681735e-06, + "loss": 1.7755, + "step": 30732500 + }, + { + "epoch": 88.96, + "learning_rate": 5.536283693034457e-06, + "loss": 1.7947, + "step": 30733000 + }, + { + "epoch": 88.96, + "learning_rate": 5.535560045387181e-06, + "loss": 1.8348, + "step": 30733500 + }, + { + "epoch": 88.96, + "learning_rate": 5.534836397739903e-06, + "loss": 1.8037, + "step": 30734000 + }, + { + "epoch": 88.96, + "learning_rate": 5.534112750092627e-06, + "loss": 1.7875, + "step": 30734500 + }, + { + "epoch": 88.97, + "learning_rate": 5.53338910244535e-06, + "loss": 1.8079, + "step": 30735000 + }, + { + "epoch": 88.97, + "learning_rate": 5.532665454798073e-06, + "loss": 1.8044, + "step": 30735500 + }, + { + "epoch": 88.97, + "learning_rate": 5.5319432544460915e-06, + "loss": 1.7965, + "step": 30736000 + }, + { + "epoch": 88.97, + "learning_rate": 5.531219606798815e-06, + "loss": 1.8064, + "step": 30736500 + }, + { + "epoch": 88.97, + "learning_rate": 5.5304959591515385e-06, + "loss": 1.7789, + "step": 30737000 + }, + { + "epoch": 88.97, + "learning_rate": 5.529772311504261e-06, + "loss": 1.7842, + "step": 30737500 + }, + { + "epoch": 88.97, + "learning_rate": 5.529048663856985e-06, + "loss": 1.8073, + "step": 30738000 + }, + { + "epoch": 88.98, + "learning_rate": 5.528325016209708e-06, + "loss": 1.7941, + "step": 30738500 + }, + { + "epoch": 88.98, + "learning_rate": 5.527602815857726e-06, + "loss": 1.7868, + "step": 30739000 + }, + { + "epoch": 88.98, + "learning_rate": 5.526879168210448e-06, + "loss": 1.783, + "step": 30739500 + }, + { + "epoch": 88.98, + "learning_rate": 5.526155520563172e-06, + "loss": 1.8051, + "step": 30740000 + }, + { + "epoch": 88.98, + "learning_rate": 5.525431872915895e-06, + "loss": 1.7868, + "step": 30740500 + }, + { + "epoch": 88.98, + "learning_rate": 5.524709672563913e-06, + "loss": 1.8062, + "step": 30741000 + }, + { + "epoch": 88.98, + "learning_rate": 5.523986024916636e-06, + "loss": 1.8043, + "step": 30741500 + }, + { + "epoch": 88.99, + "learning_rate": 5.523262377269359e-06, + "loss": 1.8041, + "step": 30742000 + }, + { + "epoch": 88.99, + "learning_rate": 5.5225387296220824e-06, + "loss": 1.7929, + "step": 30742500 + }, + { + "epoch": 88.99, + "learning_rate": 5.5218150819748055e-06, + "loss": 1.8043, + "step": 30743000 + }, + { + "epoch": 88.99, + "learning_rate": 5.521092881622824e-06, + "loss": 1.7979, + "step": 30743500 + }, + { + "epoch": 88.99, + "learning_rate": 5.520369233975547e-06, + "loss": 1.805, + "step": 30744000 + }, + { + "epoch": 88.99, + "learning_rate": 5.519645586328271e-06, + "loss": 1.7892, + "step": 30744500 + }, + { + "epoch": 88.99, + "learning_rate": 5.518921938680993e-06, + "loss": 1.8007, + "step": 30745000 + }, + { + "epoch": 89.0, + "learning_rate": 5.518199738329011e-06, + "loss": 1.8306, + "step": 30745500 + }, + { + "epoch": 89.0, + "learning_rate": 5.517476090681734e-06, + "loss": 1.8245, + "step": 30746000 + }, + { + "epoch": 89.0, + "learning_rate": 5.516752443034458e-06, + "loss": 1.7965, + "step": 30746500 + }, + { + "epoch": 89.0, + "learning_rate": 5.51602879538718e-06, + "loss": 1.776, + "step": 30747000 + }, + { + "epoch": 89.0, + "eval_accuracy": 0.6898743273065717, + "eval_accuracy_mlm": 0.6590290488740586, + "eval_accuracy_nsp": 0.855270334062046, + "eval_loss": 2.2004992961883545, + "eval_runtime": 332.1031, + "eval_samples_per_second": 1314.008, + "eval_steps_per_second": 54.751, + "step": 30747008 + }, + { + "epoch": 89.0, + "learning_rate": 5.515305147739904e-06, + "loss": 1.7704, + "step": 30747500 + }, + { + "epoch": 89.0, + "learning_rate": 5.514582947387921e-06, + "loss": 1.7767, + "step": 30748000 + }, + { + "epoch": 89.0, + "learning_rate": 5.513859299740645e-06, + "loss": 1.8196, + "step": 30748500 + }, + { + "epoch": 89.01, + "learning_rate": 5.5131370993886625e-06, + "loss": 1.7982, + "step": 30749000 + }, + { + "epoch": 89.01, + "learning_rate": 5.5124134517413865e-06, + "loss": 1.7849, + "step": 30749500 + }, + { + "epoch": 89.01, + "learning_rate": 5.511691251389404e-06, + "loss": 1.8098, + "step": 30750000 + }, + { + "epoch": 89.01, + "learning_rate": 5.510967603742127e-06, + "loss": 1.7711, + "step": 30750500 + }, + { + "epoch": 89.01, + "learning_rate": 5.51024395609485e-06, + "loss": 1.8025, + "step": 30751000 + }, + { + "epoch": 89.01, + "learning_rate": 5.509520308447574e-06, + "loss": 1.7797, + "step": 30751500 + }, + { + "epoch": 89.01, + "learning_rate": 5.508796660800297e-06, + "loss": 1.7952, + "step": 30752000 + }, + { + "epoch": 89.02, + "learning_rate": 5.50807301315302e-06, + "loss": 1.8069, + "step": 30752500 + }, + { + "epoch": 89.02, + "learning_rate": 5.507349365505743e-06, + "loss": 1.8088, + "step": 30753000 + }, + { + "epoch": 89.02, + "learning_rate": 5.506625717858466e-06, + "loss": 1.8133, + "step": 30753500 + }, + { + "epoch": 89.02, + "learning_rate": 5.50590207021119e-06, + "loss": 1.7769, + "step": 30754000 + }, + { + "epoch": 89.02, + "learning_rate": 5.505178422563913e-06, + "loss": 1.8163, + "step": 30754500 + }, + { + "epoch": 89.02, + "learning_rate": 5.504454774916636e-06, + "loss": 1.7815, + "step": 30755000 + }, + { + "epoch": 89.02, + "learning_rate": 5.503731127269359e-06, + "loss": 1.7708, + "step": 30755500 + }, + { + "epoch": 89.03, + "learning_rate": 5.503008926917377e-06, + "loss": 1.7887, + "step": 30756000 + }, + { + "epoch": 89.03, + "learning_rate": 5.5022852792701005e-06, + "loss": 1.8025, + "step": 30756500 + }, + { + "epoch": 89.03, + "learning_rate": 5.5015616316228236e-06, + "loss": 1.7958, + "step": 30757000 + }, + { + "epoch": 89.03, + "learning_rate": 5.500837983975547e-06, + "loss": 1.7988, + "step": 30757500 + }, + { + "epoch": 89.03, + "learning_rate": 5.50011433632827e-06, + "loss": 1.7975, + "step": 30758000 + }, + { + "epoch": 89.03, + "learning_rate": 5.499392135976288e-06, + "loss": 1.8, + "step": 30758500 + }, + { + "epoch": 89.03, + "learning_rate": 5.498668488329011e-06, + "loss": 1.7667, + "step": 30759000 + }, + { + "epoch": 89.04, + "learning_rate": 5.497946287977029e-06, + "loss": 1.791, + "step": 30759500 + }, + { + "epoch": 89.04, + "learning_rate": 5.497222640329752e-06, + "loss": 1.7851, + "step": 30760000 + }, + { + "epoch": 89.04, + "learning_rate": 5.496498992682475e-06, + "loss": 1.7869, + "step": 30760500 + }, + { + "epoch": 89.04, + "learning_rate": 5.495775345035198e-06, + "loss": 1.7826, + "step": 30761000 + }, + { + "epoch": 89.04, + "learning_rate": 5.495051697387921e-06, + "loss": 1.8174, + "step": 30761500 + }, + { + "epoch": 89.04, + "learning_rate": 5.494328049740645e-06, + "loss": 1.771, + "step": 30762000 + }, + { + "epoch": 89.04, + "learning_rate": 5.493604402093368e-06, + "loss": 1.7957, + "step": 30762500 + }, + { + "epoch": 89.05, + "learning_rate": 5.492880754446091e-06, + "loss": 1.7851, + "step": 30763000 + }, + { + "epoch": 89.05, + "learning_rate": 5.4921571067988145e-06, + "loss": 1.771, + "step": 30763500 + }, + { + "epoch": 89.05, + "learning_rate": 5.491434906446833e-06, + "loss": 1.8031, + "step": 30764000 + }, + { + "epoch": 89.05, + "learning_rate": 5.490711258799556e-06, + "loss": 1.7789, + "step": 30764500 + }, + { + "epoch": 89.05, + "learning_rate": 5.489989058447574e-06, + "loss": 1.826, + "step": 30765000 + }, + { + "epoch": 89.05, + "learning_rate": 5.489265410800297e-06, + "loss": 1.7838, + "step": 30765500 + }, + { + "epoch": 89.05, + "learning_rate": 5.488543210448314e-06, + "loss": 1.7589, + "step": 30766000 + }, + { + "epoch": 89.06, + "learning_rate": 5.487819562801038e-06, + "loss": 1.7799, + "step": 30766500 + }, + { + "epoch": 89.06, + "learning_rate": 5.487095915153761e-06, + "loss": 1.7825, + "step": 30767000 + }, + { + "epoch": 89.06, + "learning_rate": 5.486372267506484e-06, + "loss": 1.805, + "step": 30767500 + }, + { + "epoch": 89.06, + "learning_rate": 5.485648619859207e-06, + "loss": 1.8091, + "step": 30768000 + }, + { + "epoch": 89.06, + "learning_rate": 5.48492497221193e-06, + "loss": 1.7883, + "step": 30768500 + }, + { + "epoch": 89.06, + "learning_rate": 5.484201324564653e-06, + "loss": 1.7935, + "step": 30769000 + }, + { + "epoch": 89.07, + "learning_rate": 5.483477676917377e-06, + "loss": 1.7914, + "step": 30769500 + }, + { + "epoch": 89.07, + "learning_rate": 5.4827540292701004e-06, + "loss": 1.7982, + "step": 30770000 + }, + { + "epoch": 89.07, + "learning_rate": 5.4820303816228235e-06, + "loss": 1.777, + "step": 30770500 + }, + { + "epoch": 89.07, + "learning_rate": 5.481306733975547e-06, + "loss": 1.7725, + "step": 30771000 + }, + { + "epoch": 89.07, + "learning_rate": 5.48058308632827e-06, + "loss": 1.7986, + "step": 30771500 + }, + { + "epoch": 89.07, + "learning_rate": 5.479859438680994e-06, + "loss": 1.7816, + "step": 30772000 + }, + { + "epoch": 89.07, + "learning_rate": 5.479135791033716e-06, + "loss": 1.7746, + "step": 30772500 + }, + { + "epoch": 89.08, + "learning_rate": 5.478413590681735e-06, + "loss": 1.7961, + "step": 30773000 + }, + { + "epoch": 89.08, + "learning_rate": 5.477689943034457e-06, + "loss": 1.8051, + "step": 30773500 + }, + { + "epoch": 89.08, + "learning_rate": 5.476966295387181e-06, + "loss": 1.8136, + "step": 30774000 + }, + { + "epoch": 89.08, + "learning_rate": 5.476242647739904e-06, + "loss": 1.8127, + "step": 30774500 + }, + { + "epoch": 89.08, + "learning_rate": 5.475520447387922e-06, + "loss": 1.7819, + "step": 30775000 + }, + { + "epoch": 89.08, + "learning_rate": 5.474796799740644e-06, + "loss": 1.7883, + "step": 30775500 + }, + { + "epoch": 89.08, + "learning_rate": 5.474073152093368e-06, + "loss": 1.7946, + "step": 30776000 + }, + { + "epoch": 89.09, + "learning_rate": 5.473349504446091e-06, + "loss": 1.7865, + "step": 30776500 + }, + { + "epoch": 89.09, + "learning_rate": 5.4726258567988144e-06, + "loss": 1.789, + "step": 30777000 + }, + { + "epoch": 89.09, + "learning_rate": 5.4719036564468325e-06, + "loss": 1.8155, + "step": 30777500 + }, + { + "epoch": 89.09, + "learning_rate": 5.471180008799556e-06, + "loss": 1.768, + "step": 30778000 + }, + { + "epoch": 89.09, + "learning_rate": 5.470456361152279e-06, + "loss": 1.8028, + "step": 30778500 + }, + { + "epoch": 89.09, + "learning_rate": 5.469732713505002e-06, + "loss": 1.7778, + "step": 30779000 + }, + { + "epoch": 89.09, + "learning_rate": 5.46901051315302e-06, + "loss": 1.8016, + "step": 30779500 + }, + { + "epoch": 89.1, + "learning_rate": 5.468286865505743e-06, + "loss": 1.7807, + "step": 30780000 + }, + { + "epoch": 89.1, + "learning_rate": 5.467563217858467e-06, + "loss": 1.7774, + "step": 30780500 + }, + { + "epoch": 89.1, + "learning_rate": 5.466839570211189e-06, + "loss": 1.7785, + "step": 30781000 + }, + { + "epoch": 89.1, + "learning_rate": 5.466115922563913e-06, + "loss": 1.7757, + "step": 30781500 + }, + { + "epoch": 89.1, + "learning_rate": 5.465392274916636e-06, + "loss": 1.7665, + "step": 30782000 + }, + { + "epoch": 89.1, + "learning_rate": 5.464668627269359e-06, + "loss": 1.8119, + "step": 30782500 + }, + { + "epoch": 89.1, + "learning_rate": 5.463944979622083e-06, + "loss": 1.7855, + "step": 30783000 + }, + { + "epoch": 89.11, + "learning_rate": 5.463221331974805e-06, + "loss": 1.7648, + "step": 30783500 + }, + { + "epoch": 89.11, + "learning_rate": 5.462497684327529e-06, + "loss": 1.7818, + "step": 30784000 + }, + { + "epoch": 89.11, + "learning_rate": 5.461774036680252e-06, + "loss": 1.7665, + "step": 30784500 + }, + { + "epoch": 89.11, + "learning_rate": 5.4610518363282705e-06, + "loss": 1.795, + "step": 30785000 + }, + { + "epoch": 89.11, + "learning_rate": 5.460328188680993e-06, + "loss": 1.781, + "step": 30785500 + }, + { + "epoch": 89.11, + "learning_rate": 5.459604541033717e-06, + "loss": 1.7861, + "step": 30786000 + }, + { + "epoch": 89.11, + "learning_rate": 5.45888089338644e-06, + "loss": 1.8029, + "step": 30786500 + }, + { + "epoch": 89.12, + "learning_rate": 5.458158693034458e-06, + "loss": 1.8129, + "step": 30787000 + }, + { + "epoch": 89.12, + "learning_rate": 5.45743504538718e-06, + "loss": 1.8179, + "step": 30787500 + }, + { + "epoch": 89.12, + "learning_rate": 5.456711397739904e-06, + "loss": 1.7811, + "step": 30788000 + }, + { + "epoch": 89.12, + "learning_rate": 5.455987750092628e-06, + "loss": 1.7897, + "step": 30788500 + }, + { + "epoch": 89.12, + "learning_rate": 5.45526410244535e-06, + "loss": 1.7958, + "step": 30789000 + }, + { + "epoch": 89.12, + "learning_rate": 5.454540454798074e-06, + "loss": 1.8085, + "step": 30789500 + }, + { + "epoch": 89.12, + "learning_rate": 5.453816807150796e-06, + "loss": 1.786, + "step": 30790000 + }, + { + "epoch": 89.13, + "learning_rate": 5.45309315950352e-06, + "loss": 1.7876, + "step": 30790500 + }, + { + "epoch": 89.13, + "learning_rate": 5.452369511856243e-06, + "loss": 1.7974, + "step": 30791000 + }, + { + "epoch": 89.13, + "learning_rate": 5.451647311504261e-06, + "loss": 1.7876, + "step": 30791500 + }, + { + "epoch": 89.13, + "learning_rate": 5.4509236638569845e-06, + "loss": 1.8097, + "step": 30792000 + }, + { + "epoch": 89.13, + "learning_rate": 5.4502000162097076e-06, + "loss": 1.7785, + "step": 30792500 + }, + { + "epoch": 89.13, + "learning_rate": 5.449476368562431e-06, + "loss": 1.7882, + "step": 30793000 + }, + { + "epoch": 89.13, + "learning_rate": 5.448752720915154e-06, + "loss": 1.7842, + "step": 30793500 + }, + { + "epoch": 89.14, + "learning_rate": 5.448029073267878e-06, + "loss": 1.7723, + "step": 30794000 + }, + { + "epoch": 89.14, + "learning_rate": 5.447306872915895e-06, + "loss": 1.7749, + "step": 30794500 + }, + { + "epoch": 89.14, + "learning_rate": 5.446583225268619e-06, + "loss": 1.7977, + "step": 30795000 + }, + { + "epoch": 89.14, + "learning_rate": 5.445859577621341e-06, + "loss": 1.8002, + "step": 30795500 + }, + { + "epoch": 89.14, + "learning_rate": 5.445135929974065e-06, + "loss": 1.805, + "step": 30796000 + }, + { + "epoch": 89.14, + "learning_rate": 5.444413729622082e-06, + "loss": 1.8035, + "step": 30796500 + }, + { + "epoch": 89.14, + "learning_rate": 5.443690081974806e-06, + "loss": 1.8027, + "step": 30797000 + }, + { + "epoch": 89.15, + "learning_rate": 5.442966434327529e-06, + "loss": 1.8104, + "step": 30797500 + }, + { + "epoch": 89.15, + "learning_rate": 5.442242786680252e-06, + "loss": 1.7945, + "step": 30798000 + }, + { + "epoch": 89.15, + "learning_rate": 5.441519139032975e-06, + "loss": 1.7549, + "step": 30798500 + }, + { + "epoch": 89.15, + "learning_rate": 5.4407954913856985e-06, + "loss": 1.7933, + "step": 30799000 + }, + { + "epoch": 89.15, + "learning_rate": 5.440071843738422e-06, + "loss": 1.7839, + "step": 30799500 + }, + { + "epoch": 89.15, + "learning_rate": 5.4393481960911455e-06, + "loss": 1.7684, + "step": 30800000 + }, + { + "epoch": 89.15, + "learning_rate": 5.4386245484438686e-06, + "loss": 1.7954, + "step": 30800500 + }, + { + "epoch": 89.16, + "learning_rate": 5.437902348091886e-06, + "loss": 1.7817, + "step": 30801000 + }, + { + "epoch": 89.16, + "learning_rate": 5.43717870044461e-06, + "loss": 1.8115, + "step": 30801500 + }, + { + "epoch": 89.16, + "learning_rate": 5.436455052797333e-06, + "loss": 1.7599, + "step": 30802000 + }, + { + "epoch": 89.16, + "learning_rate": 5.435731405150056e-06, + "loss": 1.7912, + "step": 30802500 + }, + { + "epoch": 89.16, + "learning_rate": 5.435007757502779e-06, + "loss": 1.8003, + "step": 30803000 + }, + { + "epoch": 89.16, + "learning_rate": 5.434285557150797e-06, + "loss": 1.7727, + "step": 30803500 + }, + { + "epoch": 89.16, + "learning_rate": 5.43356190950352e-06, + "loss": 1.8002, + "step": 30804000 + }, + { + "epoch": 89.17, + "learning_rate": 5.432838261856243e-06, + "loss": 1.7995, + "step": 30804500 + }, + { + "epoch": 89.17, + "learning_rate": 5.432114614208966e-06, + "loss": 1.7842, + "step": 30805000 + }, + { + "epoch": 89.17, + "learning_rate": 5.431390966561689e-06, + "loss": 1.792, + "step": 30805500 + }, + { + "epoch": 89.17, + "learning_rate": 5.4306687662097075e-06, + "loss": 1.7899, + "step": 30806000 + }, + { + "epoch": 89.17, + "learning_rate": 5.429946565857726e-06, + "loss": 1.8301, + "step": 30806500 + }, + { + "epoch": 89.17, + "learning_rate": 5.429222918210449e-06, + "loss": 1.7838, + "step": 30807000 + }, + { + "epoch": 89.18, + "learning_rate": 5.428499270563172e-06, + "loss": 1.779, + "step": 30807500 + }, + { + "epoch": 89.18, + "learning_rate": 5.427775622915895e-06, + "loss": 1.7797, + "step": 30808000 + }, + { + "epoch": 89.18, + "learning_rate": 5.427051975268618e-06, + "loss": 1.8396, + "step": 30808500 + }, + { + "epoch": 89.18, + "learning_rate": 5.426328327621342e-06, + "loss": 1.7869, + "step": 30809000 + }, + { + "epoch": 89.18, + "learning_rate": 5.425604679974065e-06, + "loss": 1.7888, + "step": 30809500 + }, + { + "epoch": 89.18, + "learning_rate": 5.424881032326788e-06, + "loss": 1.7768, + "step": 30810000 + }, + { + "epoch": 89.18, + "learning_rate": 5.424157384679511e-06, + "loss": 1.7797, + "step": 30810500 + }, + { + "epoch": 89.19, + "learning_rate": 5.423433737032234e-06, + "loss": 1.7856, + "step": 30811000 + }, + { + "epoch": 89.19, + "learning_rate": 5.422711536680252e-06, + "loss": 1.7926, + "step": 30811500 + }, + { + "epoch": 89.19, + "learning_rate": 5.421987889032975e-06, + "loss": 1.7873, + "step": 30812000 + }, + { + "epoch": 89.19, + "learning_rate": 5.4212642413856984e-06, + "loss": 1.824, + "step": 30812500 + }, + { + "epoch": 89.19, + "learning_rate": 5.420540593738422e-06, + "loss": 1.7751, + "step": 30813000 + }, + { + "epoch": 89.19, + "learning_rate": 5.419816946091145e-06, + "loss": 1.773, + "step": 30813500 + }, + { + "epoch": 89.19, + "learning_rate": 5.4190932984438685e-06, + "loss": 1.7494, + "step": 30814000 + }, + { + "epoch": 89.2, + "learning_rate": 5.418369650796592e-06, + "loss": 1.7919, + "step": 30814500 + }, + { + "epoch": 89.2, + "learning_rate": 5.417646003149315e-06, + "loss": 1.7818, + "step": 30815000 + }, + { + "epoch": 89.2, + "learning_rate": 5.416925250092627e-06, + "loss": 1.7911, + "step": 30815500 + }, + { + "epoch": 89.2, + "learning_rate": 5.416201602445351e-06, + "loss": 1.8029, + "step": 30816000 + }, + { + "epoch": 89.2, + "learning_rate": 5.415477954798073e-06, + "loss": 1.797, + "step": 30816500 + }, + { + "epoch": 89.2, + "learning_rate": 5.414754307150797e-06, + "loss": 1.7833, + "step": 30817000 + }, + { + "epoch": 89.2, + "learning_rate": 5.41403065950352e-06, + "loss": 1.7763, + "step": 30817500 + }, + { + "epoch": 89.21, + "learning_rate": 5.413307011856243e-06, + "loss": 1.788, + "step": 30818000 + }, + { + "epoch": 89.21, + "learning_rate": 5.412583364208966e-06, + "loss": 1.7894, + "step": 30818500 + }, + { + "epoch": 89.21, + "learning_rate": 5.411859716561689e-06, + "loss": 1.7776, + "step": 30819000 + }, + { + "epoch": 89.21, + "learning_rate": 5.411136068914413e-06, + "loss": 1.7972, + "step": 30819500 + }, + { + "epoch": 89.21, + "learning_rate": 5.410412421267136e-06, + "loss": 1.8352, + "step": 30820000 + }, + { + "epoch": 89.21, + "learning_rate": 5.4096902209151545e-06, + "loss": 1.806, + "step": 30820500 + }, + { + "epoch": 89.21, + "learning_rate": 5.408966573267877e-06, + "loss": 1.7748, + "step": 30821000 + }, + { + "epoch": 89.22, + "learning_rate": 5.408242925620601e-06, + "loss": 1.7862, + "step": 30821500 + }, + { + "epoch": 89.22, + "learning_rate": 5.407519277973324e-06, + "loss": 1.784, + "step": 30822000 + }, + { + "epoch": 89.22, + "learning_rate": 5.406795630326047e-06, + "loss": 1.798, + "step": 30822500 + }, + { + "epoch": 89.22, + "learning_rate": 5.406073429974065e-06, + "loss": 1.813, + "step": 30823000 + }, + { + "epoch": 89.22, + "learning_rate": 5.405349782326788e-06, + "loss": 1.7736, + "step": 30823500 + }, + { + "epoch": 89.22, + "learning_rate": 5.404626134679511e-06, + "loss": 1.8017, + "step": 30824000 + }, + { + "epoch": 89.22, + "learning_rate": 5.403902487032234e-06, + "loss": 1.7837, + "step": 30824500 + }, + { + "epoch": 89.23, + "learning_rate": 5.403178839384958e-06, + "loss": 1.8063, + "step": 30825000 + }, + { + "epoch": 89.23, + "learning_rate": 5.402456639032975e-06, + "loss": 1.7941, + "step": 30825500 + }, + { + "epoch": 89.23, + "learning_rate": 5.401732991385699e-06, + "loss": 1.8237, + "step": 30826000 + }, + { + "epoch": 89.23, + "learning_rate": 5.4010093437384215e-06, + "loss": 1.7938, + "step": 30826500 + }, + { + "epoch": 89.23, + "learning_rate": 5.400285696091145e-06, + "loss": 1.7677, + "step": 30827000 + }, + { + "epoch": 89.23, + "learning_rate": 5.399562048443868e-06, + "loss": 1.7592, + "step": 30827500 + }, + { + "epoch": 89.23, + "learning_rate": 5.3988398480918866e-06, + "loss": 1.8239, + "step": 30828000 + }, + { + "epoch": 89.24, + "learning_rate": 5.398116200444609e-06, + "loss": 1.8059, + "step": 30828500 + }, + { + "epoch": 89.24, + "learning_rate": 5.397392552797333e-06, + "loss": 1.802, + "step": 30829000 + }, + { + "epoch": 89.24, + "learning_rate": 5.396668905150056e-06, + "loss": 1.8062, + "step": 30829500 + }, + { + "epoch": 89.24, + "learning_rate": 5.395946704798074e-06, + "loss": 1.7811, + "step": 30830000 + }, + { + "epoch": 89.24, + "learning_rate": 5.395223057150796e-06, + "loss": 1.7872, + "step": 30830500 + }, + { + "epoch": 89.24, + "learning_rate": 5.394500856798815e-06, + "loss": 1.789, + "step": 30831000 + }, + { + "epoch": 89.24, + "learning_rate": 5.393777209151537e-06, + "loss": 1.7801, + "step": 30831500 + }, + { + "epoch": 89.25, + "learning_rate": 5.393053561504261e-06, + "loss": 1.7844, + "step": 30832000 + }, + { + "epoch": 89.25, + "learning_rate": 5.392329913856984e-06, + "loss": 1.8089, + "step": 30832500 + }, + { + "epoch": 89.25, + "learning_rate": 5.391606266209707e-06, + "loss": 1.7998, + "step": 30833000 + }, + { + "epoch": 89.25, + "learning_rate": 5.390882618562431e-06, + "loss": 1.7726, + "step": 30833500 + }, + { + "epoch": 89.25, + "learning_rate": 5.3901589709151536e-06, + "loss": 1.8009, + "step": 30834000 + }, + { + "epoch": 89.25, + "learning_rate": 5.3894353232678775e-06, + "loss": 1.7977, + "step": 30834500 + }, + { + "epoch": 89.25, + "learning_rate": 5.3887116756206006e-06, + "loss": 1.7998, + "step": 30835000 + }, + { + "epoch": 89.26, + "learning_rate": 5.387988027973324e-06, + "loss": 1.8005, + "step": 30835500 + }, + { + "epoch": 89.26, + "learning_rate": 5.387264380326048e-06, + "loss": 1.7919, + "step": 30836000 + }, + { + "epoch": 89.26, + "learning_rate": 5.38654073267877e-06, + "loss": 1.7892, + "step": 30836500 + }, + { + "epoch": 89.26, + "learning_rate": 5.385818532326788e-06, + "loss": 1.8, + "step": 30837000 + }, + { + "epoch": 89.26, + "learning_rate": 5.385094884679511e-06, + "loss": 1.8013, + "step": 30837500 + }, + { + "epoch": 89.26, + "learning_rate": 5.384371237032235e-06, + "loss": 1.7858, + "step": 30838000 + }, + { + "epoch": 89.26, + "learning_rate": 5.383647589384957e-06, + "loss": 1.7951, + "step": 30838500 + }, + { + "epoch": 89.27, + "learning_rate": 5.382923941737681e-06, + "loss": 1.7945, + "step": 30839000 + }, + { + "epoch": 89.27, + "learning_rate": 5.382200294090404e-06, + "loss": 1.795, + "step": 30839500 + }, + { + "epoch": 89.27, + "learning_rate": 5.381476646443127e-06, + "loss": 1.7995, + "step": 30840000 + }, + { + "epoch": 89.27, + "learning_rate": 5.380752998795851e-06, + "loss": 1.7789, + "step": 30840500 + }, + { + "epoch": 89.27, + "learning_rate": 5.380030798443868e-06, + "loss": 1.7972, + "step": 30841000 + }, + { + "epoch": 89.27, + "learning_rate": 5.379308598091886e-06, + "loss": 1.7728, + "step": 30841500 + }, + { + "epoch": 89.27, + "learning_rate": 5.37858495044461e-06, + "loss": 1.7895, + "step": 30842000 + }, + { + "epoch": 89.28, + "learning_rate": 5.377861302797333e-06, + "loss": 1.8242, + "step": 30842500 + }, + { + "epoch": 89.28, + "learning_rate": 5.377137655150056e-06, + "loss": 1.7912, + "step": 30843000 + }, + { + "epoch": 89.28, + "learning_rate": 5.37641400750278e-06, + "loss": 1.8175, + "step": 30843500 + }, + { + "epoch": 89.28, + "learning_rate": 5.375690359855502e-06, + "loss": 1.8192, + "step": 30844000 + }, + { + "epoch": 89.28, + "learning_rate": 5.37496815950352e-06, + "loss": 1.7802, + "step": 30844500 + }, + { + "epoch": 89.28, + "learning_rate": 5.374244511856243e-06, + "loss": 1.8148, + "step": 30845000 + }, + { + "epoch": 89.29, + "learning_rate": 5.373522311504261e-06, + "loss": 1.7656, + "step": 30845500 + }, + { + "epoch": 89.29, + "learning_rate": 5.372798663856984e-06, + "loss": 1.8151, + "step": 30846000 + }, + { + "epoch": 89.29, + "learning_rate": 5.372075016209707e-06, + "loss": 1.7621, + "step": 30846500 + }, + { + "epoch": 89.29, + "learning_rate": 5.3713513685624304e-06, + "loss": 1.7947, + "step": 30847000 + }, + { + "epoch": 89.29, + "learning_rate": 5.3706291682104485e-06, + "loss": 1.779, + "step": 30847500 + }, + { + "epoch": 89.29, + "learning_rate": 5.369905520563172e-06, + "loss": 1.7855, + "step": 30848000 + }, + { + "epoch": 89.29, + "learning_rate": 5.3691818729158955e-06, + "loss": 1.8079, + "step": 30848500 + }, + { + "epoch": 89.3, + "learning_rate": 5.368458225268618e-06, + "loss": 1.7875, + "step": 30849000 + }, + { + "epoch": 89.3, + "learning_rate": 5.367734577621342e-06, + "loss": 1.7686, + "step": 30849500 + }, + { + "epoch": 89.3, + "learning_rate": 5.367010929974065e-06, + "loss": 1.8098, + "step": 30850000 + }, + { + "epoch": 89.3, + "learning_rate": 5.366287282326788e-06, + "loss": 1.7724, + "step": 30850500 + }, + { + "epoch": 89.3, + "learning_rate": 5.365563634679511e-06, + "loss": 1.7742, + "step": 30851000 + }, + { + "epoch": 89.3, + "learning_rate": 5.364839987032234e-06, + "loss": 1.8101, + "step": 30851500 + }, + { + "epoch": 89.3, + "learning_rate": 5.364117786680252e-06, + "loss": 1.7968, + "step": 30852000 + }, + { + "epoch": 89.31, + "learning_rate": 5.363394139032975e-06, + "loss": 1.7879, + "step": 30852500 + }, + { + "epoch": 89.31, + "learning_rate": 5.362670491385699e-06, + "loss": 1.7915, + "step": 30853000 + }, + { + "epoch": 89.31, + "learning_rate": 5.361946843738422e-06, + "loss": 1.8097, + "step": 30853500 + }, + { + "epoch": 89.31, + "learning_rate": 5.361223196091145e-06, + "loss": 1.8121, + "step": 30854000 + }, + { + "epoch": 89.31, + "learning_rate": 5.360499548443868e-06, + "loss": 1.8015, + "step": 30854500 + }, + { + "epoch": 89.31, + "learning_rate": 5.3597759007965914e-06, + "loss": 1.7686, + "step": 30855000 + }, + { + "epoch": 89.31, + "learning_rate": 5.3590537004446095e-06, + "loss": 1.7935, + "step": 30855500 + }, + { + "epoch": 89.32, + "learning_rate": 5.358330052797333e-06, + "loss": 1.7767, + "step": 30856000 + }, + { + "epoch": 89.32, + "learning_rate": 5.357606405150056e-06, + "loss": 1.776, + "step": 30856500 + }, + { + "epoch": 89.32, + "learning_rate": 5.356882757502779e-06, + "loss": 1.7798, + "step": 30857000 + }, + { + "epoch": 89.32, + "learning_rate": 5.356159109855502e-06, + "loss": 1.7797, + "step": 30857500 + }, + { + "epoch": 89.32, + "learning_rate": 5.35543690950352e-06, + "loss": 1.7976, + "step": 30858000 + }, + { + "epoch": 89.32, + "learning_rate": 5.354713261856243e-06, + "loss": 1.7788, + "step": 30858500 + }, + { + "epoch": 89.32, + "learning_rate": 5.353989614208967e-06, + "loss": 1.8135, + "step": 30859000 + }, + { + "epoch": 89.33, + "learning_rate": 5.35326596656169e-06, + "loss": 1.7955, + "step": 30859500 + }, + { + "epoch": 89.33, + "learning_rate": 5.352543766209707e-06, + "loss": 1.806, + "step": 30860000 + }, + { + "epoch": 89.33, + "learning_rate": 5.35182011856243e-06, + "loss": 1.7723, + "step": 30860500 + }, + { + "epoch": 89.33, + "learning_rate": 5.351096470915154e-06, + "loss": 1.7835, + "step": 30861000 + }, + { + "epoch": 89.33, + "learning_rate": 5.350372823267877e-06, + "loss": 1.7923, + "step": 30861500 + }, + { + "epoch": 89.33, + "learning_rate": 5.3496491756206005e-06, + "loss": 1.8174, + "step": 30862000 + }, + { + "epoch": 89.33, + "learning_rate": 5.3489269752686186e-06, + "loss": 1.799, + "step": 30862500 + }, + { + "epoch": 89.34, + "learning_rate": 5.348203327621342e-06, + "loss": 1.8064, + "step": 30863000 + }, + { + "epoch": 89.34, + "learning_rate": 5.347479679974065e-06, + "loss": 1.7785, + "step": 30863500 + }, + { + "epoch": 89.34, + "learning_rate": 5.346756032326788e-06, + "loss": 1.7993, + "step": 30864000 + }, + { + "epoch": 89.34, + "learning_rate": 5.346033831974806e-06, + "loss": 1.7823, + "step": 30864500 + }, + { + "epoch": 89.34, + "learning_rate": 5.345310184327529e-06, + "loss": 1.8041, + "step": 30865000 + }, + { + "epoch": 89.34, + "learning_rate": 5.344587983975547e-06, + "loss": 1.808, + "step": 30865500 + }, + { + "epoch": 89.34, + "learning_rate": 5.34386433632827e-06, + "loss": 1.8157, + "step": 30866000 + }, + { + "epoch": 89.35, + "learning_rate": 5.343140688680993e-06, + "loss": 1.8063, + "step": 30866500 + }, + { + "epoch": 89.35, + "learning_rate": 5.342417041033716e-06, + "loss": 1.7825, + "step": 30867000 + }, + { + "epoch": 89.35, + "learning_rate": 5.341693393386439e-06, + "loss": 1.8088, + "step": 30867500 + }, + { + "epoch": 89.35, + "learning_rate": 5.3409697457391625e-06, + "loss": 1.7893, + "step": 30868000 + }, + { + "epoch": 89.35, + "learning_rate": 5.340246098091886e-06, + "loss": 1.783, + "step": 30868500 + }, + { + "epoch": 89.35, + "learning_rate": 5.3395224504446095e-06, + "loss": 1.8143, + "step": 30869000 + }, + { + "epoch": 89.35, + "learning_rate": 5.3387988027973326e-06, + "loss": 1.7874, + "step": 30869500 + }, + { + "epoch": 89.36, + "learning_rate": 5.33807660244535e-06, + "loss": 1.777, + "step": 30870000 + }, + { + "epoch": 89.36, + "learning_rate": 5.337352954798074e-06, + "loss": 1.7977, + "step": 30870500 + }, + { + "epoch": 89.36, + "learning_rate": 5.336629307150797e-06, + "loss": 1.8144, + "step": 30871000 + }, + { + "epoch": 89.36, + "learning_rate": 5.33590565950352e-06, + "loss": 1.7861, + "step": 30871500 + }, + { + "epoch": 89.36, + "learning_rate": 5.335182011856244e-06, + "loss": 1.793, + "step": 30872000 + }, + { + "epoch": 89.36, + "learning_rate": 5.334458364208966e-06, + "loss": 1.8127, + "step": 30872500 + }, + { + "epoch": 89.36, + "learning_rate": 5.333736163856984e-06, + "loss": 1.8187, + "step": 30873000 + }, + { + "epoch": 89.37, + "learning_rate": 5.333012516209707e-06, + "loss": 1.7985, + "step": 30873500 + }, + { + "epoch": 89.37, + "learning_rate": 5.332290315857725e-06, + "loss": 1.7974, + "step": 30874000 + }, + { + "epoch": 89.37, + "learning_rate": 5.3315666682104484e-06, + "loss": 1.7948, + "step": 30874500 + }, + { + "epoch": 89.37, + "learning_rate": 5.3308444678584665e-06, + "loss": 1.7771, + "step": 30875000 + }, + { + "epoch": 89.37, + "learning_rate": 5.33012082021119e-06, + "loss": 1.8022, + "step": 30875500 + }, + { + "epoch": 89.37, + "learning_rate": 5.329397172563913e-06, + "loss": 1.7882, + "step": 30876000 + }, + { + "epoch": 89.37, + "learning_rate": 5.328673524916636e-06, + "loss": 1.7747, + "step": 30876500 + }, + { + "epoch": 89.38, + "learning_rate": 5.32794987726936e-06, + "loss": 1.779, + "step": 30877000 + }, + { + "epoch": 89.38, + "learning_rate": 5.327226229622082e-06, + "loss": 1.8146, + "step": 30877500 + }, + { + "epoch": 89.38, + "learning_rate": 5.326502581974806e-06, + "loss": 1.7813, + "step": 30878000 + }, + { + "epoch": 89.38, + "learning_rate": 5.325778934327529e-06, + "loss": 1.8003, + "step": 30878500 + }, + { + "epoch": 89.38, + "learning_rate": 5.325055286680252e-06, + "loss": 1.7912, + "step": 30879000 + }, + { + "epoch": 89.38, + "learning_rate": 5.324331639032976e-06, + "loss": 1.7693, + "step": 30879500 + }, + { + "epoch": 89.38, + "learning_rate": 5.323607991385698e-06, + "loss": 1.8191, + "step": 30880000 + }, + { + "epoch": 89.39, + "learning_rate": 5.322884343738422e-06, + "loss": 1.8077, + "step": 30880500 + }, + { + "epoch": 89.39, + "learning_rate": 5.322160696091145e-06, + "loss": 1.7945, + "step": 30881000 + }, + { + "epoch": 89.39, + "learning_rate": 5.321437048443868e-06, + "loss": 1.777, + "step": 30881500 + }, + { + "epoch": 89.39, + "learning_rate": 5.3207148480918855e-06, + "loss": 1.8095, + "step": 30882000 + }, + { + "epoch": 89.39, + "learning_rate": 5.3199912004446094e-06, + "loss": 1.8006, + "step": 30882500 + }, + { + "epoch": 89.39, + "learning_rate": 5.3192675527973325e-06, + "loss": 1.8042, + "step": 30883000 + }, + { + "epoch": 89.4, + "learning_rate": 5.318543905150056e-06, + "loss": 1.7722, + "step": 30883500 + }, + { + "epoch": 89.4, + "learning_rate": 5.3178202575027795e-06, + "loss": 1.7624, + "step": 30884000 + }, + { + "epoch": 89.4, + "learning_rate": 5.317098057150797e-06, + "loss": 1.8085, + "step": 30884500 + }, + { + "epoch": 89.4, + "learning_rate": 5.316374409503521e-06, + "loss": 1.7934, + "step": 30885000 + }, + { + "epoch": 89.4, + "learning_rate": 5.315650761856243e-06, + "loss": 1.7951, + "step": 30885500 + }, + { + "epoch": 89.4, + "learning_rate": 5.314927114208967e-06, + "loss": 1.8126, + "step": 30886000 + }, + { + "epoch": 89.4, + "learning_rate": 5.314203466561689e-06, + "loss": 1.768, + "step": 30886500 + }, + { + "epoch": 89.41, + "learning_rate": 5.313479818914413e-06, + "loss": 1.7952, + "step": 30887000 + }, + { + "epoch": 89.41, + "learning_rate": 5.312756171267137e-06, + "loss": 1.7704, + "step": 30887500 + }, + { + "epoch": 89.41, + "learning_rate": 5.312033970915154e-06, + "loss": 1.811, + "step": 30888000 + }, + { + "epoch": 89.41, + "learning_rate": 5.311310323267877e-06, + "loss": 1.7927, + "step": 30888500 + }, + { + "epoch": 89.41, + "learning_rate": 5.3105866756206e-06, + "loss": 1.8056, + "step": 30889000 + }, + { + "epoch": 89.41, + "learning_rate": 5.309864475268618e-06, + "loss": 1.7903, + "step": 30889500 + }, + { + "epoch": 89.41, + "learning_rate": 5.3091408276213415e-06, + "loss": 1.7923, + "step": 30890000 + }, + { + "epoch": 89.42, + "learning_rate": 5.3084171799740655e-06, + "loss": 1.804, + "step": 30890500 + }, + { + "epoch": 89.42, + "learning_rate": 5.307693532326788e-06, + "loss": 1.8157, + "step": 30891000 + }, + { + "epoch": 89.42, + "learning_rate": 5.306969884679512e-06, + "loss": 1.7941, + "step": 30891500 + }, + { + "epoch": 89.42, + "learning_rate": 5.306246237032234e-06, + "loss": 1.7915, + "step": 30892000 + }, + { + "epoch": 89.42, + "learning_rate": 5.305522589384958e-06, + "loss": 1.8038, + "step": 30892500 + }, + { + "epoch": 89.42, + "learning_rate": 5.304798941737681e-06, + "loss": 1.7935, + "step": 30893000 + }, + { + "epoch": 89.42, + "learning_rate": 5.304075294090404e-06, + "loss": 1.7814, + "step": 30893500 + }, + { + "epoch": 89.43, + "learning_rate": 5.303353093738422e-06, + "loss": 1.7947, + "step": 30894000 + }, + { + "epoch": 89.43, + "learning_rate": 5.302629446091145e-06, + "loss": 1.7814, + "step": 30894500 + }, + { + "epoch": 89.43, + "learning_rate": 5.301905798443868e-06, + "loss": 1.8244, + "step": 30895000 + }, + { + "epoch": 89.43, + "learning_rate": 5.301182150796591e-06, + "loss": 1.7883, + "step": 30895500 + }, + { + "epoch": 89.43, + "learning_rate": 5.300458503149315e-06, + "loss": 1.795, + "step": 30896000 + }, + { + "epoch": 89.43, + "learning_rate": 5.299734855502038e-06, + "loss": 1.7829, + "step": 30896500 + }, + { + "epoch": 89.43, + "learning_rate": 5.2990141024453506e-06, + "loss": 1.8124, + "step": 30897000 + }, + { + "epoch": 89.44, + "learning_rate": 5.298290454798074e-06, + "loss": 1.7611, + "step": 30897500 + }, + { + "epoch": 89.44, + "learning_rate": 5.297566807150797e-06, + "loss": 1.8045, + "step": 30898000 + }, + { + "epoch": 89.44, + "learning_rate": 5.29684315950352e-06, + "loss": 1.7979, + "step": 30898500 + }, + { + "epoch": 89.44, + "learning_rate": 5.296119511856244e-06, + "loss": 1.8069, + "step": 30899000 + }, + { + "epoch": 89.44, + "learning_rate": 5.295395864208967e-06, + "loss": 1.8113, + "step": 30899500 + }, + { + "epoch": 89.44, + "learning_rate": 5.29467221656169e-06, + "loss": 1.7716, + "step": 30900000 + }, + { + "epoch": 89.44, + "learning_rate": 5.293950016209707e-06, + "loss": 1.7531, + "step": 30900500 + }, + { + "epoch": 89.45, + "learning_rate": 5.293226368562431e-06, + "loss": 1.7919, + "step": 30901000 + }, + { + "epoch": 89.45, + "learning_rate": 5.292502720915154e-06, + "loss": 1.7903, + "step": 30901500 + }, + { + "epoch": 89.45, + "learning_rate": 5.291779073267877e-06, + "loss": 1.8032, + "step": 30902000 + }, + { + "epoch": 89.45, + "learning_rate": 5.2910554256206e-06, + "loss": 1.7656, + "step": 30902500 + }, + { + "epoch": 89.45, + "learning_rate": 5.290331777973323e-06, + "loss": 1.7889, + "step": 30903000 + }, + { + "epoch": 89.45, + "learning_rate": 5.289608130326047e-06, + "loss": 1.7842, + "step": 30903500 + }, + { + "epoch": 89.45, + "learning_rate": 5.28888448267877e-06, + "loss": 1.8239, + "step": 30904000 + }, + { + "epoch": 89.46, + "learning_rate": 5.2881608350314935e-06, + "loss": 1.8013, + "step": 30904500 + }, + { + "epoch": 89.46, + "learning_rate": 5.287438634679511e-06, + "loss": 1.7905, + "step": 30905000 + }, + { + "epoch": 89.46, + "learning_rate": 5.286716434327529e-06, + "loss": 1.8192, + "step": 30905500 + }, + { + "epoch": 89.46, + "learning_rate": 5.285992786680252e-06, + "loss": 1.8042, + "step": 30906000 + }, + { + "epoch": 89.46, + "learning_rate": 5.285269139032976e-06, + "loss": 1.7833, + "step": 30906500 + }, + { + "epoch": 89.46, + "learning_rate": 5.284545491385699e-06, + "loss": 1.7767, + "step": 30907000 + }, + { + "epoch": 89.46, + "learning_rate": 5.283821843738422e-06, + "loss": 1.798, + "step": 30907500 + }, + { + "epoch": 89.47, + "learning_rate": 5.283098196091145e-06, + "loss": 1.7874, + "step": 30908000 + }, + { + "epoch": 89.47, + "learning_rate": 5.282374548443868e-06, + "loss": 1.7823, + "step": 30908500 + }, + { + "epoch": 89.47, + "learning_rate": 5.281652348091886e-06, + "loss": 1.794, + "step": 30909000 + }, + { + "epoch": 89.47, + "learning_rate": 5.280928700444609e-06, + "loss": 1.7808, + "step": 30909500 + }, + { + "epoch": 89.47, + "learning_rate": 5.280205052797332e-06, + "loss": 1.7993, + "step": 30910000 + }, + { + "epoch": 89.47, + "learning_rate": 5.2794814051500555e-06, + "loss": 1.7874, + "step": 30910500 + }, + { + "epoch": 89.47, + "learning_rate": 5.2787577575027794e-06, + "loss": 1.773, + "step": 30911000 + }, + { + "epoch": 89.48, + "learning_rate": 5.2780341098555025e-06, + "loss": 1.8006, + "step": 30911500 + }, + { + "epoch": 89.48, + "learning_rate": 5.277310462208226e-06, + "loss": 1.7746, + "step": 30912000 + }, + { + "epoch": 89.48, + "learning_rate": 5.276586814560949e-06, + "loss": 1.8218, + "step": 30912500 + }, + { + "epoch": 89.48, + "learning_rate": 5.275864614208967e-06, + "loss": 1.7972, + "step": 30913000 + }, + { + "epoch": 89.48, + "learning_rate": 5.27514096656169e-06, + "loss": 1.7798, + "step": 30913500 + }, + { + "epoch": 89.48, + "learning_rate": 5.274418766209707e-06, + "loss": 1.7952, + "step": 30914000 + }, + { + "epoch": 89.48, + "learning_rate": 5.273695118562431e-06, + "loss": 1.823, + "step": 30914500 + }, + { + "epoch": 89.49, + "learning_rate": 5.272971470915154e-06, + "loss": 1.7852, + "step": 30915000 + }, + { + "epoch": 89.49, + "learning_rate": 5.272247823267877e-06, + "loss": 1.7957, + "step": 30915500 + }, + { + "epoch": 89.49, + "learning_rate": 5.2715241756206e-06, + "loss": 1.7705, + "step": 30916000 + }, + { + "epoch": 89.49, + "learning_rate": 5.270800527973323e-06, + "loss": 1.819, + "step": 30916500 + }, + { + "epoch": 89.49, + "learning_rate": 5.270076880326047e-06, + "loss": 1.7904, + "step": 30917000 + }, + { + "epoch": 89.49, + "learning_rate": 5.26935323267877e-06, + "loss": 1.7753, + "step": 30917500 + }, + { + "epoch": 89.49, + "learning_rate": 5.2686295850314934e-06, + "loss": 1.8049, + "step": 30918000 + }, + { + "epoch": 89.5, + "learning_rate": 5.267907384679511e-06, + "loss": 1.8046, + "step": 30918500 + }, + { + "epoch": 89.5, + "learning_rate": 5.267183737032235e-06, + "loss": 1.7791, + "step": 30919000 + }, + { + "epoch": 89.5, + "learning_rate": 5.266460089384958e-06, + "loss": 1.7844, + "step": 30919500 + }, + { + "epoch": 89.5, + "learning_rate": 5.265736441737681e-06, + "loss": 1.7581, + "step": 30920000 + }, + { + "epoch": 89.5, + "learning_rate": 5.265012794090404e-06, + "loss": 1.7858, + "step": 30920500 + }, + { + "epoch": 89.5, + "learning_rate": 5.264289146443127e-06, + "loss": 1.7983, + "step": 30921000 + }, + { + "epoch": 89.51, + "learning_rate": 5.263565498795851e-06, + "loss": 1.7856, + "step": 30921500 + }, + { + "epoch": 89.51, + "learning_rate": 5.262843298443868e-06, + "loss": 1.8084, + "step": 30922000 + }, + { + "epoch": 89.51, + "learning_rate": 5.262119650796592e-06, + "loss": 1.8065, + "step": 30922500 + }, + { + "epoch": 89.51, + "learning_rate": 5.261396003149314e-06, + "loss": 1.7954, + "step": 30923000 + }, + { + "epoch": 89.51, + "learning_rate": 5.260672355502038e-06, + "loss": 1.7681, + "step": 30923500 + }, + { + "epoch": 89.51, + "learning_rate": 5.2599501551500554e-06, + "loss": 1.816, + "step": 30924000 + }, + { + "epoch": 89.51, + "learning_rate": 5.2592279547980735e-06, + "loss": 1.7926, + "step": 30924500 + }, + { + "epoch": 89.52, + "learning_rate": 5.258504307150797e-06, + "loss": 1.7981, + "step": 30925000 + }, + { + "epoch": 89.52, + "learning_rate": 5.2577806595035206e-06, + "loss": 1.7848, + "step": 30925500 + }, + { + "epoch": 89.52, + "learning_rate": 5.257057011856243e-06, + "loss": 1.7838, + "step": 30926000 + }, + { + "epoch": 89.52, + "learning_rate": 5.256333364208967e-06, + "loss": 1.7952, + "step": 30926500 + }, + { + "epoch": 89.52, + "learning_rate": 5.255611163856984e-06, + "loss": 1.7956, + "step": 30927000 + }, + { + "epoch": 89.52, + "learning_rate": 5.254887516209708e-06, + "loss": 1.8011, + "step": 30927500 + }, + { + "epoch": 89.52, + "learning_rate": 5.254165315857725e-06, + "loss": 1.806, + "step": 30928000 + }, + { + "epoch": 89.53, + "learning_rate": 5.253441668210449e-06, + "loss": 1.7756, + "step": 30928500 + }, + { + "epoch": 89.53, + "learning_rate": 5.252718020563171e-06, + "loss": 1.7642, + "step": 30929000 + }, + { + "epoch": 89.53, + "learning_rate": 5.251994372915895e-06, + "loss": 1.7903, + "step": 30929500 + }, + { + "epoch": 89.53, + "learning_rate": 5.251270725268618e-06, + "loss": 1.8139, + "step": 30930000 + }, + { + "epoch": 89.53, + "learning_rate": 5.250547077621341e-06, + "loss": 1.7884, + "step": 30930500 + }, + { + "epoch": 89.53, + "learning_rate": 5.249823429974065e-06, + "loss": 1.8002, + "step": 30931000 + }, + { + "epoch": 89.53, + "learning_rate": 5.2490997823267876e-06, + "loss": 1.7765, + "step": 30931500 + }, + { + "epoch": 89.54, + "learning_rate": 5.2483761346795115e-06, + "loss": 1.796, + "step": 30932000 + }, + { + "epoch": 89.54, + "learning_rate": 5.247653934327529e-06, + "loss": 1.7761, + "step": 30932500 + }, + { + "epoch": 89.54, + "learning_rate": 5.246930286680253e-06, + "loss": 1.7893, + "step": 30933000 + }, + { + "epoch": 89.54, + "learning_rate": 5.246206639032975e-06, + "loss": 1.7634, + "step": 30933500 + }, + { + "epoch": 89.54, + "learning_rate": 5.245482991385699e-06, + "loss": 1.8213, + "step": 30934000 + }, + { + "epoch": 89.54, + "learning_rate": 5.244759343738422e-06, + "loss": 1.7931, + "step": 30934500 + }, + { + "epoch": 89.54, + "learning_rate": 5.244035696091145e-06, + "loss": 1.7975, + "step": 30935000 + }, + { + "epoch": 89.55, + "learning_rate": 5.243312048443869e-06, + "loss": 1.7835, + "step": 30935500 + }, + { + "epoch": 89.55, + "learning_rate": 5.242588400796591e-06, + "loss": 1.7915, + "step": 30936000 + }, + { + "epoch": 89.55, + "learning_rate": 5.24186620044461e-06, + "loss": 1.7902, + "step": 30936500 + }, + { + "epoch": 89.55, + "learning_rate": 5.241142552797332e-06, + "loss": 1.7869, + "step": 30937000 + }, + { + "epoch": 89.55, + "learning_rate": 5.240418905150056e-06, + "loss": 1.7798, + "step": 30937500 + }, + { + "epoch": 89.55, + "learning_rate": 5.2396952575027785e-06, + "loss": 1.7993, + "step": 30938000 + }, + { + "epoch": 89.55, + "learning_rate": 5.238971609855502e-06, + "loss": 1.82, + "step": 30938500 + }, + { + "epoch": 89.56, + "learning_rate": 5.23824940950352e-06, + "loss": 1.7943, + "step": 30939000 + }, + { + "epoch": 89.56, + "learning_rate": 5.237525761856244e-06, + "loss": 1.7971, + "step": 30939500 + }, + { + "epoch": 89.56, + "learning_rate": 5.236802114208967e-06, + "loss": 1.8102, + "step": 30940000 + }, + { + "epoch": 89.56, + "learning_rate": 5.23607846656169e-06, + "loss": 1.8095, + "step": 30940500 + }, + { + "epoch": 89.56, + "learning_rate": 5.235354818914414e-06, + "loss": 1.793, + "step": 30941000 + }, + { + "epoch": 89.56, + "learning_rate": 5.234631171267136e-06, + "loss": 1.7859, + "step": 30941500 + }, + { + "epoch": 89.56, + "learning_rate": 5.233908970915154e-06, + "loss": 1.8066, + "step": 30942000 + }, + { + "epoch": 89.57, + "learning_rate": 5.233186770563172e-06, + "loss": 1.7943, + "step": 30942500 + }, + { + "epoch": 89.57, + "learning_rate": 5.232463122915895e-06, + "loss": 1.7752, + "step": 30943000 + }, + { + "epoch": 89.57, + "learning_rate": 5.231739475268618e-06, + "loss": 1.7916, + "step": 30943500 + }, + { + "epoch": 89.57, + "learning_rate": 5.231015827621342e-06, + "loss": 1.8122, + "step": 30944000 + }, + { + "epoch": 89.57, + "learning_rate": 5.230292179974064e-06, + "loss": 1.8139, + "step": 30944500 + }, + { + "epoch": 89.57, + "learning_rate": 5.229568532326788e-06, + "loss": 1.7927, + "step": 30945000 + }, + { + "epoch": 89.57, + "learning_rate": 5.228846331974806e-06, + "loss": 1.8077, + "step": 30945500 + }, + { + "epoch": 89.58, + "learning_rate": 5.2281226843275295e-06, + "loss": 1.7993, + "step": 30946000 + }, + { + "epoch": 89.58, + "learning_rate": 5.227399036680252e-06, + "loss": 1.7814, + "step": 30946500 + }, + { + "epoch": 89.58, + "learning_rate": 5.226675389032976e-06, + "loss": 1.7848, + "step": 30947000 + }, + { + "epoch": 89.58, + "learning_rate": 5.225951741385699e-06, + "loss": 1.7803, + "step": 30947500 + }, + { + "epoch": 89.58, + "learning_rate": 5.225228093738422e-06, + "loss": 1.8016, + "step": 30948000 + }, + { + "epoch": 89.58, + "learning_rate": 5.224504446091145e-06, + "loss": 1.7929, + "step": 30948500 + }, + { + "epoch": 89.58, + "learning_rate": 5.223780798443868e-06, + "loss": 1.7591, + "step": 30949000 + }, + { + "epoch": 89.59, + "learning_rate": 5.223057150796592e-06, + "loss": 1.7635, + "step": 30949500 + }, + { + "epoch": 89.59, + "learning_rate": 5.222334950444609e-06, + "loss": 1.8051, + "step": 30950000 + }, + { + "epoch": 89.59, + "learning_rate": 5.221611302797333e-06, + "loss": 1.7866, + "step": 30950500 + }, + { + "epoch": 89.59, + "learning_rate": 5.220887655150055e-06, + "loss": 1.7867, + "step": 30951000 + }, + { + "epoch": 89.59, + "learning_rate": 5.220164007502779e-06, + "loss": 1.7896, + "step": 30951500 + }, + { + "epoch": 89.59, + "learning_rate": 5.2194418071507965e-06, + "loss": 1.7819, + "step": 30952000 + }, + { + "epoch": 89.59, + "learning_rate": 5.2187181595035204e-06, + "loss": 1.7739, + "step": 30952500 + }, + { + "epoch": 89.6, + "learning_rate": 5.2179945118562435e-06, + "loss": 1.799, + "step": 30953000 + }, + { + "epoch": 89.6, + "learning_rate": 5.217270864208967e-06, + "loss": 1.7997, + "step": 30953500 + }, + { + "epoch": 89.6, + "learning_rate": 5.216548663856984e-06, + "loss": 1.7749, + "step": 30954000 + }, + { + "epoch": 89.6, + "learning_rate": 5.215825016209708e-06, + "loss": 1.7898, + "step": 30954500 + }, + { + "epoch": 89.6, + "learning_rate": 5.215101368562431e-06, + "loss": 1.7885, + "step": 30955000 + }, + { + "epoch": 89.6, + "learning_rate": 5.214377720915154e-06, + "loss": 1.8157, + "step": 30955500 + }, + { + "epoch": 89.6, + "learning_rate": 5.213654073267877e-06, + "loss": 1.7921, + "step": 30956000 + }, + { + "epoch": 89.61, + "learning_rate": 5.2129304256206e-06, + "loss": 1.7882, + "step": 30956500 + }, + { + "epoch": 89.61, + "learning_rate": 5.212206777973324e-06, + "loss": 1.7968, + "step": 30957000 + }, + { + "epoch": 89.61, + "learning_rate": 5.211483130326047e-06, + "loss": 1.7702, + "step": 30957500 + }, + { + "epoch": 89.61, + "learning_rate": 5.210760929974065e-06, + "loss": 1.8034, + "step": 30958000 + }, + { + "epoch": 89.61, + "learning_rate": 5.2100387296220825e-06, + "loss": 1.8123, + "step": 30958500 + }, + { + "epoch": 89.61, + "learning_rate": 5.2093150819748055e-06, + "loss": 1.7914, + "step": 30959000 + }, + { + "epoch": 89.62, + "learning_rate": 5.208591434327529e-06, + "loss": 1.7955, + "step": 30959500 + }, + { + "epoch": 89.62, + "learning_rate": 5.2078677866802526e-06, + "loss": 1.8086, + "step": 30960000 + }, + { + "epoch": 89.62, + "learning_rate": 5.207144139032976e-06, + "loss": 1.7875, + "step": 30960500 + }, + { + "epoch": 89.62, + "learning_rate": 5.206421938680993e-06, + "loss": 1.7878, + "step": 30961000 + }, + { + "epoch": 89.62, + "learning_rate": 5.205698291033717e-06, + "loss": 1.8229, + "step": 30961500 + }, + { + "epoch": 89.62, + "learning_rate": 5.20497464338644e-06, + "loss": 1.8213, + "step": 30962000 + }, + { + "epoch": 89.62, + "learning_rate": 5.204250995739163e-06, + "loss": 1.7744, + "step": 30962500 + }, + { + "epoch": 89.63, + "learning_rate": 5.203528795387181e-06, + "loss": 1.7995, + "step": 30963000 + }, + { + "epoch": 89.63, + "learning_rate": 5.202805147739904e-06, + "loss": 1.8202, + "step": 30963500 + }, + { + "epoch": 89.63, + "learning_rate": 5.202081500092627e-06, + "loss": 1.8075, + "step": 30964000 + }, + { + "epoch": 89.63, + "learning_rate": 5.20135785244535e-06, + "loss": 1.7971, + "step": 30964500 + }, + { + "epoch": 89.63, + "learning_rate": 5.200635652093368e-06, + "loss": 1.8086, + "step": 30965000 + }, + { + "epoch": 89.63, + "learning_rate": 5.1999120044460915e-06, + "loss": 1.7913, + "step": 30965500 + }, + { + "epoch": 89.63, + "learning_rate": 5.1991883567988146e-06, + "loss": 1.8049, + "step": 30966000 + }, + { + "epoch": 89.64, + "learning_rate": 5.198464709151538e-06, + "loss": 1.8083, + "step": 30966500 + }, + { + "epoch": 89.64, + "learning_rate": 5.197741061504261e-06, + "loss": 1.8193, + "step": 30967000 + }, + { + "epoch": 89.64, + "learning_rate": 5.197017413856985e-06, + "loss": 1.8019, + "step": 30967500 + }, + { + "epoch": 89.64, + "learning_rate": 5.196293766209708e-06, + "loss": 1.771, + "step": 30968000 + }, + { + "epoch": 89.64, + "learning_rate": 5.195570118562431e-06, + "loss": 1.777, + "step": 30968500 + }, + { + "epoch": 89.64, + "learning_rate": 5.194847918210449e-06, + "loss": 1.7998, + "step": 30969000 + }, + { + "epoch": 89.64, + "learning_rate": 5.194124270563172e-06, + "loss": 1.8034, + "step": 30969500 + }, + { + "epoch": 89.65, + "learning_rate": 5.193402070211189e-06, + "loss": 1.7851, + "step": 30970000 + }, + { + "epoch": 89.65, + "learning_rate": 5.192678422563913e-06, + "loss": 1.7876, + "step": 30970500 + }, + { + "epoch": 89.65, + "learning_rate": 5.191954774916636e-06, + "loss": 1.8089, + "step": 30971000 + }, + { + "epoch": 89.65, + "learning_rate": 5.191231127269359e-06, + "loss": 1.7942, + "step": 30971500 + }, + { + "epoch": 89.65, + "learning_rate": 5.190507479622082e-06, + "loss": 1.8281, + "step": 30972000 + }, + { + "epoch": 89.65, + "learning_rate": 5.1897838319748055e-06, + "loss": 1.8098, + "step": 30972500 + }, + { + "epoch": 89.65, + "learning_rate": 5.189061631622824e-06, + "loss": 1.8161, + "step": 30973000 + }, + { + "epoch": 89.66, + "learning_rate": 5.188337983975547e-06, + "loss": 1.8081, + "step": 30973500 + }, + { + "epoch": 89.66, + "learning_rate": 5.18761433632827e-06, + "loss": 1.78, + "step": 30974000 + }, + { + "epoch": 89.66, + "learning_rate": 5.186893583271582e-06, + "loss": 1.8002, + "step": 30974500 + }, + { + "epoch": 89.66, + "learning_rate": 5.186169935624306e-06, + "loss": 1.7664, + "step": 30975000 + }, + { + "epoch": 89.66, + "learning_rate": 5.185446287977029e-06, + "loss": 1.8404, + "step": 30975500 + }, + { + "epoch": 89.66, + "learning_rate": 5.184722640329752e-06, + "loss": 1.8375, + "step": 30976000 + }, + { + "epoch": 89.66, + "learning_rate": 5.183998992682475e-06, + "loss": 1.7808, + "step": 30976500 + }, + { + "epoch": 89.67, + "learning_rate": 5.183275345035198e-06, + "loss": 1.805, + "step": 30977000 + }, + { + "epoch": 89.67, + "learning_rate": 5.182551697387922e-06, + "loss": 1.8033, + "step": 30977500 + }, + { + "epoch": 89.67, + "learning_rate": 5.1818280497406444e-06, + "loss": 1.7912, + "step": 30978000 + }, + { + "epoch": 89.67, + "learning_rate": 5.181104402093368e-06, + "loss": 1.7901, + "step": 30978500 + }, + { + "epoch": 89.67, + "learning_rate": 5.180382201741386e-06, + "loss": 1.8059, + "step": 30979000 + }, + { + "epoch": 89.67, + "learning_rate": 5.1796585540941095e-06, + "loss": 1.7782, + "step": 30979500 + }, + { + "epoch": 89.67, + "learning_rate": 5.178934906446833e-06, + "loss": 1.7981, + "step": 30980000 + }, + { + "epoch": 89.68, + "learning_rate": 5.178211258799556e-06, + "loss": 1.7891, + "step": 30980500 + }, + { + "epoch": 89.68, + "learning_rate": 5.177487611152279e-06, + "loss": 1.7972, + "step": 30981000 + }, + { + "epoch": 89.68, + "learning_rate": 5.176763963505002e-06, + "loss": 1.7873, + "step": 30981500 + }, + { + "epoch": 89.68, + "learning_rate": 5.176040315857726e-06, + "loss": 1.803, + "step": 30982000 + }, + { + "epoch": 89.68, + "learning_rate": 5.175316668210448e-06, + "loss": 1.7999, + "step": 30982500 + }, + { + "epoch": 89.68, + "learning_rate": 5.174593020563172e-06, + "loss": 1.7938, + "step": 30983000 + }, + { + "epoch": 89.68, + "learning_rate": 5.173869372915895e-06, + "loss": 1.7776, + "step": 30983500 + }, + { + "epoch": 89.69, + "learning_rate": 5.173145725268618e-06, + "loss": 1.7962, + "step": 30984000 + }, + { + "epoch": 89.69, + "learning_rate": 5.172422077621342e-06, + "loss": 1.7922, + "step": 30984500 + }, + { + "epoch": 89.69, + "learning_rate": 5.171698429974064e-06, + "loss": 1.7883, + "step": 30985000 + }, + { + "epoch": 89.69, + "learning_rate": 5.170974782326788e-06, + "loss": 1.7984, + "step": 30985500 + }, + { + "epoch": 89.69, + "learning_rate": 5.1702525819748054e-06, + "loss": 1.8063, + "step": 30986000 + }, + { + "epoch": 89.69, + "learning_rate": 5.169528934327529e-06, + "loss": 1.8084, + "step": 30986500 + }, + { + "epoch": 89.69, + "learning_rate": 5.168806733975547e-06, + "loss": 1.8123, + "step": 30987000 + }, + { + "epoch": 89.7, + "learning_rate": 5.1680830863282705e-06, + "loss": 1.7992, + "step": 30987500 + }, + { + "epoch": 89.7, + "learning_rate": 5.167360885976288e-06, + "loss": 1.7767, + "step": 30988000 + }, + { + "epoch": 89.7, + "learning_rate": 5.166637238329011e-06, + "loss": 1.818, + "step": 30988500 + }, + { + "epoch": 89.7, + "learning_rate": 5.165913590681734e-06, + "loss": 1.8021, + "step": 30989000 + }, + { + "epoch": 89.7, + "learning_rate": 5.165189943034458e-06, + "loss": 1.7757, + "step": 30989500 + }, + { + "epoch": 89.7, + "learning_rate": 5.16446629538718e-06, + "loss": 1.8012, + "step": 30990000 + }, + { + "epoch": 89.7, + "learning_rate": 5.163742647739904e-06, + "loss": 1.765, + "step": 30990500 + }, + { + "epoch": 89.71, + "learning_rate": 5.163019000092627e-06, + "loss": 1.8126, + "step": 30991000 + }, + { + "epoch": 89.71, + "learning_rate": 5.16229535244535e-06, + "loss": 1.7737, + "step": 30991500 + }, + { + "epoch": 89.71, + "learning_rate": 5.161571704798074e-06, + "loss": 1.7965, + "step": 30992000 + }, + { + "epoch": 89.71, + "learning_rate": 5.160849504446091e-06, + "loss": 1.7666, + "step": 30992500 + }, + { + "epoch": 89.71, + "learning_rate": 5.160125856798815e-06, + "loss": 1.7811, + "step": 30993000 + }, + { + "epoch": 89.71, + "learning_rate": 5.1594022091515375e-06, + "loss": 1.7611, + "step": 30993500 + }, + { + "epoch": 89.71, + "learning_rate": 5.1586785615042615e-06, + "loss": 1.8108, + "step": 30994000 + }, + { + "epoch": 89.72, + "learning_rate": 5.157954913856984e-06, + "loss": 1.8089, + "step": 30994500 + }, + { + "epoch": 89.72, + "learning_rate": 5.157231266209708e-06, + "loss": 1.7982, + "step": 30995000 + }, + { + "epoch": 89.72, + "learning_rate": 5.156507618562431e-06, + "loss": 1.7982, + "step": 30995500 + }, + { + "epoch": 89.72, + "learning_rate": 5.155785418210449e-06, + "loss": 1.7935, + "step": 30996000 + }, + { + "epoch": 89.72, + "learning_rate": 5.155061770563172e-06, + "loss": 1.7853, + "step": 30996500 + }, + { + "epoch": 89.72, + "learning_rate": 5.154338122915895e-06, + "loss": 1.7923, + "step": 30997000 + }, + { + "epoch": 89.73, + "learning_rate": 5.153615922563912e-06, + "loss": 1.8013, + "step": 30997500 + }, + { + "epoch": 89.73, + "learning_rate": 5.152892274916636e-06, + "loss": 1.7685, + "step": 30998000 + }, + { + "epoch": 89.73, + "learning_rate": 5.152168627269359e-06, + "loss": 1.8018, + "step": 30998500 + }, + { + "epoch": 89.73, + "learning_rate": 5.151444979622082e-06, + "loss": 1.8154, + "step": 30999000 + }, + { + "epoch": 89.73, + "learning_rate": 5.150721331974806e-06, + "loss": 1.7818, + "step": 30999500 + }, + { + "epoch": 89.73, + "learning_rate": 5.1499976843275285e-06, + "loss": 1.7994, + "step": 31000000 + }, + { + "epoch": 89.73, + "learning_rate": 5.149274036680252e-06, + "loss": 1.7675, + "step": 31000500 + }, + { + "epoch": 89.74, + "learning_rate": 5.1485503890329755e-06, + "loss": 1.8077, + "step": 31001000 + }, + { + "epoch": 89.74, + "learning_rate": 5.1478267413856986e-06, + "loss": 1.7768, + "step": 31001500 + }, + { + "epoch": 89.74, + "learning_rate": 5.1471030937384225e-06, + "loss": 1.7881, + "step": 31002000 + }, + { + "epoch": 89.74, + "learning_rate": 5.146379446091145e-06, + "loss": 1.7947, + "step": 31002500 + }, + { + "epoch": 89.74, + "learning_rate": 5.145655798443869e-06, + "loss": 1.7803, + "step": 31003000 + }, + { + "epoch": 89.74, + "learning_rate": 5.144932150796592e-06, + "loss": 1.7442, + "step": 31003500 + }, + { + "epoch": 89.74, + "learning_rate": 5.14420995044461e-06, + "loss": 1.7713, + "step": 31004000 + }, + { + "epoch": 89.75, + "learning_rate": 5.143486302797333e-06, + "loss": 1.7784, + "step": 31004500 + }, + { + "epoch": 89.75, + "learning_rate": 5.142762655150056e-06, + "loss": 1.7992, + "step": 31005000 + }, + { + "epoch": 89.75, + "learning_rate": 5.142039007502779e-06, + "loss": 1.7866, + "step": 31005500 + }, + { + "epoch": 89.75, + "learning_rate": 5.141315359855502e-06, + "loss": 1.7928, + "step": 31006000 + }, + { + "epoch": 89.75, + "learning_rate": 5.14059315950352e-06, + "loss": 1.7959, + "step": 31006500 + }, + { + "epoch": 89.75, + "learning_rate": 5.139869511856243e-06, + "loss": 1.7867, + "step": 31007000 + }, + { + "epoch": 89.75, + "learning_rate": 5.139145864208966e-06, + "loss": 1.7719, + "step": 31007500 + }, + { + "epoch": 89.76, + "learning_rate": 5.1384222165616895e-06, + "loss": 1.79, + "step": 31008000 + }, + { + "epoch": 89.76, + "learning_rate": 5.137698568914413e-06, + "loss": 1.8012, + "step": 31008500 + }, + { + "epoch": 89.76, + "learning_rate": 5.136976368562431e-06, + "loss": 1.8, + "step": 31009000 + }, + { + "epoch": 89.76, + "learning_rate": 5.136252720915154e-06, + "loss": 1.8131, + "step": 31009500 + }, + { + "epoch": 89.76, + "learning_rate": 5.135529073267877e-06, + "loss": 1.7746, + "step": 31010000 + }, + { + "epoch": 89.76, + "learning_rate": 5.134806872915895e-06, + "loss": 1.8007, + "step": 31010500 + }, + { + "epoch": 89.76, + "learning_rate": 5.134083225268618e-06, + "loss": 1.7869, + "step": 31011000 + }, + { + "epoch": 89.77, + "learning_rate": 5.133359577621342e-06, + "loss": 1.7984, + "step": 31011500 + }, + { + "epoch": 89.77, + "learning_rate": 5.132635929974065e-06, + "loss": 1.8042, + "step": 31012000 + }, + { + "epoch": 89.77, + "learning_rate": 5.131913729622082e-06, + "loss": 1.7885, + "step": 31012500 + }, + { + "epoch": 89.77, + "learning_rate": 5.131190081974805e-06, + "loss": 1.7894, + "step": 31013000 + }, + { + "epoch": 89.77, + "learning_rate": 5.130466434327529e-06, + "loss": 1.8091, + "step": 31013500 + }, + { + "epoch": 89.77, + "learning_rate": 5.129742786680252e-06, + "loss": 1.7733, + "step": 31014000 + }, + { + "epoch": 89.77, + "learning_rate": 5.1290191390329754e-06, + "loss": 1.8082, + "step": 31014500 + }, + { + "epoch": 89.78, + "learning_rate": 5.1282954913856985e-06, + "loss": 1.7927, + "step": 31015000 + }, + { + "epoch": 89.78, + "learning_rate": 5.127571843738422e-06, + "loss": 1.7983, + "step": 31015500 + }, + { + "epoch": 89.78, + "learning_rate": 5.12684964338644e-06, + "loss": 1.7992, + "step": 31016000 + }, + { + "epoch": 89.78, + "learning_rate": 5.126125995739163e-06, + "loss": 1.7725, + "step": 31016500 + }, + { + "epoch": 89.78, + "learning_rate": 5.125402348091886e-06, + "loss": 1.7999, + "step": 31017000 + }, + { + "epoch": 89.78, + "learning_rate": 5.12467870044461e-06, + "loss": 1.8036, + "step": 31017500 + }, + { + "epoch": 89.78, + "learning_rate": 5.123955052797333e-06, + "loss": 1.8026, + "step": 31018000 + }, + { + "epoch": 89.79, + "learning_rate": 5.123231405150056e-06, + "loss": 1.8066, + "step": 31018500 + }, + { + "epoch": 89.79, + "learning_rate": 5.122507757502779e-06, + "loss": 1.7892, + "step": 31019000 + }, + { + "epoch": 89.79, + "learning_rate": 5.121784109855502e-06, + "loss": 1.8035, + "step": 31019500 + }, + { + "epoch": 89.79, + "learning_rate": 5.121060462208226e-06, + "loss": 1.7748, + "step": 31020000 + }, + { + "epoch": 89.79, + "learning_rate": 5.120336814560948e-06, + "loss": 1.8117, + "step": 31020500 + }, + { + "epoch": 89.79, + "learning_rate": 5.119614614208966e-06, + "loss": 1.7964, + "step": 31021000 + }, + { + "epoch": 89.79, + "learning_rate": 5.1188909665616894e-06, + "loss": 1.8089, + "step": 31021500 + }, + { + "epoch": 89.8, + "learning_rate": 5.118167318914413e-06, + "loss": 1.8005, + "step": 31022000 + }, + { + "epoch": 89.8, + "learning_rate": 5.1174436712671364e-06, + "loss": 1.7662, + "step": 31022500 + }, + { + "epoch": 89.8, + "learning_rate": 5.1167200236198595e-06, + "loss": 1.8157, + "step": 31023000 + }, + { + "epoch": 89.8, + "learning_rate": 5.115996375972583e-06, + "loss": 1.8105, + "step": 31023500 + }, + { + "epoch": 89.8, + "learning_rate": 5.115272728325306e-06, + "loss": 1.7839, + "step": 31024000 + }, + { + "epoch": 89.8, + "learning_rate": 5.114550527973324e-06, + "loss": 1.7666, + "step": 31024500 + }, + { + "epoch": 89.8, + "learning_rate": 5.113826880326047e-06, + "loss": 1.8154, + "step": 31025000 + }, + { + "epoch": 89.81, + "learning_rate": 5.11310323267877e-06, + "loss": 1.7914, + "step": 31025500 + }, + { + "epoch": 89.81, + "learning_rate": 5.112379585031493e-06, + "loss": 1.8192, + "step": 31026000 + }, + { + "epoch": 89.81, + "learning_rate": 5.111655937384217e-06, + "loss": 1.8151, + "step": 31026500 + }, + { + "epoch": 89.81, + "learning_rate": 5.110932289736939e-06, + "loss": 1.7558, + "step": 31027000 + }, + { + "epoch": 89.81, + "learning_rate": 5.110208642089663e-06, + "loss": 1.8293, + "step": 31027500 + }, + { + "epoch": 89.81, + "learning_rate": 5.10948644173768e-06, + "loss": 1.7896, + "step": 31028000 + }, + { + "epoch": 89.81, + "learning_rate": 5.108762794090404e-06, + "loss": 1.7697, + "step": 31028500 + }, + { + "epoch": 89.82, + "learning_rate": 5.108039146443127e-06, + "loss": 1.7629, + "step": 31029000 + }, + { + "epoch": 89.82, + "learning_rate": 5.1073169460911455e-06, + "loss": 1.775, + "step": 31029500 + }, + { + "epoch": 89.82, + "learning_rate": 5.106593298443868e-06, + "loss": 1.7662, + "step": 31030000 + }, + { + "epoch": 89.82, + "learning_rate": 5.105869650796592e-06, + "loss": 1.8131, + "step": 31030500 + }, + { + "epoch": 89.82, + "learning_rate": 5.105146003149315e-06, + "loss": 1.8293, + "step": 31031000 + }, + { + "epoch": 89.82, + "learning_rate": 5.104422355502038e-06, + "loss": 1.783, + "step": 31031500 + }, + { + "epoch": 89.82, + "learning_rate": 5.103698707854762e-06, + "loss": 1.8036, + "step": 31032000 + }, + { + "epoch": 89.83, + "learning_rate": 5.102975060207484e-06, + "loss": 1.804, + "step": 31032500 + }, + { + "epoch": 89.83, + "learning_rate": 5.102252859855503e-06, + "loss": 1.7901, + "step": 31033000 + }, + { + "epoch": 89.83, + "learning_rate": 5.101529212208225e-06, + "loss": 1.8096, + "step": 31033500 + }, + { + "epoch": 89.83, + "learning_rate": 5.100805564560949e-06, + "loss": 1.8027, + "step": 31034000 + }, + { + "epoch": 89.83, + "learning_rate": 5.100081916913671e-06, + "loss": 1.7731, + "step": 31034500 + }, + { + "epoch": 89.83, + "learning_rate": 5.099358269266395e-06, + "loss": 1.803, + "step": 31035000 + }, + { + "epoch": 89.84, + "learning_rate": 5.098634621619119e-06, + "loss": 1.8024, + "step": 31035500 + }, + { + "epoch": 89.84, + "learning_rate": 5.097910973971841e-06, + "loss": 1.8052, + "step": 31036000 + }, + { + "epoch": 89.84, + "learning_rate": 5.097187326324565e-06, + "loss": 1.7962, + "step": 31036500 + }, + { + "epoch": 89.84, + "learning_rate": 5.0964651259725826e-06, + "loss": 1.7983, + "step": 31037000 + }, + { + "epoch": 89.84, + "learning_rate": 5.0957414783253065e-06, + "loss": 1.7771, + "step": 31037500 + }, + { + "epoch": 89.84, + "learning_rate": 5.095017830678029e-06, + "loss": 1.7917, + "step": 31038000 + }, + { + "epoch": 89.84, + "learning_rate": 5.094294183030753e-06, + "loss": 1.8234, + "step": 31038500 + }, + { + "epoch": 89.85, + "learning_rate": 5.093570535383476e-06, + "loss": 1.7986, + "step": 31039000 + }, + { + "epoch": 89.85, + "learning_rate": 5.092846887736199e-06, + "loss": 1.7761, + "step": 31039500 + }, + { + "epoch": 89.85, + "learning_rate": 5.092123240088923e-06, + "loss": 1.7962, + "step": 31040000 + }, + { + "epoch": 89.85, + "learning_rate": 5.09140103973694e-06, + "loss": 1.8111, + "step": 31040500 + }, + { + "epoch": 89.85, + "learning_rate": 5.090677392089663e-06, + "loss": 1.8011, + "step": 31041000 + }, + { + "epoch": 89.85, + "learning_rate": 5.089953744442386e-06, + "loss": 1.7815, + "step": 31041500 + }, + { + "epoch": 89.85, + "learning_rate": 5.08923009679511e-06, + "loss": 1.7855, + "step": 31042000 + }, + { + "epoch": 89.86, + "learning_rate": 5.088506449147832e-06, + "loss": 1.809, + "step": 31042500 + }, + { + "epoch": 89.86, + "learning_rate": 5.087782801500556e-06, + "loss": 1.7832, + "step": 31043000 + }, + { + "epoch": 89.86, + "learning_rate": 5.0870606011485735e-06, + "loss": 1.8157, + "step": 31043500 + }, + { + "epoch": 89.86, + "learning_rate": 5.086336953501297e-06, + "loss": 1.808, + "step": 31044000 + }, + { + "epoch": 89.86, + "learning_rate": 5.0856133058540205e-06, + "loss": 1.8058, + "step": 31044500 + }, + { + "epoch": 89.86, + "learning_rate": 5.0848896582067436e-06, + "loss": 1.8014, + "step": 31045000 + }, + { + "epoch": 89.86, + "learning_rate": 5.084166010559467e-06, + "loss": 1.7971, + "step": 31045500 + }, + { + "epoch": 89.87, + "learning_rate": 5.08344236291219e-06, + "loss": 1.8013, + "step": 31046000 + }, + { + "epoch": 89.87, + "learning_rate": 5.082718715264914e-06, + "loss": 1.7971, + "step": 31046500 + }, + { + "epoch": 89.87, + "learning_rate": 5.081995067617636e-06, + "loss": 1.7918, + "step": 31047000 + }, + { + "epoch": 89.87, + "learning_rate": 5.08127141997036e-06, + "loss": 1.7778, + "step": 31047500 + }, + { + "epoch": 89.87, + "learning_rate": 5.080547772323083e-06, + "loss": 1.7877, + "step": 31048000 + }, + { + "epoch": 89.87, + "learning_rate": 5.079825571971101e-06, + "loss": 1.7932, + "step": 31048500 + }, + { + "epoch": 89.87, + "learning_rate": 5.079103371619118e-06, + "loss": 1.7995, + "step": 31049000 + }, + { + "epoch": 89.88, + "learning_rate": 5.078379723971842e-06, + "loss": 1.7883, + "step": 31049500 + }, + { + "epoch": 89.88, + "learning_rate": 5.077656076324564e-06, + "loss": 1.7742, + "step": 31050000 + }, + { + "epoch": 89.88, + "learning_rate": 5.076932428677288e-06, + "loss": 1.7876, + "step": 31050500 + }, + { + "epoch": 89.88, + "learning_rate": 5.076208781030011e-06, + "loss": 1.7816, + "step": 31051000 + }, + { + "epoch": 89.88, + "learning_rate": 5.0754851333827345e-06, + "loss": 1.8116, + "step": 31051500 + }, + { + "epoch": 89.88, + "learning_rate": 5.0747614857354576e-06, + "loss": 1.7867, + "step": 31052000 + }, + { + "epoch": 89.88, + "learning_rate": 5.074037838088181e-06, + "loss": 1.7992, + "step": 31052500 + }, + { + "epoch": 89.89, + "learning_rate": 5.073314190440905e-06, + "loss": 1.7951, + "step": 31053000 + }, + { + "epoch": 89.89, + "learning_rate": 5.072591990088922e-06, + "loss": 1.7902, + "step": 31053500 + }, + { + "epoch": 89.89, + "learning_rate": 5.071868342441646e-06, + "loss": 1.8223, + "step": 31054000 + }, + { + "epoch": 89.89, + "learning_rate": 5.071144694794369e-06, + "loss": 1.7848, + "step": 31054500 + }, + { + "epoch": 89.89, + "learning_rate": 5.070421047147092e-06, + "loss": 1.7924, + "step": 31055000 + }, + { + "epoch": 89.89, + "learning_rate": 5.069697399499815e-06, + "loss": 1.8117, + "step": 31055500 + }, + { + "epoch": 89.89, + "learning_rate": 5.068975199147833e-06, + "loss": 1.8007, + "step": 31056000 + }, + { + "epoch": 89.9, + "learning_rate": 5.068251551500556e-06, + "loss": 1.7975, + "step": 31056500 + }, + { + "epoch": 89.9, + "learning_rate": 5.067527903853279e-06, + "loss": 1.788, + "step": 31057000 + }, + { + "epoch": 89.9, + "learning_rate": 5.066804256206002e-06, + "loss": 1.7742, + "step": 31057500 + }, + { + "epoch": 89.9, + "learning_rate": 5.0660820558540204e-06, + "loss": 1.801, + "step": 31058000 + }, + { + "epoch": 89.9, + "learning_rate": 5.065361302797333e-06, + "loss": 1.814, + "step": 31058500 + }, + { + "epoch": 89.9, + "learning_rate": 5.064637655150056e-06, + "loss": 1.7834, + "step": 31059000 + }, + { + "epoch": 89.9, + "learning_rate": 5.063914007502779e-06, + "loss": 1.7889, + "step": 31059500 + }, + { + "epoch": 89.91, + "learning_rate": 5.063190359855502e-06, + "loss": 1.7877, + "step": 31060000 + }, + { + "epoch": 89.91, + "learning_rate": 5.062466712208226e-06, + "loss": 1.7991, + "step": 31060500 + }, + { + "epoch": 89.91, + "learning_rate": 5.061743064560949e-06, + "loss": 1.7721, + "step": 31061000 + }, + { + "epoch": 89.91, + "learning_rate": 5.061019416913672e-06, + "loss": 1.7735, + "step": 31061500 + }, + { + "epoch": 89.91, + "learning_rate": 5.060295769266395e-06, + "loss": 1.8069, + "step": 31062000 + }, + { + "epoch": 89.91, + "learning_rate": 5.059572121619118e-06, + "loss": 1.7819, + "step": 31062500 + }, + { + "epoch": 89.91, + "learning_rate": 5.058848473971841e-06, + "loss": 1.7999, + "step": 31063000 + }, + { + "epoch": 89.92, + "learning_rate": 5.058124826324565e-06, + "loss": 1.8044, + "step": 31063500 + }, + { + "epoch": 89.92, + "learning_rate": 5.0574026259725824e-06, + "loss": 1.7907, + "step": 31064000 + }, + { + "epoch": 89.92, + "learning_rate": 5.0566789783253055e-06, + "loss": 1.7785, + "step": 31064500 + }, + { + "epoch": 89.92, + "learning_rate": 5.0559553306780295e-06, + "loss": 1.7746, + "step": 31065000 + }, + { + "epoch": 89.92, + "learning_rate": 5.0552316830307525e-06, + "loss": 1.7963, + "step": 31065500 + }, + { + "epoch": 89.92, + "learning_rate": 5.054508035383476e-06, + "loss": 1.797, + "step": 31066000 + }, + { + "epoch": 89.92, + "learning_rate": 5.053784387736199e-06, + "loss": 1.7972, + "step": 31066500 + }, + { + "epoch": 89.93, + "learning_rate": 5.053060740088922e-06, + "loss": 1.7928, + "step": 31067000 + }, + { + "epoch": 89.93, + "learning_rate": 5.052337092441646e-06, + "loss": 1.8019, + "step": 31067500 + }, + { + "epoch": 89.93, + "learning_rate": 5.051613444794368e-06, + "loss": 1.7654, + "step": 31068000 + }, + { + "epoch": 89.93, + "learning_rate": 5.050889797147092e-06, + "loss": 1.7965, + "step": 31068500 + }, + { + "epoch": 89.93, + "learning_rate": 5.050167596795109e-06, + "loss": 1.7858, + "step": 31069000 + }, + { + "epoch": 89.93, + "learning_rate": 5.049443949147833e-06, + "loss": 1.8038, + "step": 31069500 + }, + { + "epoch": 89.93, + "learning_rate": 5.048720301500556e-06, + "loss": 1.7854, + "step": 31070000 + }, + { + "epoch": 89.94, + "learning_rate": 5.047996653853279e-06, + "loss": 1.8226, + "step": 31070500 + }, + { + "epoch": 89.94, + "learning_rate": 5.0472744535012965e-06, + "loss": 1.8072, + "step": 31071000 + }, + { + "epoch": 89.94, + "learning_rate": 5.04655080585402e-06, + "loss": 1.8024, + "step": 31071500 + }, + { + "epoch": 89.94, + "learning_rate": 5.0458271582067435e-06, + "loss": 1.7958, + "step": 31072000 + }, + { + "epoch": 89.94, + "learning_rate": 5.0451035105594665e-06, + "loss": 1.7608, + "step": 31072500 + }, + { + "epoch": 89.94, + "learning_rate": 5.0443798629121905e-06, + "loss": 1.7754, + "step": 31073000 + }, + { + "epoch": 89.95, + "learning_rate": 5.043656215264913e-06, + "loss": 1.8251, + "step": 31073500 + }, + { + "epoch": 89.95, + "learning_rate": 5.042932567617637e-06, + "loss": 1.7764, + "step": 31074000 + }, + { + "epoch": 89.95, + "learning_rate": 5.04220891997036e-06, + "loss": 1.7879, + "step": 31074500 + }, + { + "epoch": 89.95, + "learning_rate": 5.041486719618378e-06, + "loss": 1.7692, + "step": 31075000 + }, + { + "epoch": 89.95, + "learning_rate": 5.0407630719711e-06, + "loss": 1.7914, + "step": 31075500 + }, + { + "epoch": 89.95, + "learning_rate": 5.040039424323824e-06, + "loss": 1.8386, + "step": 31076000 + }, + { + "epoch": 89.95, + "learning_rate": 5.039315776676547e-06, + "loss": 1.801, + "step": 31076500 + }, + { + "epoch": 89.96, + "learning_rate": 5.038595023619859e-06, + "loss": 1.7975, + "step": 31077000 + }, + { + "epoch": 89.96, + "learning_rate": 5.037871375972582e-06, + "loss": 1.7818, + "step": 31077500 + }, + { + "epoch": 89.96, + "learning_rate": 5.037147728325306e-06, + "loss": 1.8002, + "step": 31078000 + }, + { + "epoch": 89.96, + "learning_rate": 5.0364240806780286e-06, + "loss": 1.796, + "step": 31078500 + }, + { + "epoch": 89.96, + "learning_rate": 5.0357004330307525e-06, + "loss": 1.8078, + "step": 31079000 + }, + { + "epoch": 89.96, + "learning_rate": 5.0349767853834756e-06, + "loss": 1.8191, + "step": 31079500 + }, + { + "epoch": 89.96, + "learning_rate": 5.034253137736199e-06, + "loss": 1.8095, + "step": 31080000 + }, + { + "epoch": 89.97, + "learning_rate": 5.0335294900889226e-06, + "loss": 1.7904, + "step": 31080500 + }, + { + "epoch": 89.97, + "learning_rate": 5.032805842441645e-06, + "loss": 1.7769, + "step": 31081000 + }, + { + "epoch": 89.97, + "learning_rate": 5.032083642089663e-06, + "loss": 1.814, + "step": 31081500 + }, + { + "epoch": 89.97, + "learning_rate": 5.031359994442386e-06, + "loss": 1.791, + "step": 31082000 + }, + { + "epoch": 89.97, + "learning_rate": 5.03063634679511e-06, + "loss": 1.7928, + "step": 31082500 + }, + { + "epoch": 89.97, + "learning_rate": 5.029912699147832e-06, + "loss": 1.8185, + "step": 31083000 + }, + { + "epoch": 89.97, + "learning_rate": 5.029189051500556e-06, + "loss": 1.7939, + "step": 31083500 + }, + { + "epoch": 89.98, + "learning_rate": 5.028466851148573e-06, + "loss": 1.7925, + "step": 31084000 + }, + { + "epoch": 89.98, + "learning_rate": 5.027743203501297e-06, + "loss": 1.7887, + "step": 31084500 + }, + { + "epoch": 89.98, + "learning_rate": 5.0270210031493145e-06, + "loss": 1.8083, + "step": 31085000 + }, + { + "epoch": 89.98, + "learning_rate": 5.0262973555020384e-06, + "loss": 1.7956, + "step": 31085500 + }, + { + "epoch": 89.98, + "learning_rate": 5.025573707854761e-06, + "loss": 1.7919, + "step": 31086000 + }, + { + "epoch": 89.98, + "learning_rate": 5.024850060207485e-06, + "loss": 1.7945, + "step": 31086500 + }, + { + "epoch": 89.98, + "learning_rate": 5.024126412560208e-06, + "loss": 1.7981, + "step": 31087000 + }, + { + "epoch": 89.99, + "learning_rate": 5.023402764912931e-06, + "loss": 1.7997, + "step": 31087500 + }, + { + "epoch": 89.99, + "learning_rate": 5.022679117265655e-06, + "loss": 1.7895, + "step": 31088000 + }, + { + "epoch": 89.99, + "learning_rate": 5.021955469618377e-06, + "loss": 1.7703, + "step": 31088500 + }, + { + "epoch": 89.99, + "learning_rate": 5.021233269266396e-06, + "loss": 1.8148, + "step": 31089000 + }, + { + "epoch": 89.99, + "learning_rate": 5.020511068914413e-06, + "loss": 1.791, + "step": 31089500 + }, + { + "epoch": 89.99, + "learning_rate": 5.019787421267136e-06, + "loss": 1.7994, + "step": 31090000 + }, + { + "epoch": 89.99, + "learning_rate": 5.019063773619859e-06, + "loss": 1.7964, + "step": 31090500 + }, + { + "epoch": 90.0, + "learning_rate": 5.018340125972583e-06, + "loss": 1.795, + "step": 31091000 + }, + { + "epoch": 90.0, + "learning_rate": 5.0176164783253054e-06, + "loss": 1.7833, + "step": 31091500 + }, + { + "epoch": 90.0, + "learning_rate": 5.016892830678029e-06, + "loss": 1.794, + "step": 31092000 + }, + { + "epoch": 90.0, + "eval_accuracy": 0.6908986811886525, + "eval_accuracy_mlm": 0.6604567266583212, + "eval_accuracy_nsp": 0.8540649791698175, + "eval_loss": 2.221858263015747, + "eval_runtime": 331.9118, + "eval_samples_per_second": 1314.765, + "eval_steps_per_second": 54.783, + "step": 31092480 } ], "max_steps": 34547200, "num_train_epochs": 100, - "total_flos": 3.786397348095303e+19, + "total_flos": 4.259665445549079e+19, "trial_name": null, "trial_params": null }