|
[ |
|
{ |
|
"train": { |
|
"lr": 9.875093667547056e-05, |
|
"grad_norm": null, |
|
"grad_scale": 16646.144, |
|
"ce": 3.3427528912723066, |
|
"ppl": 33.995531789183616, |
|
"ce_q1": 2.6098834899961947, |
|
"ppl_q1": 16.068788988828658, |
|
"ce_q2": 3.199262778028846, |
|
"ppl_q2": 29.528365777134894, |
|
"ce_q3": 3.5988389488831163, |
|
"ppl_q3": 44.14542267882824, |
|
"ce_q4": 3.963026348605752, |
|
"ppl_q4": 65.16646182084084, |
|
"duration": 1218.7015924453735 |
|
}, |
|
"valid": { |
|
"ce": 2.3822669982910156, |
|
"ppl": 10.829425811767578, |
|
"ce_q1": 1.7792327404022217, |
|
"ppl_q1": 5.925308704376221, |
|
"ce_q2": 2.184326171875, |
|
"ppl_q2": 8.884659767150879, |
|
"ce_q3": 2.657968759536743, |
|
"ppl_q3": 14.267280578613281, |
|
"ce_q4": 2.9075403213500977, |
|
"ppl_q4": 18.311702728271484, |
|
"duration": 12.130462884902954 |
|
} |
|
}, |
|
{ |
|
"train": { |
|
"lr": 9.441882233514132e-05, |
|
"grad_norm": 3.1516987761110067, |
|
"grad_scale": 16384.0, |
|
"ce": 2.7866730407330906, |
|
"ppl": 18.343669335007668, |
|
"ce_q1": 1.960708865690045, |
|
"ppl_q1": 7.67068022608757, |
|
"ce_q2": 2.627964652788825, |
|
"ppl_q2": 15.557403705596924, |
|
"ce_q3": 3.0775233307108283, |
|
"ppl_q3": 24.984127308368684, |
|
"ce_q4": 3.4804952954860635, |
|
"ppl_q4": 38.55263476216793, |
|
"duration": 1236.4078493118286 |
|
}, |
|
"valid": { |
|
"ce": 2.0738468170166016, |
|
"ppl": 7.955367088317871, |
|
"ce_q1": 1.3967729806900024, |
|
"ppl_q1": 4.042134761810303, |
|
"ce_q2": 1.8793870210647583, |
|
"ppl_q2": 6.549488544464111, |
|
"ce_q3": 2.3681416511535645, |
|
"ppl_q3": 10.677531242370605, |
|
"ce_q4": 2.65108585357666, |
|
"ppl_q4": 14.169415473937988, |
|
"duration": 16.665278434753418 |
|
} |
|
}, |
|
{ |
|
"train": { |
|
"lr": 8.528177696195438e-05, |
|
"grad_norm": 2.5766738409250975, |
|
"grad_scale": 32604.16, |
|
"ce": 2.456978987471317, |
|
"ppl": 13.047622307181358, |
|
"ce_q1": 1.6183160656695255, |
|
"ppl_q1": 5.345393500924111, |
|
"ce_q2": 2.2931290368936024, |
|
"ppl_q2": 10.987915291905404, |
|
"ce_q3": 2.7538199657049116, |
|
"ppl_q3": 17.96441888523102, |
|
"ce_q4": 3.1626508837685106, |
|
"ppl_q4": 27.951965188264847, |
|
"duration": 1225.9593234062195 |
|
}, |
|
"valid": { |
|
"ce": 1.8575392961502075, |
|
"ppl": 6.407949447631836, |
|
"ce_q1": 1.146897554397583, |
|
"ppl_q1": 3.1484100818634033, |
|
"ce_q2": 1.676759123802185, |
|
"ppl_q2": 5.3481950759887695, |
|
"ce_q3": 2.1644644737243652, |
|
"ppl_q3": 8.709936141967773, |
|
"ce_q4": 2.4420361518859863, |
|
"ppl_q4": 11.49642562866211, |
|
"duration": 14.441946506500244 |
|
} |
|
}, |
|
{ |
|
"train": { |
|
"lr": 7.268561864754141e-05, |
|
"grad_norm": 2.390021135300398, |
|
"grad_scale": 32768.0, |
|
"ce": 2.243085328816436, |
|
"ppl": 10.385881650805473, |
|
"ce_q1": 1.4056685628239065, |
|
"ppl_q1": 4.270641067743301, |
|
"ce_q2": 2.0750045562880115, |
|
"ppl_q2": 8.697048548817635, |
|
"ce_q3": 2.539443302554544, |
|
"ppl_q3": 14.286545807361604, |
|
"ce_q4": 2.9522249091272244, |
|
"ppl_q4": 22.33064289879799, |
|
"duration": 1231.9223251342773 |
|
}, |
|
"valid": { |
|
"ce": 1.6338310241699219, |
|
"ppl": 5.123465538024902, |
|
"ce_q1": 0.9277531504631042, |
|
"ppl_q1": 2.5288209915161133, |
|
"ce_q2": 1.4565773010253906, |
|
"ppl_q2": 4.2912468910217285, |
|
"ce_q3": 1.9195992946624756, |
|
"ppl_q3": 6.818225860595703, |
|
"ce_q4": 2.2313942909240723, |
|
"ppl_q4": 9.31284236907959, |
|
"duration": 12.240105867385864 |
|
} |
|
}, |
|
{ |
|
"train": { |
|
"lr": 5.7865306001898234e-05, |
|
"grad_norm": 2.3538931381218133, |
|
"grad_scale": 65208.32, |
|
"ce": 2.0580586477583274, |
|
"ppl": 8.52094031894207, |
|
"ce_q1": 1.2490628082135227, |
|
"ppl_q1": 3.6193587613105773, |
|
"ce_q2": 1.8907092852091882, |
|
"ppl_q2": 7.142661284089089, |
|
"ce_q3": 2.34134632987684, |
|
"ppl_q3": 11.545488672852516, |
|
"ce_q4": 2.751116160790931, |
|
"ppl_q4": 17.986016420960425, |
|
"duration": 1227.4011478424072 |
|
}, |
|
"valid": { |
|
"ce": 1.4793100357055664, |
|
"ppl": 4.389915466308594, |
|
"ce_q1": 0.7983056902885437, |
|
"ppl_q1": 2.221773386001587, |
|
"ce_q2": 1.30791437625885, |
|
"ppl_q2": 3.6984519958496094, |
|
"ce_q3": 1.7428033351898193, |
|
"ppl_q3": 5.7133378982543945, |
|
"ce_q4": 2.068216562271118, |
|
"ppl_q4": 7.910702228546143, |
|
"duration": 12.669232368469238 |
|
} |
|
} |
|
] |