File size: 4,581 Bytes
60f8a01
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
[
  {
    "train": {
      "lr": 9.875093667547056e-05,
      "grad_norm": Infinity,
      "grad_scale": 16646.144,
      "ce": 3.3427528912723066,
      "ppl": 33.995531789183616,
      "ce_q1": 2.6098834899961947,
      "ppl_q1": 16.068788988828658,
      "ce_q2": 3.199262778028846,
      "ppl_q2": 29.528365777134894,
      "ce_q3": 3.5988389488831163,
      "ppl_q3": 44.14542267882824,
      "ce_q4": 3.963026348605752,
      "ppl_q4": 65.16646182084084,
      "duration": 1218.7015924453735
    },
    "valid": {
      "ce": 2.3822669982910156,
      "ppl": 10.829425811767578,
      "ce_q1": 1.7792327404022217,
      "ppl_q1": 5.925308704376221,
      "ce_q2": 2.184326171875,
      "ppl_q2": 8.884659767150879,
      "ce_q3": 2.657968759536743,
      "ppl_q3": 14.267280578613281,
      "ce_q4": 2.9075403213500977,
      "ppl_q4": 18.311702728271484,
      "duration": 12.130462884902954
    }
  },
  {
    "train": {
      "lr": 9.441882233514132e-05,
      "grad_norm": 3.1516987761110067,
      "grad_scale": 16384.0,
      "ce": 2.7866730407330906,
      "ppl": 18.343669335007668,
      "ce_q1": 1.960708865690045,
      "ppl_q1": 7.67068022608757,
      "ce_q2": 2.627964652788825,
      "ppl_q2": 15.557403705596924,
      "ce_q3": 3.0775233307108283,
      "ppl_q3": 24.984127308368684,
      "ce_q4": 3.4804952954860635,
      "ppl_q4": 38.55263476216793,
      "duration": 1236.4078493118286
    },
    "valid": {
      "ce": 2.0738468170166016,
      "ppl": 7.955367088317871,
      "ce_q1": 1.3967729806900024,
      "ppl_q1": 4.042134761810303,
      "ce_q2": 1.8793870210647583,
      "ppl_q2": 6.549488544464111,
      "ce_q3": 2.3681416511535645,
      "ppl_q3": 10.677531242370605,
      "ce_q4": 2.65108585357666,
      "ppl_q4": 14.169415473937988,
      "duration": 16.665278434753418
    }
  },
  {
    "train": {
      "lr": 8.528177696195438e-05,
      "grad_norm": 2.5766738409250975,
      "grad_scale": 32604.16,
      "ce": 2.456978987471317,
      "ppl": 13.047622307181358,
      "ce_q1": 1.6183160656695255,
      "ppl_q1": 5.345393500924111,
      "ce_q2": 2.2931290368936024,
      "ppl_q2": 10.987915291905404,
      "ce_q3": 2.7538199657049116,
      "ppl_q3": 17.96441888523102,
      "ce_q4": 3.1626508837685106,
      "ppl_q4": 27.951965188264847,
      "duration": 1225.9593234062195
    },
    "valid": {
      "ce": 1.8575392961502075,
      "ppl": 6.407949447631836,
      "ce_q1": 1.146897554397583,
      "ppl_q1": 3.1484100818634033,
      "ce_q2": 1.676759123802185,
      "ppl_q2": 5.3481950759887695,
      "ce_q3": 2.1644644737243652,
      "ppl_q3": 8.709936141967773,
      "ce_q4": 2.4420361518859863,
      "ppl_q4": 11.49642562866211,
      "duration": 14.441946506500244
    }
  },
  {
    "train": {
      "lr": 7.268561864754141e-05,
      "grad_norm": 2.390021135300398,
      "grad_scale": 32768.0,
      "ce": 2.243085328816436,
      "ppl": 10.385881650805473,
      "ce_q1": 1.4056685628239065,
      "ppl_q1": 4.270641067743301,
      "ce_q2": 2.0750045562880115,
      "ppl_q2": 8.697048548817635,
      "ce_q3": 2.539443302554544,
      "ppl_q3": 14.286545807361604,
      "ce_q4": 2.9522249091272244,
      "ppl_q4": 22.33064289879799,
      "duration": 1231.9223251342773
    },
    "valid": {
      "ce": 1.6338310241699219,
      "ppl": 5.123465538024902,
      "ce_q1": 0.9277531504631042,
      "ppl_q1": 2.5288209915161133,
      "ce_q2": 1.4565773010253906,
      "ppl_q2": 4.2912468910217285,
      "ce_q3": 1.9195992946624756,
      "ppl_q3": 6.818225860595703,
      "ce_q4": 2.2313942909240723,
      "ppl_q4": 9.31284236907959,
      "duration": 12.240105867385864
    }
  },
  {
    "train": {
      "lr": 5.7865306001898234e-05,
      "grad_norm": 2.3538931381218133,
      "grad_scale": 65208.32,
      "ce": 2.0580586477583274,
      "ppl": 8.52094031894207,
      "ce_q1": 1.2490628082135227,
      "ppl_q1": 3.6193587613105773,
      "ce_q2": 1.8907092852091882,
      "ppl_q2": 7.142661284089089,
      "ce_q3": 2.34134632987684,
      "ppl_q3": 11.545488672852516,
      "ce_q4": 2.751116160790931,
      "ppl_q4": 17.986016420960425,
      "duration": 1227.4011478424072
    },
    "valid": {
      "ce": 1.4793100357055664,
      "ppl": 4.389915466308594,
      "ce_q1": 0.7983056902885437,
      "ppl_q1": 2.221773386001587,
      "ce_q2": 1.30791437625885,
      "ppl_q2": 3.6984519958496094,
      "ce_q3": 1.7428033351898193,
      "ppl_q3": 5.7133378982543945,
      "ce_q4": 2.068216562271118,
      "ppl_q4": 7.910702228546143,
      "duration": 12.669232368469238
    }
  }
]