youngp5 committed on
Commit
4de8749
1 Parent(s): 3827dea

Upload folder using huggingface_hub (#9)

Browse files

- Upload folder using huggingface_hub (5adf1bd6c7dc11965ec2ff2c6215a810cceccbc8)

Files changed (6) hide show
  1. optimizer.pt +2 -2
  2. pytorch_model.bin +1 -1
  3. rng_state.pth +1 -1
  4. scheduler.pt +1 -1
  5. trainer_state.json +58 -157
  6. training_args.bin +1 -1
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4373ca3f29c182403e6a4581c43a863b8b58292755d198fe1fc834ccd084a6ce
3
- size 686525061
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea415bb632e876ae512336a607af6840280bf456bb5c30658265c62bacd8732e
3
+ size 686524869
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de22ee000a33cc4c27096c9cfabd9c972fb27bbd412e0581dbdd28cd7229ca79
3
  size 343271789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41c78c09461862f59df553d91ae01c18dc010f7012574bb553a4aea495dfa339
3
  size 343271789
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dd3a816ab8628e6038ecf426e93a907752049203fbc39b63fcde557182a866f
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7508d4b8dd267de5cc58e972da25236687927651336a28f292c92f7f23951475
3
  size 14575
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b081c596a28e61a0c2c71b36c558646038f30339afa5e1f02c6c82300b54ce5e
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:102c64654091da92418743f04a2cd860e670dced82d2da75143ba070fc004661
3
  size 627
trainer_state.json CHANGED
@@ -1,247 +1,148 @@
1
  {
2
- "best_metric": 0.07841455936431885,
3
- "best_model_checkpoint": "./vit-base-beans/checkpoint-280",
4
- "epoch": 0.7608695652173914,
5
- "global_step": 280,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.03,
12
- "learning_rate": 0.00019322033898305085,
13
- "loss": 0.6554,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.05,
18
- "learning_rate": 0.0001864406779661017,
19
- "loss": 0.306,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.08,
24
- "learning_rate": 0.00017966101694915257,
25
- "loss": 0.267,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.11,
30
- "learning_rate": 0.00017288135593220342,
31
- "loss": 0.2825,
32
  "step": 40
33
  },
34
  {
35
  "epoch": 0.11,
36
- "eval_accuracy": 0.9318801089918256,
37
- "eval_loss": 0.2294050008058548,
38
- "eval_runtime": 16.8062,
39
- "eval_samples_per_second": 43.674,
40
- "eval_steps_per_second": 5.474,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 0.14,
45
- "learning_rate": 0.00016610169491525423,
46
- "loss": 0.3097,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 0.16,
51
- "learning_rate": 0.00015932203389830508,
52
- "loss": 0.2772,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 0.19,
57
- "learning_rate": 0.00015254237288135592,
58
- "loss": 0.1711,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 0.22,
63
- "learning_rate": 0.00014576271186440677,
64
- "loss": 0.1483,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 0.22,
69
- "eval_accuracy": 0.944141689373297,
70
- "eval_loss": 0.16020944714546204,
71
- "eval_runtime": 17.3798,
72
- "eval_samples_per_second": 42.233,
73
- "eval_steps_per_second": 5.294,
74
  "step": 80
75
  },
76
  {
77
  "epoch": 0.24,
78
- "learning_rate": 0.00013898305084745764,
79
- "loss": 0.2356,
80
  "step": 90
81
  },
82
  {
83
  "epoch": 0.27,
84
- "learning_rate": 0.00013220338983050849,
85
- "loss": 0.1144,
86
  "step": 100
87
  },
88
  {
89
  "epoch": 0.3,
90
- "learning_rate": 0.00012542372881355933,
91
- "loss": 0.2216,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 0.33,
96
- "learning_rate": 0.00011864406779661017,
97
- "loss": 0.2209,
98
  "step": 120
99
  },
100
  {
101
  "epoch": 0.33,
102
- "eval_accuracy": 0.829700272479564,
103
- "eval_loss": 0.29767370223999023,
104
- "eval_runtime": 17.13,
105
- "eval_samples_per_second": 42.849,
106
- "eval_steps_per_second": 5.371,
107
  "step": 120
108
  },
109
  {
110
  "epoch": 0.35,
111
- "learning_rate": 0.00011186440677966102,
112
- "loss": 0.2153,
113
  "step": 130
114
  },
115
  {
116
  "epoch": 0.38,
117
- "learning_rate": 0.00010508474576271188,
118
- "loss": 0.1693,
119
  "step": 140
120
  },
121
  {
122
  "epoch": 0.41,
123
- "learning_rate": 9.830508474576272e-05,
124
- "loss": 0.1625,
125
  "step": 150
126
  },
127
  {
128
  "epoch": 0.43,
129
- "learning_rate": 9.152542372881357e-05,
130
- "loss": 0.1384,
131
  "step": 160
132
  },
133
  {
134
  "epoch": 0.43,
135
- "eval_accuracy": 0.9645776566757494,
136
- "eval_loss": 0.10578873753547668,
137
- "eval_runtime": 16.6083,
138
- "eval_samples_per_second": 44.195,
139
- "eval_steps_per_second": 5.539,
140
  "step": 160
141
- },
142
- {
143
- "epoch": 0.46,
144
- "learning_rate": 8.474576271186441e-05,
145
- "loss": 0.1371,
146
- "step": 170
147
- },
148
- {
149
- "epoch": 0.49,
150
- "learning_rate": 7.796610169491526e-05,
151
- "loss": 0.1355,
152
- "step": 180
153
- },
154
- {
155
- "epoch": 0.52,
156
- "learning_rate": 7.11864406779661e-05,
157
- "loss": 0.1557,
158
- "step": 190
159
- },
160
- {
161
- "epoch": 0.54,
162
- "learning_rate": 6.440677966101695e-05,
163
- "loss": 0.1551,
164
- "step": 200
165
- },
166
- {
167
- "epoch": 0.54,
168
- "eval_accuracy": 0.9114441416893733,
169
- "eval_loss": 0.1725204885005951,
170
- "eval_runtime": 17.0671,
171
- "eval_samples_per_second": 43.007,
172
- "eval_steps_per_second": 5.39,
173
- "step": 200
174
- },
175
- {
176
- "epoch": 0.57,
177
- "learning_rate": 5.76271186440678e-05,
178
- "loss": 0.2091,
179
- "step": 210
180
- },
181
- {
182
- "epoch": 0.6,
183
- "learning_rate": 5.0847457627118643e-05,
184
- "loss": 0.1313,
185
- "step": 220
186
- },
187
- {
188
- "epoch": 0.62,
189
- "learning_rate": 4.4067796610169495e-05,
190
- "loss": 0.1056,
191
- "step": 230
192
- },
193
- {
194
- "epoch": 0.65,
195
- "learning_rate": 3.728813559322034e-05,
196
- "loss": 0.1608,
197
- "step": 240
198
- },
199
- {
200
- "epoch": 0.65,
201
- "eval_accuracy": 0.9673024523160763,
202
- "eval_loss": 0.09211871027946472,
203
- "eval_runtime": 16.6063,
204
- "eval_samples_per_second": 44.2,
205
- "eval_steps_per_second": 5.54,
206
- "step": 240
207
- },
208
- {
209
- "epoch": 0.68,
210
- "learning_rate": 3.050847457627119e-05,
211
- "loss": 0.0761,
212
- "step": 250
213
- },
214
- {
215
- "epoch": 0.71,
216
- "learning_rate": 2.3728813559322036e-05,
217
- "loss": 0.1044,
218
- "step": 260
219
- },
220
- {
221
- "epoch": 0.73,
222
- "learning_rate": 1.694915254237288e-05,
223
- "loss": 0.1141,
224
- "step": 270
225
- },
226
- {
227
- "epoch": 0.76,
228
- "learning_rate": 1.016949152542373e-05,
229
- "loss": 0.12,
230
- "step": 280
231
- },
232
- {
233
- "epoch": 0.76,
234
- "eval_accuracy": 0.9754768392370572,
235
- "eval_loss": 0.07841455936431885,
236
- "eval_runtime": 16.7459,
237
- "eval_samples_per_second": 43.832,
238
- "eval_steps_per_second": 5.494,
239
- "step": 280
240
  }
241
  ],
242
- "max_steps": 295,
243
  "num_train_epochs": 1,
244
- "total_flos": 3.471672249955123e+17,
245
  "trial_name": null,
246
  "trial_params": null
247
  }
 
1
  {
2
+ "best_metric": 0.12063875794410706,
3
+ "best_model_checkpoint": "./vit-base-beans/checkpoint-160",
4
+ "epoch": 0.43478260869565216,
5
+ "global_step": 160,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.03,
12
+ "learning_rate": 0.0001891304347826087,
13
+ "loss": 0.6558,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.05,
18
+ "learning_rate": 0.0001782608695652174,
19
+ "loss": 0.3045,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.08,
24
+ "learning_rate": 0.0001673913043478261,
25
+ "loss": 0.2567,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.11,
30
+ "learning_rate": 0.0001565217391304348,
31
+ "loss": 0.2319,
32
  "step": 40
33
  },
34
  {
35
  "epoch": 0.11,
36
+ "eval_accuracy": 0.8637602179836512,
37
+ "eval_loss": 0.2531130313873291,
38
+ "eval_runtime": 17.2839,
39
+ "eval_samples_per_second": 42.467,
40
+ "eval_steps_per_second": 5.323,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 0.14,
45
+ "learning_rate": 0.0001456521739130435,
46
+ "loss": 0.2499,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 0.16,
51
+ "learning_rate": 0.0001347826086956522,
52
+ "loss": 0.2874,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 0.19,
57
+ "learning_rate": 0.00012391304347826086,
58
+ "loss": 0.1609,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 0.22,
63
+ "learning_rate": 0.00011304347826086956,
64
+ "loss": 0.1306,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 0.22,
69
+ "eval_accuracy": 0.9564032697547684,
70
+ "eval_loss": 0.1377830058336258,
71
+ "eval_runtime": 17.1335,
72
+ "eval_samples_per_second": 42.84,
73
+ "eval_steps_per_second": 5.37,
74
  "step": 80
75
  },
76
  {
77
  "epoch": 0.24,
78
+ "learning_rate": 0.00010217391304347828,
79
+ "loss": 0.228,
80
  "step": 90
81
  },
82
  {
83
  "epoch": 0.27,
84
+ "learning_rate": 9.130434782608696e-05,
85
+ "loss": 0.1187,
86
  "step": 100
87
  },
88
  {
89
  "epoch": 0.3,
90
+ "learning_rate": 8.043478260869566e-05,
91
+ "loss": 0.1811,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 0.33,
96
+ "learning_rate": 6.956521739130436e-05,
97
+ "loss": 0.2075,
98
  "step": 120
99
  },
100
  {
101
  "epoch": 0.33,
102
+ "eval_accuracy": 0.8419618528610354,
103
+ "eval_loss": 0.3006892800331116,
104
+ "eval_runtime": 17.1056,
105
+ "eval_samples_per_second": 42.91,
106
+ "eval_steps_per_second": 5.378,
107
  "step": 120
108
  },
109
  {
110
  "epoch": 0.35,
111
+ "learning_rate": 5.869565217391305e-05,
112
+ "loss": 0.2099,
113
  "step": 130
114
  },
115
  {
116
  "epoch": 0.38,
117
+ "learning_rate": 4.782608695652174e-05,
118
+ "loss": 0.1518,
119
  "step": 140
120
  },
121
  {
122
  "epoch": 0.41,
123
+ "learning_rate": 3.695652173913043e-05,
124
+ "loss": 0.1559,
125
  "step": 150
126
  },
127
  {
128
  "epoch": 0.43,
129
+ "learning_rate": 2.608695652173913e-05,
130
+ "loss": 0.1573,
131
  "step": 160
132
  },
133
  {
134
  "epoch": 0.43,
135
+ "eval_accuracy": 0.9618528610354223,
136
+ "eval_loss": 0.12063875794410706,
137
+ "eval_runtime": 16.7256,
138
+ "eval_samples_per_second": 43.885,
139
+ "eval_steps_per_second": 5.501,
140
  "step": 160
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
141
  }
142
  ],
143
+ "max_steps": 184,
144
  "num_train_epochs": 1,
145
+ "total_flos": 1.9838127142600704e+17,
146
  "trial_name": null,
147
  "trial_params": null
148
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f07575c36fbac5b1ce76fcb42fdadefe90c95ce5be20b51ab48ba4f71f7e83f5
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0da1c4783c907062c5599838de2c50fb7797f9e629770cd8d98b5e414c53d23
3
  size 3963