maixbach commited on
Commit
51b5359
1 Parent(s): 096f439

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.7696709585121603,
4
- "eval_loss": 0.5915560722351074,
5
- "eval_runtime": 7.0343,
6
- "eval_samples_per_second": 99.37,
7
- "eval_steps_per_second": 3.128,
8
- "total_flos": 2.085095129220956e+17,
9
- "train_loss": 0.8958317330389312,
10
- "train_runtime": 194.9461,
11
- "train_samples_per_second": 43.027,
12
- "train_steps_per_second": 0.339
13
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.882689556509299,
4
+ "eval_loss": 0.337208092212677,
5
+ "eval_runtime": 7.2237,
6
+ "eval_samples_per_second": 96.765,
7
+ "eval_steps_per_second": 3.046,
8
+ "total_flos": 6.950317097403187e+17,
9
+ "train_loss": 0.30874538096514614,
10
+ "train_runtime": 658.9789,
11
+ "train_samples_per_second": 42.429,
12
+ "train_steps_per_second": 0.334
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.7696709585121603,
4
- "eval_loss": 0.5915560722351074,
5
- "eval_runtime": 7.0343,
6
- "eval_samples_per_second": 99.37,
7
- "eval_steps_per_second": 3.128
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.882689556509299,
4
+ "eval_loss": 0.337208092212677,
5
+ "eval_runtime": 7.2237,
6
+ "eval_samples_per_second": 96.765,
7
+ "eval_steps_per_second": 3.046
8
  }
runs/Jan03_16-42-55_527f2771f15a/events.out.tfevents.1672764998.527f2771f15a.148.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b02f7d41284bdebba3ad062cd92051291c0a5cdc77b5e816366a209f2fe52087
3
+ size 363
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 2.085095129220956e+17,
4
- "train_loss": 0.8958317330389312,
5
- "train_runtime": 194.9461,
6
- "train_samples_per_second": 43.027,
7
- "train_steps_per_second": 0.339
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "total_flos": 6.950317097403187e+17,
4
+ "train_loss": 0.30874538096514614,
5
+ "train_runtime": 658.9789,
6
+ "train_samples_per_second": 42.429,
7
+ "train_steps_per_second": 0.334
8
  }
trainer_state.json CHANGED
@@ -1,88 +1,247 @@
1
  {
2
- "best_metric": 0.7696709585121603,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-trash_classification/checkpoint-66",
4
- "epoch": 3.0,
5
- "global_step": 66,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.45,
12
- "learning_rate": 4.745762711864407e-05,
13
- "loss": 1.5462,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.91,
18
- "learning_rate": 3.898305084745763e-05,
19
- "loss": 1.1855,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 1.0,
24
- "eval_accuracy": 0.6809728183118741,
25
- "eval_loss": 0.9103820323944092,
26
- "eval_runtime": 6.9474,
27
- "eval_samples_per_second": 100.613,
28
- "eval_steps_per_second": 3.167,
29
  "step": 22
30
  },
31
  {
32
  "epoch": 1.36,
33
- "learning_rate": 3.050847457627119e-05,
34
- "loss": 0.8813,
35
  "step": 30
36
  },
37
  {
38
  "epoch": 1.82,
39
- "learning_rate": 2.2033898305084748e-05,
40
- "loss": 0.7209,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 2.0,
45
- "eval_accuracy": 0.7510729613733905,
46
- "eval_loss": 0.6361371278762817,
47
- "eval_runtime": 7.3972,
48
- "eval_samples_per_second": 94.496,
49
- "eval_steps_per_second": 2.974,
50
  "step": 44
51
  },
52
  {
53
  "epoch": 2.27,
54
- "learning_rate": 1.3559322033898305e-05,
55
- "loss": 0.6267,
56
  "step": 50
57
  },
58
  {
59
  "epoch": 2.73,
60
- "learning_rate": 5.084745762711865e-06,
61
- "loss": 0.6043,
62
  "step": 60
63
  },
64
  {
65
  "epoch": 3.0,
66
- "eval_accuracy": 0.7696709585121603,
67
- "eval_loss": 0.5915560722351074,
68
- "eval_runtime": 6.9079,
69
- "eval_samples_per_second": 101.188,
70
- "eval_steps_per_second": 3.185,
71
  "step": 66
72
  },
73
  {
74
- "epoch": 3.0,
75
- "step": 66,
76
- "total_flos": 2.085095129220956e+17,
77
- "train_loss": 0.8958317330389312,
78
- "train_runtime": 194.9461,
79
- "train_samples_per_second": 43.027,
80
- "train_steps_per_second": 0.339
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
81
  }
82
  ],
83
- "max_steps": 66,
84
- "num_train_epochs": 3,
85
- "total_flos": 2.085095129220956e+17,
86
  "trial_name": null,
87
  "trial_params": null
88
  }
 
1
  {
2
+ "best_metric": 0.882689556509299,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-trash_classification/checkpoint-198",
4
+ "epoch": 10.0,
5
+ "global_step": 220,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.45,
12
+ "learning_rate": 2.272727272727273e-05,
13
+ "loss": 0.531,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.91,
18
+ "learning_rate": 4.545454545454546e-05,
19
+ "loss": 0.4991,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 1.0,
24
+ "eval_accuracy": 0.7911301859799714,
25
+ "eval_loss": 0.5482170581817627,
26
+ "eval_runtime": 7.0774,
27
+ "eval_samples_per_second": 98.766,
28
+ "eval_steps_per_second": 3.109,
29
  "step": 22
30
  },
31
  {
32
  "epoch": 1.36,
33
+ "learning_rate": 4.797979797979798e-05,
34
+ "loss": 0.4159,
35
  "step": 30
36
  },
37
  {
38
  "epoch": 1.82,
39
+ "learning_rate": 4.545454545454546e-05,
40
+ "loss": 0.4008,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 2.0,
45
+ "eval_accuracy": 0.7954220314735336,
46
+ "eval_loss": 0.5192908644676208,
47
+ "eval_runtime": 7.6454,
48
+ "eval_samples_per_second": 91.427,
49
+ "eval_steps_per_second": 2.878,
50
  "step": 44
51
  },
52
  {
53
  "epoch": 2.27,
54
+ "learning_rate": 4.292929292929293e-05,
55
+ "loss": 0.3623,
56
  "step": 50
57
  },
58
  {
59
  "epoch": 2.73,
60
+ "learning_rate": 4.0404040404040405e-05,
61
+ "loss": 0.3659,
62
  "step": 60
63
  },
64
  {
65
  "epoch": 3.0,
66
+ "eval_accuracy": 0.8397711015736766,
67
+ "eval_loss": 0.44643908739089966,
68
+ "eval_runtime": 7.1094,
69
+ "eval_samples_per_second": 98.321,
70
+ "eval_steps_per_second": 3.095,
71
  "step": 66
72
  },
73
  {
74
+ "epoch": 3.18,
75
+ "learning_rate": 3.787878787878788e-05,
76
+ "loss": 0.3551,
77
+ "step": 70
78
+ },
79
+ {
80
+ "epoch": 3.64,
81
+ "learning_rate": 3.535353535353535e-05,
82
+ "loss": 0.372,
83
+ "step": 80
84
+ },
85
+ {
86
+ "epoch": 4.0,
87
+ "eval_accuracy": 0.8397711015736766,
88
+ "eval_loss": 0.4384276270866394,
89
+ "eval_runtime": 7.6735,
90
+ "eval_samples_per_second": 91.093,
91
+ "eval_steps_per_second": 2.867,
92
+ "step": 88
93
+ },
94
+ {
95
+ "epoch": 4.09,
96
+ "learning_rate": 3.282828282828283e-05,
97
+ "loss": 0.3277,
98
+ "step": 90
99
+ },
100
+ {
101
+ "epoch": 4.55,
102
+ "learning_rate": 3.0303030303030306e-05,
103
+ "loss": 0.3252,
104
+ "step": 100
105
+ },
106
+ {
107
+ "epoch": 5.0,
108
+ "learning_rate": 2.777777777777778e-05,
109
+ "loss": 0.3388,
110
+ "step": 110
111
+ },
112
+ {
113
+ "epoch": 5.0,
114
+ "eval_accuracy": 0.8454935622317596,
115
+ "eval_loss": 0.42808040976524353,
116
+ "eval_runtime": 7.1513,
117
+ "eval_samples_per_second": 97.745,
118
+ "eval_steps_per_second": 3.076,
119
+ "step": 110
120
+ },
121
+ {
122
+ "epoch": 5.45,
123
+ "learning_rate": 2.5252525252525256e-05,
124
+ "loss": 0.2767,
125
+ "step": 120
126
+ },
127
+ {
128
+ "epoch": 5.91,
129
+ "learning_rate": 2.272727272727273e-05,
130
+ "loss": 0.2654,
131
+ "step": 130
132
+ },
133
+ {
134
+ "epoch": 6.0,
135
+ "eval_accuracy": 0.871244635193133,
136
+ "eval_loss": 0.3618273138999939,
137
+ "eval_runtime": 7.6567,
138
+ "eval_samples_per_second": 91.293,
139
+ "eval_steps_per_second": 2.873,
140
+ "step": 132
141
+ },
142
+ {
143
+ "epoch": 6.36,
144
+ "learning_rate": 2.0202020202020203e-05,
145
+ "loss": 0.235,
146
+ "step": 140
147
+ },
148
+ {
149
+ "epoch": 6.82,
150
+ "learning_rate": 1.7676767676767676e-05,
151
+ "loss": 0.2326,
152
+ "step": 150
153
+ },
154
+ {
155
+ "epoch": 7.0,
156
+ "eval_accuracy": 0.8755364806866953,
157
+ "eval_loss": 0.3550046682357788,
158
+ "eval_runtime": 7.1895,
159
+ "eval_samples_per_second": 97.226,
160
+ "eval_steps_per_second": 3.06,
161
+ "step": 154
162
+ },
163
+ {
164
+ "epoch": 7.27,
165
+ "learning_rate": 1.5151515151515153e-05,
166
+ "loss": 0.219,
167
+ "step": 160
168
+ },
169
+ {
170
+ "epoch": 7.73,
171
+ "learning_rate": 1.2626262626262628e-05,
172
+ "loss": 0.2354,
173
+ "step": 170
174
+ },
175
+ {
176
+ "epoch": 8.0,
177
+ "eval_accuracy": 0.8798283261802575,
178
+ "eval_loss": 0.3400857448577881,
179
+ "eval_runtime": 7.5656,
180
+ "eval_samples_per_second": 92.392,
181
+ "eval_steps_per_second": 2.908,
182
+ "step": 176
183
+ },
184
+ {
185
+ "epoch": 8.18,
186
+ "learning_rate": 1.0101010101010101e-05,
187
+ "loss": 0.2455,
188
+ "step": 180
189
+ },
190
+ {
191
+ "epoch": 8.64,
192
+ "learning_rate": 7.5757575757575764e-06,
193
+ "loss": 0.1774,
194
+ "step": 190
195
+ },
196
+ {
197
+ "epoch": 9.0,
198
+ "eval_accuracy": 0.882689556509299,
199
+ "eval_loss": 0.337208092212677,
200
+ "eval_runtime": 7.0903,
201
+ "eval_samples_per_second": 98.586,
202
+ "eval_steps_per_second": 3.103,
203
+ "step": 198
204
+ },
205
+ {
206
+ "epoch": 9.09,
207
+ "learning_rate": 5.050505050505051e-06,
208
+ "loss": 0.2007,
209
+ "step": 200
210
+ },
211
+ {
212
+ "epoch": 9.55,
213
+ "learning_rate": 2.5252525252525253e-06,
214
+ "loss": 0.226,
215
+ "step": 210
216
+ },
217
+ {
218
+ "epoch": 10.0,
219
+ "learning_rate": 0.0,
220
+ "loss": 0.1849,
221
+ "step": 220
222
+ },
223
+ {
224
+ "epoch": 10.0,
225
+ "eval_accuracy": 0.882689556509299,
226
+ "eval_loss": 0.33802154660224915,
227
+ "eval_runtime": 7.6016,
228
+ "eval_samples_per_second": 91.954,
229
+ "eval_steps_per_second": 2.894,
230
+ "step": 220
231
+ },
232
+ {
233
+ "epoch": 10.0,
234
+ "step": 220,
235
+ "total_flos": 6.950317097403187e+17,
236
+ "train_loss": 0.30874538096514614,
237
+ "train_runtime": 658.9789,
238
+ "train_samples_per_second": 42.429,
239
+ "train_steps_per_second": 0.334
240
  }
241
  ],
242
+ "max_steps": 220,
243
+ "num_train_epochs": 10,
244
+ "total_flos": 6.950317097403187e+17,
245
  "trial_name": null,
246
  "trial_params": null
247
  }