hafidber commited on
Commit
52d1049
1 Parent(s): 581ee4c

End of training

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_accuracy": 0.5290322580645161,
4
- "eval_loss": 1.4294496774673462,
5
- "eval_runtime": 45.3757,
6
- "eval_samples_per_second": 3.416,
7
- "eval_steps_per_second": 1.719
8
  }
 
1
  {
2
+ "epoch": 1.5,
3
+ "eval_accuracy": 0.864516129032258,
4
+ "eval_loss": 0.4195975959300995,
5
+ "eval_runtime": 48.7546,
6
+ "eval_samples_per_second": 3.179,
7
+ "eval_steps_per_second": 1.6
8
  }
runs/Jan03_19-18-12_906282a222dc/events.out.tfevents.1704310050.906282a222dc.1586.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21c37fe1dbedad1bfbcb7e9c364f2f2d0a34c81c0c8f1168b2bf8002b6dd004a
3
- size 411
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6cf1cb50efdd916e202f53bfcae9a9975a0510c4125a4b8b350c8529403d9cf
3
+ size 734
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_accuracy": 0.5290322580645161,
4
- "eval_loss": 1.4294496774673462,
5
- "eval_runtime": 45.3757,
6
- "eval_samples_per_second": 3.416,
7
- "eval_steps_per_second": 1.719
8
  }
 
1
  {
2
+ "epoch": 1.5,
3
+ "eval_accuracy": 0.864516129032258,
4
+ "eval_loss": 0.4195975959300995,
5
+ "eval_runtime": 48.7546,
6
+ "eval_samples_per_second": 3.179,
7
+ "eval_steps_per_second": 1.6
8
  }
trainer_state.json CHANGED
@@ -1,145 +1,244 @@
1
  {
2
- "best_metric": 0.6285714285714286,
3
- "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-150",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
11
  {
12
  "epoch": 0.07,
13
  "learning_rate": 3.3333333333333335e-05,
14
- "loss": 2.3672,
15
- "step": 10
 
 
 
 
 
 
16
  },
17
  {
18
  "epoch": 0.13,
19
  "learning_rate": 4.814814814814815e-05,
20
- "loss": 2.5654,
21
- "step": 20
 
 
 
 
 
 
22
  },
23
  {
24
  "epoch": 0.2,
25
  "learning_rate": 4.4444444444444447e-05,
26
- "loss": 2.3019,
27
- "step": 30
 
 
 
 
 
 
28
  },
29
  {
30
  "epoch": 0.27,
31
  "learning_rate": 4.074074074074074e-05,
32
- "loss": 2.1634,
33
- "step": 40
 
 
 
 
 
 
34
  },
35
  {
36
  "epoch": 0.33,
37
  "learning_rate": 3.7037037037037037e-05,
38
- "loss": 1.9889,
39
- "step": 50
 
 
 
 
 
 
40
  },
41
  {
42
  "epoch": 0.4,
43
  "learning_rate": 3.3333333333333335e-05,
44
- "loss": 2.0758,
45
- "step": 60
 
 
 
 
 
 
46
  },
47
  {
48
  "epoch": 0.47,
49
  "learning_rate": 2.962962962962963e-05,
50
- "loss": 2.0439,
51
- "step": 70
 
 
 
 
 
 
52
  },
53
  {
54
- "epoch": 0.53,
 
 
 
 
 
 
 
 
 
55
  "learning_rate": 2.5925925925925925e-05,
56
- "loss": 1.6312,
57
- "step": 80
58
  },
59
  {
60
- "epoch": 0.6,
 
 
 
 
 
 
61
  "learning_rate": 2.2222222222222223e-05,
62
- "loss": 1.905,
63
- "step": 90
 
 
 
 
 
 
64
  },
65
  {
66
- "epoch": 0.67,
67
  "learning_rate": 1.8518518518518518e-05,
68
- "loss": 1.6742,
69
- "step": 100
 
 
 
 
 
 
70
  },
71
  {
72
- "epoch": 0.73,
73
  "learning_rate": 1.4814814814814815e-05,
74
- "loss": 1.6093,
75
- "step": 110
76
  },
77
  {
78
- "epoch": 0.8,
79
- "learning_rate": 1.1111111111111112e-05,
80
- "loss": 1.5733,
81
- "step": 120
82
  },
83
  {
84
- "epoch": 0.87,
85
- "learning_rate": 7.4074074074074075e-06,
86
- "loss": 1.6627,
87
- "step": 130
88
  },
89
  {
90
- "epoch": 0.93,
91
- "learning_rate": 3.7037037037037037e-06,
92
- "loss": 1.6796,
93
- "step": 140
94
  },
95
  {
96
- "epoch": 1.0,
97
- "learning_rate": 0.0,
98
- "loss": 1.3265,
99
- "step": 150
100
  },
101
  {
102
- "epoch": 1.0,
103
- "eval_accuracy": 0.6285714285714286,
104
- "eval_loss": 1.2609246969223022,
105
- "eval_runtime": 20.5848,
106
- "eval_samples_per_second": 3.401,
107
- "eval_steps_per_second": 1.7,
108
- "step": 150
109
  },
110
  {
111
- "epoch": 1.0,
112
- "step": 150,
113
- "total_flos": 3.73846047031296e+17,
114
- "train_loss": 1.9045542653401693,
115
- "train_runtime": 220.7068,
116
- "train_samples_per_second": 1.359,
117
- "train_steps_per_second": 0.68
118
  },
119
  {
120
- "epoch": 1.0,
121
- "eval_accuracy": 0.5290322580645161,
122
- "eval_loss": 1.429449439048767,
123
- "eval_runtime": 43.1887,
124
- "eval_samples_per_second": 3.589,
125
- "eval_steps_per_second": 1.806,
126
- "step": 150
127
  },
128
  {
129
- "epoch": 1.0,
130
- "eval_accuracy": 0.5290322580645161,
131
- "eval_loss": 1.4294496774673462,
132
- "eval_runtime": 45.3757,
133
- "eval_samples_per_second": 3.416,
134
- "eval_steps_per_second": 1.719,
135
- "step": 150
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
136
  }
137
  ],
138
  "logging_steps": 10,
139
- "max_steps": 150,
140
  "num_train_epochs": 9223372036854775807,
141
  "save_steps": 500,
142
- "total_flos": 3.73846047031296e+17,
143
  "trial_name": null,
144
  "trial_params": null
145
  }
 
1
  {
2
+ "best_metric": 0.8428571428571429,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-300",
4
+ "epoch": 1.5,
5
  "eval_steps": 500,
6
+ "global_step": 300,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
+ {
12
+ "epoch": 0.03,
13
+ "learning_rate": 1.6666666666666667e-05,
14
+ "loss": 2.3028,
15
+ "step": 10
16
+ },
17
  {
18
  "epoch": 0.07,
19
  "learning_rate": 3.3333333333333335e-05,
20
+ "loss": 2.3514,
21
+ "step": 20
22
+ },
23
+ {
24
+ "epoch": 0.1,
25
+ "learning_rate": 5e-05,
26
+ "loss": 2.3305,
27
+ "step": 30
28
  },
29
  {
30
  "epoch": 0.13,
31
  "learning_rate": 4.814814814814815e-05,
32
+ "loss": 2.2754,
33
+ "step": 40
34
+ },
35
+ {
36
+ "epoch": 0.17,
37
+ "learning_rate": 4.62962962962963e-05,
38
+ "loss": 2.0044,
39
+ "step": 50
40
  },
41
  {
42
  "epoch": 0.2,
43
  "learning_rate": 4.4444444444444447e-05,
44
+ "loss": 2.1435,
45
+ "step": 60
46
+ },
47
+ {
48
+ "epoch": 0.23,
49
+ "learning_rate": 4.259259259259259e-05,
50
+ "loss": 2.0639,
51
+ "step": 70
52
  },
53
  {
54
  "epoch": 0.27,
55
  "learning_rate": 4.074074074074074e-05,
56
+ "loss": 1.6206,
57
+ "step": 80
58
+ },
59
+ {
60
+ "epoch": 0.3,
61
+ "learning_rate": 3.888888888888889e-05,
62
+ "loss": 1.7889,
63
+ "step": 90
64
  },
65
  {
66
  "epoch": 0.33,
67
  "learning_rate": 3.7037037037037037e-05,
68
+ "loss": 1.6838,
69
+ "step": 100
70
+ },
71
+ {
72
+ "epoch": 0.37,
73
+ "learning_rate": 3.518518518518519e-05,
74
+ "loss": 1.3599,
75
+ "step": 110
76
  },
77
  {
78
  "epoch": 0.4,
79
  "learning_rate": 3.3333333333333335e-05,
80
+ "loss": 1.4852,
81
+ "step": 120
82
+ },
83
+ {
84
+ "epoch": 0.43,
85
+ "learning_rate": 3.148148148148148e-05,
86
+ "loss": 1.4107,
87
+ "step": 130
88
  },
89
  {
90
  "epoch": 0.47,
91
  "learning_rate": 2.962962962962963e-05,
92
+ "loss": 1.374,
93
+ "step": 140
94
+ },
95
+ {
96
+ "epoch": 0.5,
97
+ "learning_rate": 2.777777777777778e-05,
98
+ "loss": 1.0549,
99
+ "step": 150
100
  },
101
  {
102
+ "epoch": 0.5,
103
+ "eval_accuracy": 0.7571428571428571,
104
+ "eval_loss": 0.9527812600135803,
105
+ "eval_runtime": 22.0926,
106
+ "eval_samples_per_second": 3.168,
107
+ "eval_steps_per_second": 1.584,
108
+ "step": 150
109
+ },
110
+ {
111
+ "epoch": 1.03,
112
  "learning_rate": 2.5925925925925925e-05,
113
+ "loss": 0.8599,
114
+ "step": 160
115
  },
116
  {
117
+ "epoch": 1.07,
118
+ "learning_rate": 2.4074074074074074e-05,
119
+ "loss": 1.287,
120
+ "step": 170
121
+ },
122
+ {
123
+ "epoch": 1.1,
124
  "learning_rate": 2.2222222222222223e-05,
125
+ "loss": 0.9601,
126
+ "step": 180
127
+ },
128
+ {
129
+ "epoch": 1.13,
130
+ "learning_rate": 2.037037037037037e-05,
131
+ "loss": 0.6645,
132
+ "step": 190
133
  },
134
  {
135
+ "epoch": 1.17,
136
  "learning_rate": 1.8518518518518518e-05,
137
+ "loss": 0.6143,
138
+ "step": 200
139
+ },
140
+ {
141
+ "epoch": 1.2,
142
+ "learning_rate": 1.6666666666666667e-05,
143
+ "loss": 0.4838,
144
+ "step": 210
145
  },
146
  {
147
+ "epoch": 1.23,
148
  "learning_rate": 1.4814814814814815e-05,
149
+ "loss": 0.4428,
150
+ "step": 220
151
  },
152
  {
153
+ "epoch": 1.27,
154
+ "learning_rate": 1.2962962962962962e-05,
155
+ "loss": 0.7375,
156
+ "step": 230
157
  },
158
  {
159
+ "epoch": 1.3,
160
+ "learning_rate": 1.1111111111111112e-05,
161
+ "loss": 0.6078,
162
+ "step": 240
163
  },
164
  {
165
+ "epoch": 1.33,
166
+ "learning_rate": 9.259259259259259e-06,
167
+ "loss": 0.4268,
168
+ "step": 250
169
  },
170
  {
171
+ "epoch": 1.37,
172
+ "learning_rate": 7.4074074074074075e-06,
173
+ "loss": 0.2414,
174
+ "step": 260
175
  },
176
  {
177
+ "epoch": 1.4,
178
+ "learning_rate": 5.555555555555556e-06,
179
+ "loss": 0.4216,
180
+ "step": 270
 
 
 
181
  },
182
  {
183
+ "epoch": 1.43,
184
+ "learning_rate": 3.7037037037037037e-06,
185
+ "loss": 0.1838,
186
+ "step": 280
 
 
 
187
  },
188
  {
189
+ "epoch": 1.47,
190
+ "learning_rate": 1.8518518518518519e-06,
191
+ "loss": 0.5178,
192
+ "step": 290
 
 
 
193
  },
194
  {
195
+ "epoch": 1.5,
196
+ "learning_rate": 0.0,
197
+ "loss": 0.7251,
198
+ "step": 300
199
+ },
200
+ {
201
+ "epoch": 1.5,
202
+ "eval_accuracy": 0.8428571428571429,
203
+ "eval_loss": 0.4445994794368744,
204
+ "eval_runtime": 21.5992,
205
+ "eval_samples_per_second": 3.241,
206
+ "eval_steps_per_second": 1.62,
207
+ "step": 300
208
+ },
209
+ {
210
+ "epoch": 1.5,
211
+ "step": 300,
212
+ "total_flos": 7.47692094062592e+17,
213
+ "train_loss": 1.214137753645579,
214
+ "train_runtime": 449.6116,
215
+ "train_samples_per_second": 1.334,
216
+ "train_steps_per_second": 0.667
217
+ },
218
+ {
219
+ "epoch": 1.5,
220
+ "eval_accuracy": 0.864516129032258,
221
+ "eval_loss": 0.4195975959300995,
222
+ "eval_runtime": 49.2274,
223
+ "eval_samples_per_second": 3.149,
224
+ "eval_steps_per_second": 1.584,
225
+ "step": 300
226
+ },
227
+ {
228
+ "epoch": 1.5,
229
+ "eval_accuracy": 0.864516129032258,
230
+ "eval_loss": 0.4195975959300995,
231
+ "eval_runtime": 48.7546,
232
+ "eval_samples_per_second": 3.179,
233
+ "eval_steps_per_second": 1.6,
234
+ "step": 300
235
  }
236
  ],
237
  "logging_steps": 10,
238
+ "max_steps": 300,
239
  "num_train_epochs": 9223372036854775807,
240
  "save_steps": 500,
241
+ "total_flos": 7.47692094062592e+17,
242
  "trial_name": null,
243
  "trial_params": null
244
  }