PergaZuZ commited on
Commit
90e603a
1 Parent(s): 96cc896

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +6 -6
  2. test_results.json +6 -6
  3. trainer_state.json +65 -101
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 7.078947368421052,
3
- "eval_accuracy": 0.7972027972027972,
4
- "eval_loss": 0.7915867567062378,
5
- "eval_runtime": 1521.5044,
6
- "eval_samples_per_second": 0.282,
7
- "eval_steps_per_second": 0.018
8
  }
 
1
  {
2
+ "epoch": 3.2105263157894735,
3
+ "eval_accuracy": 0.5407925407925408,
4
+ "eval_loss": 0.9939900040626526,
5
+ "eval_runtime": 1531.0787,
6
+ "eval_samples_per_second": 0.28,
7
+ "eval_steps_per_second": 0.035
8
  }
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 7.078947368421052,
3
- "eval_accuracy": 0.7972027972027972,
4
- "eval_loss": 0.7915867567062378,
5
- "eval_runtime": 1521.5044,
6
- "eval_samples_per_second": 0.282,
7
- "eval_steps_per_second": 0.018
8
  }
 
1
  {
2
+ "epoch": 3.2105263157894735,
3
+ "eval_accuracy": 0.5407925407925408,
4
+ "eval_loss": 0.9939900040626526,
5
+ "eval_runtime": 1531.0787,
6
+ "eval_samples_per_second": 0.28,
7
+ "eval_steps_per_second": 0.035
8
  }
trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.5598526703499079,
3
  "best_model_checkpoint": "videomae-base-finetuned-lift-data-resize/checkpoint-76",
4
- "epoch": 7.078947368421052,
5
  "eval_steps": 500,
6
  "global_step": 76,
7
  "is_hyper_param_search": false,
@@ -10,150 +10,114 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.13157894736842105,
13
- "grad_norm": 5.784543514251709,
14
  "learning_rate": 4.8529411764705885e-05,
15
- "loss": 1.6087,
16
  "step": 10
17
  },
18
  {
19
- "epoch": 0.13157894736842105,
20
- "eval_accuracy": 0.2596685082872928,
21
- "eval_loss": 1.8482669591903687,
22
- "eval_runtime": 1902.2155,
23
- "eval_samples_per_second": 0.285,
24
- "eval_steps_per_second": 0.018,
25
- "step": 10
26
- },
27
- {
28
- "epoch": 1.131578947368421,
29
- "grad_norm": 5.533542633056641,
30
  "learning_rate": 4.11764705882353e-05,
31
- "loss": 1.3273,
32
  "step": 20
33
  },
34
  {
35
- "epoch": 1.131578947368421,
36
- "eval_accuracy": 0.2983425414364641,
37
- "eval_loss": 1.445150375366211,
38
- "eval_runtime": 1919.0254,
39
- "eval_samples_per_second": 0.283,
40
- "eval_steps_per_second": 0.018,
41
  "step": 20
42
  },
43
  {
44
- "epoch": 2.1315789473684212,
45
- "grad_norm": 5.178999900817871,
46
  "learning_rate": 3.382352941176471e-05,
47
- "loss": 1.2351,
48
  "step": 30
49
  },
50
  {
51
- "epoch": 2.1315789473684212,
52
- "eval_accuracy": 0.27992633517495397,
53
- "eval_loss": 1.5890227556228638,
54
- "eval_runtime": 1917.7799,
55
- "eval_samples_per_second": 0.283,
56
- "eval_steps_per_second": 0.018,
57
- "step": 30
58
- },
59
- {
60
- "epoch": 3.1315789473684212,
61
- "grad_norm": 6.05620813369751,
62
  "learning_rate": 2.647058823529412e-05,
63
- "loss": 1.1635,
64
  "step": 40
65
  },
66
  {
67
- "epoch": 3.1315789473684212,
68
- "eval_accuracy": 0.29097605893186,
69
- "eval_loss": 1.3829658031463623,
70
- "eval_runtime": 1908.1474,
71
- "eval_samples_per_second": 0.285,
72
- "eval_steps_per_second": 0.018,
73
  "step": 40
74
  },
75
  {
76
- "epoch": 4.131578947368421,
77
- "grad_norm": 6.08853006362915,
78
  "learning_rate": 1.9117647058823528e-05,
79
- "loss": 1.0374,
80
- "step": 50
81
- },
82
- {
83
- "epoch": 4.131578947368421,
84
- "eval_accuracy": 0.3001841620626151,
85
- "eval_loss": 1.3681721687316895,
86
- "eval_runtime": 1920.2107,
87
- "eval_samples_per_second": 0.283,
88
- "eval_steps_per_second": 0.018,
89
  "step": 50
90
  },
91
  {
92
- "epoch": 5.131578947368421,
93
- "grad_norm": 8.272621154785156,
94
  "learning_rate": 1.1764705882352942e-05,
95
- "loss": 0.9699,
96
  "step": 60
97
  },
98
  {
99
- "epoch": 5.131578947368421,
100
- "eval_accuracy": 0.5322283609576427,
101
- "eval_loss": 1.2128217220306396,
102
- "eval_runtime": 1939.0306,
103
- "eval_samples_per_second": 0.28,
104
- "eval_steps_per_second": 0.018,
105
  "step": 60
106
  },
107
  {
108
- "epoch": 6.131578947368421,
109
- "grad_norm": 6.870037078857422,
110
  "learning_rate": 4.411764705882353e-06,
111
- "loss": 0.8748,
112
  "step": 70
113
  },
114
  {
115
- "epoch": 6.131578947368421,
116
- "eval_accuracy": 0.5561694290976059,
117
- "eval_loss": 1.0850194692611694,
118
- "eval_runtime": 1915.7845,
119
- "eval_samples_per_second": 0.283,
120
- "eval_steps_per_second": 0.018,
121
- "step": 70
122
- },
123
- {
124
- "epoch": 7.078947368421052,
125
- "eval_accuracy": 0.5598526703499079,
126
- "eval_loss": 1.0720747709274292,
127
- "eval_runtime": 1934.2154,
128
- "eval_samples_per_second": 0.281,
129
- "eval_steps_per_second": 0.018,
130
  "step": 76
131
  },
132
  {
133
- "epoch": 7.078947368421052,
134
  "step": 76,
135
- "total_flos": 1.4890870230147072e+18,
136
- "train_loss": 1.143978382411756,
137
- "train_runtime": 20019.1589,
138
  "train_samples_per_second": 0.061,
139
- "train_steps_per_second": 0.004
140
  },
141
  {
142
- "epoch": 7.078947368421052,
143
- "eval_accuracy": 0.7972027972027972,
144
- "eval_loss": 0.7926375269889832,
145
- "eval_runtime": 1534.4439,
146
- "eval_samples_per_second": 0.28,
147
- "eval_steps_per_second": 0.018,
148
  "step": 76
149
  },
150
  {
151
- "epoch": 7.078947368421052,
152
- "eval_accuracy": 0.7972027972027972,
153
- "eval_loss": 0.7915867567062378,
154
- "eval_runtime": 1521.5044,
155
- "eval_samples_per_second": 0.282,
156
- "eval_steps_per_second": 0.018,
157
  "step": 76
158
  }
159
  ],
@@ -174,8 +138,8 @@
174
  "attributes": {}
175
  }
176
  },
177
- "total_flos": 1.4890870230147072e+18,
178
- "train_batch_size": 16,
179
  "trial_name": null,
180
  "trial_params": null
181
  }
 
1
  {
2
+ "best_metric": 0.5524861878453039,
3
  "best_model_checkpoint": "videomae-base-finetuned-lift-data-resize/checkpoint-76",
4
+ "epoch": 3.2105263157894735,
5
  "eval_steps": 500,
6
  "global_step": 76,
7
  "is_hyper_param_search": false,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.13157894736842105,
13
+ "grad_norm": 5.10792875289917,
14
  "learning_rate": 4.8529411764705885e-05,
15
+ "loss": 1.6509,
16
  "step": 10
17
  },
18
  {
19
+ "epoch": 0.2631578947368421,
20
+ "grad_norm": 5.389455795288086,
 
 
 
 
 
 
 
 
 
21
  "learning_rate": 4.11764705882353e-05,
22
+ "loss": 1.5445,
23
  "step": 20
24
  },
25
  {
26
+ "epoch": 0.2631578947368421,
27
+ "eval_accuracy": 0.11233885819521179,
28
+ "eval_loss": 1.6094709634780884,
29
+ "eval_runtime": 1927.838,
30
+ "eval_samples_per_second": 0.282,
31
+ "eval_steps_per_second": 0.035,
32
  "step": 20
33
  },
34
  {
35
+ "epoch": 1.131578947368421,
36
+ "grad_norm": 5.348465442657471,
37
  "learning_rate": 3.382352941176471e-05,
38
+ "loss": 1.3201,
39
  "step": 30
40
  },
41
  {
42
+ "epoch": 1.263157894736842,
43
+ "grad_norm": 8.077356338500977,
 
 
 
 
 
 
 
 
 
44
  "learning_rate": 2.647058823529412e-05,
45
+ "loss": 1.2942,
46
  "step": 40
47
  },
48
  {
49
+ "epoch": 1.263157894736842,
50
+ "eval_accuracy": 0.5119705340699816,
51
+ "eval_loss": 1.2199088335037231,
52
+ "eval_runtime": 1935.0816,
53
+ "eval_samples_per_second": 0.281,
54
+ "eval_steps_per_second": 0.035,
55
  "step": 40
56
  },
57
  {
58
+ "epoch": 2.1315789473684212,
59
+ "grad_norm": 7.384807109832764,
60
  "learning_rate": 1.9117647058823528e-05,
61
+ "loss": 1.0568,
 
 
 
 
 
 
 
 
 
62
  "step": 50
63
  },
64
  {
65
+ "epoch": 2.263157894736842,
66
+ "grad_norm": 7.400702953338623,
67
  "learning_rate": 1.1764705882352942e-05,
68
+ "loss": 1.2008,
69
  "step": 60
70
  },
71
  {
72
+ "epoch": 2.263157894736842,
73
+ "eval_accuracy": 0.5267034990791897,
74
+ "eval_loss": 1.1846799850463867,
75
+ "eval_runtime": 1919.9448,
76
+ "eval_samples_per_second": 0.283,
77
+ "eval_steps_per_second": 0.035,
78
  "step": 60
79
  },
80
  {
81
+ "epoch": 3.1315789473684212,
82
+ "grad_norm": 8.256953239440918,
83
  "learning_rate": 4.411764705882353e-06,
84
+ "loss": 1.0759,
85
  "step": 70
86
  },
87
  {
88
+ "epoch": 3.2105263157894735,
89
+ "eval_accuracy": 0.5524861878453039,
90
+ "eval_loss": 1.04552161693573,
91
+ "eval_runtime": 1926.4299,
92
+ "eval_samples_per_second": 0.282,
93
+ "eval_steps_per_second": 0.035,
 
 
 
 
 
 
 
 
 
94
  "step": 76
95
  },
96
  {
97
+ "epoch": 3.2105263157894735,
98
  "step": 76,
99
+ "total_flos": 7.46412658398167e+17,
100
+ "train_loss": 1.275582376279329,
101
+ "train_runtime": 10041.2113,
102
  "train_samples_per_second": 0.061,
103
+ "train_steps_per_second": 0.008
104
  },
105
  {
106
+ "epoch": 3.2105263157894735,
107
+ "eval_accuracy": 0.5407925407925408,
108
+ "eval_loss": 0.993989884853363,
109
+ "eval_runtime": 1508.347,
110
+ "eval_samples_per_second": 0.284,
111
+ "eval_steps_per_second": 0.036,
112
  "step": 76
113
  },
114
  {
115
+ "epoch": 3.2105263157894735,
116
+ "eval_accuracy": 0.5407925407925408,
117
+ "eval_loss": 0.9939900040626526,
118
+ "eval_runtime": 1531.0787,
119
+ "eval_samples_per_second": 0.28,
120
+ "eval_steps_per_second": 0.035,
121
  "step": 76
122
  }
123
  ],
 
138
  "attributes": {}
139
  }
140
  },
141
+ "total_flos": 7.46412658398167e+17,
142
+ "train_batch_size": 8,
143
  "trial_name": null,
144
  "trial_params": null
145
  }