impcabbie committed on
Commit
fa0a315
1 Parent(s): 07d1e4c

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 9.73,
3
- "eval_accuracy": 0.7272727272727273,
4
- "eval_loss": 0.6321931481361389,
5
- "eval_runtime": 5.5693,
6
- "eval_samples_per_second": 23.702,
7
- "eval_steps_per_second": 0.898,
8
- "total_flos": 2.8567786371889766e+17,
9
- "train_loss": 0.6456676854027642,
10
- "train_runtime": 1051.9243,
11
- "train_samples_per_second": 11.227,
12
- "train_steps_per_second": 0.086
13
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.7429906542056075,
4
+ "eval_loss": 0.6470456719398499,
5
+ "eval_runtime": 11.8351,
6
+ "eval_samples_per_second": 18.082,
7
+ "eval_steps_per_second": 0.591,
8
+ "total_flos": 4.772483236233216e+17,
9
+ "train_loss": 0.631834732691447,
10
+ "train_runtime": 2090.315,
11
+ "train_samples_per_second": 9.185,
12
+ "train_steps_per_second": 0.072
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.73,
3
- "eval_accuracy": 0.7272727272727273,
4
- "eval_loss": 0.6321931481361389,
5
- "eval_runtime": 5.5693,
6
- "eval_samples_per_second": 23.702,
7
- "eval_steps_per_second": 0.898
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.7429906542056075,
4
+ "eval_loss": 0.6470456719398499,
5
+ "eval_runtime": 11.8351,
6
+ "eval_samples_per_second": 18.082,
7
+ "eval_steps_per_second": 0.591
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4f652eb7f5dba7f7403ed4940f204e2303af8a85925a7596a21f7b9665e6124
3
  size 110345908
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9ac478b76ae08c58cccf61527ab27ba693406c4feb993e3f897009f4c94e951
3
  size 110345908
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eaff7ef959a5de0ccb92404811b6aae31227f644993a4a312bab77b62554c238
3
  size 110397937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:551d1bdb0e9ea1e87e437ec74e9b435f70538f93be8bb4ca1e628486fe3d85a1
3
  size 110397937
runs/Nov30_02-36-21_5327fa17b653/events.out.tfevents.1701313909.5327fa17b653.294.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72551607429dd262fdffc024289acb359e31578c1960c0fc42477df2ff7964b1
3
+ size 411
runs/Nov30_05-39-29_26aa82926d21/events.out.tfevents.1701322776.26aa82926d21.160.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0193d3cb9bc11e9ec47fb4489babe0d9c271ff503e3525fe774fbb3750bdda2
3
+ size 4869
runs/Nov30_19-21-04_9d5d42108d17/events.out.tfevents.1701372159.9d5d42108d17.324.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ace2fd88b704b315c767e7399a598c65beadb6ca57962d425f81d06646f66152
3
+ size 5186
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.73,
3
- "total_flos": 2.8567786371889766e+17,
4
- "train_loss": 0.6456676854027642,
5
- "train_runtime": 1051.9243,
6
- "train_samples_per_second": 11.227,
7
- "train_steps_per_second": 0.086
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "total_flos": 4.772483236233216e+17,
4
+ "train_loss": 0.631834732691447,
5
+ "train_runtime": 2090.315,
6
+ "train_samples_per_second": 9.185,
7
+ "train_steps_per_second": 0.072
8
  }
trainer_state.json CHANGED
@@ -1,172 +1,208 @@
1
  {
2
- "best_metric": 0.7272727272727273,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-83",
4
- "epoch": 9.72972972972973,
5
  "eval_steps": 500,
6
- "global_step": 90,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.97,
13
- "eval_accuracy": 0.4621212121212121,
14
- "eval_loss": 1.0291072130203247,
15
- "eval_runtime": 38.7664,
16
- "eval_samples_per_second": 3.405,
17
- "eval_steps_per_second": 0.129,
18
- "step": 9
19
- },
20
- {
21
- "epoch": 1.08,
22
- "learning_rate": 4.938271604938271e-05,
23
- "loss": 1.0954,
24
  "step": 10
25
  },
26
  {
27
- "epoch": 1.95,
28
- "eval_accuracy": 0.6136363636363636,
29
- "eval_loss": 0.8322019577026367,
30
- "eval_runtime": 6.218,
31
- "eval_samples_per_second": 21.229,
32
- "eval_steps_per_second": 0.804,
33
- "step": 18
34
  },
35
  {
36
- "epoch": 2.16,
37
- "learning_rate": 4.3209876543209875e-05,
38
- "loss": 0.8859,
39
  "step": 20
40
  },
41
  {
42
- "epoch": 2.92,
43
- "eval_accuracy": 0.6363636363636364,
44
- "eval_loss": 0.7933622598648071,
45
- "eval_runtime": 5.5171,
46
- "eval_samples_per_second": 23.926,
47
- "eval_steps_per_second": 0.906,
48
- "step": 27
49
  },
50
  {
51
- "epoch": 3.24,
52
- "learning_rate": 3.7037037037037037e-05,
53
- "loss": 0.7328,
 
 
 
54
  "step": 30
55
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
56
  {
57
  "epoch": 4.0,
58
- "eval_accuracy": 0.6742424242424242,
59
- "eval_loss": 0.7151352763175964,
60
- "eval_runtime": 6.9052,
61
- "eval_samples_per_second": 19.116,
62
- "eval_steps_per_second": 0.724,
63
- "step": 37
64
  },
65
  {
66
- "epoch": 4.32,
67
- "learning_rate": 3.08641975308642e-05,
68
- "loss": 0.6285,
69
- "step": 40
 
 
 
70
  },
71
  {
72
- "epoch": 4.97,
73
- "eval_accuracy": 0.6060606060606061,
74
- "eval_loss": 0.7613763809204102,
75
- "eval_runtime": 6.2935,
76
- "eval_samples_per_second": 20.974,
77
- "eval_steps_per_second": 0.794,
78
- "step": 46
79
  },
80
  {
81
- "epoch": 5.41,
82
- "learning_rate": 2.4691358024691357e-05,
83
- "loss": 0.5817,
84
- "step": 50
 
 
 
 
 
 
 
 
 
85
  },
86
  {
87
- "epoch": 5.95,
88
- "eval_accuracy": 0.6439393939393939,
89
- "eval_loss": 0.7581026554107666,
90
- "eval_runtime": 5.3759,
91
- "eval_samples_per_second": 24.554,
92
- "eval_steps_per_second": 0.93,
93
- "step": 55
 
 
 
 
 
 
94
  },
95
  {
96
- "epoch": 6.49,
97
  "learning_rate": 1.8518518518518518e-05,
98
- "loss": 0.5145,
99
- "step": 60
100
  },
101
  {
102
- "epoch": 6.92,
103
- "eval_accuracy": 0.7121212121212122,
104
- "eval_loss": 0.6607750654220581,
105
- "eval_runtime": 6.827,
106
- "eval_samples_per_second": 19.335,
107
- "eval_steps_per_second": 0.732,
108
- "step": 64
109
  },
110
  {
111
- "epoch": 7.57,
112
- "learning_rate": 1.2345679012345678e-05,
113
- "loss": 0.4899,
114
- "step": 70
115
  },
116
  {
117
  "epoch": 8.0,
118
- "eval_accuracy": 0.6893939393939394,
119
- "eval_loss": 0.6711231470108032,
120
- "eval_runtime": 5.4387,
121
- "eval_samples_per_second": 24.271,
122
- "eval_steps_per_second": 0.919,
123
- "step": 74
124
  },
125
  {
126
- "epoch": 8.65,
127
- "learning_rate": 6.172839506172839e-06,
128
- "loss": 0.4372,
129
- "step": 80
 
 
 
130
  },
131
  {
132
- "epoch": 8.97,
133
- "eval_accuracy": 0.7272727272727273,
134
- "eval_loss": 0.6321931481361389,
135
- "eval_runtime": 6.1539,
136
- "eval_samples_per_second": 21.45,
137
- "eval_steps_per_second": 0.812,
138
- "step": 83
139
  },
140
  {
141
- "epoch": 9.73,
142
- "learning_rate": 0.0,
143
- "loss": 0.4452,
144
- "step": 90
 
 
 
145
  },
146
  {
147
- "epoch": 9.73,
148
- "eval_accuracy": 0.7121212121212122,
149
- "eval_loss": 0.6398604512214661,
150
- "eval_runtime": 6.4193,
151
- "eval_samples_per_second": 20.563,
152
- "eval_steps_per_second": 0.779,
153
- "step": 90
154
  },
155
  {
156
- "epoch": 9.73,
157
- "step": 90,
158
- "total_flos": 2.8567786371889766e+17,
159
- "train_loss": 0.6456676854027642,
160
- "train_runtime": 1051.9243,
161
- "train_samples_per_second": 11.227,
162
- "train_steps_per_second": 0.086
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
163
  }
164
  ],
165
  "logging_steps": 10,
166
- "max_steps": 90,
167
  "num_train_epochs": 10,
168
  "save_steps": 500,
169
- "total_flos": 2.8567786371889766e+17,
170
  "trial_name": null,
171
  "trial_params": null
172
  }
 
1
  {
2
+ "best_metric": 0.7429906542056075,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-120",
4
+ "epoch": 10.0,
5
  "eval_steps": 500,
6
+ "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.67,
13
+ "learning_rate": 3.3333333333333335e-05,
14
+ "loss": 1.0627,
 
 
 
 
 
 
 
 
 
15
  "step": 10
16
  },
17
  {
18
+ "epoch": 1.0,
19
+ "eval_accuracy": 0.5467289719626168,
20
+ "eval_loss": 0.9620130062103271,
21
+ "eval_runtime": 76.4881,
22
+ "eval_samples_per_second": 2.798,
23
+ "eval_steps_per_second": 0.092,
24
+ "step": 15
25
  },
26
  {
27
+ "epoch": 1.33,
28
+ "learning_rate": 4.814814814814815e-05,
29
+ "loss": 0.9337,
30
  "step": 20
31
  },
32
  {
33
+ "epoch": 2.0,
34
+ "learning_rate": 4.4444444444444447e-05,
35
+ "loss": 0.8137,
36
+ "step": 30
 
 
 
37
  },
38
  {
39
+ "epoch": 2.0,
40
+ "eval_accuracy": 0.6588785046728972,
41
+ "eval_loss": 0.7779576778411865,
42
+ "eval_runtime": 11.4497,
43
+ "eval_samples_per_second": 18.691,
44
+ "eval_steps_per_second": 0.611,
45
  "step": 30
46
  },
47
+ {
48
+ "epoch": 2.67,
49
+ "learning_rate": 4.074074074074074e-05,
50
+ "loss": 0.7516,
51
+ "step": 40
52
+ },
53
+ {
54
+ "epoch": 3.0,
55
+ "eval_accuracy": 0.6822429906542056,
56
+ "eval_loss": 0.7736912369728088,
57
+ "eval_runtime": 10.1149,
58
+ "eval_samples_per_second": 21.157,
59
+ "eval_steps_per_second": 0.692,
60
+ "step": 45
61
+ },
62
+ {
63
+ "epoch": 3.33,
64
+ "learning_rate": 3.7037037037037037e-05,
65
+ "loss": 0.7407,
66
+ "step": 50
67
+ },
68
  {
69
  "epoch": 4.0,
70
+ "learning_rate": 3.3333333333333335e-05,
71
+ "loss": 0.6395,
72
+ "step": 60
 
 
 
73
  },
74
  {
75
+ "epoch": 4.0,
76
+ "eval_accuracy": 0.6869158878504673,
77
+ "eval_loss": 0.7195055484771729,
78
+ "eval_runtime": 11.3612,
79
+ "eval_samples_per_second": 18.836,
80
+ "eval_steps_per_second": 0.616,
81
+ "step": 60
82
  },
83
  {
84
+ "epoch": 4.67,
85
+ "learning_rate": 2.962962962962963e-05,
86
+ "loss": 0.579,
87
+ "step": 70
 
 
 
88
  },
89
  {
90
+ "epoch": 5.0,
91
+ "eval_accuracy": 0.7149532710280374,
92
+ "eval_loss": 0.674180269241333,
93
+ "eval_runtime": 10.9381,
94
+ "eval_samples_per_second": 19.565,
95
+ "eval_steps_per_second": 0.64,
96
+ "step": 75
97
+ },
98
+ {
99
+ "epoch": 5.33,
100
+ "learning_rate": 2.5925925925925925e-05,
101
+ "loss": 0.5781,
102
+ "step": 80
103
  },
104
  {
105
+ "epoch": 6.0,
106
+ "learning_rate": 2.2222222222222223e-05,
107
+ "loss": 0.5505,
108
+ "step": 90
109
+ },
110
+ {
111
+ "epoch": 6.0,
112
+ "eval_accuracy": 0.7242990654205608,
113
+ "eval_loss": 0.6525578498840332,
114
+ "eval_runtime": 10.1857,
115
+ "eval_samples_per_second": 21.01,
116
+ "eval_steps_per_second": 0.687,
117
+ "step": 90
118
  },
119
  {
120
+ "epoch": 6.67,
121
  "learning_rate": 1.8518518518518518e-05,
122
+ "loss": 0.5312,
123
+ "step": 100
124
  },
125
  {
126
+ "epoch": 7.0,
127
+ "eval_accuracy": 0.7289719626168224,
128
+ "eval_loss": 0.6616000533103943,
129
+ "eval_runtime": 11.5076,
130
+ "eval_samples_per_second": 18.596,
131
+ "eval_steps_per_second": 0.608,
132
+ "step": 105
133
  },
134
  {
135
+ "epoch": 7.33,
136
+ "learning_rate": 1.4814814814814815e-05,
137
+ "loss": 0.4709,
138
+ "step": 110
139
  },
140
  {
141
  "epoch": 8.0,
142
+ "learning_rate": 1.1111111111111112e-05,
143
+ "loss": 0.4793,
144
+ "step": 120
 
 
 
145
  },
146
  {
147
+ "epoch": 8.0,
148
+ "eval_accuracy": 0.7429906542056075,
149
+ "eval_loss": 0.6470456719398499,
150
+ "eval_runtime": 10.8132,
151
+ "eval_samples_per_second": 19.791,
152
+ "eval_steps_per_second": 0.647,
153
+ "step": 120
154
  },
155
  {
156
+ "epoch": 8.67,
157
+ "learning_rate": 7.4074074074074075e-06,
158
+ "loss": 0.4443,
159
+ "step": 130
 
 
 
160
  },
161
  {
162
+ "epoch": 9.0,
163
+ "eval_accuracy": 0.7383177570093458,
164
+ "eval_loss": 0.6374843716621399,
165
+ "eval_runtime": 11.7851,
166
+ "eval_samples_per_second": 18.158,
167
+ "eval_steps_per_second": 0.594,
168
+ "step": 135
169
  },
170
  {
171
+ "epoch": 9.33,
172
+ "learning_rate": 3.7037037037037037e-06,
173
+ "loss": 0.4335,
174
+ "step": 140
 
 
 
175
  },
176
  {
177
+ "epoch": 10.0,
178
+ "learning_rate": 0.0,
179
+ "loss": 0.4685,
180
+ "step": 150
181
+ },
182
+ {
183
+ "epoch": 10.0,
184
+ "eval_accuracy": 0.7289719626168224,
185
+ "eval_loss": 0.6419404745101929,
186
+ "eval_runtime": 11.0308,
187
+ "eval_samples_per_second": 19.4,
188
+ "eval_steps_per_second": 0.635,
189
+ "step": 150
190
+ },
191
+ {
192
+ "epoch": 10.0,
193
+ "step": 150,
194
+ "total_flos": 4.772483236233216e+17,
195
+ "train_loss": 0.631834732691447,
196
+ "train_runtime": 2090.315,
197
+ "train_samples_per_second": 9.185,
198
+ "train_steps_per_second": 0.072
199
  }
200
  ],
201
  "logging_steps": 10,
202
+ "max_steps": 150,
203
  "num_train_epochs": 10,
204
  "save_steps": 500,
205
+ "total_flos": 4.772483236233216e+17,
206
  "trial_name": null,
207
  "trial_params": null
208
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d83f4ba9a02cd15381b3fc9b8e15a2e8e344ad4850ea94ae1368ab4386f16a6
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a4f481a36c89204aeedde5377a22a9258ae5a4b142e7198e15e3fa361842a5b
3
  size 4664