impcabbie committed on
Commit
2e881ab
1 Parent(s): de1160c

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 10.0,
3
- "eval_accuracy": 0.7429906542056075,
4
- "eval_loss": 0.6470456719398499,
5
- "eval_runtime": 11.8351,
6
- "eval_samples_per_second": 18.082,
7
- "eval_steps_per_second": 0.591,
8
- "total_flos": 4.772483236233216e+17,
9
- "train_loss": 0.631834732691447,
10
- "train_runtime": 2090.315,
11
- "train_samples_per_second": 9.185,
12
- "train_steps_per_second": 0.072
13
  }
 
1
  {
2
+ "epoch": 9.68,
3
+ "eval_accuracy": 0.7272727272727273,
4
+ "eval_loss": 0.6827457547187805,
5
+ "eval_runtime": 17.8634,
6
+ "eval_samples_per_second": 12.316,
7
+ "eval_steps_per_second": 0.392,
8
+ "total_flos": 4.7612977286482944e+17,
9
+ "train_loss": 0.6240748373667399,
10
+ "train_runtime": 3165.909,
11
+ "train_samples_per_second": 6.251,
12
+ "train_steps_per_second": 0.047
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 10.0,
3
- "eval_accuracy": 0.7429906542056075,
4
- "eval_loss": 0.6470456719398499,
5
- "eval_runtime": 11.8351,
6
- "eval_samples_per_second": 18.082,
7
- "eval_steps_per_second": 0.591
8
  }
 
1
  {
2
+ "epoch": 9.68,
3
+ "eval_accuracy": 0.7272727272727273,
4
+ "eval_loss": 0.6827457547187805,
5
+ "eval_runtime": 17.8634,
6
+ "eval_samples_per_second": 12.316,
7
+ "eval_steps_per_second": 0.392
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:795d7fdfbf2c2c13acbb1b6d47d3945160d4f54d6a9c36f12c3ac128ff178056
3
  size 110345908
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a7379e8a0b9024c03ddc84ca54c44771da4b6b921aab03357917ea5a6217a00
3
  size 110345908
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eaff7ef959a5de0ccb92404811b6aae31227f644993a4a312bab77b62554c238
3
- size 110397937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abe972a95fe34c7d0035a0ef86d6ef050cfad2ed110164fec7c8e5554c472707
3
+ size 110398382
runs/Dec02_05-43-49_eaeadb71b15c/events.out.tfevents.1701495842.eaeadb71b15c.351.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebfba51551c3ccb150ef1d61b3dee189c502af122158771581288d112c3384bb
3
+ size 5340
runs/Nov30_19-21-04_9d5d42108d17/events.out.tfevents.1701375355.9d5d42108d17.324.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88aa5d85c6470066b496f5eb7711e0d3b7a9d323c392f1dffec897df3efe7d46
3
+ size 734
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 10.0,
3
- "total_flos": 4.772483236233216e+17,
4
- "train_loss": 0.631834732691447,
5
- "train_runtime": 2090.315,
6
- "train_samples_per_second": 9.185,
7
- "train_steps_per_second": 0.072
8
  }
 
1
  {
2
+ "epoch": 9.68,
3
+ "total_flos": 4.7612977286482944e+17,
4
+ "train_loss": 0.6240748373667399,
5
+ "train_runtime": 3165.909,
6
+ "train_samples_per_second": 6.251,
7
+ "train_steps_per_second": 0.047
8
  }
trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.7429906542056075,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-120",
4
- "epoch": 10.0,
5
  "eval_steps": 500,
6
  "global_step": 150,
7
  "is_hyper_param_search": false,
@@ -9,200 +9,200 @@
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.67,
13
  "learning_rate": 3.3333333333333335e-05,
14
- "loss": 1.0627,
15
  "step": 10
16
  },
17
  {
18
- "epoch": 1.0,
19
- "eval_accuracy": 0.5467289719626168,
20
- "eval_loss": 0.9620130062103271,
21
- "eval_runtime": 76.4881,
22
- "eval_samples_per_second": 2.798,
23
- "eval_steps_per_second": 0.092,
24
  "step": 15
25
  },
26
  {
27
- "epoch": 1.33,
28
  "learning_rate": 4.814814814814815e-05,
29
- "loss": 0.9337,
30
  "step": 20
31
  },
32
  {
33
- "epoch": 2.0,
34
  "learning_rate": 4.4444444444444447e-05,
35
- "loss": 0.8137,
36
  "step": 30
37
  },
38
  {
39
  "epoch": 2.0,
40
- "eval_accuracy": 0.6588785046728972,
41
- "eval_loss": 0.7779576778411865,
42
- "eval_runtime": 11.4497,
43
- "eval_samples_per_second": 18.691,
44
- "eval_steps_per_second": 0.611,
45
- "step": 30
46
  },
47
  {
48
- "epoch": 2.67,
49
  "learning_rate": 4.074074074074074e-05,
50
- "loss": 0.7516,
51
  "step": 40
52
  },
53
  {
54
- "epoch": 3.0,
55
- "eval_accuracy": 0.6822429906542056,
56
- "eval_loss": 0.7736912369728088,
57
- "eval_runtime": 10.1149,
58
- "eval_samples_per_second": 21.157,
59
- "eval_steps_per_second": 0.692,
60
- "step": 45
61
  },
62
  {
63
- "epoch": 3.33,
64
  "learning_rate": 3.7037037037037037e-05,
65
- "loss": 0.7407,
66
  "step": 50
67
  },
68
  {
69
- "epoch": 4.0,
70
  "learning_rate": 3.3333333333333335e-05,
71
- "loss": 0.6395,
72
  "step": 60
73
  },
74
  {
75
  "epoch": 4.0,
76
- "eval_accuracy": 0.6869158878504673,
77
- "eval_loss": 0.7195055484771729,
78
- "eval_runtime": 11.3612,
79
- "eval_samples_per_second": 18.836,
80
- "eval_steps_per_second": 0.616,
81
- "step": 60
82
  },
83
  {
84
- "epoch": 4.67,
85
  "learning_rate": 2.962962962962963e-05,
86
- "loss": 0.579,
87
  "step": 70
88
  },
89
  {
90
- "epoch": 5.0,
91
- "eval_accuracy": 0.7149532710280374,
92
- "eval_loss": 0.674180269241333,
93
- "eval_runtime": 10.9381,
94
- "eval_samples_per_second": 19.565,
95
- "eval_steps_per_second": 0.64,
96
- "step": 75
97
  },
98
  {
99
- "epoch": 5.33,
100
  "learning_rate": 2.5925925925925925e-05,
101
- "loss": 0.5781,
102
  "step": 80
103
  },
104
  {
105
- "epoch": 6.0,
106
  "learning_rate": 2.2222222222222223e-05,
107
- "loss": 0.5505,
108
  "step": 90
109
  },
110
  {
111
  "epoch": 6.0,
112
- "eval_accuracy": 0.7242990654205608,
113
- "eval_loss": 0.6525578498840332,
114
- "eval_runtime": 10.1857,
115
- "eval_samples_per_second": 21.01,
116
- "eval_steps_per_second": 0.687,
117
- "step": 90
118
  },
119
  {
120
- "epoch": 6.67,
121
  "learning_rate": 1.8518518518518518e-05,
122
- "loss": 0.5312,
123
  "step": 100
124
  },
125
  {
126
- "epoch": 7.0,
127
- "eval_accuracy": 0.7289719626168224,
128
- "eval_loss": 0.6616000533103943,
129
- "eval_runtime": 11.5076,
130
- "eval_samples_per_second": 18.596,
131
- "eval_steps_per_second": 0.608,
132
- "step": 105
133
  },
134
  {
135
- "epoch": 7.33,
136
  "learning_rate": 1.4814814814814815e-05,
137
- "loss": 0.4709,
138
  "step": 110
139
  },
140
  {
141
- "epoch": 8.0,
142
  "learning_rate": 1.1111111111111112e-05,
143
- "loss": 0.4793,
144
  "step": 120
145
  },
146
  {
147
  "epoch": 8.0,
148
- "eval_accuracy": 0.7429906542056075,
149
- "eval_loss": 0.6470456719398499,
150
- "eval_runtime": 10.8132,
151
- "eval_samples_per_second": 19.791,
152
- "eval_steps_per_second": 0.647,
153
- "step": 120
154
  },
155
  {
156
- "epoch": 8.67,
157
  "learning_rate": 7.4074074074074075e-06,
158
- "loss": 0.4443,
159
  "step": 130
160
  },
161
  {
162
- "epoch": 9.0,
163
- "eval_accuracy": 0.7383177570093458,
164
- "eval_loss": 0.6374843716621399,
165
- "eval_runtime": 11.7851,
166
- "eval_samples_per_second": 18.158,
167
- "eval_steps_per_second": 0.594,
168
- "step": 135
169
  },
170
  {
171
- "epoch": 9.33,
172
  "learning_rate": 3.7037037037037037e-06,
173
- "loss": 0.4335,
174
  "step": 140
175
  },
176
  {
177
- "epoch": 10.0,
178
  "learning_rate": 0.0,
179
- "loss": 0.4685,
180
  "step": 150
181
  },
182
  {
183
- "epoch": 10.0,
184
- "eval_accuracy": 0.7289719626168224,
185
- "eval_loss": 0.6419404745101929,
186
- "eval_runtime": 11.0308,
187
- "eval_samples_per_second": 19.4,
188
- "eval_steps_per_second": 0.635,
189
  "step": 150
190
  },
191
  {
192
- "epoch": 10.0,
193
  "step": 150,
194
- "total_flos": 4.772483236233216e+17,
195
- "train_loss": 0.631834732691447,
196
- "train_runtime": 2090.315,
197
- "train_samples_per_second": 9.185,
198
- "train_steps_per_second": 0.072
199
  }
200
  ],
201
  "logging_steps": 10,
202
  "max_steps": 150,
203
  "num_train_epochs": 10,
204
  "save_steps": 500,
205
- "total_flos": 4.772483236233216e+17,
206
  "trial_name": null,
207
  "trial_params": null
208
  }
 
1
  {
2
+ "best_metric": 0.7272727272727273,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-93",
4
+ "epoch": 9.67741935483871,
5
  "eval_steps": 500,
6
  "global_step": 150,
7
  "is_hyper_param_search": false,
 
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.65,
13
  "learning_rate": 3.3333333333333335e-05,
14
+ "loss": 1.1158,
15
  "step": 10
16
  },
17
  {
18
+ "epoch": 0.97,
19
+ "eval_accuracy": 0.5045454545454545,
20
+ "eval_loss": 0.9996662735939026,
21
+ "eval_runtime": 192.1374,
22
+ "eval_samples_per_second": 1.145,
23
+ "eval_steps_per_second": 0.036,
24
  "step": 15
25
  },
26
  {
27
+ "epoch": 1.29,
28
  "learning_rate": 4.814814814814815e-05,
29
+ "loss": 0.9619,
30
  "step": 20
31
  },
32
  {
33
+ "epoch": 1.94,
34
  "learning_rate": 4.4444444444444447e-05,
35
+ "loss": 0.8261,
36
  "step": 30
37
  },
38
  {
39
  "epoch": 2.0,
40
+ "eval_accuracy": 0.5909090909090909,
41
+ "eval_loss": 0.9179713726043701,
42
+ "eval_runtime": 12.9002,
43
+ "eval_samples_per_second": 17.054,
44
+ "eval_steps_per_second": 0.543,
45
+ "step": 31
46
  },
47
  {
48
+ "epoch": 2.58,
49
  "learning_rate": 4.074074074074074e-05,
50
+ "loss": 0.7361,
51
  "step": 40
52
  },
53
  {
54
+ "epoch": 2.97,
55
+ "eval_accuracy": 0.65,
56
+ "eval_loss": 0.8046814203262329,
57
+ "eval_runtime": 12.6289,
58
+ "eval_samples_per_second": 17.42,
59
+ "eval_steps_per_second": 0.554,
60
+ "step": 46
61
  },
62
  {
63
+ "epoch": 3.23,
64
  "learning_rate": 3.7037037037037037e-05,
65
+ "loss": 0.695,
66
  "step": 50
67
  },
68
  {
69
+ "epoch": 3.87,
70
  "learning_rate": 3.3333333333333335e-05,
71
+ "loss": 0.6325,
72
  "step": 60
73
  },
74
  {
75
  "epoch": 4.0,
76
+ "eval_accuracy": 0.6818181818181818,
77
+ "eval_loss": 0.7319933772087097,
78
+ "eval_runtime": 11.9267,
79
+ "eval_samples_per_second": 18.446,
80
+ "eval_steps_per_second": 0.587,
81
+ "step": 62
82
  },
83
  {
84
+ "epoch": 4.52,
85
  "learning_rate": 2.962962962962963e-05,
86
+ "loss": 0.5946,
87
  "step": 70
88
  },
89
  {
90
+ "epoch": 4.97,
91
+ "eval_accuracy": 0.6772727272727272,
92
+ "eval_loss": 0.7196129560470581,
93
+ "eval_runtime": 12.5354,
94
+ "eval_samples_per_second": 17.55,
95
+ "eval_steps_per_second": 0.558,
96
+ "step": 77
97
  },
98
  {
99
+ "epoch": 5.16,
100
  "learning_rate": 2.5925925925925925e-05,
101
+ "loss": 0.5746,
102
  "step": 80
103
  },
104
  {
105
+ "epoch": 5.81,
106
  "learning_rate": 2.2222222222222223e-05,
107
+ "loss": 0.5149,
108
  "step": 90
109
  },
110
  {
111
  "epoch": 6.0,
112
+ "eval_accuracy": 0.7272727272727273,
113
+ "eval_loss": 0.6827457547187805,
114
+ "eval_runtime": 12.8605,
115
+ "eval_samples_per_second": 17.107,
116
+ "eval_steps_per_second": 0.544,
117
+ "step": 93
118
  },
119
  {
120
+ "epoch": 6.45,
121
  "learning_rate": 1.8518518518518518e-05,
122
+ "loss": 0.5083,
123
  "step": 100
124
  },
125
  {
126
+ "epoch": 6.97,
127
+ "eval_accuracy": 0.6954545454545454,
128
+ "eval_loss": 0.6906238198280334,
129
+ "eval_runtime": 12.5065,
130
+ "eval_samples_per_second": 17.591,
131
+ "eval_steps_per_second": 0.56,
132
+ "step": 108
133
  },
134
  {
135
+ "epoch": 7.1,
136
  "learning_rate": 1.4814814814814815e-05,
137
+ "loss": 0.4835,
138
  "step": 110
139
  },
140
  {
141
+ "epoch": 7.74,
142
  "learning_rate": 1.1111111111111112e-05,
143
+ "loss": 0.4316,
144
  "step": 120
145
  },
146
  {
147
  "epoch": 8.0,
148
+ "eval_accuracy": 0.7090909090909091,
149
+ "eval_loss": 0.6681076288223267,
150
+ "eval_runtime": 12.7742,
151
+ "eval_samples_per_second": 17.222,
152
+ "eval_steps_per_second": 0.548,
153
+ "step": 124
154
  },
155
  {
156
+ "epoch": 8.39,
157
  "learning_rate": 7.4074074074074075e-06,
158
+ "loss": 0.4214,
159
  "step": 130
160
  },
161
  {
162
+ "epoch": 8.97,
163
+ "eval_accuracy": 0.7090909090909091,
164
+ "eval_loss": 0.6699694395065308,
165
+ "eval_runtime": 12.8762,
166
+ "eval_samples_per_second": 17.086,
167
+ "eval_steps_per_second": 0.544,
168
+ "step": 139
169
  },
170
  {
171
+ "epoch": 9.03,
172
  "learning_rate": 3.7037037037037037e-06,
173
+ "loss": 0.4551,
174
  "step": 140
175
  },
176
  {
177
+ "epoch": 9.68,
178
  "learning_rate": 0.0,
179
+ "loss": 0.4096,
180
  "step": 150
181
  },
182
  {
183
+ "epoch": 9.68,
184
+ "eval_accuracy": 0.7090909090909091,
185
+ "eval_loss": 0.6670935153961182,
186
+ "eval_runtime": 12.1565,
187
+ "eval_samples_per_second": 18.097,
188
+ "eval_steps_per_second": 0.576,
189
  "step": 150
190
  },
191
  {
192
+ "epoch": 9.68,
193
  "step": 150,
194
+ "total_flos": 4.7612977286482944e+17,
195
+ "train_loss": 0.6240748373667399,
196
+ "train_runtime": 3165.909,
197
+ "train_samples_per_second": 6.251,
198
+ "train_steps_per_second": 0.047
199
  }
200
  ],
201
  "logging_steps": 10,
202
  "max_steps": 150,
203
  "num_train_epochs": 10,
204
  "save_steps": 500,
205
+ "total_flos": 4.7612977286482944e+17,
206
  "trial_name": null,
207
  "trial_params": null
208
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a4f481a36c89204aeedde5377a22a9258ae5a4b142e7198e15e3fa361842a5b
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1210178898209e43a21f0315525493ed9643984df32cad3c848f6cee94f214bb
3
  size 4664