ruturajghumkar commited on
Commit
c15f883
1 Parent(s): b8c051c

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.541394829750061,
5
- "eval_runtime": 0.2681,
6
- "eval_samples_per_second": 18.649,
7
- "eval_steps_per_second": 3.73,
8
- "total_flos": 3206422579175424.0,
9
- "train_loss": 0.2824457089106242,
10
- "train_runtime": 11.3219,
11
- "train_samples_per_second": 11.394,
12
- "train_steps_per_second": 0.265
13
  }
 
1
  {
2
+ "epoch": 2.96,
3
+ "eval_accuracy": 0.8710801393728222,
4
+ "eval_loss": 0.3399865925312042,
5
+ "eval_runtime": 4.1257,
6
+ "eval_samples_per_second": 69.563,
7
+ "eval_steps_per_second": 2.181,
8
+ "total_flos": 1.9045723068223488e+17,
9
+ "train_loss": 0.657797618707021,
10
+ "train_runtime": 145.8955,
11
+ "train_samples_per_second": 53.113,
12
+ "train_steps_per_second": 0.411
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.541394829750061,
5
- "eval_runtime": 0.2681,
6
- "eval_samples_per_second": 18.649,
7
- "eval_steps_per_second": 3.73
8
  }
 
1
  {
2
+ "epoch": 2.96,
3
+ "eval_accuracy": 0.8710801393728222,
4
+ "eval_loss": 0.3399865925312042,
5
+ "eval_runtime": 4.1257,
6
+ "eval_samples_per_second": 69.563,
7
+ "eval_steps_per_second": 2.181
8
  }
runs/Apr08_12-28-18_90600695b4f6/events.out.tfevents.1712579455.90600695b4f6.424.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cc40f8b4bca792e8fbced46149a3d458393cfd165500ade4d9c5441d0278c94
3
+ size 405
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 3206422579175424.0,
4
- "train_loss": 0.2824457089106242,
5
- "train_runtime": 11.3219,
6
- "train_samples_per_second": 11.394,
7
- "train_steps_per_second": 0.265
8
  }
 
1
  {
2
+ "epoch": 2.96,
3
+ "total_flos": 1.9045723068223488e+17,
4
+ "train_loss": 0.657797618707021,
5
+ "train_runtime": 145.8955,
6
+ "train_samples_per_second": 53.113,
7
+ "train_steps_per_second": 0.411
8
  }
trainer_state.json CHANGED
@@ -1,56 +1,98 @@
1
  {
2
- "best_metric": 1.0,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-2",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 3,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 1.0,
13
- "eval_accuracy": 0.2,
14
- "eval_loss": 0.7171379923820496,
15
- "eval_runtime": 0.288,
16
- "eval_samples_per_second": 17.359,
17
- "eval_steps_per_second": 3.472,
18
- "step": 1
19
- },
20
- {
21
- "epoch": 2.0,
22
- "eval_accuracy": 1.0,
23
- "eval_loss": 0.541394829750061,
24
- "eval_runtime": 0.2716,
25
- "eval_samples_per_second": 18.413,
26
- "eval_steps_per_second": 3.683,
27
- "step": 2
28
- },
29
- {
30
- "epoch": 3.0,
31
- "eval_accuracy": 1.0,
32
- "eval_loss": 0.4680565893650055,
33
- "eval_runtime": 0.3396,
34
- "eval_samples_per_second": 14.723,
35
- "eval_steps_per_second": 2.945,
36
- "step": 3
37
- },
38
- {
39
- "epoch": 3.0,
40
- "step": 3,
41
- "total_flos": 3206422579175424.0,
42
- "train_loss": 0.2824457089106242,
43
- "train_runtime": 11.3219,
44
- "train_samples_per_second": 11.394,
45
- "train_steps_per_second": 0.265
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  }
47
  ],
48
  "logging_steps": 10,
49
- "max_steps": 3,
50
  "num_input_tokens_seen": 0,
51
  "num_train_epochs": 3,
52
  "save_steps": 500,
53
- "total_flos": 3206422579175424.0,
54
  "train_batch_size": 32,
55
  "trial_name": null,
56
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.8710801393728222,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-60",
4
+ "epoch": 2.962962962962963,
5
  "eval_steps": 500,
6
+ "global_step": 60,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.49,
13
+ "grad_norm": 9.358732223510742,
14
+ "learning_rate": 4.62962962962963e-05,
15
+ "loss": 1.259,
16
+ "step": 10
17
+ },
18
+ {
19
+ "epoch": 0.99,
20
+ "grad_norm": 11.161949157714844,
21
+ "learning_rate": 3.7037037037037037e-05,
22
+ "loss": 0.8451,
23
+ "step": 20
24
+ },
25
+ {
26
+ "epoch": 0.99,
27
+ "eval_accuracy": 0.7874564459930313,
28
+ "eval_loss": 0.5740640163421631,
29
+ "eval_runtime": 4.4336,
30
+ "eval_samples_per_second": 64.733,
31
+ "eval_steps_per_second": 2.03,
32
+ "step": 20
33
+ },
34
+ {
35
+ "epoch": 1.48,
36
+ "grad_norm": 13.122177124023438,
37
+ "learning_rate": 2.777777777777778e-05,
38
+ "loss": 0.581,
39
+ "step": 30
40
+ },
41
+ {
42
+ "epoch": 1.98,
43
+ "grad_norm": 10.2821044921875,
44
+ "learning_rate": 1.8518518518518518e-05,
45
+ "loss": 0.4621,
46
+ "step": 40
47
+ },
48
+ {
49
+ "epoch": 1.98,
50
+ "eval_accuracy": 0.8048780487804879,
51
+ "eval_loss": 0.45788925886154175,
52
+ "eval_runtime": 4.1854,
53
+ "eval_samples_per_second": 68.572,
54
+ "eval_steps_per_second": 2.15,
55
+ "step": 40
56
+ },
57
+ {
58
+ "epoch": 2.47,
59
+ "grad_norm": 12.540511131286621,
60
+ "learning_rate": 9.259259259259259e-06,
61
+ "loss": 0.4259,
62
+ "step": 50
63
+ },
64
+ {
65
+ "epoch": 2.96,
66
+ "grad_norm": 6.045067310333252,
67
+ "learning_rate": 0.0,
68
+ "loss": 0.3736,
69
+ "step": 60
70
+ },
71
+ {
72
+ "epoch": 2.96,
73
+ "eval_accuracy": 0.8710801393728222,
74
+ "eval_loss": 0.3399865925312042,
75
+ "eval_runtime": 4.397,
76
+ "eval_samples_per_second": 65.272,
77
+ "eval_steps_per_second": 2.047,
78
+ "step": 60
79
+ },
80
+ {
81
+ "epoch": 2.96,
82
+ "step": 60,
83
+ "total_flos": 1.9045723068223488e+17,
84
+ "train_loss": 0.657797618707021,
85
+ "train_runtime": 145.8955,
86
+ "train_samples_per_second": 53.113,
87
+ "train_steps_per_second": 0.411
88
  }
89
  ],
90
  "logging_steps": 10,
91
+ "max_steps": 60,
92
  "num_input_tokens_seen": 0,
93
  "num_train_epochs": 3,
94
  "save_steps": 500,
95
+ "total_flos": 1.9045723068223488e+17,
96
  "train_batch_size": 32,
97
  "trial_name": null,
98
  "trial_params": null