griffio commited on
Commit
0d55b9f
1 Parent(s): 7eae467

rotated_maps

Browse files
README.md CHANGED
@@ -24,7 +24,7 @@ model-index:
24
  metrics:
25
  - name: Accuracy
26
  type: accuracy
27
- value: 1.0
28
  ---
29
 
30
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -34,8 +34,8 @@ should probably proofread and complete it, then remove this comment. -->
34
 
35
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the rotated_maps dataset.
36
  It achieves the following results on the evaluation set:
37
- - Loss: 0.1515
38
- - Accuracy: 1.0
39
 
40
  ## Model description
41
 
@@ -67,7 +67,7 @@ The following hyperparameters were used during training:
67
 
68
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
69
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
70
- | 0.0386 | 12.5 | 100 | 0.1515 | 1.0 |
71
 
72
 
73
  ### Framework versions
 
24
  metrics:
25
  - name: Accuracy
26
  type: accuracy
27
+ value: 0.875
28
  ---
29
 
30
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the rotated_maps dataset.
36
  It achieves the following results on the evaluation set:
37
+ - Loss: 0.5177
38
+ - Accuracy: 0.875
39
 
40
  ## Model description
41
 
 
67
 
68
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
69
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
70
+ | 0.1009 | 12.5 | 100 | 0.5177 | 0.875 |
71
 
72
 
73
  ### Framework versions
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 15.0,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.1515045166015625,
5
- "eval_runtime": 0.092,
6
- "eval_samples_per_second": 76.101,
7
- "eval_steps_per_second": 10.872,
8
- "total_flos": 4.417241350846464e+16,
9
- "train_loss": 0.08117741694053014,
10
- "train_runtime": 27.1137,
11
- "train_samples_per_second": 21.023,
12
- "train_steps_per_second": 4.426
13
  }
 
1
  {
2
  "epoch": 15.0,
3
+ "eval_accuracy": 0.875,
4
+ "eval_loss": 0.5177230834960938,
5
+ "eval_runtime": 0.1273,
6
+ "eval_samples_per_second": 62.83,
7
+ "eval_steps_per_second": 7.854,
8
+ "total_flos": 4.64972773773312e+16,
9
+ "train_loss": 0.45015646318594615,
10
+ "train_runtime": 30.2968,
11
+ "train_samples_per_second": 19.804,
12
+ "train_steps_per_second": 3.961
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 15.0,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.1515045166015625,
5
- "eval_runtime": 0.092,
6
- "eval_samples_per_second": 76.101,
7
- "eval_steps_per_second": 10.872
8
  }
 
1
  {
2
  "epoch": 15.0,
3
+ "eval_accuracy": 0.875,
4
+ "eval_loss": 0.5177230834960938,
5
+ "eval_runtime": 0.1273,
6
+ "eval_samples_per_second": 62.83,
7
+ "eval_steps_per_second": 7.854
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec300bee5b7dde99c4801ee26ecb64e50738f69095e1b8d86fbc34f204f96153
3
  size 343239356
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:624e1b227a433f765e4f11185a40c7bb3c8df1343071ee4c8ee0e1e20a8d84e1
3
  size 343239356
runs/Oct29_20-25-38_3e04bab4dd1f/events.out.tfevents.1730233547.3e04bab4dd1f.943.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bed54ae20228aceff93dd0913002cfc7cba4052841e376c2c8ae424d5e3d23f
3
+ size 8300
runs/Oct29_20-25-38_3e04bab4dd1f/events.out.tfevents.1730233581.3e04bab4dd1f.943.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:315ced64c36dfa9ca028f47f5703e599bc4491b6b7dcef04ada114fa0ebb8da0
3
+ size 405
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 15.0,
3
- "total_flos": 4.417241350846464e+16,
4
- "train_loss": 0.08117741694053014,
5
- "train_runtime": 27.1137,
6
- "train_samples_per_second": 21.023,
7
- "train_steps_per_second": 4.426
8
  }
 
1
  {
2
  "epoch": 15.0,
3
+ "total_flos": 4.64972773773312e+16,
4
+ "train_loss": 0.45015646318594615,
5
+ "train_runtime": 30.2968,
6
+ "train_samples_per_second": 19.804,
7
+ "train_steps_per_second": 3.961
8
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.1515045166015625,
3
  "best_model_checkpoint": "vit-base-patch16-224-in21k-rotated-dungeons-v3/checkpoint-100",
4
  "epoch": 15.0,
5
  "eval_steps": 100,
@@ -10,105 +10,105 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.25,
13
- "grad_norm": 0.588030219078064,
14
  "learning_rate": 0.00018333333333333334,
15
- "loss": 0.2001,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 2.5,
20
- "grad_norm": 0.40187984704971313,
21
  "learning_rate": 0.0001666666666666667,
22
- "loss": 0.2121,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 3.75,
27
- "grad_norm": 0.26918885111808777,
28
  "learning_rate": 0.00015000000000000001,
29
- "loss": 0.1179,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 5.0,
34
- "grad_norm": 0.2864986062049866,
35
  "learning_rate": 0.00013333333333333334,
36
- "loss": 0.0755,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 6.25,
41
- "grad_norm": 0.20267005264759064,
42
  "learning_rate": 0.00011666666666666668,
43
- "loss": 0.0641,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 7.5,
48
- "grad_norm": 0.24064351618289948,
49
  "learning_rate": 0.0001,
50
- "loss": 0.0523,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 8.75,
55
- "grad_norm": 0.15450333058834076,
56
  "learning_rate": 8.333333333333334e-05,
57
- "loss": 0.0487,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 10.0,
62
- "grad_norm": 0.3064187467098236,
63
  "learning_rate": 6.666666666666667e-05,
64
- "loss": 0.0447,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 11.25,
69
- "grad_norm": 0.23561660945415497,
70
  "learning_rate": 5e-05,
71
- "loss": 0.043,
72
  "step": 90
73
  },
74
  {
75
  "epoch": 12.5,
76
- "grad_norm": 0.19291207194328308,
77
  "learning_rate": 3.3333333333333335e-05,
78
- "loss": 0.0386,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 12.5,
83
- "eval_accuracy": 1.0,
84
- "eval_loss": 0.1515045166015625,
85
- "eval_runtime": 0.0635,
86
- "eval_samples_per_second": 110.175,
87
- "eval_steps_per_second": 15.739,
88
  "step": 100
89
  },
90
  {
91
  "epoch": 13.75,
92
- "grad_norm": 0.14135047793388367,
93
  "learning_rate": 1.6666666666666667e-05,
94
- "loss": 0.0402,
95
  "step": 110
96
  },
97
  {
98
  "epoch": 15.0,
99
- "grad_norm": 0.2867968678474426,
100
  "learning_rate": 0.0,
101
- "loss": 0.037,
102
  "step": 120
103
  },
104
  {
105
  "epoch": 15.0,
106
  "step": 120,
107
- "total_flos": 4.417241350846464e+16,
108
- "train_loss": 0.08117741694053014,
109
- "train_runtime": 27.1137,
110
- "train_samples_per_second": 21.023,
111
- "train_steps_per_second": 4.426
112
  }
113
  ],
114
  "logging_steps": 10,
@@ -128,7 +128,7 @@
128
  "attributes": {}
129
  }
130
  },
131
- "total_flos": 4.417241350846464e+16,
132
  "train_batch_size": 5,
133
  "trial_name": null,
134
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.5177230834960938,
3
  "best_model_checkpoint": "vit-base-patch16-224-in21k-rotated-dungeons-v3/checkpoint-100",
4
  "epoch": 15.0,
5
  "eval_steps": 100,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.25,
13
+ "grad_norm": 2.4491872787475586,
14
  "learning_rate": 0.00018333333333333334,
15
+ "loss": 1.7253,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 2.5,
20
+ "grad_norm": 2.151639461517334,
21
  "learning_rate": 0.0001666666666666667,
22
+ "loss": 1.2096,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 3.75,
27
+ "grad_norm": 1.7387666702270508,
28
  "learning_rate": 0.00015000000000000001,
29
+ "loss": 0.8385,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 5.0,
34
+ "grad_norm": 1.5225492715835571,
35
  "learning_rate": 0.00013333333333333334,
36
+ "loss": 0.4285,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 6.25,
41
+ "grad_norm": 0.6194241046905518,
42
  "learning_rate": 0.00011666666666666668,
43
+ "loss": 0.322,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 7.5,
48
+ "grad_norm": 0.9321300387382507,
49
  "learning_rate": 0.0001,
50
+ "loss": 0.1986,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 8.75,
55
+ "grad_norm": 0.4772986173629761,
56
  "learning_rate": 8.333333333333334e-05,
57
+ "loss": 0.1683,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 10.0,
62
+ "grad_norm": 0.4312579929828644,
63
  "learning_rate": 6.666666666666667e-05,
64
+ "loss": 0.1219,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 11.25,
69
+ "grad_norm": 0.34619101881980896,
70
  "learning_rate": 5e-05,
71
+ "loss": 0.1029,
72
  "step": 90
73
  },
74
  {
75
  "epoch": 12.5,
76
+ "grad_norm": 0.330285906791687,
77
  "learning_rate": 3.3333333333333335e-05,
78
+ "loss": 0.1009,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 12.5,
83
+ "eval_accuracy": 0.875,
84
+ "eval_loss": 0.5177230834960938,
85
+ "eval_runtime": 0.0932,
86
+ "eval_samples_per_second": 85.814,
87
+ "eval_steps_per_second": 10.727,
88
  "step": 100
89
  },
90
  {
91
  "epoch": 13.75,
92
+ "grad_norm": 0.5117152333259583,
93
  "learning_rate": 1.6666666666666667e-05,
94
+ "loss": 0.0982,
95
  "step": 110
96
  },
97
  {
98
  "epoch": 15.0,
99
+ "grad_norm": 0.43090176582336426,
100
  "learning_rate": 0.0,
101
+ "loss": 0.0872,
102
  "step": 120
103
  },
104
  {
105
  "epoch": 15.0,
106
  "step": 120,
107
+ "total_flos": 4.64972773773312e+16,
108
+ "train_loss": 0.45015646318594615,
109
+ "train_runtime": 30.2968,
110
+ "train_samples_per_second": 19.804,
111
+ "train_steps_per_second": 3.961
112
  }
113
  ],
114
  "logging_steps": 10,
 
128
  "attributes": {}
129
  }
130
  },
131
+ "total_flos": 4.64972773773312e+16,
132
  "train_batch_size": 5,
133
  "trial_name": null,
134
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c92f29ff6847d0e143af11ce92e7c695b999cab35edef2863bd027c51ded0a06
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fb2cc2648216541e9edbb969fa04031be3e7fa72f8bc658c167a01a32d323e1
3
  size 5240