kurosekurose committed on
Commit
fff1067
1 Parent(s): 95025bf

Valence Only Train

Browse files
README.md CHANGED
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [facebook/wav2vec2-base](https://huggingface.co/facebook/wav2vec2-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.6840
21
- - Accuracy: 0.7324
22
 
23
  ## Model description
24
 
@@ -46,23 +46,28 @@ The following hyperparameters were used during training:
46
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
47
  - lr_scheduler_type: linear
48
  - lr_scheduler_warmup_steps: 1000
49
- - num_epochs: 10
50
  - mixed_precision_training: Native AMP
51
 
52
  ### Training results
53
 
54
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
55
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
56
- | 0.6966 | 1.0 | 269 | 0.6975 | 0.4366 |
57
- | 0.6903 | 2.0 | 538 | 0.6907 | 0.5915 |
58
- | 0.6738 | 3.0 | 807 | 0.6904 | 0.5634 |
59
- | 0.6383 | 4.0 | 1076 | 0.6504 | 0.5493 |
60
- | 0.5737 | 5.0 | 1345 | 0.6257 | 0.6901 |
61
- | 0.522 | 6.0 | 1614 | 0.6094 | 0.7042 |
62
- | 0.5022 | 7.0 | 1883 | 0.6444 | 0.7183 |
63
- | 0.4832 | 8.0 | 2152 | 0.6958 | 0.7042 |
64
- | 0.4683 | 9.0 | 2421 | 0.6627 | 0.7465 |
65
- | 0.4548 | 10.0 | 2690 | 0.6840 | 0.7324 |
 
 
 
 
 
66
 
67
 
68
  ### Framework versions
 
17
 
18
  This model is a fine-tuned version of [facebook/wav2vec2-base](https://huggingface.co/facebook/wav2vec2-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 1.1044
21
+ - Accuracy: 0.6761
22
 
23
  ## Model description
24
 
 
46
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
47
  - lr_scheduler_type: linear
48
  - lr_scheduler_warmup_steps: 1000
49
+ - num_epochs: 15
50
  - mixed_precision_training: Native AMP
51
 
52
  ### Training results
53
 
54
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
55
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
56
+ | 0.6979 | 1.0 | 269 | 0.6842 | 0.5915 |
57
+ | 0.69 | 2.0 | 538 | 0.6864 | 0.5775 |
58
+ | 0.6714 | 3.0 | 807 | 0.6900 | 0.5070 |
59
+ | 0.6357 | 4.0 | 1076 | 0.6514 | 0.5775 |
60
+ | 0.5678 | 5.0 | 1345 | 0.6612 | 0.6197 |
61
+ | 0.5152 | 6.0 | 1614 | 0.6496 | 0.6761 |
62
+ | 0.4826 | 7.0 | 1883 | 0.7743 | 0.6479 |
63
+ | 0.4707 | 8.0 | 2152 | 0.8348 | 0.6620 |
64
+ | 0.4742 | 9.0 | 2421 | 0.8808 | 0.6761 |
65
+ | 0.4857 | 10.0 | 2690 | 0.8734 | 0.7324 |
66
+ | 0.4779 | 11.0 | 2959 | 1.0206 | 0.6620 |
67
+ | 0.5063 | 12.0 | 3228 | 1.0737 | 0.6761 |
68
+ | 0.4776 | 13.0 | 3497 | 1.0966 | 0.6761 |
69
+ | 0.4716 | 14.0 | 3766 | 1.1046 | 0.6761 |
70
+ | 0.4672 | 15.0 | 4035 | 1.1044 | 0.6761 |
71
 
72
 
73
  ### Framework versions
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16c4131fbe73c8201bbf84f0ca6299d725d33ee5b0a38a81027d97f832ac652e
3
  size 379881432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04c6a107f5bdc6566453b272564bfbb800cb3105b7a444b642e21cd3007f558b
3
  size 379881432
runs/Feb07_10-30-11_9bea037ab619/events.out.tfevents.1707302062.9bea037ab619.513.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab1a5d238b24054183a7acfb3ee53b5300d81e11a2d78874a064c5fb32c61ee
3
+ size 13989
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.6094385981559753,
3
  "best_model_checkpoint": "/content/drive/MyDrive/AI_development/Musicbot/train_model/Valence-wav2vec2-base-EMOPIA/checkpoint-1614",
4
- "epoch": 10.0,
5
  "eval_steps": 500,
6
- "global_step": 2690,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -11,169 +11,244 @@
11
  {
12
  "epoch": 1.0,
13
  "learning_rate": 2.69e-07,
14
- "loss": 0.6966,
15
  "step": 269
16
  },
17
  {
18
  "epoch": 1.0,
19
- "eval_accuracy": 0.43661972880363464,
20
- "eval_loss": 0.6975200772285461,
21
- "eval_runtime": 41.5882,
22
- "eval_samples_per_second": 1.707,
23
- "eval_steps_per_second": 1.707,
24
  "step": 269
25
  },
26
  {
27
  "epoch": 2.0,
28
  "learning_rate": 5.38e-07,
29
- "loss": 0.6903,
30
  "step": 538
31
  },
32
  {
33
  "epoch": 2.0,
34
- "eval_accuracy": 0.591549277305603,
35
- "eval_loss": 0.6906841397285461,
36
- "eval_runtime": 42.4023,
37
- "eval_samples_per_second": 1.674,
38
- "eval_steps_per_second": 1.674,
39
  "step": 538
40
  },
41
  {
42
  "epoch": 3.0,
43
  "learning_rate": 8.070000000000001e-07,
44
- "loss": 0.6738,
45
  "step": 807
46
  },
47
  {
48
  "epoch": 3.0,
49
- "eval_accuracy": 0.5633803009986877,
50
- "eval_loss": 0.6904125213623047,
51
- "eval_runtime": 42.1763,
52
- "eval_samples_per_second": 1.683,
53
- "eval_steps_per_second": 1.683,
54
  "step": 807
55
  },
56
  {
57
  "epoch": 4.0,
58
- "learning_rate": 9.550295857988165e-07,
59
- "loss": 0.6383,
60
  "step": 1076
61
  },
62
  {
63
  "epoch": 4.0,
64
- "eval_accuracy": 0.5492957830429077,
65
- "eval_loss": 0.6504009366035461,
66
- "eval_runtime": 42.4689,
67
- "eval_samples_per_second": 1.672,
68
- "eval_steps_per_second": 1.672,
69
  "step": 1076
70
  },
71
  {
72
  "epoch": 5.0,
73
- "learning_rate": 7.970414201183432e-07,
74
- "loss": 0.5737,
75
  "step": 1345
76
  },
77
  {
78
  "epoch": 5.0,
79
- "eval_accuracy": 0.6901408433914185,
80
- "eval_loss": 0.6256533265113831,
81
- "eval_runtime": 42.7087,
82
- "eval_samples_per_second": 1.662,
83
- "eval_steps_per_second": 1.662,
84
  "step": 1345
85
  },
86
  {
87
  "epoch": 6.0,
88
- "learning_rate": 6.384615384615383e-07,
89
- "loss": 0.522,
90
  "step": 1614
91
  },
92
  {
93
  "epoch": 6.0,
94
- "eval_accuracy": 0.7042253613471985,
95
- "eval_loss": 0.6094385981559753,
96
- "eval_runtime": 42.2325,
97
- "eval_samples_per_second": 1.681,
98
- "eval_steps_per_second": 1.681,
99
  "step": 1614
100
  },
101
  {
102
  "epoch": 7.0,
103
- "learning_rate": 4.792899408284024e-07,
104
- "loss": 0.5022,
105
  "step": 1883
106
  },
107
  {
108
  "epoch": 7.0,
109
- "eval_accuracy": 0.7183098793029785,
110
- "eval_loss": 0.644359290599823,
111
- "eval_runtime": 42.6443,
112
- "eval_samples_per_second": 1.665,
113
- "eval_steps_per_second": 1.665,
114
  "step": 1883
115
  },
116
  {
117
  "epoch": 8.0,
118
- "learning_rate": 3.2011834319526625e-07,
119
- "loss": 0.4832,
120
  "step": 2152
121
  },
122
  {
123
  "epoch": 8.0,
124
- "eval_accuracy": 0.7042253613471985,
125
- "eval_loss": 0.6958394646644592,
126
- "eval_runtime": 42.8132,
127
- "eval_samples_per_second": 1.658,
128
- "eval_steps_per_second": 1.658,
129
  "step": 2152
130
  },
131
  {
132
  "epoch": 9.0,
133
- "learning_rate": 1.6153846153846155e-07,
134
- "loss": 0.4683,
135
  "step": 2421
136
  },
137
  {
138
  "epoch": 9.0,
139
- "eval_accuracy": 0.7464788556098938,
140
- "eval_loss": 0.66265869140625,
141
- "eval_runtime": 42.5503,
142
- "eval_samples_per_second": 1.669,
143
- "eval_steps_per_second": 1.669,
144
  "step": 2421
145
  },
146
  {
147
  "epoch": 10.0,
148
- "learning_rate": 2.3668639053254436e-09,
149
- "loss": 0.4548,
150
  "step": 2690
151
  },
152
  {
153
  "epoch": 10.0,
154
  "eval_accuracy": 0.7323943376541138,
155
- "eval_loss": 0.6839823126792908,
156
- "eval_runtime": 42.4148,
157
- "eval_samples_per_second": 1.674,
158
- "eval_steps_per_second": 1.674,
159
  "step": 2690
160
  },
161
  {
162
- "epoch": 10.0,
163
- "step": 2690,
164
- "total_flos": 3.85073061334848e+18,
165
- "train_loss": 0.5703220041267933,
166
- "train_runtime": 10535.0516,
167
- "train_samples_per_second": 0.766,
168
- "train_steps_per_second": 0.255
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
169
  }
170
  ],
171
  "logging_steps": 33,
172
- "max_steps": 2690,
173
  "num_input_tokens_seen": 0,
174
- "num_train_epochs": 10,
175
  "save_steps": 500,
176
- "total_flos": 3.85073061334848e+18,
177
  "train_batch_size": 1,
178
  "trial_name": null,
179
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.6496289968490601,
3
  "best_model_checkpoint": "/content/drive/MyDrive/AI_development/Musicbot/train_model/Valence-wav2vec2-base-EMOPIA/checkpoint-1614",
4
+ "epoch": 15.0,
5
  "eval_steps": 500,
6
+ "global_step": 4035,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
11
  {
12
  "epoch": 1.0,
13
  "learning_rate": 2.69e-07,
14
+ "loss": 0.6979,
15
  "step": 269
16
  },
17
  {
18
  "epoch": 1.0,
19
+ "eval_accuracy": 0.591549277305603,
20
+ "eval_loss": 0.6842264533042908,
21
+ "eval_runtime": 39.6409,
22
+ "eval_samples_per_second": 1.791,
23
+ "eval_steps_per_second": 1.791,
24
  "step": 269
25
  },
26
  {
27
  "epoch": 2.0,
28
  "learning_rate": 5.38e-07,
29
+ "loss": 0.69,
30
  "step": 538
31
  },
32
  {
33
  "epoch": 2.0,
34
+ "eval_accuracy": 0.577464759349823,
35
+ "eval_loss": 0.6864134073257446,
36
+ "eval_runtime": 39.1896,
37
+ "eval_samples_per_second": 1.812,
38
+ "eval_steps_per_second": 1.812,
39
  "step": 538
40
  },
41
  {
42
  "epoch": 3.0,
43
  "learning_rate": 8.070000000000001e-07,
44
+ "loss": 0.6714,
45
  "step": 807
46
  },
47
  {
48
  "epoch": 3.0,
49
+ "eval_accuracy": 0.5070422291755676,
50
+ "eval_loss": 0.6899517178535461,
51
+ "eval_runtime": 39.605,
52
+ "eval_samples_per_second": 1.793,
53
+ "eval_steps_per_second": 1.793,
54
  "step": 807
55
  },
56
  {
57
  "epoch": 4.0,
58
+ "learning_rate": 9.7495881383855e-07,
59
+ "loss": 0.6357,
60
  "step": 1076
61
  },
62
  {
63
  "epoch": 4.0,
64
+ "eval_accuracy": 0.577464759349823,
65
+ "eval_loss": 0.6513809561729431,
66
+ "eval_runtime": 39.4173,
67
+ "eval_samples_per_second": 1.801,
68
+ "eval_steps_per_second": 1.801,
69
  "step": 1076
70
  },
71
  {
72
  "epoch": 5.0,
73
+ "learning_rate": 8.86985172981878e-07,
74
+ "loss": 0.5678,
75
  "step": 1345
76
  },
77
  {
78
  "epoch": 5.0,
79
+ "eval_accuracy": 0.6197183132171631,
80
+ "eval_loss": 0.6612136363983154,
81
+ "eval_runtime": 39.8225,
82
+ "eval_samples_per_second": 1.783,
83
+ "eval_steps_per_second": 1.783,
84
  "step": 1345
85
  },
86
  {
87
  "epoch": 6.0,
88
+ "learning_rate": 7.986820428336078e-07,
89
+ "loss": 0.5152,
90
  "step": 1614
91
  },
92
  {
93
  "epoch": 6.0,
94
+ "eval_accuracy": 0.6760563254356384,
95
+ "eval_loss": 0.6496289968490601,
96
+ "eval_runtime": 39.8771,
97
+ "eval_samples_per_second": 1.78,
98
+ "eval_steps_per_second": 1.78,
99
  "step": 1614
100
  },
101
  {
102
  "epoch": 7.0,
103
+ "learning_rate": 7.100494233937397e-07,
104
+ "loss": 0.4826,
105
  "step": 1883
106
  },
107
  {
108
  "epoch": 7.0,
109
+ "eval_accuracy": 0.6478873491287231,
110
+ "eval_loss": 0.7743203639984131,
111
+ "eval_runtime": 40.2905,
112
+ "eval_samples_per_second": 1.762,
113
+ "eval_steps_per_second": 1.762,
114
  "step": 1883
115
  },
116
  {
117
  "epoch": 8.0,
118
+ "learning_rate": 6.217462932454694e-07,
119
+ "loss": 0.4707,
120
  "step": 2152
121
  },
122
  {
123
  "epoch": 8.0,
124
+ "eval_accuracy": 0.6619718074798584,
125
+ "eval_loss": 0.8347696661949158,
126
+ "eval_runtime": 40.5923,
127
+ "eval_samples_per_second": 1.749,
128
+ "eval_steps_per_second": 1.749,
129
  "step": 2152
130
  },
131
  {
132
  "epoch": 9.0,
133
+ "learning_rate": 5.331136738056013e-07,
134
+ "loss": 0.4742,
135
  "step": 2421
136
  },
137
  {
138
  "epoch": 9.0,
139
+ "eval_accuracy": 0.6760563254356384,
140
+ "eval_loss": 0.8807682394981384,
141
+ "eval_runtime": 40.1866,
142
+ "eval_samples_per_second": 1.767,
143
+ "eval_steps_per_second": 1.767,
144
  "step": 2421
145
  },
146
  {
147
  "epoch": 10.0,
148
+ "learning_rate": 4.448105436573311e-07,
149
+ "loss": 0.4857,
150
  "step": 2690
151
  },
152
  {
153
  "epoch": 10.0,
154
  "eval_accuracy": 0.7323943376541138,
155
+ "eval_loss": 0.8734177947044373,
156
+ "eval_runtime": 39.9771,
157
+ "eval_samples_per_second": 1.776,
158
+ "eval_steps_per_second": 1.776,
159
  "step": 2690
160
  },
161
  {
162
+ "epoch": 11.0,
163
+ "learning_rate": 3.561779242174629e-07,
164
+ "loss": 0.4779,
165
+ "step": 2959
166
+ },
167
+ {
168
+ "epoch": 11.0,
169
+ "eval_accuracy": 0.6619718074798584,
170
+ "eval_loss": 1.0206172466278076,
171
+ "eval_runtime": 40.0006,
172
+ "eval_samples_per_second": 1.775,
173
+ "eval_steps_per_second": 1.775,
174
+ "step": 2959
175
+ },
176
+ {
177
+ "epoch": 12.0,
178
+ "learning_rate": 2.675453047775947e-07,
179
+ "loss": 0.5063,
180
+ "step": 3228
181
+ },
182
+ {
183
+ "epoch": 12.0,
184
+ "eval_accuracy": 0.6760563254356384,
185
+ "eval_loss": 1.073710322380066,
186
+ "eval_runtime": 39.9745,
187
+ "eval_samples_per_second": 1.776,
188
+ "eval_steps_per_second": 1.776,
189
+ "step": 3228
190
+ },
191
+ {
192
+ "epoch": 13.0,
193
+ "learning_rate": 1.7891268533772652e-07,
194
+ "loss": 0.4776,
195
+ "step": 3497
196
+ },
197
+ {
198
+ "epoch": 13.0,
199
+ "eval_accuracy": 0.6760563254356384,
200
+ "eval_loss": 1.0966248512268066,
201
+ "eval_runtime": 40.123,
202
+ "eval_samples_per_second": 1.77,
203
+ "eval_steps_per_second": 1.77,
204
+ "step": 3497
205
+ },
206
+ {
207
+ "epoch": 14.0,
208
+ "learning_rate": 9.028006589785832e-08,
209
+ "loss": 0.4716,
210
+ "step": 3766
211
+ },
212
+ {
213
+ "epoch": 14.0,
214
+ "eval_accuracy": 0.6760563254356384,
215
+ "eval_loss": 1.1046380996704102,
216
+ "eval_runtime": 40.3,
217
+ "eval_samples_per_second": 1.762,
218
+ "eval_steps_per_second": 1.762,
219
+ "step": 3766
220
+ },
221
+ {
222
+ "epoch": 15.0,
223
+ "learning_rate": 1.6474464579901152e-09,
224
+ "loss": 0.4672,
225
+ "step": 4035
226
+ },
227
+ {
228
+ "epoch": 15.0,
229
+ "eval_accuracy": 0.6760563254356384,
230
+ "eval_loss": 1.104396939277649,
231
+ "eval_runtime": 40.5426,
232
+ "eval_samples_per_second": 1.751,
233
+ "eval_steps_per_second": 1.751,
234
+ "step": 4035
235
+ },
236
+ {
237
+ "epoch": 15.0,
238
+ "step": 4035,
239
+ "total_flos": 5.776095920022718e+18,
240
+ "train_loss": 0.5394472843061445,
241
+ "train_runtime": 15506.5237,
242
+ "train_samples_per_second": 0.781,
243
+ "train_steps_per_second": 0.26
244
  }
245
  ],
246
  "logging_steps": 33,
247
+ "max_steps": 4035,
248
  "num_input_tokens_seen": 0,
249
+ "num_train_epochs": 15,
250
  "save_steps": 500,
251
+ "total_flos": 5.776095920022718e+18,
252
  "train_batch_size": 1,
253
  "trial_name": null,
254
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:413b6a3dbe8fa45ca792fd830f325d5008bdc2602d7cb23dbf331fcfecef154a
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d63a66560e1fa67dbf66481ce72aaf977ec50451a25fa9c7940b58998863901f
3
  size 4856