Commit
·
8a268aa
1
Parent(s):
8c1c4f2
Done
Browse files- config.json +21 -20
- optimizer.pt +2 -2
- preprocessor_config.json +0 -1
- pytorch_model.bin +2 -2
- rng_state.pth +1 -1
- runs/Sep19_06-49-13_vision-gpu-1/1663570168.217734/events.out.tfevents.1663570168.vision-gpu-1.17728.1 +3 -0
- runs/Sep19_06-49-13_vision-gpu-1/events.out.tfevents.1663570168.vision-gpu-1.17728.0 +3 -0
- runs/Sep19_07-05-01_vision-gpu-1/1663571119.45767/events.out.tfevents.1663571119.vision-gpu-1.19945.1 +3 -0
- runs/Sep19_07-05-01_vision-gpu-1/events.out.tfevents.1663571119.vision-gpu-1.19945.0 +3 -0
- runs/Sep19_07-09-02_vision-gpu-1/1663571352.04798/events.out.tfevents.1663571352.vision-gpu-1.21751.1 +3 -0
- runs/Sep19_07-09-02_vision-gpu-1/1663572282.0390873/events.out.tfevents.1663572282.vision-gpu-1.21751.3 +3 -0
- runs/Sep19_07-09-02_vision-gpu-1/events.out.tfevents.1663571352.vision-gpu-1.21751.0 +3 -0
- runs/Sep19_07-09-02_vision-gpu-1/events.out.tfevents.1663572282.vision-gpu-1.21751.2 +3 -0
- scaler.pt +1 -1
- scheduler.pt +1 -1
- trainer_state.json +50 -65
- training_args.bin +1 -1
config.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
-
"activation_dropout": 0.
|
4 |
"adapter_kernel_size": 3,
|
5 |
"adapter_stride": 2,
|
6 |
"add_adapter": false,
|
@@ -49,35 +49,37 @@
|
|
49 |
"feat_extract_activation": "gelu",
|
50 |
"feat_extract_dropout": 0.0,
|
51 |
"feat_extract_norm": "layer",
|
52 |
-
"feat_proj_dropout": 0.
|
53 |
"feat_quantizer_dropout": 0.0,
|
54 |
"final_dropout": 0.0,
|
55 |
"finetuning_task": "wav2vec2_clf",
|
56 |
"hidden_act": "gelu",
|
57 |
-
"hidden_dropout": 0.
|
58 |
"hidden_size": 1024,
|
59 |
"id2label": {
|
60 |
"0": "angry",
|
61 |
-
"1": "
|
62 |
-
"2": "
|
63 |
-
"3": "
|
64 |
-
"4": "
|
65 |
-
"5": "
|
66 |
-
"6": "
|
|
|
67 |
},
|
68 |
"initializer_range": 0.02,
|
69 |
"intermediate_size": 4096,
|
70 |
"label2id": {
|
71 |
"angry": 0,
|
72 |
-
"
|
73 |
-
"
|
74 |
-
"
|
75 |
-
"
|
76 |
-
"
|
77 |
-
"
|
|
|
78 |
},
|
79 |
"layer_norm_eps": 1e-05,
|
80 |
-
"layerdrop": 0.
|
81 |
"mask_channel_length": 10,
|
82 |
"mask_channel_min_space": 1,
|
83 |
"mask_channel_other": 0.0,
|
@@ -103,11 +105,10 @@
|
|
103 |
"num_hidden_layers": 24,
|
104 |
"num_negatives": 100,
|
105 |
"output_hidden_size": 1024,
|
106 |
-
"pad_token_id":
|
107 |
"pooling_mode": "mean",
|
108 |
"problem_type": "single_label_classification",
|
109 |
"proj_codevector_dim": 256,
|
110 |
-
"push_to_hub": true,
|
111 |
"tdnn_dilation": [
|
112 |
1,
|
113 |
2,
|
@@ -132,6 +133,6 @@
|
|
132 |
"torch_dtype": "float32",
|
133 |
"transformers_version": "4.23.0.dev0",
|
134 |
"use_weighted_layer_sum": false,
|
135 |
-
"vocab_size":
|
136 |
"xvector_output_dim": 512
|
137 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "lighteternal/wav2vec2-large-xlsr-53-greek",
|
3 |
+
"activation_dropout": 0.0,
|
4 |
"adapter_kernel_size": 3,
|
5 |
"adapter_stride": 2,
|
6 |
"add_adapter": false,
|
|
|
49 |
"feat_extract_activation": "gelu",
|
50 |
"feat_extract_dropout": 0.0,
|
51 |
"feat_extract_norm": "layer",
|
52 |
+
"feat_proj_dropout": 0.0,
|
53 |
"feat_quantizer_dropout": 0.0,
|
54 |
"final_dropout": 0.0,
|
55 |
"finetuning_task": "wav2vec2_clf",
|
56 |
"hidden_act": "gelu",
|
57 |
+
"hidden_dropout": 0.1,
|
58 |
"hidden_size": 1024,
|
59 |
"id2label": {
|
60 |
"0": "angry",
|
61 |
+
"1": "calm",
|
62 |
+
"2": "disgust",
|
63 |
+
"3": "fearful",
|
64 |
+
"4": "happy",
|
65 |
+
"5": "neutral",
|
66 |
+
"6": "sad",
|
67 |
+
"7": "surprised"
|
68 |
},
|
69 |
"initializer_range": 0.02,
|
70 |
"intermediate_size": 4096,
|
71 |
"label2id": {
|
72 |
"angry": 0,
|
73 |
+
"calm": 1,
|
74 |
+
"disgust": 2,
|
75 |
+
"fearful": 3,
|
76 |
+
"happy": 4,
|
77 |
+
"neutral": 5,
|
78 |
+
"sad": 6,
|
79 |
+
"surprised": 7
|
80 |
},
|
81 |
"layer_norm_eps": 1e-05,
|
82 |
+
"layerdrop": 0.1,
|
83 |
"mask_channel_length": 10,
|
84 |
"mask_channel_min_space": 1,
|
85 |
"mask_channel_other": 0.0,
|
|
|
105 |
"num_hidden_layers": 24,
|
106 |
"num_negatives": 100,
|
107 |
"output_hidden_size": 1024,
|
108 |
+
"pad_token_id": 54,
|
109 |
"pooling_mode": "mean",
|
110 |
"problem_type": "single_label_classification",
|
111 |
"proj_codevector_dim": 256,
|
|
|
112 |
"tdnn_dilation": [
|
113 |
1,
|
114 |
2,
|
|
|
133 |
"torch_dtype": "float32",
|
134 |
"transformers_version": "4.23.0.dev0",
|
135 |
"use_weighted_layer_sum": false,
|
136 |
+
"vocab_size": 55,
|
137 |
"xvector_output_dim": 512
|
138 |
}
|
optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ebb6b6119110351be64f39f20826294fb7a16faeb39b79f1e56721d08f2ca7
|
3 |
+
size 2498522121
|
preprocessor_config.json
CHANGED
@@ -4,7 +4,6 @@
|
|
4 |
"feature_size": 1,
|
5 |
"padding_side": "right",
|
6 |
"padding_value": 0.0,
|
7 |
-
"processor_class": "Wav2Vec2ProcessorWithLM",
|
8 |
"return_attention_mask": true,
|
9 |
"sampling_rate": 16000
|
10 |
}
|
|
|
4 |
"feature_size": 1,
|
5 |
"padding_side": "right",
|
6 |
"padding_value": 0.0,
|
|
|
7 |
"return_attention_mask": true,
|
8 |
"sampling_rate": 16000
|
9 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21fe72d43c31b3044b1ec946fa3b32078ed99dea846cd0192a26856bb9c839e6
|
3 |
+
size 1266130541
|
rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14567
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f449ee5f1d7ffb1d2e2b47df15b3e8c0e25a55972ba52ec93a6b01f10b6ecec
|
3 |
size 14567
|
runs/Sep19_06-49-13_vision-gpu-1/1663570168.217734/events.out.tfevents.1663570168.vision-gpu-1.17728.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74ce15e161c8076653200576506a6c02c8d9d019904893fab0a075edf7883cce
|
3 |
+
size 5619
|
runs/Sep19_06-49-13_vision-gpu-1/events.out.tfevents.1663570168.vision-gpu-1.17728.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d158eaf6fb80de8795509d501ecc6422dc95f54baa66500671e571a591c7cf3
|
3 |
+
size 5811
|
runs/Sep19_07-05-01_vision-gpu-1/1663571119.45767/events.out.tfevents.1663571119.vision-gpu-1.19945.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0047a28ef3742f208728d55bafaed7605ce5763719f4c5295a3989398a26a8c9
|
3 |
+
size 5619
|
runs/Sep19_07-05-01_vision-gpu-1/events.out.tfevents.1663571119.vision-gpu-1.19945.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d651c7a4b87cd493f626b15d113dc2473c68251f506b14f8af184f109388efb5
|
3 |
+
size 4136
|
runs/Sep19_07-09-02_vision-gpu-1/1663571352.04798/events.out.tfevents.1663571352.vision-gpu-1.21751.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b24252725af424f1ef4733b51d8d6ce4773990249725e01ab8967a84819ab669
|
3 |
+
size 5619
|
runs/Sep19_07-09-02_vision-gpu-1/1663572282.0390873/events.out.tfevents.1663572282.vision-gpu-1.21751.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dffc2ea835e3ac9f4c0fc77b22843913d664c12008658e4bb88b9411c8a1a58a
|
3 |
+
size 5619
|
runs/Sep19_07-09-02_vision-gpu-1/events.out.tfevents.1663571352.vision-gpu-1.21751.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:323671afbabaf7e4e0e8b5f69ca861dfac2f63d5baef43e844cdf1818b8c4696
|
3 |
+
size 10874
|
runs/Sep19_07-09-02_vision-gpu-1/events.out.tfevents.1663572282.vision-gpu-1.21751.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67115331847d53ad55880cf40877aa5c3ba1ebb7863c0e2db3882d224d6ddb7c
|
3 |
+
size 8265
|
scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 559
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5340902b17e35966e7e8d13c891b4a72edbb8cbd01bf429032179aa2bf58052
|
3 |
size 559
|
scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 623
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9112768c193dcd7407fa487c3348c49ebdeabbef697849491bcfab0bd57910e
|
3 |
size 623
|
trainer_state.json
CHANGED
@@ -1,106 +1,91 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
9 |
"log_history": [
|
10 |
{
|
11 |
-
"epoch": 0.
|
12 |
-
"learning_rate":
|
13 |
-
"loss": 1.
|
14 |
"step": 10
|
15 |
},
|
16 |
{
|
17 |
-
"epoch": 0.
|
18 |
-
"eval_accuracy": 0.
|
19 |
-
"eval_loss": 1.
|
20 |
-
"eval_runtime":
|
21 |
-
"eval_samples_per_second": 4.
|
22 |
-
"eval_steps_per_second": 1.
|
23 |
"step": 10
|
24 |
},
|
25 |
{
|
26 |
-
"epoch": 0.
|
27 |
-
"learning_rate":
|
28 |
-
"loss": 1.
|
29 |
"step": 20
|
30 |
},
|
31 |
{
|
32 |
-
"epoch": 0.
|
33 |
-
"eval_accuracy": 0.
|
34 |
-
"eval_loss": 1.
|
35 |
-
"eval_runtime":
|
36 |
-
"eval_samples_per_second": 4.
|
37 |
-
"eval_steps_per_second": 1.
|
38 |
"step": 20
|
39 |
},
|
40 |
{
|
41 |
-
"epoch": 0.
|
42 |
-
"learning_rate":
|
43 |
-
"loss": 1.
|
44 |
"step": 30
|
45 |
},
|
46 |
{
|
47 |
-
"epoch": 0.
|
48 |
-
"eval_accuracy": 0.
|
49 |
-
"eval_loss": 1.
|
50 |
-
"eval_runtime":
|
51 |
-
"eval_samples_per_second": 4.
|
52 |
-
"eval_steps_per_second": 1.
|
53 |
"step": 30
|
54 |
},
|
55 |
{
|
56 |
-
"epoch": 0.
|
57 |
-
"learning_rate":
|
58 |
-
"loss": 1.
|
59 |
"step": 40
|
60 |
},
|
61 |
{
|
62 |
-
"epoch": 0.
|
63 |
-
"eval_accuracy": 0.
|
64 |
-
"eval_loss": 1.
|
65 |
-
"eval_runtime":
|
66 |
-
"eval_samples_per_second": 4.
|
67 |
-
"eval_steps_per_second": 1.
|
68 |
"step": 40
|
69 |
},
|
70 |
{
|
71 |
-
"epoch":
|
72 |
-
"learning_rate":
|
73 |
-
"loss": 1.
|
74 |
"step": 50
|
75 |
},
|
76 |
{
|
77 |
-
"epoch":
|
78 |
-
"eval_accuracy": 0.
|
79 |
-
"eval_loss": 1.
|
80 |
-
"eval_runtime":
|
81 |
-
"eval_samples_per_second":
|
82 |
-
"eval_steps_per_second":
|
83 |
"step": 50
|
84 |
-
},
|
85 |
-
{
|
86 |
-
"epoch": 1.39,
|
87 |
-
"learning_rate": 6.511627906976745e-05,
|
88 |
-
"loss": 1.8197,
|
89 |
-
"step": 60
|
90 |
-
},
|
91 |
-
{
|
92 |
-
"epoch": 1.39,
|
93 |
-
"eval_accuracy": 0.35227271914482117,
|
94 |
-
"eval_loss": 1.6947021484375,
|
95 |
-
"eval_runtime": 21.8177,
|
96 |
-
"eval_samples_per_second": 4.033,
|
97 |
-
"eval_steps_per_second": 1.008,
|
98 |
-
"step": 60
|
99 |
}
|
100 |
],
|
101 |
-
"max_steps":
|
102 |
-
"num_train_epochs":
|
103 |
-
"total_flos": 1.
|
104 |
"trial_name": null,
|
105 |
"trial_params": null
|
106 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 0.5,
|
5 |
+
"global_step": 50,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
9 |
"log_history": [
|
10 |
{
|
11 |
+
"epoch": 0.1,
|
12 |
+
"learning_rate": 0.0,
|
13 |
+
"loss": 1.8457,
|
14 |
"step": 10
|
15 |
},
|
16 |
{
|
17 |
+
"epoch": 0.1,
|
18 |
+
"eval_accuracy": 0.23000000417232513,
|
19 |
+
"eval_loss": 1.845852017402649,
|
20 |
+
"eval_runtime": 42.6127,
|
21 |
+
"eval_samples_per_second": 4.693,
|
22 |
+
"eval_steps_per_second": 1.173,
|
23 |
"step": 10
|
24 |
},
|
25 |
{
|
26 |
+
"epoch": 0.2,
|
27 |
+
"learning_rate": 0.0,
|
28 |
+
"loss": 1.9441,
|
29 |
"step": 20
|
30 |
},
|
31 |
{
|
32 |
+
"epoch": 0.2,
|
33 |
+
"eval_accuracy": 0.23000000417232513,
|
34 |
+
"eval_loss": 1.845852017402649,
|
35 |
+
"eval_runtime": 42.6438,
|
36 |
+
"eval_samples_per_second": 4.69,
|
37 |
+
"eval_steps_per_second": 1.173,
|
38 |
"step": 20
|
39 |
},
|
40 |
{
|
41 |
+
"epoch": 0.3,
|
42 |
+
"learning_rate": 0.0,
|
43 |
+
"loss": 1.8242,
|
44 |
"step": 30
|
45 |
},
|
46 |
{
|
47 |
+
"epoch": 0.3,
|
48 |
+
"eval_accuracy": 0.23000000417232513,
|
49 |
+
"eval_loss": 1.845852017402649,
|
50 |
+
"eval_runtime": 42.8454,
|
51 |
+
"eval_samples_per_second": 4.668,
|
52 |
+
"eval_steps_per_second": 1.167,
|
53 |
"step": 30
|
54 |
},
|
55 |
{
|
56 |
+
"epoch": 0.4,
|
57 |
+
"learning_rate": 0.0,
|
58 |
+
"loss": 1.8451,
|
59 |
"step": 40
|
60 |
},
|
61 |
{
|
62 |
+
"epoch": 0.4,
|
63 |
+
"eval_accuracy": 0.23000000417232513,
|
64 |
+
"eval_loss": 1.845852017402649,
|
65 |
+
"eval_runtime": 42.5518,
|
66 |
+
"eval_samples_per_second": 4.7,
|
67 |
+
"eval_steps_per_second": 1.175,
|
68 |
"step": 40
|
69 |
},
|
70 |
{
|
71 |
+
"epoch": 0.5,
|
72 |
+
"learning_rate": 0.0,
|
73 |
+
"loss": 1.7465,
|
74 |
"step": 50
|
75 |
},
|
76 |
{
|
77 |
+
"epoch": 0.5,
|
78 |
+
"eval_accuracy": 0.23000000417232513,
|
79 |
+
"eval_loss": 1.845852017402649,
|
80 |
+
"eval_runtime": 42.3785,
|
81 |
+
"eval_samples_per_second": 4.719,
|
82 |
+
"eval_steps_per_second": 1.18,
|
83 |
"step": 50
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
84 |
}
|
85 |
],
|
86 |
+
"max_steps": 100,
|
87 |
+
"num_train_epochs": 1,
|
88 |
+
"total_flos": 1.4748389432630784e+17,
|
89 |
"trial_name": null,
|
90 |
"trial_params": null
|
91 |
}
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3439
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70a15c44c864138c37d3beb805073febdbcd67d33560564bdcb6bc07ab6c0653
|
3 |
size 3439
|