Gizachew committed on Apr 12

Commit

ec7e849

•

1 Parent(s): 9ce3233

End of training

Browse files

Files changed (20) hide show

README.md +64 -0
all_results.json +9 -0
config.json +93 -0
model.safetensors +3 -0
preprocessor_config.json +9 -0
runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712938183.6c0ec431eb03.34.0 +3 -0
runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712939900.6c0ec431eb03.34.1 +3 -0
runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940214.6c0ec431eb03.34.2 +3 -0
runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940242.6c0ec431eb03.34.3 +3 -0
runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940289.6c0ec431eb03.34.4 +3 -0
runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940482.6c0ec431eb03.34.5 +3 -0
runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940519.6c0ec431eb03.34.6 +3 -0
runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940671.6c0ec431eb03.34.7 +3 -0
runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712941086.6c0ec431eb03.34.8 +3 -0
runs/Apr12_16-58-56_6c0ec431eb03/events.out.tfevents.1712941164.6c0ec431eb03.34.9 +3 -0
runs/Apr12_17-02-10_6c0ec431eb03/events.out.tfevents.1712941348.6c0ec431eb03.34.10 +3 -0
runs/Apr12_17-17-03_6c0ec431eb03/events.out.tfevents.1712942228.6c0ec431eb03.34.11 +3 -0
train_results.json +9 -0
trainer_state.json +132 -0
training_args.bin +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,64 @@

+---
+license: apache-2.0
+base_model: facebook/hubert-base-ls960
+tags:
+- generated_from_trainer
+metrics:
+- accuracy
+model-index:
+- name: ckpts
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# ckpts
+This model is a fine-tuned version of [facebook/hubert-base-ls960](https://huggingface.co/facebook/hubert-base-ls960) on an unknown dataset.
+It achieves the following results on the evaluation set:
+- Loss: 0.1910
+- Accuracy: 0.9697
+## Model description
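+HuBERT base (`facebook/hubert-base-ls960`) with a mean-pooled speech-classification head (`HubertForSpeechClassification`) that predicts one of five labels: Neutral, Fearful, Happy, Sad, Angry. Input audio is expected at a 16 kHz sampling rate.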
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 1e-05
+- train_batch_size: 4
+- eval_batch_size: 4
+- seed: 42
+- gradient_accumulation_steps: 2
+- total_train_batch_size: 8
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- num_epochs: 5.0
+- mixed_precision_training: Native AMP
+### Training results
+| Training Loss | Epoch | Step | Validation Loss | Accuracy |
+|:-------------:|:-----:|:----:|:---------------:|:--------:|
+| 0.0228        | 2.02  | 500  | 0.1773          | 0.9737   |
+| 0.0385        | 4.04  | 1000 | 0.1910          | 0.9697   |
+### Framework versions
+- Transformers 4.40.0.dev0
+- Pytorch 2.1.2
+- Datasets 2.18.1.dev0
+- Tokenizers 0.15.2

all_results.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "epoch": 4.99,
+    "total_flos": 3.160649695892544e+17,
+    "train_loss": 0.03992950008948322,
+    "train_runtime": 666.1547,
+    "train_samples": 1979,
+    "train_samples_per_second": 14.854,
+    "train_steps_per_second": 1.854
+}

config.json ADDED Viewed

	@@ -0,0 +1,93 @@

+{
+  "_name_or_path": "facebook/hubert-base-ls960",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": true,
+  "architectures": [
+    "HubertForSpeechClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_dropout": 0.0,
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.1,
+  "feat_proj_layer_norm": true,
+  "final_dropout": 0.1,
+  "finetuning_task": "wav2vec2_clf",
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "01Neutral",
+    "1": "02Fearful",
+    "2": "03Happy",
+    "3": "04Sad",
+    "4": "05Angry"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "01Neutral": 0,
+    "02Fearful": 1,
+    "03Happy": 2,
+    "04Sad": 3,
+    "05Angry": 4
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.1,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "pooling_mode": "mean",
+  "problem_type": "single_label_classification",
+  "tokenizer_class": "Wav2Vec2CTCTokenizer",
+  "torch_dtype": "float32",
+  "transformers_version": "4.40.0.dev0",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9d0debed0760df769d15ac8682084547cc2c5e3cc04ab2f3880eafb91150c315
+size 379890236

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": true,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712938183.6c0ec431eb03.34.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cdcff2c21cd7f636d16377c28120e72a5ac1fa8cc3bb0e2eeabae20537f34203
+size 5852

runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712939900.6c0ec431eb03.34.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b5a26b3cf658a40031ab93cd221b1b85f63d448d90769cd6ebb026ae8000a109
+size 5852

runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940214.6c0ec431eb03.34.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:42c6e5e2b531bef51b9a1303b98309a19bf20aa3e65a7ef0c43525bf8d31ea96
+size 5852

runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940242.6c0ec431eb03.34.3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7aa7443b5c435809a0a78667e31a4b04019df27788ed5d224e4c4baca446f28f
+size 5901

runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940289.6c0ec431eb03.34.4 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7dcc8bceed9ca96ab476010eb4b5cf67083ae7f47d9aa983484707f7d9866ba0
+size 5901

runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940482.6c0ec431eb03.34.5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc1355b1381c53cf6d4686bb1e90599724bb30f23b5ee8c50b7dc0b8248286d2
+size 5901

runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940519.6c0ec431eb03.34.6 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:55481ceeb53a61c1b9145543cf11fd6c32b8b375f90a52f7c3279e2172c49b70
+size 5901

runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712940671.6c0ec431eb03.34.7 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:763299b2ea96af62e59c0c7cd6e45fc7c0fec7810d2143e0f4df56fd0b62235c
+size 5901

runs/Apr12_16-09-39_6c0ec431eb03/events.out.tfevents.1712941086.6c0ec431eb03.34.8 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:789d74ec93d39b683919e14627f5569d54d5624eb84ec44cec62a169ba53c70d
+size 5901

runs/Apr12_16-58-56_6c0ec431eb03/events.out.tfevents.1712941164.6c0ec431eb03.34.9 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d32147e7aba5a7843309f6903031ae02315424ed1e2ea6707f32f1536dad38c8
+size 8204

runs/Apr12_17-02-10_6c0ec431eb03/events.out.tfevents.1712941348.6c0ec431eb03.34.10 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d7ac6b5b4834e9ba4c703845d7ae5c501441e9dafdb437ea7b401aa5889f912e
+size 25289

runs/Apr12_17-17-03_6c0ec431eb03/events.out.tfevents.1712942228.6c0ec431eb03.34.11 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:97b4720817badaf1e0159123c5a6324b528b7c3e563172f2b8fe1d151b38260b
+size 9476

train_results.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "epoch": 4.99,
+    "total_flos": 3.160649695892544e+17,
+    "train_loss": 0.03992950008948322,
+    "train_runtime": 666.1547,
+    "train_samples": 1979,
+    "train_samples_per_second": 14.854,
+    "train_steps_per_second": 1.854
+}

trainer_state.json ADDED Viewed

	@@ -0,0 +1,132 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 4.98989898989899,
+  "eval_steps": 500,
+  "global_step": 1235,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.4,
+      "grad_norm": 0.006182590499520302,
+      "learning_rate": 9.206477732793523e-06,
+      "loss": 0.0729,
+      "step": 100
+    },
+    {
+      "epoch": 0.81,
+      "grad_norm": 21.23886489868164,
+      "learning_rate": 8.39676113360324e-06,
+      "loss": 0.0698,
+      "step": 200
+    },
+    {
+      "epoch": 1.21,
+      "grad_norm": 0.006576939485967159,
+      "learning_rate": 7.587044534412956e-06,
+      "loss": 0.0464,
+      "step": 300
+    },
+    {
+      "epoch": 1.62,
+      "grad_norm": 0.009822617284953594,
+      "learning_rate": 6.785425101214575e-06,
+      "loss": 0.0689,
+      "step": 400
+    },
+    {
+      "epoch": 2.02,
+      "grad_norm": 0.00560363894328475,
+      "learning_rate": 5.975708502024292e-06,
+      "loss": 0.0228,
+      "step": 500
+    },
+    {
+      "epoch": 2.02,
+      "eval_accuracy": 0.973737359046936,
+      "eval_loss": 0.17728736996650696,
+      "eval_runtime": 23.1344,
+      "eval_samples_per_second": 21.397,
+      "eval_steps_per_second": 5.36,
+      "step": 500
+    },
+    {
+      "epoch": 2.42,
+      "grad_norm": 0.010259171947836876,
+      "learning_rate": 5.165991902834009e-06,
+      "loss": 0.0253,
+      "step": 600
+    },
+    {
+      "epoch": 2.83,
+      "grad_norm": 0.5489621758460999,
+      "learning_rate": 4.356275303643725e-06,
+      "loss": 0.0227,
+      "step": 700
+    },
+    {
+      "epoch": 3.23,
+      "grad_norm": 0.003071287414059043,
+      "learning_rate": 3.5465587044534415e-06,
+      "loss": 0.0398,
+      "step": 800
+    },
+    {
+      "epoch": 3.64,
+      "grad_norm": 0.0034055381547659636,
+      "learning_rate": 2.7368421052631583e-06,
+      "loss": 0.0299,
+      "step": 900
+    },
+    {
+      "epoch": 4.04,
+      "grad_norm": 0.005517472513020039,
+      "learning_rate": 1.9271255060728746e-06,
+      "loss": 0.0385,
+      "step": 1000
+    },
+    {
+      "epoch": 4.04,
+      "eval_accuracy": 0.9696969985961914,
+      "eval_loss": 0.190963014960289,
+      "eval_runtime": 23.4329,
+      "eval_samples_per_second": 21.124,
+      "eval_steps_per_second": 5.292,
+      "step": 1000
+    },
+    {
+      "epoch": 4.44,
+      "grad_norm": 19.359519958496094,
+      "learning_rate": 1.1174089068825912e-06,
+      "loss": 0.0365,
+      "step": 1100
+    },
+    {
+      "epoch": 4.85,
+      "grad_norm": 1.323317527770996,
+      "learning_rate": 3.0769230769230774e-07,
+      "loss": 0.0064,
+      "step": 1200
+    },
+    {
+      "epoch": 4.99,
+      "step": 1235,
+      "total_flos": 3.160649695892544e+17,
+      "train_loss": 0.03992950008948322,
+      "train_runtime": 666.1547,
+      "train_samples_per_second": 14.854,
+      "train_steps_per_second": 1.854
+    }
+  ],
+  "logging_steps": 100,
+  "max_steps": 1235,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 3.160649695892544e+17,
+  "train_batch_size": 4,
+  "trial_name": null,
+  "trial_params": null
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f507758a89624d13b7bed17a703fed0e8a853809c160f6b3fee91839d462fc37
+size 4984