Model save

Browse files

Files changed (5) hide show

README.md +18 -8
generation_config.json +3 -12
model-00001-of-00002.safetensors +1 -1
model-00002-of-00002.safetensors +1 -1
runs/Aug20_11-34-00_DITEC2014063010/events.out.tfevents.1724164511.DITEC2014063010.27248.0 +2 -2

README.md CHANGED Viewed

@@ -1,4 +1,5 @@
 ---
 license: apache-2.0
 base_model: openai/whisper-large-v3
 tags:
@@ -22,7 +23,7 @@ model-index:
     metrics:
     - name: Wer
       type: wer
-      value: 0.10366752081998719
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +33,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [openai/whisper-large-v3](https://huggingface.co/openai/whisper-large-v3) on the common_voice_18_0 dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.1486
-- Wer: 0.1037
 ## Model description
@@ -56,24 +57,33 @@ The following hyperparameters were used during training:
 - train_batch_size: 8
 - eval_batch_size: 8
 - seed: 42
-- gradient_accumulation_steps: 32
-- total_train_batch_size: 256
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 1000
-- num_epochs: 2.0
 - mixed_precision_training: Native AMP
 ### Training results
 | Training Loss | Epoch  | Step | Validation Loss | Wer    |
 |:-------------:|:------:|:----:|:---------------:|:------:|
-| 0.13          | 0.9998 | 691  | 0.1486          | 0.1037 |
 ### Framework versions
-- Transformers 4.44.0.dev0
 - Pytorch 2.4.0+cu124
 - Datasets 2.18.1.dev0
 - Tokenizers 0.19.1

 ---
+library_name: transformers
 license: apache-2.0
 base_model: openai/whisper-large-v3
 tags:
     metrics:
     - name: Wer
       type: wer
+      value: 0.10419602818705957
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 This model is a fine-tuned version of [openai/whisper-large-v3](https://huggingface.co/openai/whisper-large-v3) on the common_voice_18_0 dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.2671
+- Wer: 0.1042
 ## Model description
 - train_batch_size: 8
 - eval_batch_size: 8
 - seed: 42
+- gradient_accumulation_steps: 4
+- total_train_batch_size: 32
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 1000
+- num_epochs: 10.0
 - mixed_precision_training: Native AMP
 ### Training results
 | Training Loss | Epoch  | Step | Validation Loss | Wer    |
 |:-------------:|:------:|:----:|:---------------:|:------:|
+| 0.1388        | 0.9996 | 691  | 0.1501          | 0.1074 |
+| 0.108         | 1.9993 | 1382 | 0.1619          | 0.1153 |
+| 0.091         | 2.9989 | 2073 | 0.1697          | 0.1124 |
+| 0.0461        | 4.0    | 2765 | 0.1764          | 0.1120 |
+| 0.0264        | 4.9996 | 3456 | 0.2024          | 0.1133 |
+| 0.0203        | 5.9993 | 4147 | 0.2200          | 0.1099 |
+| 0.0129        | 6.9989 | 4838 | 0.2277          | 0.1114 |
+| 0.0091        | 8.0    | 5530 | 0.2552          | 0.1067 |
+| 0.0063        | 8.9996 | 6221 | 0.2565          | 0.1054 |
+| 0.0019        | 9.9964 | 6910 | 0.2671          | 0.1042 |
 ### Framework versions
+- Transformers 4.45.0.dev0
 - Pytorch 2.4.0+cu124
 - Datasets 2.18.1.dev0
 - Tokenizers 0.19.1

generation_config.json CHANGED Viewed

@@ -48,16 +48,6 @@
   "bos_token_id": 50257,
   "decoder_start_token_id": 50258,
   "eos_token_id": 50257,
-  "forced_decoder_ids": [
-    [
-      1,
-      null
-    ],
-    [
-      2,
-      50360
-    ]
-  ],
   "is_multilingual": true,
   "lang_to_id": {
     "<|af|>": 50327,
@@ -161,7 +151,7 @@
     "<|yue|>": 50358,
     "<|zh|>": 50260
   },
-  "language": "<|pt|>",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50364,
@@ -258,9 +248,10 @@
     50362,
     50363
   ],
   "task_to_id": {
     "transcribe": 50360,
     "translate": 50359
   },
-  "transformers_version": "4.44.0.dev0"
 }

   "bos_token_id": 50257,
   "decoder_start_token_id": 50258,
   "eos_token_id": 50257,
   "is_multilingual": true,
   "lang_to_id": {
     "<|af|>": 50327,
     "<|yue|>": 50358,
     "<|zh|>": 50260
   },
+  "language": "portuguese",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50364,
     50362,
     50363
   ],
+  "task": "transcribe",
   "task_to_id": {
     "transcribe": 50360,
     "translate": 50359
   },
+  "transformers_version": "4.45.0.dev0"
 }

model-00001-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:524e5d905ac451a424fcd908db2e019cc0c8127f75d9ddc60f72eb9e8c820905
 size 4993448880

 version https://git-lfs.github.com/spec/v1
+oid sha256:d0d8543f8a343cf6bd7d5acea5735e038153f225305548ad9147e66d092130fd
 size 4993448880

model-00002-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dffabf943db6878e36e9ec8c9f8d318d8be564694a0294ca3c9ccdaccb18bae2
 size 1180663192

 version https://git-lfs.github.com/spec/v1
+oid sha256:86eb946aa1f18d3940a43139960cc047edc7ac2addae69ac7012130eb797baa6
 size 1180663192

runs/Aug20_11-34-00_DITEC2014063010/events.out.tfevents.1724164511.DITEC2014063010.27248.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:094f803784c837c850ecbc36ee536ab49a222e38a170277aa75622860688921d
-size 67173

 version https://git-lfs.github.com/spec/v1
+oid sha256:cd31673c00dee3b5d966fc2e0d3187041e316f31dc7b87e1207763f5907c9fab
+size 67527