Lauler committed · verified
Commit 8d49820 · 1 Parent(s): 2980ad5

Add files using upload-large-folder tool

config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/leonardo_work/EUHPC_A01_006/models/whisper-small",
+  "_name_or_path": "/leonardo_work/EUHPC_A01_006/experiments_whisper/stage1_results/small/",
   "activation_dropout": 0.1,
   "activation_function": "gelu",
   "apply_spec_augment": false,
@@ -7,10 +7,7 @@
     "WhisperForConditionalGeneration"
   ],
   "attention_dropout": 0.0,
-  "begin_suppress_tokens": [
-    220,
-    50257
-  ],
+  "begin_suppress_tokens": null,
   "bos_token_id": 50257,
   "classifier_proj_size": 256,
   "d_model": 768,
@@ -34,7 +31,7 @@
   "mask_time_length": 10,
   "mask_time_min_masks": 2,
   "mask_time_prob": 0.05,
-  "max_length": 448,
+  "max_length": null,
   "max_source_positions": 1500,
   "max_target_positions": 448,
   "median_filter_width": 7,
@@ -44,7 +41,7 @@
   "pad_token_id": 50257,
   "scale_embedding": false,
   "torch_dtype": "float16",
-  "transformers_version": "4.37.2",
+  "transformers_version": "4.45.2",
   "use_cache": true,
   "use_weighted_layer_sum": false,
   "vocab_size": 51865
generation_config.json CHANGED
@@ -160,6 +160,7 @@
     "<|yo|>": 50325,
     "<|zh|>": 50260
   },
+  "language": "<|sv|>",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50363,
@@ -256,9 +257,10 @@
     50361,
     50362
   ],
+  "task": "transcribe",
   "task_to_id": {
     "transcribe": 50359,
     "translate": 50358
   },
-  "transformers_version": "4.37.2"
+  "transformers_version": "4.45.2"
 }
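The new "language": "<|sv|>" and "task": "transcribe" entries make Swedish transcription the default decoding behavior, so callers no longer need to pass language or task to generate(). A hedged usage sketch; the repo id and the silent stand-in audio are placeholders, not part of this commit:

```python
import numpy as np
from transformers import WhisperForConditionalGeneration, WhisperProcessor

# Placeholder repo id -- substitute the actual Hub repository for this model.
repo_id = "your-org/whisper-small-sv"

processor = WhisperProcessor.from_pretrained(repo_id)
model = WhisperForConditionalGeneration.from_pretrained(repo_id)

# One second of 16 kHz silence as stand-in audio.
audio = np.zeros(16000, dtype=np.float32)
inputs = processor(audio, sampling_rate=16000, return_tensors="pt")

# language="<|sv|>" and task="transcribe" are now defaults in
# generation_config.json, so no language/task kwargs are needed here.
ids = model.generate(inputs.input_features)
print(processor.batch_decode(ids, skip_special_tokens=True)[0])
```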
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4968b89aef05596bf9fcc61c01c8d483637ee788b51b02cfcc5e67e44bebde7b
+oid sha256:1bc6e9b8a0b42dba65026354cf6247e4b5dbe6a1a3a663d7f0a0d1f5ef3a3ae7
 size 563189936
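Only the LFS pointer's oid changed; the byte size is identical, so the new checkpoint swaps in weights with the same tensor shapes. A small sketch for verifying a downloaded model.safetensors against the new pointer (the local path is an assumption):

```python
import hashlib

# Assumed local path to the downloaded weights file.
path = "model.safetensors"

sha = hashlib.sha256()
with open(path, "rb") as f:
    for chunk in iter(lambda: f.read(1 << 20), b""):
        sha.update(chunk)

# Should equal the oid in the LFS pointer introduced by this commit.
expected = "1bc6e9b8a0b42dba65026354cf6247e4b5dbe6a1a3a663d7f0a0d1f5ef3a3ae7"
print(sha.hexdigest() == expected)
```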
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,5 +1,4 @@
 {
-  "add_bos_token": false,
   "add_prefix_space": true,
   "added_tokens_decoder": {
     "50257": {
@@ -12977,14 +12976,11 @@
     "<|notimestamps|>"
   ],
   "bos_token": "<|endoftext|>",
-  "clean_up_tokenization_spaces": true,
+  "clean_up_tokenization_spaces": false,
   "dropout": 0.2,
   "eos_token": "<|endoftext|>",
-  "errors": "replace",
-  "model_max_length": 1024,
+  "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<|endoftext|>",
-  "processor_class": "WhisperProcessor",
-  "return_attention_mask": false,
   "tokenizer_class": "WhisperTokenizer",
   "unk_token": "<|endoftext|>"
 }
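The new model_max_length value is transformers' VERY_LARGE_INTEGER sentinel, int(1e30), meaning no tokenizer-side truncation limit, replacing the previous hard cap of 1024. A quick check, assuming the same hypothetical local directory as in the earlier sketches:

```python
from transformers import WhisperTokenizer
from transformers.tokenization_utils_base import VERY_LARGE_INTEGER

# Same hypothetical local directory as in the earlier sketches.
tokenizer = WhisperTokenizer.from_pretrained("./whisper-small-sv")

# 1000000000000000019884624838656 == int(1e30), the library's
# "effectively unlimited" sentinel for model_max_length.
print(tokenizer.model_max_length == VERY_LARGE_INTEGER)  # True
```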