Edmon02 committed on
Commit
ac770e6
1 Parent(s): 031ac88

Training in progress, step 1000

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "Edmon02/speecht5_finetuned_voxpopuli_hy",
3
  "activation_dropout": 0.1,
4
  "apply_spec_augment": true,
5
  "architectures": [
@@ -65,8 +65,8 @@
65
  "mask_time_min_masks": 2,
66
  "mask_time_prob": 0.05,
67
  "max_length": 1876,
68
- "max_speech_positions": 1876,
69
- "max_text_positions": 600,
70
  "model_type": "speecht5",
71
  "num_conv_pos_embedding_groups": 16,
72
  "num_conv_pos_embeddings": 128,
@@ -85,8 +85,8 @@
85
  "speech_decoder_prenet_layers": 2,
86
  "speech_decoder_prenet_units": 256,
87
  "torch_dtype": "float32",
88
- "transformers_version": "4.41.2",
89
  "use_cache": false,
90
  "use_guided_attention_loss": true,
91
- "vocab_size": 81
92
  }
 
1
  {
2
+ "_name_or_path": "Edmon02/speecht5_finetuned_hy",
3
  "activation_dropout": 0.1,
4
  "apply_spec_augment": true,
5
  "architectures": [
 
65
  "mask_time_min_masks": 2,
66
  "mask_time_prob": 0.05,
67
  "max_length": 1876,
68
+ "max_speech_positions": 5000,
69
+ "max_text_positions": 450,
70
  "model_type": "speecht5",
71
  "num_conv_pos_embedding_groups": 16,
72
  "num_conv_pos_embeddings": 128,
 
85
  "speech_decoder_prenet_layers": 2,
86
  "speech_decoder_prenet_units": 256,
87
  "torch_dtype": "float32",
88
+ "transformers_version": "4.43.3",
89
  "use_cache": false,
90
  "use_guided_attention_loss": true,
91
+ "vocab_size": 113
92
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32f9a69172e75e08308b3f562c2e1cf418669803b80f28271143272d80093702
3
- size 577789320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcb953c9e4c9b83629b0ad8d6160ba4e2526f95bcd2212f26110092e86843639
3
+ size 577887624
runs/Aug04_08-59-32_ip-10-192-12-187/events.out.tfevents.1722761976.ip-10-192-12-187.1938.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f39d0354f68e3fa73a8429b8af616ca1ff458a4cde3f9240e72544d387d13e93
3
+ size 15285
special_tokens_map.json CHANGED
@@ -1,13 +1,6 @@
1
  {
2
  "bos_token": "<s>",
3
  "eos_token": "</s>",
4
- "mask_token": {
5
- "content": "<mask>",
6
- "lstrip": true,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false
10
- },
11
  "pad_token": "<pad>",
12
  "unk_token": "<unk>"
13
  }
 
1
  {
2
  "bos_token": "<s>",
3
  "eos_token": "</s>",
 
 
 
 
 
 
 
4
  "pad_token": "<pad>",
5
  "unk_token": "<unk>"
6
  }
spm_char.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fcc48f3e225f627b1641db410ceb0c8649bd2b0c982e150b03f8be3728ab560
3
- size 238473
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1243a12f5c03b26a40f902255c52cea7977ff9990b98885d3146fe0e22991831
3
+ size 238893
tokenizer_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "added_tokens_decoder": {
3
  "0": {
4
- "content": "<s>",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
@@ -9,7 +9,7 @@
9
  "special": true
10
  },
11
  "1": {
12
- "content": "<pad>",
13
  "lstrip": false,
14
  "normalized": false,
15
  "rstrip": false,
@@ -17,7 +17,7 @@
17
  "special": true
18
  },
19
  "2": {
20
- "content": "</s>",
21
  "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
@@ -25,35 +25,18 @@
25
  "special": true
26
  },
27
  "3": {
28
- "content": "<unk>",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
32
  "single_word": false,
33
  "special": true
34
- },
35
- "79": {
36
- "content": "<mask>",
37
- "lstrip": true,
38
- "normalized": true,
39
- "rstrip": false,
40
- "single_word": false,
41
- "special": true
42
- },
43
- "80": {
44
- "content": "<ctc_blank>",
45
- "lstrip": false,
46
- "normalized": true,
47
- "rstrip": false,
48
- "single_word": false,
49
- "special": false
50
  }
51
  },
52
  "bos_token": "<s>",
53
  "clean_up_tokenization_spaces": true,
54
  "eos_token": "</s>",
55
- "mask_token": "<mask>",
56
- "model_max_length": 600,
57
  "normalize": false,
58
  "pad_token": "<pad>",
59
  "processor_class": "SpeechT5Processor",
 
1
  {
2
  "added_tokens_decoder": {
3
  "0": {
4
+ "content": "<pad>",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
 
9
  "special": true
10
  },
11
  "1": {
12
+ "content": "</s>",
13
  "lstrip": false,
14
  "normalized": false,
15
  "rstrip": false,
 
17
  "special": true
18
  },
19
  "2": {
20
+ "content": "<unk>",
21
  "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
 
25
  "special": true
26
  },
27
  "3": {
28
+ "content": "<s>",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
32
  "single_word": false,
33
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  }
35
  },
36
  "bos_token": "<s>",
37
  "clean_up_tokenization_spaces": true,
38
  "eos_token": "</s>",
39
+ "model_max_length": 1000000000000000019884624838656,
 
40
  "normalize": false,
41
  "pad_token": "<pad>",
42
  "processor_class": "SpeechT5Processor",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1867ab2b1a9bebcaa1925e158b8a2b0bb8a542e47de1be77a5ed2c7c78a84c5
3
- size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f90c0e8244ed36c999c3e1f377ffce46397c67784893a7c27b81785e7a43aeea
3
+ size 5368