joaoalvarenga
committed on
Commit
•
98fedef
1
Parent(s):
2c9efbe
Update README.md
Browse files
README.md
CHANGED
@@ -93,7 +93,7 @@ processor = Wav2Vec2Processor.from_pretrained("joorock12/wav2vec2-large-xlsr-por
|
|
93 |
model = Wav2Vec2ForCTC.from_pretrained("joorock12/wav2vec2-large-xlsr-portuguese")
|
94 |
model.to("cuda")
|
95 |
|
96 |
-
chars_to_ignore_regex = '[
|
97 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
98 |
|
99 |
# Preprocessing the datasets.
|
@@ -123,7 +123,7 @@ result = test_dataset.map(evaluate, batched=True, batch_size=8)
|
|
123 |
print("WER: {:2f}".format(100 * wer.compute(predictions=result["pred_strings"], references=result["sentence"])))
|
124 |
```
|
125 |
|
126 |
-
**Test Result (wer)
|
127 |
|
128 |
|
129 |
## Training
|
|
|
93 |
model = Wav2Vec2ForCTC.from_pretrained("joorock12/wav2vec2-large-xlsr-portuguese")
|
94 |
model.to("cuda")
|
95 |
|
96 |
+
chars_to_ignore_regex = '[\\,\\?\\.\\!\\-\\;\\:\\"\\“\\'\\�]'
|
97 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
98 |
|
99 |
# Preprocessing the datasets.
|
|
|
123 |
print("WER: {:2f}".format(100 * wer.compute(predictions=result["pred_strings"], references=result["sentence"])))
|
124 |
```
|
125 |
|
126 |
+
**Test Result (wer)**: 15.734702%
|
127 |
|
128 |
|
129 |
## Training
|