MehdiHosseiniMoghadam
committed on
Commit
•
9c268f9
1
Parent(s):
fd6be2f
Update README.md
Browse files
README.md
CHANGED
@@ -106,7 +106,7 @@ model = Wav2Vec2ForCTC.from_pretrained("MehdiHosseiniMoghadam/wav2vec2-large-xls
|
|
106 |
|
107 |
model.to("cuda")
|
108 |
|
109 |
-
chars_to_ignore_regex = '[
|
110 |
|
111 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
112 |
|
@@ -170,4 +170,8 @@ print("WER: {:2f}".format(100 * wer.compute(predictions=result["pred_strings"],
|
|
170 |
|
171 |
## Training
|
172 |
|
173 |
-
|
|
|
|
|
|
|
|
|
|
106 |
|
107 |
model.to("cuda")
|
108 |
|
109 |
+
chars_to_ignore_regex = '[\\,\\?\\.\\!\\-\\;\\:\\"\\“\\%\\‘\\”\\�]'
|
110 |
|
111 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
112 |
|
|
|
170 |
|
171 |
## Training
|
172 |
|
173 |
+
10% of the Common Voice `train` and `validation` datasets were used for training.
|
174 |
+
|
175 |
+
## Testing
|
176 |
+
|
177 |
+
10% of the Common Voice `Test` dataset was used for testing.
|