Update README.md
Browse files
fix chars_to_ignore weirdness
README.md
CHANGED
|
@@ -86,7 +86,7 @@ processor = Wav2Vec2Processor.from_pretrained("ceyda/wav2vec2-large-xlsr-53-turk
|
|
| 86 |
model = Wav2Vec2ForCTC.from_pretrained("ceyda/wav2vec2-large-xlsr-53-turkish")
|
| 87 |
model.to("cuda")
|
| 88 |
|
| 89 |
-
chars_to_ignore_regex = '[
|
| 90 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
| 91 |
|
| 92 |
# Preprocessing the datasets.
|
|
|
|
| 86 |
model = Wav2Vec2ForCTC.from_pretrained("ceyda/wav2vec2-large-xlsr-53-turkish")
|
| 87 |
model.to("cuda")
|
| 88 |
|
| 89 |
+
chars_to_ignore_regex = '[\,\?\.\!\-\;\:\"\“\‘\”\'\`…\]\[\’»«]'
|
| 90 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
| 91 |
|
| 92 |
# Preprocessing the datasets.
|