bayartsogt committed on
Commit
1de0fb7
1 Parent(s): 23378e6

editing regex

Browse files
Files changed (1) hide show
  1. README.md +2 -1
README.md CHANGED
@@ -86,7 +86,8 @@ processor = Wav2Vec2Processor.from_pretrained("bayartsogt/wav2vec2-large-xlsr-mo
86
  model = Wav2Vec2ForCTC.from_pretrained("bayartsogt/wav2vec2-large-xlsr-mongolian")
87
  model.to("cuda")
88
 
89
- chars_to_ignore_regex = '[\,\?\.\!\-\;\:\"\“]' # TODO: adapt this list to include all special characters you removed from the data
 
90
  resampler = torchaudio.transforms.Resample(48_000, 16_000)
91
 
92
  # Preprocessing the datasets.
 
86
  model = Wav2Vec2ForCTC.from_pretrained("bayartsogt/wav2vec2-large-xlsr-mongolian")
87
  model.to("cuda")
88
 
89
+ chars_to_ignore_regex = '[\,\?\.\!\-\;\:\"\“\%\‘\”\�\'h\«\»]'
90
+
91
  resampler = torchaudio.transforms.Resample(48_000, 16_000)
92
 
93
  # Preprocessing the datasets.