Fastspeech2_HS / Unified_parser /extract_words.py
utkarsh2299's picture
Upload 97 files
2c8dc05 verified
raw
history blame
690 Bytes
import os
import shutil
import sys

from joblib import Parallel, delayed
from tqdm import tqdm

from uparser import wordparse
num_jobs = 20  # not referenced by the code below; kept in case other code reads it
infolder = 'Original'
outfolder = 'Words'


def reset_dir(path):
    """Delete *path* and everything in it if it exists, then recreate it empty."""
    if os.path.exists(path):
        shutil.rmtree(path)
    os.mkdir(path)


def _output_stem(fname):
    """Return the output base name for *fname*, or None if it has no '_'.

    The stem is whatever follows the first underscore, cut at the next
    underscore and then at the first '.', e.g. 'lex_hindi.txt' -> 'hindi'.
    """
    parts = fname.split('_')
    if len(parts) < 2:
        return None
    return parts[1].split('.')[0]


def extract_words(src_dir, dst_dir):
    """Write the first tab-separated column of every file in *src_dir*.

    For each regular file named '<prefix>_<stem>...' in *src_dir*, a file
    '<stem>.words' is created in *dst_dir* holding one line per input line:
    the stripped line's text up to its first tab. Blank input lines are
    kept as empty output lines, so line numbers stay aligned with the input.

    Entries that are not regular files, or whose name has no underscore,
    are reported on stderr and skipped instead of aborting the run.

    Args:
        src_dir: directory containing the tab-separated input files.
        dst_dir: existing directory that receives the '.words' files.

    Returns:
        The list of stems written, in processing (sorted file name) order.
    """
    written = []
    # Sorted so that, if two inputs map to the same stem, the one that wins
    # is the same on every run (os.listdir order is arbitrary).
    for fname in sorted(os.listdir(src_dir)):
        src_path = os.path.join(src_dir, fname)
        stem = _output_stem(fname)
        if stem is None or not os.path.isfile(src_path):
            print(f'skipping {fname!r}: not a <prefix>_<name> file',
                  file=sys.stderr)
            continue

        # Explicit UTF-8 so the result does not depend on the platform's
        # default codec (assumes the inputs are UTF-8 -- confirm if the
        # corpus uses another encoding).
        with open(src_path, 'r', encoding='utf-8') as f:
            words = [line.strip().split('\t')[0] for line in f]

        print(stem)
        dst_path = os.path.join(dst_dir, f'{stem}.words')
        with open(dst_path, 'w', encoding='utf-8') as f:
            f.writelines(w + '\n' for w in words)
        written.append(stem)
    return written


def main():
    """Recreate the output folder and extract the word lists into it."""
    reset_dir(outfolder)
    extract_words(infolder, outfolder)


if __name__ == '__main__':
    main()