bark-cloning / test_hubert.py
jameshuntercarter's picture
Upload 24 files
b5dba8a
raw
history blame
823 Bytes
import os
import numpy
import torch
import torchaudio
from hubert.customtokenizer import CustomTokenizer
from hubert.pre_kmeans_hubert import CustomHubert
def test_hubert(path: str, model: str = 'model/hubert/hubert_base_ls960.pt', tokenizer: str = 'model.pth'):
hubert_model = CustomHubert(checkpoint_path=model)
customtokenizer = CustomTokenizer.load_from_checkpoint(os.path.join(path, tokenizer))
wav, sr = torchaudio.load(os.path.join(path, 'test', 'wav.wav'))
original = numpy.load(os.path.join(path, 'test', 'semantic.npy'))
out = hubert_model.forward(wav, input_sample_hz=sr)
out_tokenized = customtokenizer.get_token(out)
# print(out.shape, out_tokenized.shape)
print(original[:-1], out_tokenized)
numpy.save(os.path.join(path, 'test', 'gen_semantic.npy'), out_tokenized)