Spaces:
No application file
No application file
File size: 823 Bytes
b5dba8a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 |
import os
import numpy
import torch
import torchaudio
from hubert.customtokenizer import CustomTokenizer
from hubert.pre_kmeans_hubert import CustomHubert
def test_hubert(path: str, model: str = 'model/hubert/hubert_base_ls960.pt', tokenizer: str = 'model.pth'):
hubert_model = CustomHubert(checkpoint_path=model)
customtokenizer = CustomTokenizer.load_from_checkpoint(os.path.join(path, tokenizer))
wav, sr = torchaudio.load(os.path.join(path, 'test', 'wav.wav'))
original = numpy.load(os.path.join(path, 'test', 'semantic.npy'))
out = hubert_model.forward(wav, input_sample_hz=sr)
out_tokenized = customtokenizer.get_token(out)
# print(out.shape, out_tokenized.shape)
print(original[:-1], out_tokenized)
numpy.save(os.path.join(path, 'test', 'gen_semantic.npy'), out_tokenized)
|