speech-to-speech-translation

Sleeping

arroyadr committed on Aug 26, 2023

Commit

75ec919

1 Parent(s): f9ada4e

updated translation model

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,7 +9,8 @@ from transformers import SpeechT5ForTextToSpeech, SpeechT5HifiGan, SpeechT5Proce
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 # load speech translation checkpoint
-asr_pipe = pipeline("automatic-speech-recognition", model="openai/whisper-base", device=device)
 # load text-to-speech checkpoint and speaker embeddings
 processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")

 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 # load speech translation checkpoint
+# asr_pipe = pipeline("automatic-speech-recognition", model="openai/whisper-base", device=device)
+asr_pipe = pipeline("automatic-speech-recognition", model="thunninoi/wav2vec2-japanese-vtuber", device=device)
 # load text-to-speech checkpoint and speaker embeddings
 processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")