Video_translation_with_speaker_diarization_and_voice_cloning_private

Build error

vitaliy-sharandin committed on Nov 20, 2023

Commit

79c8716

•

1 Parent(s): 0657ec1

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -18,10 +18,10 @@ DEEPL_TOKEN = os.environ["DEEPL_TOKEN"]
 # Download video from Youtube
 def download_youtube_video(url):
- yt = YouTube(url)
- stream = yt.streams.filter(file_extension='mp4').first()
- output_path = stream.download()
- return output_path
 # Extract audio from video
@@ -54,7 +54,7 @@ def speech_diarization(audio_path, hf_token):
  import gc; gc.collect(); torch.cuda.empty_cache(); del model_a
  # 3. Assign speaker labels
- diarize_model = whisperx.DiarizationPipeline(model_name='pyannote/speaker-diarization@2.1', use_auth_token=hf_token, device=device)
  # add min/max number of speakers if known
  diarize_segments = diarize_model(audio)

 # Download video from Youtube
 def download_youtube_video(url):
+ yt = YouTube(url)
+ stream = yt.streams.filter(file_extension='mp4').first()
+ output_path = stream.download()
+ return output_path
 # Extract audio from video
  import gc; gc.collect(); torch.cuda.empty_cache(); del model_a
  # 3. Assign speaker labels
+ diarize_model = whisperx.DiarizationPipeline(use_auth_token=hf_token, device=device)
  # add min/max number of speakers if known
  diarize_segments = diarize_model(audio)