Spaces:

rajesh1729
/

youtube-video-transcription-with-whisper

Running

App Files Files Community

rajesh1729 committed on Oct 28, 2024

Commit

d256ad9

verified ·

1 Parent(s): 1d8e620

Update app.py

Browse files

Files changed (1) hide show

app.py +26 -119

app.py CHANGED Viewed

@@ -1,139 +1,46 @@
-import yt_dlp
-import os
-import gradio as gr
-from transformers import pipeline
 import whisper
-import random
-import time
-def get_audio(url):  # download the audio for `url` with yt-dlp; returns 'audio_download.mp3'
-    try:
-        # Configure yt-dlp options without browser cookies
-        ydl_opts = {
-            'format': 'bestaudio/best',
-            'postprocessors': [{
-                'key': 'FFmpegExtractAudio',
-                'preferredcodec': 'mp3',
-                'preferredquality': '192',
-            }],
-            'outtmpl': 'audio_download.%(ext)s',  # must stay in sync with the hard-coded return value below
-            'quiet': True,
-            'no_warnings': True,
-            # Add basic user agent
-            'user_agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/118.0.0.0 Safari/537.36',
-            # Add other options to help avoid restrictions
-            'extractor_args': {'youtube': {
-                'player_client': ['android', 'web'],
-                'skip': ['dash', 'hls']
-            }},
-            # Add network options
-            'socket_timeout': 30,
-            'retries': 3,
-        }
-        # Add small delay to avoid rate limiting
-        time.sleep(random.uniform(1, 2))
-        # Download the audio
-        with yt_dlp.YoutubeDL(ydl_opts) as ydl:
-            info = ydl.extract_info(url, download=False)  # metadata lookup only (download=False)
-            duration = info.get('duration', 0)  # a missing duration defaults to 0 and passes the check below
-            # Check video duration (optional)
-            if duration > 1800:  # 30 minutes
-                raise gr.Error("Video is too long. Please use videos under 30 minutes.")  # NOTE(review): raised inside the try, so the handler below may re-wrap it as "Error downloading audio: ..." - confirm gr.Error subclasses Exception
-            ydl.download([url])  # the actual download
-        return 'audio_download.mp3'
-    except Exception as e:  # translate known failure messages into user-facing errors
-        if 'Sign in to confirm' in str(e):
-            raise gr.Error("This video requires age verification. Please try a different video.")
-        elif 'Private video' in str(e):
-            raise gr.Error("This video is private. Please try a public video.")
-        elif 'Video unavailable' in str(e):
-            raise gr.Error("This video is unavailable. Please check the URL and try again.")
-        else:
-            raise gr.Error(f"Error downloading audio: {str(e)}")  # fallback: surface the raw message
-# Load models
 model = whisper.load_model("base")  # Whisper "base" model, loaded once at module level
-summarizer = pipeline("summarization")  # no model argument is passed to the summarization pipeline
 def get_text(url):  # transcribe the video at `url`; returns the transcript text or an "Error: ..." string
-    try:
-        # Validate URL
-        if not url.startswith('https://www.youtube.com/') and not url.startswith('https://youtu.be/'):
-            raise gr.Error("Please enter a valid YouTube URL")  # NOTE(review): raised inside the try; presumably caught below and returned as "Error: ..." text - confirm
-        audio_file = get_audio(url)
-        result = model.transcribe(audio_file)
-        # Cleanup
-        try:
-            os.remove(audio_file)
-        except:  # best-effort cleanup: any failure to delete the file is ignored
-            pass
-        return result['text']
-    except Exception as e:  # failures are returned as text rather than raised
-        return f"Error: {str(e)}"
 def get_summary(url):  # summarize the transcript of the video at `url`; returns summary text or a message string
-    try:
-        article = get_text(url)
-        if isinstance(article, str) and article.startswith("Error:"):  # get_text reports failures as "Error: ..." strings; pass them through
-            return article
-        # Handle empty or short text
-        if not article or len(article.split()) < 30:  # fewer than 30 whitespace-separated words
-            return "Text too short to summarize. Please try a longer video."
-        # Split long text into chunks
-        max_chunk_length = 1000  # measured in characters, not words or tokens
-        chunks = [article[i:i+max_chunk_length] for i in range(0, len(article), max_chunk_length)]  # fixed-width slices; a boundary can fall mid-word
-        summaries = []
-        for chunk in chunks:
-            summary = summarizer(chunk, max_length=130, min_length=30, do_sample=False)
-            summaries.append(summary[0]['summary_text'])
-        return " ".join(summaries)  # per-chunk summaries joined in original order
-    except Exception as e:  # failures are returned as text rather than raised
-        return f"Error: {str(e)}"
-# Create Gradio interface
 with gr.Blocks() as demo:  # two-tab UI: transcription and summary
-    gr.Markdown("<h1><center>YouTube Video Transcription with OpenAI's Whisper</center></h1>")
-    gr.Markdown("<center>Enter the link of any YouTube video to get the transcription and summary. Please use videos under 30 minutes in length.</center>")
     with gr.Tab('Get the transcription of any Youtube video'):
         with gr.Row():
-            input_text_1 = gr.Textbox(
-                placeholder='Enter the Youtube video URL (e.g., https://www.youtube.com/watch?v=...)',
-                label='URL'
-            )
-            output_text_1 = gr.Textbox(
-                placeholder='Transcription of the video',
-                label='Transcription'
-            )
         result_button_1 = gr.Button('Get Transcription')
     with gr.Tab('Summary of Youtube video'):
         with gr.Row():
-            input_text = gr.Textbox(
-                placeholder='Enter the Youtube video URL (e.g., https://www.youtube.com/watch?v=...)',
-                label='URL'
-            )
-            output_text = gr.Textbox(
-                placeholder='Summary text of the Youtube Video',
-                label='Summary'
-            )
         result_button = gr.Button('Get Summary')
-    result_button.click(get_summary, inputs=input_text, outputs=output_text)  # summary tab: URL in, summary out
-    result_button_1.click(get_text, inputs=input_text_1, outputs=output_text_1)  # transcription tab: URL in, transcript out
-# Launch with appropriate settings
 demo.launch(debug=True)

 import whisper
+from pytubefix import YouTube
+from pytubefix.cli import on_progress
+from transformers import pipeline
+import gradio as gr
+import os
 model = whisper.load_model("base")  # Whisper "base" model, loaded once at module level
+summarizer = pipeline("summarization")  # no model argument is passed to the summarization pipeline
+def get_audio(url):  # download the audio-only stream for `url` with pytubefix and return the downloaded file's path
+    yt = YouTube(url, on_progress_callback=on_progress)  # on_progress comes from pytubefix.cli
+    audio_stream = yt.streams.get_audio_only()
+    out_file = audio_stream.download(mp3=True)  # This will directly download as mp3
+    return out_file  # Returns the path to the mp3 file
 def get_text(url):  # transcribe the video at `url` and return the transcript text
+    result = model.transcribe(get_audio(url))  # NOTE(review): the downloaded file is not removed after transcription
+    return result['text']
 def get_summary(url):  # return a summary of the transcript of the video at `url`
+    article = get_text(url)
+    b = summarizer(article)  # NOTE(review): the whole transcript is passed in one call; long transcripts may exceed the model's input limit - confirm
+    b = b[0]['summary_text']  # summary string of the first result
+    return b
 with gr.Blocks() as demo:  # two-tab UI: transcription and summary
+    gr.Markdown("<h1><center>Youtube video transcription with OpenAI's Whisper</center></h1>")
+    gr.Markdown("<center>Enter the link of any youtube video to get the transcription of the video and a summary of the video in the form of text.</center>")
     with gr.Tab('Get the transcription of any Youtube video'):
         with gr.Row():
+            input_text_1 = gr.Textbox(placeholder='Enter the Youtube video URL', label='URL')
+            output_text_1 = gr.Textbox(placeholder='Transcription of the video', label='Transcription')
         result_button_1 = gr.Button('Get Transcription')
     with gr.Tab('Summary of Youtube video'):
         with gr.Row():
+            input_text = gr.Textbox(placeholder='Enter the Youtube video URL', label='URL')
+            output_text = gr.Textbox(placeholder='Summary text of the Youtube Video', label='Summary')
         result_button = gr.Button('Get Summary')
+    result_button.click(get_summary, inputs = input_text, outputs = output_text)  # summary tab: URL in, summary out
+    result_button_1.click(get_text, inputs = input_text_1, outputs = output_text_1)  # transcription tab: URL in, transcript out
 demo.launch(debug=True)