Spaces:

dwarkesh
/

producer

Running

App Files Community

dwarkesh committed 12 days ago

Commit

cc1687a

verified ·

1 Parent(s): bf385fc

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -33

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ class ContentRequest:
     prompt_key: str
 class ContentGenerator:
-    def __init__(self, api_key):
         self.current_prompts = self._load_default_prompts()
         self.client = genai.Client(api_key=api_key)
@@ -117,8 +117,8 @@ def get_transcript(video_id: str) -> str:
         return f"Error fetching transcript: {str(e)}"
 class TranscriptProcessor:
-    def __init__(self, api_key):
-        self.generator = ContentGenerator(api_key=api_key)
     def _get_youtube_transcript(self, url: str) -> str:
@@ -130,11 +130,11 @@ class TranscriptProcessor:
         except Exception as e:
             raise Exception(f"Error fetching YouTube transcript: {str(e)}")
-    async def process_transcript(self, audio_file, assembly_api_key):
         """Process input and generate all content."""
         audio_path = audio_file.name
         try:
-            aai.settings.api_key = assembly_api_key
             config = aai.TranscriptionConfig(speaker_labels=True, language_code="en")
             transcript_iter = aai.Transcriber().transcribe(str(audio_path), config=config)
             transcript = transcript_iter.text
@@ -184,50 +184,39 @@ class TranscriptProcessor:
 def create_interface():
     """Create the Gradio interface."""
-    with gr.Blocks(title="Gemini Podcast Content Generator") as app:
         gr.Markdown(
             """
-            # Gemini Podcast Content Generator
-            Generate preview clips, timestamps, descriptions and more from podcast transcripts using Gemini.
-            Upload an audio file to get started!
             """
         )
         with gr.Tab("Generate Content"):
-            google_api_key_input = gr.Textbox(
-                 label="Google API Key",
-                 placeholder="Enter your Google API Key here",
-                 type="password",
-                 lines=1,
-                 info="Your GCP account needs to have billing enabled to use the 2.5 pro model.",
-                 scale=1
-            )
-            assemblyai_api_key_input = gr.Textbox(
-                 label="AssemblyAI API Key",
-                 placeholder="Enter your AssemblyAI API Key here",
-                 type="password",
-                 lines=1,
-                 info="Your key is used for initial audio transcription.",
-                 scale=1
-            )
             input_audio = gr.File(
                 label="Upload Audio File",
                 file_count="single",
                 file_types=["audio"]
             )
-            submit_btn = gr.Button("Generate Content with Gemini")
-            processor = TranscriptProcessor(api_key=google_api_key_input)
             output = gr.Markdown()  # Single markdown output
-            async def process_wrapper(text, api_key):
                 print("Process wrapper started")
                 print(f"Input text: {text[:100]}...")
                 try:
-                    result = await processor.process_transcript(text, api_key)
                     print("Process completed, got results")
                     return result
                 except Exception as e:
@@ -236,7 +225,7 @@ def create_interface():
             submit_btn.click(
                 fn=process_wrapper,
-                inputs=[input_audio, assemblyai_api_key_input],
                 outputs=output,
                 queue=True
             )
@@ -244,7 +233,7 @@ def create_interface():
         with gr.Tab("Customize Prompts"):
             gr.Markdown(
                 """
-                ## Customize Generation Prompts for Gemini
                 Here you can experiment with different prompts during your session.
                 Changes will remain active until you reload the page.
@@ -277,7 +266,7 @@ def create_interface():
                 )
             # Reset button
-            reset_btn = gr.Button("Reset to Default Gemini Prompts")
             reset_btn.click(
                 fn=lambda: (
                     processor.update_prompts(*processor.generator.current_prompts.values()),
@@ -289,4 +278,4 @@ def create_interface():
     return app
 if __name__ == "__main__":
-    create_interface().launch()

     prompt_key: str
 class ContentGenerator:
+    def __init__(self,api_key):
         self.current_prompts = self._load_default_prompts()
         self.client = genai.Client(api_key=api_key)
         return f"Error fetching transcript: {str(e)}"
 class TranscriptProcessor:
+    def __init__(self):
+        self.generator = ContentGenerator(api_key=os.getenv("GOOGLE_API_KEY"))
     def _get_youtube_transcript(self, url: str) -> str:
         except Exception as e:
             raise Exception(f"Error fetching YouTube transcript: {str(e)}")
+    async def process_transcript(self, audio_file):
         """Process input and generate all content."""
         audio_path = audio_file.name
         try:
+            aai.settings.api_key = os.getenv("ASSEMBLYAI_API_KEY")
             config = aai.TranscriptionConfig(speaker_labels=True, language_code="en")
             transcript_iter = aai.Transcriber().transcribe(str(audio_path), config=config)
             transcript = transcript_iter.text
 def create_interface():
     """Create the Gradio interface."""
+    processor = TranscriptProcessor()
+    with gr.Blocks(title="Podcast Content Generator") as app:
         gr.Markdown(
             """
+            # Podcast Content Generator
+            Generate preview clips, timestamps, descriptions and more from podcast transcripts or YouTube videos.
+            Simply paste a YouTube URL or raw transcript text to get started!
             """
         )
         with gr.Tab("Generate Content"):
             input_audio = gr.File(
                 label="Upload Audio File",
                 file_count="single",
                 file_types=["audio"]
             )
+            input_text = gr.Textbox(
+                label="Youtube URL",
+                placeholder="YouTube URL",
+                lines=1
+            )
+            submit_btn = gr.Button("Generate Content")
             output = gr.Markdown()  # Single markdown output
+            async def process_wrapper(text):
                 print("Process wrapper started")
                 print(f"Input text: {text[:100]}...")
                 try:
+                    result = await processor.process_transcript(text)
                     print("Process completed, got results")
                     return result
                 except Exception as e:
             submit_btn.click(
                 fn=process_wrapper,
+                inputs=input_audio,
                 outputs=output,
                 queue=True
             )
         with gr.Tab("Customize Prompts"):
             gr.Markdown(
                 """
+                ## Customize Generation Prompts
                 Here you can experiment with different prompts during your session.
                 Changes will remain active until you reload the page.
                 )
             # Reset button
+            reset_btn = gr.Button("Reset to Default Prompts")
             reset_btn.click(
                 fn=lambda: (
                     processor.update_prompts(*processor.generator.current_prompts.values()),
     return app
 if __name__ == "__main__":
+    create_interface().launch(