Spaces:

nihalaninihal
/

knowledgeCast

Sleeping

App Files Files Community

nihalaninihal committed on May 28

Commit

34bfe42

verified ·

1 Parent(s): 3e4f04a

Update app.py

Browse files

Files changed (1) hide show

app.py +113 -109

app.py CHANGED Viewed

@@ -56,7 +56,7 @@ def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
     return header + audio_data
-def parse_audio_mime_type(mime_type: str) -> dict[str, int | None]:
     """Parses bits per sample and rate from an audio MIME type string."""
     bits_per_sample = 16
     rate = 24000
@@ -79,10 +79,11 @@ def parse_audio_mime_type(mime_type: str) -> dict[str, int | None]:
     return {"bits_per_sample": bits_per_sample, "rate": rate}
-def fetch_web_content(url, progress=gr.Progress()):
     """Fetch and analyze web content using Gemini with tools."""
     try:
-        progress(0.1, desc="Initializing Gemini client...")
         logger.info("Initializing Gemini client...")
         if not GEMINI_API_KEY:
@@ -90,10 +91,11 @@ def fetch_web_content(url, progress=gr.Progress()):
         client = genai.Client(api_key=GEMINI_API_KEY)
-        progress(0.2, desc="Fetching web content...")
         logger.info(f"Fetching content from URL: {url}")
-        model = "gemini-2.5-flash-preview-04-17"
         contents = [
             types.Content(
                 role="user",
@@ -118,7 +120,8 @@ def fetch_web_content(url, progress=gr.Progress()):
             response_mime_type="text/plain",
         )
-        progress(0.4, desc="Analyzing content with AI...")
         logger.info("Generating content with Gemini...")
         content_text = ""
@@ -130,7 +133,8 @@ def fetch_web_content(url, progress=gr.Progress()):
             if chunk.text:
                 content_text += chunk.text
-        progress(0.6, desc="Content analysis complete!")
         logger.info(f"Content generation complete. Length: {len(content_text)} characters")
         return content_text
@@ -139,10 +143,11 @@ def fetch_web_content(url, progress=gr.Progress()):
         raise e
-def generate_podcast_from_content(content_text, speaker1_name="Anna Chope", speaker2_name="Adam Chan", progress=gr.Progress()):
     """Generate audio podcast from text content."""
     try:
-        progress(0.7, desc="Generating podcast audio...")
         logger.info("Starting audio generation...")
         if not GEMINI_API_KEY:
@@ -150,7 +155,7 @@ def generate_podcast_from_content(content_text, speaker1_name="Anna Chope", spea
         client = genai.Client(api_key=GEMINI_API_KEY)
-        model = "gemini-2.5-flash-preview-tts"
         podcast_prompt = f"""Please read aloud the following content in a natural podcast interview style with two distinct speakers.
         Make it sound conversational and engaging:
@@ -197,7 +202,8 @@ def generate_podcast_from_content(content_text, speaker1_name="Anna Chope", spea
             ),
         )
-        progress(0.8, desc="Converting to audio...")
         logger.info("Generating audio stream...")
         # Create temporary file
@@ -235,7 +241,8 @@ def generate_podcast_from_content(content_text, speaker1_name="Anna Chope", spea
             # For simplicity, just use the first chunk (you might want to concatenate them)
             final_audio = audio_chunks[0]
             save_binary_file(temp_file.name, final_audio)
-            progress(1.0, desc="Podcast generated successfully!")
             logger.info(f"Audio file saved: {temp_file.name}")
             return temp_file.name
         else:
@@ -246,10 +253,11 @@ def generate_podcast_from_content(content_text, speaker1_name="Anna Chope", spea
         raise e
-def generate_web_podcast(url, speaker1_name, speaker2_name, progress=gr.Progress()):
     """Main function to fetch web content and generate podcast."""
     try:
-        progress(0.0, desc="Starting podcast generation...")
         logger.info(f"Starting podcast generation for URL: {url}")
         # Validate inputs
@@ -285,106 +293,102 @@ def generate_web_podcast(url, speaker1_name, speaker2_name, progress=gr.Progress
 # Create Gradio interface
 def create_interface():
-    try:
-        with gr.Blocks(
-            title="🎙️ Web-to-Podcast Generator",
-            theme=gr.themes.Soft(),
-            analytics_enabled=False
-        ) as demo:
-            gr.Markdown("""
-            # 🎙️ Web-to-Podcast Generator
-            Transform any website into an engaging podcast conversation between two AI hosts!
-            Simply paste a URL and let AI create a natural dialogue discussing the content.
-            """)
-            with gr.Row():
-                with gr.Column(scale=2):
-                    url_input = gr.Textbox(
-                        label="Website URL",
-                        placeholder="https://example.com",
-                        info="Enter the URL of the website you want to convert to a podcast",
                         lines=1
                     )
-                    with gr.Row():
-                        speaker1_input = gr.Textbox(
-                            label="Host 1 Name",
-                            value="Anna Chope",
-                            info="Name of the first podcast host",
-                            lines=1
-                        )
-                        speaker2_input = gr.Textbox(
-                            label="Host 2 Name",
-                            value="Adam Chan",
-                            info="Name of the second podcast host",
-                            lines=1
-                        )
-                    generate_btn = gr.Button("🎙️ Generate Podcast", variant="primary", size="lg")
-                with gr.Column(scale=1):
-                    gr.Markdown("""
-                    ### Instructions:
-                    1. Enter a website URL
-                    2. Customize host names (optional)
-                    3. Click "Generate Podcast"
-                    4. Wait for the AI to analyze content and create audio
-                    5. Download your podcast!
-                    ### Examples:
-                    - News articles
-                    - Blog posts
-                    - Product pages
-                    - Documentation
-                    - Research papers
-                    """)
-            with gr.Row():
-                status_output = gr.Textbox(label="Status", interactive=False, lines=2)
-            with gr.Row():
-                audio_output = gr.Audio(label="Generated Podcast", type="filepath")
-            with gr.Accordion("📝 Generated Script Preview", open=False):
-                script_output = gr.Textbox(
-                    label="Podcast Script",
-                    lines=10,
-                    interactive=False,
-                    info="Preview of the conversation script generated from the website content"
-                )
-            # Event handlers
-            generate_btn.click(
-                fn=generate_web_podcast,
-                inputs=[url_input, speaker1_input, speaker2_input],
-                outputs=[audio_output, status_output, script_output],
-                show_progress=True
-            )
-            # Examples
-            gr.Examples(
-                examples=[
-                    ["https://github.com/weaviate/weaviate", "Anna", "Adam"],
-                    ["https://huggingface.co/blog", "Sarah", "Mike"],
-                    ["https://openai.com/blog", "Emma", "John"],
-                ],
-                inputs=[url_input, speaker1_input, speaker2_input],
             )
-            gr.Markdown("""
-            ---
-            **Note:** API key is now directly embedded in the code for convenience.
-            The generated podcast will feature two AI voices having a natural conversation about the website content.
-            """)
-        return demo
-    except Exception as e:
-        logger.error(f"Error creating interface: {e}")
-        raise e
 if __name__ == "__main__":

     return header + audio_data
+def parse_audio_mime_type(mime_type: str) -> dict:
     """Parses bits per sample and rate from an audio MIME type string."""
     bits_per_sample = 16
     rate = 24000
     return {"bits_per_sample": bits_per_sample, "rate": rate}
+def fetch_web_content(url, progress=None):
     """Fetch and analyze web content using Gemini with tools."""
     try:
+        if progress:
+            progress(0.1, desc="Initializing Gemini client...")
         logger.info("Initializing Gemini client...")
         if not GEMINI_API_KEY:
         client = genai.Client(api_key=GEMINI_API_KEY)
+        if progress:
+            progress(0.2, desc="Fetching web content...")
         logger.info(f"Fetching content from URL: {url}")
+        model = "gemini-2.0-flash-exp"  # Updated model name
         contents = [
             types.Content(
                 role="user",
             response_mime_type="text/plain",
         )
+        if progress:
+            progress(0.4, desc="Analyzing content with AI...")
         logger.info("Generating content with Gemini...")
         content_text = ""
             if chunk.text:
                 content_text += chunk.text
+        if progress:
+            progress(0.6, desc="Content analysis complete!")
         logger.info(f"Content generation complete. Length: {len(content_text)} characters")
         return content_text
         raise e
+def generate_podcast_from_content(content_text, speaker1_name="Anna Chope", speaker2_name="Adam Chan", progress=None):
     """Generate audio podcast from text content."""
     try:
+        if progress:
+            progress(0.7, desc="Generating podcast audio...")
         logger.info("Starting audio generation...")
         if not GEMINI_API_KEY:
         client = genai.Client(api_key=GEMINI_API_KEY)
+        model = "gemini-2.0-flash-exp"  # Updated model name
         podcast_prompt = f"""Please read aloud the following content in a natural podcast interview style with two distinct speakers.
         Make it sound conversational and engaging:
             ),
         )
+        if progress:
+            progress(0.8, desc="Converting to audio...")
         logger.info("Generating audio stream...")
         # Create temporary file
             # For simplicity, just use the first chunk (you might want to concatenate them)
             final_audio = audio_chunks[0]
             save_binary_file(temp_file.name, final_audio)
+            if progress:
+                progress(1.0, desc="Podcast generated successfully!")
             logger.info(f"Audio file saved: {temp_file.name}")
             return temp_file.name
         else:
         raise e
+def generate_web_podcast(url, speaker1_name, speaker2_name, progress=None):
     """Main function to fetch web content and generate podcast."""
     try:
+        if progress:
+            progress(0.0, desc="Starting podcast generation...")
         logger.info(f"Starting podcast generation for URL: {url}")
         # Validate inputs
 # Create Gradio interface
 def create_interface():
+    """Create and return the Gradio interface."""
+    with gr.Blocks(
+        title="🎙️ Web-to-Podcast Generator",
+        theme=gr.themes.Soft(),
+        analytics_enabled=False
+    ) as demo:
+        gr.Markdown("""
+        # 🎙️ Web-to-Podcast Generator
+        Transform any website into an engaging podcast conversation between two AI hosts!
+        Simply paste a URL and let AI create a natural dialogue discussing the content.
+        """)
+        with gr.Row():
+            with gr.Column(scale=2):
+                url_input = gr.Textbox(
+                    label="Website URL",
+                    placeholder="https://example.com",
+                    info="Enter the URL of the website you want to convert to a podcast",
+                    lines=1
+                )
+                with gr.Row():
+                    speaker1_input = gr.Textbox(
+                        label="Host 1 Name",
+                        value="Anna Chope",
+                        info="Name of the first podcast host",
                         lines=1
                     )
+                    speaker2_input = gr.Textbox(
+                        label="Host 2 Name",
+                        value="Adam Chan",
+                        info="Name of the second podcast host",
+                        lines=1
+                    )
+                generate_btn = gr.Button("🎙️ Generate Podcast", variant="primary", size="lg")
+            with gr.Column(scale=1):
+                gr.Markdown("""
+                ### Instructions:
+                1. Enter a website URL
+                2. Customize host names (optional)
+                3. Click "Generate Podcast"
+                4. Wait for the AI to analyze content and create audio
+                5. Download your podcast!
+                ### Examples:
+                - News articles
+                - Blog posts
+                - Product pages
+                - Documentation
+                - Research papers
+                """)
+        with gr.Row():
+            status_output = gr.Textbox(label="Status", interactive=False, lines=2)
+        with gr.Row():
+            audio_output = gr.Audio(label="Generated Podcast", type="filepath")
+        with gr.Accordion("📝 Generated Script Preview", open=False):
+            script_output = gr.Textbox(
+                label="Podcast Script",
+                lines=10,
+                interactive=False,
+                info="Preview of the conversation script generated from the website content"
             )
+        # Event handlers
+        generate_btn.click(
+            fn=generate_web_podcast,
+            inputs=[url_input, speaker1_input, speaker2_input],
+            outputs=[audio_output, status_output, script_output],
+            show_progress=True
+        )
+        # Examples
+        gr.Examples(
+            examples=[
+                ["https://github.com/weaviate/weaviate", "Anna", "Adam"],
+                ["https://huggingface.co/blog", "Sarah", "Mike"],
+                ["https://openai.com/blog", "Emma", "John"],
+            ],
+            inputs=[url_input, speaker1_input, speaker2_input],
+        )
+        gr.Markdown("""
+        ---
+        **Note:** API key is now directly embedded in the code for convenience.
+        The generated podcast will feature two AI voices having a natural conversation about the website content.
+        """)
+    return demo
 if __name__ == "__main__":