podcast-generator

Sleeping

App Files Files Community

bluenevus committed on Apr 16

Commit

43f2e7f

verified ·

1 Parent(s): cdbb971

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -32

app.py CHANGED Viewed

@@ -38,43 +38,38 @@ def generate_podcast_script(api_key, prompt, uploaded_file, duration, num_hosts)
     try:
         genai.configure(api_key=api_key)
         model = genai.GenerativeModel('gemini-2.5-pro-preview-03-25')
         combined_content = prompt or ""
-    if uploaded_file is not None:
-        file_bytes = io.BytesIO(uploaded_file)
-        # Try to detect the file type based on content
-        file_bytes.seek(0)
-        if file_bytes.read(4) == b'%PDF':
-            # It's a PDF file
-            file_bytes.seek(0)
-            pdf_reader = PyPDF2.PdfReader(file_bytes)
-            file_content = "\n".join([page.extract_text() for page in pdf_reader.pages])
-        else:
-            # Try as text file first
             file_bytes.seek(0)
-            try:
-                file_content = file_bytes.read().decode('utf-8')
-            except UnicodeDecodeError:
-                # If it's not a text file, try as a docx
                 file_bytes.seek(0)
                 try:
-                    doc = Document(file_bytes)
-                    file_content = "\n".join([para.text for para in doc.paragraphs])
-                except:
-                    raise ValueError("Unsupported file type or corrupted file")
-        combined_content += "\n" + file_content if combined_content else file_content</code></pre></div></pre>
-        if uploaded_file is not None:
-            # Handle the uploaded file content
-            file_content = uploaded_file.name  # This gets the content of the NamedString
             combined_content += "\n" + file_content if combined_content else file_content
         num_hosts = int(num_hosts)  # Convert to integer
-        prompt = f"""
         Create a podcast script for {num_hosts} {'person' if num_hosts == 1 else 'people'} discussing:
         {combined_content}
@@ -91,17 +86,17 @@ def generate_podcast_script(api_key, prompt, uploaded_file, duration, num_hosts)
         The intro always includes the first speaker and should be in the same paragraph.
         The outro always includes the first speaker and should be in the same paragraph
         Do not include these types of transition "Intro Music fades in and then fades slightly to background"
-        Keep each speaker's entire monologue in a single paragraph, regardless of length if the humber of hosts is not 1.
-        Start a new paragraph only when switching to a different speaker if the humber of hosts is not 1.
         Maintain natural conversation flow and speech patterns within each monologue.
-        Use context clues or subtle references to indicate who is speaking without explicit labels if the humber of hosts is not 1
         Use speaker names sparingly, only when necessary for clarity or emphasis. Avoid starting every line with the other person's name.
         Rely more on context and speech patterns to indicate who is speaking, rather than always stating names.
         Use names primarily for transitions sparingly, definitely with agreements, or to draw attention to a specific point, not as a constant form of address.
         {'Make sure the script is a monologue for one person.' if num_hosts == 1 else 'Ensure the dialogue alternates between two distinct voices, with one speaking on odd-numbered lines and the other on even-numbered lines.'}
         """
-        response = model.generate_content(prompt)
         return re.sub(r'[^a-zA-Z0-9\s.,?!<>]', '', response.text)
     except Exception as e:
         logger.error(f"Error generating podcast script: {str(e)}")

     try:
         genai.configure(api_key=api_key)
         model = genai.GenerativeModel('gemini-2.5-pro-preview-03-25')
         combined_content = prompt or ""
+        if uploaded_file is not None:
+            file_bytes = io.BytesIO(uploaded_file)
+            # Try to detect the file type based on content
             file_bytes.seek(0)
+            if file_bytes.read(4) == b'%PDF':
+                # It's a PDF file
+                file_bytes.seek(0)
+                pdf_reader = PyPDF2.PdfReader(file_bytes)
+                file_content = "\n".join([page.extract_text() for page in pdf_reader.pages])
+            else:
+                # Try as text file first
                 file_bytes.seek(0)
                 try:
+                    file_content = file_bytes.read().decode('utf-8')
+                except UnicodeDecodeError:
+                    # If it's not a text file, try as a docx
+                    file_bytes.seek(0)
+                    try:
+                        doc = Document(file_bytes)
+                        file_content = "\n".join([para.text for para in doc.paragraphs])
+                    except:
+                        raise ValueError("Unsupported file type or corrupted file")
             combined_content += "\n" + file_content if combined_content else file_content
         num_hosts = int(num_hosts)  # Convert to integer
+        prompt_template = f"""
         Create a podcast script for {num_hosts} {'person' if num_hosts == 1 else 'people'} discussing:
         {combined_content}
         The intro always includes the first speaker and should be in the same paragraph.
         The outro always includes the first speaker and should be in the same paragraph
         Do not include these types of transition "Intro Music fades in and then fades slightly to background"
+        Keep each speaker's entire monologue in a single paragraph, regardless of length if the number of hosts is not 1.
+        Start a new paragraph only when switching to a different speaker if the number of hosts is not 1.
         Maintain natural conversation flow and speech patterns within each monologue.
+        Use context clues or subtle references to indicate who is speaking without explicit labels if the number of hosts is not 1
         Use speaker names sparingly, only when necessary for clarity or emphasis. Avoid starting every line with the other person's name.
         Rely more on context and speech patterns to indicate who is speaking, rather than always stating names.
         Use names primarily for transitions sparingly, definitely with agreements, or to draw attention to a specific point, not as a constant form of address.
         {'Make sure the script is a monologue for one person.' if num_hosts == 1 else 'Ensure the dialogue alternates between two distinct voices, with one speaking on odd-numbered lines and the other on even-numbered lines.'}
         """
+        response = model.generate_content(prompt_template)
         return re.sub(r'[^a-zA-Z0-9\s.,?!<>]', '', response.text)
     except Exception as e:
         logger.error(f"Error generating podcast script: {str(e)}")