Spaces:

nihalaninihal
/

GithubAnalyzerr

Sleeping

App Files Files Community

nihalaninihal committed on Feb 1

Commit

e696760

verified ·

1 Parent(s): 1c70005

added pdf download report analysis

Browse files

Files changed (1) hide show

app.py +250 -20

app.py CHANGED Viewed

@@ -1,3 +1,5 @@
 import gradio as gr
 import google.generativeai as genai
 import os
@@ -13,6 +15,9 @@ import tempfile
 from tenacity import retry, stop_after_attempt, wait_exponential, retry_if_exception_type
 import time
 import os
@@ -258,12 +263,175 @@ class RepositoryAnalyzer:
             "total_contributors": len(contributor_data),
             "contributors": contributor_data
         }
 @retry(
     retry=retry_if_exception_type(Exception),
     stop=stop_after_attempt(3),
     wait=wait_exponential(multiplier=1, min=4, max=10)
 )
 def analyze_repository(repo_url: str, progress=gr.Progress()) -> Tuple[str, str, str]:
     """Analyze repository and generate LLM summary with rate limit handling"""
     try:
@@ -363,12 +531,31 @@ Please provide detailed analysis for each section while maintaining the formatti
             json.dump(analysis_data, f, indent=2)
             analysis_file = f.name
-        progress(1.0, desc="Analysis complete!")
-        return response.text, analysis_file, "✅ Analysis completed successfully!"
     except Exception as e:
         error_message = f"❌ Error analyzing repository: {str(e)}"
-        return "", "", error_message
 def create_chat_session() -> Any:
     """Create a new chat session for follow-up questions"""
@@ -426,6 +613,7 @@ def ask_question(question: str, analysis_file: str, chat_history: List[Tuple[str
 # Create Gradio interface
 with gr.Blocks(theme=gr.themes.Soft()) as app:
     gr.Markdown("""
@@ -435,8 +623,7 @@ with gr.Blocks(theme=gr.themes.Soft()) as app:
     1. 📊 Analyze repository structure and patterns
     2. 💡 Generate insights about development practices
     3. 💭 Allow you to ask follow-up questions about the analysis
-    Enter a GitHub repository URL (e.g., `https://github.com/owner/repo`)
     """)
     with gr.Row():
@@ -445,16 +632,24 @@ with gr.Blocks(theme=gr.themes.Soft()) as app:
             placeholder="https://github.com/owner/repo",
             scale=4
         )
-        analyze_btn = gr.Button("🔍 Analyze", variant="primary", scale=1)
-    # Add status message
     status_msg = gr.Markdown("", elem_id="status_message")
     with gr.Row():
-        # Use Markdown instead of Textbox for better formatting
-        summary = gr.Markdown(
-            label="Analysis Summary",
-        )
     with gr.Row():
         chatbot = gr.Chatbot(
@@ -472,13 +667,32 @@ with gr.Blocks(theme=gr.themes.Soft()) as app:
         ask_btn = gr.Button("💭 Ask", variant="primary", scale=1)
         clear_btn = gr.Button("🗑️ Clear Chat", variant="secondary", scale=1)
-    # Hidden state for analysis file
     analysis_file = gr.State("")
     def clear_outputs():
-        return "", [], "", ""
-    # Set up event handlers
     analyze_btn.click(
         fn=lambda: "⏳ Analysis in progress...",
         inputs=None,
@@ -487,15 +701,30 @@ with gr.Blocks(theme=gr.themes.Soft()) as app:
     ).then(
         analyze_repository,
         inputs=[repo_url],
-        outputs=[summary, analysis_file, status_msg],
     )
     ask_btn.click(
         ask_question,
         inputs=[question, analysis_file, chatbot],
-        outputs=[chatbot],
     ).then(
-        lambda: "",  # Clear the question input
         None,
         question,
         queue=False
@@ -504,10 +733,11 @@ with gr.Blocks(theme=gr.themes.Soft()) as app:
     clear_btn.click(
         clear_outputs,
         inputs=None,
-        outputs=[summary, chatbot, question, status_msg],
-        queue=False
     )
 # Launch the app
 if __name__ == "__main__":
     app.launch(

+!pip install requests
 import gradio as gr
 import google.generativeai as genai
 import os
 from tenacity import retry, stop_after_attempt, wait_exponential, retry_if_exception_type
 import time
 import os
+import re
+from fpdf import FPDF
+import requests
             "total_contributors": len(contributor_data),
             "contributors": contributor_data
         }
+def create_pdf_from_markdown(markdown_text: str, filename: str) -> str:
+    """Convert markdown text to PDF"""
+    class PDF(FPDF):
+        def header(self):
+            self.set_font('Arial', 'B', 12)
+            self.cell(0, 10, 'Repository Analysis Report', 0, 1, 'C')
+            self.ln(10)
+        def footer(self):
+            self.set_y(-15)
+            self.set_font('Arial', 'I', 8)
+            self.cell(0, 10, f'Page {self.page_no()}', 0, 0, 'C')
+    pdf = PDF()
+    pdf.add_page()
+    pdf.set_auto_page_break(auto=True, margin=15)
+    # Process markdown sections
+    sections = markdown_text.split('\n## ')
+    # Handle main title
+    if sections[0].startswith('# '):
+        title = sections[0].split('\n')[0].replace('# ', '')
+        pdf.set_font('Arial', 'B', 16)
+        pdf.cell(0, 10, title, 0, 1, 'C')
+        pdf.ln(5)
+        content = '\n'.join(sections[0].split('\n')[1:])
+        sections[0] = content
+    for section in sections:
+        if section:
+            # Extract section title and content
+            lines = section.split('\n')
+            if section == sections[0]:  # First section (after main title)
+                section_title = ''
+                content = lines
+            else:
+                section_title = lines[0]
+                content = lines[1:]
+            # Add section title
+            if section_title:
+                pdf.set_font('Arial', 'B', 14)
+                # Remove emojis from section titles
+                clean_title = re.sub(r'[^\x00-\x7F]+', '', section_title)
+                pdf.cell(0, 10, clean_title.strip(), 0, 1, 'L')
+                pdf.ln(5)
+            # Add content
+            pdf.set_font('Arial', '', 11)
+            for line in content:
+                if line.strip():
+                    # Remove markdown formatting and emojis
+                    clean_line = re.sub(r'[\*\[\]]', '', line)
+                    clean_line = re.sub(r'[^\x00-\x7F]+', '', clean_line)
+                    if line.startswith('- '):
+                        pdf.cell(10, 5, '', 0, 0)
+                        pdf.multi_cell(0, 5, clean_line[2:])
+                    else:
+                        pdf.multi_cell(0, 5, clean_line)
+            pdf.ln(5)
+    # Save PDF
+    pdf_path = f"{filename}.pdf"
+    pdf.output(pdf_path)
+    return pdf_path
+def download_noto_font():
+    """Download Google's Noto Color Emoji font if not already present"""
+    font_path = "NotoColorEmoji.ttf"
+    if not os.path.exists(font_path):
+        url = "https://github.com/googlefonts/noto-emoji/raw/main/fonts/NotoColorEmoji.ttf"
+        response = requests.get(url)
+        with open(font_path, "wb") as f:
+            f.write(response.content)
+    return font_path
+class PDFWithEmoji(FPDF):
+    def __init__(self):
+        super().__init__()
+        self.add_font('DejaVu', '', 'DejaVuSansCondensed.ttf', uni=True)
+        self.add_font('Noto', '', 'NotoColorEmoji.ttf', uni=True)
+    def header(self):
+        self.set_font('DejaVu', '', 12)
+        self.cell(0, 10, '📊 Repository Analysis Report', 0, 1, 'C')
+        self.ln(10)
+    def footer(self):
+        self.set_y(-15)
+        self.set_font('DejaVu', '', 8)
+        self.cell(0, 10, f'Page {self.page_no()}', 0, 0, 'C')
+    def write_with_emoji(self, text):
+        """Write text with proper emoji support"""
+        self.set_font('DejaVu', '', 11)
+        self.multi_cell(0, 5, text)
+def create_pdf_report(markdown_text: str) -> str:
+    """Create a PDF report with full emoji and Unicode support"""
+    # Ensure required fonts are available
+    if not os.path.exists("DejaVuSansCondensed.ttf"):
+        url = "https://github.com/dejavu-fonts/dejavu-fonts/raw/master/ttf/DejaVuSansCondensed.ttf"
+        response = requests.get(url)
+        with open("DejaVuSansCondensed.ttf", "wb") as f:
+            f.write(response.content)
+    download_noto_font()
+    # Create PDF
+    pdf = PDFWithEmoji()
+    pdf.add_page()
+    pdf.set_auto_page_break(auto=True, margin=15)
+    # Process markdown text
+    sections = markdown_text.split('\n## ')
+    # Handle main title
+    if sections[0].startswith('# '):
+        title = sections[0].split('\n')[0].replace('# ', '')
+        pdf.set_font('DejaVu', '', 16)
+        pdf.cell(0, 10, title, 0, 1, 'C')
+        pdf.ln(5)
+        content = '\n'.join(sections[0].split('\n')[1:])
+        sections[0] = content
+    # Process each section
+    for section in sections:
+        if section:
+            lines = section.split('\n')
+            if section == sections[0]:  # First section
+                section_title = ''
+                content = lines
+            else:
+                section_title = lines[0]
+                content = lines[1:]
+            # Add section title
+            if section_title:
+                pdf.set_font('DejaVu', '', 14)
+                pdf.cell(0, 10, section_title, 0, 1, 'L')
+                pdf.ln(5)
+            # Add content
+            pdf.set_font('DejaVu', '', 11)
+            for line in content:
+                if line.strip():
+                    if line.strip().startswith('- '):
+                        pdf.cell(10, 5, '•', 0, 0)
+                        pdf.write_with_emoji(line.strip()[2:])
+                        pdf.ln()
+                    else:
+                        pdf.write_with_emoji(line.strip())
+                        pdf.ln()
+    # Save PDF
+    timestamp = datetime.now().strftime('%Y%m%d_%H%M%S')
+    pdf_path = f"repo_analysis_{timestamp}.pdf"
+    pdf.output(pdf_path)
+    return pdf_path
 @retry(
     retry=retry_if_exception_type(Exception),
     stop=stop_after_attempt(3),
     wait=wait_exponential(multiplier=1, min=4, max=10)
 )
 def analyze_repository(repo_url: str, progress=gr.Progress()) -> Tuple[str, str, str]:
     """Analyze repository and generate LLM summary with rate limit handling"""
     try:
             json.dump(analysis_data, f, indent=2)
             analysis_file = f.name
+        progress(0.9, desc="Generating PDF report...")
+        try:
+            pdf_path = create_pdf_report(response.text)
+        except Exception as pdf_error:
+            print(f"PDF generation error: {str(pdf_error)}")
+            pdf_path = ""
+        # Generate PDF
+        pdf_path = create_pdf_from_markdown(response.text, f"analysis_{datetime.now().strftime('%Y%m%d_%H%M%S')}")
+        with tempfile.NamedTemporaryFile(mode='w', delete=False, suffix='.json') as f:
+            json.dump(analysis_data, f, indent=2)
+            analysis_file = f.name
+        progress(1.0, desc="✨ Analysis complete!")
+        return response.text, analysis_file, pdf_path, "✅ Analysis completed successfully!"
     except Exception as e:
         error_message = f"❌ Error analyzing repository: {str(e)}"
+        return "", "", "", error_message  # Return 4 empty values when there's an error
 def create_chat_session() -> Any:
     """Create a new chat session for follow-up questions"""
+# Create Gradio interface
 # Create Gradio interface
 with gr.Blocks(theme=gr.themes.Soft()) as app:
     gr.Markdown("""
     1. 📊 Analyze repository structure and patterns
     2. 💡 Generate insights about development practices
     3. 💭 Allow you to ask follow-up questions about the analysis
+    4. 📑 Generate a downloadable PDF report
     """)
     with gr.Row():
             placeholder="https://github.com/owner/repo",
             scale=4
         )
+    with gr.Row():
+        with gr.Column(scale=1):
+            analyze_btn = gr.Button("🔍 Analyze", variant="primary")
+            download_pdf_btn = gr.Button("📄 Download PDF", variant="secondary")
+    # Status message
     status_msg = gr.Markdown("", elem_id="status_message")
+    # File output for PDF
+    pdf_output = gr.File(
+        label="Analysis Report",
+        visible=False,
+        interactive=True
+    )
     with gr.Row():
+        summary = gr.Markdown(label="Analysis Summary")
     with gr.Row():
         chatbot = gr.Chatbot(
         ask_btn = gr.Button("💭 Ask", variant="primary", scale=1)
         clear_btn = gr.Button("🗑️ Clear Chat", variant="secondary", scale=1)
+    # Hidden states
     analysis_file = gr.State("")
+    current_pdf_path = gr.State("")
+    def handle_pdf_download(pdf_path):
+        """Handle PDF download when button is clicked"""
+        if pdf_path and os.path.exists(pdf_path):
+            return {
+                pdf_output: pdf_path
+            }
+        return {
+            pdf_output: None
+        }
     def clear_outputs():
+        """Return cleared values for every output component.
+
+        The returned dict is keyed by component/state object: the summary,
+        question and status message become empty strings, the chat history
+        becomes an empty list, the PDF file output becomes None and the
+        stored PDF path becomes an empty string.
+        """
+        return {
+            summary: "",
+            chatbot: [],
+            question: "",
+            status_msg: "",
+            pdf_output: None,
+            current_pdf_path: ""
+        }
+    # Event handlers
     analyze_btn.click(
         fn=lambda: "⏳ Analysis in progress...",
         inputs=None,
     ).then(
         analyze_repository,
         inputs=[repo_url],
+        outputs=[summary, analysis_file, current_pdf_path, status_msg]
+    ).then(
+        lambda: gr.update(visible=True),
+        None,
+        download_pdf_btn
+    )
+    # PDF download handler
+    download_pdf_btn.click(
+        handle_pdf_download,
+        inputs=[current_pdf_path],
+        outputs=pdf_output
+    ).then(
+        lambda: gr.update(visible=True),
+        None,
+        pdf_output
     )
     ask_btn.click(
         ask_question,
         inputs=[question, analysis_file, chatbot],
+        outputs=[chatbot]
     ).then(
+        lambda: "",
         None,
         question,
         queue=False
     clear_btn.click(
         clear_outputs,
         inputs=None,
+        outputs=[summary, chatbot, question, status_msg, pdf_output, current_pdf_path]
     )
 # Launch the app
 if __name__ == "__main__":
     app.launch(