Spaces:

acecalisto3
/

GitBot

Runtime error

App Files Community

acecalisto3 committed on May 16, 2024

Commit

a7252e1

verified ·

1 Parent(s): 5654a45

Update app.py

Browse files

Files changed (1) hide show

app.py +117 -284

app.py CHANGED Viewed

@@ -1,9 +1,8 @@
 import gradio as gr
-from huggingface_hub import InferenceClient
-import os
-import requests
 from transformers import pipeline
 from sentence_transformers import SentenceTransformer, util
 import logging
 # Configure logging for detailed insights
@@ -11,8 +10,8 @@ logging.basicConfig(level=logging.INFO)
 # Constants for enhanced organization
 GITHUB_API_BASE_URL = "https://api.github.com/repos"
-DEFAULT_MODEL = "microsoft/CodeBERT-base"  # Robust default model selection
-MAX_RELATED_ISSUES = 3
 # Hugging Face Inference Client
 client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
@@ -20,126 +19,59 @@ client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
 # Load a pre-trained model for sentence similarity
 similarity_model = SentenceTransformer('all-mpnet-base-v2')
-### Function to analyze issues and provide solutions
 def analyze_issues(issue_text: str, model_name: str, severity: str = None, programming_language: str = None) -> str:
-    """
-    Analyzes issues and provides comprehensive solutions using a specified language model.
-    Args:
-        issue_text (str): The detailed description of the issue.
-        model_name (str): The name of the language model to use for analysis.
-        severity (str, optional): The severity level of the issue (e.g., "Critical", "Major"). Defaults to None.
-        programming_language (str, optional): The programming language relevant to the issue. Defaults to None.
-    Returns:
-        str: A structured analysis of the issue, including problem summary, root cause, solution options,
-             recommended solution, implementation steps, and verification steps.
-    """
-    logging.info(f"Analyzing issue: '{issue_text}' with model: '{model_name}'")
-    # Construct a detailed prompt for the language model
-    prompt = f"""Issue: {issue_text}
-Severity: {severity if severity else "Not specified"}
-Programming Language: {programming_language if programming_language else "Not specified"}
-Please provide a comprehensive resolution in the following format:
-## Problem Summary:
-(Concise summary of the issue)
-## Root Cause Analysis:
-(Possible reasons for the issue)
-## Solution Options:
-1. **Option 1:** (Description)
-   - Pros: (Advantages)
-   - Cons: (Disadvantages)
-2. **Option 2:** (Description)
-   - Pros: (Advantages)
-   - Cons: (Disadvantages)
-## Recommended Solution:
-(The best solution with justification)
-## Implementation Steps:
-1. (Step 1)
-2. (Step 2)
-3. (Step 3)
-## Verification Steps:
-1. (Step 1)
-2. (Step 2)
-"""
-    try:
-        nlp = pipeline("text-generation", model=model_name, max_length=1000)
-        logging.info(f"Pipeline created with model: '{model_name}'")
-        result = nlp(prompt)
-        logging.info(f"Model output: {result}")
-        return result[0]['generated_text']
-    except Exception as e:
-        logging.error(f"Error analyzing issue with model '{model_name}': {e}")
-        return f"Error analyzing issue. Please try again later." # User-friendly error message
-### Function to find related issues
 def find_related_issues(issue_text: str, issues: list) -> list:
-    """
-    Finds semantically related issues from a list of issues based on the input issue text.
-    Args:
-        issue_text (str): The text of the issue for which to find related issues.
-        issues (list): A list of issues, where each issue is a dictionary with at least a 'title' key.
-    Returns:
-        list: A list of tuples, each containing a related issue (dictionary) and its similarity score to the input issue.
-              The list is sorted by similarity in descending order, limited to MAX_RELATED_ISSUES.
-    """
-    logging.info(f"Finding related issues for: '{issue_text}'")
     issue_embedding = similarity_model.encode(issue_text)
-    related_issues = []
-    for issue in issues:
-        title_embedding = similarity_model.encode(issue['title'])
-        similarity = util.cos_sim(issue_embedding, title_embedding)[0][0]
-        related_issues.append((issue, similarity))
-    related_issues = sorted(related_issues, key=lambda x: x[1], reverse=True)[:MAX_RELATED_ISSUES]
-    logging.info(f"Found related issues: {related_issues}")
     return related_issues
-### Function to fetch GitHub issues
 def fetch_github_issues(github_api_token: str, github_username: str, github_repository: str) -> list:
-    """
-    Fetches issues from a specified GitHub repository using the GitHub API.
-    Args:
-        github_api_token (str): The user's GitHub API token for authentication.
-        github_username (str): The username of the GitHub account owning the repository.
-        github_repository (str): The name of the GitHub repository.
-    Returns:
-        list: A list of dictionaries, where each dictionary represents a GitHub issue with its details.
-    Raises:
-        Exception: If there's an error fetching issues from the GitHub API.
-    """
-    logging.info(f"Fetching GitHub issues for: '{github_username}/{github_repository}'")
     url = f"{GITHUB_API_BASE_URL}/{github_username}/{github_repository}/issues"
-    headers = {
-        "Authorization": f"Bearer {github_api_token}",
-        "Accept": "application/vnd.github.v3+json"
-    }
     response = requests.get(url, headers=headers)
-    if response.status_code == 200:
-        issues = response.json()
-        logging.info(f"Fetched issues: {issues}")
-        return issues
-    else:
-        logging.error(f"Error fetching issues: Status Code {response.status_code}, Response: {response.text}")
-        raise Exception(f"Error fetching GitHub issues. Please check your credentials and repository.")
-### Function to handle chat responses
 def respond(
     command: str,
     history: list[tuple[str, str]],
@@ -154,161 +86,62 @@ def respond(
     severity: str,
     programming_language: str,
 ) -> str:
-    """
-    Handles user commands and generates responses using the selected language model.
-    Args:
-        command (str): The user's command or input.
-        history (list[tuple[str, str]]): The conversation history as a list of (user, assistant) message tuples.
-        system_message (str): The initial system message defining the chatbot's persona.
-        max_tokens (int): The maximum number of tokens allowed in the generated response.
-        temperature (float): The temperature parameter controlling the randomness of the generated text.
-        top_p (float): The top-p parameter for nucleus sampling, controlling the diversity of the generated text.
-        github_api_token (str): The user's GitHub API token for authentication.
-        github_username (str): The username of the GitHub account owning the repository.
-        github_repository (str): The name of the GitHub repository.
-        selected_model (str): The name of the language model selected for generating responses.
-        severity (str): The severity level of the issue (e.g., "Critical", "Major").
-        programming_language (str): The programming language relevant to the issue.
-    Returns:
-        str: The chatbot's response, generated by the selected language model or based on the command.
-    """
-    global issues
-    issues = [] # Reset issues for each interaction
-    messages = [{"role": "system", "content": system_message}]
-    logging.info(f"System message: {system_message}")
-    for user_msg, assistant_msg in history:
-        if user_msg:
-            messages.append({"role": "user", "content": user_msg})
-            logging.info(f"User message: {user_msg}")
-        if assistant_msg:
-            messages.append({"role": "assistant", "content": assistant_msg})
-            logging.info(f"Assistant message: {assistant_msg}")
-    logging.info(f"Command received: {command}")
-    if command == "/github":
-        if not github_api_token:
-            return "Please enter your GitHub API token first. <https://github.com/settings/tokens>"
-        else:
-            try:
-                issues = fetch_github_issues(github_api_token, github_username, github_repository)
-                issue_list = "\n".join([f"{i+1}. {issue['title']}" for i, issue in enumerate(issues)])
-                return f"Available GitHub Issues:\n{issue_list}\n\nEnter the issue number to analyze:"
-            except Exception as e:
-                logging.error(f"Error fetching GitHub issues: {e}")
-                return "Error fetching GitHub issues. Please check your credentials and repository."
-    elif command == "/help":
-        help_message = """Available commands:
-          - `/github`: Analyze a GitHub issue
-          - `/help`: Show this help message
-          - `/generate_code [code description]`: Generate code based on the description
-          - `/explain_concept [concept]`: Explain a concept
-          - `/write_documentation [topic]`: Write documentation for a given topic
-          - `/translate_code [code] to [target language]`: Translate code to another language"""
-        return help_message
-    elif command.isdigit() and issues:
-        try:
-            issue_number = int(command) - 1
-            issue = issues[issue_number]
-            issue_text = issue['title'] + "\n\n" + issue['body']
-            resolution = analyze_issues(issue_text, selected_model, severity, programming_language)
-            # Find and display related issues
-            related_issues = find_related_issues(issue_text, issues)
-            related_issue_text = "\n".join(
-                [f"- {issue['title']} (Similarity: {similarity:.2f})" for issue, similarity in related_issues]
-            )
-            return f"Resolution for Issue '{issue['title']}':\n{resolution}\n\nRelated Issues:\n{related_issue_text}"
-        except Exception as e:
-            logging.error(f"Error analyzing issue: {e}")
-            return "Error analyzing issue. Please try again later."
-    elif command.startswith("/generate_code"):
-        # Extract the code description from the command
-        code_description = command.replace("/generate_code", "").strip()
-        if not code_description:
-            return "Please provide a description of the code you want to generate."
-        else:
-            prompt = f"Generate code for the following: {code_description}\nProgramming Language: {programming_language}"
-            try:
-                generated_code = analyze_issues(prompt, selected_model)
-                code_output = f"<pre>{generated_code}</pre>"
-                return code_output
-            except Exception as e:
-                logging.error(f"Error generating code: {e}")
-                return "Error generating code. Please try again later."
-    elif command.startswith("/explain_concept"):
-        concept = command.replace("/explain_concept", "").strip()
-        if not concept:
-            return "Please provide a concept to explain."
-        else:
-            prompt = f"Explain the concept of {concept} in detail."
-            try:
-                explanation = analyze_issues(prompt, selected_model)
-                return f"<pre>{explanation}</pre>"
-            except Exception as e:
-                logging.error(f"Error explaining concept: {e}")
-                return "Error explaining concept. Please try again later."
-    elif command.startswith("/write_documentation"):
-        topic = command.replace("/write_documentation", "").strip()
-        if not topic:
-            return "Please provide a topic for the documentation."
         else:
-            prompt = f"Write documentation for the following topic: {topic}\nProgramming Language: {programming_language}"
-            try:
-                documentation = analyze_issues(prompt, selected_model)
-                return f"<pre>{documentation}</pre>"
-            except Exception as e:
-                logging.error(f"Error writing documentation: {e}")
-                return "Error writing documentation. Please try again later."
-    elif command.startswith("/translate_code"):
-        try:
-            code_and_language = command.replace("/translate_code", "").strip().split(" to ")
-            code = code_and_language[0]
-            target_language = code_and_language[1]
-            prompt = f"Translate the following code to {target_language}:\n\n{code}"
-            try:
-                translated_code = analyze_issues(prompt, selected_model)
-                code_output = f"<pre>{translated_code}</pre>"
-                return code_output
-            except Exception as e:
-                logging.error(f"Error translating code: {e}")
-                return "Error translating code. Please try again later."
-        except Exception as e:
-            logging.error(f"Error parsing translate_code command: {e}")
-            return "Error parsing translate_code command. Please check the syntax."
-    else:
-        messages.append({"role": "user", "content": command})
-        logging.info(f"User message: {command}")
-        response = ""
-        try:
-            for message in client.chat_completion(
-                messages,
-                max_tokens=max_tokens,
-                stream=True,
-                temperature=temperature,
-                top_p=top_p,
-            ):
-                logging.info(f"Received message from chat completion: {message}")
-                token = message.choices[0].delta.content
-                response += token
-                yield response # Use yield for streaming responses
-        except Exception as e:
-            logging.error(f"Error during chat completion: {e}")
-            return "An error occurred. Please try again later."
 with gr.Blocks() as demo:
     with gr.Row():
@@ -316,47 +149,41 @@ with gr.Blocks() as demo:
         github_username = gr.Textbox(label="GitHub Username")
         github_repository = gr.Textbox(label="GitHub Repository")
-    # Define system_message here, after github_username and github_repository are defined
     system_message = gr.Textbox(
-        value="You are GitBot, the Github project guardian angel. You resolve issues and propose implementation of feature requests",
         label="System message",
     )
-    # Model Selection Dropdown
     model_dropdown = gr.Dropdown(
         choices=[
-            "acecalisto3/InstructiPhi",
             "microsoft/CodeBERT-base",
-            "HuggingFaceH4/zephyr-7b-beta"
         ],
         label="Select Model for Issue Resolution",
-        value=DEFAULT_MODEL # Set a default model
     )
-    # Severity Dropdown
     severity_dropdown = gr.Dropdown(
         choices=["Critical", "Major", "Minor", "Trivial"],
         label="Severity",
-        value=None  # Default to no severity selected
     )
-    # Programming Language Textbox
     programming_language_textbox = gr.Textbox(label="Programming Language")
-    # Command Dropdown
     command_dropdown = gr.Dropdown(
         choices=[
-            "/github",
-            "/help",
-            "/generate_code",
             "/explain_concept",
             "/write_documentation",
-            "/translate_code"
         ],
         label="Select Command",
     )
-    chatbot = gr.ChatInterface(
         respond,
         additional_inputs=[
             command_dropdown,
@@ -375,9 +202,15 @@ with gr.Blocks() as demo:
             github_repository,
             model_dropdown,
             severity_dropdown,
-            programming_language_textbox
         ],
     )
 if __name__ == "__main__":
-    demo.queue().launch(share=True, server_name="0.0.0.0", server_port=7860)

 import gradio as gr
 from transformers import pipeline
 from sentence_transformers import SentenceTransformer, util
+import os
+import requests
 import logging
 # Configure logging for detailed insights
 # Constants for enhanced organization
 GITHUB_API_BASE_URL = "https://api.github.com/repos"
+DEFAULT_MODEL = "microsoft/CodeBERT-base"
+MAX_RELATED_ISSUES = 3
 # Hugging Face Inference Client
 client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
 # Load a pre-trained model for sentence similarity
 similarity_model = SentenceTransformer('all-mpnet-base-v2')
 def analyze_issues(issue_text: str, model_name: str, severity: str = None, programming_language: str = None) -> str:
+    # Initialize the model
+    model = pipeline("text-generation", model=model_name)
+    # Generate a response
+    response = model(
+        f"{system_message}\n{issue_text}\nAssistant: ",
+        max_length=max_tokens,
+        do_sample=True,
+        temperature=temperature,
+        top_k=top_p,
+    )
+    # Extract the assistant's response
+    assistant_response = response[0]['generated_text'].strip()
+    # Analyze the response
+    if "Severity" in assistant_response:
+        severity = assistant_response.split(":")[1].strip()
+    if "Programming Language" in assistant_response:
+        programming_language = assistant_response.split(":")[1].strip()
+    return {
+        'assistant_response': assistant_response,
+        'severity': severity,
+        'programming_language': programming_language,
+    }
 def find_related_issues(issue_text: str, issues: list) -> list:
+    # Calculate the similarity between the issue and other issues
     issue_embedding = similarity_model.encode(issue_text)
+    similarities = [util.cos_sim(issue_embedding, similarity_model.encode(issue['title'])) for issue in issues]
+    # Sort the issues by similarity
+    sorted_issues = sorted(enumerate(similarities), key=lambda x: x[1], reverse=True)
+    # Select the top related issues
+    related_issues = [issues[i] for i, similarity in sorted_issues[:MAX_RELATED_ISSUES]]
     return related_issues
 def fetch_github_issues(github_api_token: str, github_username: str, github_repository: str) -> list:
+    # Fetch the issues from the GitHub API
+    headers = {'Authorization': f'token {github_api_token}'}
     url = f"{GITHUB_API_BASE_URL}/{github_username}/{github_repository}/issues"
     response = requests.get(url, headers=headers)
+    # Parse the JSON response
+    issues = response.json()
+    return issues
 def respond(
     command: str,
     history: list[tuple[str, str]],
     severity: str,
     programming_language: str,
 ) -> str:
+    # Initialize the model
+    model = pipeline("text-generation", model=selected_model)
+    # Generate a response
+    response = model(
+        f"{system_message}\n{command}\n{history}\n{github_username}/{github_repository}\n{severity}\n{programming_language}\nAssistant: ",
+        max_length=max_tokens,
+        do_sample=True,
+        temperature=temperature,
+        top_k=top_p,
+    )
+    # Extract the assistant's response
+    assistant_response = response[0]['generated_text'].strip()
+    return assistant_response
+class MyChatbot(gr.ChatInterface):
+    def __init__(self, respond, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        self.respond = respond
+    def update_chat_history(self, message: str, is_user: bool) -> None:
+        if is_user:
+            self.history.append((message, None))
         else:
+            self.history.append((None, message))
+    def compute(self, *args, **kwargs):
+        command = args[0]
+        history = self.history
+        system_message = self.additional_inputs["system_message"]
+        max_tokens = self.additional_inputs["max_new_tokens"]
+        temperature = self.additional_inputs["temperature"]
+        top_p = self.additional_inputs["top_p"]
+        github_api_token = self.additional_inputs["github_api_token"]
+        github_username = self.additional_inputs["github_username"]
+        github_repository = self.additional_inputs["github_repository"]
+        selected_model = self.additional_inputs["model_dropdown"]
+        severity = self.additional_inputs["severity_dropdown"]
+        programming_language = self.additional_inputs["programming_language_textbox"]
+        return self.respond(
+            command,
+            history,
+            system_message,
+            max_tokens,
+            temperature,
+            top_p,
+            github_api_token,
+            github_username,
+            github_repository,
+            selected_model,
+            severity,
+            programming_language,
+        )
 with gr.Blocks() as demo:
     with gr.Row():
         github_username = gr.Textbox(label="GitHub Username")
         github_repository = gr.Textbox(label="GitHub Repository")
     system_message = gr.Textbox(
+        value="You are GitBot, the Github project guardian angel. You resolve issues and propose implementation of feature requests",
         label="System message",
     )
     model_dropdown = gr.Dropdown(
         choices=[
             "microsoft/CodeBERT-base",
+            "Salesforce/codegen-350M-mono",
         ],
         label="Select Model for Issue Resolution",
+        value=DEFAULT_MODEL,
     )
     severity_dropdown = gr.Dropdown(
         choices=["Critical", "Major", "Minor", "Trivial"],
         label="Severity",
+        value=None,
     )
     programming_language_textbox = gr.Textbox(label="Programming Language")
     command_dropdown = gr.Dropdown(
         choices=[
+            "/github",
+            "/help",
+            "/generate_code",
             "/explain_concept",
             "/write_documentation",
+            "/translate_code",
         ],
         label="Select Command",
     )
+    chatbot = MyChatbot(
         respond,
         additional_inputs=[
             command_dropdown,
             github_repository,
             model_dropdown,
             severity_dropdown,
+            programming_language_textbox,
         ],
     )
 if __name__ == "__main__":
+    demo.queue().launch(
+        share=True,
+        server_name="0.0.0.0",
+        server_port=7860,
+        show_header=False,
+        debug=True,
+    )