github_pr_review_agent

Sleeping

App Files Files Community

LukeMattingly committed on Feb 17

Commit

3ac40d9

1 Parent(s): 0a1dae9

updated ui, redoing tools to work with diffs

Browse files

Files changed (3) hide show

.gitignore +5 -0
CustomGradioUI.py +41 -0
app.py +84 -8

.gitignore ADDED Viewed

	@@ -0,0 +1,5 @@

+venv
+tools
+__pycache__
+.env
+certificate.pem

CustomGradioUI.py ADDED Viewed

	@@ -0,0 +1,41 @@

+import gradio as gr
+from smolagents import GradioUI
class CustomGradioUI(GradioUI):
    """Chat UI for the PR review agent with a custom header and input prompt.

    Subclasses ``GradioUI`` and overrides ``launch`` to add introductory
    Markdown above the chatbot and a PR-specific label on the text box.
    """

    def launch(self, **kwargs):
        """Build the Gradio Blocks page and start the server.

        Args:
            **kwargs: Extra keyword arguments forwarded to ``demo.launch``.
                ``debug`` and ``share`` default to ``True``; pass either one
                here to override the default.
        """
        with gr.Blocks(fill_height=True) as demo:
            # Header and instructions shown at the very top of the page.
            gr.Markdown("## Welcome my Github PR Review Agent 🤖")
            gr.Markdown("Follow the instructions below to interact with the agent. Type your chat message in the box and hit enter.")

            # Per-session state: the pending user messages and the log of
            # uploaded files handed to the message/upload callbacks below.
            stored_messages = gr.State([])
            file_uploads_log = gr.State([])

            chatbot = gr.Chatbot(
                label="Agent",
                type="messages",
                avatar_images=(
                    None,
                    "https://huggingface.co/datasets/agents-course/course-images/resolve/main/en/communication/Alfred.png",
                ),
                resizeable=True,
                scale=1,
            )

            # Only expose the upload widgets when an upload folder is configured.
            if self.file_upload_folder is not None:
                upload_file = gr.File(label="Upload a file")
                upload_status = gr.Textbox(label="Upload Status", interactive=False, visible=False)
                upload_file.change(
                    self.upload_file,
                    [upload_file, file_uploads_log],
                    [upload_status, file_uploads_log],
                )

            text_input = gr.Textbox(lines=1, label="Please provide a link to your github pull request for review.")
            # On submit: record the user message first, then run the agent and
            # stream its output into the chatbot.
            text_input.submit(
                self.log_user_message,
                [text_input, file_uploads_log],
                [stored_messages, text_input],
            ).then(self.interact_with_agent, [stored_messages, chatbot], [chatbot])

        # Merge defaults with caller options instead of passing both as
        # keywords: `launch(share=False)` previously raised TypeError because
        # `share` was supplied twice.
        launch_options = {"debug": True, "share": True, **kwargs}
        demo.launch(**launch_options)

app.py CHANGED Viewed

@@ -9,6 +9,7 @@ import ast
 from typing import List
 from huggingface_hub import login
 import os
 from Gradio_UI import GradioUI
@@ -165,11 +166,46 @@ def get_pr_files_changed(github_url: str, pr_number: int) -> List[str]:
             return [f"Error fetching PR files: {response.json().get('message', 'Unknown error')}"]
         files = response.json()
-        return [file['filename'] for file in files]
     except Exception as e:
         return [f"Error retrieving files for PR #{pr_number}: {str(e)}"]
 @tool
 def detect_code_smells(code: str) -> str:
     """Detects common code smells such as long functions and deeply nested loops.
@@ -198,6 +234,40 @@ def detect_code_smells(code: str) -> str:
     except Exception as e:
         return f"Error analyzing code: {str(e)}"
 '''
 @tool
 def get_file_content(github_url: str, file_path: str) -> str:
     """Fetches the content of a specific file from the GitHub repository.
@@ -220,12 +290,14 @@ def get_file_content(github_url: str, file_path: str) -> str:
         return f"Error: {str(e)}"
         '''
 @tool
-def security_check_code(code: str) -> str:
-    """Analyzes the provided code snippet for potential security vulnerabilities.
     Args:
-        code: The source code to be analyzed for common security issues (e.g., hardcoded secrets, unsafe functions).
     Returns:
         A string listing detected potential security vulnerabilities based on common patterns (e.g., hardcoded credentials,
@@ -233,6 +305,7 @@ def security_check_code(code: str) -> str:
     """
     import re
     issues = []
     # Check for hardcoded credentials (case-insensitive search)
     secret_patterns = [
@@ -288,11 +361,11 @@ def check_documentation_updates(changed_files: str) -> str:
         return "No documentation updates detected. Consider reviewing the docs to ensure they reflect the new changes."
 @tool
-def lint_code(code: str) -> str:
     """Analyzes the provided code snippet for style and potential issues using a linter.
     Args:
-        code: The source code to be analyzed.
     Returns:
         A string with linting warnings and suggestions for improvement, or a message indicating that no issues were found.
@@ -300,6 +373,9 @@ def lint_code(code: str) -> str:
     # This is a placeholder; you could integrate pylint or flake8 via subprocess or an API.
     # For demonstration, we'll simulate a response.
     issues = []
     if "print(" in code:
         issues.append("Consider removing debug print statements.")
     if not issues:
@@ -329,7 +405,7 @@ with open("prompts.yaml", 'r') as stream:
 agent = CodeAgent(
     model=model,
-    tools=[final_answer, get_open_pull_requests, find_todo_comments, get_pr_diff, get_pr_files_changed, detect_code_smells, security_check_code, check_documentation_updates, lint_code, get_pr_diff_for_file ], ## add your tools here (don't remove final answer)
     max_steps=6,
     verbosity_level=1,
     grammar=None,
@@ -340,4 +416,4 @@ agent = CodeAgent(
 )
-GradioUI(agent).launch()

 from typing import List
 from huggingface_hub import login
 import os
+from CustomGradioUI import CustomGradioUI
 from Gradio_UI import GradioUI
             return [f"Error fetching PR files: {response.json().get('message', 'Unknown error')}"]
         files = response.json()
+        files_changed = [file['filename'] for file in files]
+        print(files_changed)
+        return files_changed
     except Exception as e:
         return [f"Error retrieving files for PR #{pr_number}: {str(e)}"]
+#Helper Function
# Line prefixes that identify file-level diff metadata rather than code.
# "diff " and "index " carry a trailing space so that unprefixed code such as
# `different = 1` or `indexes = []` is not mistaken for a header.
_DIFF_METADATA_PREFIXES = (
    "diff ",
    "index ",
    "---",
    "+++",
    "new file mode",
    "deleted file mode",
    "old mode",
    "new mode",
    "similarity index",
    "rename from",
    "rename to",
    "Binary files",
)


def diff_to_code(diff: str) -> str:
    """
    Converts a unified diff string into a regular code string by extracting
    added and context lines, while ignoring diff metadata and removed lines.

    Lines that carry no diff prefix at all are kept unchanged, so plain code
    passed in place of a diff mostly passes through.

    Args:
        diff: A unified diff string representing code changes.

    Returns:
        A string containing the reconstructed code, lines joined with "\\n".
        An empty diff yields an empty string.
    """
    code_lines = []
    for line in diff.splitlines():
        # Skip file headers and git extended-header lines.
        if line.startswith(_DIFF_METADATA_PREFIXES):
            continue
        # Skip hunk headers. A plain prefix test is used instead of a regex so
        # the helper does not depend on `re` being imported at module level.
        if line.startswith("@@"):
            continue
        # Skip the "\ No newline at end of file" marker; it is not code.
        if line.startswith("\\ "):
            continue
        # Skip removed lines.
        if line.startswith("-"):
            continue
        # Added ('+') and context (' ') lines: drop the one-character prefix.
        if line.startswith(("+", " ")):
            code_lines.append(line[1:])
        else:
            code_lines.append(line)
    return "\n".join(code_lines)
+'''
 @tool
 def detect_code_smells(code: str) -> str:
     """Detects common code smells such as long functions and deeply nested loops.
     except Exception as e:
         return f"Error analyzing code: {str(e)}"
 '''
def _max_loop_depth(node: ast.AST) -> int:
    """Return the length of the longest chain of nested loops at or below node."""
    deepest_child = max(
        (_max_loop_depth(child) for child in ast.iter_child_nodes(node)),
        default=0,
    )
    if isinstance(node, (ast.For, ast.AsyncFor, ast.While)):
        return deepest_child + 1
    return deepest_child


@tool
def detect_code_smells_diff(diff: str) -> str:
    """Detects common code smells such as long functions and deeply nested loops from a code diff.

    Args:
        diff: A unified diff string representing changes in code to analyze for potential code smells.

    Returns:
        A string listing detected code smells based on the added and context code lines.
        If no code smells are found, returns a message indicating the code is clean.
        If the reconstructed code cannot be parsed or analyzed, returns an error message instead.
    """
    try:
        # Use the helper function to convert the diff into a code string.
        code = diff_to_code(diff)
        tree = ast.parse(code)
        issues = []
        for node in ast.walk(tree):
            # Detect long functions (more than 20 top-level statements in the body).
            if isinstance(node, (ast.FunctionDef, ast.AsyncFunctionDef)) and len(node.body) > 20:
                issues.append(f"Long function detected: {node.name} ({len(node.body)} statements)")
            # Detect deeply nested loops by true nesting depth. Counting every
            # loop in the subtree would flag sibling loops that are not nested.
            if isinstance(node, (ast.For, ast.AsyncFor, ast.While)):
                if _max_loop_depth(node) > 2:
                    issues.append(f"Deeply nested loop detected at line {node.lineno}")
        return "\n".join(issues) if issues else "No code smells detected."
    except Exception as e:
        # Tools report failures as text so the agent can read them; a diff
        # fragment frequently is not valid standalone Python.
        return f"Error analyzing code diff: {str(e)}"
+'''
 @tool
 def get_file_content(github_url: str, file_path: str) -> str:
     """Fetches the content of a specific file from the GitHub repository.
         return f"Error: {str(e)}"
         '''
 @tool
+def security_check_code_diff(diff: str) -> str:
+    """Analyzes the provided code diff for potential security vulnerabilities.
     Args:
+        diff: A unified diff string representing changes in code. The source code to be analyzed for common security issues (e.g., hardcoded secrets, unsafe functions).
     Returns:
         A string listing detected potential security vulnerabilities based on common patterns (e.g., hardcoded credentials,
     """
     import re
     issues = []
+    code = diff_to_code(diff)
     # Check for hardcoded credentials (case-insensitive search)
     secret_patterns = [
         return "No documentation updates detected. Consider reviewing the docs to ensure they reflect the new changes."
 @tool
+def lint_code(diff: str) -> str:
     """Analyzes the provided code snippet for style and potential issues using a linter.
     Args:
+        diff: The source code to be analyzed.
     Returns:
         A string with linting warnings and suggestions for improvement, or a message indicating that no issues were found.
     # This is a placeholder; you could integrate pylint or flake8 via subprocess or an API.
     # For demonstration, we'll simulate a response.
     issues = []
+    code = diff_to_code(diff)
     if "print(" in code:
         issues.append("Consider removing debug print statements.")
     if not issues:
 agent = CodeAgent(
     model=model,
+    tools=[final_answer, get_open_pull_requests, find_todo_comments, get_pr_diff, get_pr_files_changed, detect_code_smells_diff, security_check_code, check_documentation_updates, lint_code, get_pr_diff_for_file ], ## add your tools here (don't remove final answer)
     max_steps=6,
     verbosity_level=1,
     grammar=None,
 )
+CustomGradioUI(agent).launch()