Spaces:

patched-codes
/

analyze-gh-repo

Running

App Files Files Community

codelion committed on Sep 21, 2024

Commit

ec0c2ab

verified ·

1 Parent(s): d3b6911

Update github_repo_analyzer.py

Browse files

Files changed (1) hide show

github_repo_analyzer.py +43 -16

github_repo_analyzer.py CHANGED Viewed

@@ -2,7 +2,7 @@ import os
 import sys
 import tempfile
 import shutil
-from urllib.parse import urlparse
 import requests
 from github import Github
 from git import Repo
@@ -45,8 +45,28 @@ def get_repo_info(input_str):
 def clone_repo(owner, repo_name, temp_dir):
     repo_url = f"https://github.com/{owner}/{repo_name}.git"
-    Repo.clone_from(repo_url, temp_dir)
-    return temp_dir
 def analyze_code(repo_path):
     file_types = defaultdict(int)
@@ -519,18 +539,20 @@ def llm_synthesize_findings(client, code_analysis, issues_analysis, pr_analysis)
     return call_llm(client, prompt, max_tokens=8192)
-def generate_report(repo_info, code_analysis, issues_analysis, pr_analysis, final_analysis):
     repo_url = f"https://github.com/{repo_info['owner']}/{repo_info['repo_name']}"
     report = f"""# LLM-Assisted Workflow Analysis for {repo_info['owner']}/{repo_info['repo_name']}
 ## Repository Overview
-- Owner: {repo_info['owner']}
-- Repository: {repo_info['repo_name']}
-- URL: {repo_url}
-- File types: {code_analysis.get('file_types', 'N/A')}
 ## Code Analysis
 """
     if isinstance(code_analysis.get('llm_analysis'), dict):
@@ -541,12 +563,14 @@ def generate_report(repo_info, code_analysis, issues_analysis, pr_analysis, fina
             report += f"- {pattern}\n"
         report += "\n### Best Practices\n"
-        report += "#### Followed:\n"
         for practice in code_llm_analysis.get('best_practices', {}).get('followed', []):
             report += f"- {practice}\n"
-        report += "\n#### Missing:\n"
         for practice in code_llm_analysis.get('best_practices', {}).get('missing', []):
             report += f"- {practice}\n"
         report += "\n### Areas for Improvement\n"
         for area in code_llm_analysis.get('areas_for_improvement', []):
@@ -554,12 +578,16 @@ def generate_report(repo_info, code_analysis, issues_analysis, pr_analysis, fina
         report += "\n### Potential Vulnerabilities\n"
         for vuln in code_llm_analysis.get('potential_vulnerabilities', []):
-            report += f"- {vuln['description']} in `{vuln['file_path']}` (Severity: {vuln['severity']})\n"
         report += "\n### LLM-Assisted Coding Opportunities\n"
         for opp in code_llm_analysis.get('llm_opportunities', []):
             report += f"- **Task:** {opp['task']}\n"
-            report += f"  - **File:** `{opp['file_path']}`\n"
             report += f"  - **Improvement:** {opp['improvement']}\n\n"
     else:
         report += "No structured code analysis available.\n"
@@ -574,7 +602,7 @@ def generate_report(repo_info, code_analysis, issues_analysis, pr_analysis, fina
         report += "\n### Promising LLM-Assisted Workflows for Issues\n"
         for workflow in issues_analysis['summary'].get('promising_workflows', []):
             report += f"- **Workflow:** {workflow['workflow']}\n"
-            report += f"  - **Example Issue:** [{workflow['applicable_issue']}]({repo_url}/issues/{workflow['applicable_issue']})\n\n"
         report += "### Overall Recommendations for Issue Management\n"
         for rec in issues_analysis['summary'].get('overall_recommendations', ['No recommendations available.']):
@@ -592,7 +620,7 @@ def generate_report(repo_info, code_analysis, issues_analysis, pr_analysis, fina
         report += "\n### Promising LLM-Assisted Workflows for Pull Requests\n"
         for workflow in pr_analysis['summary'].get('promising_workflows', []):
             report += f"- **Workflow:** {workflow['workflow']}\n"
-            report += f"  - **Example PR:** [{workflow['applicable_pr']}]({repo_url}/pull/{workflow['applicable_pr']})\n\n"
         report += "### Overall Recommendations for PR Process\n"
         for rec in pr_analysis['summary'].get('overall_recommendations', ['No recommendations available.']):
@@ -600,5 +628,4 @@ def generate_report(repo_info, code_analysis, issues_analysis, pr_analysis, fina
     else:
         report += "No structured pull requests analysis available.\n"
-    report += f"\n## Synthesis and Recommendations\n{final_analysis}\n"
     return report

 import sys
 import tempfile
 import shutil
+from urllib.parse import urlparse, quote
 import requests
 from github import Github
 from git import Repo
 def clone_repo(owner, repo_name, temp_dir):
     repo_url = f"https://github.com/{owner}/{repo_name}.git"
+    # Clone the repository
+    repo = Repo.clone_from(repo_url, temp_dir)
+    # Get the default branch
+    default_branch = repo.active_branch.name
+    # Get the full name of the repository (owner/repo_name)
+    full_name = f"{owner}/{repo_name}"
+    # Create the repo_info object
+    repo_info = {
+        "owner": owner,
+        "repo_name": repo_name,
+        "full_name": full_name,
+        "repo_url": repo_url,
+        "local_path": temp_dir,
+        "default_branch": default_branch,
+        "git_repo": repo
+    }
+    return repo_info
 def analyze_code(repo_path):
     file_types = defaultdict(int)
     return call_llm(client, prompt, max_tokens=8192)
+def generate_report(repo_info, code_analysis, issues_analysis, pr_analysis):
     repo_url = f"https://github.com/{repo_info['owner']}/{repo_info['repo_name']}"
+    default_branch = repo_info.get('default_branch', 'master')  # Assume 'master' if not provided
     report = f"""# LLM-Assisted Workflow Analysis for {repo_info['owner']}/{repo_info['repo_name']}
 ## Repository Overview
+- **Owner:** {repo_info['owner']}
+- **Repository:** {repo_info['repo_name']}
+- **URL:** [{repo_url}]({repo_url})
+- **File types:** {', '.join(f"{ext} ({count})" for ext, count in code_analysis.get('file_types', {}).items())}
 ## Code Analysis
 """
     if isinstance(code_analysis.get('llm_analysis'), dict):
             report += f"- {pattern}\n"
         report += "\n### Best Practices\n"
+        report += "<details><summary>Followed</summary>\n\n"
         for practice in code_llm_analysis.get('best_practices', {}).get('followed', []):
             report += f"- {practice}\n"
+        report += "</details>\n\n"
+        report += "<details><summary>Missing</summary>\n\n"
         for practice in code_llm_analysis.get('best_practices', {}).get('missing', []):
             report += f"- {practice}\n"
+        report += "</details>\n"
         report += "\n### Areas for Improvement\n"
         for area in code_llm_analysis.get('areas_for_improvement', []):
         report += "\n### Potential Vulnerabilities\n"
         for vuln in code_llm_analysis.get('potential_vulnerabilities', []):
+            relative_path = os.path.relpath(vuln['file_path'], repo_info['local_path'])
+            file_url = f"{repo_url}/blob/{default_branch}/{quote(relative_path)}"
+            report += f"- [{vuln['description']}]({file_url}) (Severity: {vuln['severity']})\n"
         report += "\n### LLM-Assisted Coding Opportunities\n"
         for opp in code_llm_analysis.get('llm_opportunities', []):
+            relative_path = os.path.relpath(opp['file_path'], repo_info['local_path'])
+            file_url = f"{repo_url}/blob/{default_branch}/{quote(relative_path)}"
             report += f"- **Task:** {opp['task']}\n"
+            report += f"  - **File:** [`{relative_path}`]({file_url})\n"
             report += f"  - **Improvement:** {opp['improvement']}\n\n"
     else:
         report += "No structured code analysis available.\n"
         report += "\n### Promising LLM-Assisted Workflows for Issues\n"
         for workflow in issues_analysis['summary'].get('promising_workflows', []):
             report += f"- **Workflow:** {workflow['workflow']}\n"
+            report += f"  - **Example Issue:** [#{workflow['applicable_issue']}]({repo_url}/issues/{workflow['applicable_issue']})\n\n"
         report += "### Overall Recommendations for Issue Management\n"
         for rec in issues_analysis['summary'].get('overall_recommendations', ['No recommendations available.']):
         report += "\n### Promising LLM-Assisted Workflows for Pull Requests\n"
         for workflow in pr_analysis['summary'].get('promising_workflows', []):
             report += f"- **Workflow:** {workflow['workflow']}\n"
+            report += f"  - **Example PR:** [#{workflow['applicable_pr']}]({repo_url}/pull/{workflow['applicable_pr']})\n\n"
         report += "### Overall Recommendations for PR Process\n"
         for rec in pr_analysis['summary'].get('overall_recommendations', ['No recommendations available.']):
     else:
         report += "No structured pull requests analysis available.\n"
     return report