File size: 5,730 Bytes
86d1445
 
 
d6b7027
 
 
 
86d1445
05aecc2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
86d1445
 
 
 
 
d6b7027
 
05aecc2
5022335
d6b7027
 
 
05aecc2
5022335
d6b7027
968e76d
05aecc2
86d1445
 
d6b7027
05aecc2
86d1445
d6b7027
 
86d1445
d6b7027
 
edc590f
 
d6b7027
 
 
05aecc2
d6b7027
968e76d
 
d6b7027
 
05aecc2
d6b7027
968e76d
 
d6b7027
 
05aecc2
d6b7027
968e76d
 
d6b7027
 
05aecc2
d6b7027
968e76d
 
d6b7027
 
 
 
 
 
05aecc2
d6b7027
 
 
 
 
 
968e76d
 
d6b7027
05aecc2
d6b7027
05aecc2
968e76d
86d1445
b2506ee
05aecc2
d6b7027
968e76d
86d1445
 
 
 
 
 
 
 
 
 
 
 
968e76d
 
86d1445
 
 
 
5022335
86d1445
 
 
 
d6b7027
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
import gradio as gr
import os
import time
import tempfile
import traceback
from github import Github
from openai import OpenAI

# Mock functions for testing - replace these with your actual functions
def get_repo_info(repo_input):
    return repo_input.split('/')[-2:]

def clone_repo(owner, repo_name, temp_dir):
    return os.path.join(temp_dir, f"{owner}_{repo_name}")

def analyze_code(repo_path):
    return {"files": 10, "lines": 1000}

def analyze_issues(github_repo, max_issues):
    return [{"title": "Test Issue", "number": 1}]

def analyze_pull_requests(github_repo, max_prs):
    return [{"title": "Test PR", "number": 1}]

def llm_analyze_code(client, code_analysis):
    return "Code analysis summary"

def llm_analyze_issues(client, issues_data, repo_url):
    return {"summary": "Issues analysis summary"}

def llm_analyze_prs(client, prs_data, repo_url):
    return {"summary": "PRs analysis summary"}

def llm_synthesize_findings(client, code_analysis, issues_analysis, pr_analysis):
    return "Synthesized findings"

def generate_report(repo_info, code_analysis, issues_analysis, pr_analysis, final_analysis):
    return f"""
# Repository Analysis Report for {repo_info['owner']}/{repo_info['repo_name']}

## Code Analysis
{code_analysis['llm_analysis']}

## Issues Analysis
{issues_analysis['summary']}

## Pull Requests Analysis
{pr_analysis['summary']}

## Final Analysis
{final_analysis}
"""

def analyze_github_repo(repo_input, github_token=None):
    if github_token:
        os.environ["GITHUB_TOKEN"] = github_token
    
    github_token = os.environ.get("GITHUB_TOKEN")
    if not github_token:
        print("GitHub token not found")
        return "❌ Error: GITHUB_TOKEN environment variable not set.", gr.update(visible=True), gr.update(visible=False)

    openrouter_api_key = os.environ.get("OPENROUTER_API_KEY")
    if not openrouter_api_key:
        print("OpenRouter API key not found")
        return "❌ Error: OPENROUTER_API_KEY environment variable not set.", gr.update(visible=True), gr.update(visible=False)

    progress_md = ""
    
    try:
        owner, repo_name = get_repo_info(repo_input)
        repo_url = f"https://github.com/{owner}/{repo_name}"
        print(f"Analyzing repository: {repo_url}")
        
        g = Github(github_token)
        github_repo = g.get_repo(f"{owner}/{repo_name}")
        
        client = OpenAI(api_key=openrouter_api_key, base_url="https://openrouter.ai/api/v1")

        max_issues = 4
        max_prs = 4

        with tempfile.TemporaryDirectory() as temp_dir:
            repo_path = clone_repo(owner, repo_name, temp_dir)
            print(f"Cloned repository to: {repo_path}")

            progress_md += "πŸ”¬ Analyzing code structure...  \n"
            yield progress_md, gr.update(visible=True), gr.update(visible=False)
            code_analysis = analyze_code(repo_path)
            code_analysis['llm_analysis'] = llm_analyze_code(client, code_analysis)
            print("Code analysis complete")

            progress_md += f"πŸ“Š Analyzing issues (max {max_issues})...  \n"
            yield progress_md, gr.update(visible=True), gr.update(visible=False)
            issues_data = analyze_issues(github_repo, max_issues)
            issues_analysis = llm_analyze_issues(client, issues_data, repo_url)
            print("Issues analysis complete")

            progress_md += f"πŸ”€ Analyzing pull requests (max {max_prs})...  \n"
            yield progress_md, gr.update(visible=True), gr.update(visible=False)
            prs_data = analyze_pull_requests(github_repo, max_prs)
            pr_analysis = llm_analyze_prs(client, prs_data, repo_url)
            print("Pull requests analysis complete")

            progress_md += "🧠 Synthesizing findings...  \n"
            yield progress_md, gr.update(visible=True), gr.update(visible=False)
            final_analysis = llm_synthesize_findings(
                client, 
                code_analysis.get('llm_analysis', ''),
                issues_analysis.get('summary', ''),
                pr_analysis.get('summary', '')
            )
            print("Findings synthesized")

            repo_info = {
                "owner": owner,
                "repo_name": repo_name,
            }

            progress_md += "πŸ“ Generating report...  \n"
            yield progress_md, gr.update(visible=True), gr.update(visible=False)
            report = generate_report(repo_info, code_analysis, issues_analysis, pr_analysis, final_analysis)
            print("Report generated")

        print("Analysis complete, returning results")
        return progress_md + "βœ… Analysis complete!", gr.update(visible=False), gr.update(visible=True, value=report)
    except Exception as e:
        error_message = f"❌ An error occurred: {str(e)}"
        print(f"Error occurred: {error_message}")
        traceback.print_exc()
        return progress_md + error_message, gr.update(visible=True), gr.update(visible=False)

# Define the Gradio interface
with gr.Blocks() as app:
    gr.Markdown("# GitHub Repository Analyzer")
    
    repo_input = gr.Textbox(label="Enter GitHub Repository Slug or URL")
    
    with gr.Accordion("Advanced Settings", open=False):
        github_token = gr.Textbox(label="GitHub Token (optional)", type="password")
    
    analyze_button = gr.Button("Analyze Repository")
    
    progress_output = gr.Markdown(label="Progress")
    report_output = gr.Markdown(label="Analysis Report", visible=False)
    
    analyze_button.click(
        analyze_github_repo,
        inputs=[repo_input, github_token],
        outputs=[progress_output, progress_output, report_output],
    )

# Launch the app
if __name__ == "__main__":
    app.launch()