File size: 4,653 Bytes
8f72ba3
8929e00
8f72ba3
 
 
8929e00
8f72ba3
8929e00
 
 
 
 
8f72ba3
8929e00
8f72ba3
8929e00
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1df4261
8929e00
 
 
 
 
 
 
 
 
 
8f72ba3
8929e00
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8f72ba3
8929e00
 
8f72ba3
8929e00
8f72ba3
 
8929e00
 
8f72ba3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8929e00
8f72ba3
 
 
 
 
 
 
 
 
 
8929e00
8f72ba3
 
 
 
8929e00
8f72ba3
 
8929e00
 
 
 
 
8f72ba3
 
 
 
 
 
 
b6d5172
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
import os
import logging
import requests
import gradio as gr
from groq import Groq
from urllib.parse import urlparse

# Configure logging
logging.basicConfig(level=logging.INFO)


def extract_repo_id(input_str: str) -> str:
    """
    Extract the repository ID in the format 'user/repo' from a URL or plain string.
    """
    input_str = input_str.strip()

    # Remove trailing '.git' if present
    if input_str.endswith(".git"):
        input_str = input_str[:-4]

    # If input is a URL, parse it to extract the repo path.
    if input_str.startswith("http"):
        try:
            parsed = urlparse(input_str)
            path_parts = parsed.path.strip("/").split("/")
            if len(path_parts) >= 2:
                repo_id = "/".join(path_parts[:2])
                logging.info("Extracted repo_id: %s", repo_id)
                return repo_id
            else:
                raise ValueError("Invalid GitHub URL format.")
        except Exception as e:
            raise ValueError(f"Error parsing URL: {e}")
    else:
        # Assume it's already in the correct format.
        return input_str


def fetch_repo_details(repo_id: str) -> dict:
    """
    Fetch repository details from GitHub using its API.
    """
    api_url = f"https://api.github.com/repos/{repo_id}"
    response = requests.get(api_url)
    if response.status_code != 200:
        raise ValueError(
            f"Error: Unable to fetch repository details for '{repo_id}'. "
            f"Status code: {response.status_code}"
        )
    return response.json()


def fetch_readme(repo_id: str) -> str:
    """
    Attempt to fetch the README.md from the repository's main branch.
    """
    readme_url = f"https://raw.githubusercontent.com/{repo_id}/main/README.md"
    response = requests.get(readme_url)
    if response.status_code == 200:
        return response.text
    else:
        return "No README found."


def generate_docs(repo_input: str) -> str:
    """
    Fetch repository details from GitHub and generate documentation using the Groq API.
    """
    try:
        # Extract a clean repository ID.
        repo_id = extract_repo_id(repo_input)
    except ValueError as e:
        return str(e)

    try:
        repo_data = fetch_repo_details(repo_id)
    except ValueError as e:
        return str(e)

    # Extract repository information.
    repo_name = repo_data.get("name", repo_id)
    repo_description = repo_data.get("description", "No description provided.")
    readme_content = fetch_readme(repo_id)

    # Construct the prompt for the Groq API.
    prompt = (
        f"Generate comprehensive documentation for the GitHub repository '{repo_id}'. "
        f"The repository is named '{repo_name}' and its description is: {repo_description}. "
        f"Use the following README content as reference:\n\n{readme_content}\n\n"
        "Please include sections such as an introduction, installation instructions, usage examples, "
        "and any relevant details that would help a new user understand and work with this repository."
    )

    # Retrieve the Groq API key from environment variables.
    groq_api_key = os.environ.get("GROQ_API_KEY")
    if not groq_api_key:
        return "Error: GROQ_API_KEY environment variable is not set."

    # Initialize the Groq client.
    client = Groq(api_key=groq_api_key)

    try:
        # Call the Groq API with the generated prompt.
        chat_completion = client.chat.completions.create(
            messages=[{"role": "user", "content": prompt}],
            model="llama-3.3-70b-versatile",
            stream=False,
        )
    except Exception as e:
        return f"Error calling Groq API: {e}"

    # Extract and return the generated documentation.
    documentation = chat_completion.choices[0].message.content
    return documentation


# Define the Gradio Blocks interface.
with gr.Blocks() as demo:
    gr.Markdown("# GitHub Repository Documentation Generator")
    gr.Markdown(
        "Enter a GitHub repository URL or ID (in the format `user/repo`) below. "
        "This tool fetches repository details and uses the Groq API to generate documentation."
    )

    repo_id_input = gr.Textbox(
        label="GitHub Repository URL or ID",
        placeholder="https://github.com/octocat/Hello-World or octocat/Hello-World",
    )
    output_box = gr.Textbox(label="Generated Documentation", lines=20)
    generate_button = gr.Button("Generate Documentation")

    # When the button is clicked, call the generate_docs function.
    generate_button.click(fn=generate_docs, inputs=repo_id_input, outputs=output_box)

# Launch the Gradio app.
demo.launch(debug=True)