path: root/etc/tool/copilot.py



import sys
from pathlib import Path

sys.path.append(str(Path(__file__).parent.parent.parent))

import g4f
import json
import os
import re
import requests
from typing import Union
from github import Github
from github.PullRequest import PullRequest

g4f.debug.logging = True
g4f.debug.version_check = False

GITHUB_TOKEN = os.getenv('GITHUB_TOKEN')
GITHUB_REPOSITORY = os.getenv('GITHUB_REPOSITORY')
G4F_PROVIDER = os.getenv('G4F_PROVIDER')
G4F_MODEL = os.getenv('G4F_MODEL') or g4f.models.gpt_4o or g4f.models.gpt_4o

def get_github_token():
    token = os.getenv('GITHUB_TOKEN')
    if not token:
        raise ValueError("GITHUB_TOKEN environment variable is not set")
    print(f"Token length: {len(token)}")
    print(f"Token (masked): {'*' * (len(token) - 4) + token[-4:]}")
    if len(token) != 40 or not token.isalnum():
        raise ValueError("GITHUB_TOKEN appears to be invalid (should be 40 alphanumeric characters)")
    return token

def get_pr_details(github: Github) -> PullRequest:
    """
    Retrieves the details of the pull request from GitHub.

    Args:
        github (Github): The Github object to interact with the GitHub API.

    Returns:
        PullRequest: An object representing the pull request.
    """
    pr_number = os.getenv('PR_NUMBER')
    if not pr_number:
        print("PR_NUMBER environment variable is not set.")
        return None

    try:
        print(f"Attempting to get repo: {GITHUB_REPOSITORY}")
        repo = github.get_repo(GITHUB_REPOSITORY)
        print(f"Successfully got repo: {repo.full_name}")
        
        print(f"Attempting to get pull request: {pr_number}")
        pull = repo.get_pull(int(pr_number))
        print(f"Successfully got pull request: #{pull.number}")
        
        return pull
    except Exception as e:
        print(f"Error in get_pr_details: {e}")
        return None

def get_diff(diff_url: str) -> str:
    """
    Fetches the diff of the pull request from a given URL.

    Args:
        diff_url (str): URL to the pull request diff.

    Returns:
        str: The diff of the pull request.
    """
    response = requests.get(diff_url)
    response.raise_for_status()
    return response.text

def read_json(text: str) -> dict:
    """
    Parses JSON code block from a string.

    Args:
        text (str): A string containing a JSON code block.

    Returns:
        dict: A dictionary parsed from the JSON code block.
    """
    match = re.search(r"```(json|)\n(?P<code>[\S\s]+?)\n```", text)
    if match:
        text = match.group("code")
    try:
        return json.loads(text.strip())
    except json.JSONDecodeError:
        print("No valid json:", text)
        return {}

def read_text(text: str) -> str:
    """
    Extracts text from a markdown code block.

    Args:
        text (str): A string containing a markdown code block.

    Returns:
        str: The extracted text.
    """
    match = re.search(r"```(markdown|)\n(?P<text>[\S\s]+?)\n```", text)
    if match:
        return match.group("text")
    return text

def get_ai_response(prompt: str, as_json: bool = True) -> Union[dict, str]:
    """
    Gets a response from g4f API based on the prompt.

    Args:
        prompt (str): The prompt to send to g4f.
        as_json (bool): Whether to parse the response as JSON.

    Returns:
        Union[dict, str]: The parsed response from g4f, either as a dictionary or a string.
    """
    max_retries = 5
    providers = [None, 'Chatgpt4Online', 'OpenaiChat', 'Bing', 'Ai4Chat', 'NexraChatGPT']
    
    for provider in providers:
        for _ in range(max_retries):
            try:
                response = g4f.chat.completions.create(
                    G4F_MODEL,
                    [{'role': 'user', 'content': prompt}],
                    provider,
                    ignore_stream_and_auth=True
                )
                if as_json:
                    parsed_response = read_json(response)
                    if parsed_response and 'reviews' in parsed_response:
                        return parsed_response
                else:
                    parsed_response = read_text(response)
                    if parsed_response.strip():
                        return parsed_response
            except Exception as e:
                print(f"Error with provider {provider}: {e}")
    
    # If all retries and providers fail, return a default response
    if as_json:
        return {"reviews": []}
    else:
        return "AI Code Review: Unable to generate a detailed response. Please review the changes manually."

def analyze_code(pull: PullRequest, diff: str) -> list[dict]:
    """
    Analyzes the code changes in the pull request.

    Args:
        pull (PullRequest): The pull request object.
        diff (str): The diff of the pull request.

    Returns:
        list[dict]: A list of comments generated by the analysis.
    """
    comments = []
    changed_lines = []
    current_file_path = None
    offset_line = 0

    try:
        for line in diff.split('\n'):
            if line.startswith('+++ b/'):
                current_file_path = line[6:]
                changed_lines = []
            elif line.startswith('@@'):
                match = re.search(r'\+([0-9]+?),', line)
                if match:
                    offset_line = int(match.group(1))
            elif current_file_path:
                if (line.startswith('\\') or line.startswith('diff')) and changed_lines:
                    prompt = create_analyze_prompt(changed_lines, pull, current_file_path)
                    response = get_ai_response(prompt)
                    for review in response.get('reviews', []):
                        review['path'] = current_file_path
                        comments.append(review)
                    current_file_path = None
                elif line.startswith('-'):
                    changed_lines.append(line)
                else:
                    changed_lines.append(f"{offset_line}:{line}")
                    offset_line += 1
    except Exception as e:
        print(f"Error in analyze_code: {e}")
    
    if not comments:
        print("No comments generated by analyze_code")
    
    return comments

def create_analyze_prompt(changed_lines: list[str], pull: PullRequest, file_path: str):
    """
    Creates a prompt for the g4f model.

    Args:
        changed_lines (list[str]): The lines of code that have changed.
        pull (PullRequest): The pull request object.
        file_path (str): The path to the file being reviewed.

    Returns:
        str: The generated prompt.
    """
    code = "\n".join(changed_lines)
    example = '{"reviews": [{"line": <line_number>, "body": "<review comment>"}]}'
    return f"""Your task is to review pull requests. Instructions:
- Provide the response in following JSON format: {example}
- Do not give positive comments or compliments.
- Provide comments and suggestions ONLY if there is something to improve, otherwise "reviews" should be an empty array.
- Write the comment in GitHub Markdown format.
- Use the given description only for the overall context and only comment the code.
- IMPORTANT: NEVER suggest adding comments to the code.

Review the following code diff in the file "{file_path}" and take the pull request title and description into account when writing the response.
  
Pull request title: {pull.title}
Pull request description:
---
{pull.body}
---

Each line is prefixed by its number. Code to review:
```
{code}
```
"""

def create_review_prompt(pull: PullRequest, diff: str):
    """
    Creates a prompt to create a review comment.

    Args:
        pull (PullRequest): The pull request object.
        diff (str): The diff of the pull request.

    Returns:
        str: The generated prompt for review.
    """
    description = pull.body if pull.body else "No description provided."
    return f"""Your task is to review a pull request. Instructions:
- Write in name of g4f copilot. Don't use placeholder.
- Write the review in GitHub Markdown format.
- Thank the author for contributing to the project.
- If no issues are found, still provide a brief summary of the changes.

Pull request author: {pull.user.name or "Unknown"}
Pull request title: {pull.title or "Untitled Pull Request"}
Pull request description:
---
{description}
---

Diff:
```diff
{diff}
```

Please provide a comprehensive review of the changes, highlighting any potential issues or improvements, or summarizing the changes if no issues are found.
"""

def main():
    try:
        github_token = get_github_token()
    except ValueError as e:
        print(f"Error: {str(e)}")
        return

    if not GITHUB_REPOSITORY or not os.getenv('PR_NUMBER'):
        print("Error: GITHUB_REPOSITORY or PR_NUMBER environment variables are not set.")
        return

    print(f"GITHUB_REPOSITORY: {GITHUB_REPOSITORY}")
    print(f"PR_NUMBER: {os.getenv('PR_NUMBER')}")
    print("GITHUB_TOKEN is set")

    try:
        github = Github(github_token)
        
        # Test GitHub connection
        print("Testing GitHub connection...")
        try:
            user = github.get_user()
            print(f"Successfully authenticated as: {user.login}")
        except Exception as e:
            print(f"Error authenticating: {str(e)}")
            print(f"Error type: {type(e).__name__}")
            print(f"Error args: {e.args}")
            return
        
        # If connection is successful, proceed with PR details
        pull = get_pr_details(github)
        if not pull:
            print(f"No PR number found or invalid PR number")
            return
        print(f"Successfully fetched PR #{pull.number}")
        if pull.get_reviews().totalCount > 0 or pull.get_issue_comments().totalCount > 0:
            print(f"Has already a review")
            return
        
        diff = get_diff(pull.diff_url)
        review = "AI Code Review: Unable to generate a detailed response."
        comments = []
        
        try:
            review = get_ai_response(create_review_prompt(pull, diff), False)
            comments = analyze_code(pull, diff)
        except Exception as analysis_error:
            print(f"Error during analysis: {analysis_error}")
            review += f" Error during analysis: {str(analysis_error)[:200]}"
        
        print("Comments:", comments)
        
        review_body = review if review and review.strip() else "AI Code Review"
        if not review_body.strip():
            review_body = "AI Code Review: No specific issues found."
        
        try:
            if comments:
                pull.create_review(body=review_body, comments=comments, event='COMMENT')
            else:
                pull.create_review(body=review_body, event='COMMENT')
            print("Review posted successfully")
        except Exception as post_error:
            print(f"Error posting review: {post_error}")
            error_message = f"AI Code Review: An error occurred while posting the review. Error: {str(post_error)[:200]}. Please review the changes manually."
            pull.create_issue_comment(body=error_message)
    
    except Exception as e:
        print(f"Unexpected error in main: {e.__class__.__name__}: {e}")
        try:
            if 'pull' in locals():
                error_message = f"AI Code Review: An error occurred while processing this pull request. Error: {str(e)[:200]}. Please review the changes manually."
                pull.create_issue_comment(body=error_message)
            else:
                print("Unable to post error message: Pull request object not available")
        except Exception as post_error:
            print(f"Failed to post error message to pull request: {post_error}")

if __name__ == "__main__":
    main()