Files
pr-agent/pr_agent/tools/pr_reviewer.py

184 lines
8.2 KiB
Python
Raw Normal View History

2023-07-06 00:21:08 +03:00
import copy
import json
import logging
2023-07-19 01:03:47 +03:00
from collections import OrderedDict
2023-07-06 00:21:08 +03:00
from jinja2 import Environment, StrictUndefined
from pr_agent.algo.ai_handler import AiHandler
from pr_agent.algo.pr_processing import get_pr_diff
from pr_agent.algo.token_handler import TokenHandler
from pr_agent.algo.utils import convert_to_markdown, try_fix_json
2023-07-06 00:21:08 +03:00
from pr_agent.config_loader import settings
2023-07-18 10:17:09 +03:00
from pr_agent.git_providers import get_git_provider
2023-07-19 14:22:34 +03:00
from pr_agent.git_providers.git_provider import get_main_pr_language, IncrementalPR
2023-07-18 11:34:57 +03:00
from pr_agent.servers.help import actions_help_text, bot_help_text
2023-07-06 00:21:08 +03:00
class PRReviewer:
    """Produce an AI-generated review for a pull request and publish it.

    The reviewer renders the configured system/user prompts with PR metadata
    and the PR diff, asks the AI handler for a JSON prediction, converts that
    prediction to markdown and (optionally) publishes it through the git
    provider, together with inline code comments.
    """

    def __init__(self, pr_url: str, cli_mode=False, is_answer: bool = False, args=None):
        """Set up the git provider, prompt variables and token handler.

        Args:
            pr_url: URL of the pull request to review.
            cli_mode: When true, the "How to use" help section is not appended
                to the generated review.
            is_answer: When true, the latest question/answer comments are
                looked up in the PR discussion and passed to the prompt.
            args: Optional sequence of command arguments; a first element of
                "-i" requests an incremental review.

        Raises:
            Exception: If answer mode is requested but the git provider does
                not support "get_issue_comments".
        """
        self.parse_args(args)

        self.git_provider = get_git_provider()(pr_url, incremental=self.incremental)
        self.main_language = get_main_pr_language(
            self.git_provider.get_languages(), self.git_provider.get_files()
        )
        self.pr_url = pr_url
        self.is_answer = is_answer
        if self.is_answer and not self.git_provider.is_supported("get_issue_comments"):
            raise Exception(f"Answer mode is not supported for {settings.config.git_provider} for now")
        # _get_user_answers() returns (question, answer) in that order; unpacking
        # them the other way round would feed swapped values to the prompt.
        question_str, answer_str = self._get_user_answers()
        self.ai_handler = AiHandler()
        self.patches_diff = None
        self.prediction = None
        self.cli_mode = cli_mode
        self.vars = {
            "title": self.git_provider.pr.title,
            "branch": self.git_provider.get_pr_branch(),
            "description": self.git_provider.get_pr_description(),
            "language": self.main_language,
            "diff": "",  # empty diff for initial calculation
            "require_tests": settings.pr_reviewer.require_tests_review,
            "require_security": settings.pr_reviewer.require_security_review,
            "require_focused": settings.pr_reviewer.require_focused_review,
            'num_code_suggestions': settings.pr_reviewer.num_code_suggestions,
            # Only populated in answer mode; empty strings otherwise.
            'question_str': question_str,
            'answer_str': answer_str,
        }
        self.token_handler = TokenHandler(self.git_provider.pr,
                                          self.vars,
                                          settings.pr_review_prompt.system,
                                          settings.pr_review_prompt.user)

    def parse_args(self, args):
        """Parse command arguments and set ``self.incremental``.

        Args:
            args: Optional sequence of arguments. ``None`` or an empty
                sequence means a regular (non-incremental) review; a first
                element equal to "-i" enables incremental mode.
        """
        # `args` defaults to None in __init__, so it must not be passed to len().
        is_incremental = bool(args) and args[0] == "-i"
        self.incremental = IncrementalPR(is_incremental)

    async def review(self):
        """Run the full review flow.

        Fetches the PR diff, obtains the AI prediction, builds the markdown
        review and, when ``settings.config.publish_output`` is set, publishes
        it (plus inline code comments if enabled).

        Returns:
            An empty string.
        """
        logging.info('Reviewing PR...')
        if settings.config.publish_output:
            self.git_provider.publish_comment("Preparing review...", is_temporary=True)
        logging.info('Getting PR diff...')
        self.patches_diff = get_pr_diff(self.git_provider, self.token_handler)
        logging.info('Getting AI prediction...')
        self.prediction = await self._get_prediction()
        logging.info('Preparing PR review...')
        pr_comment = self._prepare_pr_review()
        if settings.config.publish_output:
            logging.info('Pushing PR review...')
            self.git_provider.publish_comment(pr_comment)
            self.git_provider.remove_initial_comment()
            if settings.pr_reviewer.inline_code_comments:
                logging.info('Pushing inline code comments...')
                self._publish_inline_code_comments()
        return ""

    async def _get_prediction(self):
        """Render the prompts with the current diff and query the AI handler.

        Returns:
            The response returned by ``self.ai_handler.chat_completion``.
        """
        variables = copy.deepcopy(self.vars)
        variables["diff"] = self.patches_diff  # update diff
        # StrictUndefined makes a prompt that references a missing variable
        # fail at render time instead of silently rendering it as empty.
        environment = Environment(undefined=StrictUndefined)
        system_prompt = environment.from_string(settings.pr_review_prompt.system).render(variables)
        user_prompt = environment.from_string(settings.pr_review_prompt.user).render(variables)
        if settings.config.verbosity_level >= 2:
            logging.info(f"\nSystem prompt:\n{system_prompt}")
            logging.info(f"\nUser prompt:\n{user_prompt}")
        model = settings.config.model
        # The finish reason is returned by the handler but not used here.
        response, _finish_reason = await self.ai_handler.chat_completion(model=model, temperature=0.2,
                                                                         system=system_prompt, user=user_prompt)
        return response

    def _load_prediction(self):
        """Parse ``self.prediction`` as JSON, falling back to ``try_fix_json``.

        Returns:
            The parsed prediction data.
        """
        review = self.prediction.strip()
        try:
            return json.loads(review)
        except json.decoder.JSONDecodeError:
            # Output that is not valid JSON is handed to the repair helper.
            return try_fix_json(review)

    def _prepare_pr_review(self) -> str:
        """Convert the AI prediction into the markdown text of the review.

        Returns:
            The markdown review, including the "How to use" help section
            unless running in CLI mode.
        """
        data = self._load_prediction()

        # A prediction without a 'PR Feedback' section is treated as having an
        # empty one, so the lookups below cannot raise KeyError.
        feedback = data.get('PR Feedback', {})

        # reordering for nicer display
        if 'Security concerns' in feedback:
            security_concerns = feedback.pop('Security concerns')
            data.setdefault('PR Analysis', {})['Security concerns'] = security_concerns

        if settings.config.git_provider != 'bitbucket' and \
                settings.pr_reviewer.inline_code_comments and \
                'Code suggestions' in feedback:
            # keeping only code suggestions that can't be submitted as inline comments
            feedback['Code suggestions'] = [
                d for d in feedback['Code suggestions']
                if any(key not in d for key in ('relevant file', 'relevant line in file', 'suggestion content'))
            ]
            if not feedback['Code suggestions']:
                del feedback['Code suggestions']

        if self.incremental.is_incremental:
            # Rename title when incremental review - Add to the beginning of the dict
            first_new_commit_url = f"{self.pr_url}/commits/{self.git_provider.incremental.first_new_commit_sha}"
            data = OrderedDict(data)
            data.update({'Incremental PR Review': {
                "⏮️ Review for commits since previous PR-Agent review": f"Starting from commit {first_new_commit_url}"}})
            data.move_to_end('Incremental PR Review', last=False)

        markdown_text = convert_to_markdown(data)
        user = self.git_provider.get_user_id()

        if not self.cli_mode:
            markdown_text += "\n### How to use\n"
            if user and '[bot]' not in user:
                markdown_text += bot_help_text(user)
            else:
                markdown_text += actions_help_text

        if settings.config.verbosity_level >= 2:
            logging.info(f"Markdown response:\n{markdown_text}")
        return markdown_text

    def _publish_inline_code_comments(self):
        """Publish the prediction's code suggestions as inline PR comments.

        Suggestions that lack a file, a line or content are skipped. When the
        provider supports "create_inline_comment" the comments are collected
        and published in one call; otherwise each one is published directly.
        """
        if settings.pr_reviewer.num_code_suggestions == 0:
            return

        data = self._load_prediction()
        # The model may omit the feedback section or the suggestions list;
        # treat either as "nothing to publish" rather than raising KeyError.
        suggestions = data.get('PR Feedback', {}).get('Code suggestions', [])

        comments = []
        for d in suggestions:
            relevant_file = d.get('relevant file', '').strip()
            relevant_line_in_file = d.get('relevant line in file', '').strip()
            content = d.get('suggestion content', '')
            if not relevant_file or not relevant_line_in_file or not content:
                logging.info("Skipping inline comment with missing file/line/content")
                continue

            if self.git_provider.is_supported("create_inline_comment"):
                comment = self.git_provider.create_inline_comment(content, relevant_file, relevant_line_in_file)
                if comment:
                    comments.append(comment)
            else:
                self.git_provider.publish_inline_comment(content, relevant_file, relevant_line_in_file)

        if comments:
            self.git_provider.publish_inline_comments(comments)

    def _get_user_answers(self):
        """Find the question and answer comments in the PR discussion.

        Only runs in answer mode (``self.is_answer``). The discussion is
        walked via the ``reversed`` attribute of the provider's issue
        comments, stopping as soon as both a question comment and an
        "/answer" comment have been found.

        Returns:
            A ``(question_str, answer_str)`` tuple; each element is an empty
            string when not found or when not in answer mode.
        """
        answer_str = question_str = ""
        if self.is_answer:
            discussion_messages = self.git_provider.get_issue_comments()
            # NOTE(review): relies on the returned collection exposing a
            # `.reversed` attribute - confirm for every supported provider.
            for message in discussion_messages.reversed:
                if "Questions to better understand the PR:" in message.body:
                    question_str = message.body
                elif '/answer' in message.body:
                    answer_str = message.body
                if answer_str and question_str:
                    break
        return question_str, answer_str