pr-agent/pr_agent/algo/ai_handler.py

import logging

import litellm
import openai
from litellm import acompletion
from openai.error import APIError, RateLimitError, Timeout, TryAgain
from retry import retry
from pr_agent.config_loader import get_settings
# Number of attempts passed as `tries` to the retry decorator on
# AiHandler.chat_completion.
OPENAI_RETRIES = 5


class AiHandler:
    """
    Handle chat-completion requests issued through litellm.

    On construction the handler copies API keys and endpoint settings from the
    project configuration into the ``openai`` / ``litellm`` module globals.
    ``chat_completion`` then sends a system + user message pair and returns the
    first choice of the response.
    """

    def __init__(self):
        """
        Load provider credentials and endpoint settings from the configuration.

        The OpenAI key is read unconditionally; every other setting is applied
        only when it is present (truthy) in the configuration.

        Raises:
            ValueError: If any settings lookup raises AttributeError (most
                commonly because the OpenAI key is not configured).
        """
        try:
            settings = get_settings()
            openai.api_key = settings.openai.key
            litellm.openai_key = settings.openai.key
            self.azure = False
            if settings.get("OPENAI.ORG", None):
                litellm.organization = settings.openai.org
            if settings.get("OPENAI.API_TYPE", None):
                if settings.openai.api_type == "azure":
                    # Azure deployments reuse the OpenAI key setting.
                    self.azure = True
                    litellm.azure_key = settings.openai.key
            if settings.get("OPENAI.API_VERSION", None):
                litellm.api_version = settings.openai.api_version
            if settings.get("OPENAI.API_BASE", None):
                litellm.api_base = settings.openai.api_base
            if settings.get("ANTHROPIC.KEY", None):
                litellm.anthropic_key = settings.anthropic.key
            if settings.get("COHERE.KEY", None):
                litellm.cohere_key = settings.cohere.key
            if settings.get("REPLICATE.KEY", None):
                litellm.replicate_key = settings.replicate.key
            if settings.get("HUGGINGFACE.KEY", None):
                litellm.huggingface_key = settings.huggingface.key
                # The HuggingFace base URL is only honoured when a HuggingFace
                # key is configured; it overrides any OpenAI api_base set above.
                if settings.get("HUGGINGFACE.API_BASE", None):
                    litellm.api_base = settings.huggingface.api_base
        except AttributeError as e:
            raise ValueError("OpenAI key is required") from e

    @property
    def deployment_id(self):
        """
        Returns the configured ``OPENAI.DEPLOYMENT_ID`` setting, or None if unset.
        """
        return get_settings().get("OPENAI.DEPLOYMENT_ID", None)

    # NOTE(review): `retry` is a synchronous decorator wrapping a coroutine
    # function. Exceptions raised while the coroutine is awaited may not pass
    # through the decorator, in which case no retry happens - confirm and, if
    # so, move to an async-aware retry loop.
    @retry(exceptions=(APIError, Timeout, TryAgain, AttributeError, RateLimitError),
           tries=OPENAI_RETRIES, delay=2, backoff=2, jitter=(1, 3))
    async def chat_completion(self, model: str, system: str, user: str, temperature: float = 0.2):
        """
        Performs a chat completion through litellm's ``acompletion``.

        Args:
            model (str): The model to use for chat completion.
            system (str): The system message for chat completion.
            user (str): The user message for chat completion.
            temperature (float): The temperature parameter for chat completion.

        Returns:
            tuple: ``(content, finish_reason)`` taken from the first choice of
            the response.

        Raises:
            APIError: If the API reports an error during inference.
            Timeout: If the request times out during inference.
            RateLimitError: If the request is rejected due to rate limiting.
            TryAgain: If any other exception occurs during inference (the
                original exception is chained as the cause), or if the
                response is None or contains no choices.
        """
        try:
            deployment_id = self.deployment_id
            if get_settings().config.verbosity_level >= 2:
                logging.debug(
                    f"Generating completion with {model}"
                    f"{(' from deployment ' + deployment_id) if deployment_id else ''}"
                )
            response = await acompletion(
                model=model,
                deployment_id=deployment_id,
                messages=[
                    {"role": "system", "content": system},
                    {"role": "user", "content": user}
                ],
                temperature=temperature,
                azure=self.azure,
                force_timeout=get_settings().config.ai_timeout
            )
        except (APIError, Timeout, TryAgain) as e:
            # "%s" placeholder is required: logging %-formats the message with
            # the extra args, and a message without a placeholder fails to format.
            logging.error("Error during OpenAI inference: %s", e)
            raise
        except RateLimitError as e:
            logging.error("Rate limit error during OpenAI inference: %s", e)
            raise
        except Exception as e:
            # Anything unexpected is converted to TryAgain so that it falls
            # into the set of exceptions listed in the retry decorator.
            logging.error("Unknown error during OpenAI inference: %s", e)
            raise TryAgain from e
        if response is None or len(response["choices"]) == 0:
            raise TryAgain
        first_choice = response["choices"][0]
        resp = first_choice['message']['content']
        finish_reason = first_choice["finish_reason"]
        # Emit the raw completion through logging (not stdout), and only at the
        # same verbosity level used for the request debug message above.
        if get_settings().config.verbosity_level >= 2:
            logging.debug("Completion finished (%s): %s", finish_reason, resp)
        return resp, finish_reason
Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`import logging`

Default timeout for AI is now 180s, configurable 2023-08-07 13:26:28 +03:00			`import litellm`
Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`import openai`
Default timeout for AI is now 180s, configurable 2023-08-07 13:26:28 +03:00			`from litellm import acompletion`
Support context aware settings (for each incoming request), support override of settings, refactor CLI to use pr_agent.py 2023-08-01 14:43:26 +03:00			`from openai.error import APIError, RateLimitError, Timeout, TryAgain`
Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`from retry import retry`
Support context aware settings (for each incoming request), support override of settings, refactor CLI to use pr_agent.py 2023-08-01 14:43:26 +03:00			`from pr_agent.config_loader import get_settings`
Default timeout for AI is now 180s, configurable 2023-08-07 13:26:28 +03:00			`OPENAI_RETRIES = 5`

Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00
			`class AiHandler:`
docstring 2023-07-20 10:51:21 +03:00			`"""`
			`This class handles interactions with the OpenAI API for chat completions.`
			`It initializes the API key and other settings from a configuration file,`
			`and provides a method for performing chat completions using the OpenAI ChatCompletion API.`
			`"""`

Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`def __init__(self):`
docstring 2023-07-20 10:51:21 +03:00			`"""`
			`Initializes the OpenAI API key and other settings from a configuration file.`
			`Raises a ValueError if the OpenAI key is missing.`
			`"""`
Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`try:`
Support context aware settings (for each incoming request), support override of settings, refactor CLI to use pr_agent.py 2023-08-01 14:43:26 +03:00			`openai.api_key = get_settings().openai.key`
bug fixes and updates 2023-08-03 16:05:46 -07:00			`litellm.openai_key = get_settings().openai.key`
bug fixes 2023-08-05 22:50:41 -07:00			`self.azure = False`
Support context aware settings (for each incoming request), support override of settings, refactor CLI to use pr_agent.py 2023-08-01 14:43:26 +03:00			`if get_settings().get("OPENAI.ORG", None):`
bug fixes 2023-08-05 22:50:41 -07:00			`litellm.organization = get_settings().openai.org`
Support context aware settings (for each incoming request), support override of settings, refactor CLI to use pr_agent.py 2023-08-01 14:43:26 +03:00			`if get_settings().get("OPENAI.API_TYPE", None):`
bug fixes 2023-08-05 22:50:41 -07:00			`if get_settings().openai.api_type == "azure":`
			`self.azure = True`
			`litellm.azure_key = get_settings().openai.key`
Support context aware settings (for each incoming request), support override of settings, refactor CLI to use pr_agent.py 2023-08-01 14:43:26 +03:00			`if get_settings().get("OPENAI.API_VERSION", None):`
bug fixes 2023-08-05 22:50:41 -07:00			`litellm.api_version = get_settings().openai.api_version`
Support context aware settings (for each incoming request), support override of settings, refactor CLI to use pr_agent.py 2023-08-01 14:43:26 +03:00			`if get_settings().get("OPENAI.API_BASE", None):`
bug fixes and updates 2023-08-03 16:05:46 -07:00			`litellm.api_base = get_settings().openai.api_base`
bug fixes 2023-08-05 22:50:41 -07:00			`if get_settings().get("ANTHROPIC.KEY", None):`
			`litellm.anthropic_key = get_settings().anthropic.key`
			`if get_settings().get("COHERE.KEY", None):`
			`litellm.cohere_key = get_settings().cohere.key`
			`if get_settings().get("REPLICATE.KEY", None):`
			`litellm.replicate_key = get_settings().replicate.key`
adding huggingface inference support + litellm debugger 2023-08-21 15:31:51 -07:00			`if get_settings().get("REPLICATE.KEY", None):`
			`litellm.replicate_key = get_settings().replicate.key`
			`if get_settings().get("HUGGINGFACE.KEY", None):`
			`litellm.huggingface_key = get_settings().huggingface.key`
showing how to use huggingface models 2023-09-05 16:23:22 -07:00			`if get_settings().get("HUGGINGFACE.API_BASE", None):`
			`litellm.api_base = get_settings().huggingface.api_base`
Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`except AttributeError as e:`
			`raise ValueError("OpenAI key is required") from e`

Support fallback deployments to accompany fallback models This is useful for example in Azure OpenAI deployments where you have a different deployment per model, so the current fallback implementation doesn't work (still uses the same deployment for each fallback attempt) 2023-08-07 16:17:06 +03:00			`@property`
			`def deployment_id(self):`
			`"""`
			`Returns the deployment ID for the OpenAI API.`
			`"""`
			`return get_settings().get("OPENAI.DEPLOYMENT_ID", None)`

Retry on rate limit error on OpenAI calls 2023-07-20 15:01:12 +03:00			`@retry(exceptions=(APIError, Timeout, TryAgain, AttributeError, RateLimitError),`
Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`tries=OPENAI_RETRIES, delay=2, backoff=2, jitter=(1, 3))`
extended improve 2023-08-21 09:07:21 +03:00			`async def chat_completion(self, model: str, system: str, user: str, temperature: float = 0.2):`
docstring 2023-07-20 10:51:21 +03:00			`"""`
			`Performs a chat completion using the OpenAI ChatCompletion API.`
			`Retries in case of API errors or timeouts.`

			`Args:`
			`model (str): The model to use for chat completion.`
			`temperature (float): The temperature parameter for chat completion.`
			`system (str): The system message for chat completion.`
			`user (str): The user message for chat completion.`

			`Returns:`
			`tuple: A tuple containing the response and finish reason from the API.`

			`Raises:`
			`TryAgain: If the API response is empty or there are no choices in the response.`
			`APIError: If there is an error during OpenAI inference.`
			`Timeout: If there is a timeout during OpenAI inference.`
			`TryAgain: If there is an attribute error during OpenAI inference.`
			`"""`
Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`try:`
Logging 2023-08-07 22:42:53 +03:00			`deployment_id = self.deployment_id`
			`if get_settings().config.verbosity_level >= 2:`
			`logging.debug(`
			`f"Generating completion with {model}"`
			`f"{(' from deployment ' + deployment_id) if deployment_id else ''}"`
			`)`
adding support for Anthropic, Cohere, Replicate, Azure 2023-08-03 12:04:08 -07:00			`response = await acompletion(`
Default timeout for AI is now 180s, configurable 2023-08-07 13:26:28 +03:00			`model=model,`
Merge branch 'main' into zmeir-fallback_deployments 2023-08-08 11:00:13 +03:00			`deployment_id=deployment_id,`
Default timeout for AI is now 180s, configurable 2023-08-07 13:26:28 +03:00			`messages=[`
			`{"role": "system", "content": system},`
			`{"role": "user", "content": user}`
			`],`
			`temperature=temperature,`
Fixed incorrect usage for Azure OpenAI API 2023-08-28 16:13:26 +03:00			`azure=self.azure,`
Default timeout for AI is now 180s, configurable 2023-08-07 13:26:28 +03:00			`force_timeout=get_settings().config.ai_timeout`
			`)`
Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`except (APIError, Timeout, TryAgain) as e:`
			`logging.error("Error during OpenAI inference: ", e)`
			`raise`
Retry on rate limit error on OpenAI calls 2023-07-20 15:01:12 +03:00			`except (RateLimitError) as e:`
			`logging.error("Rate limit error during OpenAI inference: ", e)`
			`raise`
Retry on rate limit error on OpenAI calls 2023-07-20 15:02:34 +03:00			`except (Exception) as e:`
			`logging.error("Unknown error during OpenAI inference: ", e)`
			`raise TryAgain from e`
bug fixes and updates 2023-08-03 16:05:46 -07:00			`if response is None or len(response["choices"]) == 0:`
Initial commit - PR-Agent OSS release 2023-07-06 00:21:08 +03:00			`raise TryAgain`
bug fixes and updates 2023-08-03 16:05:46 -07:00			`resp = response["choices"][0]['message']['content']`
			`finish_reason = response["choices"][0]["finish_reason"]`
			`print(resp, finish_reason)`
Default timeout for AI is now 180s, configurable 2023-08-07 13:26:28 +03:00			`return resp, finish_reason`