pr-agent/pr_agent/algo/ai_handlers/langchain_ai_handler.py

try:
    from langchain_core.messages import HumanMessage, SystemMessage
    from langchain_openai import AzureChatOpenAI, ChatOpenAI
except:  # we don't enforce langchain as a dependency, so if it's not installed, just move on
    pass

import functools

import openai
from tenacity import retry, retry_if_exception_type, retry_if_not_exception_type, stop_after_attempt

from pr_agent.algo.ai_handlers.base_ai_handler import BaseAiHandler
from pr_agent.config_loader import get_settings
from pr_agent.log import get_logger

# Maximum number of attempts the tenacity retry policy on
# LangChainOpenAIHandler.chat_completion makes before it stops retrying.
OPENAI_RETRIES = 5


class LangChainOpenAIHandler(BaseAiHandler):
    """AI handler that sends chat requests through LangChain's OpenAI chat models.

    ``AzureChatOpenAI`` is used when the ``OPENAI.API_TYPE`` setting equals
    ``"azure"`` (case-insensitive); otherwise ``ChatOpenAI`` is used, optionally
    pointed at a custom ``OPENAI.API_BASE``.
    """

    def __init__(self):
        super().__init__()
        self.azure = get_settings().get("OPENAI.API_TYPE", "").lower() == "azure"

        # Build (and discard) a chat object so that missing settings are
        # reported at construction time rather than on the first request.
        self._create_chat(self.deployment_id)

    def chat(self, messages: list, model: str, temperature: float):
        """Invoke a freshly created chat model with ``messages``.

        Args:
            messages: LangChain message objects forming the conversation.
            model: Model name forwarded to ``invoke``.
            temperature: Sampling temperature forwarded to ``invoke``.

        Returns:
            Whatever the chat model's ``invoke`` call returns.
        """
        # A new chat object is created per call so that the current
        # deployment_id setting is always the one in effect.
        chat = self._create_chat(self.deployment_id)
        return chat.invoke(input=messages, model=model, temperature=temperature)

    @property
    def deployment_id(self):
        """
        Returns the deployment ID for the OpenAI API.

        Read from the ``OPENAI.DEPLOYMENT_ID`` setting on every access;
        ``None`` when the setting is absent.
        """
        return get_settings().get("OPENAI.DEPLOYMENT_ID", None)

    @retry(
        retry=retry_if_exception_type(openai.APIError) & retry_if_not_exception_type(openai.RateLimitError),
        stop=stop_after_attempt(OPENAI_RETRIES),
    )
    async def chat_completion(self, model: str, system: str, user: str, temperature: float = 0.2):
        """Request a single chat completion for a system + user prompt pair.

        Args:
            model: Model name passed through to :meth:`chat`.
            system: Content of the system message.
            user: Content of the human (user) message.
            temperature: Sampling temperature passed through to :meth:`chat`.

        Returns:
            A ``(content, finish_reason)`` tuple, where ``content`` is the
            ``content`` attribute of the response and ``finish_reason`` is
            always the string ``"completed"``.

        Raises:
            openai.RateLimitError: Logged and re-raised; excluded from retries.
            openai.APIError: Logged and re-raised; this is the exception type
                the retry policy reacts to (up to ``OPENAI_RETRIES`` attempts).
                Any other exception is wrapped in ``openai.APIError`` so it is
                handled by the same policy.

        NOTE(review): :meth:`chat` is called without ``await``, so this
        coroutine appears to block while the request is in flight - confirm
        this is acceptable for the callers' event loop.
        """
        try:
            messages = [SystemMessage(content=system), HumanMessage(content=user)]

            # get a chat completion from the formatted messages
            resp = self.chat(messages, model=model, temperature=temperature)
            finish_reason = "completed"
            return resp.content, finish_reason

        except openai.RateLimitError as e:
            get_logger().error(f"Rate limit error during LLM inference: {e}")
            raise
        except openai.APIError as e:
            get_logger().warning(f"Error during LLM inference: {e}")
            raise
        except Exception as e:
            get_logger().warning(f"Unknown error during LLM inference: {e}")
            # openai.APIError cannot be instantiated without arguments, so a bare
            # `raise openai.APIError` would surface as a TypeError instead.
            # There is no HTTP request associated with an unknown failure,
            # hence request=None.
            raise openai.APIError(
                message=f"Unknown error during LLM inference: {e}",
                request=None,
                body=None,
            ) from e

    def _create_chat(self, deployment_id=None):
        """Build the LangChain chat model described by the current settings.

        Args:
            deployment_id: Azure deployment name; only used when ``self.azure``
                is true.

        Returns:
            An ``AzureChatOpenAI`` instance in Azure mode, otherwise a
            ``ChatOpenAI`` instance (with ``openai_api_base`` set when the
            ``OPENAI.API_BASE`` setting is non-empty).

        Raises:
            ValueError: If reading a required setting raised an
                ``AttributeError`` that carries the missing attribute's name.
            AttributeError: Re-raised unchanged when no attribute name is
                available on the exception.
        """
        try:
            settings = get_settings()
            if self.azure:
                # All Azure settings are read here, at creation time, so that a
                # missing one is reported through the ValueError below.
                return AzureChatOpenAI(
                    openai_api_key=settings.openai.key,
                    openai_api_version=settings.openai.api_version,
                    azure_deployment=deployment_id,
                    azure_endpoint=settings.openai.api_base,
                )

            # LLMs that are OpenAI-compatible are reached through a custom API base
            openai_api_base = settings.get("OPENAI.API_BASE", None)
            if not openai_api_base:
                return ChatOpenAI(openai_api_key=settings.openai.key)
            return ChatOpenAI(openai_api_key=settings.openai.key, openai_api_base=openai_api_base)
        except AttributeError as e:
            # `name` is not guaranteed to exist on AttributeError (it was added
            # in Python 3.10 and may be None), so read it defensively instead of
            # risking a second AttributeError that hides the original one.
            missing = getattr(e, "name", None)
            if missing:
                raise ValueError(f"OpenAI {missing} is required") from e
            raise
Make LangChain dependency optional in pr-agent and update requirements.txt 2023-12-14 09:05:53 +02:00			`try:`
Format files by `pre-commit run -a` Signed-off-by: Yu Ishikawa <yu-iskw@users.noreply.github.com> 2024-10-30 09:56:03 +09:00			`from langchain_core.messages import HumanMessage, SystemMessage`
			`from langchain_openai import AzureChatOpenAI, ChatOpenAI`
Update Python code formatting, configuration loading, and local model additions 1. Code Formatting: - Standardized Python code formatting across multiple files to align with PEP 8 guidelines. This includes adjustments to whitespace, line breaks, and inline comments. 2. Configuration Loader Enhancements: - Enhanced the `get_settings` function in `config_loader.py` to provide more robust handling of settings retrieval. Added detailed documentation to improve code maintainability and clarity. 3. Model Addition in __init__.py: - Added a new model "ollama/llama3" with a token limit to the MAX_TOKENS dictionary in `__init__.py` to support new AI capabilities and configurations. 2024-06-03 23:58:31 +08:00			`except: # we don't enforce langchain as a dependency, so if it's not installed, just move on`
Make LangChain dependency optional in pr-agent and update requirements.txt 2023-12-14 09:05:53 +02:00			`pass`
update langchain 2023-12-12 23:52:50 +08:00
Format files by `pre-commit run -a` Signed-off-by: Yu Ishikawa <yu-iskw@users.noreply.github.com> 2024-10-30 09:56:03 +09:00			`import functools`
add LangChain AI Handler 2023-12-12 23:03:49 +08:00
fix: exclude RateLimitError from retry logic 2025-05-22 15:04:16 +09:00			`import openai`
			`from tenacity import retry, retry_if_exception_type, retry_if_not_exception_type, stop_after_attempt`
Format files by `pre-commit run -a` Signed-off-by: Yu Ishikawa <yu-iskw@users.noreply.github.com> 2024-10-30 09:56:03 +09:00
			`from pr_agent.algo.ai_handlers.base_ai_handler import BaseAiHandler`
			`from pr_agent.config_loader import get_settings`
			`from pr_agent.log import get_logger`
update langchain 2023-12-12 23:52:50 +08:00
			`OPENAI_RETRIES = 5`

Update Python code formatting, configuration loading, and local model additions 1. Code Formatting: - Standardized Python code formatting across multiple files to align with PEP 8 guidelines. This includes adjustments to whitespace, line breaks, and inline comments. 2. Configuration Loader Enhancements: - Enhanced the `get_settings` function in `config_loader.py` to provide more robust handling of settings retrieval. Added detailed documentation to improve code maintainability and clarity. 3. Model Addition in __init__.py: - Added a new model "ollama/llama3" with a token limit to the MAX_TOKENS dictionary in `__init__.py` to support new AI capabilities and configurations. 2024-06-03 23:58:31 +08:00
Update langchain 2023-12-12 23:28:58 +08:00			`class LangChainOpenAIHandler(BaseAiHandler):`
add LangChain AI Handler 2023-12-12 23:03:49 +08:00			`def __init__(self):`
			`# Initialize OpenAIHandler specific attributes here`
Add support for Azure OpenAI in LangChainOpenAIHandler 2024-01-04 16:08:10 +02:00			`super().__init__()`
			`self.azure = get_settings().get("OPENAI.API_TYPE", "").lower() == "azure"`
Fix LangChainOpenAIHandler for Azure 2024-08-08 09:55:18 -04:00
			`# Create a default unused chat object to trigger early validation`
			`self._create_chat(self.deployment_id)`
Update Python code formatting, configuration loading, and local model additions 1. Code Formatting: - Standardized Python code formatting across multiple files to align with PEP 8 guidelines. This includes adjustments to whitespace, line breaks, and inline comments. 2. Configuration Loader Enhancements: - Enhanced the `get_settings` function in `config_loader.py` to provide more robust handling of settings retrieval. Added detailed documentation to improve code maintainability and clarity. 3. Model Addition in __init__.py: - Added a new model "ollama/llama3" with a token limit to the MAX_TOKENS dictionary in `__init__.py` to support new AI capabilities and configurations. 2024-06-03 23:58:31 +08:00
1. update LangChainOpenAIHandler to support langchain version 0.2 2. read openai_api_base from settings for llms that compatible with openai 2024-06-06 22:27:01 +08:00			`def chat(self, messages: list, model: str, temperature: float):`
Fix LangChainOpenAIHandler for Azure 2024-08-08 09:55:18 -04:00			`chat = self._create_chat(self.deployment_id)`
			`return chat.invoke(input=messages, model=model, temperature=temperature)`
Update langchain 2023-12-12 23:28:58 +08:00
add LangChain AI Handler 2023-12-12 23:03:49 +08:00			`@property`
			`def deployment_id(self):`
			`"""`
			`Returns the deployment ID for the OpenAI API.`
			`"""`
			`return get_settings().get("OPENAI.DEPLOYMENT_ID", None)`
Update Python code formatting, configuration loading, and local model additions 1. Code Formatting: - Standardized Python code formatting across multiple files to align with PEP 8 guidelines. This includes adjustments to whitespace, line breaks, and inline comments. 2. Configuration Loader Enhancements: - Enhanced the `get_settings` function in `config_loader.py` to provide more robust handling of settings retrieval. Added detailed documentation to improve code maintainability and clarity. 3. Model Addition in __init__.py: - Added a new model "ollama/llama3" with a token limit to the MAX_TOKENS dictionary in `__init__.py` to support new AI capabilities and configurations. 2024-06-03 23:58:31 +08:00
fix: exclude RateLimitError from retry logic 2025-05-22 15:04:16 +09:00			`@retry(`
			`retry=retry_if_exception_type(openai.APIError) & retry_if_not_exception_type(openai.RateLimitError),`
			`stop=stop_after_attempt(OPENAI_RETRIES),`
			`)`
add LangChain AI Handler 2023-12-12 23:03:49 +08:00			`async def chat_completion(self, model: str, system: str, user: str, temperature: float = 0.2):`
			`try:`
Update Python code formatting, configuration loading, and local model additions 1. Code Formatting: - Standardized Python code formatting across multiple files to align with PEP 8 guidelines. This includes adjustments to whitespace, line breaks, and inline comments. 2. Configuration Loader Enhancements: - Enhanced the `get_settings` function in `config_loader.py` to provide more robust handling of settings retrieval. Added detailed documentation to improve code maintainability and clarity. 3. Model Addition in __init__.py: - Added a new model "ollama/llama3" with a token limit to the MAX_TOKENS dictionary in `__init__.py` to support new AI capabilities and configurations. 2024-06-03 23:58:31 +08:00			`messages = [SystemMessage(content=system), HumanMessage(content=user)]`

add LangChain AI Handler 2023-12-12 23:03:49 +08:00			`# get a chat completion from the formatted messages`
Update langchain 2023-12-12 23:28:58 +08:00			`resp = self.chat(messages, model=model, temperature=temperature)`
Update Python code formatting, configuration loading, and local model additions 1. Code Formatting: - Standardized Python code formatting across multiple files to align with PEP 8 guidelines. This includes adjustments to whitespace, line breaks, and inline comments. 2. Configuration Loader Enhancements: - Enhanced the `get_settings` function in `config_loader.py` to provide more robust handling of settings retrieval. Added detailed documentation to improve code maintainability and clarity. 3. Model Addition in __init__.py: - Added a new model "ollama/llama3" with a token limit to the MAX_TOKENS dictionary in `__init__.py` to support new AI capabilities and configurations. 2024-06-03 23:58:31 +08:00			`finish_reason = "completed"`
add LangChain AI Handler 2023-12-12 23:03:49 +08:00			`return resp.content, finish_reason`
Update Python code formatting, configuration loading, and local model additions 1. Code Formatting: - Standardized Python code formatting across multiple files to align with PEP 8 guidelines. This includes adjustments to whitespace, line breaks, and inline comments. 2. Configuration Loader Enhancements: - Enhanced the `get_settings` function in `config_loader.py` to provide more robust handling of settings retrieval. Added detailed documentation to improve code maintainability and clarity. 3. Model Addition in __init__.py: - Added a new model "ollama/llama3" with a token limit to the MAX_TOKENS dictionary in `__init__.py` to support new AI capabilities and configurations. 2024-06-03 23:58:31 +08:00
fix: exclude RateLimitError from retry logic 2025-05-22 15:04:16 +09:00			`except openai.RateLimitError as e:`
			`get_logger().error(f"Rate limit error during LLM inference: {e}")`
			`raise`
			`except openai.APIError as e:`
			`get_logger().warning(f"Error during LLM inference: {e}")`
			`raise`
			`except Exception as e:`
			`get_logger().warning(f"Unknown error during LLM inference: {e}")`
			`raise openai.APIError from e`
Fix LangChainOpenAIHandler for Azure 2024-08-08 09:55:18 -04:00
			`def _create_chat(self, deployment_id=None):`
			`try:`
			`if self.azure:`
			`# using a partial function so we can set the deployment_id later to support fallback_deployments`
			`# but still need to access the other settings now so we can raise a proper exception if they're missing`
			`return AzureChatOpenAI(`
			`openai_api_key=get_settings().openai.key,`
			`openai_api_version=get_settings().openai.api_version,`
			`azure_deployment=deployment_id,`
			`azure_endpoint=get_settings().openai.api_base,`
			`)`
			`else:`
			`# for llms that compatible with openai, should use custom api base`
			`openai_api_base = get_settings().get("OPENAI.API_BASE", None)`
			`if openai_api_base is None or len(openai_api_base) == 0:`
			`return ChatOpenAI(openai_api_key=get_settings().openai.key)`
			`else:`
			`return ChatOpenAI(openai_api_key=get_settings().openai.key, openai_api_base=openai_api_base)`
			`except AttributeError as e:`
			`if getattr(e, "name"):`
			`raise ValueError(f"OpenAI {e.name} is required") from e`
			`else:`
			`raise e`