Mirror of https://github.com/qodo-ai/pr-agent.git
Update Python code formatting and configuration loading; add local model
1. Code Formatting: Standardized Python code formatting across multiple files to align with PEP 8 guidelines, including adjustments to whitespace, line breaks, and inline comments.
2. Configuration Loader Enhancements: Enhanced the `get_settings` function in `config_loader.py` for more robust settings retrieval, and added detailed documentation to improve maintainability and clarity.
3. Model Addition in `__init__.py`: Added a new model "ollama/llama3" with a token limit to the MAX_TOKENS dictionary in `__init__.py` to support new AI capabilities and configurations.
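For context, the new entry is selected like any other model: pr-agent reads `config.model` from its settings, and the `update_settings_from_args` helper touched at the end of this diff turns `--key=value` arguments into settings overrides. A minimal sketch of wiring up the new model (the Ollama URL is that tool's usual default, assumed here, and not something this commit sets):

from pr_agent.algo.utils import update_settings_from_args
from pr_agent.config_loader import get_settings

# Point pr-agent at the locally served model added in this commit.
update_settings_from_args([
    "--config.model=ollama/llama3",
    "--ollama.api_base=http://localhost:11434",  # assumed Ollama default, not set by this commit
])
print(get_settings().config.model)  # -> "ollama/llama3"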
pr_agent/algo/__init__.py

@@ -9,7 +9,7 @@ MAX_TOKENS = {
     'gpt-4': 8000,
     'gpt-4-0613': 8000,
     'gpt-4-32k': 32000,
-    'gpt-4-1106-preview': 128000, # 128K, but may be limited by config.max_model_tokens
+    'gpt-4-1106-preview': 128000,  # 128K, but may be limited by config.max_model_tokens
     'gpt-4-0125-preview': 128000,  # 128K, but may be limited by config.max_model_tokens
     'gpt-4o': 128000,  # 128K, but may be limited by config.max_model_tokens
     'gpt-4o-2024-05-13': 128000,  # 128K, but may be limited by config.max_model_tokens
@@ -36,4 +36,5 @@ MAX_TOKENS = {
     'bedrock/anthropic.claude-3-haiku-20240307-v1:0': 100000,
     'groq/llama3-8b-8192': 8192,
     'groq/llama3-70b-8192': 8192,
+    "ollama/llama3": 4096,
 }
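The "may be limited by config.max_model_tokens" comments describe an optional global ceiling applied on top of each model's context size. A sketch of that lookup, under the assumption that the helper simply takes the minimum of the two values (the repo's actual helper may differ in detail):

from pr_agent.algo import MAX_TOKENS
from pr_agent.config_loader import get_settings

def get_max_tokens_sketch(model: str) -> int:
    max_tokens_model = MAX_TOKENS[model]  # e.g. 4096 for "ollama/llama3"
    limit = get_settings().config.max_model_tokens  # falsy means no extra cap
    if limit:
        max_tokens_model = min(max_tokens_model, limit)
    return max_tokens_model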
pr_agent/algo/ai_handlers/base_ai_handler.py

@@ -1,5 +1,6 @@
 from abc import ABC, abstractmethod
 
+
 class BaseAiHandler(ABC):
     """
     This class defines the interface for an AI handler to be used by the PR Agents.
@@ -14,7 +15,7 @@ class BaseAiHandler(ABC):
     def deployment_id(self):
         pass
 
-    @abstractmethod
+    @abstractmethod
     async def chat_completion(self, model: str, system: str, user: str, temperature: float = 0.2, img_path: str = None):
         """
         This method should be implemented to return a chat completion from the AI model.
@@ -25,4 +26,3 @@ class BaseAiHandler(ABC):
             temperature (float): the temperature to use for the chat completion
         """
         pass
-
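The interface above is the contract every concrete handler in this commit implements. A toy subclass, purely illustrative (the class name and echo behavior are made up):

from pr_agent.algo.ai_handlers.base_ai_handler import BaseAiHandler


class EchoAiHandler(BaseAiHandler):
    """Hypothetical handler: satisfies the interface without calling a model."""

    def __init__(self):
        pass

    @property
    def deployment_id(self):
        return None  # only Azure-style deployments need a real value

    async def chat_completion(self, model: str, system: str, user: str,
                              temperature: float = 0.2, img_path: str = None):
        # A real handler would call its provider here; this one just echoes.
        return f"[{model}] {user}", "completed"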
pr_agent/algo/ai_handlers/langchain_ai_handler.py

@@ -1,7 +1,7 @@
 try:
     from langchain.chat_models import ChatOpenAI, AzureChatOpenAI
     from langchain.schema import SystemMessage, HumanMessage
-except: # we don't enforce langchain as a dependency, so if it's not installed, just move on
+except:  # we don't enforce langchain as a dependency, so if it's not installed, just move on
     pass
 
 from pr_agent.algo.ai_handlers.base_ai_handler import BaseAiHandler
@@ -14,6 +14,7 @@ import functools
 
 OPENAI_RETRIES = 5
 
+
 class LangChainOpenAIHandler(BaseAiHandler):
     def __init__(self):
         # Initialize OpenAIHandler specific attributes here
@@ -36,7 +37,7 @@ class LangChainOpenAIHandler(BaseAiHandler):
                 raise ValueError(f"OpenAI {e.name} is required") from e
             else:
                 raise e
-
+
     @property
     def chat(self):
         if self.azure:
@@ -51,17 +52,18 @@ class LangChainOpenAIHandler(BaseAiHandler):
         Returns the deployment ID for the OpenAI API.
         """
         return get_settings().get("OPENAI.DEPLOYMENT_ID", None)
 
     @retry(exceptions=(APIError, Timeout, TryAgain, AttributeError, RateLimitError),
            tries=OPENAI_RETRIES, delay=2, backoff=2, jitter=(1, 3))
     async def chat_completion(self, model: str, system: str, user: str, temperature: float = 0.2):
         try:
-            messages=[SystemMessage(content=system), HumanMessage(content=user)]
+            messages = [SystemMessage(content=system), HumanMessage(content=user)]
+
             # get a chat completion from the formatted messages
             resp = self.chat(messages, model=model, temperature=temperature)
-            finish_reason="completed"
+            finish_reason = "completed"
             return resp.content, finish_reason
-
+
         except (Exception) as e:
             get_logger().error("Unknown error during OpenAI inference: ", e)
-            raise e
+            raise e
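The try/except at the top of this file is the usual optional-dependency guard: langchain is not a hard requirement, so the import failure is swallowed and the handler only breaks if it is actually used. The same pattern in generic form (this sketch narrows the bare except: to ImportError, a small deviation from the code above):

try:
    from langchain.chat_models import ChatOpenAI  # optional extra
    LANGCHAIN_AVAILABLE = True
except ImportError:
    LANGCHAIN_AVAILABLE = False


def make_chat(**kwargs):
    if not LANGCHAIN_AVAILABLE:
        raise ImportError("langchain is not installed; install it to use this handler")
    return ChatOpenAI(**kwargs)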
pr_agent/algo/ai_handlers/litellm_ai_handler.py

@@ -61,7 +61,7 @@ class LiteLLMAIHandler(BaseAiHandler):
         if get_settings().get("HUGGINGFACE.API_BASE", None) and 'huggingface' in get_settings().config.model:
             litellm.api_base = get_settings().huggingface.api_base
             self.api_base = get_settings().huggingface.api_base
-        if get_settings().get("OLLAMA.API_BASE", None) :
+        if get_settings().get("OLLAMA.API_BASE", None):
             litellm.api_base = get_settings().ollama.api_base
             self.api_base = get_settings().ollama.api_base
         if get_settings().get("HUGGINGFACE.REPITITION_PENALTY", None):
@@ -129,7 +129,7 @@ class LiteLLMAIHandler(BaseAiHandler):
             "messages": messages,
             "temperature": temperature,
             "force_timeout": get_settings().config.ai_timeout,
-            "api_base" : self.api_base,
+            "api_base": self.api_base,
         }
         if self.aws_bedrock_client:
             kwargs["aws_bedrock_client"] = self.aws_bedrock_client
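For orientation, the kwargs dict assembled here is what ultimately goes into litellm's completion call, so api_base is what routes a request to the local Ollama or HuggingFace endpoint configured in __init__. A trimmed sketch of that flow (the real method builds more kwargs than shown, e.g. force_timeout and the Bedrock client):

import litellm

async def chat_completion_sketch(self, model, system, user, temperature=0.2):
    kwargs = {
        "model": model,
        "messages": [{"role": "system", "content": system},
                     {"role": "user", "content": user}],
        "temperature": temperature,
        "api_base": self.api_base,  # e.g. OLLAMA.API_BASE from the hunk above
    }
    response = await litellm.acompletion(**kwargs)
    return (response["choices"][0]["message"]["content"],
            response["choices"][0]["finish_reason"])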
pr_agent/algo/ai_handlers/openai_ai_handler.py

@@ -28,13 +28,14 @@ class OpenAIHandler(BaseAiHandler):
         except AttributeError as e:
             raise ValueError("OpenAI key is required") from e
 
     @property
     def deployment_id(self):
         """
         Returns the deployment ID for the OpenAI API.
         """
         return get_settings().get("OPENAI.DEPLOYMENT_ID", None)
 
+
     @retry(exceptions=(APIError, Timeout, TryAgain, AttributeError, RateLimitError),
            tries=OPENAI_RETRIES, delay=2, backoff=2, jitter=(1, 3))
     async def chat_completion(self, model: str, system: str, user: str, temperature: float = 0.2):
@@ -54,8 +55,8 @@ class OpenAIHandler(BaseAiHandler):
             finish_reason = chat_completion["choices"][0]["finish_reason"]
             usage = chat_completion.get("usage")
             get_logger().info("AI response", response=resp, messages=messages, finish_reason=finish_reason,
-                              model=model, usage=usage)
-            return resp, finish_reason
+                              model=model, usage=usage)
+            return resp, finish_reason
         except (APIError, Timeout, TryAgain) as e:
             get_logger().error("Error during OpenAI inference: ", e)
             raise
@@ -64,4 +65,4 @@ class OpenAIHandler(BaseAiHandler):
             raise
         except (Exception) as e:
             get_logger().error("Unknown error during OpenAI inference: ", e)
-            raise TryAgain from e
+            raise TryAgain from e
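The @retry decorator both handlers use comes from the retry package: on any of the listed exceptions the call is retried up to tries times, with the wait starting at delay seconds, growing by the backoff multiplier after each failure, plus random jitter drawn from the (1, 3) range. A standalone illustration with a made-up flaky function:

from retry import retry

attempts = {"n": 0}


@retry(exceptions=(ConnectionError,), tries=5, delay=2, backoff=2, jitter=(1, 3))
def flaky_call():
    attempts["n"] += 1
    if attempts["n"] < 3:  # fail twice, then succeed
        raise ConnectionError("transient failure")
    return "ok"


print(flaky_call())  # retries happen inside the decorator; prints "ok"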
pr_agent/algo/file_filter.py

@@ -3,6 +3,7 @@ import re
 
 from pr_agent.config_loader import get_settings
 
+
 def filter_ignored(files):
     """
     Filter out files that match the ignore patterns.
@@ -14,7 +15,7 @@ def filter_ignored(files):
         if isinstance(patterns, str):
             patterns = [patterns]
         glob_setting = get_settings().ignore.glob
-        if isinstance(glob_setting, str): # --ignore.glob=[.*utils.py], --ignore.glob=.*utils.py
+        if isinstance(glob_setting, str):  # --ignore.glob=[.*utils.py], --ignore.glob=.*utils.py
             glob_setting = glob_setting.strip('[]').split(",")
         patterns += [fnmatch.translate(glob) for glob in glob_setting]
 
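The branch changed here normalizes a bracketed CLI value such as --ignore.glob=[...] into a list before each glob is compiled to a regex via fnmatch.translate. A quick round trip with made-up values:

import fnmatch
import re

glob_setting = "[*.md,*.txt]"  # e.g. from --ignore.glob=[*.md,*.txt]
globs = glob_setting.strip('[]').split(",")  # -> ['*.md', '*.txt']
patterns = [fnmatch.translate(g) for g in globs]

compiled = re.compile('|'.join(patterns))
print(bool(compiled.match("README.md")))  # True  -> would be ignored
print(bool(compiled.match("main.py")))    # False -> kept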
pr_agent/algo/utils.py

@@ -409,7 +409,7 @@ def update_settings_from_args(args: List[str]) -> List[str]:
         arg = arg.strip('-').strip()
         vals = arg.split('=', 1)
         if len(vals) != 2:
-            if len(vals) > 2: # --extended is a valid argument
+            if len(vals) > 2:  # --extended is a valid argument
                 get_logger().error(f'Invalid argument format: {arg}')
             other_args.append(arg)
             continue
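Note that split('=', 1) yields at most two elements, so the len(vals) > 2 branch can never fire; in practice a bare flag like --extended takes the len(vals) == 1 path and is passed through untouched as an "other" argument. A compact illustration of the parsing rule:

def classify(arg: str):
    arg = arg.strip('-').strip()
    vals = arg.split('=', 1)
    if len(vals) != 2:
        return ("other", arg)  # e.g. --extended
    key, value = vals
    return ("setting", key, value)

print(classify("--config.model=ollama/llama3"))  # ('setting', 'config.model', 'ollama/llama3')
print(classify("--extended"))                    # ('other', 'extended')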