commit 8962c9cf8a
parent bc95cf5b8e
Author: mrT23
Date:   2023-09-06 09:43:23 +03:00

2 changed files with 24 additions and 20 deletions

Changed file 1 of 2 (configuration settings, TOML):

@@ -100,7 +100,7 @@ polling_interval_seconds = 30
 [pr_similar_issue]
 skip_comments = false
 force_update_dataset = false
-max_issues_to_scan = 1000
+max_issues_to_scan = 500

 [pinecone]
 # fill and place in .secrets.toml
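
Note on this hunk: the default cap on how many issues the similar-issue tool scans is lowered from 1000 to 500. As a rough, hedged illustration of how such a cap is typically consumed (the function and parameter names below are assumptions for illustration, not taken from this commit), a scan loop might stop once the configured limit is reached:

# Minimal sketch (not from this commit): honoring the max_issues_to_scan
# setting shown above. All names here are illustrative only.
from typing import Iterable, List

def scan_issues(issues: Iterable[dict], max_issues_to_scan: int = 500) -> List[dict]:
    """Collect issues for indexing, stopping at the configured cap."""
    scanned: List[dict] = []
    for counter, issue in enumerate(issues):
        if counter >= max_issues_to_scan:
            break  # respect the cap, lowered from 1000 to 500 in this commit
        scanned.append(issue)
    return scanned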

Changed file 2 of 2 (PRSimilarIssue tool, Python):

@@ -183,7 +183,7 @@ class PRSimilarIssue:
             if num_words_comment < 10 or not isinstance(comment_body, str):
                 continue

-            if len(issue_str) < 8000 or \
+            if len(comment_body) < 8000 or \
                     self.token_handler.count_tokens(comment_body) < MAX_TOKENS[MODEL]:
                 comment_record = Record(
                     id=issue_key + ".comment_" + str(j + 1),
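
Note on this hunk: the length guard previously measured issue_str (the parent issue body), but the record being built here is a comment, so the cheap character-length check now looks at comment_body before falling back to a token count. A hedged sketch of that guard as a standalone helper (the helper name, MAX_CHARS constant, and parameters are assumptions for illustration):

# Illustrative sketch only: the "short enough to embed" check used above.
MAX_CHARS = 8000

def should_embed(text: str, count_tokens, max_tokens: int) -> bool:
    """Accept text that is short by character count, or otherwise within the
    model's token budget; the len() check avoids tokenizing most inputs."""
    return len(text) < MAX_CHARS or count_tokens(text) < max_tokens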
@@ -205,9 +205,13 @@ class PRSimilarIssue:
             embeds = [record['embedding'] for record in res['data']]
         except:
             embeds = []
+            logging.error('Failed to embed entire list, embedding one by one...')
             for i, text in enumerate(list_to_encode):
-                res = openai.Embedding.create(input=[text], engine=MODEL)
-                embeds.append(res['data'][0]['embedding'])
+                try:
+                    res = openai.Embedding.create(input=[text], engine=MODEL)
+                    embeds.append(res['data'][0]['embedding'])
+                except:
+                    embeds.append([0] * 1536)
         df["values"] = embeds
         meta = DatasetMetadata.empty()
         meta.dense_model.dimension = len(embeds[0])
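
Note on this hunk: if the batched openai.Embedding.create call fails, the code now logs the failure and embeds the texts one by one, substituting an all-zero vector of length 1536 (the text-embedding-ada-002 output dimension) for any item that still fails, so the list length and the dataset dimension stay consistent. A minimal standalone sketch of that pattern, using the same pre-1.0 openai API as the diff (the embed_texts wrapper, MODEL, and EMBED_DIM names are assumptions for illustration):

# Minimal sketch of the batch-then-per-item embedding fallback shown above.
# Assumes the pre-1.0 `openai` Python package; MODEL and EMBED_DIM are illustrative.
import logging
import openai

MODEL = "text-embedding-ada-002"
EMBED_DIM = 1536  # output dimension of text-embedding-ada-002

def embed_texts(list_to_encode):
    try:
        # Fast path: embed the whole list in a single API call.
        res = openai.Embedding.create(input=list_to_encode, engine=MODEL)
        return [record['embedding'] for record in res['data']]
    except Exception:
        logging.error('Failed to embed entire list, embedding one by one...')
        embeds = []
        for text in list_to_encode:
            try:
                res = openai.Embedding.create(input=[text], engine=MODEL)
                embeds.append(res['data'][0]['embedding'])
            except Exception:
                # Placeholder vector keeps list length and dimension consistent.
                embeds.append([0] * EMBED_DIM)
        return embeds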