Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat: retry mechanism #240

Open
wants to merge 12 commits into
base: development
Choose a base branch
from
Open
4 changes: 3 additions & 1 deletion .cspell.json
Original file line number Diff line number Diff line change
Expand Up @@ -32,7 +32,9 @@
"Rpcs",
"sonarjs",
"pico",
"timespan"
"timespan",
"Retryable",
"ratelimit"
],
"dictionaries": ["typescript", "node", "software-terms"],
"import": [
Expand Down
Binary file modified bun.lockb
Binary file not shown.
8 changes: 4 additions & 4 deletions dist/index.js

Large diffs are not rendered by default.

2 changes: 1 addition & 1 deletion dist/index.js.map

Large diffs are not rendered by default.

6 changes: 6 additions & 0 deletions manifest.json
Original file line number Diff line number Diff line change
Expand Up @@ -74,6 +74,12 @@
"description": "OpenAI endpoint for requests",
"examples": ["https://api.openai.com/v1"],
"type": "string"
},
"maxRetries": {
"default": 10,
"description": "Maximum number of retries to make",
"examples": ["10"],
"type": "number"
}
}
},
Expand Down
2 changes: 2 additions & 0 deletions package.json
Original file line number Diff line number Diff line change
Expand Up @@ -41,6 +41,7 @@
"js-tiktoken": "1.0.15",
"jsdom": "24.0.0",
"markdown-it": "14.1.0",
"ms": "^2.1.3",
"minimatch": "^10.0.1",
"openai": "4.56.0",
"yaml": "^2.6.1"
Expand All @@ -59,6 +60,7 @@
"@types/jest": "29.5.12",
"@types/jsdom": "21.1.6",
"@types/markdown-it": "13.0.7",
"@types/ms": "^2.1.0",
"@types/node": "20.11.28",
"babel-jest": "29.7.0",
"cross-env": "^7.0.3",
Expand Down
5 changes: 5 additions & 0 deletions src/configuration/content-evaluator-config.ts
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,11 @@ const openAiType = Type.Object(
description: "OpenAI endpoint for requests",
examples: ["https://api.openai.com/v1"],
}),
maxRetries: Type.Number({
default: 10,
description: "Maximum number of retries to make",
examples: ["10"],
}),
},
{ default: {} }
);
Expand Down
36 changes: 36 additions & 0 deletions src/helpers/retry.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
/** Options controlling the behavior of {@link retry}. */
interface RetryOptions {
  /** Maximum number of attempts before the last error is rethrown. Must be >= 1. */
  maxRetries: number;
  /** Invoked (and awaited) after every failed attempt, e.g. for logging or posting a status comment. */
  onError?: (error: unknown) => void | Promise<void>;
  // Return false to stop retrying, return true to automatically delay the next retry, or a number to set the delay before the next retry
  isErrorRetryable?: (error: unknown) => boolean | number;
}

/** Resolves after the given number of milliseconds. */
function sleep(ms: number) {
  return new Promise((resolve) => setTimeout(resolve, ms));
}

/**
 * Runs `fn` until it resolves, making up to `options.maxRetries` attempts with
 * exponential backoff (1000 ms doubled after each failure, unless
 * `isErrorRetryable` returns a number that overrides the next delay).
 *
 * @param fn - The async operation to attempt.
 * @param options - Attempt count and error hooks; see {@link RetryOptions}.
 * @returns The resolved value of the first successful attempt.
 * @throws The error itself when `isErrorRetryable` returns `false`; the last
 *   error encountered once all attempts are exhausted; or an `Error` when
 *   `options.maxRetries` is less than 1 (so this never throws `null`).
 */
export async function retry<T>(fn: () => Promise<T>, options: RetryOptions): Promise<T> {
  let delay = 1000;
  // Seed with a real Error so a non-positive maxRetries cannot end in `throw null`.
  let lastError: unknown = new Error(`retry: maxRetries must be at least 1 (got ${options.maxRetries})`);
  for (let attempt = 1; attempt <= options.maxRetries; attempt++) {
    try {
      return await fn();
    } catch (err) {
      lastError = err;
      if (options.onError) {
        await options.onError(err);
      }
      if (options.isErrorRetryable) {
        const verdict = options.isErrorRetryable(err);
        if (verdict === false) {
          // Caller marked this error as permanent — fail fast without retrying.
          throw err;
        } else if (typeof verdict === "number") {
          // Caller-supplied delay (e.g. a rate-limit reset time in ms).
          delay = verdict;
        }
      }
      // Only wait when another attempt will actually happen; previously the code
      // slept (and doubled the delay) even after the final failed attempt.
      if (attempt < options.maxRetries) {
        await sleep(delay);
        delay *= 2;
      }
    }
  }
  throw lastError;
}
182 changes: 135 additions & 47 deletions src/parser/content-evaluator-module.ts
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,10 @@ import {
import { BaseModule } from "../types/module";
import { ContextPlugin } from "../types/plugin-input";
import { GithubCommentScore, Result } from "../types/results";
import { postComment } from "@ubiquity-os/plugin-sdk";
import { retry } from "../helpers/retry";
import ms, { StringValue } from "ms";
import { TypeBoxError } from "@sinclair/typebox";

/**
* Evaluates and rates comments.
Expand All @@ -26,6 +30,7 @@ export class ContentEvaluatorModule extends BaseModule {
...(this._configuration?.openAi.endpoint && { baseURL: this._configuration.openAi.endpoint }),
});
private readonly _fixedRelevances: { [k: string]: number } = {};
private _tokenLimit: number = 0;

_getEnumValue(key: CommentType) {
let res = 0;
Expand Down Expand Up @@ -56,7 +61,25 @@ export class ContentEvaluatorModule extends BaseModule {
return true;
}

// Probes the OpenAI API with a minimal 1-token completion solely to read the
// account's token rate limit from the "x-ratelimit-limit-tokens" response header.
// NOTE(review): this spends one billable request (and one output token) per call — confirm acceptable.
// Returns Infinity when the header is absent or not a finite number, so callers
// can safely take Math.min() against a configured limit.
async _getRateLimitTokens() {
const res = await this._openAi.chat.completions
.create({
model: this._configuration?.openAi.model ?? "gpt-4o-2024-08-06",
// Shortest possible prompt — content is irrelevant, only the headers matter.
messages: [{ role: "system", content: "a" }],
max_tokens: 1,
})
// .asResponse() exposes the raw fetch Response so headers are accessible.
.asResponse();
const tokenLimit = res.headers.get("x-ratelimit-limit-tokens");
return tokenLimit && Number.isFinite(Number(tokenLimit)) ? Number(tokenLimit) : Infinity;
}

async transform(data: Readonly<IssueActivity>, result: Result) {
if (!this._configuration?.openAi.tokenCountLimit) {
throw this.context.logger.fatal("Token count limit is missing, comments cannot be evaluated.");
}
this._tokenLimit = Math.min(this._configuration?.openAi.tokenCountLimit, await this._getRateLimitTokens());
this.context.logger.info(`Using token limit: ${this._tokenLimit}`);

const promises: Promise<GithubCommentScore[]>[] = [];
const allComments: { id: number; comment: string; author: string }[] = [];

Expand Down Expand Up @@ -99,6 +122,8 @@ export class ContentEvaluatorModule extends BaseModule {

if (Object.keys(relevancesByAi).length !== commentsToEvaluate.length + prCommentsToEvaluate.length) {
throw this.context.logger.error("Relevance / Comment length mismatch!", {
expectedRelevances: commentsToEvaluate.length + prCommentsToEvaluate.length,
receivedRelevances: Object.keys(relevancesByAi).length,
relevancesByAi,
commentsToEvaluate,
prCommentsToEvaluate,
Expand Down Expand Up @@ -182,14 +207,28 @@ export class ContentEvaluatorModule extends BaseModule {
allComments: AllComments
) {
const commentRelevances: Relevances = {};
const chunks = 2;

const dummyResponse = JSON.stringify(this._generateDummyResponse(comments), null, 2);
const maxOutputTokens = this._calculateMaxTokens(dummyResponse);

let chunks = 2;
while (
maxOutputTokens +
Math.max(
...this._splitArrayToChunks(allComments, chunks).map((chunk) =>
this._calculateMaxTokens(this._generatePromptForComments(specification, comments, chunk), Infinity)
)
) >
this._tokenLimit
) {
chunks++;
}
this.context.logger.info(`Splitting issue comments into ${chunks} chunks`);

for (const commentSplit of this._splitArrayToChunks(allComments, chunks)) {
const dummyResponse = JSON.stringify(this._generateDummyResponse(comments), null, 2);
const maxTokens = this._calculateMaxTokens(dummyResponse);
const promptForComments = this._generatePromptForComments(specification, comments, commentSplit);

for (const [key, value] of Object.entries(await this._submitPrompt(promptForComments, maxTokens))) {
for (const [key, value] of Object.entries(await this._submitPrompt(promptForComments, maxOutputTokens))) {
if (commentRelevances[key]) {
commentRelevances[key] = new Decimal(commentRelevances[key]).add(value).toNumber();
} else {
Expand All @@ -206,14 +245,27 @@ export class ContentEvaluatorModule extends BaseModule {

async _splitPromptForPullRequestCommentEvaluation(specification: string, comments: PrCommentToEvaluate[]) {
const commentRelevances: Relevances = {};
const chunks = 2;

let chunks = 2;
while (
Math.max(
...this._splitArrayToChunks(comments, chunks).map(
(chunk) =>
this._calculateMaxTokens(JSON.stringify(this._generateDummyResponse(chunk), null, 2)) +
this._calculateMaxTokens(this._generatePromptForPrComments(specification, chunk), Infinity)
)
) > this._tokenLimit
) {
chunks++;
}
this.context.logger.info(`Splitting PR comments into ${chunks} chunks`);

for (const commentSplit of this._splitArrayToChunks(comments, chunks)) {
const dummyResponse = JSON.stringify(this._generateDummyResponse(commentSplit), null, 2);
const maxTokens = this._calculateMaxTokens(dummyResponse);
const maxOutputTokens = this._calculateMaxTokens(dummyResponse);
const promptForComments = this._generatePromptForPrComments(specification, commentSplit);

for (const [key, value] of Object.entries(await this._submitPrompt(promptForComments, maxTokens))) {
for (const [key, value] of Object.entries(await this._submitPrompt(promptForComments, maxOutputTokens))) {
if (commentRelevances[key]) {
commentRelevances[key] = new Decimal(commentRelevances[key]).add(value).toNumber();
} else {
Expand All @@ -237,74 +289,100 @@ export class ContentEvaluatorModule extends BaseModule {
let commentRelevances: Relevances = {};
let prCommentRelevances: Relevances = {};

if (!this._configuration?.openAi.tokenCountLimit) {
throw this.context.logger.fatal("Token count limit is missing, comments cannot be evaluated.");
}

const tokenLimit = this._configuration?.openAi.tokenCountLimit;

if (userIssueComments.length) {
const dummyResponse = JSON.stringify(this._generateDummyResponse(userIssueComments), null, 2);
const maxTokens = this._calculateMaxTokens(dummyResponse);
const maxOutputTokens = this._calculateMaxTokens(dummyResponse);

const promptForIssueComments = this._generatePromptForComments(specification, userIssueComments, allComments);
if (this._calculateMaxTokens(promptForIssueComments, Infinity) > tokenLimit) {
if (this._calculateMaxTokens(promptForIssueComments, Infinity) + maxOutputTokens > this._tokenLimit) {
commentRelevances = await this._splitPromptForIssueCommentEvaluation(
specification,
userIssueComments,
allComments
);
} else {
commentRelevances = await this._submitPrompt(promptForIssueComments, maxTokens);
commentRelevances = await this._submitPrompt(promptForIssueComments, maxOutputTokens);
}
}

if (userPrComments.length) {
const dummyResponse = JSON.stringify(this._generateDummyResponse(userPrComments), null, 2);
const maxTokens = this._calculateMaxTokens(dummyResponse);
const maxOutputTokens = this._calculateMaxTokens(dummyResponse);

const promptForPrComments = this._generatePromptForPrComments(specification, userPrComments);
if (this._calculateMaxTokens(promptForPrComments, Infinity) > tokenLimit) {
if (this._calculateMaxTokens(promptForPrComments, Infinity) + maxOutputTokens > this._tokenLimit) {
prCommentRelevances = await this._splitPromptForPullRequestCommentEvaluation(specification, userPrComments);
} else {
prCommentRelevances = await this._submitPrompt(promptForPrComments, maxTokens);
prCommentRelevances = await this._submitPrompt(promptForPrComments, maxOutputTokens);
}
}

return { ...commentRelevances, ...prCommentRelevances };
}

async _submitPrompt(prompt: string, maxTokens: number): Promise<Relevances> {
const response: OpenAI.Chat.ChatCompletion = await this._openAi.chat.completions.create({
model: this._configuration?.openAi.model ?? "gpt-4o-2024-08-06",
response_format: { type: "json_object" },
messages: [
{
role: "system",
content: prompt,
},
],
max_tokens: maxTokens,
top_p: 1,
temperature: 1,
frequency_penalty: 0,
presence_penalty: 0,
});

const rawResponse = String(response.choices[0].message.content);
this.context.logger.info(`OpenAI raw response (using max_tokens: ${maxTokens}): ${rawResponse}`);
try {
const relevances = await retry(
async () => {
const res = await this._openAi.chat.completions.create({
model: this._configuration?.openAi.model ?? "gpt-4o-2024-08-06",
response_format: {
type: "json_object",
},
messages: [
{
role: "system",
content: prompt,
},
],
max_tokens: maxTokens,
top_p: 1,
temperature: 1,
frequency_penalty: 0,
presence_penalty: 0,
});
const rawResponse = String(res.choices[0].message.content);
this.context.logger.info(`OpenAI raw response (using max_tokens: ${maxTokens}): ${rawResponse}`);

const jsonResponse = JSON.parse(rawResponse);
const relevances = Value.Decode(openAiRelevanceResponseSchema, JSON.parse(rawResponse));
this.context.logger.info(`Relevances by OpenAI: ${JSON.stringify(relevances)}`);

try {
const relevances = Value.Decode(openAiRelevanceResponseSchema, jsonResponse);
this.context.logger.info(`Relevances by OpenAI: ${JSON.stringify(relevances)}`);
return relevances;
},
{
maxRetries: this._configuration?.openAi.maxRetries ?? 3,
onError: async (error) => {
if (this.context.config.incentives.githubComment?.post) {
await postComment(this.context, this.context.logger.ok("Results are being retried", { err: error }), {
updateComment: true,
});
}
},
isErrorRetryable: (error) => {
if (error instanceof OpenAI.APIError && error.status) {
if ([500, 503].includes(error.status)) {
return true;
}
if (error.status === 429 && error.headers) {
const retryAfterTokens = error.headers["x-ratelimit-reset-tokens"];
const retryAfterRequests = error.headers["x-ratelimit-reset-requests"];
if (!retryAfterTokens || !retryAfterRequests) {
return true;
}
const retryAfter = Math.max(ms(retryAfterTokens as StringValue), ms(retryAfterRequests as StringValue));
return Number.isFinite(retryAfter) ? retryAfter : true;
}
}
// Retry if there is a SyntaxError caused by malformed JSON or TypeBoxError caused by incorrect JSON from OpenAI
return error instanceof SyntaxError || error instanceof TypeBoxError;
},
}
);
return relevances;
} catch (e) {
throw new Error(
this.context.logger.error(`Invalid response type received from openai while evaluating: \n\nError: ${e}`, {
error: e as Error,
jsonResponse,
}).logMessage.raw
);
}
Expand Down Expand Up @@ -353,10 +431,20 @@ export class ContentEvaluatorModule extends BaseModule {
if (!issue?.length) {
throw new Error("Issue specification comment is missing or empty");
}
return `I need to evaluate the value of a GitHub contributor's comments in a pull request. Some of these comments are code review comments, and some are general suggestions or a part of the discussion. I'm interested in how much each comment helps to solve the GitHub issue and improve code quality. Please provide a float between 0 and 1 to represent the value of each comment. A score of 1 indicates that the comment is very valuable and significantly improves the submitted solution and code quality, whereas a score of 0 indicates a negative or zero impact. A stringified JSON is given below that contains the specification of the GitHub issue, and comments by different contributors. The property "diffHunk" presents the chunk of code being addressed for a possible change in a code review comment. \n\n\`\`\`\n${JSON.stringify(
{ specification: issue, comments: userComments }
)}\n\`\`\`\n\n\nTo what degree are each of the comments valuable? Please reply with ONLY a JSON where each key is the comment ID given in JSON above, and the value is a float number between 0 and 1 corresponding to the comment. The float number should represent the value of the comment for improving the issue solution and code quality. The total number of properties in your JSON response should equal exactly ${
userComments.length
}.`;
return `I need to evaluate the value of a GitHub contributor's comments in a pull request.
Some of these comments are code review comments, and some are general suggestions or a part of the discussion.
I'm interested in how much each comment helps to solve the GitHub issue and improve code quality.
Please provide a float between 0 and 1 to represent the value of each comment.
A score of 1 indicates that the comment is very valuable and significantly improves the submitted solution and code quality, whereas a score of 0 indicates a negative or zero impact.
A stringified JSON is given below that contains the specification of the GitHub issue, and comments by different contributors.
The property "diffHunk" presents the chunk of code being addressed for a possible change in a code review comment.

\`\`\`
${JSON.stringify({ specification: issue, comments: userComments })}
\`\`\`\

To what degree are each of the comments valuable?
Please reply with ONLY a JSON where each key is the comment ID given in JSON above, and the value is a float number between 0 and 1 corresponding to the comment.
The float number should represent the value of the comment for improving the issue solution and code quality. The total number of properties in your JSON response should equal exactly ${userComments.length}.`;
}
}
5 changes: 4 additions & 1 deletion src/types/content-evaluator-module-type.ts
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,9 @@ export type PrCommentToEvaluate = { id: number; comment: string; diffHunk?: stri

export type AllComments = { id: number; comment: string; author: string }[];

export const openAiRelevanceResponseSchema = Type.Record(Type.String(), Type.Number({ minimum: 0, maximum: 1 }));
export const openAiRelevanceResponseSchema = Type.Record(
Type.RegExp("^[0-9]+$"),
Type.Number({ minimum: 0, maximum: 1 })
);

export type Relevances = Static<typeof openAiRelevanceResponseSchema>;
3 changes: 2 additions & 1 deletion tests/__mocks__/results/valid-configuration.json
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,8 @@
],
"openAi": {
"endpoint": "https://api.openai.com/v1",
"model": "gpt-4o"
"model": "gpt-4o",
"tokenCountLimit": 124000
}
},
"dataPurge": {},
Expand Down
Loading