Increase timeouts of OAI out of quota requests

2025-06-05 21:59:27 +02:00 · 2023-11-08 12:07:14 +02:00
parent b3ced2c4c5
commit 740f6548a2
2 changed files with 3 additions and 2 deletions
--- a/public/scripts/openai.js
+++ b/public/scripts/openai.js
@@ -110,7 +110,7 @@ const max_4k = 4095;
 const max_8k = 8191;
 const max_16k = 16383;
 const max_32k = 32767;
-const max_128k = 128 * 1024 - 1;
+const max_128k = 128 * 1000;
 const scale_max = 8191;
 const claude_max = 9000; // We have a proper tokenizer, so theoretically could be larger (up to 9k)
 const palm2_max = 7500; // The real context window is 8192, spare some for padding due to using turbo tokenizer
--- a/server.js
+++ b/server.js
@@ -3222,7 +3222,8 @@ app.post("/generate_openai", jsonParser, function (request, response_generate_op
            } else if (fetchResponse.status === 429 && retries > 0) {
                console.log(`Out of quota, retrying in ${Math.round(timeout / 1000)}s`);
                setTimeout(() => {
-                    makeRequest(config, response_generate_openai, request, retries - 1);
+                    timeout *= 2;
                    makeRequest(config, response_generate_openai, request, retries - 1, timeout);
                }, timeout);
            } else {
                await handleErrorResponse(fetchResponse);