Adjust KoboldAI (KAI) retry logic

This commit is contained in:
Cohee
2023-06-12 23:01:01 +03:00
parent 88fadce5c6
commit 5971efd330

View File

@@ -385,8 +385,8 @@ app.post("/generate", jsonParser, async function (request, response_generate = r
headers: { "Content-Type": "application/json" },
};
const MAX_RETRIES = 20;
const delayAmount = 5000;
const MAX_RETRIES = 50;
const delayAmount = 2500;
for (let i = 0; i < MAX_RETRIES; i++) {
try {
const data = await postAsync(api_server + "/v1/generate", args);
@@ -400,18 +400,23 @@ app.post("/generate", jsonParser, async function (request, response_generate = r
}
// response
switch (error.status) {
switch (error?.status) {
case 403:
case 503:
console.debug(`KoboldAI is busy. Retry attempt ${i+1} of ${MAX_RETRIES}...`);
await delay(delayAmount);
break;
default:
console.log('Status Code from Kobold:', error.status);
if ('status' in error) {
console.log('Status Code from Kobold:', error.status);
}
return response_generate.send({ error: true });
}
}
}
console.log('Max retries exceeded. Giving up.');
return response_generate.send({ error: true });
});
//************** Text generation web UI