SillyTavern/public/scripts/horde.js

385 lines
12 KiB
JavaScript
Raw Normal View History

2023-07-20 19:32:15 +02:00
import {
saveSettingsDebounced,
callPopup,
setGenerationProgress,
getRequestHeaders,
2023-09-17 16:00:23 +02:00
max_context,
2023-12-02 21:06:57 +01:00
amount_gen,
2023-12-02 19:04:51 +01:00
} from '../script.js';
import { SECRET_KEYS, writeSecret } from './secrets.js';
import { delay } from './utils.js';
import { isMobile } from './RossAscends-mods.js';
2023-12-02 19:04:51 +01:00
import { autoSelectInstructPreset } from './instruct-mode.js';
2023-07-20 19:32:15 +02:00
export {
horde_settings,
generateHorde,
checkHordeStatus,
loadHordeSettings,
adjustHordeGenerationParams,
getHordeModels,
2023-10-24 15:23:32 +02:00
MIN_LENGTH,
2023-12-02 20:11:06 +01:00
};
2023-07-20 19:32:15 +02:00
// Models most recently fetched by getHordeModels(), kept sorted by descending performance.
let models = [];
// Horde settings shared with the rest of the app; loadHordeSettings() merges saved values into this object in place.
let horde_settings = {
// Names of the models currently selected in the #horde_model dropdown.
models: [],
// When true, the response length is lowered to the smallest max_length among matching workers.
auto_adjust_response_length: true,
// When true, the context length is lowered to the smallest max_context_length among matching workers.
auto_adjust_context_length: false,
// When true, untrusted workers are ignored when adjusting lengths and the flag is sent as `trusted_workers` with generation requests.
trusted_workers_only: false,
};
2023-11-19 20:30:08 +01:00
// Maximum number of task-status polls generateHorde() performs before reporting a timeout.
const MAX_RETRIES = 480;
// Value passed to delay() between polls; presumably milliseconds (about 20 minutes in total with MAX_RETRIES) — confirm against utils.js.
const CHECK_INTERVAL = 2500;
2023-10-24 15:23:32 +02:00
// Exported for other modules; not referenced anywhere else in this file.
// NOTE(review): presumably the smallest response length callers should request — confirm at the import sites.
const MIN_LENGTH = 16;
2023-07-20 19:32:15 +02:00
2023-12-22 21:10:09 +01:00
/**
 * Gets the available workers from Horde.
 * @param {boolean} force Do a force refresh of the workers
 * @returns {Promise<Array>} Array of workers
 * @throws {Error} If the server answers with a non-OK status
 */
async function getWorkers(force) {
    const response = await fetch('/api/horde/text-workers', {
        method: 'POST',
        headers: getRequestHeaders(),
        body: JSON.stringify({ force }),
    });

    // Fail with a clear message instead of handing an error payload to callers
    // that expect an array (same convention as getTaskStatus / cancelTask).
    if (!response.ok) {
        throw new Error(`Failed to get workers: ${response.statusText}`);
    }

    return await response.json();
}
/**
 * Gets the available models from Horde.
 * @param {boolean} force Do a force refresh of the models
 * @returns {Promise<Array>} Array of models
 * @throws {Error} If the server answers with a non-OK status
 */
async function getModels(force) {
    const response = await fetch('/api/horde/text-models', {
        method: 'POST',
        headers: getRequestHeaders(),
        body: JSON.stringify({ force }),
    });

    // Fail with a clear message instead of handing an error payload to callers
    // that expect an array (same convention as getTaskStatus / cancelTask).
    if (!response.ok) {
        throw new Error(`Failed to get models: ${response.statusText}`);
    }

    return await response.json();
}
/**
 * Gets the status of a Horde task.
 * @param {string} taskId Task ID
 * @returns {Promise<Object>} Task status
 * @throws {Error} If the server answers with a non-OK status
 */
async function getTaskStatus(taskId) {
    const response = await fetch('/api/horde/task-status', {
        method: 'POST',
        headers: getRequestHeaders(),
        body: JSON.stringify({ taskId }),
    });

    if (!response.ok) {
        throw new Error(`Failed to get task status: ${response.statusText}`);
    }

    return await response.json();
}
2023-12-22 21:10:09 +01:00
/**
 * Asks the server to cancel a running Horde task.
 * @param {string} taskId Task ID
 * @returns {Promise<void>} Resolves once the server has acknowledged the request
 * @throws {Error} If the server answers with a non-OK status
 */
async function cancelTask(taskId) {
    const request = {
        method: 'POST',
        headers: getRequestHeaders(),
        body: JSON.stringify({ taskId }),
    };
    const reply = await fetch('/api/horde/cancel-task', request);

    if (reply.ok) {
        return;
    }

    throw new Error(`Failed to cancel task: ${reply.statusText}`);
}
/**
 * Probes the server's Horde status endpoint.
 * Any failure (non-OK response, network error, unparsable body) is logged
 * where applicable and reported as "offline" rather than thrown.
 * @returns {Promise<boolean>} The `ok` flag reported by the server, or false on any failure
 */
async function checkHordeStatus() {
    let online = false;

    try {
        const reply = await fetch('/api/horde/status', {
            method: 'POST',
            headers: getRequestHeaders(),
        });

        if (reply.ok) {
            const payload = await reply.json();
            online = payload.ok;
        }
    } catch (err) {
        console.error(err);
    }

    return online;
}
2023-07-20 19:32:15 +02:00
/**
 * Resolves the user's selected model names against the currently known models.
 * Shows a warning toast and throws when none of the selected models is available.
 * @returns {Array} Known model objects whose name is among the selected models
 * @throws {Error} If no selected model is available
 */
function validateHordeModel() {
    const isSelected = (candidate) => horde_settings.models.includes(candidate.name);
    const matches = models.filter(isSelected);

    if (matches.length > 0) {
        return matches;
    }

    toastr.warning('No Horde model selected or the selected models are no longer available. Please choose another model');
    throw new Error('No Horde model available');
}
/**
 * Lowers the requested context/response lengths to what every worker serving the
 * selected models can handle, and shows the result in #adjustedHordeParams.
 * Each length is only adjusted when its `auto_adjust_*` setting is enabled.
 * @param {number} max_context_length Requested context length
 * @param {number} max_length Requested response length
 * @returns {Promise<{maxContextLength: number, maxLength: number}>} Adjusted lengths
 * @throws {Error} If no selected model is available (raised by validateHordeModel)
 */
async function adjustHordeGenerationParams(max_context_length, max_length) {
    console.log(max_context_length, max_length);

    // Validate before fetching: validateHordeModel() throws when nothing usable is
    // selected, so there is no point in requesting the worker list in that case.
    const selectedModels = validateHordeModel();
    const workers = await getWorkers(false);

    const availableWorkers = workers.filter((worker) => {
        // Skip workers that are not trusted if the option is enabled
        if (horde_settings.trusted_workers_only && !worker.trusted) {
            return false;
        }

        // Loose equality is kept on purpose so that null/undefined clusters still match each other.
        return selectedModels.some(model => model.cluster == worker.cluster && worker.models.includes(model.name));
    });

    let maxContextLength = max_context_length;
    let maxLength = max_length;

    // Get the minimum required parameters: the lowest common value across all matching workers.
    // Workers that do not report a numeric limit are ignored so the result never becomes NaN.
    for (const worker of availableWorkers) {
        if (horde_settings.auto_adjust_context_length && Number.isFinite(worker.max_context_length)) {
            maxContextLength = Math.min(worker.max_context_length, maxContextLength);
        }

        if (horde_settings.auto_adjust_response_length && Number.isFinite(worker.max_length)) {
            maxLength = Math.min(worker.max_length, maxLength);
        }
    }

    console.log(maxContextLength, maxLength);
    $('#adjustedHordeParams').text(`Context: ${maxContextLength}, Response: ${maxLength}`);

    return { maxContextLength, maxLength };
}
/**
 * Refreshes the "Context / Response" preview in #adjustedHordeParams.
 * With no model selected the placeholder text is shown; otherwise the preview is
 * computed asynchronously by adjustHordeGenerationParams().
 */
function setContextSizePreview() {
    const showPlaceholder = () => $('#adjustedHordeParams').text('Context: --, Response: --');

    if (!horde_settings.models.length) {
        showPlaceholder();
        return;
    }

    // The adjustment runs in the background; handle its failure here so it does not
    // surface as an unhandled promise rejection, and do not leave stale numbers on screen.
    adjustHordeGenerationParams(max_context, amount_gen).catch((error) => {
        console.error('Failed to adjust Horde generation params', error);
        showPlaceholder();
    });
}
2023-10-11 16:56:52 +02:00
/**
 * Submits a text generation request to Horde and polls until it completes.
 * Note: `params` is modified in place (its `prompt` key is removed and the
 * Horde-specific flags below are set) before being sent.
 * @param {string} prompt Prompt text
 * @param {Object} params Generation parameters
 * @param {AbortSignal} [signal] Abort signal; when aborted, the Horde task is cancelled
 * @param {boolean} reportProgress Whether to forward queue progress to setGenerationProgress
 * @returns {Promise<{text: string, workerName: string}>} Generated text and a worker attribution line
 * @throws {Error} If validation fails, the request fails or is aborted, the task faults, is impossible, or times out
 */
async function generateHorde(prompt, params, signal, reportProgress) {
    validateHordeModel();
    delete params.prompt;

    // Request a single generation and switch off the KoboldAI text formatting options
    // (per the AI Horde API docs: frmtadsnsp = add leading space to the input,
    // frmtrmblln = collapse blank lines, frmtrmspch = strip special characters,
    // frmttriminc = trim an incomplete trailing sentence).
    params['n'] = 1;
    params['frmtadsnsp'] = false;
    params['frmtrmblln'] = false;
    params['frmtrmspch'] = false;
    params['frmttriminc'] = false;

    const payload = {
        'prompt': prompt,
        'params': params,
        'trusted_workers': horde_settings.trusted_workers_only,
        'models': horde_settings.models,
    };

    const response = await fetch('/api/horde/generate-text', {
        method: 'POST',
        headers: getRequestHeaders(),
        body: JSON.stringify(payload),
    });

    if (!response.ok) {
        toastr.error(response.statusText, 'Horde generation failed');
        throw new Error(`Horde generation failed: ${response.statusText}`);
    }

    const responseJson = await response.json();

    if (responseJson.error) {
        const reason = responseJson.error?.message || 'Unknown error';
        toastr.error(reason, 'Horde generation failed');
        throw new Error(`Horde generation failed: ${reason}`);
    }

    const taskId = responseJson.id;
    // Queue position seen on the first poll; the baseline for the progress percentage.
    let queuePositionFirst = null;
    console.log(`Horde task id = ${taskId}`);

    for (let retryNumber = 0; retryNumber < MAX_RETRIES; retryNumber++) {
        if (signal?.aborted) {
            // Fire-and-forget so the abort is reported immediately, but never let a
            // failed cancellation turn into an unhandled promise rejection.
            cancelTask(taskId).catch((error) => console.error('Failed to cancel Horde task', error));
            throw new Error('Request aborted');
        }

        const statusCheckJson = await getTaskStatus(taskId);
        console.log(statusCheckJson);

        if (statusCheckJson.faulted === true) {
            toastr.error('Horde request faulted. Please try again.');
            throw new Error('Horde generation failed: Faulted');
        }

        if (statusCheckJson.is_possible === false) {
            toastr.error('There are no Horde workers that are able to generate text with your request. Please change the parameters or try again later.');
            throw new Error('Horde generation failed: Unsatisfiable request');
        }

        if (statusCheckJson.done && Array.isArray(statusCheckJson.generations) && statusCheckJson.generations.length) {
            reportProgress && setGenerationProgress(100);
            const [generation] = statusCheckJson.generations;
            const generatedText = generation.text;
            const workerName = generation.worker_name;
            const workerModel = generation.model;
            console.log(generatedText);
            console.log(`Generated by Horde Worker: ${workerName} [${workerModel}]`);
            return { text: generatedText, workerName: `Generated by Horde worker: ${workerName} [${workerModel}]` };
        } else if (!queuePositionFirst) {
            // The falsy check (rather than a null check) also keeps a baseline of 0
            // out of the division below.
            queuePositionFirst = statusCheckJson.queue_position;
            reportProgress && setGenerationProgress(0);
        } else if (statusCheckJson.queue_position >= 0) {
            const queuePosition = statusCheckJson.queue_position;
            const rawProgress = Math.round(100 - (queuePosition / queuePositionFirst * 100));
            // The queue position can grow past the baseline; never report negative progress.
            reportProgress && setGenerationProgress(Math.max(0, rawProgress));
        }

        await delay(CHECK_INTERVAL);
    }

    callPopup('Horde request timed out. Try again', 'text');
    throw new Error('Horde timeout');
}
2023-12-22 21:10:09 +01:00
/**
 * Displays the available models in the Horde model selection dropdown.
 * Models are listed by descending performance; a saved selection that matches
 * none of the fetched models is cleared. Finally the context size preview is refreshed.
 * @param {boolean} force Force refresh of the models
 * @returns {Promise<void>}
 */
async function getHordeModels(force) {
    // Fetch first and only then rebuild the dropdown in one synchronous pass: a failed
    // request no longer leaves an empty list behind, and overlapping refreshes cannot
    // append their options twice.
    const fetchedModels = await getModels(force);
    models = fetchedModels.sort((a, b) => b.performance - a.performance);

    const dropdown = $('#horde_model');
    dropdown.empty();

    for (const model of models) {
        const option = document.createElement('option');
        option.value = model.name;
        option.innerText = `${model.name} (ETA: ${model.eta}s, Speed: ${model.performance}, Queue: ${model.queued}, Workers: ${model.count})`;
        option.selected = horde_settings.models.includes(model.name);
        dropdown.append(option);
    }

    // If nothing that was previously selected is available any more, drop the selection
    const hasAvailableSelection = models.some(m => horde_settings.models.includes(m.name));
    if (horde_settings.models.length && !hasAvailableSelection) {
        horde_settings.models = [];
    }

    setContextSizePreview();
}
/**
 * Merges saved Horde settings into `horde_settings` and syncs the settings checkboxes.
 * @param {Object} [settings] Loaded settings; only its `horde_settings` property is read
 */
function loadHordeSettings(settings) {
    // Tolerate a missing settings object: the defaults are simply kept.
    if (settings?.horde_settings) {
        Object.assign(horde_settings, settings.horde_settings);
    }

    $('#horde_auto_adjust_response_length').prop('checked', horde_settings.auto_adjust_response_length);
    $('#horde_auto_adjust_context_length').prop('checked', horde_settings.auto_adjust_context_length);
    $('#horde_trusted_workers_only').prop('checked', horde_settings.trusted_workers_only);
}
/**
 * Fetches the Horde user info and shows the kudos balance in a toast.
 * Shows a warning toast when the info cannot be loaded, and an informational
 * toast when the server reports anonymous mode.
 * @returns {Promise<void>}
 */
async function showKudos() {
    const loadFailedMessage = 'Could not load user info from Horde. Please try again later.';
    let data;

    // This runs as a click handler, so network/parse failures are reported to the
    // user here instead of escaping as an unhandled promise rejection.
    try {
        const response = await fetch('/api/horde/user-info', {
            method: 'POST',
            headers: getRequestHeaders(),
        });

        if (!response.ok) {
            toastr.warning(loadFailedMessage);
            return;
        }

        data = await response.json();
    } catch (error) {
        console.error('Horde user info request failed', error);
        toastr.warning(loadFailedMessage);
        return;
    }

    if (data.anonymous) {
        toastr.info('You are in anonymous mode. Set your personal Horde API key to see kudos.');
        return;
    }

    console.log('Horde user data', data);
    toastr.info(`Kudos: ${data.kudos}`, data.username);
}
// Wires up the Horde settings controls once the DOM is ready.
jQuery(function () {
    $('#horde_model').on('mousedown change', function () {
        // .val() can yield null when nothing is selected; keep `models` usable as a list.
        horde_settings.models = $('#horde_model').val() ?? [];
        console.log('Updated Horde models', horde_settings.models);

        // Try select instruct preset
        autoSelectInstructPreset(horde_settings.models.join(' '));

        // Same preview logic as the checkbox handlers below.
        setContextSizePreview();
    });

    $('#horde_auto_adjust_response_length').on('input', function () {
        horde_settings.auto_adjust_response_length = !!$(this).prop('checked');
        setContextSizePreview();
        saveSettingsDebounced();
    });

    $('#horde_auto_adjust_context_length').on('input', function () {
        horde_settings.auto_adjust_context_length = !!$(this).prop('checked');
        setContextSizePreview();
        saveSettingsDebounced();
    });

    $('#horde_trusted_workers_only').on('input', function () {
        horde_settings.trusted_workers_only = !!$(this).prop('checked');
        setContextSizePreview();
        saveSettingsDebounced();
    });

    $('#horde_api_key').on('input', async function () {
        const key = String($(this).val()).trim();
        await writeSecret(SECRET_KEYS.HORDE, key);
    });

    $('#horde_refresh').on('click', () => getHordeModels(true));
    $('#horde_kudos').on('click', showKudos);

    // Not needed on mobile
    if (!isMobile()) {
        $('#horde_model').select2({
            width: '100%',
            placeholder: 'Select Horde models',
            allowClear: true,
            closeOnSelect: false,
            templateSelection: function (data) {
                // Customize the pillbox text by shortening the full text
                return data.id;
            },
            templateResult: function (data) {
                // Return the full text for the dropdown
                return data.text;
            },
        });
    }
});