mirror of
https://github.com/SillyTavern/SillyTavern.git
synced 2025-01-21 22:16:24 +01:00
445 lines
14 KiB
JavaScript
445 lines
14 KiB
JavaScript
import {
|
|
amount_gen,
|
|
callPopup,
|
|
getRequestHeaders,
|
|
max_context,
|
|
saveSettingsDebounced,
|
|
setGenerationProgress,
|
|
} from '../script.js';
|
|
import { SECRET_KEYS, writeSecret } from './secrets.js';
|
|
import { delay } from './utils.js';
|
|
import { isMobile } from './RossAscends-mods.js';
|
|
import { autoSelectInstructPreset } from './instruct-mode.js';
|
|
|
|
export {
|
|
horde_settings,
|
|
generateHorde,
|
|
checkHordeStatus,
|
|
loadHordeSettings,
|
|
adjustHordeGenerationParams,
|
|
getHordeModels,
|
|
MIN_LENGTH,
|
|
};
|
|
|
|
let models = [];
|
|
|
|
let horde_settings = {
|
|
models: [],
|
|
auto_adjust_response_length: true,
|
|
auto_adjust_context_length: false,
|
|
trusted_workers_only: false,
|
|
};
|
|
|
|
const MAX_RETRIES = 480;
|
|
const CHECK_INTERVAL = 2500;
|
|
const MIN_LENGTH = 16;
|
|
|
|
/**
|
|
* Gets the available workers from Horde.
|
|
* @param {boolean} force Do a force refresh of the workers
|
|
* @returns {Promise<Array>} Array of workers
|
|
*/
|
|
async function getWorkers(force) {
|
|
const response = await fetch('/api/horde/text-workers', {
|
|
method: 'POST',
|
|
headers: getRequestHeaders(),
|
|
body: JSON.stringify({ force }),
|
|
});
|
|
return await response.json();
|
|
}
|
|
|
|
/**
|
|
* Gets the available models from Horde.
|
|
* @param {boolean} force Do a force refresh of the models
|
|
* @returns {Promise<Array>} Array of models
|
|
*/
|
|
async function getModels(force) {
|
|
const response = await fetch('/api/horde/text-models', {
|
|
method: 'POST',
|
|
headers: getRequestHeaders(),
|
|
body: JSON.stringify({ force }),
|
|
});
|
|
const data = await response.json();
|
|
console.log('getModels', data);
|
|
return data;
|
|
}
|
|
|
|
|
|
/**
|
|
* Gets the status of a Horde task.
|
|
* @param {string} taskId Task ID
|
|
* @returns {Promise<Object>} Task status
|
|
*/
|
|
async function getTaskStatus(taskId) {
|
|
const response = await fetch('/api/horde/task-status', {
|
|
method: 'POST',
|
|
headers: getRequestHeaders(),
|
|
body: JSON.stringify({ taskId }),
|
|
});
|
|
|
|
if (!response.ok) {
|
|
throw new Error(`Failed to get task status: ${response.statusText}`);
|
|
}
|
|
|
|
return await response.json();
|
|
}
|
|
|
|
/**
|
|
* Cancels a Horde task.
|
|
* @param {string} taskId Task ID
|
|
*/
|
|
async function cancelTask(taskId) {
|
|
const response = await fetch('/api/horde/cancel-task', {
|
|
method: 'POST',
|
|
headers: getRequestHeaders(),
|
|
body: JSON.stringify({ taskId }),
|
|
});
|
|
|
|
if (!response.ok) {
|
|
throw new Error(`Failed to cancel task: ${response.statusText}`);
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Checks if Horde is online.
|
|
* @returns {Promise<boolean>} True if Horde is online, false otherwise
|
|
*/
|
|
async function checkHordeStatus() {
|
|
try {
|
|
const response = await fetch('/api/horde/status', {
|
|
method: 'POST',
|
|
headers: getRequestHeaders(),
|
|
});
|
|
|
|
if (!response.ok) {
|
|
return false;
|
|
}
|
|
|
|
const data = await response.json();
|
|
return data.ok;
|
|
} catch (error) {
|
|
console.error(error);
|
|
return false;
|
|
}
|
|
}
|
|
|
|
function validateHordeModel() {
|
|
let selectedModels = models.filter(m => horde_settings.models.includes(m.name));
|
|
|
|
if (selectedModels.length === 0) {
|
|
toastr.warning('No Horde model selected or the selected models are no longer available. Please choose another model');
|
|
throw new Error('No Horde model available');
|
|
}
|
|
|
|
return selectedModels;
|
|
}
|
|
|
|
async function adjustHordeGenerationParams(max_context_length, max_length) {
|
|
console.log(max_context_length, max_length);
|
|
const workers = await getWorkers(false);
|
|
let maxContextLength = max_context_length;
|
|
let maxLength = max_length;
|
|
let availableWorkers = [];
|
|
let selectedModels = validateHordeModel();
|
|
|
|
if (selectedModels.length === 0) {
|
|
return { maxContextLength, maxLength };
|
|
}
|
|
|
|
for (const model of selectedModels) {
|
|
for (const worker of workers) {
|
|
if (model.cluster === worker.cluster && worker.models.includes(model.name)) {
|
|
// Skip workers that are not trusted if the option is enabled
|
|
if (horde_settings.trusted_workers_only && !worker.trusted) {
|
|
continue;
|
|
}
|
|
|
|
availableWorkers.push(worker);
|
|
}
|
|
}
|
|
}
|
|
|
|
//get the minimum requires parameters, lowest common value for all selected
|
|
for (const worker of availableWorkers) {
|
|
if (horde_settings.auto_adjust_context_length) {
|
|
maxContextLength = Math.min(worker.max_context_length, maxContextLength);
|
|
}
|
|
if (horde_settings.auto_adjust_response_length) {
|
|
maxLength = Math.min(worker.max_length, maxLength);
|
|
}
|
|
}
|
|
console.log(maxContextLength, maxLength);
|
|
$('#adjustedHordeParams').text(`Context: ${maxContextLength}, Response: ${maxLength}`);
|
|
return { maxContextLength, maxLength };
|
|
}
|
|
|
|
function setContextSizePreview() {
|
|
if (horde_settings.models.length) {
|
|
adjustHordeGenerationParams(max_context, amount_gen);
|
|
} else {
|
|
$('#adjustedHordeParams').text('Context: --, Response: --');
|
|
}
|
|
}
|
|
|
|
async function generateHorde(prompt, params, signal, reportProgress) {
|
|
validateHordeModel();
|
|
delete params.prompt;
|
|
|
|
// No idea what these do
|
|
params['n'] = 1;
|
|
params['frmtadsnsp'] = false;
|
|
params['frmtrmblln'] = false;
|
|
params['frmtrmspch'] = false;
|
|
params['frmttriminc'] = false;
|
|
|
|
const payload = {
|
|
'prompt': prompt,
|
|
'params': params,
|
|
'trusted_workers': horde_settings.trusted_workers_only,
|
|
//"slow_workers": false,
|
|
'models': horde_settings.models,
|
|
};
|
|
|
|
const response = await fetch('/api/horde/generate-text', {
|
|
method: 'POST',
|
|
headers: getRequestHeaders(),
|
|
body: JSON.stringify(payload),
|
|
});
|
|
|
|
if (!response.ok) {
|
|
toastr.error(response.statusText, 'Horde generation failed');
|
|
throw new Error(`Horde generation failed: ${response.statusText}`);
|
|
}
|
|
|
|
const responseJson = await response.json();
|
|
|
|
if (responseJson.error) {
|
|
const reason = responseJson.error?.message || 'Unknown error';
|
|
toastr.error(reason, 'Horde generation failed');
|
|
throw new Error(`Horde generation failed: ${reason}`);
|
|
}
|
|
|
|
const taskId = responseJson.id;
|
|
let queue_position_first = null;
|
|
console.log(`Horde task id = ${taskId}`);
|
|
|
|
for (let retryNumber = 0; retryNumber < MAX_RETRIES; retryNumber++) {
|
|
if (signal.aborted) {
|
|
cancelTask(taskId);
|
|
throw new Error('Request aborted');
|
|
}
|
|
|
|
const statusCheckJson = await getTaskStatus(taskId);
|
|
console.log(statusCheckJson);
|
|
|
|
if (statusCheckJson.faulted === true) {
|
|
toastr.error('Horde request faulted. Please try again.');
|
|
throw new Error('Horde generation failed: Faulted');
|
|
}
|
|
|
|
if (statusCheckJson.is_possible === false) {
|
|
toastr.error('There are no Horde workers that are able to generate text with your request. Please change the parameters or try again later.');
|
|
throw new Error('Horde generation failed: Unsatisfiable request');
|
|
}
|
|
|
|
if (statusCheckJson.done && Array.isArray(statusCheckJson.generations) && statusCheckJson.generations.length) {
|
|
reportProgress && setGenerationProgress(100);
|
|
const generatedText = statusCheckJson.generations[0].text;
|
|
const WorkerName = statusCheckJson.generations[0].worker_name;
|
|
const WorkerModel = statusCheckJson.generations[0].model;
|
|
console.log(generatedText);
|
|
console.log(`Generated by Horde Worker: ${WorkerName} [${WorkerModel}]`);
|
|
return { text: generatedText, workerName: `Generated by Horde worker: ${WorkerName} [${WorkerModel}]` };
|
|
} else if (!queue_position_first) {
|
|
queue_position_first = statusCheckJson.queue_position;
|
|
reportProgress && setGenerationProgress(0);
|
|
} else if (statusCheckJson.queue_position >= 0) {
|
|
let queue_position = statusCheckJson.queue_position;
|
|
const progress = Math.round(100 - (queue_position / queue_position_first * 100));
|
|
reportProgress && setGenerationProgress(progress);
|
|
}
|
|
|
|
await delay(CHECK_INTERVAL);
|
|
}
|
|
|
|
callPopup('Horde request timed out. Try again', 'text');
|
|
throw new Error('Horde timeout');
|
|
}
|
|
|
|
|
|
/**
|
|
* Displays the available models in the Horde model selection dropdown.
|
|
* @param {boolean} force Force refresh of the models
|
|
*/
|
|
async function getHordeModels(force) {
|
|
const sortByPerformance = (a, b) => b.performance - a.performance;
|
|
const sortByWhitelisted = (a, b) => b.is_whitelisted - a.is_whitelisted;
|
|
const sortByPopular = (a, b) => b.tags?.includes('popular') - a.tags?.includes('popular');
|
|
|
|
$('#horde_model').empty();
|
|
models = (await getModels(force)).sort((a, b) => {
|
|
return sortByWhitelisted(a, b) || sortByPopular(a, b) || sortByPerformance(a, b);
|
|
});
|
|
for (const model of models) {
|
|
const option = document.createElement('option');
|
|
option.value = model.name;
|
|
option.innerText = hordeModelTextString(model);
|
|
option.selected = horde_settings.models.includes(model.name);
|
|
$('#horde_model').append(option);
|
|
}
|
|
|
|
// if previously selected is no longer available
|
|
if (horde_settings.models.length && models.filter(m => horde_settings.models.includes(m.name)).length === 0) {
|
|
horde_settings.models = [];
|
|
}
|
|
|
|
setContextSizePreview();
|
|
}
|
|
|
|
function loadHordeSettings(settings) {
|
|
if (settings.horde_settings) {
|
|
Object.assign(horde_settings, settings.horde_settings);
|
|
}
|
|
|
|
$('#horde_auto_adjust_response_length').prop('checked', horde_settings.auto_adjust_response_length);
|
|
$('#horde_auto_adjust_context_length').prop('checked', horde_settings.auto_adjust_context_length);
|
|
$('#horde_trusted_workers_only').prop('checked', horde_settings.trusted_workers_only);
|
|
}
|
|
|
|
async function showKudos() {
|
|
const response = await fetch('/api/horde/user-info', {
|
|
method: 'POST',
|
|
headers: getRequestHeaders(),
|
|
});
|
|
|
|
if (!response.ok) {
|
|
toastr.warning('Could not load user info from Horde. Please try again later.');
|
|
return;
|
|
}
|
|
|
|
const data = await response.json();
|
|
|
|
if (data.anonymous) {
|
|
toastr.info('You are in anonymous mode. Set your personal Horde API key to see kudos.');
|
|
return;
|
|
}
|
|
|
|
console.log('Horde user data', data);
|
|
toastr.info(`Kudos: ${data.kudos}`, data.username);
|
|
}
|
|
|
|
function hordeModelTextString(model) {
|
|
const q = hordeModelQueueStateString(model);
|
|
return `${model.name} (${q})`;
|
|
}
|
|
|
|
function hordeModelQueueStateString(model) {
|
|
return `ETA: ${model.eta}s, Speed: ${model.performance}, Queue: ${model.queued}, Workers: ${model.count}`;
|
|
}
|
|
|
|
function getHordeModelTemplate(option) {
|
|
const model = models.find(x => x.name === option?.element?.value);
|
|
|
|
if (!option.id || !model) {
|
|
console.debug('No model found for option', option, option?.element?.value);
|
|
console.debug('Models', models);
|
|
return option.text;
|
|
}
|
|
|
|
const strip = html => {
|
|
const tmp = document.createElement('DIV');
|
|
tmp.innerHTML = html || '';
|
|
return tmp.textContent || tmp.innerText || '';
|
|
};
|
|
|
|
// how much do we trust the metadata from the models repo? about this much
|
|
const displayName = strip(model.display_name || model.name).replace(/.*\//g, '');
|
|
const description = strip(model.description);
|
|
const tags = model.tags ? model.tags.map(strip) : [];
|
|
const url = strip(model.url);
|
|
const style = strip(model.style);
|
|
|
|
const workerInfo = hordeModelQueueStateString(model);
|
|
const isPopular = model.tags?.includes('popular');
|
|
const descriptionDiv = description ? `<div class="horde-model-description">${description}</div>` : '';
|
|
const tagSpans = tags.length > 0 &&
|
|
`${tags.map(tag => `<span class="tag tag_name">${tag}</span>`).join('')}</span>` || '';
|
|
|
|
const modelDetailsLink = url && `<a href="${url}" target="_blank" rel="noopener noreferrer" class="model-details-link fa-solid fa-circle-question"> </a>`;
|
|
const capitalize = s => s ? s[0].toUpperCase() + s.slice(1) : '';
|
|
const innerContent = [
|
|
`<strong>${displayName}</strong> ${modelDetailsLink}`,
|
|
style ? `${capitalize(style)}` : '',
|
|
tagSpans ? `<span class="tags tags_inline inline-flex margin-r2">${tagSpans}</span>` : '',
|
|
].filter(Boolean).join(' | ');
|
|
|
|
return $((`
|
|
<div class="flex-container flexFlowColumn">
|
|
<div>
|
|
${isPopular ? '<span class="fa-fw fa-solid fa-star" title="Popular"></span>' : ''}
|
|
${innerContent}
|
|
</div>
|
|
${descriptionDiv}
|
|
<div><small>${workerInfo}</small></div>
|
|
</div>
|
|
`));
|
|
}
|
|
|
|
jQuery(function () {
|
|
$('#horde_model').on('mousedown change', async function (e) {
|
|
console.log('Horde model change', e);
|
|
horde_settings.models = $('#horde_model').val();
|
|
console.log('Updated Horde models', horde_settings.models);
|
|
|
|
// Try select instruct preset
|
|
autoSelectInstructPreset(horde_settings.models.join(' '));
|
|
if (horde_settings.models.length) {
|
|
adjustHordeGenerationParams(max_context, amount_gen);
|
|
} else {
|
|
$('#adjustedHordeParams').text('Context: --, Response: --');
|
|
}
|
|
});
|
|
|
|
$('#horde_auto_adjust_response_length').on('input', function () {
|
|
horde_settings.auto_adjust_response_length = !!$(this).prop('checked');
|
|
setContextSizePreview();
|
|
saveSettingsDebounced();
|
|
});
|
|
|
|
$('#horde_auto_adjust_context_length').on('input', function () {
|
|
horde_settings.auto_adjust_context_length = !!$(this).prop('checked');
|
|
setContextSizePreview();
|
|
saveSettingsDebounced();
|
|
});
|
|
|
|
$('#horde_trusted_workers_only').on('input', function () {
|
|
horde_settings.trusted_workers_only = !!$(this).prop('checked');
|
|
setContextSizePreview();
|
|
saveSettingsDebounced();
|
|
});
|
|
|
|
$('#horde_api_key').on('input', async function () {
|
|
const key = String($(this).val()).trim();
|
|
await writeSecret(SECRET_KEYS.HORDE, key);
|
|
});
|
|
|
|
$('#horde_refresh').on('click', () => getHordeModels(true));
|
|
$('#horde_kudos').on('click', showKudos);
|
|
|
|
// Not needed on mobile
|
|
if (!isMobile()) {
|
|
$('#horde_model').select2({
|
|
width: '100%',
|
|
placeholder: 'Select Horde models',
|
|
allowClear: true,
|
|
closeOnSelect: false,
|
|
templateSelection: function (data) {
|
|
// Customize the pillbox text by shortening the full text
|
|
return data.id;
|
|
},
|
|
templateResult: getHordeModelTemplate,
|
|
});
|
|
}
|
|
});
|
|
|