2024-06-21 23:36:29 +02:00
|
|
|
import { ensureImageFormatSupported, getBase64Async, isTrueBoolean, saveBase64AsFile } from '../../utils.js';
|
2024-06-07 01:25:42 +02:00
|
|
|
import { getContext, getApiUrl, doExtrasFetch, extension_settings, modules, renderExtensionTemplateAsync } from '../../extensions.js';
|
2024-06-29 23:31:54 +02:00
|
|
|
import { appendMediaToMessage, callPopup, eventSource, event_types, getRequestHeaders, saveChatConditional, saveSettingsDebounced, substituteParamsExtended } from '../../../script.js';
|
2023-12-02 19:04:51 +01:00
|
|
|
import { getMessageTimeStamp } from '../../RossAscends-mods.js';
|
|
|
|
import { SECRET_KEYS, secret_state } from '../../secrets.js';
|
|
|
|
import { getMultimodalCaption } from '../shared.js';
|
2023-12-19 23:45:45 +01:00
|
|
|
import { textgen_types, textgenerationwebui_settings } from '../../textgen-settings.js';
|
2024-05-12 21:15:05 +02:00
|
|
|
import { SlashCommandParser } from '../../slash-commands/SlashCommandParser.js';
|
|
|
|
import { SlashCommand } from '../../slash-commands/SlashCommand.js';
|
|
|
|
import { ARGUMENT_TYPE, SlashCommandArgument, SlashCommandNamedArgument } from '../../slash-commands/SlashCommandArgument.js';
|
2024-06-20 20:33:45 +02:00
|
|
|
import { commonEnumProviders } from '../../slash-commands/SlashCommandCommonEnumsProvider.js';
|
2023-07-20 19:32:15 +02:00
|
|
|
export { MODULE_NAME };
|
|
|
|
|
|
|
|
const MODULE_NAME = 'caption';
|
|
|
|
|
2024-08-01 00:34:49 +02:00
|
|
|
const PROMPT_DEFAULT = 'What\'s in this image?';
|
2023-11-07 00:58:34 +01:00
|
|
|
const TEMPLATE_DEFAULT = '[{{user}} sends {{char}} a picture that contains: {{caption}}]';
|
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
/**
|
|
|
|
* Migrates old extension settings to the new format.
|
|
|
|
* Must keep this function for compatibility with old settings.
|
|
|
|
*/
|
2023-11-07 00:58:34 +01:00
|
|
|
function migrateSettings() {
|
2023-11-07 00:28:46 +01:00
|
|
|
if (extension_settings.caption.local !== undefined) {
|
|
|
|
extension_settings.caption.source = extension_settings.caption.local ? 'local' : 'extras';
|
|
|
|
}
|
|
|
|
|
|
|
|
delete extension_settings.caption.local;
|
2023-11-07 00:58:34 +01:00
|
|
|
|
|
|
|
if (!extension_settings.caption.source) {
|
|
|
|
extension_settings.caption.source = 'extras';
|
|
|
|
}
|
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
if (extension_settings.caption.source === 'openai') {
|
|
|
|
extension_settings.caption.source = 'multimodal';
|
|
|
|
extension_settings.caption.multimodal_api = 'openai';
|
2024-04-10 06:24:43 +02:00
|
|
|
extension_settings.caption.multimodal_model = 'gpt-4-turbo';
|
2023-11-17 22:19:21 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
if (!extension_settings.caption.multimodal_api) {
|
|
|
|
extension_settings.caption.multimodal_api = 'openai';
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!extension_settings.caption.multimodal_model) {
|
2024-04-10 06:24:43 +02:00
|
|
|
extension_settings.caption.multimodal_model = 'gpt-4-turbo';
|
2023-11-17 22:19:21 +01:00
|
|
|
}
|
|
|
|
|
2023-11-07 00:58:34 +01:00
|
|
|
if (!extension_settings.caption.prompt) {
|
|
|
|
extension_settings.caption.prompt = PROMPT_DEFAULT;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!extension_settings.caption.template) {
|
|
|
|
extension_settings.caption.template = TEMPLATE_DEFAULT;
|
|
|
|
}
|
2023-11-07 00:28:46 +01:00
|
|
|
}
|
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
/**
|
|
|
|
* Sets an image icon for the send button.
|
|
|
|
*/
|
2023-07-20 19:32:15 +02:00
|
|
|
async function setImageIcon() {
|
|
|
|
try {
|
|
|
|
const sendButton = $('#send_picture .extensionsMenuExtensionButton');
|
|
|
|
sendButton.addClass('fa-image');
|
|
|
|
sendButton.removeClass('fa-hourglass-half');
|
|
|
|
}
|
|
|
|
catch (error) {
|
|
|
|
console.log(error);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
/**
|
|
|
|
* Sets a spinner icon for the send button.
|
|
|
|
*/
|
2023-07-20 19:32:15 +02:00
|
|
|
async function setSpinnerIcon() {
|
|
|
|
try {
|
|
|
|
const sendButton = $('#send_picture .extensionsMenuExtensionButton');
|
|
|
|
sendButton.removeClass('fa-image');
|
|
|
|
sendButton.addClass('fa-hourglass-half');
|
|
|
|
}
|
|
|
|
catch (error) {
|
|
|
|
console.log(error);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
/**
|
2024-06-29 23:06:17 +02:00
|
|
|
* Wraps a caption with a message template.
|
|
|
|
* @param {string} caption Raw caption
|
|
|
|
* @returns {Promise<string>} Wrapped caption
|
2023-11-17 22:19:21 +01:00
|
|
|
*/
|
2024-06-29 23:06:17 +02:00
|
|
|
async function wrapCaptionTemplate(caption) {
|
2023-11-07 00:58:34 +01:00
|
|
|
let template = extension_settings.caption.template || TEMPLATE_DEFAULT;
|
|
|
|
|
|
|
|
if (!/{{caption}}/i.test(template)) {
|
2023-12-02 20:11:06 +01:00
|
|
|
console.warn('Poka-yoke: Caption template does not contain {{caption}}. Appending it.');
|
2023-11-07 00:58:34 +01:00
|
|
|
template += ' {{caption}}';
|
|
|
|
}
|
|
|
|
|
2024-06-15 00:40:16 +02:00
|
|
|
let messageText = substituteParamsExtended(template, { caption: caption });
|
2023-07-20 19:32:15 +02:00
|
|
|
|
|
|
|
if (extension_settings.caption.refine_mode) {
|
|
|
|
messageText = await callPopup(
|
2024-06-29 23:06:17 +02:00
|
|
|
'<h3>Review and edit the generated caption:</h3>Press "Cancel" to abort the caption sending.',
|
2023-07-20 19:32:15 +02:00
|
|
|
'input',
|
|
|
|
messageText,
|
|
|
|
{ rows: 5, okButton: 'Send' });
|
|
|
|
|
|
|
|
if (!messageText) {
|
|
|
|
throw new Error('User aborted the caption sending.');
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-06-29 23:06:17 +02:00
|
|
|
return messageText;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Appends caption to an existing message.
|
|
|
|
* @param {Object} data Message data
|
|
|
|
* @returns {Promise<void>}
|
|
|
|
*/
|
|
|
|
async function captionExistingMessage(data) {
|
|
|
|
if (!(data?.extra?.image)) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
const imageData = await fetch(data.extra.image);
|
|
|
|
const blob = await imageData.blob();
|
|
|
|
const type = imageData.headers.get('Content-Type');
|
|
|
|
const file = new File([blob], 'image.png', { type });
|
|
|
|
const caption = await getCaptionForFile(file, null, true);
|
|
|
|
|
|
|
|
if (!caption) {
|
|
|
|
console.warn('Failed to generate a caption for the image.');
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
const wrappedCaption = await wrapCaptionTemplate(caption);
|
|
|
|
|
|
|
|
const messageText = String(data.mes).trim();
|
|
|
|
|
|
|
|
if (!messageText) {
|
|
|
|
data.extra.inline_image = false;
|
|
|
|
data.mes = wrappedCaption;
|
|
|
|
data.extra.title = wrappedCaption;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
data.extra.inline_image = true;
|
|
|
|
data.extra.append_title = true;
|
|
|
|
data.extra.title = wrappedCaption;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Sends a captioned message to the chat.
|
|
|
|
* @param {string} caption Caption text
|
|
|
|
* @param {string} image Image URL
|
|
|
|
*/
|
|
|
|
async function sendCaptionedMessage(caption, image) {
|
|
|
|
const messageText = await wrapCaptionTemplate(caption);
|
|
|
|
|
|
|
|
const context = getContext();
|
2023-07-20 19:32:15 +02:00
|
|
|
const message = {
|
|
|
|
name: context.name1,
|
|
|
|
is_user: true,
|
2023-08-22 17:13:03 +02:00
|
|
|
send_date: getMessageTimeStamp(),
|
2023-07-20 19:32:15 +02:00
|
|
|
mes: messageText,
|
|
|
|
extra: {
|
|
|
|
image: image,
|
|
|
|
title: messageText,
|
|
|
|
},
|
|
|
|
};
|
|
|
|
context.chat.push(message);
|
2024-08-05 20:22:40 +02:00
|
|
|
const messageId = context.chat.length - 1;
|
|
|
|
await eventSource.emit(event_types.MESSAGE_SENT, messageId);
|
2023-07-20 19:32:15 +02:00
|
|
|
context.addOneMessage(message);
|
2024-08-05 20:22:40 +02:00
|
|
|
await eventSource.emit(event_types.USER_MESSAGE_RENDERED, messageId);
|
|
|
|
await context.saveChat();
|
2023-07-20 19:32:15 +02:00
|
|
|
}
|
|
|
|
|
2023-11-07 00:28:46 +01:00
|
|
|
/**
|
2023-11-17 22:19:21 +01:00
|
|
|
* Generates a caption for an image using a selected source.
|
2023-11-07 00:28:46 +01:00
|
|
|
* @param {string} base64Img Base64 encoded image without the data:image/...;base64, prefix
|
|
|
|
* @param {string} fileData Base64 encoded image with the data:image/...;base64, prefix
|
2024-04-18 15:22:33 +02:00
|
|
|
* @param {string} externalPrompt Caption prompt
|
2023-11-17 22:19:21 +01:00
|
|
|
* @returns {Promise<{caption: string}>} Generated caption
|
2023-11-07 00:28:46 +01:00
|
|
|
*/
|
2024-04-18 15:22:33 +02:00
|
|
|
async function doCaptionRequest(base64Img, fileData, externalPrompt) {
|
2023-11-07 00:28:46 +01:00
|
|
|
switch (extension_settings.caption.source) {
|
|
|
|
case 'local':
|
|
|
|
return await captionLocal(base64Img);
|
|
|
|
case 'extras':
|
|
|
|
return await captionExtras(base64Img);
|
|
|
|
case 'horde':
|
|
|
|
return await captionHorde(base64Img);
|
2023-11-17 22:19:21 +01:00
|
|
|
case 'multimodal':
|
2024-04-18 15:22:33 +02:00
|
|
|
return await captionMultimodal(fileData, externalPrompt);
|
2023-11-07 00:28:46 +01:00
|
|
|
default:
|
|
|
|
throw new Error('Unknown caption source.');
|
|
|
|
}
|
|
|
|
}
|
2023-07-20 19:32:15 +02:00
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
/**
|
|
|
|
* Generates a caption for an image using Extras API.
|
|
|
|
* @param {string} base64Img Base64 encoded image without the data:image/...;base64, prefix
|
|
|
|
* @returns {Promise<{caption: string}>} Generated caption
|
|
|
|
*/
|
2023-11-07 00:28:46 +01:00
|
|
|
async function captionExtras(base64Img) {
|
|
|
|
if (!modules.includes('caption')) {
|
|
|
|
throw new Error('No captioning module is available.');
|
|
|
|
}
|
2023-07-20 19:32:15 +02:00
|
|
|
|
2023-11-07 00:28:46 +01:00
|
|
|
const url = new URL(getApiUrl());
|
|
|
|
url.pathname = '/api/caption';
|
2023-07-20 19:32:15 +02:00
|
|
|
|
2023-11-07 00:28:46 +01:00
|
|
|
const apiResult = await doExtrasFetch(url, {
|
|
|
|
method: 'POST',
|
|
|
|
headers: {
|
|
|
|
'Content-Type': 'application/json',
|
|
|
|
'Bypass-Tunnel-Reminder': 'bypass',
|
|
|
|
},
|
2023-12-02 21:06:57 +01:00
|
|
|
body: JSON.stringify({ image: base64Img }),
|
2023-11-07 00:28:46 +01:00
|
|
|
});
|
2023-09-11 23:15:21 +02:00
|
|
|
|
2023-11-07 00:28:46 +01:00
|
|
|
if (!apiResult.ok) {
|
|
|
|
throw new Error('Failed to caption image via Extras.');
|
|
|
|
}
|
|
|
|
|
|
|
|
const data = await apiResult.json();
|
|
|
|
return data;
|
|
|
|
}
|
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
/**
|
|
|
|
* Generates a caption for an image using a local model.
|
|
|
|
* @param {string} base64Img Base64 encoded image without the data:image/...;base64, prefix
|
|
|
|
* @returns {Promise<{caption: string}>} Generated caption
|
|
|
|
*/
|
2023-11-07 00:28:46 +01:00
|
|
|
async function captionLocal(base64Img) {
|
|
|
|
const apiResult = await fetch('/api/extra/caption', {
|
|
|
|
method: 'POST',
|
|
|
|
headers: getRequestHeaders(),
|
2023-12-02 21:06:57 +01:00
|
|
|
body: JSON.stringify({ image: base64Img }),
|
2023-11-07 00:28:46 +01:00
|
|
|
});
|
|
|
|
|
|
|
|
if (!apiResult.ok) {
|
|
|
|
throw new Error('Failed to caption image via local pipeline.');
|
|
|
|
}
|
|
|
|
|
|
|
|
const data = await apiResult.json();
|
|
|
|
return data;
|
|
|
|
}
|
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
/**
|
|
|
|
* Generates a caption for an image using a Horde model.
|
|
|
|
* @param {string} base64Img Base64 encoded image without the data:image/...;base64, prefix
|
|
|
|
* @returns {Promise<{caption: string}>} Generated caption
|
|
|
|
*/
|
2023-11-07 00:28:46 +01:00
|
|
|
async function captionHorde(base64Img) {
|
|
|
|
const apiResult = await fetch('/api/horde/caption-image', {
|
|
|
|
method: 'POST',
|
|
|
|
headers: getRequestHeaders(),
|
2023-12-02 21:06:57 +01:00
|
|
|
body: JSON.stringify({ image: base64Img }),
|
2023-11-07 00:28:46 +01:00
|
|
|
});
|
|
|
|
|
|
|
|
if (!apiResult.ok) {
|
|
|
|
throw new Error('Failed to caption image via Horde.');
|
2023-09-11 23:15:21 +02:00
|
|
|
}
|
2023-11-07 00:28:46 +01:00
|
|
|
|
|
|
|
const data = await apiResult.json();
|
|
|
|
return data;
|
|
|
|
}
|
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
/**
|
|
|
|
* Generates a caption for an image using a multimodal model.
|
|
|
|
* @param {string} base64Img Base64 encoded image with the data:image/...;base64, prefix
|
2024-04-18 15:22:33 +02:00
|
|
|
* @param {string} externalPrompt Caption prompt
|
2023-11-17 22:19:21 +01:00
|
|
|
* @returns {Promise<{caption: string}>} Generated caption
|
|
|
|
*/
|
2024-04-18 15:22:33 +02:00
|
|
|
async function captionMultimodal(base64Img, externalPrompt) {
|
|
|
|
let prompt = externalPrompt || extension_settings.caption.prompt || PROMPT_DEFAULT;
|
2023-12-20 20:23:59 +01:00
|
|
|
|
2024-04-18 15:22:33 +02:00
|
|
|
if (!externalPrompt && extension_settings.caption.prompt_ask) {
|
2023-12-20 20:23:59 +01:00
|
|
|
const customPrompt = await callPopup('<h3>Enter a comment or question:</h3>', 'input', prompt, { rows: 2 });
|
|
|
|
if (!customPrompt) {
|
|
|
|
throw new Error('User aborted the caption sending.');
|
|
|
|
}
|
|
|
|
prompt = String(customPrompt).trim();
|
|
|
|
}
|
|
|
|
|
2023-11-17 22:19:21 +01:00
|
|
|
const caption = await getMultimodalCaption(base64Img, prompt);
|
|
|
|
return { caption };
|
2023-09-11 23:15:21 +02:00
|
|
|
}
|
|
|
|
|
2024-04-18 15:22:33 +02:00
|
|
|
/**
|
|
|
|
* Handles the image selection event.
|
|
|
|
* @param {Event} e Input event
|
|
|
|
* @param {string} prompt Caption prompt
|
|
|
|
* @param {boolean} quiet Suppresses sending a message
|
|
|
|
* @returns {Promise<string>} Generated caption
|
|
|
|
*/
|
|
|
|
async function onSelectImage(e, prompt, quiet) {
|
|
|
|
if (!(e.target instanceof HTMLInputElement)) {
|
|
|
|
return '';
|
|
|
|
}
|
|
|
|
|
2023-09-11 23:15:21 +02:00
|
|
|
const file = e.target.files[0];
|
2024-04-18 15:22:33 +02:00
|
|
|
const form = e.target.form;
|
2023-09-11 23:15:21 +02:00
|
|
|
|
|
|
|
if (!file || !(file instanceof File)) {
|
2024-04-18 15:22:33 +02:00
|
|
|
form && form.reset();
|
|
|
|
return '';
|
2023-09-11 23:15:21 +02:00
|
|
|
}
|
|
|
|
|
2024-05-12 21:15:05 +02:00
|
|
|
const caption = await getCaptionForFile(file, prompt, quiet);
|
|
|
|
form && form.reset();
|
|
|
|
return caption;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Gets a caption for an image file.
|
|
|
|
* @param {File} file Input file
|
|
|
|
* @param {string} prompt Caption prompt
|
|
|
|
* @param {boolean} quiet Suppresses sending a message
|
|
|
|
* @returns {Promise<string>} Generated caption
|
|
|
|
*/
|
|
|
|
async function getCaptionForFile(file, prompt, quiet) {
|
2023-09-11 23:15:21 +02:00
|
|
|
try {
|
2024-04-18 15:22:33 +02:00
|
|
|
setSpinnerIcon();
|
2023-09-11 23:15:21 +02:00
|
|
|
const context = getContext();
|
2024-06-21 23:36:29 +02:00
|
|
|
const fileData = await getBase64Async(await ensureImageFormatSupported(file));
|
2023-09-11 23:15:21 +02:00
|
|
|
const base64Format = fileData.split(',')[0].split(';')[0].split('/')[1];
|
|
|
|
const base64Data = fileData.split(',')[1];
|
2024-04-18 15:22:33 +02:00
|
|
|
const { caption } = await doCaptionRequest(base64Data, fileData, prompt);
|
|
|
|
if (!quiet) {
|
|
|
|
const imagePath = await saveBase64AsFile(base64Data, context.name2, '', base64Format);
|
|
|
|
await sendCaptionedMessage(caption, imagePath);
|
|
|
|
}
|
|
|
|
return caption;
|
2023-07-20 19:32:15 +02:00
|
|
|
}
|
|
|
|
catch (error) {
|
2024-07-11 01:12:39 +02:00
|
|
|
const errorMessage = error.message || 'Unknown error';
|
2024-08-01 00:34:49 +02:00
|
|
|
toastr.error(errorMessage, 'Failed to caption image.');
|
2024-07-11 01:12:39 +02:00
|
|
|
console.error(error);
|
2024-04-18 15:22:33 +02:00
|
|
|
return '';
|
2023-07-20 19:32:15 +02:00
|
|
|
}
|
|
|
|
finally {
|
|
|
|
setImageIcon();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
function onRefineModeInput() {
|
|
|
|
extension_settings.caption.refine_mode = $('#caption_refine_mode').prop('checked');
|
|
|
|
saveSettingsDebounced();
|
|
|
|
}
|
|
|
|
|
2024-04-18 15:22:33 +02:00
|
|
|
/**
|
|
|
|
* Callback for the /caption command.
|
|
|
|
* @param {object} args Named parameters
|
|
|
|
* @param {string} prompt Caption prompt
|
|
|
|
*/
|
2024-05-12 21:15:05 +02:00
|
|
|
async function captionCommandCallback(args, prompt) {
|
|
|
|
const quiet = isTrueBoolean(args?.quiet);
|
|
|
|
const id = args?.id;
|
|
|
|
|
|
|
|
if (!isNaN(Number(id))) {
|
|
|
|
const message = getContext().chat[id];
|
|
|
|
if (message?.extra?.image) {
|
|
|
|
try {
|
|
|
|
const fetchResult = await fetch(message.extra.image);
|
|
|
|
const blob = await fetchResult.blob();
|
|
|
|
const file = new File([blob], 'image.jpg', { type: blob.type });
|
|
|
|
return await getCaptionForFile(file, prompt, quiet);
|
|
|
|
} catch (error) {
|
|
|
|
toastr.error('Failed to get image from the message. Make sure the image is accessible.');
|
|
|
|
return '';
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-04-18 15:22:33 +02:00
|
|
|
return new Promise(resolve => {
|
|
|
|
const input = document.createElement('input');
|
|
|
|
input.type = 'file';
|
|
|
|
input.accept = 'image/*';
|
|
|
|
input.onchange = async (e) => {
|
|
|
|
const caption = await onSelectImage(e, prompt, quiet);
|
|
|
|
resolve(caption);
|
|
|
|
};
|
|
|
|
input.oncancel = () => resolve('');
|
|
|
|
input.click();
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2024-06-07 01:25:42 +02:00
|
|
|
jQuery(async function () {
|
2023-07-20 19:32:15 +02:00
|
|
|
function addSendPictureButton() {
|
|
|
|
const sendButton = $(`
|
|
|
|
<div id="send_picture" class="list-group-item flex-container flexGap5">
|
|
|
|
<div class="fa-solid fa-image extensionsMenuExtensionButton"></div>
|
2023-11-18 18:23:58 +01:00
|
|
|
Generate Caption
|
|
|
|
</div>`);
|
2023-07-20 19:32:15 +02:00
|
|
|
|
2024-06-24 22:17:58 +02:00
|
|
|
$('#caption_wand_container').append(sendButton);
|
2023-09-11 23:15:21 +02:00
|
|
|
$(sendButton).on('click', () => {
|
2023-11-07 00:28:46 +01:00
|
|
|
const hasCaptionModule =
|
|
|
|
(modules.includes('caption') && extension_settings.caption.source === 'extras') ||
|
2023-12-19 23:45:45 +01:00
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'openai' && (secret_state[SECRET_KEYS.OPENAI] || extension_settings.caption.allow_reverse_proxy)) ||
|
2023-11-17 22:19:21 +01:00
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'openrouter' && secret_state[SECRET_KEYS.OPENROUTER]) ||
|
2024-08-01 00:34:49 +02:00
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'zerooneai' && secret_state[SECRET_KEYS.ZEROONEAI]) ||
|
2024-05-24 20:38:29 +02:00
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'google' && (secret_state[SECRET_KEYS.MAKERSUITE] || extension_settings.caption.allow_reverse_proxy)) ||
|
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'anthropic' && (secret_state[SECRET_KEYS.CLAUDE] || extension_settings.caption.allow_reverse_proxy)) ||
|
2023-12-19 23:45:45 +01:00
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'ollama' && textgenerationwebui_settings.server_urls[textgen_types.OLLAMA]) ||
|
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'llamacpp' && textgenerationwebui_settings.server_urls[textgen_types.LLAMACPP]) ||
|
2023-12-24 00:43:29 +01:00
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'ooba' && textgenerationwebui_settings.server_urls[textgen_types.OOBA]) ||
|
2024-03-14 00:03:51 +01:00
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'koboldcpp' && textgenerationwebui_settings.server_urls[textgen_types.KOBOLDCPP]) ||
|
2024-06-28 23:33:12 +02:00
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'vllm' && textgenerationwebui_settings.server_urls[textgen_types.VLLM]) ||
|
2023-12-20 20:05:20 +01:00
|
|
|
(extension_settings.caption.source === 'multimodal' && extension_settings.caption.multimodal_api === 'custom') ||
|
2023-11-07 00:28:46 +01:00
|
|
|
extension_settings.caption.source === 'local' ||
|
|
|
|
extension_settings.caption.source === 'horde';
|
2023-09-11 23:15:21 +02:00
|
|
|
|
|
|
|
if (!hasCaptionModule) {
|
2023-11-17 22:19:21 +01:00
|
|
|
toastr.error('Choose other captioning source in the extension settings.', 'Captioning is not available');
|
2023-09-11 23:15:21 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
$('#img_file').trigger('click');
|
|
|
|
});
|
2023-07-20 19:32:15 +02:00
|
|
|
}
|
|
|
|
function addPictureSendForm() {
|
2023-12-02 19:04:51 +01:00
|
|
|
const inputHtml = '<input id="img_file" type="file" hidden accept="image/*">';
|
2023-07-20 19:32:15 +02:00
|
|
|
const imgForm = document.createElement('form');
|
|
|
|
imgForm.id = 'img_form';
|
|
|
|
$(imgForm).append(inputHtml);
|
|
|
|
$(imgForm).hide();
|
|
|
|
$('#form_sheld').append(imgForm);
|
2024-04-18 15:22:33 +02:00
|
|
|
$('#img_file').on('change', (e) => onSelectImage(e.originalEvent, '', false));
|
2023-07-20 19:32:15 +02:00
|
|
|
}
|
2023-11-17 22:19:21 +01:00
|
|
|
function switchMultimodalBlocks() {
|
|
|
|
const isMultimodal = extension_settings.caption.source === 'multimodal';
|
2024-06-22 15:28:57 +02:00
|
|
|
$('#caption_ollama_pull').on('click', (e) => {
|
|
|
|
const presetModel = extension_settings.caption.multimodal_model !== 'ollama_current' ? extension_settings.caption.multimodal_model : '';
|
|
|
|
e.preventDefault();
|
|
|
|
$('#ollama_download_model').trigger('click');
|
|
|
|
$('#dialogue_popup_input').val(presetModel);
|
|
|
|
});
|
2023-11-17 22:19:21 +01:00
|
|
|
$('#caption_multimodal_block').toggle(isMultimodal);
|
|
|
|
$('#caption_prompt_block').toggle(isMultimodal);
|
|
|
|
$('#caption_multimodal_api').val(extension_settings.caption.multimodal_api);
|
|
|
|
$('#caption_multimodal_model').val(extension_settings.caption.multimodal_model);
|
2023-12-17 18:41:20 +01:00
|
|
|
$('#caption_multimodal_block [data-type]').each(function () {
|
2023-11-17 22:19:21 +01:00
|
|
|
const type = $(this).data('type');
|
2024-03-05 17:47:00 +01:00
|
|
|
const types = type.split(',');
|
|
|
|
$(this).toggle(types.includes(extension_settings.caption.multimodal_api));
|
2023-11-17 22:19:21 +01:00
|
|
|
});
|
|
|
|
$('#caption_multimodal_api').on('change', () => {
|
|
|
|
const api = String($('#caption_multimodal_api').val());
|
|
|
|
const model = String($(`#caption_multimodal_model option[data-type="${api}"]`).first().val());
|
|
|
|
extension_settings.caption.multimodal_api = api;
|
|
|
|
extension_settings.caption.multimodal_model = model;
|
|
|
|
saveSettingsDebounced();
|
|
|
|
switchMultimodalBlocks();
|
|
|
|
});
|
|
|
|
$('#caption_multimodal_model').on('change', () => {
|
|
|
|
extension_settings.caption.multimodal_model = String($('#caption_multimodal_model').val());
|
|
|
|
saveSettingsDebounced();
|
|
|
|
});
|
|
|
|
}
|
2024-06-07 01:25:42 +02:00
|
|
|
async function addSettings() {
|
2024-06-29 22:22:29 +02:00
|
|
|
const html = await renderExtensionTemplateAsync('caption', 'settings', { TEMPLATE_DEFAULT, PROMPT_DEFAULT });
|
2024-06-24 21:15:08 +02:00
|
|
|
$('#caption_container').append(html);
|
2023-07-20 19:32:15 +02:00
|
|
|
}
|
|
|
|
|
2024-06-07 01:25:42 +02:00
|
|
|
await addSettings();
|
2023-07-20 19:32:15 +02:00
|
|
|
addPictureSendForm();
|
|
|
|
addSendPictureButton();
|
|
|
|
setImageIcon();
|
2023-11-07 00:58:34 +01:00
|
|
|
migrateSettings();
|
2023-11-17 22:19:21 +01:00
|
|
|
switchMultimodalBlocks();
|
2023-11-07 00:28:46 +01:00
|
|
|
|
2023-07-20 19:32:15 +02:00
|
|
|
$('#caption_refine_mode').prop('checked', !!(extension_settings.caption.refine_mode));
|
2023-12-17 18:41:20 +01:00
|
|
|
$('#caption_allow_reverse_proxy').prop('checked', !!(extension_settings.caption.allow_reverse_proxy));
|
2023-12-20 20:23:59 +01:00
|
|
|
$('#caption_prompt_ask').prop('checked', !!(extension_settings.caption.prompt_ask));
|
2024-06-29 23:06:17 +02:00
|
|
|
$('#caption_auto_mode').prop('checked', !!(extension_settings.caption.auto_mode));
|
2023-11-07 00:28:46 +01:00
|
|
|
$('#caption_source').val(extension_settings.caption.source);
|
2023-11-07 00:58:34 +01:00
|
|
|
$('#caption_prompt').val(extension_settings.caption.prompt);
|
|
|
|
$('#caption_template').val(extension_settings.caption.template);
|
2023-07-20 19:32:15 +02:00
|
|
|
$('#caption_refine_mode').on('input', onRefineModeInput);
|
2023-11-07 00:28:46 +01:00
|
|
|
$('#caption_source').on('change', () => {
|
|
|
|
extension_settings.caption.source = String($('#caption_source').val());
|
2023-11-17 22:19:21 +01:00
|
|
|
switchMultimodalBlocks();
|
2023-09-11 23:15:21 +02:00
|
|
|
saveSettingsDebounced();
|
|
|
|
});
|
2023-11-07 00:58:34 +01:00
|
|
|
$('#caption_prompt').on('input', () => {
|
|
|
|
extension_settings.caption.prompt = String($('#caption_prompt').val());
|
|
|
|
saveSettingsDebounced();
|
|
|
|
});
|
|
|
|
$('#caption_template').on('input', () => {
|
|
|
|
extension_settings.caption.template = String($('#caption_template').val());
|
|
|
|
saveSettingsDebounced();
|
|
|
|
});
|
2023-12-17 18:41:20 +01:00
|
|
|
$('#caption_allow_reverse_proxy').on('input', () => {
|
|
|
|
extension_settings.caption.allow_reverse_proxy = $('#caption_allow_reverse_proxy').prop('checked');
|
|
|
|
saveSettingsDebounced();
|
|
|
|
});
|
2023-12-20 20:23:59 +01:00
|
|
|
$('#caption_prompt_ask').on('input', () => {
|
|
|
|
extension_settings.caption.prompt_ask = $('#caption_prompt_ask').prop('checked');
|
|
|
|
saveSettingsDebounced();
|
|
|
|
});
|
2024-06-29 23:06:17 +02:00
|
|
|
$('#caption_auto_mode').on('input', () => {
|
|
|
|
extension_settings.caption.auto_mode = !!$('#caption_auto_mode').prop('checked');
|
|
|
|
saveSettingsDebounced();
|
|
|
|
});
|
|
|
|
|
|
|
|
const onMessageEvent = async (index) => {
|
|
|
|
if (!extension_settings.caption.auto_mode) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
const data = getContext().chat[index];
|
|
|
|
await captionExistingMessage(data);
|
|
|
|
};
|
|
|
|
|
|
|
|
eventSource.on(event_types.MESSAGE_SENT, onMessageEvent);
|
|
|
|
eventSource.on(event_types.MESSAGE_FILE_EMBEDDED, onMessageEvent);
|
2024-04-18 15:22:33 +02:00
|
|
|
|
2024-06-29 23:31:54 +02:00
|
|
|
$(document).on('click', '.mes_img_caption', async function () {
|
2024-06-30 00:19:43 +02:00
|
|
|
const animationClass = 'fa-fade';
|
2024-06-29 23:31:54 +02:00
|
|
|
const messageBlock = $(this).closest('.mes');
|
2024-06-30 00:19:43 +02:00
|
|
|
const messageImg = messageBlock.find('.mes_img');
|
|
|
|
if (messageImg.hasClass(animationClass)) return;
|
|
|
|
messageImg.addClass(animationClass);
|
2024-06-30 18:20:39 +02:00
|
|
|
try {
|
|
|
|
const index = Number(messageBlock.attr('mesid'));
|
|
|
|
const data = getContext().chat[index];
|
|
|
|
await captionExistingMessage(data);
|
|
|
|
appendMediaToMessage(data, messageBlock, false);
|
|
|
|
await saveChatConditional();
|
|
|
|
} catch(e) {
|
|
|
|
console.error('Message image recaption failed', e);
|
|
|
|
} finally {
|
|
|
|
messageImg.removeClass(animationClass);
|
|
|
|
}
|
2024-06-29 23:31:54 +02:00
|
|
|
});
|
|
|
|
|
2024-05-12 21:15:05 +02:00
|
|
|
SlashCommandParser.addCommandObject(SlashCommand.fromProps({ name: 'caption',
|
|
|
|
callback: captionCommandCallback,
|
|
|
|
returns: 'caption',
|
|
|
|
namedArgumentList: [
|
|
|
|
new SlashCommandNamedArgument(
|
2024-06-17 07:04:10 +02:00
|
|
|
'quiet', 'suppress sending a captioned message', [ARGUMENT_TYPE.BOOLEAN], false, false, 'false',
|
2024-05-12 21:15:05 +02:00
|
|
|
),
|
2024-06-17 07:04:10 +02:00
|
|
|
SlashCommandNamedArgument.fromProps({
|
|
|
|
name: 'id',
|
|
|
|
description: 'get image from a message with this ID',
|
|
|
|
typeList: [ARGUMENT_TYPE.NUMBER],
|
2024-06-21 20:04:55 +02:00
|
|
|
enumProvider: commonEnumProviders.messages(),
|
2024-06-17 07:04:10 +02:00
|
|
|
}),
|
2024-05-12 21:15:05 +02:00
|
|
|
],
|
|
|
|
unnamedArgumentList: [
|
|
|
|
new SlashCommandArgument(
|
|
|
|
'prompt', [ARGUMENT_TYPE.STRING], false,
|
|
|
|
),
|
|
|
|
],
|
|
|
|
helpString: `
|
|
|
|
<div>
|
|
|
|
Caption an image with an optional prompt and passes the caption down the pipe.
|
|
|
|
</div>
|
|
|
|
<div>
|
|
|
|
Only multimodal sources support custom prompts.
|
|
|
|
</div>
|
|
|
|
<div>
|
|
|
|
Provide a message ID to get an image from a message instead of uploading one.
|
|
|
|
</div>
|
|
|
|
<div>
|
|
|
|
Set the "quiet" argument to true to suppress sending a captioned message, default: false.
|
|
|
|
</div>
|
|
|
|
`,
|
|
|
|
}));
|
2024-06-29 23:31:54 +02:00
|
|
|
|
|
|
|
document.body.classList.add('caption');
|
2023-07-20 19:32:15 +02:00
|
|
|
});
|