import { getStringHash, debounce, waitUntilCondition, extractAllWords, isTrueBoolean } from '../../utils.js'; import { getContext, getApiUrl, extension_settings, doExtrasFetch, modules, renderExtensionTemplateAsync } from '../../extensions.js'; import { activateSendButtons, deactivateSendButtons, animation_duration, eventSource, event_types, extension_prompt_roles, extension_prompt_types, generateQuietPrompt, is_send_press, saveSettingsDebounced, substituteParamsExtended, generateRaw, getMaxContextSize, setExtensionPrompt, streamingProcessor, } from '../../../script.js'; import { is_group_generating, selected_group } from '../../group-chats.js'; import { loadMovingUIState } from '../../power-user.js'; import { dragElement } from '../../RossAscends-mods.js'; import { getTextTokens, getTokenCountAsync, tokenizers } from '../../tokenizers.js'; import { debounce_timeout } from '../../constants.js'; import { SlashCommandParser } from '../../slash-commands/SlashCommandParser.js'; import { SlashCommand } from '../../slash-commands/SlashCommand.js'; import { ARGUMENT_TYPE, SlashCommandArgument, SlashCommandNamedArgument } from '../../slash-commands/SlashCommandArgument.js'; import { MacrosParser } from '../../macros.js'; import { countWebLlmTokens, generateWebLlmChatPrompt, getWebLlmContextSize, isWebLlmSupported } from '../shared.js'; import { commonEnumProviders } from '../../slash-commands/SlashCommandCommonEnumsProvider.js'; export { MODULE_NAME }; const MODULE_NAME = '1_memory'; let lastCharacterId = null; let lastGroupId = null; let lastChatId = null; let lastMessageHash = null; let lastMessageId = null; let inApiCall = false; /** * Count the number of tokens in the provided text. * @param {string} text Text to count tokens for * @param {number} padding Number of additional tokens to add to the count * @returns {Promise} Number of tokens in the text */ async function countSourceTokens(text, padding = 0) { if (extension_settings.memory.source === summary_sources.webllm) { const count = await countWebLlmTokens(text); return count + padding; } if (extension_settings.memory.source === summary_sources.extras) { const count = getTextTokens(tokenizers.GPT2, text).length; return count + padding; } return await getTokenCountAsync(text, padding); } async function getSourceContextSize() { const overrideLength = extension_settings.memory.overrideResponseLength; if (extension_settings.memory.source === summary_sources.webllm) { const maxContext = await getWebLlmContextSize(); return overrideLength > 0 ? (maxContext - overrideLength) : Math.round(maxContext * 0.75); } if (extension_settings.source === summary_sources.extras) { return 1024 - 64; } return getMaxContextSize(overrideLength); } const formatMemoryValue = function (value) { if (!value) { return ''; } value = value.trim(); if (extension_settings.memory.template) { return substituteParamsExtended(extension_settings.memory.template, { summary: value }); } else { return `Summary: ${value}`; } }; const saveChatDebounced = debounce(() => getContext().saveChat(), debounce_timeout.relaxed); const summary_sources = { 'extras': 'extras', 'main': 'main', 'webllm': 'webllm', }; const prompt_builders = { DEFAULT: 0, RAW_BLOCKING: 1, RAW_NON_BLOCKING: 2, }; const defaultPrompt = '[Pause your roleplay. Summarize the most important facts and events in the story so far. If a summary already exists in your memory, use that as a base and expand with new facts. Limit the summary to {{words}} words or less. Your response should include nothing but the summary.]'; const defaultTemplate = '[Summary: {{summary}}]'; const defaultSettings = { memoryFrozen: false, SkipWIAN: false, source: summary_sources.extras, prompt: defaultPrompt, template: defaultTemplate, position: extension_prompt_types.IN_PROMPT, role: extension_prompt_roles.SYSTEM, scan: false, depth: 2, promptWords: 200, promptMinWords: 25, promptMaxWords: 1000, promptWordsStep: 25, promptInterval: 10, promptMinInterval: 0, promptMaxInterval: 250, promptIntervalStep: 1, promptForceWords: 0, promptForceWordsStep: 100, promptMinForceWords: 0, promptMaxForceWords: 10000, overrideResponseLength: 0, overrideResponseLengthMin: 0, overrideResponseLengthMax: 4096, overrideResponseLengthStep: 16, maxMessagesPerRequest: 0, maxMessagesPerRequestMin: 0, maxMessagesPerRequestMax: 250, maxMessagesPerRequestStep: 1, prompt_builder: prompt_builders.DEFAULT, }; function loadSettings() { if (Object.keys(extension_settings.memory).length === 0) { Object.assign(extension_settings.memory, defaultSettings); } for (const key of Object.keys(defaultSettings)) { if (extension_settings.memory[key] === undefined) { extension_settings.memory[key] = defaultSettings[key]; } } $('#summary_source').val(extension_settings.memory.source).trigger('change'); $('#memory_frozen').prop('checked', extension_settings.memory.memoryFrozen).trigger('input'); $('#memory_skipWIAN').prop('checked', extension_settings.memory.SkipWIAN).trigger('input'); $('#memory_prompt').val(extension_settings.memory.prompt).trigger('input'); $('#memory_prompt_words').val(extension_settings.memory.promptWords).trigger('input'); $('#memory_prompt_interval').val(extension_settings.memory.promptInterval).trigger('input'); $('#memory_template').val(extension_settings.memory.template).trigger('input'); $('#memory_depth').val(extension_settings.memory.depth).trigger('input'); $('#memory_role').val(extension_settings.memory.role).trigger('input'); $(`input[name="memory_position"][value="${extension_settings.memory.position}"]`).prop('checked', true).trigger('input'); $('#memory_prompt_words_force').val(extension_settings.memory.promptForceWords).trigger('input'); $(`input[name="memory_prompt_builder"][value="${extension_settings.memory.prompt_builder}"]`).prop('checked', true).trigger('input'); $('#memory_override_response_length').val(extension_settings.memory.overrideResponseLength).trigger('input'); $('#memory_max_messages_per_request').val(extension_settings.memory.maxMessagesPerRequest).trigger('input'); $('#memory_include_wi_scan').prop('checked', extension_settings.memory.scan).trigger('input'); switchSourceControls(extension_settings.memory.source); } async function onPromptForceWordsAutoClick() { const context = getContext(); const maxPromptLength = await getSourceContextSize(); const chat = context.chat; const allMessages = chat.filter(m => !m.is_system && m.mes).map(m => m.mes); const messagesWordCount = allMessages.map(m => extractAllWords(m)).flat().length; const averageMessageWordCount = messagesWordCount / allMessages.length; const tokensPerWord = await countSourceTokens(allMessages.join('\n')) / messagesWordCount; const wordsPerToken = 1 / tokensPerWord; const maxPromptLengthWords = Math.round(maxPromptLength * wordsPerToken); // How many words should pass so that messages will start be dropped out of context; const wordsPerPrompt = Math.floor(maxPromptLength / tokensPerWord); // How many words will be needed to fit the allowance buffer const summaryPromptWords = extractAllWords(extension_settings.memory.prompt).length; const promptAllowanceWords = maxPromptLengthWords - extension_settings.memory.promptWords - summaryPromptWords; const averageMessagesPerPrompt = Math.floor(promptAllowanceWords / averageMessageWordCount); const maxMessagesPerSummary = extension_settings.memory.maxMessagesPerRequest || 0; const targetMessagesInPrompt = maxMessagesPerSummary > 0 ? maxMessagesPerSummary : Math.max(0, averageMessagesPerPrompt); const targetSummaryWords = (targetMessagesInPrompt * averageMessageWordCount) + (promptAllowanceWords / 4); console.table({ maxPromptLength, maxPromptLengthWords, promptAllowanceWords, averageMessagesPerPrompt, targetMessagesInPrompt, targetSummaryWords, wordsPerPrompt, wordsPerToken, tokensPerWord, messagesWordCount, }); const ROUNDING = 100; extension_settings.memory.promptForceWords = Math.max(1, Math.floor(targetSummaryWords / ROUNDING) * ROUNDING); $('#memory_prompt_words_force').val(extension_settings.memory.promptForceWords).trigger('input'); } async function onPromptIntervalAutoClick() { const context = getContext(); const maxPromptLength = await getSourceContextSize(); const chat = context.chat; const allMessages = chat.filter(m => !m.is_system && m.mes).map(m => m.mes); const messagesWordCount = allMessages.map(m => extractAllWords(m)).flat().length; const messagesTokenCount = await countSourceTokens(allMessages.join('\n')); const tokensPerWord = messagesTokenCount / messagesWordCount; const averageMessageTokenCount = messagesTokenCount / allMessages.length; const targetSummaryTokens = Math.round(extension_settings.memory.promptWords * tokensPerWord); const promptTokens = await countSourceTokens(extension_settings.memory.prompt); const promptAllowance = maxPromptLength - promptTokens - targetSummaryTokens; const maxMessagesPerSummary = extension_settings.memory.maxMessagesPerRequest || 0; const averageMessagesPerPrompt = Math.floor(promptAllowance / averageMessageTokenCount); const targetMessagesInPrompt = maxMessagesPerSummary > 0 ? maxMessagesPerSummary : Math.max(0, averageMessagesPerPrompt); const adjustedAverageMessagesPerPrompt = targetMessagesInPrompt + (averageMessagesPerPrompt - targetMessagesInPrompt) / 4; console.table({ maxPromptLength, promptAllowance, targetSummaryTokens, promptTokens, messagesWordCount, messagesTokenCount, tokensPerWord, averageMessageTokenCount, averageMessagesPerPrompt, targetMessagesInPrompt, adjustedAverageMessagesPerPrompt, maxMessagesPerSummary, }); const ROUNDING = 5; extension_settings.memory.promptInterval = Math.max(1, Math.floor(adjustedAverageMessagesPerPrompt / ROUNDING) * ROUNDING); $('#memory_prompt_interval').val(extension_settings.memory.promptInterval).trigger('input'); } function onSummarySourceChange(event) { const value = event.target.value; extension_settings.memory.source = value; switchSourceControls(value); saveSettingsDebounced(); } function switchSourceControls(value) { $('#memory_settings [data-summary-source]').each((_, element) => { const source = element.dataset.summarySource.split(',').map(s => s.trim()); $(element).toggle(source.includes(value)); }); } function onMemoryFrozenInput() { const value = Boolean($(this).prop('checked')); extension_settings.memory.memoryFrozen = value; saveSettingsDebounced(); } function onMemorySkipWIANInput() { const value = Boolean($(this).prop('checked')); extension_settings.memory.SkipWIAN = value; saveSettingsDebounced(); } function onMemoryPromptWordsInput() { const value = $(this).val(); extension_settings.memory.promptWords = Number(value); $('#memory_prompt_words_value').text(extension_settings.memory.promptWords); saveSettingsDebounced(); } function onMemoryPromptIntervalInput() { const value = $(this).val(); extension_settings.memory.promptInterval = Number(value); $('#memory_prompt_interval_value').text(extension_settings.memory.promptInterval); saveSettingsDebounced(); } function onMemoryPromptRestoreClick() { $('#memory_prompt').val(defaultPrompt).trigger('input'); } function onMemoryPromptInput() { const value = $(this).val(); extension_settings.memory.prompt = value; saveSettingsDebounced(); } function onMemoryTemplateInput() { const value = $(this).val(); extension_settings.memory.template = value; reinsertMemory(); saveSettingsDebounced(); } function onMemoryDepthInput() { const value = $(this).val(); extension_settings.memory.depth = Number(value); reinsertMemory(); saveSettingsDebounced(); } function onMemoryRoleInput() { const value = $(this).val(); extension_settings.memory.role = Number(value); reinsertMemory(); saveSettingsDebounced(); } function onMemoryPositionChange(e) { const value = e.target.value; extension_settings.memory.position = value; reinsertMemory(); saveSettingsDebounced(); } function onMemoryIncludeWIScanInput() { const value = !!$(this).prop('checked'); extension_settings.memory.scan = value; reinsertMemory(); saveSettingsDebounced(); } function onMemoryPromptWordsForceInput() { const value = $(this).val(); extension_settings.memory.promptForceWords = Number(value); $('#memory_prompt_words_force_value').text(extension_settings.memory.promptForceWords); saveSettingsDebounced(); } function onOverrideResponseLengthInput() { const value = $(this).val(); extension_settings.memory.overrideResponseLength = Number(value); $('#memory_override_response_length_value').text(extension_settings.memory.overrideResponseLength); saveSettingsDebounced(); } function onMaxMessagesPerRequestInput() { const value = $(this).val(); extension_settings.memory.maxMessagesPerRequest = Number(value); $('#memory_max_messages_per_request_value').text(extension_settings.memory.maxMessagesPerRequest); saveSettingsDebounced(); } function saveLastValues() { const context = getContext(); lastGroupId = context.groupId; lastCharacterId = context.characterId; lastChatId = context.chatId; lastMessageId = context.chat?.length ?? null; lastMessageHash = getStringHash((context.chat.length && context.chat[context.chat.length - 1]['mes']) ?? ''); } function getLatestMemoryFromChat(chat) { if (!Array.isArray(chat) || !chat.length) { return ''; } const reversedChat = chat.slice().reverse(); reversedChat.shift(); for (let mes of reversedChat) { if (mes.extra && mes.extra.memory) { return mes.extra.memory; } } return ''; } function getIndexOfLatestChatSummary(chat) { if (!Array.isArray(chat) || !chat.length) { return -1; } const reversedChat = chat.slice().reverse(); reversedChat.shift(); for (let mes of reversedChat) { if (mes.extra && mes.extra.memory) { return chat.indexOf(mes); } } return -1; } async function onChatEvent() { // Module not enabled if (extension_settings.memory.source === summary_sources.extras && !modules.includes('summarize')) { return; } // WebLLM is not supported if (extension_settings.memory.source === summary_sources.webllm && !isWebLlmSupported()) { return; } const context = getContext(); const chat = context.chat; // no characters or group selected if (!context.groupId && context.characterId === undefined) { return; } // Streaming in-progress if (streamingProcessor && !streamingProcessor.isFinished) { return; } // Chat/character/group changed if ((context.groupId && lastGroupId !== context.groupId) || (context.characterId !== lastCharacterId) || (context.chatId !== lastChatId)) { const latestMemory = getLatestMemoryFromChat(chat); setMemoryContext(latestMemory, false); saveLastValues(); return; } // Currently summarizing or frozen state - skip if (inApiCall || extension_settings.memory.memoryFrozen) { return; } // No new messages - do nothing if (chat.length === 0 || (lastMessageId === chat.length && getStringHash(chat[chat.length - 1].mes) === lastMessageHash)) { return; } // Messages has been deleted - rewrite the context with the latest available memory if (chat.length < lastMessageId) { const latestMemory = getLatestMemoryFromChat(chat); setMemoryContext(latestMemory, false); } // Message has been edited / regenerated - delete the saved memory if (chat.length && chat[chat.length - 1].extra && chat[chat.length - 1].extra.memory && lastMessageId === chat.length && getStringHash(chat[chat.length - 1].mes) !== lastMessageHash) { delete chat[chat.length - 1].extra.memory; } summarizeChat(context) .catch(console.error) .finally(saveLastValues); } /** * Forces a summary generation for the current chat. * @param {boolean} quiet If an informational toast should be displayed * @returns {Promise} Summarized text */ async function forceSummarizeChat(quiet) { if (extension_settings.memory.source === summary_sources.extras) { toastr.warning('Force summarization is not supported for Extras API'); return; } const context = getContext(); const skipWIAN = extension_settings.memory.SkipWIAN; console.log(`Skipping WIAN? ${skipWIAN}`); if (!context.chatId) { toastr.warning('No chat selected'); return ''; } const toast = quiet ? jQuery() : toastr.info('Summarizing chat...', 'Please wait', { timeOut: 0, extendedTimeOut: 0 }); const value = extension_settings.memory.source === summary_sources.main ? await summarizeChatMain(context, true, skipWIAN) : await summarizeChatWebLLM(context, true); toastr.clear(toast); if (!value) { toastr.warning('Failed to summarize chat'); return ''; } return value; } /** * Callback for the summarize command. * @param {object} args Command arguments * @param {string} text Text to summarize */ async function summarizeCallback(args, text) { text = text.trim(); // Summarize the current chat if no text provided if (!text) { const quiet = isTrueBoolean(args.quiet); return await forceSummarizeChat(quiet); } const source = args.source || extension_settings.memory.source; const prompt = substituteParamsExtended((args.prompt || extension_settings.memory.prompt), { words: extension_settings.memory.promptWords }); try { switch (source) { case summary_sources.extras: return await callExtrasSummarizeAPI(text); case summary_sources.main: return await generateRaw(text, '', false, false, prompt, extension_settings.memory.overrideResponseLength); case summary_sources.webllm: { const messages = [{ role: 'system', content: prompt }, { role: 'user', content: text }].filter(m => m.content); const params = extension_settings.memory.overrideResponseLength > 0 ? { max_tokens: extension_settings.memory.overrideResponseLength } : {}; return await generateWebLlmChatPrompt(messages, params); } default: toastr.warning('Invalid summarization source specified'); return ''; } } catch (error) { toastr.error(String(error), 'Failed to summarize text'); console.log(error); return ''; } } async function summarizeChat(context) { const skipWIAN = extension_settings.memory.SkipWIAN; switch (extension_settings.memory.source) { case summary_sources.extras: await summarizeChatExtras(context); break; case summary_sources.main: await summarizeChatMain(context, false, skipWIAN); break; case summary_sources.webllm: await summarizeChatWebLLM(context, false); break; default: break; } } /** * Check if the chat should be summarized based on the current conditions. * Return summary prompt if it should be summarized. * @param {any} context ST context * @param {boolean} force Summarize the chat regardless of the conditions * @returns {Promise} Summary prompt or empty string */ async function getSummaryPromptForNow(context, force) { if (extension_settings.memory.promptInterval === 0 && !force) { console.debug('Prompt interval is set to 0, skipping summarization'); return ''; } try { // Wait for group to finish generating if (selected_group) { await waitUntilCondition(() => is_group_generating === false, 1000, 10); } // Wait for the send button to be released await waitUntilCondition(() => is_send_press === false, 30000, 100); } catch { console.debug('Timeout waiting for is_send_press'); return ''; } if (!context.chat.length) { console.debug('No messages in chat to summarize'); return ''; } if (context.chat.length < extension_settings.memory.promptInterval && !force) { console.debug(`Not enough messages in chat to summarize (chat: ${context.chat.length}, interval: ${extension_settings.memory.promptInterval})`); return ''; } let messagesSinceLastSummary = 0; let wordsSinceLastSummary = 0; let conditionSatisfied = false; for (let i = context.chat.length - 1; i >= 0; i--) { if (context.chat[i].extra && context.chat[i].extra.memory) { break; } messagesSinceLastSummary++; wordsSinceLastSummary += extractAllWords(context.chat[i].mes).length; } if (messagesSinceLastSummary >= extension_settings.memory.promptInterval) { conditionSatisfied = true; } if (extension_settings.memory.promptForceWords && wordsSinceLastSummary >= extension_settings.memory.promptForceWords) { conditionSatisfied = true; } if (!conditionSatisfied && !force) { console.debug(`Summary conditions not satisfied (messages: ${messagesSinceLastSummary}, interval: ${extension_settings.memory.promptInterval}, words: ${wordsSinceLastSummary}, force words: ${extension_settings.memory.promptForceWords})`); return ''; } console.log('Summarizing chat, messages since last summary: ' + messagesSinceLastSummary, 'words since last summary: ' + wordsSinceLastSummary); const prompt = substituteParamsExtended(extension_settings.memory.prompt, { words: extension_settings.memory.promptWords }); if (!prompt) { console.debug('Summarization prompt is empty. Skipping summarization.'); return ''; } return prompt; } async function summarizeChatWebLLM(context, force) { if (!isWebLlmSupported()) { return; } const prompt = await getSummaryPromptForNow(context, force); if (!prompt) { return; } const { rawPrompt, lastUsedIndex } = await getRawSummaryPrompt(context, prompt); if (lastUsedIndex === null || lastUsedIndex === -1) { if (force) { toastr.info('To try again, remove the latest summary.', 'No messages found to summarize'); } return null; } const messages = [ { role: 'system', content: prompt }, { role: 'user', content: rawPrompt }, ]; const params = {}; if (extension_settings.memory.overrideResponseLength > 0) { params.max_tokens = extension_settings.memory.overrideResponseLength; } try { inApiCall = true; const summary = await generateWebLlmChatPrompt(messages, params); const newContext = getContext(); if (!summary) { console.warn('Empty summary received'); return; } // something changed during summarization request if (newContext.groupId !== context.groupId || newContext.chatId !== context.chatId || (!newContext.groupId && (newContext.characterId !== context.characterId))) { console.log('Context changed, summary discarded'); return; } setMemoryContext(summary, true, lastUsedIndex); return summary; } finally { inApiCall = false; } } async function summarizeChatMain(context, force, skipWIAN) { const prompt = await getSummaryPromptForNow(context, force); if (!prompt) { return; } console.log('sending summary prompt'); let summary = ''; let index = null; if (prompt_builders.DEFAULT === extension_settings.memory.prompt_builder) { try { inApiCall = true; summary = await generateQuietPrompt(prompt, false, skipWIAN, '', '', extension_settings.memory.overrideResponseLength); } finally { inApiCall = false; } } if ([prompt_builders.RAW_BLOCKING, prompt_builders.RAW_NON_BLOCKING].includes(extension_settings.memory.prompt_builder)) { const lock = extension_settings.memory.prompt_builder === prompt_builders.RAW_BLOCKING; try { inApiCall = true; if (lock) { deactivateSendButtons(); } const { rawPrompt, lastUsedIndex } = await getRawSummaryPrompt(context, prompt); if (lastUsedIndex === null || lastUsedIndex === -1) { if (force) { toastr.info('To try again, remove the latest summary.', 'No messages found to summarize'); } return null; } summary = await generateRaw(rawPrompt, '', false, false, prompt, extension_settings.memory.overrideResponseLength); index = lastUsedIndex; } finally { inApiCall = false; if (lock) { activateSendButtons(); } } } if (!summary) { console.warn('Empty summary received'); return; } const newContext = getContext(); // something changed during summarization request if (newContext.groupId !== context.groupId || newContext.chatId !== context.chatId || (!newContext.groupId && (newContext.characterId !== context.characterId))) { console.log('Context changed, summary discarded'); return; } setMemoryContext(summary, true, index); return summary; } /** * Get the raw summarization prompt from the chat context. * @param {object} context ST context * @param {string} prompt Summarization system prompt * @returns {Promise<{rawPrompt: string, lastUsedIndex: number}>} Raw summarization prompt */ async function getRawSummaryPrompt(context, prompt) { /** * Get the memory string from the chat buffer. * @param {boolean} includeSystem Include prompt into the memory string * @returns {string} Memory string */ function getMemoryString(includeSystem) { const delimiter = '\n\n'; const stringBuilder = []; const bufferString = chatBuffer.slice().join(delimiter); if (includeSystem) { stringBuilder.push(prompt); } if (latestSummary) { stringBuilder.push(latestSummary); } stringBuilder.push(bufferString); return stringBuilder.join(delimiter).trim(); } const chat = context.chat.slice(); const latestSummary = getLatestMemoryFromChat(chat); const latestSummaryIndex = getIndexOfLatestChatSummary(chat); chat.pop(); // We always exclude the last message from the buffer const chatBuffer = []; const PADDING = 64; const PROMPT_SIZE = await getSourceContextSize(); let latestUsedMessage = null; for (let index = latestSummaryIndex + 1; index < chat.length; index++) { const message = chat[index]; if (!message) { break; } if (message.is_system || !message.mes) { continue; } const entry = `${message.name}:\n${message.mes}`; chatBuffer.push(entry); const tokens = await countSourceTokens(getMemoryString(true), PADDING); if (tokens > PROMPT_SIZE) { chatBuffer.pop(); break; } latestUsedMessage = message; if (extension_settings.memory.maxMessagesPerRequest > 0 && chatBuffer.length >= extension_settings.memory.maxMessagesPerRequest) { break; } } const lastUsedIndex = context.chat.indexOf(latestUsedMessage); const rawPrompt = getMemoryString(false); return { rawPrompt, lastUsedIndex }; } async function summarizeChatExtras(context) { function getMemoryString() { return (longMemory + '\n\n' + memoryBuffer.slice().reverse().join('\n\n')).trim(); } const chat = context.chat; const longMemory = getLatestMemoryFromChat(chat); const reversedChat = chat.slice().reverse(); reversedChat.shift(); const memoryBuffer = []; const CONTEXT_SIZE = await getSourceContextSize(); for (const message of reversedChat) { // we reached the point of latest memory if (longMemory && message.extra && message.extra.memory == longMemory) { break; } // don't care about system if (message.is_system) { continue; } // determine the sender's name const entry = `${message.name}:\n${message.mes}`; memoryBuffer.push(entry); // check if token limit was reached const tokens = await countSourceTokens(getMemoryString()); if (tokens >= CONTEXT_SIZE) { break; } } const resultingString = getMemoryString(); const resultingTokens = await countSourceTokens(resultingString); if (!resultingString || resultingTokens < CONTEXT_SIZE) { console.debug('Not enough context to summarize'); return; } // perform the summarization API call try { inApiCall = true; const summary = await callExtrasSummarizeAPI(resultingString); const newContext = getContext(); if (!summary) { console.warn('Empty summary received'); return; } // something changed during summarization request if (newContext.groupId !== context.groupId || newContext.chatId !== context.chatId || (!newContext.groupId && (newContext.characterId !== context.characterId))) { console.log('Context changed, summary discarded'); return; } setMemoryContext(summary, true); } catch (error) { console.log(error); } finally { inApiCall = false; } } /** * Call the Extras API to summarize the provided text. * @param {string} text Text to summarize * @returns {Promise} Summarized text */ async function callExtrasSummarizeAPI(text) { if (!modules.includes('summarize')) { throw new Error('Summarize module is not enabled in Extras API'); } const url = new URL(getApiUrl()); url.pathname = '/api/summarize'; const apiResult = await doExtrasFetch(url, { method: 'POST', headers: { 'Content-Type': 'application/json', 'Bypass-Tunnel-Reminder': 'bypass', }, body: JSON.stringify({ text: text, params: {}, }), }); if (apiResult.ok) { const data = await apiResult.json(); const summary = data.summary; return summary; } throw new Error('Extras API call failed'); } function onMemoryRestoreClick() { const context = getContext(); const content = $('#memory_contents').val(); const reversedChat = context.chat.slice().reverse(); reversedChat.shift(); for (let mes of reversedChat) { if (mes.extra && mes.extra.memory == content) { delete mes.extra.memory; break; } } const newContent = getLatestMemoryFromChat(context.chat); setMemoryContext(newContent, false); } function onMemoryContentInput() { const value = $(this).val(); setMemoryContext(value, true); } function onMemoryPromptBuilderInput(e) { const value = Number(e.target.value); extension_settings.memory.prompt_builder = value; saveSettingsDebounced(); } function reinsertMemory() { const existingValue = String($('#memory_contents').val()); setMemoryContext(existingValue, false); } /** * Set the summary value to the context and save it to the chat message extra. * @param {string} value Value of a summary * @param {boolean} saveToMessage Should the summary be saved to the chat message extra * @param {number|null} index Index of the chat message to save the summary to. If null, the pre-last message is used. */ function setMemoryContext(value, saveToMessage, index = null) { setExtensionPrompt(MODULE_NAME, formatMemoryValue(value), extension_settings.memory.position, extension_settings.memory.depth, extension_settings.memory.scan, extension_settings.memory.role); $('#memory_contents').val(value); const summaryLog = value ? `Summary set to: ${value}. Position: ${extension_settings.memory.position}. Depth: ${extension_settings.memory.depth}. Role: ${extension_settings.memory.role}` : 'Summary has no content'; console.debug(summaryLog); const context = getContext(); if (saveToMessage && context.chat.length) { const idx = index ?? context.chat.length - 2; const mes = context.chat[idx < 0 ? 0 : idx]; if (!mes.extra) { mes.extra = {}; } mes.extra.memory = value; saveChatDebounced(); } } function doPopout(e) { const target = e.target; //repurposes the zoomed avatar template to server as a floating div if ($('#summaryExtensionPopout').length === 0) { console.debug('did not see popout yet, creating'); const originalHTMLClone = $(target).parent().parent().parent().find('.inline-drawer-content').html(); const originalElement = $(target).parent().parent().parent().find('.inline-drawer-content'); const template = $('#zoomed_avatar_template').html(); const controlBarHtml = `
`; const newElement = $(template); newElement.attr('id', 'summaryExtensionPopout') .removeClass('zoomed_avatar') .addClass('draggable') .empty(); const prevSummaryBoxContents = $('#memory_contents').val(); //copy summary box before emptying originalElement.empty(); originalElement.html('
Currently popped out
'); newElement.append(controlBarHtml).append(originalHTMLClone); $('body').append(newElement); $('#summaryExtensionDrawerContents').addClass('scrollableInnerFull'); setMemoryContext(prevSummaryBoxContents, false); //paste prev summary box contents into popout box setupListeners(); loadSettings(); loadMovingUIState(); $('#summaryExtensionPopout').fadeIn(animation_duration); dragElement(newElement); //setup listener for close button to restore extensions menu $('#summaryExtensionPopoutClose').off('click').on('click', function () { $('#summaryExtensionDrawerContents').removeClass('scrollableInnerFull'); const summaryPopoutHTML = $('#summaryExtensionDrawerContents'); $('#summaryExtensionPopout').fadeOut(animation_duration, () => { originalElement.empty(); originalElement.html(summaryPopoutHTML); $('#summaryExtensionPopout').remove(); }); loadSettings(); }); } else { console.debug('saw existing popout, removing'); $('#summaryExtensionPopout').fadeOut(animation_duration, () => { $('#summaryExtensionPopoutClose').trigger('click'); }); } } function setupListeners() { //setup shared listeners for popout and regular ext menu $('#memory_restore').off('click').on('click', onMemoryRestoreClick); $('#memory_contents').off('click').on('input', onMemoryContentInput); $('#memory_frozen').off('click').on('input', onMemoryFrozenInput); $('#memory_skipWIAN').off('click').on('input', onMemorySkipWIANInput); $('#summary_source').off('click').on('change', onSummarySourceChange); $('#memory_prompt_words').off('click').on('input', onMemoryPromptWordsInput); $('#memory_prompt_interval').off('click').on('input', onMemoryPromptIntervalInput); $('#memory_prompt').off('click').on('input', onMemoryPromptInput); $('#memory_force_summarize').off('click').on('click', () => forceSummarizeChat(false)); $('#memory_template').off('click').on('input', onMemoryTemplateInput); $('#memory_depth').off('click').on('input', onMemoryDepthInput); $('#memory_role').off('click').on('input', onMemoryRoleInput); $('input[name="memory_position"]').off('click').on('change', onMemoryPositionChange); $('#memory_prompt_words_force').off('click').on('input', onMemoryPromptWordsForceInput); $('#memory_prompt_builder_default').off('click').on('input', onMemoryPromptBuilderInput); $('#memory_prompt_builder_raw_blocking').off('click').on('input', onMemoryPromptBuilderInput); $('#memory_prompt_builder_raw_non_blocking').off('click').on('input', onMemoryPromptBuilderInput); $('#memory_prompt_restore').off('click').on('click', onMemoryPromptRestoreClick); $('#memory_prompt_interval_auto').off('click').on('click', onPromptIntervalAutoClick); $('#memory_prompt_words_auto').off('click').on('click', onPromptForceWordsAutoClick); $('#memory_override_response_length').off('click').on('input', onOverrideResponseLengthInput); $('#memory_max_messages_per_request').off('click').on('input', onMaxMessagesPerRequestInput); $('#memory_include_wi_scan').off('input').on('input', onMemoryIncludeWIScanInput); $('#summarySettingsBlockToggle').off('click').on('click', function () { console.log('saw settings button click'); $('#summarySettingsBlock').slideToggle(200, 'swing'); //toggleClass("hidden"); }); } jQuery(async function () { async function addExtensionControls() { const settingsHtml = await renderExtensionTemplateAsync('memory', 'settings', { defaultSettings }); $('#summarize_container').append(settingsHtml); setupListeners(); $('#summaryExtensionPopoutButton').off('click').on('click', function (e) { doPopout(e); e.stopPropagation(); }); } await addExtensionControls(); loadSettings(); eventSource.makeLast(event_types.CHARACTER_MESSAGE_RENDERED, onChatEvent); eventSource.on(event_types.MESSAGE_DELETED, onChatEvent); eventSource.on(event_types.MESSAGE_EDITED, onChatEvent); eventSource.on(event_types.MESSAGE_SWIPED, onChatEvent); eventSource.on(event_types.CHAT_CHANGED, onChatEvent); SlashCommandParser.addCommandObject(SlashCommand.fromProps({ name: 'summarize', callback: summarizeCallback, namedArgumentList: [ new SlashCommandNamedArgument('source', 'API to use for summarization', [ARGUMENT_TYPE.STRING], false, false, '', Object.values(summary_sources)), SlashCommandNamedArgument.fromProps({ name: 'prompt', description: 'prompt to use for summarization', typeList: [ARGUMENT_TYPE.STRING], defaultValue: '', }), SlashCommandNamedArgument.fromProps({ name: 'quiet', description: 'suppress the toast message when summarizing the chat', typeList: [ARGUMENT_TYPE.BOOLEAN], defaultValue: 'false', enumList: commonEnumProviders.boolean('trueFalse')(), }), ], unnamedArgumentList: [ new SlashCommandArgument('text to summarize', [ARGUMENT_TYPE.STRING], false, false, ''), ], helpString: 'Summarizes the given text. If no text is provided, the current chat will be summarized. Can specify the source and the prompt to use.', returns: ARGUMENT_TYPE.STRING, })); MacrosParser.registerMacro('summary', () => getLatestMemoryFromChat(getContext().chat)); });