Merge branch 'staging' into pick-macro
@@ -350,6 +350,7 @@ function RA_autoconnect(PrevApi) {
                 || (secret_state[SECRET_KEYS.AI21] && oai_settings.chat_completion_source == chat_completion_sources.AI21)
                 || (secret_state[SECRET_KEYS.MAKERSUITE] && oai_settings.chat_completion_source == chat_completion_sources.MAKERSUITE)
                 || (secret_state[SECRET_KEYS.MISTRALAI] && oai_settings.chat_completion_source == chat_completion_sources.MISTRALAI)
+                || (secret_state[SECRET_KEYS.COHERE] && oai_settings.chat_completion_source == chat_completion_sources.COHERE)
                 || (isValidUrl(oai_settings.custom_url) && oai_settings.chat_completion_source == chat_completion_sources.CUSTOM)
             ) {
                 $('#api_button_openai').trigger('click');

@@ -122,6 +122,44 @@ function loadSettings() {
     switchSourceControls(extension_settings.memory.source);
 }
 
+async function onPromptForceWordsAutoClick() {
+    const context = getContext();
+    const maxPromptLength = getMaxContextSize(extension_settings.memory.overrideResponseLength);
+    const chat = context.chat;
+    const allMessages = chat.filter(m => !m.is_system && m.mes).map(m => m.mes);
+    const messagesWordCount = allMessages.map(m => extractAllWords(m)).flat().length;
+    const averageMessageWordCount = messagesWordCount / allMessages.length;
+    const tokensPerWord = getTokenCount(allMessages.join('\n')) / messagesWordCount;
+    const wordsPerToken = 1 / tokensPerWord;
+    const maxPromptLengthWords = Math.round(maxPromptLength * wordsPerToken);
+    // How many words should pass so that messages will start to be dropped out of context;
+    const wordsPerPrompt = Math.floor(maxPromptLength / tokensPerWord);
+    // How many words will be needed to fit the allowance buffer
+    const summaryPromptWords = extractAllWords(extension_settings.memory.prompt).length;
+    const promptAllowanceWords = maxPromptLengthWords - extension_settings.memory.promptWords - summaryPromptWords;
+    const averageMessagesPerPrompt = Math.floor(promptAllowanceWords / averageMessageWordCount);
+    const maxMessagesPerSummary = extension_settings.memory.maxMessagesPerRequest || 0;
+    const targetMessagesInPrompt = maxMessagesPerSummary > 0 ? maxMessagesPerSummary : Math.max(0, averageMessagesPerPrompt);
+    const targetSummaryWords = (targetMessagesInPrompt * averageMessageWordCount) + (promptAllowanceWords / 4);
+
+    console.table({
+        maxPromptLength,
+        maxPromptLengthWords,
+        promptAllowanceWords,
+        averageMessagesPerPrompt,
+        targetMessagesInPrompt,
+        targetSummaryWords,
+        wordsPerPrompt,
+        wordsPerToken,
+        tokensPerWord,
+        messagesWordCount,
+    });
+
+    const ROUNDING = 100;
+    extension_settings.memory.promptForceWords = Math.max(1, Math.floor(targetSummaryWords / ROUNDING) * ROUNDING);
+    $('#memory_prompt_words_force').val(extension_settings.memory.promptForceWords).trigger('input');
+}
+
 async function onPromptIntervalAutoClick() {
     const context = getContext();
     const maxPromptLength = getMaxContextSize(extension_settings.memory.overrideResponseLength);

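For intuition: the function above is a chain of unit conversions, estimating tokens-per-word from the whole chat and then turning the token budget into a word budget. A rough standalone sketch with made-up numbers (not part of the diff):

    // Hypothetical chat: 60,000 words tokenizing to 80,000 tokens,
    // with a 4,096-token context window.
    const messagesWordCount = 60000;
    const tokenCount = 80000;
    const maxPromptLength = 4096;

    const tokensPerWord = tokenCount / messagesWordCount;                     // ~1.33
    const wordsPerToken = 1 / tokensPerWord;                                  // ~0.75
    const maxPromptLengthWords = Math.round(maxPromptLength * wordsPerToken); // ~3072
    console.log({ tokensPerWord, wordsPerToken, maxPromptLengthWords });
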
@@ -136,8 +174,8 @@ async function onPromptIntervalAutoClick() {
     const promptAllowance = maxPromptLength - promptTokens - targetSummaryTokens;
     const maxMessagesPerSummary = extension_settings.memory.maxMessagesPerRequest || 0;
     const averageMessagesPerPrompt = Math.floor(promptAllowance / averageMessageTokenCount);
-    const targetMessagesInPrompt = maxMessagesPerSummary > 0 ? maxMessagesPerSummary : Math.max(0, averageMessagesPerPrompt);
-    const adjustedAverageMessagesPerPrompt = targetMessagesInPrompt + (averageMessagesPerPrompt - targetMessagesInPrompt) / 4;
+    const unfitMessages = maxMessagesPerSummary > 0 ? averageMessagesPerPrompt - maxMessagesPerSummary : 0;
+    const adjustedAverageMessagesPerPrompt = Math.max(1, averageMessagesPerPrompt - (unfitMessages > 0 ? Math.ceil(unfitMessages / 2) : 0));
 
     console.table({
         maxPromptLength,

@@ -149,9 +187,9 @@ async function onPromptIntervalAutoClick() {
         tokensPerWord,
         averageMessageTokenCount,
         averageMessagesPerPrompt,
-        targetMessagesInPrompt,
         adjustedAverageMessagesPerPrompt,
+        maxMessagesPerSummary,
+        unfitMessages,
     });
 
     const ROUNDING = 5;

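Plugging concrete numbers into the new unfitMessages adjustment makes the halving step visible (values hypothetical):

    // If the allowance fits 20 messages on average but a summary request
    // is capped at 10, then 10 messages are 'unfit' and the estimate is
    // pulled down by half of them: 20 - ceil(10 / 2) = 15.
    const averageMessagesPerPrompt = 20;
    const maxMessagesPerSummary = 10;
    const unfitMessages = maxMessagesPerSummary > 0 ? averageMessagesPerPrompt - maxMessagesPerSummary : 0;
    const adjustedAverageMessagesPerPrompt = Math.max(1, averageMessagesPerPrompt - (unfitMessages > 0 ? Math.ceil(unfitMessages / 2) : 0));
    console.log(adjustedAverageMessagesPerPrompt); // 15
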
@@ -800,6 +838,7 @@ function setupListeners() {
     $('#memory_prompt_builder_raw_non_blocking').off('click').on('input', onMemoryPromptBuilderInput);
     $('#memory_prompt_restore').off('click').on('click', onMemoryPromptRestoreClick);
     $('#memory_prompt_interval_auto').off('click').on('click', onPromptIntervalAutoClick);
+    $('#memory_prompt_words_auto').off('click').on('click', onPromptForceWordsAutoClick);
     $('#memory_override_response_length').off('click').on('input', onOverrideResponseLengthInput);
     $('#memory_max_messages_per_request').off('click').on('input', onMaxMessagesPerRequestInput);
     $('#summarySettingsBlockToggle').off('click').on('click', function () {

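The .off(...).on(...) chains above are the usual jQuery idiom for idempotent listener setup: if setupListeners() runs more than once, stale handlers are removed before new ones are attached, so a control never fires twice per event. The .off('click').on('input', ...) pairs unbind one event type and bind another.
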
@@ -17,7 +17,9 @@
         <div class="flex-container justifyspacebetween alignitemscenter">
             <span class="flex1">Current summary:</span>
-            <div id="memory_restore" class="menu_button flex1 margin0"><span>Restore Previous</span></div>
+            <div id="memory_restore" class="menu_button flex1 margin0">
+                <span>Restore Previous</span>
+            </div>
         </div>
 
         <textarea id="memory_contents" class="text_pole textarea_compact" rows="6" placeholder="Summary will be generated here..."></textarea>

@@ -27,7 +29,10 @@
                 <span>Summarize now</span>
             </div>
             <label for="memory_frozen" title="Disable automatic summary updates. While paused, the summary remains as-is. You can still force an update by pressing the Summarize now button (which is only available with the Main API)." data-i18n="[title]Disable automatic summary updates. While paused, the summary remains as-is. You can still force an update by pressing the Summarize now button (which is only available with the Main API)."><input id="memory_frozen" type="checkbox" />Pause</label>
-            <label for="memory_skipWIAN" title="Omit World Info and Author's Note from text to be summarized. Only has an effect when using the Main API. The Extras API always omits WI/AN." data-i18n="[title]Omit World Info and Author's Note from text to be summarized. Only has an effect when using the Main API. The Extras API always omits WI/AN."><input id="memory_skipWIAN" type="checkbox" />No WI/AN</label>
+            <label data-summary-source="main" for="memory_skipWIAN" title="Omit World Info and Author's Note from text to be summarized. Only has an effect when using the Main API. The Extras API always omits WI/AN." data-i18n="[title]Omit World Info and Author's Note from text to be summarized. Only has an effect when using the Main API. The Extras API always omits WI/AN.">
+                <input id="memory_skipWIAN" type="checkbox" />
+                <span>No WI/AN</span>
+            </label>
         </div>
         <div class="memory_contents_controls">
             <div id="summarySettingsBlockToggle" class="menu_button menu_button_icon" title="Edit summarization prompt, insertion position, etc.">

@@ -86,9 +91,14 @@
                 </div>
             </label>
             <input id="memory_prompt_interval" type="range" value="{{defaultSettings.promptInterval}}" min="{{defaultSettings.promptMinInterval}}" max="{{defaultSettings.promptMaxInterval}}" step="{{defaultSettings.promptIntervalStep}}" />
-            <label for="memory_prompt_words_force">
-                Update every <span id="memory_prompt_words_force_value"></span> words
-                <small class="memory_disabled_hint">0 = disable</small>
+            <label for="memory_prompt_words_force" class="title_restorable">
+                <span>
+                    Update every <span id="memory_prompt_words_force_value"></span> words
+                    <small class="memory_disabled_hint">0 = disable</small>
+                </span>
+                <div id="memory_prompt_words_auto" title="Try to automatically adjust the interval based on the chat metrics." class="right_menu_button">
+                    <div class="fa-solid fa-wand-magic-sparkles"></div>
+                </div>
             </label>
             <input id="memory_prompt_words_force" type="range" value="{{defaultSettings.promptForceWords}}" min="{{defaultSettings.promptMinForceWords}}" max="{{defaultSettings.promptMaxForceWords}}" step="{{defaultSettings.promptForceWordsStep}}" />
             <small>If both sliders are non-zero, then both will trigger summary updates at their respective intervals.</small>

@@ -171,6 +171,7 @@ export const chat_completion_sources = {
     MAKERSUITE: 'makersuite',
     MISTRALAI: 'mistralai',
     CUSTOM: 'custom',
+    COHERE: 'cohere',
 };
 
 const character_names_behavior = {

@@ -230,6 +231,7 @@ const default_settings = {
     google_model: 'gemini-pro',
     ai21_model: 'j2-ultra',
     mistralai_model: 'mistral-medium-latest',
+    cohere_model: 'command-r',
     custom_model: '',
     custom_url: '',
     custom_include_body: '',

@@ -298,6 +300,7 @@ const oai_settings = {
     google_model: 'gemini-pro',
     ai21_model: 'j2-ultra',
     mistralai_model: 'mistral-medium-latest',
+    cohere_model: 'command-r',
     custom_model: '',
     custom_url: '',
     custom_include_body: '',

@@ -1384,6 +1387,8 @@ function getChatCompletionModel() {
             return oai_settings.mistralai_model;
         case chat_completion_sources.CUSTOM:
             return oai_settings.custom_model;
+        case chat_completion_sources.COHERE:
+            return oai_settings.cohere_model;
         default:
             throw new Error(`Unknown chat completion source: ${oai_settings.chat_completion_source}`);
     }

@@ -1603,6 +1608,7 @@ async function sendOpenAIRequest(type, messages, signal) {
     const isOAI = oai_settings.chat_completion_source == chat_completion_sources.OPENAI;
     const isMistral = oai_settings.chat_completion_source == chat_completion_sources.MISTRALAI;
     const isCustom = oai_settings.chat_completion_source == chat_completion_sources.CUSTOM;
+    const isCohere = oai_settings.chat_completion_source == chat_completion_sources.COHERE;
     const isTextCompletion = (isOAI && textCompletionModels.includes(oai_settings.openai_model)) || (isOpenRouter && oai_settings.openrouter_force_instruct && power_user.instruct.enabled);
     const isQuiet = type === 'quiet';
     const isImpersonate = type === 'impersonate';

@@ -1737,7 +1743,17 @@ async function sendOpenAIRequest(type, messages, signal) {
         generate_data['custom_include_headers'] = oai_settings.custom_include_headers;
     }
 
-    if ((isOAI || isOpenRouter || isMistral || isCustom) && oai_settings.seed >= 0) {
+    if (isCohere) {
+        // Clamp to 0.01 -> 0.99
+        generate_data['top_p'] = Math.min(Math.max(Number(oai_settings.top_p_openai), 0.01), 0.99);
+        generate_data['top_k'] = Number(oai_settings.top_k_openai);
+        // Clamp to 0 -> 1
+        generate_data['frequency_penalty'] = Math.min(Math.max(Number(oai_settings.freq_pen_openai), 0), 1);
+        generate_data['presence_penalty'] = Math.min(Math.max(Number(oai_settings.pres_pen_openai), 0), 1);
+        generate_data['stop'] = getCustomStoppingStrings(5);
+    }
+
+    if ((isOAI || isOpenRouter || isMistral || isCustom || isCohere) && oai_settings.seed >= 0) {
         generate_data['seed'] = oai_settings.seed;
     }

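The repeated Math.min(Math.max(...)) sandwiches are plain range clamps to the bounds noted in the comments; a generic helper (hypothetical, not part of the diff) makes the intent explicit:

    // clamp(x, lo, hi) pins x into the closed interval [lo, hi].
    const clamp = (x, lo, hi) => Math.min(Math.max(Number(x), lo), hi);
    console.log(clamp(1.7, 0.01, 0.99)); // 0.99, as for top_p above
    console.log(clamp(-2, 0, 1));        // 0, as for the penalties above
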
@@ -2597,6 +2613,7 @@ function loadOpenAISettings(data, settings) {
     oai_settings.openrouter_force_instruct = settings.openrouter_force_instruct ?? default_settings.openrouter_force_instruct;
     oai_settings.ai21_model = settings.ai21_model ?? default_settings.ai21_model;
     oai_settings.mistralai_model = settings.mistralai_model ?? default_settings.mistralai_model;
+    oai_settings.cohere_model = settings.cohere_model ?? default_settings.cohere_model;
     oai_settings.custom_model = settings.custom_model ?? default_settings.custom_model;
     oai_settings.custom_url = settings.custom_url ?? default_settings.custom_url;
     oai_settings.custom_include_body = settings.custom_include_body ?? default_settings.custom_include_body;

@@ -2657,6 +2674,8 @@ function loadOpenAISettings(data, settings) {
     $(`#model_ai21_select option[value="${oai_settings.ai21_model}"`).attr('selected', true);
     $('#model_mistralai_select').val(oai_settings.mistralai_model);
     $(`#model_mistralai_select option[value="${oai_settings.mistralai_model}"`).attr('selected', true);
+    $('#model_cohere_select').val(oai_settings.cohere_model);
+    $(`#model_cohere_select option[value="${oai_settings.cohere_model}"`).attr('selected', true);
     $('#custom_model_id').val(oai_settings.custom_model);
     $('#custom_api_url_text').val(oai_settings.custom_url);
     $('#openai_max_context').val(oai_settings.openai_max_context);

@@ -2893,6 +2912,7 @@ async function saveOpenAIPreset(name, settings, triggerUi = true) {
     openrouter_sort_models: settings.openrouter_sort_models,
     ai21_model: settings.ai21_model,
     mistralai_model: settings.mistralai_model,
+    cohere_model: settings.cohere_model,
     custom_model: settings.custom_model,
     custom_url: settings.custom_url,
     custom_include_body: settings.custom_include_body,

@@ -3281,6 +3301,7 @@ function onSettingsPresetChange() {
     openrouter_sort_models: ['#openrouter_sort_models', 'openrouter_sort_models', false],
     ai21_model: ['#model_ai21_select', 'ai21_model', false],
     mistralai_model: ['#model_mistralai_select', 'mistralai_model', false],
+    cohere_model: ['#model_cohere_select', 'cohere_model', false],
     custom_model: ['#custom_model_id', 'custom_model', false],
     custom_url: ['#custom_api_url_text', 'custom_url', false],
     custom_include_body: ['#custom_include_body', 'custom_include_body', false],

@@ -3496,6 +3517,11 @@ async function onModelChange() {
         $('#model_mistralai_select').val(oai_settings.mistralai_model);
     }
 
+    if ($(this).is('#model_cohere_select')) {
+        console.log('Cohere model changed to', value);
+        oai_settings.cohere_model = value;
+    }
+
     if (value && $(this).is('#model_custom_select')) {
         console.log('Custom model changed to', value);
         oai_settings.custom_model = value;

@@ -3619,6 +3645,26 @@ async function onModelChange() {
         $('#temp_openai').attr('max', claude_max_temp).val(oai_settings.temp_openai).trigger('input');
     }
 
+    if (oai_settings.chat_completion_source === chat_completion_sources.COHERE) {
+        if (oai_settings.max_context_unlocked) {
+            $('#openai_max_context').attr('max', unlocked_max);
+        }
+        else if (['command-light', 'command'].includes(oai_settings.cohere_model)) {
+            $('#openai_max_context').attr('max', max_4k);
+        }
+        else if (['command-light-nightly', 'command-nightly'].includes(oai_settings.cohere_model)) {
+            $('#openai_max_context').attr('max', max_8k);
+        }
+        else if (['command-r'].includes(oai_settings.cohere_model)) {
+            $('#openai_max_context').attr('max', max_128k);
+        }
+        else {
+            $('#openai_max_context').attr('max', max_4k);
+        }
+        oai_settings.openai_max_context = Math.min(Number($('#openai_max_context').attr('max')), oai_settings.openai_max_context);
+        $('#openai_max_context').val(oai_settings.openai_max_context).trigger('input');
+    }
+
     if (oai_settings.chat_completion_source == chat_completion_sources.AI21) {
         if (oai_settings.max_context_unlocked) {
             $('#openai_max_context').attr('max', unlocked_max);

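The else-if ladder amounts to a lookup from Cohere model family to maximum context size; an equivalent map-based sketch (assuming the max_4k / max_8k / max_128k constants defined elsewhere in the file):

    // Sketch only; behavior mirrors the ladder above, including the max_4k fallback.
    function cohereMaxContext(model, { max_4k, max_8k, max_128k }) {
        const known = {
            'command-light': max_4k,
            'command': max_4k,
            'command-light-nightly': max_8k,
            'command-nightly': max_8k,
            'command-r': max_128k,
        };
        return known[model] ?? max_4k;
    }
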
@@ -3812,6 +3858,19 @@ async function onConnectButtonClick(e) {
         }
     }
 
+    if (oai_settings.chat_completion_source == chat_completion_sources.COHERE) {
+        const api_key_cohere = String($('#api_key_cohere').val()).trim();
+
+        if (api_key_cohere.length) {
+            await writeSecret(SECRET_KEYS.COHERE, api_key_cohere);
+        }
+
+        if (!secret_state[SECRET_KEYS.COHERE]) {
+            console.log('No secret key saved for Cohere');
+            return;
+        }
+    }
+
     startStatusLoading();
     saveSettingsDebounced();
     await getStatusOpen();

@@ -3847,6 +3906,9 @@ function toggleChatCompletionForms() {
     else if (oai_settings.chat_completion_source == chat_completion_sources.MISTRALAI) {
         $('#model_mistralai_select').trigger('change');
     }
+    else if (oai_settings.chat_completion_source == chat_completion_sources.COHERE) {
+        $('#model_cohere_select').trigger('change');
+    }
     else if (oai_settings.chat_completion_source == chat_completion_sources.CUSTOM) {
         $('#model_custom_select').trigger('change');
     }

@@ -4499,6 +4561,7 @@ $(document).ready(async function () {
     $('#openrouter_sort_models').on('change', onOpenrouterModelSortChange);
     $('#model_ai21_select').on('change', onModelChange);
     $('#model_mistralai_select').on('change', onModelChange);
+    $('#model_cohere_select').on('change', onModelChange);
     $('#model_custom_select').on('change', onModelChange);
     $('#settings_preset_openai').on('change', onSettingsPresetChange);
     $('#new_oai_preset').on('click', onNewPresetClick);

@@ -23,6 +23,7 @@ export const SECRET_KEYS = {
     NOMICAI: 'api_key_nomicai',
     KOBOLDCPP: 'api_key_koboldcpp',
     LLAMACPP: 'api_key_llamacpp',
+    COHERE: 'api_key_cohere',
 };
 
 const INPUT_MAP = {

@@ -47,6 +48,7 @@ const INPUT_MAP = {
     [SECRET_KEYS.NOMICAI]: '#api_key_nomicai',
     [SECRET_KEYS.KOBOLDCPP]: '#api_key_koboldcpp',
     [SECRET_KEYS.LLAMACPP]: '#api_key_llamacpp',
+    [SECRET_KEYS.COHERE]: '#api_key_cohere',
 };
 
 async function clearSecret() {

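SECRET_KEYS names the stored secret and INPUT_MAP pairs it with the text field it is typed into, so generic code can go from key to input element; a hypothetical helper built on that pairing:

    // Hypothetical: read whatever the user typed for a given secret key.
    function readSecretInput(key) {
        return String($(INPUT_MAP[key]).val()).trim();
    }
    // readSecretInput(SECRET_KEYS.COHERE) reads from '#api_key_cohere'.
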
@@ -1660,6 +1660,7 @@ function modelCallback(_, model) {
         { id: 'model_google_select', api: 'openai', type: chat_completion_sources.MAKERSUITE },
         { id: 'model_mistralai_select', api: 'openai', type: chat_completion_sources.MISTRALAI },
         { id: 'model_custom_select', api: 'openai', type: chat_completion_sources.CUSTOM },
+        { id: 'model_cohere_select', api: 'openai', type: chat_completion_sources.COHERE },
         { id: 'model_novel_select', api: 'novel', type: null },
         { id: 'horde_model', api: 'koboldhorde', type: null },
     ];