mirror of
https://github.com/SillyTavern/SillyTavern.git
synced 2025-01-05 21:46:49 +01:00
239 lines
8.2 KiB
JavaScript
239 lines
8.2 KiB
JavaScript
import { substituteParams } from '../../../script.js';
|
|
import { extension_settings } from '../../extensions.js';
|
|
export {
|
|
regex_placement,
|
|
getRegexedString,
|
|
runRegexScript,
|
|
};
|
|
|
|
/**
|
|
* @enum {number} Where the regex script should be applied
|
|
*/
|
|
const regex_placement = {
|
|
/**
|
|
* @deprecated MD Display is deprecated. Do not use.
|
|
*/
|
|
MD_DISPLAY: 0,
|
|
USER_INPUT: 1,
|
|
AI_OUTPUT: 2,
|
|
SLASH_COMMAND: 3,
|
|
};
|
|
|
|
/**
|
|
* @enum {number} How the regex script should replace the matched string
|
|
*/
|
|
const regex_replace_strategy = {
|
|
REPLACE: 0,
|
|
OVERLAY: 1,
|
|
};
|
|
|
|
/**
|
|
* Instantiates a regular expression from a string.
|
|
* @param {string} input The input string.
|
|
* @returns {RegExp} The regular expression instance.
|
|
* @copyright Originally from: https://github.com/IonicaBizau/regex-parser.js/blob/master/lib/index.js
|
|
*/
|
|
function regexFromString(input) {
|
|
try {
|
|
// Parse input
|
|
var m = input.match(/(\/?)(.+)\1([a-z]*)/i);
|
|
|
|
// Invalid flags
|
|
if (m[3] && !/^(?!.*?(.).*?\1)[gmixXsuUAJ]+$/.test(m[3])) {
|
|
return RegExp(input);
|
|
}
|
|
|
|
// Create the regular expression
|
|
return new RegExp(m[2], m[3]);
|
|
} catch {
|
|
return;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Parent function to fetch a regexed version of a raw string
|
|
* @param {string} rawString The raw string to be regexed
|
|
* @param {regex_placement} placement The placement of the string
|
|
* @param {RegexParams} params The parameters to use for the regex script
|
|
* @returns {string} The regexed string
|
|
* @typedef {{characterOverride?: string, isMarkdown?: boolean, isPrompt?: boolean }} RegexParams The parameters to use for the regex script
|
|
*/
|
|
function getRegexedString(rawString, placement, { characterOverride, isMarkdown, isPrompt } = {}) {
|
|
// WTF have you passed me?
|
|
if (typeof rawString !== 'string') {
|
|
console.warn('getRegexedString: rawString is not a string. Returning empty string.');
|
|
return '';
|
|
}
|
|
|
|
let finalString = rawString;
|
|
if (extension_settings.disabledExtensions.includes('regex') || !rawString || placement === undefined) {
|
|
return finalString;
|
|
}
|
|
|
|
extension_settings.regex.forEach((script) => {
|
|
if (
|
|
// Script applies to Markdown and input is Markdown
|
|
(script.markdownOnly && isMarkdown) ||
|
|
// Script applies to Generate and input is Generate
|
|
(script.promptOnly && isPrompt) ||
|
|
// Script applies to all cases when neither "only"s are true, but there's no need to do it when `isMarkdown`, the as source (chat history) should already be changed beforehand
|
|
(!script.markdownOnly && !script.promptOnly && !isMarkdown)
|
|
) {
|
|
if (script.placement.includes(placement)) {
|
|
finalString = runRegexScript(script, finalString, { characterOverride });
|
|
}
|
|
}
|
|
});
|
|
|
|
return finalString;
|
|
}
|
|
|
|
/**
|
|
* Runs the provided regex script on the given string
|
|
* @param {object} regexScript The regex script to run
|
|
* @param {string} rawString The string to run the regex script on
|
|
* @param {RegexScriptParams} params The parameters to use for the regex script
|
|
* @returns {string} The new string
|
|
* @typedef {{characterOverride?: string}} RegexScriptParams The parameters to use for the regex script
|
|
*/
|
|
function runRegexScript(regexScript, rawString, { characterOverride } = {}) {
|
|
let newString = rawString;
|
|
if (!regexScript || !!(regexScript.disabled) || !regexScript?.findRegex || !rawString) {
|
|
return newString;
|
|
}
|
|
|
|
const findRegex = regexFromString(regexScript.substituteRegex ? substituteParams(regexScript.findRegex) : regexScript.findRegex);
|
|
|
|
// The user skill issued. Return with nothing.
|
|
if (!findRegex) {
|
|
return newString;
|
|
}
|
|
|
|
// Run replacement. Currently does not support the Overlay strategy
|
|
newString = rawString.replace(findRegex, function(match) {
|
|
const args = [...arguments];
|
|
const replaceString = regexScript.replaceString.replace(/{{match}}/gi, '$0');
|
|
const replaceWithGroups = replaceString.replaceAll(/\$(\d)+/g, (_, num) => {
|
|
// Get a full match or a capture group
|
|
const match = args[Number(num)];
|
|
|
|
// No match found - return the empty string
|
|
if (!match) {
|
|
return '';
|
|
}
|
|
|
|
// Remove trim strings from the match
|
|
const filteredMatch = filterString(match, regexScript.trimStrings, { characterOverride });
|
|
|
|
// TODO: Handle overlay here
|
|
|
|
return filteredMatch;
|
|
});
|
|
|
|
// Substitute at the end
|
|
return substituteParams(replaceWithGroups);
|
|
});
|
|
|
|
return newString;
|
|
}
|
|
|
|
/**
|
|
* Filters anything to trim from the regex match
|
|
* @param {string} rawString The raw string to filter
|
|
* @param {string[]} trimStrings The strings to trim
|
|
* @param {RegexScriptParams} params The parameters to use for the regex filter
|
|
* @returns {string} The filtered string
|
|
*/
|
|
function filterString(rawString, trimStrings, { characterOverride } = {}) {
|
|
let finalString = rawString;
|
|
trimStrings.forEach((trimString) => {
|
|
const subTrimString = substituteParams(trimString, undefined, characterOverride);
|
|
finalString = finalString.replaceAll(subTrimString, '');
|
|
});
|
|
|
|
return finalString;
|
|
}
|
|
|
|
/**
|
|
* Substitutes regex-specific and normal parameters
|
|
* @param {string} rawString
|
|
* @param {string} regexMatch
|
|
* @param {RegexSubstituteParams} params The parameters to use for the regex substitution
|
|
* @returns {string} The substituted string
|
|
* @typedef {{characterOverride?: string, replaceStrategy?: number}} RegexSubstituteParams The parameters to use for the regex substitution
|
|
*/
|
|
function substituteRegexParams(rawString, regexMatch, { characterOverride, replaceStrategy } = {}) {
|
|
let finalString = rawString;
|
|
finalString = substituteParams(finalString, undefined, characterOverride);
|
|
|
|
let overlaidMatch = regexMatch;
|
|
// TODO: Maybe move the for loops into a separate function?
|
|
if (replaceStrategy === regex_replace_strategy.OVERLAY) {
|
|
const splitReplace = finalString.split('{{match}}');
|
|
|
|
// There's a prefix
|
|
if (splitReplace[0]) {
|
|
// Fetch the prefix
|
|
const splicedPrefix = spliceSymbols(splitReplace[0], false);
|
|
|
|
// Sequentially remove all occurrences of prefix from start of split
|
|
const splitMatch = overlaidMatch.split(splicedPrefix);
|
|
let sliceNum = 0;
|
|
for (let index = 0; index < splitMatch.length; index++) {
|
|
if (splitMatch[index].length === 0) {
|
|
sliceNum++;
|
|
} else {
|
|
break;
|
|
}
|
|
}
|
|
|
|
overlaidMatch = splitMatch.slice(sliceNum, splitMatch.length).join(splicedPrefix);
|
|
}
|
|
|
|
// There's a suffix
|
|
if (splitReplace[1]) {
|
|
// Fetch the suffix
|
|
const splicedSuffix = spliceSymbols(splitReplace[1], true);
|
|
|
|
// Sequential removal of all suffix occurrences from end of split
|
|
const splitMatch = overlaidMatch.split(splicedSuffix);
|
|
let sliceNum = 0;
|
|
for (let index = splitMatch.length - 1; index >= 0; index--) {
|
|
if (splitMatch[index].length === 0) {
|
|
sliceNum++;
|
|
} else {
|
|
break;
|
|
}
|
|
}
|
|
|
|
overlaidMatch = splitMatch.slice(0, splitMatch.length - sliceNum).join(splicedSuffix);
|
|
}
|
|
}
|
|
|
|
// Only one match is replaced. This is by design
|
|
finalString = finalString.replace('{{match}}', overlaidMatch) || finalString.replace('{{match}}', regexMatch);
|
|
|
|
return finalString;
|
|
}
|
|
|
|
/**
|
|
* Splices common sentence symbols and whitespace from the beginning and end of a string.
|
|
* Using a for loop due to sequential ordering.
|
|
* @param {string} rawString The raw string to splice
|
|
* @param {boolean} isSuffix String is a suffix
|
|
* @returns {string} The spliced string
|
|
*/
|
|
function spliceSymbols(rawString, isSuffix) {
|
|
let offset = 0;
|
|
|
|
for (const ch of isSuffix ? rawString.split('').reverse() : rawString) {
|
|
if (ch.match(/[^\w.,?'!]/)) {
|
|
offset++;
|
|
} else {
|
|
break;
|
|
}
|
|
}
|
|
|
|
return isSuffix ? rawString.substring(0, rawString.length - offset) : rawString.substring(offset);
|
|
}
|