2023-12-02 19:04:51 +01:00
import { substituteParams } from '../../../script.js' ;
import { extension _settings } from '../../extensions.js' ;
2023-07-20 19:32:15 +02:00
export {
regex _placement ,
getRegexedString ,
2023-12-02 21:06:57 +01:00
runRegexScript ,
2023-12-02 20:11:06 +01:00
} ;
2023-07-20 19:32:15 +02:00
2024-01-03 18:53:24 +01:00
/ * *
* @ enum { number } Where the regex script should be applied
* /
2023-07-20 19:32:15 +02:00
const regex _placement = {
2024-01-03 18:53:24 +01:00
/ * *
* @ deprecated MD Display is deprecated . Do not use .
* /
2023-07-20 19:32:15 +02:00
MD _DISPLAY : 0 ,
USER _INPUT : 1 ,
AI _OUTPUT : 2 ,
2023-12-02 21:06:57 +01:00
SLASH _COMMAND : 3 ,
2023-12-02 20:11:06 +01:00
} ;
2023-07-20 19:32:15 +02:00
2024-01-03 18:53:24 +01:00
/ * *
* Instantiates a regular expression from a string .
* @ param { string } input The input string .
* @ returns { RegExp } The regular expression instance .
* @ copyright Originally from : https : //github.com/IonicaBizau/regex-parser.js/blob/master/lib/index.js
* /
2023-07-20 19:32:15 +02:00
function regexFromString ( input ) {
try {
// Parse input
var m = input . match ( /(\/?)(.+)\1([a-z]*)/i ) ;
2023-11-02 23:52:33 +01:00
2023-07-20 19:32:15 +02:00
// Invalid flags
if ( m [ 3 ] && ! /^(?!.*?(.).*?\1)[gmixXsuUAJ]+$/ . test ( m [ 3 ] ) ) {
return RegExp ( input ) ;
}
2023-11-02 23:52:33 +01:00
2023-07-20 19:32:15 +02:00
// Create the regular expression
return new RegExp ( m [ 2 ] , m [ 3 ] ) ;
} catch {
return ;
}
}
2024-01-03 18:53:24 +01:00
/ * *
* Parent function to fetch a regexed version of a raw string
* @ param { string } rawString The raw string to be regexed
* @ param { regex _placement } placement The placement of the string
* @ param { RegexParams } params The parameters to use for the regex script
* @ returns { string } The regexed string
2024-01-24 21:48:58 +01:00
* @ typedef { { characterOverride ? : string , isMarkdown ? : boolean , isPrompt ? : boolean , depth ? : number } } RegexParams The parameters to use for the regex script
2024-01-03 18:53:24 +01:00
* /
2024-01-24 21:48:58 +01:00
function getRegexedString ( rawString , placement , { characterOverride , isMarkdown , isPrompt , depth } = { } ) {
2024-01-03 18:53:24 +01:00
// WTF have you passed me?
if ( typeof rawString !== 'string' ) {
console . warn ( 'getRegexedString: rawString is not a string. Returning empty string.' ) ;
return '' ;
}
2023-07-20 19:32:15 +02:00
let finalString = rawString ;
2023-12-02 19:04:51 +01:00
if ( extension _settings . disabledExtensions . includes ( 'regex' ) || ! rawString || placement === undefined ) {
2023-07-20 19:32:15 +02:00
return finalString ;
}
extension _settings . regex . forEach ( ( script ) => {
2023-11-02 23:52:33 +01:00
if (
// Script applies to Markdown and input is Markdown
( script . markdownOnly && isMarkdown ) ||
// Script applies to Generate and input is Generate
( script . promptOnly && isPrompt ) ||
// Script applies to all cases when neither "only"s are true, but there's no need to do it when `isMarkdown`, the as source (chat history) should already be changed beforehand
( ! script . markdownOnly && ! script . promptOnly && ! isMarkdown )
) {
2024-01-24 21:48:58 +01:00
// Check if the depth is within the min/max depth
if ( typeof depth === 'number' && depth >= 0 ) {
2024-02-04 20:34:17 +01:00
if ( ! isNaN ( script . minDepth ) && script . minDepth !== null && script . minDepth >= 0 && depth < script . minDepth ) {
2024-01-24 21:48:58 +01:00
console . debug ( ` getRegexedString: Skipping script ${ script . scriptName } because depth ${ depth } is less than minDepth ${ script . minDepth } ` ) ;
return ;
}
2024-02-04 20:34:17 +01:00
if ( ! isNaN ( script . maxDepth ) && script . maxDepth !== null && script . maxDepth >= 0 && depth > script . maxDepth ) {
2024-01-24 21:48:58 +01:00
console . debug ( ` getRegexedString: Skipping script ${ script . scriptName } because depth ${ depth } is greater than maxDepth ${ script . maxDepth } ` ) ;
return ;
}
}
2023-11-02 23:52:33 +01:00
if ( script . placement . includes ( placement ) ) {
finalString = runRegexScript ( script , finalString , { characterOverride } ) ;
}
2023-07-20 19:32:15 +02:00
}
} ) ;
return finalString ;
}
2024-01-03 11:28:56 +01:00
/ * *
* Runs the provided regex script on the given string
* @ param { object } regexScript The regex script to run
* @ param { string } rawString The string to run the regex script on
2024-01-03 18:53:24 +01:00
* @ param { RegexScriptParams } params The parameters to use for the regex script
2024-01-03 11:28:56 +01:00
* @ returns { string } The new string
2024-01-03 18:53:24 +01:00
* @ typedef { { characterOverride ? : string } } RegexScriptParams The parameters to use for the regex script
2024-01-03 11:28:56 +01:00
* /
2023-07-20 19:32:15 +02:00
function runRegexScript ( regexScript , rawString , { characterOverride } = { } ) {
let newString = rawString ;
if ( ! regexScript || ! ! ( regexScript . disabled ) || ! regexScript ? . findRegex || ! rawString ) {
return newString ;
}
const findRegex = regexFromString ( regexScript . substituteRegex ? substituteParams ( regexScript . findRegex ) : regexScript . findRegex ) ;
// The user skill issued. Return with nothing.
if ( ! findRegex ) {
return newString ;
}
2024-01-06 06:30:25 +01:00
// Run replacement. Currently does not support the Overlay strategy
newString = rawString . replace ( findRegex , function ( match ) {
const args = [ ... arguments ] ;
2024-01-11 01:41:00 +01:00
const replaceString = regexScript . replaceString . replace ( /{{match}}/gi , '$0' ) ;
2024-01-06 06:30:25 +01:00
const replaceWithGroups = replaceString . replaceAll ( /\$(\d)+/g , ( _ , num ) => {
2024-01-11 01:41:00 +01:00
// Get a full match or a capture group
2024-01-06 06:30:25 +01:00
const match = args [ Number ( num ) ] ;
2024-01-11 01:41:00 +01:00
// No match found - return the empty string
if ( ! match ) {
return '' ;
}
// Remove trim strings from the match
2024-01-06 06:30:25 +01:00
const filteredMatch = filterString ( match , regexScript . trimStrings , { characterOverride } ) ;
// TODO: Handle overlay here
return filteredMatch ;
} ) ;
// Substitute at the end
return substituteParams ( replaceWithGroups ) ;
2024-01-03 18:53:24 +01:00
} ) ;
2023-07-20 19:32:15 +02:00
return newString ;
}
2024-01-03 18:53:24 +01:00
/ * *
* Filters anything to trim from the regex match
* @ param { string } rawString The raw string to filter
* @ param { string [ ] } trimStrings The strings to trim
* @ param { RegexScriptParams } params The parameters to use for the regex filter
* @ returns { string } The filtered string
* /
2023-07-20 19:32:15 +02:00
function filterString ( rawString , trimStrings , { characterOverride } = { } ) {
let finalString = rawString ;
2024-01-06 06:33:52 +01:00
trimStrings . forEach ( ( trimString ) => {
2023-07-20 19:32:15 +02:00
const subTrimString = substituteParams ( trimString , undefined , characterOverride ) ;
2023-12-02 19:04:51 +01:00
finalString = finalString . replaceAll ( subTrimString , '' ) ;
2024-01-06 06:33:52 +01:00
} ) ;
2023-07-20 19:32:15 +02:00
return finalString ;
}