Parser consumes basic macros

- Fix lexer mode names - Add basic macro parsing (identifier, and arguments) - Tests: basic macro parsing tests - Tests: simplifyCstNode supports ignoring nodes, or flattening nodes to just plaintext
2025-06-05 21:59:27 +02:00 · 2025-03-17 00:12:04 +01:00
parent 6a72369327
commit efa367541a
3 changed files with 167 additions and 33 deletions
--- a/public/scripts/macros/MacroLexer.js
+++ b/public/scripts/macros/MacroLexer.js
@@ -6,10 +6,10 @@ import { createToken, Lexer } from '../../lib/chevrotain.js';
 const modes = {
    plaintext: 'plaintext_mode',
    macro_def: 'macro_def_mode',
-    macro_identifier_end: 'macro_identifier_end',
+    macro_identifier_end: 'macro_identifier_end_mode',
    macro_args: 'macro_args_mode',
    macro_filter_modifer: 'macro_filter_modifer_mode',
-    macro_filter_modifier_end: 'macro_filter_modifier_end',
+    macro_filter_modifier_end: 'macro_filter_modifier_end_mode',
 };

 /** @readonly */
@@ -146,7 +146,9 @@ class MacroLexer extends Lexer {

    /** @private */
    constructor() {
-        super(MacroLexer.def);
+        super(MacroLexer.def, {
+            traceInitPerf: true,
+        });
    }

    test(input) {
--- a/public/scripts/macros/MacroParser.js
+++ b/public/scripts/macros/MacroParser.js
@@ -1,6 +1,8 @@
 import { CstParser } from '../../lib/chevrotain.js';
 import { MacroLexer } from './MacroLexer.js';

+/** @typedef {import('../../lib/chevrotain.js').TokenType} TokenType */
+
 /**
 * The singleton instance of the MacroParser.
 *
@@ -15,20 +17,45 @@ class MacroParser extends CstParser {

    /** @private */
    constructor() {
-        super(MacroLexer.def);
+        super(MacroLexer.def, {
+            traceInitPerf: true,
+            nodeLocationTracking: 'full',
+        });
        const Tokens = MacroLexer.tokens;

        const $ = this;

-        this.macro = $.RULE('macro', () => {
+        // Basic Macro Structure
+        $.macro = $.RULE('macro', () => {
            $.CONSUME(Tokens.Macro.Start);
            $.CONSUME(Tokens.Macro.Identifier);
            $.OPTION(() => $.SUBRULE($.arguments));
            $.CONSUME(Tokens.Macro.End);
        });

-        this.arguments = $.RULE('arguments', () => {
-            $.CONSUME(Tokens.Identifier);
+        // Arguments Parsing
+        $.arguments = $.RULE('arguments', () => {
+            // Remember the separator being used, it needs to stay consistent
+            /** @type {import('../../lib/chevrotain.js').IToken} */
+            let separator;
+            $.OR([
+                { ALT: () => separator = $.CONSUME(Tokens.Args.DoubleColon, { LABEL: 'separator' }) },
+                { ALT: () => separator = $.CONSUME(Tokens.Args.Colon, { LABEL: 'separator' }) },
+            ]);
+            $.AT_LEAST_ONE_SEP({
+                SEP: separator.tokenType,
+                DEF: () => $.SUBRULE($.argument),
+            });
+        });
+
+        $.argument = $.RULE('argument', () => {
+            $.MANY(() => {
+                $.OR([
+                    { ALT: () => $.SUBRULE($.macro) }, // Nested Macros
+                    { ALT: () => $.CONSUME(Tokens.Identifier) },
+                    { ALT: () => $.CONSUME(Tokens.Unknown) },
+                ]);
+            });
        });

        this.performSelfAnalysis();
--- a/tests/frontend/MacroParser.test.js
+++ b/tests/frontend/MacroParser.test.js
@@ -40,20 +40,6 @@ describe('MacroParser', () => {

            expect(macroCst).toEqual(expectedCst);
        });
-        // {{ macro value }}
-        it('should only read one identifier and treat the rest as arguments', async () => {
-            const input = '{{ macro value }}';
-            const macroCst = await runParser(input);
-
-            const expectedCst = {
-                'Macro.Start': '{{',
-                'Macro.Identifier': 'macro',
-                'arguments': { 'Identifier': 'value' },
-                'Macro.End': '}}',
-            };
-
-            expect(macroCst).toEqual(expectedCst);
-        });

        describe('Error Cases (General Macro', () => {
            // {{}}
@@ -94,16 +80,107 @@ describe('MacroParser', () => {
            });
        });
    });
+
+    describe('Arguments Handling', () => {
+        it('should parse macros with double-colon argument', async () => {
+            const input = '{{getvar::myvar}}';
+            const macroCst = await runParser(input, {
+                flattenKeys: ['arguments.argument'],
+            });
+            expect(macroCst).toEqual({
+                'Macro.Start': '{{',
+                'Macro.Identifier': 'getvar',
+                'arguments': {
+                    'separator': '::',
+                    'argument': 'myvar',
+                },
+                'Macro.End': '}}',
+            });
+        });
+
+        it('should parse macros with single colon arguments', async () => {
+            const input = '{{roll:3d20}}';
+            const macroCst = await runParser(input, {
+                flattenKeys: ['arguments.argument'],
+            });
+            expect(macroCst).toEqual({
+                'Macro.Start': '{{',
+                'Macro.Identifier': 'roll',
+                'arguments': {
+                    'separator': ':',
+                    'argument': '3d20',
+                },
+                'Macro.End': '}}',
+            });
+        });
+
+        it('should parse macros with double-colon arguments', async () => {
+            const input = '{{setvar::myvar::value}}';
+            const macroCst = await runParser(input, {
+                flattenKeys: ['arguments.argument'],
+                ignoreKeys: ['arguments.Args.DoubleColon'],
+            });
+            expect(macroCst).toEqual({
+                'Macro.Start': '{{',
+                'Macro.Identifier': 'setvar',
+                'arguments': {
+                    'separator': '::',
+                    'argument': ['myvar', 'value'],
+                },
+                'Macro.End': '}}',
+            });
+        });
+
+        it('should strip spaces around arguments', async () => {
+            const input = '{{something::  spaced  }}';
+            const macroCst = await runParser(input, {
+                flattenKeys: ['arguments.argument'],
+                ignoreKeys: ['arguments.separator', 'arguments.Args.DoubleColon'],
+            });
+            expect(macroCst).toEqual({
+                'Macro.Start': '{{',
+                'Macro.Identifier': 'something',
+                'arguments': { 'argument': 'spaced' },
+                'Macro.End': '}}',
+            });
+        });
+    });
+
+    describe('Nested Macros', () => {
+        it('should parse nested macros inside arguments', async () => {
+            const input = '{{outer::word {{inner}}}}';
+            const macroCst = await runParser(input, {});
+            expect(macroCst).toEqual({
+                'Macro.Start': '{{',
+                'Macro.Identifier': 'outer',
+                'arguments': {
+                    'argument': {
+                        'Identifier': 'word',
+                        'macro': {
+                            'Macro.Start': '{{',
+                            'Macro.Identifier': 'inner',
+                            'Macro.End': '}}',
+                        },
+                    },
+                    'separator': '::',
+                },
+                'Macro.End': '}}',
+            });
+        });
+    });
 });

 /**
 * Runs the input through the MacroParser and returns the result.
 *
 * @param {string} input - The input string to be parsed.
- * @return {Promise<TestableCstNode>} A promise that resolves to the result of the MacroParser.
+ * @param {Object} [options={}] Optional arguments
+ * @param {string[]} [options.flattenKeys=[]] Optional array of dot-separated keys to flatten
+ * @param {string[]} [options.ignoreKeys=[]] Optional array of dot-separated keys to ignore
+ * @returns {Promise<TestableCstNode>} A promise that resolves to the result of the MacroParser.
 */
-async function runParser(input) {
-    const { cst, errors } = await runParserAndGetErrors(input);
+async function runParser(input, options = {}) {
+    const { cst, errors } = await runParserAndGetErrors(input, options);

    // Make sure that parser errors get correctly marked as errors during testing, even if the resulting structure might work.
    // If we don't test for errors, the test should fail.
@@ -120,9 +197,12 @@ async function runParser(input) {
 * Use `runParser` if you don't want to explicitly test against parser errors.
 *
 * @param {string} input - The input string to be parsed.
- * @return {Promise<{cst: TestableCstNode, errors: TestableRecognitionException[]}>} A promise that resolves to the result of the MacroParser and error list.
+ * @param {Object} [options={}] Optional arguments
+ * @param {string[]} [options.flattenKeys=[]] Optional array of dot-separated keys to flatten
+ * @param {string[]} [options.ignoreKeys=[]] Optional array of dot-separated keys to ignore
+ * @returns {Promise<{cst: TestableCstNode, errors: TestableRecognitionException[]}>} A promise that resolves to the result of the MacroParser and error list.
 */
-async function runParserAndGetErrors(input) {
+async function runParserAndGetErrors(input, options = {}) {
    const result = await page.evaluate(async (input) => {
        /** @type {import('../../public/scripts/macros/MacroParser.js')} */
        const { MacroParser } = await import('./scripts/macros/MacroParser.js');
@@ -131,31 +211,56 @@ async function runParserAndGetErrors(input) {
        return result;
    }, input);

-    return { cst: simplifyCstNode(result.cst), errors: simplifyErrors(result.errors) };
+    return { cst: simplifyCstNode(result.cst, input, options), errors: simplifyErrors(result.errors) };
 }

 /**
 * Simplify the parser syntax tree result into an easily testable format.
 *
 * @param {CstNode} result The result from the parser
+ * @param {Object} [options={}] Optional arguments
+ * @param {string[]} [options.flattenKeys=[]] Optional array of dot-separated keys to flatten
+ * @param {string[]} [options.ignoreKeys=[]] Optional array of dot-separated keys to ignore
 * @returns {TestableCstNode} The testable syntax tree
 */
-function simplifyCstNode(cst) {
-    /** @returns {TestableCstNode} @param {CstNode} node */
-    function simplifyNode(node) {
+function simplifyCstNode(cst, input, { flattenKeys = [], ignoreKeys = [] } = {}) {
+    /** @returns {TestableCstNode} @param {CstNode} node @param {string[]} path */
+    function simplifyNode(node, path = []) {
        if (!node) return node;
        if (Array.isArray(node)) {
            // Single-element arrays are converted to a single string
            if (node.length === 1) {
-                return node[0].image || simplifyNode(node[0]);
+                return node[0].image || simplifyNode(node[0], path.concat('[]'));
            }
            // For multiple elements, return an array of simplified nodes
-            return node.map(simplifyNode);
+            return node.map(child => simplifyNode(child, path.concat('[]')));
        }
        if (node.children) {
            const simplifiedChildren = {};
            for (const key in node.children) {
-                simplifiedChildren[key] = simplifyNode(node.children[key]);
+                function simplifyChildNode(childNode, path) {
+                    if (Array.isArray(childNode)) {
+                        // Single-element arrays are converted to a single string
+                        if (childNode.length === 1) {
+                            return simplifyChildNode(childNode[0], path.concat('[]'));
+                        }
+                        return childNode.map(child => simplifyChildNode(child, path.concat('[]')));
+                    }
+
+                    const flattenKey = path.filter(x => x !== '[]').join('.');
+                    if (ignoreKeys.includes(flattenKey)) {
+                        return null;
+                    } else if (flattenKeys.includes(flattenKey)) {
+                        const startOffset = childNode.location.startOffset;
+                        const endOffset = childNode.location.endOffset;
+                        return input.slice(startOffset, endOffset + 1);
+                    } else {
+                        return simplifyNode(childNode, path);
+                    }
+                }
+
+                const simplifiedValue = simplifyChildNode(node.children[key], path.concat(key));
+                simplifiedValue && (simplifiedChildren[key] = simplifiedValue);
            }
            return simplifiedChildren;
        }