prototype-3x5/src/parser.ts

177 lines
4.2 KiB
TypeScript
Raw Normal View History

2023-08-05 05:09:33 +00:00
import { escapeHtml } from "./helpers";
import {
AtLeast,
Choose,
End,
Pattern,
Peek,
Regex,
Sequence,
Use,
} from "./peg";
import {
EnchantedWord as EnchantedWordType,
InterpolatedPiece,
2023-08-25 23:16:33 +00:00
Script,
2023-08-25 23:10:45 +00:00
ScriptPiece,
2023-08-25 23:16:33 +00:00
SimplifyWord,
TextWord,
Word as WordType,
} from "./words";
2023-08-05 05:09:33 +00:00
/** A `#` followed by every character up to (but not including) the next newline. */
const COMMENT_REGEX = /#[^\n]*/y;

/**
 * Pattern for a comment. The matched text is discarded: the result is mapped
 * to an empty array, the same shape the script pattern uses for "no command".
 * Labelled "#" via `expects` (presumably the text shown in "Expected:" error
 * output — confirm in ./peg).
 */
const Comment = Regex(COMMENT_REGEX)
  .expects("#")
  .map(() => []);
/**
 * One or more whitespace characters, excluding newline. (`;` is excluded by
 * the character class too, although it is not whitespace.)
 */
const PRE_WORD_WHITESPACE_REGEX = /[^\S\n;]+/y;

/** Pattern for the horizontal whitespace that separates words within a command. */
const PreWordWhitespace = Regex(PRE_WORD_WHITESPACE_REGEX).expects(
  "whitespace"
);
2023-08-25 23:10:45 +00:00
/**
 * One or more characters that are none of `]`, `[`, `}`, `{`, `$`, `\`, `"`,
 * `;` or whitespace, and that are immediately followed (lookahead only) by
 * whitespace, `;`, `]`, or the end of the input.
 */
const ENCHANTED_WORD_REGEX = /[^\]\[\}\{$\\";\s]+(?=[\s;\]]|$)/y;

/**
 * Pattern for a word made only of "plain" characters; the whole match is
 * wrapped as `{ enchanted: <matched text> }`.
 */
const EnchantedWord = Regex(ENCHANTED_WORD_REGEX)
  .map((match) => ({ enchanted: match[0] } as EnchantedWordType))
  .expects("ENCHANTED_WORD");
2023-08-23 05:09:56 +00:00
/** A backslash followed by any single character other than a line terminator. */
const BACKSLASH_ESCAPE_REGEX = /\\(.)/y;

/**
 * Pattern for a backslash escape. Produces a text piece holding only the
 * escaped character (capture group 1); the backslash itself is dropped.
 */
const BackslashEscape = Regex(BACKSLASH_ESCAPE_REGEX)
  .expects("\\")
  .map((match) => ({ text: match[1] }));
2023-08-25 23:10:45 +00:00
/**
 * Run of characters allowed in a top-level bare word: anything except
 * whitespace, backslash, `;` and `[`. Sticky (`y`), so it only matches at the
 * regex's current `lastIndex`.
 */
const BARE_WORD_CHAR = /[^\s\\;\[]+/y;
/**
 * Same as `BARE_WORD_CHAR` but additionally excludes `]`; used for bare words
 * inside a bracketed script, where `]` ends the script.
 */
const BARE_BRACKET_WORD_CHAR = /[^\s\\;\[\]]+/y;
/**
 * Forward declaration of the pattern for the script inside `[...]`. It is
 * assigned further down in this file, once the script template exists; until
 * then it is only referenced lazily through `Use`.
 */
let BracketScript: Pattern<Script>;

/**
 * Pattern for a bracketed sub-script: a literal `[` followed by
 * `BracketScript`. The result is wrapped as `{ script }`, where `script` is
 * the second element produced by the sequence.
 */
const Bracket: Pattern<ScriptPiece> = Sequence(
  Regex(/\[/y).expects("["),
  // Looked up through a thunk because BracketScript is not assigned yet.
  Use(() => BracketScript)
)
  .expects("[")
  .map((matched) => ({ script: matched[1] }));
/**
 * Builds the pattern for a bare (unquoted, unbraced) word.
 *
 * The word must not start with `"` or `{` (checked with a zero-width negative
 * lookahead), and consists of one or more pieces. Each piece is, in the order
 * listed: a backslash escape, a bracketed script, or a run of characters
 * matched by `charRegex`. The collected pieces are passed to `SimplifyWord`.
 *
 * NOTE(review): the exact semantics of `Sequence`, `AtLeast` and `Choose`
 * live in ./peg and are assumed from their names — confirm there.
 *
 * @param charRegex - regex for a run of ordinary bare-word characters; it is
 *   handed directly to `Regex`.
 * @returns the pattern produced by mapping the piece list through
 *   `SimplifyWord`.
 */
function bareWordTmpl(charRegex: RegExp) {
  return Sequence(
    // Zero-width guard: quoted and braced words are handled by other patterns.
    Regex(/(?!["\{])/y),
    AtLeast(
      1,
      Choose<InterpolatedPiece>(
        BackslashEscape,
        Bracket,
        Regex(charRegex)
          .expects("CHAR")
          .map(([text]) => ({ text }))
      )
    )
  ).map(([, pieces]) => SimplifyWord(pieces));
}
2023-08-23 05:09:56 +00:00
/**
 * Pattern for a double-quoted word: an opening `"`, zero or more pieces, and
 * a closing `"`.
 *
 * Each piece is, in the order listed: a backslash escape, a bracketed script,
 * or a run of characters other than `"`, `\` and `[`. The collected pieces
 * (without the surrounding quotes) are passed to `SimplifyWord`.
 *
 * NOTE(review): the exact semantics of `Sequence`, `AtLeast` and `Choose`
 * live in ./peg and are assumed from their names — confirm there.
 */
const QuotedWord = Sequence(
  Regex(/"/y).expects('"'),
  AtLeast(
    0,
    Choose<InterpolatedPiece>(
      BackslashEscape,
      Bracket,
      Regex(/[^"\\\[]+/y)
        .expects("CHAR")
        .map(([text]) => ({ text }))
    )
  ),
  Regex(/"/y).expects('"')
).map(([, pieces]) => SimplifyWord(pieces));
2023-08-05 05:09:33 +00:00
2023-08-06 06:09:30 +00:00
/**
 * Pattern for a brace-delimited literal: `{`, zero or more fragments, `}`.
 * Produces the text between the outermost braces as a single string.
 *
 * Each fragment is, in the order listed:
 * - a nested `Brace`, whose text is re-wrapped in `{` and `}` so inner braces
 *   are preserved in the result;
 * - a backslash followed by one character (not a line terminator), kept
 *   verbatim including the backslash;
 * - a run of characters other than `\`, `{` and `}`.
 *
 * NOTE(review): the exact semantics of `Sequence`, `AtLeast`, `Choose` and
 * `Use` live in ./peg and are assumed from their names — confirm there.
 */
const Brace: Pattern<string> = Sequence(
  Regex(/\{/y).expects("{"),
  AtLeast(
    0,
    Choose(
      // Self-reference goes through a thunk because Brace is still being defined.
      Use(() => Brace)
        .expects("{")
        .map((text) => `{${text}}`),
      Regex(/\\./y)
        .expects("\\")
        .map(([escape]) => escape),
      Regex(/[^\\{}]+/y)
        .expects("text")
        .map(([text]) => text)
    )
  ),
  Regex(/\}/y).expects("}")
).map(([, fragments]) => fragments.join(""));
2023-08-05 05:09:33 +00:00
/**
 * Builds the pattern for a single word. Alternatives are handed to `Choose`
 * in this order: enchanted word, braced literal (wrapped as a text word),
 * quoted word, bare word.
 *
 * @param bareWordCharRegex - regex for runs of ordinary characters in a bare
 *   word; forwarded to `bareWordTmpl`.
 * @returns a pattern producing a word.
 */
function wordTmpl(bareWordCharRegex: RegExp): Pattern<WordType> {
  const bracedText = Brace.map((text) => ({ text } as TextWord));
  const bareWord = bareWordTmpl(bareWordCharRegex);
  return Choose<WordType>(EnchantedWord, bracedText, QuotedWord, bareWord);
}
2023-08-05 05:09:33 +00:00
/** A single newline or `;`. */
const COMMAND_TERMINATOR_REGEX = /[\n;]/y;

/** Pattern for the separator that ends a command; its result is mapped to `true`. */
const CommandTerminator = Regex(COMMAND_TERMINATOR_REGEX)
  .expects("NEWLINE | ;")
  .map(() => true);
/**
 * Builds the pattern for one command: a word, then zero or more
 * whitespace-separated further words, then optional trailing whitespace.
 *
 * @param bareWordCharRegex - regex for runs of ordinary characters in a bare
 *   word; forwarded to `wordTmpl`.
 * @returns a pattern producing the command's words as one flat array, first
 *   word first.
 */
function commandTmpl(bareWordCharRegex: RegExp) {
  const word = wordTmpl(bareWordCharRegex);
  // A further word must be preceded by whitespace; only the word is kept.
  const spacedWord = Sequence(PreWordWhitespace, word).map(
    ([, nextWord]) => nextWord
  );
  const trailingWhitespace = AtLeast(0, PreWordWhitespace);

  return Sequence(word, AtLeast(0, spacedWord), trailingWhitespace).map(
    ([firstWord, restWords]) => [firstWord].concat(restWords)
  );
}
2023-08-05 05:09:33 +00:00
/**
 * Builds the pattern for a whole script: zero or more items followed by
 * `endPattern`.
 *
 * Each item is, in the order listed:
 * - inter-word whitespace (yields an empty array);
 * - a command terminator (yields an empty array);
 * - a comment followed by either a command terminator or a lookahead for
 *   `endPattern` (yields an empty array);
 * - a command followed by either a command terminator or a lookahead for
 *   `endPattern` (yields the command's words).
 *
 * The empty arrays are filtered out at the end, so the result contains only
 * real commands.
 *
 * NOTE(review): `Peek` is assumed to match without consuming input, so that
 * the final `endPattern` can still match — confirm in ./peg.
 *
 * @param bareWordCharRegex - regex for runs of ordinary characters in a bare
 *   word; forwarded to `commandTmpl`.
 * @param endPattern - pattern that must match after the last item.
 * @returns a pattern producing the list of non-empty commands.
 */
function scriptTmpl(bareWordCharRegex: RegExp, endPattern: Pattern<unknown>) {
  return Sequence(
    AtLeast(
      0,
      Choose(
        PreWordWhitespace.map(() => []),
        CommandTerminator.map(() => []),
        Sequence(Comment, Choose(CommandTerminator, Peek(endPattern))).map(
          () => []
        ),
        Sequence(
          commandTmpl(bareWordCharRegex),
          Choose(CommandTerminator, Peek(endPattern))
        ).map(([words]) => words)
      )
    ),
    endPattern
  ).map(([commands]) => commands.filter((command) => command.length > 0));
}
/**
 * Top-level script pattern: bare words use `BARE_WORD_CHAR` and the script
 * must be followed by `End()` (presumably end of input — confirm in ./peg).
 * Note that this value shares its name with the `Script` type imported from
 * "./words".
 */
const Script = scriptTmpl(BARE_WORD_CHAR, End());

// Fill in the forward-declared pattern used by `Bracket`: a script whose bare
// words cannot contain `]` and which is terminated by a literal `]`.
BracketScript = scriptTmpl(BARE_BRACKET_WORD_CHAR, Regex(/\]/y).expects("]"));
2023-08-05 05:09:33 +00:00
/**
 * Captures the text surrounding an error position for display.
 * Group 1 (inside a lookbehind) is up to 50 non-newline characters before the
 * position; group 2 is up to 50 non-newline characters from the position on.
 * The regex is sticky (`y`), so the position is chosen by setting `lastIndex`
 * before calling `exec`.
 */
const ERROR_CONTEXT = /(?<=([^\n]{0,50}))([^\n]{0,50})/y;
2023-07-29 17:50:13 +00:00
2023-08-05 05:09:33 +00:00
/**
 * Parse out a Notcl script into an easier-to-interpret representation.
 * No script is actually executed yet.
 *
 * Before parsing, line continuations are folded: a backslash immediately
 * followed by a newline (and any spaces or tabs after it) is replaced by a
 * single space, provided the backslash is not itself escaped, i.e. it is
 * preceded by an even number of backslashes, which are kept. Error positions
 * therefore refer to the folded text, not the original input.
 *
 * @param code - code to parse
 * @returns `[true, script]` with the parsed list of commands on success, or
 *   `[false, message]` on failure, where `message` is a `<pre>` block holding
 *   the error position, an excerpt of the offending line with a caret under
 *   the position, and what the parser expected there
 */
export function parse(code: string): [true, Script] | [false, string] {
  /* Preprocess */
  // fold line endings
  code = code.replace(/(?<!\\)((\\\\)*)\\\n[ \t]*/g, "$1 ");

  /* Parse */
  const [commands, errorPos, expected] = Script(code, 0);
  if (commands) {
    return [true, commands[0]];
  }

  /* Report */
  // ERROR_CONTEXT is sticky, so lastIndex selects where the excerpt is taken.
  ERROR_CONTEXT.lastIndex = errorPos;
  const context = ERROR_CONTEXT.exec(code);
  // exec() yields null when lastIndex lies beyond the end of the text; fall
  // back to an empty excerpt instead of throwing while reporting an error.
  const before = context?.[1] ?? "";
  const after = context?.[2] ?? "";

  return [
    false,
    `<pre>Error at position ${errorPos}
${escapeHtml(before + after)}
${"-".repeat(before.length)}^
Expected: ${escapeHtml(expected)}</pre>`,
  ];
}