prototype-3x5/src/parser.ts

158 lines
4 KiB
TypeScript
Raw Normal View History

2023-09-08 04:47:47 +00:00
import { escapeHtml } from './helpers';
import { AtLeast, Choose, End, Pattern, Peek, Regex, Sequence, Use } from './peg';
import {
2023-09-08 04:47:47 +00:00
InterpolatedPiece, Script, ScriptPiece, SimplifyWord, TextWord, Word as WordType
} from './words';
2023-08-05 05:09:33 +00:00
/**
 * Matches a `#` and everything after it up to (but not including) the next
 * newline. A comment contributes no words, so it yields an empty array.
 */
const Comment = Regex(/#[^\n]*/y).expects("#").map(() => {
  return [];
});
/**
 * Matches one or more whitespace characters other than a newline.
 * Newlines are excluded here because they are matched separately as command
 * terminators.
 */
const PreWordWhitespace = Regex(/[^\S\n;]+/y).expects("whitespace");
2023-09-08 18:47:24 +00:00
/**
 * Matches a backslash followed by exactly one character (`.` does not match a
 * newline) and yields that character as a literal `{ text }` piece, dropping
 * the backslash itself.
 */
const BackslashEscape = Sequence(
  Regex(/\\/y).expects("BACKSLASH"),
  Regex(/./y).expects("CHAR")
).map((parts) => {
  // parts[0] is the backslash match; parts[1] is the match of the escaped character.
  const escapedChar = parts[1][0];
  return { text: escapedChar };
});
2023-08-23 05:09:56 +00:00
2023-08-25 23:10:45 +00:00
// Run of characters allowed in a bare (unquoted) word of a top-level script:
// anything except whitespace, backslash, `;` and `[`.
const BARE_WORD_CHAR = /[^\s\\;\[]+/y;
// Same as above but also excluding `]`; used for scripts nested inside
// brackets, where `]` ends the nested script.
const BARE_BRACKET_WORD_CHAR = /[^\s\\;\[\]]+/y;
/**
 * Pattern for the script nested inside `[ ... ]`. Declared here and assigned
 * later in the file, because it is built from patterns that in turn refer
 * back to `Bracket`.
 */
let BracketScript: Pattern<Script>;

/**
 * Matches `[` followed by a nested script and yields it as a `{ script }`
 * piece. `Use` defers the lookup of `BracketScript` until match time, so the
 * late assignment is visible.
 */
const Bracket: Pattern<ScriptPiece> = Sequence(
  Regex(/\[/y).expects("["),
  Use(() => BracketScript)
)
  .expects("[")
  .map((parts) => {
    const nestedScript = parts[1];
    return { script: nestedScript };
  });
/**
 * Builds the pattern for a bare (unquoted, unbraced) word.
 *
 * A bare word is one or more pieces, each being a backslash escape, a
 * bracketed script, or a run of characters matched by `charRegex`. Character
 * runs are emitted as `{ enchanted }` pieces, and the collected pieces are
 * passed through `SimplifyWord`.
 *
 * @param charRegex - sticky regex matching a run of plain bare-word characters
 * @returns pattern producing the simplified word
 */
function bareWordTmpl(charRegex: RegExp) {
  // Zero-width guard: a word starting with `"` or `{` is never a bare word.
  const notQuoteOrBrace = Regex(/(?!["{])/y);

  const plainRun: Pattern<InterpolatedPiece> = Regex(charRegex)
    .expects("CHAR")
    .map((hit) => ({ enchanted: hit[0] }));

  const wordPieces = AtLeast(
    1,
    Choose<InterpolatedPiece>(BackslashEscape, Bracket, plainRun)
  );

  return Sequence(notQuoteOrBrace, wordPieces).map((parts) =>
    SimplifyWord(parts[1])
  );
}
2023-08-23 05:09:56 +00:00
/**
 * Matches a double-quoted word: `"`, then zero or more pieces, then `"`.
 * Each piece is a backslash escape, a bracketed script, or a run of
 * characters other than `"`, backslash and `[` (emitted as a `{ text }`
 * piece). The collected pieces are passed through `SimplifyWord`.
 */
const QuotedWord = Sequence(
  Regex(/"/y).expects('"'),
  AtLeast(
    0,
    Choose<InterpolatedPiece>(
      BackslashEscape,
      Bracket,
      Regex(/[^"\\\[]+/y)
        .expects("CHAR")
        .map((hit) => {
          return { text: hit[0] };
        })
    )
  ),
  Regex(/"/y).expects('"')
).map((parts) => {
  // parts = [opening quote, pieces, closing quote]
  const pieces = parts[1];
  return SimplifyWord(pieces);
});
2023-08-05 05:09:33 +00:00
2023-08-06 06:09:30 +00:00
/**
 * Matches a brace-delimited word `{ ... }` and yields its raw inner text.
 *
 * The contents are not interpreted: nested brace groups are kept verbatim
 * (with their braces restored), backslash escapes are kept verbatim (with
 * the backslash), and every other run of characters is copied as-is.
 */
const Brace: Pattern<string> = Sequence(
  Regex(/\{/y).expects("{"),
  AtLeast(
    0,
    Choose(
      // Nested group: recurse, then re-wrap the inner text in its braces.
      Use(() => Brace)
        .expects("{")
        .map((inner) => "{" + inner + "}"),
      // Backslash plus one character, preserved as written.
      Regex(/\\./y)
        .expects("BACKSLASH")
        .map((hit) => hit[0]),
      // Anything that is not a backslash or a brace.
      Regex(/[^\\{}]+/y)
        .expects("CHAR")
        .map((hit) => hit[0])
    )
  ),
  Regex(/\}/y).expects("}")
).map((parts) => {
  const fragments = parts[1];
  return fragments.join("");
});
2023-08-05 05:09:33 +00:00
/**
 * Builds the pattern for a single word, trying in order: a braced word
 * (wrapped as a text word), a quoted word, then a bare word.
 *
 * @param bareWordCharRegex - sticky regex for runs of plain bare-word characters
 * @returns pattern producing one word
 */
function wordTmpl(bareWordCharRegex: RegExp): Pattern<WordType> {
  const bracedWord = Brace.map((text) => ({ text } as TextWord));
  const bareWord = bareWordTmpl(bareWordCharRegex);

  return Choose<WordType>(bracedWord, QuotedWord, bareWord);
}
2023-08-05 05:09:33 +00:00
/** Matches a single newline or `;`, which ends a command. Always yields `true`. */
const CommandTerminator = Regex(/[\n;]/y).expects("NEWLINE | ;").map(() => {
  return true;
});
/**
 * Builds the pattern for one command: a word, then any number of further
 * words each preceded by whitespace, then optional trailing whitespace.
 *
 * @param bareWordCharRegex - sticky regex for runs of plain bare-word characters
 * @returns pattern producing the command's words in order
 */
function commandTmpl(bareWordCharRegex: RegExp) {
  const word = wordTmpl(bareWordCharRegex);

  // A following word: the separating whitespace is matched and discarded.
  const spacedWord = Sequence(PreWordWhitespace, word).map(
    (parts) => parts[1]
  );

  return Sequence(
    word,
    AtLeast(0, spacedWord),
    AtLeast(0, PreWordWhitespace)
  ).map(([firstWord, remainingWords]) => [firstWord, ...remainingWords]);
}
2023-08-05 05:09:33 +00:00
/**
 * Builds the pattern for a whole script: any mix of whitespace, command
 * terminators, comments and commands, followed by `endPattern`.
 *
 * Comments and commands must be followed either by a command terminator or
 * by something `endPattern` would match (checked with `Peek`). Whitespace,
 * bare terminators and comments produce empty entries, which are filtered
 * out of the result.
 *
 * @param bareWordCharRegex - sticky regex for runs of plain bare-word characters
 * @param endPattern - pattern that must match after the last command
 * @returns pattern producing the list of non-empty commands
 */
function scriptTmpl(bareWordCharRegex: RegExp, endPattern: Pattern<unknown>) {
  // Built fresh for each use, mirroring the two separate instances needed below.
  const commandEnd = () => Choose(CommandTerminator, Peek(endPattern));

  const blankSpace = PreWordWhitespace.map(() => []);
  const bareTerminator = CommandTerminator.map(() => []);
  const commentLine = Sequence(Comment, commandEnd()).map(() => []);
  const command = Sequence(commandTmpl(bareWordCharRegex), commandEnd()).map(
    (parts) => parts[0]
  );

  return Sequence(
    AtLeast(0, Choose(blankSpace, bareTerminator, commentLine, command)),
    endPattern
  ).map(([entries]) => entries.filter((entry) => entry.length > 0));
}
// Top-level script pattern: bare words use BARE_WORD_CHAR, and the script
// must be followed by `End()` (presumably end of input — confirm in ./peg).
const Script = scriptTmpl(BARE_WORD_CHAR, End());
2023-08-25 23:10:45 +00:00
// Fill in the forward-declared nested-script pattern used by `Bracket`:
// bare words may not contain `]`, and the script is closed by a literal `]`.
BracketScript = scriptTmpl(BARE_BRACKET_WORD_CHAR, Regex(/\]/y).expects("]"));
2023-08-05 05:09:33 +00:00
// Sticky regex used to show where a parse error occurred. Set `lastIndex` to
// the error offset, then `exec`: group 1 (captured inside a lookbehind) is up
// to 50 non-newline characters before the offset, group 2 is up to 50
// non-newline characters from the offset onward.
const ERROR_CONTEXT = /(?<=([^\n]{0,50}))([^\n]{0,50})/y;
2023-07-29 17:50:13 +00:00
2023-08-05 05:09:33 +00:00
/**
 * Parse out a Notcl script into an easier-to-interpret representation.
 * No script is actually executed yet.
 *
 * Before matching, line continuations are folded: an unescaped backslash
 * directly before a line break, together with any spaces/tabs that start the
 * next line, is replaced by a single space. Both LF and CRLF line breaks are
 * recognised. Error positions refer to the text after this folding.
 *
 * @param code - code to parse
 * @returns `[true, script]` with the parsed list of commands on success, or
 *   `[false, message]` where `message` is an HTML `<pre>` block describing
 *   the failure
 */
export function parse(code: string): [true, Script] | [false, string] {
  /* Preprocess */
  // Fold line continuations. The lookbehind plus the `(\\\\)*` group keep any
  // preceding pairs of backslashes (i.e. escaped backslashes) intact, so only
  // an odd trailing backslash joins lines. `\r?` lets CRLF input fold exactly
  // like LF input instead of leaving a stray escaped carriage return.
  const folded = code.replace(/(?<!\\)((\\\\)*)\\\r?\n[ \t]*/g, "$1 ");

  /* Parse */
  const [commands, errorPos, expected] = Script.match(folded, 0);
  if (commands) {
    return [true, commands[0]];
  }

  /* Report the failure with up to 50 characters of context on each side */
  ERROR_CONTEXT.lastIndex = errorPos;
  const context = ERROR_CONTEXT.exec(folded);
  // The regex can match the empty string, so a miss is not expected; fall
  // back to empty context rather than throwing while building the message.
  const before = context ? context[1] : "";
  const after = context ? context[2] : "";
  return [
    false,
    `<pre>Error at position ${errorPos}
${escapeHtml(before + after)}
${"-".repeat(before.length)}^
Expected: ${escapeHtml(expected)}</pre>`,
  ];
}