mirror of
https://github.com/denoland/deno.git
synced 2025-01-16 19:04:02 -05:00
70 lines
1.6 KiB
TypeScript
70 lines
1.6 KiB
TypeScript
|
export type Token = {
|
||
|
type: string;
|
||
|
value: string | number;
|
||
|
index: number;
|
||
|
};
|
||
|
|
||
|
interface ReceiverResult {
|
||
|
[name: string]: string | number;
|
||
|
}
|
||
|
export type CallbackResult = { type: string; value: string | number };
|
||
|
type CallbackFunction = (value: unknown) => CallbackResult;
|
||
|
|
||
|
export type TestResult = { value: unknown; length: number } | undefined;
|
||
|
export type TestFunction = (
|
||
|
string: string,
|
||
|
) => TestResult | undefined;
|
||
|
|
||
|
export interface Rule {
|
||
|
test: TestFunction;
|
||
|
fn: CallbackFunction;
|
||
|
}
|
||
|
|
||
|
export class Tokenizer {
|
||
|
rules: Rule[];
|
||
|
|
||
|
constructor(rules: Rule[] = []) {
|
||
|
this.rules = rules;
|
||
|
}
|
||
|
|
||
|
addRule(test: TestFunction, fn: CallbackFunction): Tokenizer {
|
||
|
this.rules.push({ test, fn });
|
||
|
return this;
|
||
|
}
|
||
|
|
||
|
tokenize(
|
||
|
string: string,
|
||
|
receiver = (token: Token): ReceiverResult => token,
|
||
|
): ReceiverResult[] {
|
||
|
function* generator(rules: Rule[]): IterableIterator<ReceiverResult> {
|
||
|
let index = 0;
|
||
|
for (const rule of rules) {
|
||
|
const result = rule.test(string);
|
||
|
if (result) {
|
||
|
const { value, length } = result;
|
||
|
index += length;
|
||
|
string = string.slice(length);
|
||
|
const token = { ...rule.fn(value), index };
|
||
|
yield receiver(token);
|
||
|
yield* generator(rules);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
const tokenGenerator = generator(this.rules);
|
||
|
|
||
|
const tokens: ReceiverResult[] = [];
|
||
|
|
||
|
for (const token of tokenGenerator) {
|
||
|
tokens.push(token);
|
||
|
}
|
||
|
|
||
|
if (string.length) {
|
||
|
throw new Error(
|
||
|
`parser error: string not fully parsed! ${string.slice(0, 25)}`,
|
||
|
);
|
||
|
}
|
||
|
|
||
|
return tokens;
|
||
|
}
|
||
|
}
|