nwex.de/html/tokenizer/token.ts
networkException 586546ee57 Everywhere: Rework website concept completely
This patch removes the Next.js React project that was contained
by this repository previously. The replacement is a vanilla HTML
page with TypeScript that parses it's own HTML source and highlights
it using on load.

The concept will be iterated on in following commits, planned are
on hover tooltips showing metadata about HTML tokens as well as
tokenizing (perhaps parsing) of JavaScript and CSS to be able to
highlight those sections as well. To properly determent the range
of script and style sections it might be required to also implement
HTML tree building, however on read execution of JavaScript or
on the fly parsing as well as fragment parsing is not required for
the site.

This commit merely represents a start and is made to better track
the progress of changes.
2021-10-24 22:36:38 +02:00

61 lines
No EOL
1.9 KiB
TypeScript

export const enum Type {
DOCTYPE = 'DOCTYPE',
StartTag = 'start tag',
EndTag = 'end tag',
Comment = 'comment',
Character = 'character',
EndOfFile = 'end-of-file'
}
export type Attribute = { name: NonNullable<string>, value: NonNullable<string> };
export class AttributeList {
private attributes: Array<Attribute>;
public constructor() {
this.attributes = new Array<Attribute>();
}
public get current(): Attribute {
return this.attributes[this.attributes.length - 1];
}
public get list(): Array<Attribute> {
return this.attributes;
}
public nonEmpty(): boolean {
return this.list.length !== 0;
}
public append(attribute: Attribute): void {
this.attributes.push(attribute);
}
}
export type Token = { type: Type.DOCTYPE, name?: string, publicIdentifier?: string, systemIdentifier?: string, forceQuirks?: true } |
{ type: Type.StartTag, name: NonNullable<string>, selfClosing?: true, attributes: AttributeList } |
{ type: Type.EndTag, name: NonNullable<string>, selfClosing?: true, attributes: AttributeList } |
{ type: Type.Comment, data: NonNullable<string> } |
{ type: Type.Character, data: NonNullable<string> } |
{ type: Type.EndOfFile };
export function stringify(token: Token): string {
switch (token.type) {
case Type.Character: return token.data;
case Type.Comment: return `<!--${token.data}-->`;
case Type.DOCTYPE: return `<!DOCTYPE ${token.name}>`;
case Type.EndOfFile: return 'EOF';
case Type.EndTag: return `</${token.name}>`;
case Type.StartTag: {
let string = `<${token.name}`;
for (const attribute of token.attributes.list)
string += ` ${attribute.name}="${attribute.value}"`;
if (token.selfClosing) return `${string} />`;
return `${string}>`;
};
}
}