toy-html-parser

为学习如何将 HTML 代码解析为 DOM 树而自制的解析器。

lexer测试代码

// Sample document fed to the lexer: nested tags, a quoted attribute value
// containing a space, self-closing tags, a valueless attribute and a bare
// text node.
const input = `<html>
    <head>
        <title>cool</title>
    </head>
    <body class="foo bar">
        <img src="a" />
        <input disabled type="text" />
        hello world
    </body>
</html>`;

// Tokenize the sample document.
// NOTE(review): assumes run() returns an array of string tokens — confirm
// against the HTMLLexer implementation.
const parser = new HTMLLexer(input);
const rawToken = parser.run();

// Drop tokens that carry nothing but whitespace. Every token is normalized
// (newlines removed, then trimmed) and written back into rawToken; only the
// ones that are still non-empty are collected into result.
const result = [];
for (const [index, token] of rawToken.entries()) {
    const cleaned = token.replace(/[\n]/g, '').trim();
    rawToken[index] = cleaned;
    if (cleaned) {
        result.push(cleaned);
    }
}
console.log(result);

lexer输出

[ '<html>',
  '<head>',
  '<title>',
  'cool',
  '</title>',
  '</head>',
  '<body',
  'class="foo bar"',
  '>',
  '<img',
  'src="a"',
  '/>',
  '<input',
  'disabled',
  'type="text"',
  '/>',
  'hello world',
  '</body>',
  '</html>' ]

champkeh/toy-html-parser

toy-html-parser

lexer测试代码

lexer输出