import {TYPE_WORD, TYPE_TAG, TYPE_ATTR_NAME, TYPE_ATTR_VALUE, TYPE_SPACE, TYPE_NEW_LINE} from '../src/Token' import { createLexer } from '../src/lexer' const TYPE = { WORD: TYPE_WORD, TAG: TYPE_TAG, ATTR_NAME: TYPE_ATTR_NAME, ATTR_VALUE: TYPE_ATTR_VALUE, SPACE: TYPE_SPACE, NEW_LINE: TYPE_NEW_LINE, }; const tokenize = input => (createLexer(input).tokenize()); describe('lexer', () => { const expectOutput = (output, tokens) => { expect(tokens.length).toBe(output.length); expect(tokens).toBeInstanceOf(Array); tokens.forEach((token, idx) => { expect(token).toBeInstanceOf(Object); expect(token.type).toEqual(output[idx][0]); expect(token.value).toEqual(output[idx][1]); }); }; test('single tag', () => { const input = '[SingleTag]'; const tokens = tokenize(input); const output = [ [TYPE.TAG, 'SingleTag', '0', '0'], ]; expectOutput(output, tokens); }); test('single tag with params', () => { const input = '[user=111]'; const tokens = tokenize(input); const output = [ [TYPE.TAG, 'user', '0', '0'], [TYPE.ATTR_VALUE, '111', '0', '0'], ]; expectOutput(output, tokens); }); test('single tag with spaces', () => { const input = '[Single Tag]'; const tokens = tokenize(input); const output = [ [TYPE.TAG, 'Single Tag', '0', '0'], ]; expectOutput(output, tokens); }); test('string with quotemarks', () => { const input = '"Someone Like You" by Adele'; const tokens = tokenize(input); const output = [ [TYPE.WORD, '"Someone', '0', '0'], [TYPE.SPACE, ' ', '8', '0'], [TYPE.WORD, 'Like', '8', '0'], [TYPE.SPACE, ' ', '13', '0'], [TYPE.WORD, 'You"', '13', '0'], [TYPE.SPACE, ' ', '18', '0'], [TYPE.WORD, 'by', '18', '0'], [TYPE.SPACE, ' ', '21', '0'], [TYPE.WORD, 'Adele', '21', '0'], ]; expectOutput(output, tokens); }); test('tags in brakets', () => { const input = '[ [h1]G[/h1] ]'; const tokens = tokenize(input); const output = [ [TYPE.WORD, '[', '0', '0'], [TYPE.SPACE, ' ', '1', '0'], [TYPE.TAG, 'h1', '2', '0'], [TYPE.WORD, 'G', '1', '0'], [TYPE.TAG, '/h1', '7', '0'], [TYPE.SPACE, ' ', '12', '0'], [TYPE.WORD, ']', '7', '0'], ]; expectOutput(output, tokens); }); test('tag as param', () => { const input = '[color="#ff0000"]Text[/color]'; const tokens = tokenize(input); const output = [ [TYPE.TAG, 'color', '0', '0'], [TYPE.ATTR_VALUE, '#ff0000', '6', '0'], [TYPE.WORD, 'Text', '17', '0'], [TYPE.TAG, '/color', '21', '0'], ]; expectOutput(output, tokens); }); test('tag with quotemark params with spaces', () => { const input = '[url text="Foo Bar" text2="Foo Bar 2"]Text[/url]'; const tokens = tokenize(input); const output = [ [TYPE.TAG, 'url', '0', '0'], [TYPE.ATTR_NAME, 'text', '4', '0'], [TYPE.ATTR_VALUE, 'Foo Bar', '9', '0'], [TYPE.ATTR_NAME, 'text2', '4', '0'], [TYPE.ATTR_VALUE, 'Foo Bar 2', '9', '0'], [TYPE.WORD, 'Text', '20', '0'], [TYPE.TAG, '/url', '24', '0'], ]; expectOutput(output, tokens); }); test('tag with escaped quotemark param', () => { const input = `[url text="Foo \\"Bar"]Text[/url]`; const tokens = tokenize(input); const output = [ [TYPE.TAG, 'url', '0', '0'], [TYPE.ATTR_NAME, 'text', '4', '0'], [TYPE.ATTR_VALUE, 'Foo "Bar', '9', '0'], [TYPE.WORD, 'Text', '22', '0'], [TYPE.TAG, '/url', '26', '0'], ]; expectOutput(output, tokens); }); test('tag param without quotemarks', () => { const input = '[style color=#ff0000]Text[/style]'; const tokens = tokenize(input); const output = [ [TYPE.TAG, 'style', '0', '0'], [TYPE.ATTR_NAME, 'color', '6', '0'], [TYPE.ATTR_VALUE, '#ff0000', '12', '0'], [TYPE.WORD, 'Text', '21', '0'], [TYPE.TAG, '/style', '25', '0'], ]; expectOutput(output, tokens); }); test('list tag with items', () => { const input = `[list] [*] Item 1. [*] Item 2. [*] Item 3. [/list]`; const tokens = tokenize(input); const output = [ [TYPE.TAG, 'list', '0', '0'], [TYPE.NEW_LINE, '\n', '6', '0'], [TYPE.SPACE, ' ', '0', '1'], [TYPE.TAG, '*', '3', '1'], [TYPE.SPACE, ' ', '6', '1'], [TYPE.WORD, 'Item', '7', '1'], [TYPE.SPACE, ' ', '11', '1'], [TYPE.WORD, '1.', '11', '1'], [TYPE.NEW_LINE, '\n', '14', '1'], [TYPE.SPACE, ' ', '0', '2'], [TYPE.TAG, '*', '3', '2'], [TYPE.SPACE, ' ', '6', '2'], [TYPE.WORD, 'Item', '14', '1'], [TYPE.SPACE, ' ', '11', '2'], [TYPE.WORD, '2.', '11', '2'], [TYPE.NEW_LINE, '\n', '14', '2'], [TYPE.SPACE, ' ', '0', '3'], [TYPE.TAG, '*', '3', '3'], [TYPE.SPACE, ' ', '6', '3'], [TYPE.WORD, 'Item', '14', '2'], [TYPE.SPACE, ' ', '11', '3'], [TYPE.WORD, '3.', '11', '3'], [TYPE.NEW_LINE, '\n', '14', '3'], [TYPE.TAG, '/list', '0', '4'], ]; expectOutput(output, tokens); }); test('bad tags as texts', () => { const inputs = [ '[]', '[=]', '![](image.jpg)', 'x html([a. title][, alt][, classes]) x', '[/y]', '[sc', '[sc / [/sc]', '[sc arg="val', ]; const asserts = [ [ [TYPE.WORD, '[', '0', '0'], [TYPE.WORD, ']', '0', '0'] ], [ [TYPE.WORD, '[', '0', '0'], [TYPE.WORD, '=]', '0', '0'] ], [ [TYPE.WORD, '!', '0', '0'], [TYPE.WORD, '[', '1', '0'], [TYPE.WORD, ']', '1', '0'], [TYPE.WORD, '(image.jpg)', '1', '0'], ], [ [TYPE.WORD, 'x', '0', '0'], [TYPE.SPACE, ' ', '1', '0'], [TYPE.WORD, 'html(', '1', '0'], [TYPE.TAG, 'a. title', '7', '0'], [TYPE.TAG, ', alt', '17', '0'], [TYPE.TAG, ', classes', '24', '0'], [TYPE.WORD, ')', '7', '0'], [TYPE.SPACE, ' ', '36', '0'], [TYPE.WORD, 'x', '36', '0'], ], [ [TYPE.TAG, '/y', '0', '0'] ], [ [TYPE.WORD, '[', '0', '0'], [TYPE.WORD, 'sc', '0', '0'] ], [ // [sc / [TYPE.WORD, '[', '0', '0'], [TYPE.WORD, 'sc', '0', '0'], [TYPE.SPACE, ' ', '0', '0'], [TYPE.WORD, '/', '0', '0'], [TYPE.SPACE, ' ', '0', '0'], [TYPE.TAG, '/sc', '0', '0'] ], [ [TYPE.WORD, '[', '0', '0'], [TYPE.WORD, 'sc', '0', '0'], [TYPE.SPACE, ' ', '0', '0'], [TYPE.WORD, 'arg="val', '0', '0'], ] ]; inputs.forEach((input, idx) => { const tokens = tokenize(input); const output = asserts[idx]; expectOutput(output, tokens); }); }); test('bad unclosed tag', () => { const input = `[Finger Part A [Finger]`; const tokens = tokenize(input); const output = [ [TYPE.WORD, '[', '0', '0'], [TYPE.WORD, 'Finger', '0', '0'], [TYPE.SPACE, ' ', '0', '0'], [TYPE.WORD, 'Part', '0', '0'], [TYPE.SPACE, ' ', '0', '0'], [TYPE.WORD, 'A', '0', '0'], [TYPE.SPACE, ' ', '0', '0'], [TYPE.TAG, 'Finger', '0', '0'] ]; expectOutput(output, tokens); }); test('no close tag', () => { const input = '[Finger Part A'; const tokens = tokenize(input); const output = [ [TYPE.WORD, '[', '0', '0'], [TYPE.WORD, 'Finger', '0', '0'], [TYPE.SPACE, ' ', '0', '0'], [TYPE.WORD, 'Part', '0', '0'], [TYPE.SPACE, ' ', '0', '0'], [TYPE.WORD, 'A', '0', '0'], ]; expectOutput(output, tokens); }); describe('html', () => { const tokenizeHTML = input => createLexer(input, { openTag: '<', closeTag: '>' }).tokenize(); test('normal attributes', () => { const content = ``; const tokens = tokenizeHTML(content); const output = [ [TYPE.TAG, 'button', 2, 0], [TYPE.ATTR_NAME, 'id', 2, 0], [TYPE.ATTR_VALUE, 'test0', 2, 0], [TYPE.ATTR_NAME, 'class', 2, 0], [TYPE.ATTR_VALUE, 'value0', 2, 0], [TYPE.ATTR_NAME, 'title', 2, 0], [TYPE.ATTR_VALUE, 'value1', 2, 0], [TYPE.WORD, "class=\"value0\"", 2, 0], [TYPE.SPACE, " ", 2, 0], [TYPE.WORD, "title=\"value1\"", 2, 0], [TYPE.TAG, '/button', 2, 0] ]; expectOutput(output, tokens); }); test('attributes with no quotes or value', () => { const content = ``; const tokens = tokenizeHTML(content); const output = [ [TYPE.TAG, 'button', 2, 0], [TYPE.ATTR_NAME, 'id', 2, 0], [TYPE.ATTR_VALUE, 'test1', 2, 0], [TYPE.ATTR_NAME, 'class', 2, 0], [TYPE.ATTR_VALUE, 'value2', 2, 0], [TYPE.ATTR_VALUE, 'disabled', 2, 0], [TYPE.WORD, "class=value2", 2, 0], [TYPE.SPACE, " ", 2, 0], [TYPE.WORD, "disabled", 2, 0], [TYPE.TAG, '/button', 2, 0] ]; expectOutput(output, tokens); }); test('attributes with no space between them. No valid, but accepted by the browser', () => { const content = ``; const tokens = tokenizeHTML(content); const output = [ [TYPE.TAG, 'button', 2, 0], [TYPE.ATTR_NAME, 'id', 2, 0], [TYPE.ATTR_VALUE, 'test2', 2, 0], [TYPE.ATTR_NAME, 'class', 2, 0], [TYPE.ATTR_VALUE, 'value4', 2, 0], [TYPE.ATTR_NAME, 'title', 2, 0], [TYPE.ATTR_VALUE, 'value5', 2, 0], [TYPE.WORD, "class=\"value4\"title=\"value5\"", 2, 0], [TYPE.TAG, '/button', 2, 0] ]; expectOutput(output, tokens); }); test.skip('style tag', () => { const content = `` const tokens = tokenizeHTML(content); const output = []; expectOutput(output, tokens); }); test.skip('script tag', () => { const content = ``; const tokens = tokenizeHTML(content); const output = []; expectOutput(output, tokens); }) }) });