123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458 |
- 'use strict'
- var assert = require('assert')
- var asciiAlpha = require('../character/ascii-alpha.js')
- var asciiAlphanumeric = require('../character/ascii-alphanumeric.js')
- var codes = require('../character/codes.js')
- var markdownLineEnding = require('../character/markdown-line-ending.js')
- var markdownLineEndingOrSpace = require('../character/markdown-line-ending-or-space.js')
- var markdownSpace = require('../character/markdown-space.js')
- var constants = require('../constant/constants.js')
- var types = require('../constant/types.js')
- var factorySpace = require('./factory-space.js')
- function _interopDefaultLegacy(e) {
- return e && typeof e === 'object' && 'default' in e ? e : {default: e}
- }
- var assert__default = /*#__PURE__*/ _interopDefaultLegacy(assert)
- var htmlText = {
- name: 'htmlText',
- tokenize: tokenizeHtmlText
- }
- function tokenizeHtmlText(effects, ok, nok) {
- var self = this
- var marker
- var buffer
- var index
- var returnState
- return start
- function start(code) {
- assert__default['default'](code === codes.lessThan, 'expected `<`')
- effects.enter(types.htmlText)
- effects.enter(types.htmlTextData)
- effects.consume(code)
- return open
- }
- function open(code) {
- if (code === codes.exclamationMark) {
- effects.consume(code)
- return declarationOpen
- }
- if (code === codes.slash) {
- effects.consume(code)
- return tagCloseStart
- }
- if (code === codes.questionMark) {
- effects.consume(code)
- return instruction
- }
- if (asciiAlpha(code)) {
- effects.consume(code)
- return tagOpen
- }
- return nok(code)
- }
- function declarationOpen(code) {
- if (code === codes.dash) {
- effects.consume(code)
- return commentOpen
- }
- if (code === codes.leftSquareBracket) {
- effects.consume(code)
- buffer = constants.cdataOpeningString
- index = 0
- return cdataOpen
- }
- if (asciiAlpha(code)) {
- effects.consume(code)
- return declaration
- }
- return nok(code)
- }
- function commentOpen(code) {
- if (code === codes.dash) {
- effects.consume(code)
- return commentStart
- }
- return nok(code)
- }
- function commentStart(code) {
- if (code === codes.eof || code === codes.greaterThan) {
- return nok(code)
- }
- if (code === codes.dash) {
- effects.consume(code)
- return commentStartDash
- }
- return comment(code)
- }
- function commentStartDash(code) {
- if (code === codes.eof || code === codes.greaterThan) {
- return nok(code)
- }
- return comment(code)
- }
- function comment(code) {
- if (code === codes.eof) {
- return nok(code)
- }
- if (code === codes.dash) {
- effects.consume(code)
- return commentClose
- }
- if (markdownLineEnding(code)) {
- returnState = comment
- return atLineEnding(code)
- }
- effects.consume(code)
- return comment
- }
- function commentClose(code) {
- if (code === codes.dash) {
- effects.consume(code)
- return end
- }
- return comment(code)
- }
- function cdataOpen(code) {
- if (code === buffer.charCodeAt(index++)) {
- effects.consume(code)
- return index === buffer.length ? cdata : cdataOpen
- }
- return nok(code)
- }
- function cdata(code) {
- if (code === codes.eof) {
- return nok(code)
- }
- if (code === codes.rightSquareBracket) {
- effects.consume(code)
- return cdataClose
- }
- if (markdownLineEnding(code)) {
- returnState = cdata
- return atLineEnding(code)
- }
- effects.consume(code)
- return cdata
- }
- function cdataClose(code) {
- if (code === codes.rightSquareBracket) {
- effects.consume(code)
- return cdataEnd
- }
- return cdata(code)
- }
- function cdataEnd(code) {
- if (code === codes.greaterThan) {
- return end(code)
- }
- if (code === codes.rightSquareBracket) {
- effects.consume(code)
- return cdataEnd
- }
- return cdata(code)
- }
- function declaration(code) {
- if (code === codes.eof || code === codes.greaterThan) {
- return end(code)
- }
- if (markdownLineEnding(code)) {
- returnState = declaration
- return atLineEnding(code)
- }
- effects.consume(code)
- return declaration
- }
- function instruction(code) {
- if (code === codes.eof) {
- return nok(code)
- }
- if (code === codes.questionMark) {
- effects.consume(code)
- return instructionClose
- }
- if (markdownLineEnding(code)) {
- returnState = instruction
- return atLineEnding(code)
- }
- effects.consume(code)
- return instruction
- }
- function instructionClose(code) {
- return code === codes.greaterThan ? end(code) : instruction(code)
- }
- function tagCloseStart(code) {
- if (asciiAlpha(code)) {
- effects.consume(code)
- return tagClose
- }
- return nok(code)
- }
- function tagClose(code) {
- if (code === codes.dash || asciiAlphanumeric(code)) {
- effects.consume(code)
- return tagClose
- }
- return tagCloseBetween(code)
- }
- function tagCloseBetween(code) {
- if (markdownLineEnding(code)) {
- returnState = tagCloseBetween
- return atLineEnding(code)
- }
- if (markdownSpace(code)) {
- effects.consume(code)
- return tagCloseBetween
- }
- return end(code)
- }
- function tagOpen(code) {
- if (code === codes.dash || asciiAlphanumeric(code)) {
- effects.consume(code)
- return tagOpen
- }
- if (
- code === codes.slash ||
- code === codes.greaterThan ||
- markdownLineEndingOrSpace(code)
- ) {
- return tagOpenBetween(code)
- }
- return nok(code)
- }
- function tagOpenBetween(code) {
- if (code === codes.slash) {
- effects.consume(code)
- return end
- }
- if (code === codes.colon || code === codes.underscore || asciiAlpha(code)) {
- effects.consume(code)
- return tagOpenAttributeName
- }
- if (markdownLineEnding(code)) {
- returnState = tagOpenBetween
- return atLineEnding(code)
- }
- if (markdownSpace(code)) {
- effects.consume(code)
- return tagOpenBetween
- }
- return end(code)
- }
- function tagOpenAttributeName(code) {
- if (
- code === codes.dash ||
- code === codes.dot ||
- code === codes.colon ||
- code === codes.underscore ||
- asciiAlphanumeric(code)
- ) {
- effects.consume(code)
- return tagOpenAttributeName
- }
- return tagOpenAttributeNameAfter(code)
- }
- function tagOpenAttributeNameAfter(code) {
- if (code === codes.equalsTo) {
- effects.consume(code)
- return tagOpenAttributeValueBefore
- }
- if (markdownLineEnding(code)) {
- returnState = tagOpenAttributeNameAfter
- return atLineEnding(code)
- }
- if (markdownSpace(code)) {
- effects.consume(code)
- return tagOpenAttributeNameAfter
- }
- return tagOpenBetween(code)
- }
- function tagOpenAttributeValueBefore(code) {
- if (
- code === codes.eof ||
- code === codes.lessThan ||
- code === codes.equalsTo ||
- code === codes.greaterThan ||
- code === codes.graveAccent
- ) {
- return nok(code)
- }
- if (code === codes.quotationMark || code === codes.apostrophe) {
- effects.consume(code)
- marker = code
- return tagOpenAttributeValueQuoted
- }
- if (markdownLineEnding(code)) {
- returnState = tagOpenAttributeValueBefore
- return atLineEnding(code)
- }
- if (markdownSpace(code)) {
- effects.consume(code)
- return tagOpenAttributeValueBefore
- }
- effects.consume(code)
- marker = undefined
- return tagOpenAttributeValueUnquoted
- }
- function tagOpenAttributeValueQuoted(code) {
- if (code === marker) {
- effects.consume(code)
- return tagOpenAttributeValueQuotedAfter
- }
- if (code === codes.eof) {
- return nok(code)
- }
- if (markdownLineEnding(code)) {
- returnState = tagOpenAttributeValueQuoted
- return atLineEnding(code)
- }
- effects.consume(code)
- return tagOpenAttributeValueQuoted
- }
- function tagOpenAttributeValueQuotedAfter(code) {
- if (
- code === codes.greaterThan ||
- code === codes.slash ||
- markdownLineEndingOrSpace(code)
- ) {
- return tagOpenBetween(code)
- }
- return nok(code)
- }
- function tagOpenAttributeValueUnquoted(code) {
- if (
- code === codes.eof ||
- code === codes.quotationMark ||
- code === codes.apostrophe ||
- code === codes.lessThan ||
- code === codes.equalsTo ||
- code === codes.graveAccent
- ) {
- return nok(code)
- }
- if (code === codes.greaterThan || markdownLineEndingOrSpace(code)) {
- return tagOpenBetween(code)
- }
- effects.consume(code)
- return tagOpenAttributeValueUnquoted
- }
- // We can’t have blank lines in content, so no need to worry about empty
- // tokens.
- function atLineEnding(code) {
- assert__default['default'](returnState, 'expected return state')
- assert__default['default'](markdownLineEnding(code), 'expected eol')
- effects.exit(types.htmlTextData)
- effects.enter(types.lineEnding)
- effects.consume(code)
- effects.exit(types.lineEnding)
- return factorySpace(
- effects,
- afterPrefix,
- types.linePrefix,
- self.parser.constructs.disable.null.indexOf('codeIndented') > -1
- ? undefined
- : constants.tabSize
- )
- }
- function afterPrefix(code) {
- effects.enter(types.htmlTextData)
- return returnState(code)
- }
- function end(code) {
- if (code === codes.greaterThan) {
- effects.consume(code)
- effects.exit(types.htmlTextData)
- effects.exit(types.htmlText)
- return ok
- }
- return nok(code)
- }
- }
- module.exports = htmlText
|