markdown-it/lib/rules_block/state_block.mjs

// Parser state class

import Token from '../token.mjs'
import { isSpace } from '../common/utils.mjs'


// Block-level parser state.
//
// Keeps references to the source text, the parser instance, the environment
// and the output token list, then scans the source once to fill the per-line
// lookup tables used by the helper methods on the prototype.
//
// - src    - source string to scan
// - md     - parser instance, stored as `this.md`
// - env    - environment value, stored untouched
// - tokens - array that `push()` appends new tokens to
//
function StateBlock (src, md, env, tokens) {
  this.src = src

  // link to parser instance
  this.md = md

  this.env = env

  //
  // Internal state variables
  //

  this.tokens = tokens

  // Per-line tables (index === line number)
  this.bMarks = [] // offset of the first character of the line
  this.eMarks = [] // offset just past the last character of the line (its LF, or src length)
  this.tShift = [] // count of leading space characters, tabs counted as one
  this.sCount = [] // width of that leading indent with tabs expanded to 4-column stops

  // Number of virtual columns (tabs expanded) that sit between the recorded
  // line start (bMarks) and the real start of the line.
  //
  // This is a workaround: blockquotes overwrite bMarks and the original
  // column information is lost in the process.
  //
  // The value matters only while expanding tabs. Think of it as the column
  // the first tab starts from, e.g. bsCount=21 applied to string `\t123`
  // means the first tab expands to 4-21%4 === 3 spaces.
  //
  this.bsCount = []

  // block parser variables

  // indent required for block content (inside a list, for example, this is
  // the position right after the list marker)
  this.blkIndent = 0
  this.line = 0 // line index in src
  this.lineMax = 0 // lines count
  this.tight = false // loose/tight mode for lists
  this.ddIndent = -1 // indent of the current dd block (-1 if there isn't any)
  this.listIndent = -1 // indent of the current list block (-1 if there isn't any)

  // one of 'blockquote', 'list', 'root', 'paragraph' or 'reference';
  // lists consult it to decide whether they may interrupt a paragraph
  this.parentType = 'root'

  this.level = 0

  // Build the per-line tables in a single pass over the source.
  const text = this.src
  const total = text.length

  let lineStart = 0
  let rawIndent = 0 // leading space characters seen on the current line
  let expandedIndent = 0 // same indent measured in columns
  let inIndent = true // still inside the leading whitespace of the line
  let cursor = 0

  while (cursor < total) {
    const code = text.charCodeAt(cursor)

    if (inIndent && isSpace(code)) {
      rawIndent++
      // a tab jumps to the next multiple of 4, anything else is one column
      expandedIndent += code === 0x09 ? 4 - expandedIndent % 4 : 1
      cursor++
      // NOTE: this early `continue` also skips the end-of-input check below,
      // so a final line made only of space characters (no LF) gets no entry.
      continue
    }
    inIndent = false

    const isLineFeed = code === 0x0A

    if (isLineFeed || cursor === total - 1) {
      // an unterminated last line ends one past its final character
      const lineEnd = isLineFeed ? cursor : cursor + 1

      this.bMarks.push(lineStart)
      this.eMarks.push(lineEnd)
      this.tShift.push(rawIndent)
      this.sCount.push(expandedIndent)
      this.bsCount.push(0)

      inIndent = true
      rawIndent = 0
      expandedIndent = 0
      lineStart = lineEnd + 1
      cursor = lineEnd
    }

    cursor++
  }

  // Trailing sentinel entry, so lookups at `lineMax` need no bounds checks
  this.bMarks.push(text.length)
  this.eMarks.push(text.length)
  this.tShift.push(0)
  this.sCount.push(0)
  this.bsCount.push(0)

  this.lineMax = this.bMarks.length - 1 // the sentinel is not a real line
}

// Create a block token, stamp it with the current nesting level and append
// it to `this.tokens`.
//
// - type, tag, nesting - forwarded unchanged to the Token constructor
//
// A negative `nesting` (closing tag) lowers `this.level` before the token is
// stamped; a positive one (opening tag) raises it afterwards. As a result an
// opening token and its closing token carry the same level.
//
// Returns the newly created token.
//
StateBlock.prototype.push = function (type, tag, nesting) {
  const created = new Token(type, tag, nesting)
  created.block = true

  const closes = nesting < 0
  const opens = nesting > 0

  if (closes) { --this.level }
  created.level = this.level
  if (opens) { ++this.level }

  this.tokens.push(created)
  return created
}

// Tell whether a line has no content after its leading indent, i.e. the
// first non-indent position (bMarks + tShift) is at or past the line end.
StateBlock.prototype.isEmpty = function isEmpty (line) {
  const contentStart = this.bMarks[line] + this.tShift[line]
  const lineEnd = this.eMarks[line]

  return contentStart >= lineEnd
}

// Starting at line `from`, step over lines that have no content after their
// indent. Returns the index of the first line with content, or the value
// reached at `lineMax` when every remaining line is empty.
StateBlock.prototype.skipEmptyLines = function skipEmptyLines (from) {
  const limit = this.lineMax
  let line = from

  while (line < limit) {
    const contentStart = this.bMarks[line] + this.tShift[line]

    if (contentStart < this.eMarks[line]) {
      return line
    }
    line++
  }

  return line
}

// Advance from `pos` over consecutive space characters (as judged by
// `isSpace`). Returns the offset of the first non-space character, or the
// source length when the run reaches the end of the source.
StateBlock.prototype.skipSpaces = function skipSpaces (pos) {
  const text = this.src
  const end = text.length
  let cursor = pos

  while (cursor < end && isSpace(text.charCodeAt(cursor))) {
    cursor++
  }

  return cursor
}

// Walk backwards from `pos` over space characters (as judged by `isSpace`),
// looking at the character just before the current position and never going
// below `min`. Returns the offset right after the last non-space character
// found, or `min` when everything between `min` and `pos` is a space.
StateBlock.prototype.skipSpacesBack = function skipSpacesBack (pos, min) {
  let cursor = pos

  while (cursor > min && isSpace(this.src.charCodeAt(cursor - 1))) {
    cursor--
  }

  return cursor
}

// Advance from `pos` while the character code at the current offset equals
// `code`. Returns the offset of the first different character, or the
// source length when the run reaches the end of the source.
StateBlock.prototype.skipChars = function skipChars (pos, code) {
  const text = this.src
  const end = text.length
  let cursor = pos

  while (cursor < end && text.charCodeAt(cursor) === code) {
    cursor++
  }

  return cursor
}

// Walk backwards from `pos` while the character just before the current
// position has character code `code`, never going below `min`. Returns the
// offset right after the last different character found, or `min` when
// everything between `min` and `pos` matches.
StateBlock.prototype.skipCharsBack = function skipCharsBack (pos, code, min) {
  let cursor = pos

  while (cursor > min && this.src.charCodeAt(cursor - 1) === code) {
    cursor--
  }

  return cursor
}

// Extract the text of lines `begin` (inclusive) to `end` (exclusive),
// removing up to `indent` columns of leading indentation from each line.
//
// - begin, end  - line range; an empty or inverted range yields ''
// - indent      - number of indent columns (tabs expanded) to strip
// - keepLastLF  - when truthy, the final line's slice also extends one
//                 character past its eMarks offset; all earlier lines in
//                 the range always do
//
// Returns the concatenated line slices as a single string.
//
StateBlock.prototype.getLines = function getLines (begin, end, indent, keepLastLF) {
  if (begin >= end) {
    return ''
  }

  const pieces = []

  for (let line = begin; line < end; line++) {
    const lineStart = this.bMarks[line]
    const wantsLineFeed = line + 1 < end || keepLastLF

    // Reading one past eMarks needs no bounds check: the tables end with a
    // sentinel entry and slicing past the end of the source is harmless.
    const sliceEnd = wantsLineFeed ? this.eMarks[line] + 1 : this.eMarks[line]

    let cursor = lineStart
    let consumed = 0 // indent columns stripped so far

    while (cursor < sliceEnd && consumed < indent) {
      const code = this.src.charCodeAt(cursor)

      if (isSpace(code)) {
        // a tab runs to the next 4-column stop, offset by the line's bsCount
        consumed += code === 0x09 ? 4 - (consumed + this.bsCount[line]) % 4 : 1
      } else if (cursor - lineStart < this.tShift[line]) {
        // characters masked by a patched tShift (blockquote or list markers)
        // are treated as one column of indent each
        consumed++
      } else {
        break
      }

      cursor++
    }

    const rest = this.src.slice(cursor, sliceEnd)

    if (consumed > indent) {
      // A tab overshot the requested indent: give the surplus columns back
      // as spaces, e.g. '\t\tfoobar' with indent=2 becomes '  \tfoobar'.
      pieces.push(' '.repeat(consumed - indent) + rest)
    } else {
      pieces.push(rest)
    }
  }

  return pieces.join('')
}

// Re-export the Token class on the prototype, so block rules can reach it
// through any state instance (`state.Token`).
StateBlock.prototype.Token = Token


export default StateBlock
Splitted block lexer & index to files 10 years ago			`// Parser state class`

standard: remove semi 1 year ago			`import Token from '../token.mjs'`
			`import { isSpace } from '../common/utils.mjs'`
Use a common class for tokens 10 years ago
Splitted block lexer & index to files 10 years ago
standard: space before function params 1 year ago			`function StateBlock (src, md, env, tokens) {`
standard: remove semi 1 year ago			`this.src = src`
Splitted block lexer & index to files 10 years ago
Place md link to states and remove other aliases 10 years ago			`// link to parser instance`
standard: remove semi 1 year ago			`this.md = md`
Splitted block lexer & index to files 10 years ago
standard: remove semi 1 year ago			`this.env = env`
Parse link reference definitions 10 years ago
Splitted block lexer & index to files 10 years ago			`//`
			`// Internal state vartiables`
			`//`

standard: remove semi 1 year ago			`this.tokens = tokens`
Splitted block lexer & index to files 10 years ago
standard: remove semi 1 year ago			`this.bMarks = [] // line begin offsets for fast jumps`
			`this.eMarks = [] // line end offsets for fast jumps`
			`this.tShift = [] // offsets of the first non-space characters (tabs not expanded)`
			`this.sCount = [] // indents for each line (tabs expanded)`
Splitted block lexer & index to files 10 years ago
Fix tab behavior inside blockquotes 8 years ago			`// An amount of virtual spaces (tabs expanded) between beginning`
			`// of each line (bMarks) and real beginning of that line.`
			`//`
			`// It exists only as a hack because blockquotes override bMarks`
			`// losing information in the process.`
			`//`
			`// It's used only when expanding tabs, you can think about it as`
			// an initial tab length, e.g. bsCount=21 applied to string `\t123`
			`// means first tab should be expanded to 4-21%4 === 3 spaces.`
			`//`
standard: remove semi 1 year ago			`this.bsCount = []`
Fix tab behavior inside blockquotes 8 years ago
Perf: speedup cache creation in StateBlock 10 years ago			`// block parser variables`
standard: more tweaks & simplify eslint config 1 year ago
			`// required block content indent (for example, if we are`
			`// inside a list, it would be positioned after list marker)`
			`this.blkIndent = 0`
standard: remove semi 1 year ago			`this.line = 0 // line index in src`
			`this.lineMax = 0 // lines count`
			`this.tight = false // loose/tight mode for lists`
			`this.ddIndent = -1 // indent of the current dd block (-1 if there isn't any)`
			`this.listIndent = -1 // indent of the current list block (-1 if there isn't any)`
Perf: speedup cache creation in StateBlock 10 years ago
Fix lists and headings 8 years ago			`// can be 'blockquote', 'list', 'root', 'paragraph' or 'reference'`
			`// used in lists to determine if they interrupt a paragraph`
standard: remove semi 1 year ago			`this.parentType = 'root'`
Fix lists and headings 8 years ago
standard: remove semi 1 year ago			`this.level = 0`
Perf: speedup cache creation in StateBlock 10 years ago
			`// Create caches`
Splitted block lexer & index to files 10 years ago			`// Generate markers.`
standard: remove semi 1 year ago			`const s = this.src`
Splitted block lexer & index to files 10 years ago
var => const, let 1 year ago			`for (let start = 0, pos = 0, indent = 0, offset = 0, len = s.length, indent_found = false; pos < len; pos++) {`
standard: remove semi 1 year ago			`const ch = s.charCodeAt(pos)`
Splitted block lexer & index to files 10 years ago
Perf: speedup cache creation in StateBlock 10 years ago			`if (!indent_found) {`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`if (isSpace(ch)) {`
standard: remove semi 1 year ago			`indent++`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago
			`if (ch === 0x09) {`
standard: remove semi 1 year ago			`offset += 4 - offset % 4`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`} else {`
standard: remove semi 1 year ago			`offset++`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`}`
standard: remove semi 1 year ago			`continue`
Perf: speedup cache creation in StateBlock 10 years ago			`} else {`
standard: remove semi 1 year ago			`indent_found = true`
Perf: speedup cache creation in StateBlock 10 years ago			`}`
Splitted block lexer & index to files 10 years ago			`}`

StateBlock() cleanup 10 years ago			`if (ch === 0x0A \|\| pos === len - 1) {`
standard: remove semi 1 year ago			`if (ch !== 0x0A) { pos++ }`
			`this.bMarks.push(start)`
			`this.eMarks.push(pos)`
			`this.tShift.push(indent)`
			`this.sCount.push(offset)`
			`this.bsCount.push(0)`

			`indent_found = false`
			`indent = 0`
			`offset = 0`
			`start = pos + 1`
Splitted block lexer & index to files 10 years ago			`}`
			`}`

Rewritten string fetch for inline tokenizer + list fixes 10 years ago			`// Push fake entry to simplify cache bounds checks`
standard: remove semi 1 year ago			`this.bMarks.push(s.length)`
			`this.eMarks.push(s.length)`
			`this.tShift.push(0)`
			`this.sCount.push(0)`
			`this.bsCount.push(0)`
Rewritten string fetch for inline tokenizer + list fixes 10 years ago
standard: remove semi 1 year ago			`this.lineMax = this.bMarks.length - 1 // don't count last fake line`
Splitted block lexer & index to files 10 years ago			`}`

Use a common class for tokens 10 years ago			`// Push new token to "stream".`
			`//`
			`StateBlock.prototype.push = function (type, tag, nesting) {`
standard: remove semi 1 year ago			`const token = new Token(type, tag, nesting)`
			`token.block = true`
Use a common class for tokens 10 years ago
standard: remove semi 1 year ago			`if (nesting < 0) this.level-- // closing tag`
			`token.level = this.level`
			`if (nesting > 0) this.level++ // opening tag`
Use a common class for tokens 10 years ago
standard: remove semi 1 year ago			`this.tokens.push(token)`
			`return token`
			`}`
Use a common class for tokens 10 years ago
standard: space before function params 1 year ago			`StateBlock.prototype.isEmpty = function isEmpty (line) {`
standard: remove semi 1 year ago			`return this.bMarks[line] + this.tShift[line] >= this.eMarks[line]`
			`}`
Moved state helpers to State* classes 10 years ago
standard: space before function params 1 year ago			`StateBlock.prototype.skipEmptyLines = function skipEmptyLines (from) {`
var => const, let 1 year ago			`for (let max = this.lineMax; from < max; from++) {`
Moved state helpers to State* classes 10 years ago			`if (this.bMarks[from] + this.tShift[from] < this.eMarks[from]) {`
standard: remove semi 1 year ago			`break`
Moved state helpers to State* classes 10 years ago			`}`
			`}`
standard: remove semi 1 year ago			`return from`
			`}`
Moved state helpers to State* classes 10 years ago
			`// Skip spaces from given position.`
standard: space before function params 1 year ago			`StateBlock.prototype.skipSpaces = function skipSpaces (pos) {`
var => const, let 1 year ago			`for (let max = this.src.length; pos < max; pos++) {`
standard: remove semi 1 year ago			`const ch = this.src.charCodeAt(pos)`
			`if (!isSpace(ch)) { break }`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`}`
standard: remove semi 1 year ago			`return pos`
			`}`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago
			`// Skip spaces from given position in reverse.`
standard: space before function params 1 year ago			`StateBlock.prototype.skipSpacesBack = function skipSpacesBack (pos, min) {`
standard: remove semi 1 year ago			`if (pos <= min) { return pos }`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago
			`while (pos > min) {`
standard: remove semi 1 year ago			`if (!isSpace(this.src.charCodeAt(--pos))) { return pos + 1 }`
Moved state helpers to State* classes 10 years ago			`}`
standard: remove semi 1 year ago			`return pos`
			`}`
Moved state helpers to State* classes 10 years ago
			`// Skip char codes from given position`
standard: space before function params 1 year ago			`StateBlock.prototype.skipChars = function skipChars (pos, code) {`
var => const, let 1 year ago			`for (let max = this.src.length; pos < max; pos++) {`
standard: remove semi 1 year ago			`if (this.src.charCodeAt(pos) !== code) { break }`
Moved state helpers to State* classes 10 years ago			`}`
standard: remove semi 1 year ago			`return pos`
			`}`
Moved state helpers to State* classes 10 years ago
			`// Skip char codes reverse from given position - 1`
standard: space before function params 1 year ago			`StateBlock.prototype.skipCharsBack = function skipCharsBack (pos, code, min) {`
standard: remove semi 1 year ago			`if (pos <= min) { return pos }`
Moved state helpers to State* classes 10 years ago
			`while (pos > min) {`
standard: remove semi 1 year ago			`if (code !== this.src.charCodeAt(--pos)) { return pos + 1 }`
Moved state helpers to State* classes 10 years ago			`}`
standard: remove semi 1 year ago			`return pos`
			`}`
Moved state helpers to State* classes 10 years ago
			`// cut lines range from source.`
standard: space before function params 1 year ago			`StateBlock.prototype.getLines = function getLines (begin, end, indent, keepLastLF) {`
Moved state helpers to State* classes 10 years ago			`if (begin >= end) {`
standard: remove semi 1 year ago			`return ''`
Moved state helpers to State* classes 10 years ago			`}`

standard: remove semi 1 year ago			`const queue = new Array(end - begin)`
Moved state helpers to State* classes 10 years ago
var => const, let 1 year ago			`for (let i = 0, line = begin; line < end; line++, i++) {`
standard: remove semi 1 year ago			`let lineIndent = 0`
			`const lineStart = this.bMarks[line]`
			`let first = lineStart`
			`let last`
Moved state helpers to State* classes 10 years ago
			`if (line + 1 < end \|\| keepLastLF) {`
			`// No need for bounds check because we have fake entry on tail.`
standard: remove semi 1 year ago			`last = this.eMarks[line] + 1`
Moved state helpers to State* classes 10 years ago			`} else {`
standard: remove semi 1 year ago			`last = this.eMarks[line]`
Moved state helpers to State* classes 10 years ago			`}`

Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`while (first < last && lineIndent < indent) {`
standard: remove semi 1 year ago			`const ch = this.src.charCodeAt(first)`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago
			`if (isSpace(ch)) {`
			`if (ch === 0x09) {`
standard: remove semi 1 year ago			`lineIndent += 4 - (lineIndent + this.bsCount[line]) % 4`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`} else {`
standard: remove semi 1 year ago			`lineIndent++`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`}`
			`} else if (first - lineStart < this.tShift[line]) {`
			`// patched tShift masked characters to look like spaces (blockquotes, list markers)`
standard: remove semi 1 year ago			`lineIndent++`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`} else {`
standard: remove semi 1 year ago			`break`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`}`

standard: remove semi 1 year ago			`first++`
Expand tabs only when it's needed, as per CommonMark 0.21 10 years ago			`}`

Partially fix tabs inside code blocks 8 years ago			`if (lineIndent > indent) {`
			`// partially expanding tabs in code blocks, e.g '\t\tfoobar'`
			`// with indent=2 becomes ' \tfoobar'`
standard: remove semi 1 year ago			`queue[i] = new Array(lineIndent - indent + 1).join(' ') + this.src.slice(first, last)`
Partially fix tabs inside code blocks 8 years ago			`} else {`
standard: remove semi 1 year ago			`queue[i] = this.src.slice(first, last)`
Partially fix tabs inside code blocks 8 years ago			`}`
Moved state helpers to State* classes 10 years ago			`}`

standard: remove semi 1 year ago			`return queue.join('')`
			`}`
Splitted block lexer & index to files 10 years ago
Add StateCore.Token and StateCore.push() so all state objects would have roughly the same interface 10 years ago			`// re-export Token class to use in block rules`
standard: remove semi 1 year ago			`StateBlock.prototype.Token = Token`
Make Token class accessible from a State 10 years ago
Implemented nested blocks lexing, now block quotes works as expected 10 years ago
standard: remove semi 1 year ago			`export default StateBlock`