// markdown-it/lib/rules_core/smartquotes.mjs

// Convert straight quotation marks to typographic ones
//

import { isWhiteSpace, isPunctChar, isMdAsciiPunct } from '../common/utils.mjs'

// Non-global pattern used by smartquotes() for a quick "does this string
// contain any straight quote?" check; without the `g` flag it keeps no
// position state between calls.
const QUOTE_TEST_RE = /['"]/
// Global pattern: process_inlines() assigns `lastIndex` before every `exec`
// so that the search starts at a chosen offset inside the token text.
const QUOTE_RE = /['"]/g
// Right single quotation mark (U+2019), written in place of single quotes
// that process_inlines() decides to treat as apostrophes.
const APOSTROPHE = '\u2019' /* ’ */

/**
 * Build a new string from `str` in which the single UTF-16 code unit at
 * `index` is swapped for `ch`.
 *
 * `ch` may have any length (including zero), so the result can be shorter
 * or longer than the input.
 */
function replaceAt (str, index, ch) {
  const before = str.slice(0, index)
  const after = str.slice(index + 1)

  return before + ch + after
}

/**
 * Replace straight quotes inside the text tokens of one token list with
 * typographic ones, rewriting each affected token's `content` in place.
 *
 * Quotes that may open a quotation are remembered on a stack. When a quote
 * that may close one is found, the stack is searched for an opener of the
 * same kind (single/double) recorded at the same `level`; on a match both
 * characters are replaced with the pair taken from `state.md.options.quotes`.
 * A single quote that can neither open nor close, or that can only close but
 * finds no opener, is replaced with APOSTROPHE. Everything else is left as is.
 *
 * @param {Array} tokens - tokens to scan; `type`, `level` and `content` are
 *   read, and `content` of text tokens is rewritten
 * @param {Object} state - only `state.md.options.quotes` is read here
 *   (indices 0/1: double open/close, 2/3: single open/close)
 */
function process_inlines (tokens, state) {
  // Shared loop index: its value is also read after some of the loops below
  // have finished, so it cannot be scoped to a single `for`.
  let j

  // Unmatched open-quote candidates: { token, pos, single, level }
  const stack = []

  for (let i = 0; i < tokens.length; i++) {
    const token = tokens[i]

    const thisLevel = tokens[i].level

    // Drop candidates recorded at a deeper level than the current token:
    // find the topmost entry with level <= thisLevel and cut everything above it.
    for (j = stack.length - 1; j >= 0; j--) {
      if (stack[j].level <= thisLevel) { break }
    }
    stack.length = j + 1

    // Only text tokens are rewritten; other tokens are still consulted below
    // when looking for the characters adjacent to a quote.
    if (token.type !== 'text') { continue }

    // `text`/`max` mirror token.content and are refreshed after a paired
    // replacement; `pos` is where the next quote search starts.
    let text = token.content
    let pos = 0
    let max = text.length

    /* eslint no-labels:0,block-scoped-var:0 */
    OUTER:
    while (pos < max) {
      // Search for the next straight quote starting at `pos`
      QUOTE_RE.lastIndex = pos
      const t = QUOTE_RE.exec(text)
      if (!t) { break }

      let canOpen = true
      let canClose = true
      // Resume after this quote on the next iteration (assumes a
      // one-character replacement; corrected below when it is longer)
      pos = t.index + 1
      const isSingle = (t[0] === "'")

      // Find previous character,
      // default to space if it's the beginning of the line
      //
      let lastChar = 0x20

      if (t.index - 1 >= 0) {
        lastChar = text.charCodeAt(t.index - 1)
      } else {
        // Quote is the first character of this token: look at the end of
        // the nearest preceding token that has content.
        for (j = i - 1; j >= 0; j--) {
          if (tokens[j].type === 'softbreak' || tokens[j].type === 'hardbreak') break // lastChar defaults to 0x20
          if (!tokens[j].content) continue // should skip all tokens except 'text', 'html_inline' or 'code_inline'

          lastChar = tokens[j].content.charCodeAt(tokens[j].content.length - 1)
          break
        }
      }

      // Find next character,
      // default to space if it's the end of the line
      //
      let nextChar = 0x20

      if (pos < max) {
        nextChar = text.charCodeAt(pos)
      } else {
        // Quote is the last character of this token: look at the start of
        // the nearest following token that has content.
        for (j = i + 1; j < tokens.length; j++) {
          if (tokens[j].type === 'softbreak' || tokens[j].type === 'hardbreak') break // nextChar defaults to 0x20
          if (!tokens[j].content) continue // should skip all tokens except 'text', 'html_inline' or 'code_inline'

          nextChar = tokens[j].content.charCodeAt(0)
          break
        }
      }

      // Classify the neighbours. The helpers come from ../common/utils.mjs;
      // judging by their names they test for punctuation / whitespace — see
      // that module for the exact character sets.
      const isLastPunctChar = isMdAsciiPunct(lastChar) || isPunctChar(String.fromCharCode(lastChar))
      const isNextPunctChar = isMdAsciiPunct(nextChar) || isPunctChar(String.fromCharCode(nextChar))

      const isLastWhiteSpace = isWhiteSpace(lastChar)
      const isNextWhiteSpace = isWhiteSpace(nextChar)

      // A quote followed by whitespace cannot open; one followed by
      // punctuation can open only if preceded by whitespace or punctuation.
      if (isNextWhiteSpace) {
        canOpen = false
      } else if (isNextPunctChar) {
        if (!(isLastWhiteSpace || isLastPunctChar)) {
          canOpen = false
        }
      }

      // Mirror rule for closing: a quote preceded by whitespace cannot close;
      // one preceded by punctuation can close only if followed by whitespace
      // or punctuation.
      if (isLastWhiteSpace) {
        canClose = false
      } else if (isLastPunctChar) {
        if (!(isNextWhiteSpace || isNextPunctChar)) {
          canClose = false
        }
      }

      // A double quote that is directly followed by another double quote
      // and preceded by an ASCII digit is left untouched.
      if (nextChar === 0x22 /* " */ && t[0] === '"') {
        if (lastChar >= 0x30 /* 0 */ && lastChar <= 0x39 /* 9 */) {
          // special case: 1"" - count first quote as an inch
          canClose = canOpen = false
        }
      }

      if (canOpen && canClose) {
        // Replace quotes in the middle of punctuation sequence, but not
        // in the middle of the words, i.e.:
        //
        // 1. foo " bar " baz - not replaced
        // 2. foo-"-bar-"-baz - replaced
        // 3. foo"bar"baz     - not replaced
        //
        // Still ambiguous: it may open only right after punctuation and
        // close only right before punctuation.
        canOpen = isLastPunctChar
        canClose = isNextPunctChar
      }

      if (!canOpen && !canClose) {
        // middle of word
        if (isSingle) {
          token.content = replaceAt(token.content, t.index, APOSTROPHE)
        }
        // Unlabelled continue: move on to the next quote in this token
        continue
      }

      if (canClose) {
        // this could be a closing quote, rewind the stack to get a match
        for (j = stack.length - 1; j >= 0; j--) {
          let item = stack[j]
          // Stop at the first candidate from a shallower level
          if (stack[j].level < thisLevel) { break }
          if (item.single === isSingle && stack[j].level === thisLevel) {
            // NOTE(review): this re-assignment is redundant — `item` already
            // holds stack[j] from the declaration above.
            item = stack[j]

            let openQuote
            let closeQuote
            if (isSingle) {
              openQuote = state.md.options.quotes[2]
              closeQuote = state.md.options.quotes[3]
            } else {
              openQuote = state.md.options.quotes[0]
              closeQuote = state.md.options.quotes[1]
            }

            // replace token.content *before* tokens[item.token].content,
            // because, if they are pointing at the same token, replaceAt
            // could mess up indices when quote length != 1
            token.content = replaceAt(token.content, t.index, closeQuote)
            tokens[item.token].content = replaceAt(
              tokens[item.token].content, item.pos, openQuote)

            // Shift the resume position by the extra length of the closing
            // quote, and of the opening quote too when it sits in this token.
            pos += closeQuote.length - 1
            if (item.token === i) { pos += openQuote.length - 1 }

            // Re-sync the local copy with the rewritten content
            text = token.content
            max = text.length

            // Remove the matched opener and every candidate above it
            stack.length = j
            continue OUTER
          }
        }
      }

      // No opener was matched for this quote
      if (canOpen) {
        // Remember it as a candidate opener; it is replaced only if a
        // matching closer shows up later.
        stack.push({
          token: i,
          pos: t.index,
          single: isSingle,
          level: thisLevel
        })
      } else if (canClose && isSingle) {
        // Closing-only single quote without an opener: treat as apostrophe
        token.content = replaceAt(token.content, t.index, APOSTROPHE)
      }
    }
  }
}

/**
 * Core rule entry point for smart quotes.
 *
 * Does nothing unless `state.md.options.typographer` is truthy. Otherwise it
 * walks `state.tokens` from the last element to the first and hands the
 * `children` of every `inline` token whose `content` contains a straight
 * quote to process_inlines().
 *
 * @param {Object} state - reads `state.md.options.typographer` and `state.tokens`
 */
export default function smartquotes (state) {
  /* eslint max-depth:0 */
  if (!state.md.options.typographer) { return }

  let idx = state.tokens.length

  // Back-to-front walk over the block-level tokens
  while (idx-- > 0) {
    const blockToken = state.tokens[idx]

    // Type is checked first so the regex only ever runs on inline tokens
    const needsProcessing = blockToken.type === 'inline' &&
      QUOTE_TEST_RE.test(blockToken.content)

    if (needsProcessing) {
      process_inlines(blockToken.children, state)
    }
  }
}
Add rule to replace quotes with typographic ones 10 years ago			`// Convert straight quotation marks to typographic ones`
			`//`

standard: remove semi 11 months ago			`import { isWhiteSpace, isPunctChar, isMdAsciiPunct } from '../common/utils.mjs'`
Improve smartquotes handling Use implementation similar to the new emphasis one. 10 years ago
standard: remove semi 11 months ago			`const QUOTE_TEST_RE = /['"]/`
			`const QUOTE_RE = /['"]/g`
			`const APOSTROPHE = '\u2019' /* ’ */`
Add rule to replace quotes with typographic ones 10 years ago
standard: space before function params 11 months ago			`function replaceAt (str, index, ch) {`
standard: remove semi 11 months ago			`return str.slice(0, index) + ch + str.slice(index + 1)`
Add rule to replace quotes with typographic ones 10 years ago			`}`

standard: space before function params 11 months ago			`function process_inlines (tokens, state) {`
standard: remove semi 11 months ago			`let j`
Nuked typographer class, separated core chain class 10 years ago
standard: remove semi 11 months ago			`const stack = []`
Add rule to replace quotes with typographic ones 10 years ago
var => const, let 11 months ago			`for (let i = 0; i < tokens.length; i++) {`
standard: remove semi 11 months ago			`const token = tokens[i]`
Moved scans from typorgapher directly to rules 10 years ago
standard: remove semi 11 months ago			`const thisLevel = tokens[i].level`
Moved scans from typorgapher directly to rules 10 years ago
Splitted replacements & smartquotes to smaller functions 10 years ago			`for (j = stack.length - 1; j >= 0; j--) {`
standard: remove semi 11 months ago			`if (stack[j].level <= thisLevel) { break }`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`
standard: remove semi 11 months ago			`stack.length = j + 1`
Splitted replacements & smartquotes to smaller functions 10 years ago
standard: remove semi 11 months ago			`if (token.type !== 'text') { continue }`
Smartquote rule cleanup 10 years ago
standard: remove semi 11 months ago			`let text = token.content`
			`let pos = 0`
			`let max = text.length`
Splitted replacements & smartquotes to smaller functions 10 years ago
standard: spaces in comments 11 months ago			`/* eslint no-labels:0,block-scoped-var:0 */`
Splitted replacements & smartquotes to smaller functions 10 years ago			`OUTER:`
			`while (pos < max) {`
standard: remove semi 11 months ago			`QUOTE_RE.lastIndex = pos`
			`const t = QUOTE_RE.exec(text)`
			`if (!t) { break }`
Splitted replacements & smartquotes to smaller functions 10 years ago
standard: remove semi 11 months ago			`let canOpen = true`
			`let canClose = true`
			`pos = t.index + 1`
			`const isSingle = (t[0] === "'")`
Splitted replacements & smartquotes to smaller functions 10 years ago
Take into account adjacent tokens in smartquotes close https://github.com/markdown-it/markdown-it/issues/181 9 years ago			`// Find previous character,`
			`// default to space if it's the beginning of the line`
			`//`
standard: remove semi 11 months ago			`let lastChar = 0x20`
Take into account adjacent tokens in smartquotes close https://github.com/markdown-it/markdown-it/issues/181 9 years ago
			`if (t.index - 1 >= 0) {`
standard: remove semi 11 months ago			`lastChar = text.charCodeAt(t.index - 1)`
Take into account adjacent tokens in smartquotes close https://github.com/markdown-it/markdown-it/issues/181 9 years ago			`} else {`
			`for (j = i - 1; j >= 0; j--) {`
standard: remove semi 11 months ago			`if (tokens[j].type === 'softbreak' \|\| tokens[j].type === 'hardbreak') break // lastChar defaults to 0x20`
			`if (!tokens[j].content) continue // should skip all tokens except 'text', 'html_inline' or 'code_inline'`
Take into account adjacent tokens in smartquotes close https://github.com/markdown-it/markdown-it/issues/181 9 years ago
standard: remove semi 11 months ago			`lastChar = tokens[j].content.charCodeAt(tokens[j].content.length - 1)`
			`break`
Take into account adjacent tokens in smartquotes close https://github.com/markdown-it/markdown-it/issues/181 9 years ago			`}`
			`}`

			`// Find next character,`
			`// default to space if it's the end of the line`
			`//`
standard: remove semi 11 months ago			`let nextChar = 0x20`
Take into account adjacent tokens in smartquotes close https://github.com/markdown-it/markdown-it/issues/181 9 years ago
			`if (pos < max) {`
standard: remove semi 11 months ago			`nextChar = text.charCodeAt(pos)`
Take into account adjacent tokens in smartquotes close https://github.com/markdown-it/markdown-it/issues/181 9 years ago			`} else {`
			`for (j = i + 1; j < tokens.length; j++) {`
standard: remove semi 11 months ago			`if (tokens[j].type === 'softbreak' \|\| tokens[j].type === 'hardbreak') break // nextChar defaults to 0x20`
			`if (!tokens[j].content) continue // should skip all tokens except 'text', 'html_inline' or 'code_inline'`
Take into account adjacent tokens in smartquotes close https://github.com/markdown-it/markdown-it/issues/181 9 years ago
standard: remove semi 11 months ago			`nextChar = tokens[j].content.charCodeAt(0)`
			`break`
Take into account adjacent tokens in smartquotes close https://github.com/markdown-it/markdown-it/issues/181 9 years ago			`}`
			`}`
Splitted replacements & smartquotes to smaller functions 10 years ago
standard: remove semi 11 months ago			`const isLastPunctChar = isMdAsciiPunct(lastChar) \|\| isPunctChar(String.fromCharCode(lastChar))`
			`const isNextPunctChar = isMdAsciiPunct(nextChar) \|\| isPunctChar(String.fromCharCode(nextChar))`
Splitted replacements & smartquotes to smaller functions 10 years ago
standard: remove semi 11 months ago			`const isLastWhiteSpace = isWhiteSpace(lastChar)`
			`const isNextWhiteSpace = isWhiteSpace(nextChar)`
Splitted replacements & smartquotes to smaller functions 10 years ago
			`if (isNextWhiteSpace) {`
standard: remove semi 11 months ago			`canOpen = false`
Splitted replacements & smartquotes to smaller functions 10 years ago			`} else if (isNextPunctChar) {`
			`if (!(isLastWhiteSpace \|\| isLastPunctChar)) {`
standard: remove semi 11 months ago			`canOpen = false`
Improve smartquotes handling Use implementation similar to the new emphasis one. 10 years ago			`}`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`
Improve smartquotes handling Use implementation similar to the new emphasis one. 10 years ago
Splitted replacements & smartquotes to smaller functions 10 years ago			`if (isLastWhiteSpace) {`
standard: remove semi 11 months ago			`canClose = false`
Splitted replacements & smartquotes to smaller functions 10 years ago			`} else if (isLastPunctChar) {`
			`if (!(isNextWhiteSpace \|\| isNextPunctChar)) {`
standard: remove semi 11 months ago			`canClose = false`
Improve smartquotes handling Use implementation similar to the new emphasis one. 10 years ago			`}`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`
Improve smartquotes handling Use implementation similar to the new emphasis one. 10 years ago
Splitted replacements & smartquotes to smaller functions 10 years ago			`if (nextChar === 0x22 /* " */ && t[0] === '"') {`
			`if (lastChar >= 0x30 /* 0 */ && lastChar <= 0x39 /* 9 */) {`
			`// special case: 1"" - count first quote as an inch`
standard: remove semi 11 months ago			`canClose = canOpen = false`
Improve smartquotes handling Use implementation similar to the new emphasis one. 10 years ago			`}`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`
Improve smartquotes handling Use implementation similar to the new emphasis one. 10 years ago
Splitted replacements & smartquotes to smaller functions 10 years ago			`if (canOpen && canClose) {`
Allow opening quote after another punctuation char in typographer close https://github.com/markdown-it/markdown-it/issues/643 5 years ago			`// Replace quotes in the middle of punctuation sequence, but not`
			`// in the middle of the words, i.e.:`
			`//`
			`// 1. foo " bar " baz - not replaced`
			`// 2. foo-"-bar-"-baz - replaced`
			`// 3. foo"bar"baz - not replaced`
			`//`
standard: remove semi 11 months ago			`canOpen = isLastPunctChar`
			`canClose = isNextPunctChar`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`
Improve smartquotes handling Use implementation similar to the new emphasis one. 10 years ago
Splitted replacements & smartquotes to smaller functions 10 years ago			`if (!canOpen && !canClose) {`
			`// middle of word`
			`if (isSingle) {`
standard: remove semi 11 months ago			`token.content = replaceAt(token.content, t.index, APOSTROPHE)`
Moved scans from typorgapher directly to rules 10 years ago			`}`
standard: remove semi 11 months ago			`continue`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`
Add rule to replace quotes with typographic ones 10 years ago
Splitted replacements & smartquotes to smaller functions 10 years ago			`if (canClose) {`
			`// this could be a closing quote, rewind the stack to get a match`
			`for (j = stack.length - 1; j >= 0; j--) {`
standard: remove semi 11 months ago			`let item = stack[j]`
			`if (stack[j].level < thisLevel) { break }`
Splitted replacements & smartquotes to smaller functions 10 years ago			`if (item.single === isSingle && stack[j].level === thisLevel) {`
standard: remove semi 11 months ago			`item = stack[j]`
Add multichar replacements in smartquotes fix #115 10 years ago
standard: remove semi 11 months ago			`let openQuote`
			`let closeQuote`
Splitted replacements & smartquotes to smaller functions 10 years ago			`if (isSingle) {`
standard: remove semi 11 months ago			`openQuote = state.md.options.quotes[2]`
			`closeQuote = state.md.options.quotes[3]`
Splitted replacements & smartquotes to smaller functions 10 years ago			`} else {`
standard: remove semi 11 months ago			`openQuote = state.md.options.quotes[0]`
			`closeQuote = state.md.options.quotes[1]`
Add rule to replace quotes with typographic ones 10 years ago			`}`
Add multichar replacements in smartquotes fix #115 10 years ago
			`// replace token.content *before* tokens[item.token].content,`
			`// because, if they are pointing at the same token, replaceAt`
			`// could mess up indices when quote length != 1`
standard: remove semi 11 months ago			`token.content = replaceAt(token.content, t.index, closeQuote)`
Add multichar replacements in smartquotes fix #115 10 years ago			`tokens[item.token].content = replaceAt(`
standard: remove semi 11 months ago			`tokens[item.token].content, item.pos, openQuote)`
Add multichar replacements in smartquotes fix #115 10 years ago
standard: remove semi 11 months ago			`pos += closeQuote.length - 1`
			`if (item.token === i) { pos += openQuote.length - 1 }`
Add multichar replacements in smartquotes fix #115 10 years ago
standard: remove semi 11 months ago			`text = token.content`
			`max = text.length`
Add multichar replacements in smartquotes fix #115 10 years ago
standard: remove semi 11 months ago			`stack.length = j`
			`continue OUTER`
Add rule to replace quotes with typographic ones 10 years ago			`}`
			`}`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`
Add rule to replace quotes with typographic ones 10 years ago
Splitted replacements & smartquotes to smaller functions 10 years ago			`if (canOpen) {`
			`stack.push({`
			`token: i,`
			`pos: t.index,`
			`single: isSingle,`
			`level: thisLevel`
standard: remove semi 11 months ago			`})`
Splitted replacements & smartquotes to smaller functions 10 years ago			`} else if (canClose && isSingle) {`
standard: remove semi 11 months ago			`token.content = replaceAt(token.content, t.index, APOSTROPHE)`
Add rule to replace quotes with typographic ones 10 years ago			`}`
			`}`
			`}`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`

standard: space before function params 11 months ago			`export default function smartquotes (state) {`
standard: spaces in comments 11 months ago			`/* eslint max-depth:0 */`
standard: remove semi 11 months ago			`if (!state.md.options.typographer) { return }`
Splitted replacements & smartquotes to smaller functions 10 years ago
var => const, let 11 months ago			`for (let blkIdx = state.tokens.length - 1; blkIdx >= 0; blkIdx--) {`
Splitted replacements & smartquotes to smaller functions 10 years ago			`if (state.tokens[blkIdx].type !== 'inline' \|\|`
			`!QUOTE_TEST_RE.test(state.tokens[blkIdx].content)) {`
standard: remove semi 11 months ago			`continue`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`

standard: remove semi 11 months ago			`process_inlines(state.tokens[blkIdx].children, state)`
Splitted replacements & smartquotes to smaller functions 10 years ago			`}`
Rewrite core to es6 modules 12 months ago			`}`