markdown-it/lib/common/utils.mjs

// Utilities
//

import * as mdurl from 'mdurl'
import * as ucmicro from 'uc.micro'
import { decodeHTML } from 'entities'

// Returns the internal type tag of a value as produced by
// `Object.prototype.toString`, e.g. '[object String]' or '[object Array]'.
function _class (obj) {
  return Object.prototype.toString.call(obj)
}

// True for string primitives and for `String` wrapper objects alike,
// because both carry the '[object String]' tag.
function isString (obj) {
  const tag = _class(obj)
  return tag === '[object String]'
}

const _hasOwnProperty = Object.prototype.hasOwnProperty

// Own-property check that goes through `Object.prototype.hasOwnProperty`
// directly, so it also works for objects that shadow `hasOwnProperty` or
// have no prototype at all. Inherited keys are reported as absent.
function has (object, key) {
  return Reflect.apply(_hasOwnProperty, object, [key])
}

// Merge objects
//
// Copies the own enumerable string-keyed properties of every source into
// `obj`, left to right (later sources overwrite earlier ones), then returns
// `obj` itself - the target is mutated in place.
//
// - Falsy sources (null, undefined, 0, '', ...) are skipped silently.
// - Any other non-object source throws a TypeError.
//
function assign (obj, ...sources /* from1, from2, from3, ... */) {
  for (const source of sources) {
    if (!source) { continue }

    if (typeof source !== 'object') {
      // String() keeps the message readable for every value type; the
      // leading space separates the value from the text.
      throw new TypeError(String(source) + ' must be object')
    }

    for (const key of Object.keys(source)) {
      obj[key] = source[key]
    }
  }

  return obj
}

// Builds a new array in which the single element at index `pos` is replaced
// by the contents of `newElements`; `src` itself is left untouched.
// Useful for some operations with tokens.
function arrayReplaceAt (src, pos, newElements) {
  const before = src.slice(0, pos)
  const after = src.slice(pos + 1)

  return [].concat(before, newElements, after)
}

// Decides whether a numeric character reference value `c` may be turned into
// a character. Rejected: surrogates, the "never used" ranges, most control
// codes, and anything above U+10FFFF.
function isValidEntityCode (c) {
  /* eslint no-bitwise:0 */
  const low16 = c & 0xFFFF

  // broken sequence
  const isSurrogate = c >= 0xD800 && c <= 0xDFFF

  // never used
  const isNeverUsed =
    (c >= 0xFDD0 && c <= 0xFDEF) ||
    low16 === 0xFFFF ||
    low16 === 0xFFFE

  // control codes (0x09, 0x0A, 0x0C and 0x0D are deliberately not listed)
  const isControl =
    (c >= 0x00 && c <= 0x08) ||
    c === 0x0B ||
    (c >= 0x0E && c <= 0x1F) ||
    (c >= 0x7F && c <= 0x9F)

  // out of range
  const isTooLarge = c > 0x10FFFF

  return !(isSurrogate || isNeverUsed || isControl || isTooLarge)
}

// Converts a code point number to a string. Values above 0xFFFF are split by
// hand into a UTF-16 surrogate pair; everything else becomes one code unit.
function fromCodePoint (c) {
  /* eslint no-bitwise:0 */
  const needsSurrogates = c > 0xffff

  if (!needsSurrogates) {
    return String.fromCharCode(c)
  }

  const offset = c - 0x10000
  const highSurrogate = 0xd800 + (offset >> 10)
  const lowSurrogate = 0xdc00 + (offset & 0x3ff)

  return String.fromCharCode(highSurrogate, lowSurrogate)
}

// Backslash followed by one ASCII punctuation character; group 1 captures
// the character that was escaped.
const UNESCAPE_MD_RE  = /\\([!"#$%&'()*+,\-./:;<=>?@[\\\]^_`{|}~])/g
// `&name;` reference, case-insensitive; group 1 captures the part between
// `&` and `;` (a letter or `#`, then 1 to 31 letters/digits).
const ENTITY_RE       = /&([a-z#][a-z0-9]{1,31});/gi
// Both patterns joined as alternatives: group 1 is the escaped character,
// group 2 is the entity name (only one of them is set for a given match).
const UNESCAPE_ALL_RE = new RegExp(UNESCAPE_MD_RE.source + '|' + ENTITY_RE.source, 'gi')

// Whole-string test for a numeric reference name: `#` followed by either
// `x` plus 1 to 8 hex digits, or 1 to 8 decimal digits.
const DIGITAL_ENTITY_TEST_RE = /^#((?:x[a-f0-9]{1,8}|[0-9]{1,8}))$/i

// Replacement callback for one `&name;` match.
//
// - match: the full matched text, including `&` and `;`
// - name:  the text between `&` and `;`
//
// Numeric references (`#123`, `#x7B`) are decoded here, and only when the
// code passes `isValidEntityCode`; otherwise the text is returned unchanged.
// Everything else is passed to `decodeHTML` from the `entities` package.
function replaceEntityPattern (match, name) {
  const isNumeric = name.charCodeAt(0) === 0x23/* # */ && DIGITAL_ENTITY_TEST_RE.test(name)

  if (!isNumeric) {
    // When nothing gets decoded the result equals `match`, so it can be
    // returned as is in both cases.
    return decodeHTML(match)
  }

  let code
  if (name[1].toLowerCase() === 'x') {
    code = parseInt(name.slice(2), 16)
  } else {
    code = parseInt(name.slice(1), 10)
  }

  return isValidEntityCode(code) ? fromCodePoint(code) : match
}

/* function replaceEntities(str) {
  if (str.indexOf('&') < 0) { return str; }

  return str.replace(ENTITY_RE, replaceEntityPattern);
} */

// Removes the backslash from every backslash-escaped ASCII punctuation
// character in `str`. Input without any backslash is returned untouched.
function unescapeMd (str) {
  const hasBackslash = str.indexOf('\\') >= 0

  return hasBackslash ? str.replace(UNESCAPE_MD_RE, '$1') : str
}

// Resolves backslash escapes and `&name;` references in one pass over `str`.
// Input containing neither `\` nor `&` is returned untouched.
function unescapeAll (str) {
  const nothingToDo = str.indexOf('\\') < 0 && str.indexOf('&') < 0
  if (nothingToDo) { return str }

  return str.replace(UNESCAPE_ALL_RE, (match, escaped, entity) => {
    // `escaped` is set when the backslash alternative matched; otherwise
    // the match is an entity reference.
    return escaped || replaceEntityPattern(match, entity)
  })
}

// Non-global twin of the replace pattern, used as a cheap pre-check
// (a non-global regex keeps no `lastIndex` state between calls).
const HTML_ESCAPE_TEST_RE = /[&<>"]/
const HTML_ESCAPE_REPLACE_RE = /[&<>"]/g

// Unsafe character -> entity it is replaced with.
const HTML_REPLACEMENTS = {
  '&': '&amp;',
  '<': '&lt;',
  '>': '&gt;',
  '"': '&quot;'
}

// Replacement callback: looks up the entity for one matched character.
function replaceUnsafeChar (ch) {
  const entity = HTML_REPLACEMENTS[ch]
  return entity
}

// Escapes `&`, `<`, `>` and `"` in `str`. Input without any of these
// characters is returned as is.
function escapeHtml (str) {
  if (!HTML_ESCAPE_TEST_RE.test(str)) {
    return str
  }

  return str.replace(HTML_ESCAPE_REPLACE_RE, replaceUnsafeChar)
}

// Characters that get a backslash prefix in `escapeRE`.
const REGEXP_ESCAPE_RE = /[.?*+^$[\]\\(){}|-]/g

// Puts a backslash in front of every character matched by
// `REGEXP_ESCAPE_RE`, so the result can be embedded in a regular
// expression source and match the input literally.
function escapeRE (str) {
  return str.replace(REGEXP_ESCAPE_RE, function (special) {
    return '\\' + special
  })
}

// True only for the character codes of tab (0x09) and space (0x20).
function isSpace (code) {
  return code === 0x09 || code === 0x20
}

// Whitespace test on a character code:
// Zs (unicode class) || [\t\f\v\r\n]
function isWhiteSpace (code) {
  // U+2000..U+200A form one contiguous run, so they are checked as a range.
  const inSpaceRun = code >= 0x2000 && code <= 0x200A

  return inSpaceRun ||
    code === 0x09 || // \t
    code === 0x0A || // \n
    code === 0x0B || // \v
    code === 0x0C || // \f
    code === 0x0D || // \r
    code === 0x20 ||
    code === 0xA0 ||
    code === 0x1680 ||
    code === 0x202F ||
    code === 0x205F ||
    code === 0x3000
}

/* eslint-disable max-len */

// Tests `ch` against the `P` pattern and then the `S` pattern exported by
// uc.micro (presumably the Unicode punctuation and symbol classes - verify
// against the uc.micro package).
// Currently without astral characters support.
function isPunctChar (ch) {
  if (ucmicro.P.test(ch)) { return true }

  return ucmicro.S.test(ch)
}

// Markdown ASCII punctuation characters.
//
// !, ", #, $, %, &, ', (, ), *, +, ,, -, ., /, :, ;, <, =, >, ?, @, [, \, ], ^, _, `, {, |, }, or ~
// http://spec.commonmark.org/0.15/#ascii-punctuation-character
//
// Don't confuse with unicode punctuation !!! It lacks some chars in ascii range.
//
// The character codes of the list above, collected once for lookup.
const MD_ASCII_PUNCT_CODES = new Set(
  Array.from('!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~', function (punct) {
    return punct.charCodeAt(0)
  })
)

// Takes a character code (a number, not a string) and tells whether it is
// one of the Markdown ASCII punctuation characters.
function isMdAsciiPunct (ch) {
  return MD_ASCII_PUNCT_CODES.has(ch)
}

// Helper to unify [reference labels]: labels that differ only in letter case
// or in the amount of whitespace end up as the same string.
//
function normalizeReference (str) {
  // Trim, then squeeze every whitespace run down to a single space.
  const collapsed = str.trim().replace(/\s+/g, ' ')

  // In node v10 'ẞ'.toLowerCase() === 'Ṿ', which is presumed to be a bug
  // fixed in v12 (couldn't find any details), so on affected engines that
  // letter is lowercased by hand.
  // (Remove this special case when node v10 is no longer supported.)
  const hasSharpSBug = 'ẞ'.toLowerCase() === 'Ṿ'
  const label = hasSharpSBug ? collapsed.replace(/ẞ/g, 'ß') : collapsed

  // Lowercasing and then uppercasing should get rid of all differences
  // between letter variants.
  //
  // A single conversion is not enough: .toLowerCase() alone doesn't
  // normalize 125 code points correctly, and .toUpperCase() alone misses 6
  // (İ, ϴ, ẞ, Ω, K, Å - already uppercase, but with a differently
  // uppercased twin).
  //
  // Example with the greek letter theta:
  // uppercase U+0398 (Θ), U+03f4 (ϴ) and lowercase U+03b8 (θ), U+03d1 (ϑ)
  //
  // Unicode entries:
  // 0398;GREEK CAPITAL LETTER THETA;Lu;0;L;;;;;N;;;;03B8;
  // 03B8;GREEK SMALL LETTER THETA;Ll;0;L;;;;;N;;;0398;;0398
  // 03D1;GREEK THETA SYMBOL;Ll;0;L;<compat> 03B8;;;;N;GREEK SMALL LETTER SCRIPT THETA;;0398;;0398
  // 03F4;GREEK CAPITAL THETA SYMBOL;Lu;0;L;<compat> 0398;;;;N;;;;03B8;
  //
  // A case-insensitive comparison should treat all four as equivalent, but
  // .toLowerCase() leaves ϑ alone (already lowercase) and .toUpperCase()
  // leaves ϴ alone (already uppercase). Doing both in sequence works:
  // '\u0398\u03f4\u03b8\u03d1'.toLowerCase().toUpperCase() === '\u0398\u0398\u0398\u0398'
  //
  // Note: this is equivalent to unicode case folding; unicode normalization
  // is a different step that is not required here.
  //
  // The final result is uppercase on purpose: it is later used as an object
  // key, and uppercasing avoids a conflict with Object.prototype members
  // (most notably, `__proto__`).
  //
  return label.toLowerCase().toUpperCase()
}

// Libraries used by both markdown-it and its plugins, re-exported here so
// that plugins don't have to depend on them explicitly, which reduces their
// bundled size (e.g. a browser build).
//
const lib = {
  mdurl,
  ucmicro
}

// Named exports of this module: the `lib` bundle plus the helper functions
// defined above.
export {
  lib,
  assign,
  isString,
  has,
  unescapeMd,
  unescapeAll,
  isValidEntityCode,
  fromCodePoint,
  escapeHtml,
  arrayReplaceAt,
  isSpace,
  isWhiteSpace,
  isMdAsciiPunct,
  isPunctChar,
  escapeRE,
  normalizeReference
}
Replaced `assign` helper 10 years ago			`// Utilities`
Moved string helpers to utilities 10 years ago			`//`
Replaced `assign` helper 10 years ago
Deps bump 12 months ago			`import * as mdurl from 'mdurl'`
			`import * as ucmicro from 'uc.micro'`
standard: remove semi 12 months ago			`import { decodeHTML } from 'entities'`
Replaced `assign` helper 10 years ago
standard: space before function params 12 months ago			`function _class (obj) { return Object.prototype.toString.call(obj) }`
Reorganized parser configuration 10 years ago
standard: space before function params 12 months ago			`function isString (obj) { return _class(obj) === '[object String]' }`
Reorganized parser configuration 10 years ago
standard: remove semi 12 months ago			`const _hasOwnProperty = Object.prototype.hasOwnProperty`
More safe properties check 10 years ago
standard: space before function params 12 months ago			`function has (object, key) {`
standard: remove semi 12 months ago			`return _hasOwnProperty.call(object, key)`
More safe properties check 10 years ago			`}`

Replaced `assign` helper 10 years ago			`// Merge objects`
			`//`
standard: spaces in comments 12 months ago			`function assign (obj /* from1, from2, from3, ... */) {`
standard: remove semi 12 months ago			`const sources = Array.prototype.slice.call(arguments, 1)`
Fixed replaceEntities, default preset, improved coverage 10 years ago
			`sources.forEach(function (source) {`
standard: remove semi 12 months ago			`if (!source) { return }`
Replaced `assign` helper 10 years ago
Coverage improve 10 years ago			`if (typeof source !== 'object') {`
standard: remove semi 12 months ago			`throw new TypeError(source + 'must be object')`
Replaced `assign` helper 10 years ago			`}`

Fixed replaceEntities, default preset, improved coverage 10 years ago			`Object.keys(source).forEach(function (key) {`
standard: remove semi 12 months ago			`obj[key] = source[key]`
			`})`
			`})`
Replaced `assign` helper 10 years ago
standard: remove semi 12 months ago			`return obj`
Moved string helpers to utilities 10 years ago			`}`

Both helpers & utils are not in each instance of main parser 10 years ago			`// Remove element from array and put another array at those position.`
			`// Useful for some operations with tokens`
standard: space before function params 12 months ago			`function arrayReplaceAt (src, pos, newElements) {`
standard: remove semi 12 months ago			`return [].concat(src.slice(0, pos), newElements, src.slice(pos + 1))`
Both helpers & utils are not in each instance of main parser 10 years ago			`}`

standard: space before function params 12 months ago			`function isValidEntityCode (c) {`
standard: spaces in comments 12 months ago			`/* eslint no-bitwise:0 */`
Moved string helpers to utilities 10 years ago			`// broken sequence`
standard: remove semi 12 months ago			`if (c >= 0xD800 && c <= 0xDFFF) { return false }`
Moved string helpers to utilities 10 years ago			`// never used`
standard: remove semi 12 months ago			`if (c >= 0xFDD0 && c <= 0xFDEF) { return false }`
			`if ((c & 0xFFFF) === 0xFFFF \|\| (c & 0xFFFF) === 0xFFFE) { return false }`
Moved string helpers to utilities 10 years ago			`// control codes`
standard: remove semi 12 months ago			`if (c >= 0x00 && c <= 0x08) { return false }`
			`if (c === 0x0B) { return false }`
			`if (c >= 0x0E && c <= 0x1F) { return false }`
			`if (c >= 0x7F && c <= 0x9F) { return false }`
Moved string helpers to utilities 10 years ago			`// out of range`
standard: remove semi 12 months ago			`if (c > 0x10FFFF) { return false }`
			`return true`
Moved string helpers to utilities 10 years ago			`}`

standard: space before function params 12 months ago			`function fromCodePoint (c) {`
standard: spaces in comments 12 months ago			`/* eslint no-bitwise:0 */`
Moved string helpers to utilities 10 years ago			`if (c > 0xffff) {`
standard: remove semi 12 months ago			`c -= 0x10000`
standard: init vars in separate declaration 12 months ago			`const surrogate1 = 0xd800 + (c >> 10)`
			`const surrogate2 = 0xdc00 + (c & 0x3ff)`
Moved string helpers to utilities 10 years ago
standard: remove semi 12 months ago			`return String.fromCharCode(surrogate1, surrogate2)`
Moved string helpers to utilities 10 years ago			`}`
standard: remove semi 12 months ago			`return String.fromCharCode(c)`
Moved string helpers to utilities 10 years ago			`}`

standard: more tweaks & simplify eslint config 12 months ago			const UNESCAPE_MD_RE = /\\([!"#$%&'()*+,\-./:;<=>?@[\\\]^_`{\|}~])/g
standard: remove semi 12 months ago			`const ENTITY_RE = /&([a-z#][a-z0-9]{1,31});/gi`
			`const UNESCAPE_ALL_RE = new RegExp(UNESCAPE_MD_RE.source + '\|' + ENTITY_RE.source, 'gi')`
Var rename & coverage improve 10 years ago
standard: remove semi 12 months ago			`const DIGITAL_ENTITY_TEST_RE = /^#((?:x[a-f0-9]{1,8}\|[0-9]{1,8}))$/i`
Var rename & coverage improve 10 years ago
standard: space before function params 12 months ago			`function replaceEntityPattern (match, name) {`
Commented out unused `replaceEntities()` 10 years ago			`if (name.charCodeAt(0) === 0x23/* # */ && DIGITAL_ENTITY_TEST_RE.test(name)) {`
standard: more tweaks & simplify eslint config 12 months ago			`const code = name[1].toLowerCase() === 'x'`
			`? parseInt(name.slice(2), 16)`
			`: parseInt(name.slice(1), 10)`
Bump eslint & update CS 5 years ago
Fixed replaceEntities, default preset, improved coverage 10 years ago			`if (isValidEntityCode(code)) {`
standard: remove semi 12 months ago			`return fromCodePoint(code)`
Fixed replaceEntities, default preset, improved coverage 10 years ago			`}`
chore: Update entities dependency (#901) * Update entities package + usage * Apply custom digital entity logic before entities decode 1 year ago
standard: remove semi 12 months ago			`return match`
chore: Update entities dependency (#901) * Update entities package + usage * Apply custom digital entity logic before entities decode 1 year ago			`}`

standard: remove semi 12 months ago			`const decoded = decodeHTML(match)`
chore: Update entities dependency (#901) * Update entities package + usage * Apply custom digital entity logic before entities decode 1 year ago			`if (decoded !== match) {`
standard: remove semi 12 months ago			`return decoded`
Fixed replaceEntities, default preset, improved coverage 10 years ago			`}`
Commented out unused `replaceEntities()` 10 years ago
standard: remove semi 12 months ago			`return match`
Fixed replaceEntities, default preset, improved coverage 10 years ago			`}`

standard: spaces in comments 12 months ago			`/* function replaceEntities(str) {`
Moved string helpers to utilities 10 years ago			`if (str.indexOf('&') < 0) { return str; }`

Var rename & coverage improve 10 years ago			`return str.replace(ENTITY_RE, replaceEntityPattern);`
standard: spaces in comments 12 months ago			`} */`
Moved string helpers to utilities 10 years ago
standard: space before function params 12 months ago			`function unescapeMd (str) {`
standard: remove semi 12 months ago			`if (str.indexOf('\\') < 0) { return str }`
			`return str.replace(UNESCAPE_MD_RE, '$1')`
Use unescapeAll for links unescaping 10 years ago			`}`

standard: space before function params 12 months ago			`function unescapeAll (str) {`
standard: remove semi 12 months ago			`if (str.indexOf('\\') < 0 && str.indexOf('&') < 0) { return str }`
Use unescapeAll for links unescaping 10 years ago
eslint update & code cleanup 9 years ago			`return str.replace(UNESCAPE_ALL_RE, function (match, escaped, entity) {`
standard: remove semi 12 months ago			`if (escaped) { return escaped }`
			`return replaceEntityPattern(match, entity)`
			`})`
Use unescapeAll for links unescaping 10 years ago			`}`

standard: remove semi 12 months ago			`const HTML_ESCAPE_TEST_RE = /[&<>"]/`
			`const HTML_ESCAPE_REPLACE_RE = /[&<>"]/g`
var => const, let 12 months ago			`const HTML_REPLACEMENTS = {`
Moved html escape helper to utils 10 years ago			`'&': '&',`
			`'<': '<',`
			`'>': '>',`
			`'"': '"'`
standard: remove semi 12 months ago			`}`
Moved html escape helper to utils 10 years ago
standard: space before function params 12 months ago			`function replaceUnsafeChar (ch) {`
standard: remove semi 12 months ago			`return HTML_REPLACEMENTS[ch]`
Moved html escape helper to utils 10 years ago			`}`

standard: space before function params 12 months ago			`function escapeHtml (str) {`
Moved html escape helper to utils 10 years ago			`if (HTML_ESCAPE_TEST_RE.test(str)) {`
standard: remove semi 12 months ago			`return str.replace(HTML_ESCAPE_REPLACE_RE, replaceUnsafeChar)`
Moved html escape helper to utils 10 years ago			`}`
standard: remove semi 12 months ago			`return str`
Moved html escape helper to utils 10 years ago			`}`

standard: remove semi 12 months ago			`const REGEXP_ESCAPE_RE = /[.?*+^$[\]\\(){}\|-]/g`
Added regexp escaper to utils 10 years ago
standard: space before function params 12 months ago			`function escapeRE (str) {`
standard: remove semi 12 months ago			`return str.replace(REGEXP_ESCAPE_RE, '\\$&')`
Added regexp escaper to utils 10 years ago			`}`

standard: space before function params 12 months ago			`function isSpace (code) {`
Expand tabs only when it's needed, as per CommonMark 0.21 9 years ago			`switch (code) {`
			`case 0x09:`
			`case 0x20:`
standard: remove semi 12 months ago			`return true`
Expand tabs only when it's needed, as per CommonMark 0.21 9 years ago			`}`
standard: remove semi 12 months ago			`return false`
Expand tabs only when it's needed, as per CommonMark 0.21 9 years ago			`}`

Clarified isWhiteSpace() 10 years ago			`// Zs (unicode class) \|\| [\t\f\v\r\n]`
standard: space before function params 12 months ago			`function isWhiteSpace (code) {`
standard: remove semi 12 months ago			`if (code >= 0x2000 && code <= 0x200A) { return true }`
Unicode helpers for upcoming 0.15 update 10 years ago			`switch (code) {`
Clarified isWhiteSpace() 10 years ago			`case 0x09: // \t`
			`case 0x0A: // \n`
			`case 0x0B: // \v`
			`case 0x0C: // \f`
			`case 0x0D: // \r`
Unicode helpers for upcoming 0.15 update 10 years ago			`case 0x20:`
Fixed whitespace check helper 10 years ago			`case 0xA0:`
			`case 0x1680:`
Unicode helpers for upcoming 0.15 update 10 years ago			`case 0x202F:`
			`case 0x205F:`
			`case 0x3000:`
standard: remove semi 12 months ago			`return true`
Unicode helpers for upcoming 0.15 update 10 years ago			`}`
standard: remove semi 12 months ago			`return false`
Unicode helpers for upcoming 0.15 update 10 years ago			`}`

standard: spaces in comments 12 months ago			`/* eslint-disable max-len */`
Unicode helpers for upcoming 0.15 update 10 years ago
			`// Currently without astral characters support.`
standard: space before function params 12 months ago			`function isPunctChar (ch) {`
Update to comply with spec 0.31.2 The spec update changes these things: * It simplifies the HTML regex so that `<!-- a -- b -->` is an HTML comment. HTML5 reports this as an error, but still parses it. * It changes the set of known HTML block elements to match HTML5, adding `search` and removing `source`. * It adds Unicode Symbols to the set of punctuation characters that are used to evaluate flankingness. This commit also changes the declaration HTML regex to match lowercase, even though that change was technically made in spec version 0.30. 9 months ago			`return ucmicro.P.test(ch) \|\| ucmicro.S.test(ch)`
Unicode helpers for upcoming 0.15 update 10 years ago			`}`

Fixed punctuation check in emphasis 10 years ago			`// Markdown ASCII punctuation characters.`
			`//`
			// !, ", #, $, %, &, ', (, ), *, +, ,, -, ., /, :, ;, <, =, >, ?, @, [, \, ], ^, _, `, {, \|, }, or ~
			`// http://spec.commonmark.org/0.15/#ascii-punctuation-character`
			`//`
			`// Don't confuse with unicode punctuation !!! It lacks some chars in ascii range.`
			`//`
standard: space before function params 12 months ago			`function isMdAsciiPunct (ch) {`
Fixed punctuation check in emphasis 10 years ago			`switch (ch) {`
			`case 0x21/* ! */:`
			`case 0x22/* " */:`
			`case 0x23/* # */:`
			`case 0x24/* $ */:`
			`case 0x25/* % */:`
			`case 0x26/* & */:`
			`case 0x27/* ' */:`
			`case 0x28/* ( */:`
			`case 0x29/* ) */:`
			`case 0x2A/* * */:`
			`case 0x2B/* + */:`
			`case 0x2C/* , */:`
			`case 0x2D/* - */:`
			`case 0x2E/* . */:`
			`case 0x2F/* / */:`
			`case 0x3A/* : */:`
			`case 0x3B/* ; */:`
			`case 0x3C/* < */:`
			`case 0x3D/* = */:`
			`case 0x3E/* > */:`
			`case 0x3F/* ? */:`
			`case 0x40/* @ */:`
			`case 0x5B/* [ */:`
			`case 0x5C/* \ */:`
			`case 0x5D/* ] */:`
			`case 0x5E/* ^ */:`
			`case 0x5F/* _ */:`
			case 0x60/* ` */:
			`case 0x7B/* { */:`
			`case 0x7C/* \| */:`
			`case 0x7D/* } */:`
			`case 0x7E/* ~ */:`
standard: remove semi 12 months ago			`return true`
Fixed punctuation check in emphasis 10 years ago			`default:`
standard: remove semi 12 months ago			`return false`
Fixed punctuation check in emphasis 10 years ago			`}`
			`}`

moved normalizeReference to utils, closes #42 10 years ago			`// Hepler to unify [reference labels].`
			`//`
standard: space before function params 12 months ago			`function normalizeReference (str) {`
Improve normalization for reference label matching Simple toUpperCase() does not work for various ligatures and legacy characters that are already in a different upper case form. See also: https://github.com/commonmark/commonmark-spec/commit/278ea515fe5ff3e0dd652ee2127ffcd5cbc91527 5 years ago			`// Trim and collapse whitespace`
			`//`
standard: remove semi 12 months ago			`str = str.trim().replace(/\s+/g, ' ')`
Improve normalization for reference label matching Simple toUpperCase() does not work for various ligatures and legacy characters that are already in a different upper case form. See also: https://github.com/commonmark/commonmark-spec/commit/278ea515fe5ff3e0dd652ee2127ffcd5cbc91527 5 years ago
			`// In node v10 'ẞ'.toLowerCase() === 'Ṿ', which is presumed to be a bug`
			`// fixed in v12 (couldn't find any details).`
			`//`
			`// So treat this one as a special case`
			`// (remove this when node v10 is no longer supported).`
			`//`
			`if ('ẞ'.toLowerCase() === 'Ṿ') {`
standard: remove semi 12 months ago			`str = str.replace(/ẞ/g, 'ß')`
Improve normalization for reference label matching Simple toUpperCase() does not work for various ligatures and legacy characters that are already in a different upper case form. See also: https://github.com/commonmark/commonmark-spec/commit/278ea515fe5ff3e0dd652ee2127ffcd5cbc91527 5 years ago			`}`

			`// .toLowerCase().toUpperCase() should get rid of all differences`
			`// between letter variants.`
			`//`
Add an example related to case-insensitive comparisons 5 years ago			`// Simple .toLowerCase() doesn't normalize 125 code points correctly,`
			`// and .toUpperCase doesn't normalize 6 of them (list of exceptions:`
			`// İ, ϴ, ẞ, Ω, K, Å - those are already uppercased, but have differently`
			`// uppercased versions).`
			`//`
			`// Here's an example showing how it happens. Lets take greek letter omega:`
			`// uppercase U+0398 (Θ), U+03f4 (ϴ) and lowercase U+03b8 (θ), U+03d1 (ϑ)`
			`//`
			`// Unicode entries:`
			`// 0398;GREEK CAPITAL LETTER THETA;Lu;0;L;;;;;N;;;;03B8;`
			`// 03B8;GREEK SMALL LETTER THETA;Ll;0;L;;;;;N;;;0398;;0398`
			`// 03D1;GREEK THETA SYMBOL;Ll;0;L;<compat> 03B8;;;;N;GREEK SMALL LETTER SCRIPT THETA;;0398;;0398`
			`// 03F4;GREEK CAPITAL THETA SYMBOL;Lu;0;L;<compat> 0398;;;;N;;;;03B8;`
			`//`
			`// Case-insensitive comparison should treat all of them as equivalent.`
			`//`
			`// But .toLowerCase() doesn't change ϑ (it's already lowercase),`
			`// and .toUpperCase() doesn't change ϴ (already uppercase).`
			`//`
			`// Applying first lower then upper case normalizes any character:`
			`// '\u0398\u03f4\u03b8\u03d1'.toLowerCase().toUpperCase() === '\u0398\u0398\u0398\u0398'`
			`//`
			`// Note: this is equivalent to unicode case folding; unicode normalization`
			`// is a different step that is not required here.`
			`//`
Improve normalization for reference label matching Simple toUpperCase() does not work for various ligatures and legacy characters that are already in a different upper case form. See also: https://github.com/commonmark/commonmark-spec/commit/278ea515fe5ff3e0dd652ee2127ffcd5cbc91527 5 years ago			`// Final result should be uppercased, because it's later stored in an object`
			`// (this avoid a conflict with Object.prototype members,`
			// most notably, `__proto__`)
			`//`
standard: remove semi 12 months ago			`return str.toLowerCase().toUpperCase()`
moved normalizeReference to utils, closes #42 10 years ago			`}`

Re-export uc.micro and mdurl 10 years ago			`// Re-export libraries commonly used in both markdown-it and its plugins,`
			`// so plugins won't have to depend on them explicitly, which reduces their`
			`// bundled size (e.g. a browser build).`
			`//`
standard: remove semi 12 months ago			`const lib = { mdurl, ucmicro }`
Rewrite core to es6 modules 1 year ago
			`export {`
			`lib,`
			`assign,`
			`isString,`
			`has,`
			`unescapeMd,`
			`unescapeAll,`
			`isValidEntityCode,`
			`fromCodePoint,`
			`escapeHtml,`
			`arrayReplaceAt,`
			`isSpace,`
			`isWhiteSpace,`
			`isMdAsciiPunct,`
			`isPunctChar,`
			`escapeRE,`
			`normalizeReference`
standard: remove semi 12 months ago			`}`