// GFM table, https://github.github.com/gfm/#tables-extension-

import { isSpace } from '../common/utils.mjs'

// Upper bound on the number of empty cells synthesized to pad short body rows
// up to the header's column count. Without a cap, a wide header followed by
// many one-cell rows makes the emitted token stream grow quadratically in the
// size of the input.
const MAX_AUTOCOMPLETED_CELLS = 0x10000

/**
 * Return the text of a source line, from `bMarks[line] + tShift[line]`
 * up to (not including) `eMarks[line]`.
 *
 * @param {object} state - block parser state (reads `src`, `bMarks`, `tShift`, `eMarks`)
 * @param {number} line - line index
 * @returns {string} slice of `state.src` for that line
 */
function getLine (state, line) {
  const pos = state.bMarks[line] + state.tShift[line]
  const max = state.eMarks[line]

  return state.src.slice(pos, max)
}

/**
 * Split a table row into cells on unescaped `|` characters.
 *
 * A pipe immediately preceded by a backslash does not split; the backslash
 * is dropped and the pipe is kept as part of the cell text.
 *
 * @param {string} str - row text
 * @returns {string[]} cell strings (untrimmed; leading/trailing empty cells included)
 */
function escapedSplit (str) {
  const result = []
  const max = str.length

  let pos = 0
  let ch = str.charCodeAt(pos)
  let isEscaped = false
  let lastPos = 0
  let current = ''

  while (pos < max) {
    if (ch === 0x7c/* | */) {
      if (!isEscaped) {
        // pipe separating cells, '|'
        result.push(current + str.substring(lastPos, pos))
        current = ''
        lastPos = pos + 1
      } else {
        // escaped pipe, '\|': copy everything before the backslash and
        // restart the pending slice at the pipe itself
        current += str.substring(lastPos, pos - 1)
        lastPos = pos
      }
    }

    isEscaped = (ch === 0x5c/* \ */)
    pos++

    ch = str.charCodeAt(pos)
  }

  result.push(current + str.substring(lastPos))

  return result
}

/**
 * Block rule: try to parse a GFM table starting at `startLine`.
 *
 * The line at `startLine` is the header row and the following line must be a
 * delimiter row (`---`, `:--`, `--:`, `:-:` separated by pipes) with exactly
 * as many columns as the header. Subsequent lines are consumed as body rows
 * until a line is blank, is indented as a code block, drops below the block
 * indent, is matched by a 'blockquote' terminator rule, or the cap on
 * autocompleted empty cells is exceeded.
 *
 * On success (and when not `silent`) the rule pushes table/thead/tbody/tr/th/td
 * and inline tokens onto `state` and advances `state.line` past the table.
 *
 * @param {object} state - block parser state
 * @param {number} startLine - index of the candidate header line
 * @param {number} endLine - index one past the last line available to this rule
 * @param {boolean} silent - validation-only mode: report a match without emitting tokens
 * @returns {boolean} true if a table starts at `startLine`
 */
export default function table (state, startLine, endLine, silent) {
  // should have at least two lines
  if (startLine + 2 > endLine) { return false }

  let nextLine = startLine + 1

  if (state.sCount[nextLine] < state.blkIndent) { return false }

  // if it's indented more than 3 spaces, it should be a code block
  if (state.sCount[nextLine] - state.blkIndent >= 4) { return false }

  // first character of the second line should be '|', '-', ':',
  // and no other characters are allowed but spaces;
  // basically, this is the equivalent of /^[-:|][-:|\s]*$/ regexp

  let pos = state.bMarks[nextLine] + state.tShift[nextLine]
  if (pos >= state.eMarks[nextLine]) { return false }

  const firstCh = state.src.charCodeAt(pos++)
  if (firstCh !== 0x7C/* | */ && firstCh !== 0x2D/* - */ && firstCh !== 0x3A/* : */) { return false }

  if (pos >= state.eMarks[nextLine]) { return false }

  const secondCh = state.src.charCodeAt(pos++)
  if (secondCh !== 0x7C/* | */ && secondCh !== 0x2D/* - */ && secondCh !== 0x3A/* : */ && !isSpace(secondCh)) {
    return false
  }

  // if first character is '-', then second character must not be a space
  // (due to parsing ambiguity with list)
  if (firstCh === 0x2D/* - */ && isSpace(secondCh)) { return false }

  while (pos < state.eMarks[nextLine]) {
    const ch = state.src.charCodeAt(pos)

    if (ch !== 0x7C/* | */ && ch !== 0x2D/* - */ && ch !== 0x3A/* : */ && !isSpace(ch)) { return false }

    pos++
  }

  // parse the delimiter row into per-column alignments
  let lineText = getLine(state, startLine + 1)
  let columns = lineText.split('|')
  const aligns = []
  for (let i = 0; i < columns.length; i++) {
    const t = columns[i].trim()
    if (!t) {
      // allow empty columns before and after table, but not in between columns;
      // e.g. allow ` |---| `, disallow ` ---||--- `
      if (i === 0 || i === columns.length - 1) {
        continue
      } else {
        return false
      }
    }

    if (!/^:?-+:?$/.test(t)) { return false }
    if (t.charCodeAt(t.length - 1) === 0x3A/* : */) {
      aligns.push(t.charCodeAt(0) === 0x3A/* : */ ? 'center' : 'right')
    } else if (t.charCodeAt(0) === 0x3A/* : */) {
      aligns.push('left')
    } else {
      aligns.push('')
    }
  }

  // parse the header row
  lineText = getLine(state, startLine).trim()
  if (lineText.indexOf('|') === -1) { return false }
  if (state.sCount[startLine] - state.blkIndent >= 4) { return false }
  columns = escapedSplit(lineText)
  if (columns.length && columns[0] === '') columns.shift()
  if (columns.length && columns[columns.length - 1] === '') columns.pop()

  // header row will define an amount of columns in the entire table,
  // and align row should be exactly the same (the rest of the rows can differ)
  const columnCount = columns.length
  if (columnCount === 0 || columnCount !== aligns.length) { return false }

  if (silent) { return true }

  const oldParentType = state.parentType
  state.parentType = 'table'

  // use 'blockquote' lists for termination because it's
  // the most similar to tables
  const terminatorRules = state.md.block.ruler.getRules('blockquote')

  const token_to = state.push('table_open', 'table', 1)
  // end line is filled in once the extent of the table is known
  const tableLines = [startLine, 0]
  token_to.map = tableLines

  const token_tho = state.push('thead_open', 'thead', 1)
  token_tho.map = [startLine, startLine + 1]

  const token_htro = state.push('tr_open', 'tr', 1)
  token_htro.map = [startLine, startLine + 1]

  for (let i = 0; i < columns.length; i++) {
    const token_ho = state.push('th_open', 'th', 1)
    if (aligns[i]) {
      token_ho.attrs = [['style', 'text-align:' + aligns[i]]]
    }

    const token_il = state.push('inline', '', 0)
    token_il.content = columns[i].trim()
    token_il.children = []

    state.push('th_close', 'th', -1)
  }

  state.push('tr_close', 'tr', -1)
  state.push('thead_close', 'thead', -1)

  let tbodyLines
  let autocompletedCells = 0

  for (nextLine = startLine + 2; nextLine < endLine; nextLine++) {
    if (state.sCount[nextLine] < state.blkIndent) { break }

    let terminate = false
    for (let i = 0, l = terminatorRules.length; i < l; i++) {
      if (terminatorRules[i](state, nextLine, endLine, true)) {
        terminate = true
        break
      }
    }

    if (terminate) { break }
    lineText = getLine(state, nextLine).trim()
    if (!lineText) { break }
    if (state.sCount[nextLine] - state.blkIndent >= 4) { break }
    columns = escapedSplit(lineText)
    if (columns.length && columns[0] === '') columns.shift()
    if (columns.length && columns[columns.length - 1] === '') columns.pop()

    // Stop extending the table once padding short rows would synthesize too
    // many empty cells. The running count can go negative when a row has more
    // cells than the header; that is harmless because the count is only used
    // to limit expansion.
    autocompletedCells += columnCount - columns.length
    if (autocompletedCells > MAX_AUTOCOMPLETED_CELLS) { break }

    if (nextLine === startLine + 2) {
      const token_tbo = state.push('tbody_open', 'tbody', 1)
      // end line is filled in after the last body row
      token_tbo.map = tbodyLines = [startLine + 2, 0]
    }

    const token_tro = state.push('tr_open', 'tr', 1)
    token_tro.map = [nextLine, nextLine + 1]

    // every body row is emitted with exactly columnCount cells:
    // missing cells become empty, extra cells are ignored
    for (let i = 0; i < columnCount; i++) {
      const token_tdo = state.push('td_open', 'td', 1)
      if (aligns[i]) {
        token_tdo.attrs = [['style', 'text-align:' + aligns[i]]]
      }

      const token_il = state.push('inline', '', 0)
      token_il.content = columns[i] ? columns[i].trim() : ''
      token_il.children = []

      state.push('td_close', 'td', -1)
    }
    state.push('tr_close', 'tr', -1)
  }

  if (tbodyLines) {
    state.push('tbody_close', 'tbody', -1)
    tbodyLines[1] = nextLine
  }

  state.push('table_close', 'table', -1)
  tableLines[1] = nextLine

  state.parentType = oldParentType
  state.line = nextLine
  return true
}