showdown/src/subParsers/lists.js

/**
 * Form HTML ordered (numbered) and unordered (bulleted) lists.
 */
showdown.subParser('lists', function (text, options, globals) {
  'use strict';

  var spl = '~1';

  /**
   * Turn the raw markdown of one list (ordered or unordered) into a sequence
   * of tagged `<li>` fragments.
   *
   * Each item is emitted as `spl + type + '<li>...</li>\n'`, where `type` is
   * 'ul' or 'ol' according to that item's own marker, so the caller can split
   * the returned string on `spl` and regroup the items by list type.
   * @param {string} listStr
   * @returns {string}
   */
  function processListItems (listStr) {
    // Item matcher, group by group:
    //   $1  optional newline directly in front of the item ("leading line")
    //   $2  whitespace in front of the marker
    //   $3  the marker: `*`, `+`, `-`, or digits followed by a dot
    //   $4  item text, up to and including one or two trailing newlines
    // The lookahead ends an item at the ~0 sentinel or at the next marker that
    // carries the same leading whitespace as this one ($2).
    var itemRgx = /(\n)?(^[ \t]*)([*+-]|\d+[.])[ \t]+([^\r]+?(\n{1,2}))(?=\n*(~0|\2([*+-]|\d+[.])[ \t]+))/gm;

    /**
     * Replacement callback: renders one matched list item.
     */
    function renderItem (wholeMatch, leadingLine, indent, marker, body) {
      var content = showdown.subParser('outdent')(body, options, globals);

      if (leadingLine || content.search(/\n{2,}/) !== -1) {
        // Preceded by a newline, or containing a blank line itself:
        // run the block-level parsers over it.
        content = showdown.subParser('blockGamut')(content, options, globals);
      } else {
        // Otherwise: look for sub-lists, drop one trailing newline (chomp),
        // then run the span-level parsers.
        content = showdown.subParser('lists')(content, options, globals);
        content = showdown.subParser('spanGamut')(content.replace(/\n$/, ''), options, globals);
      }

      // Prefix the item with its own list type so that consecutive lists of
      // different kinds can be told apart later (issue #142).
      return spl + (/[*+-]/.test(marker) ? 'ul' : 'ol') + '<li>' + content + '</li>\n';
    }

    // globals.gListLevel counts how deep inside lists we currently are: it is
    // raised on entry and lowered on exit, so zero means "not in a list".
    // The distinction matters for text such as
    //
    //    I recommend upgrading to version
    //    8. Oops, now this line is treated
    //    as a sub-list.
    //
    // which has to stay a single paragraph outside of a list, while inside a
    // list (or sub-list) a line starting with digit-period-space opens a
    // sub-list.
    globals.gListLevel++;

    // Collapse trailing blank lines into a single newline.
    var rendered = listStr.replace(/\n{2,}$/, '\n');

    // attacklab: the ~0 sentinel emulates \z; it is appended for the item
    // matcher and stripped again once the items are rendered.
    rendered = (rendered + '~0').replace(itemRgx, renderItem);
    rendered = rendered.replace(/~0/g, '');

    globals.gListLevel--;
    return rendered;
  }

  /**
   * Split consecutive ol/ul lists (related to issue 142)
   *
   * Walks a flat sequence of rendered list items and starts a new list
   * element every time the item type changes, so that e.g. a bulleted list
   * directly followed by a numbered one is not merged into a single list.
   *
   * A list of type `listType` is always opened first, even when `results` is
   * empty or its first item is of the other type.
   * @param {Array} results item strings, each prefixed with its two-character
   *                        list type ('ul' or 'ol')
   * @param {string} listType type of the first list
   * @returns {string}
   */
  function splitConsecutiveLists (results, listType) {
    var groups = [{type: listType, items: []}],
        current = groups[0],
        res = '',
        i;

    for (i = 0; i < results.length; ++i) {
      // the first two characters carry the item's list type, the rest is markup
      var nListType = results[i].slice(0, 2);

      if (nListType !== current.type) {
        // type changed: open a new list
        current = {type: nListType, items: []};
        groups.push(current);
      }
      current.items.push(results[i].slice(2));
    }

    for (i = 0; i < groups.length; ++i) {
      res += '<' + groups[i].type + '>\n' + groups[i].items.join('') + '</' + groups[i].type + '>\n';
    }
    return res;
  }

  // attacklab: add sentinel to hack around khtml/safari bug:
  // http://bugs.webkit.org/show_bug.cgi?id=11231
  text += '~0';

  // Re-usable pattern to match any entire ul or ol list:

  /*
   var whole_list = /
   (									// $1 = whole list
   (								// $2
   [ ]{0,3}					// attacklab: g_tab_width - 1
   ([*+-]|\d+[.])				// $3 = first list item marker
   [ \t]+
   )
   [^\r]+?
   (								// $4
   ~0							// sentinel for workaround; should be $
   |
   \n{2,}
   (?=\S)
   (?!							// Negative lookahead for another list item marker
   [ \t]*
   (?:[*+-]|\d+[.])[ \t]+
   )
   )
   )/g
   */
  var wholeList = /^(([ ]{0,3}([*+-]|\d+[.])[ \t]+)[^\r]+?(~0|\n{2,}(?=\S)(?![ \t]*(?:[*+-]|\d+[.])[ \t]+)))/gm;

  if (globals.gListLevel) {
    text = text.replace(wholeList, function (wholeMatch, m1, m2) {
      var listType = (m2.search(/[*+-]/g) > -1) ? 'ul' : 'ol',
          result = processListItems(m1);

      // Turn double returns into triple returns, so that we can make a
      // paragraph for the last item in a list, if necessary:
      //list = list.replace(/\n{2,}/g, '\n\n\n');
      //result = processListItems(list);

      // Trim any trailing whitespace, to put the closing `</$list_type>`
      // up on the preceding line, to get it past the current stupid
      // HTML block parser. This is a hack to work around the terrible
      // hack that is the HTML block parser.
      result = result.replace(/\s+$/, '');
      var splRes = result.split(spl);
      splRes.shift();
      result = splitConsecutiveLists(splRes, listType);
      return result;
    });
  } else {
    wholeList = /(\n\n|^\n?)(([ ]{0,3}([*+-]|\d+[.])[ \t]+)[^\r]+?(~0|\n{2,}(?=\S)(?![ \t]*(?:[*+-]|\d+[.])[ \t]+)))/g;
    //wholeList = /(\n\n|^\n?)( {0,3}([*+-]|\d+\.)[ \t]+[\s\S]+?)(?=(~0)|(\n\n(?!\t| {2,}| {0,3}([*+-]|\d+\.)[ \t])))/g;

    text = text.replace(wholeList, function (wholeMatch, m1, m2, m3) {

      // Turn double returns into triple returns, so that we can make a
      // paragraph for the last item in a list, if necessary:
      var list = m2.replace(/\n{2,}/g, '\n\n\n'),
      //var list = (m2.slice(-2) !== '~0') ? m2 + '\n' : m2, //add a newline after the list
          listType = (m3.search(/[*+-]/g) > -1) ? 'ul' : 'ol',
          result = processListItems(list),
          splRes = result.split(spl);

      splRes.shift();
      return m1 + splitConsecutiveLists(splRes, listType) + '\n';
    });
  }

  // attacklab: strip sentinel
  text = text.replace(/~0/, '');

  return text;
});
Major code refactoring 2015-01-16 05:21:33 +08:00			`/**`
			`* Form HTML ordered (numbered) and unordered (bulleted) lists.`
			`*/`
			`showdown.subParser('lists', function (text, options, globals) {`
chore(all): code style change 2015-01-19 19:37:21 +08:00			`'use strict';`

fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`var spl = '~1';`

chore(all): code style change 2015-01-19 19:37:21 +08:00			`/**`
			`* Process the contents of a single ordered or unordered list, splitting it`
			`* into individual list items.`
chore(): code fix to pass jscs linter 2015-01-19 22:57:43 +08:00			`* @param {string} listStr`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`* @returns {string}`
chore(all): code style change 2015-01-19 19:37:21 +08:00			`*/`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`function processListItems (listStr) {`
chore(all): code style change 2015-01-19 19:37:21 +08:00			`// The $g_list_level global keeps track of when we're inside a list.`
			`// Each time we enter a list, we increment it; when we leave a list,`
			`// we decrement. If it's zero, we're not in a list anymore.`
			`//`
			`// We do this because when we're not inside a list, we want to treat`
			`// something like this:`
			`//`
			`// I recommend upgrading to version`
			`// 8. Oops, now this line is treated`
			`// as a sub-list.`
			`//`
			`// As a single paragraph, despite the fact that the second line starts`
			`// with a digit-period-space sequence.`
			`//`
			`// Whereas when we're inside a list (or sub-list), that line will be`
			`// treated as the start of a sub-list. What a kludge, huh? This is`
			`// an aspect of Markdown's syntax that's hard to parse perfectly`
			`// without resorting to mind-reading. Perhaps the solution is to`
			`// change the syntax rules such that sub-lists must start with a`
			`// starting cardinal number; e.g. "1." or "a.".`

			`globals.gListLevel++;`

			`// trim trailing blank lines:`
			`listStr = listStr.replace(/\n{2,}$/, '\n');`

			`// attacklab: add sentinel to emulate \z`
			`listStr += '~0';`
Major code refactoring 2015-01-16 05:21:33 +08:00
			`/*`
chore(all): code style change 2015-01-19 19:37:21 +08:00			`list_str = list_str.replace(/`
			`(\n)? // leading line = $1`
			`(^[ \t]*) // leading whitespace = $2`
			`([*+-]\|\d+[.]) [ \t]+ // list marker = $3`
			`([^\r]+? // list item text = $4`
			`(\n{1,2}))`
			`(?= \n* (~0 \| \2 ([*+-]\|\d+[.]) [ \t]+))`
			`/gm, function(){...});`
Major code refactoring 2015-01-16 05:21:33 +08:00			`*/`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`var rgx = /(\n)?(^[ \t]*)([*+-]\|\d+[.])[ \t]+([^\r]+?(\n{1,2}))(?=\n*(~0\|\2([*+-]\|\d+[.])[ \t]+))/gm;`

			`listStr = listStr.replace(rgx, function (wholeMatch, m1, m2, m3, m4) {`
			`var item = showdown.subParser('outdent')(m4, options, globals);`
			`//m1 - LeadingLine`

			`if (m1 \|\| (item.search(/\n{2,}/) > -1)) {`
			`item = showdown.subParser('blockGamut')(item, options, globals);`
			`} else {`
			`// Recursion for sub-lists:`
			`item = showdown.subParser('lists')(item, options, globals);`
			`item = item.replace(/\n$/, ''); // chomp(item)`
			`item = showdown.subParser('spanGamut')(item, options, globals);`
			`}`

			`// this is a "hack" to differentiate between ordered and unordered lists`
			`// related to issue #142`
			`var tp = (m3.search(/[*+-]/g) > -1) ? 'ul' : 'ol';`
			`return spl + tp + '<li>' + item + '</li>\n';`
			`});`
Major code refactoring 2015-01-16 05:21:33 +08:00
			`// attacklab: strip sentinel`
chore(all): code style change 2015-01-19 19:37:21 +08:00			`listStr = listStr.replace(/~0/g, '');`

			`globals.gListLevel--;`
			`return listStr;`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`}`

			`/**`
			`* Slit consecutive ol/ul lists (related to issue 142)`
			`* @param {Array} results`
			`* @param {string} listType`
			`* @returns {string\|*}`
			`*/`
			`function splitConsecutiveLists (results, listType) {`
			`var cthulhu = /(<p[^>]+?>\|<p>\|<\/p>)/img,`
			`holder = [[]],`
			`res = '',`
			`y = 0;`

			`// Initialize first sublist`
			`holder[0].type = listType;`

			`for (var i = 0; i < results.length; ++i) {`
			`var txt = results[i].slice(2),`
			`nListType = results[i].slice(0, 2);`

chore: fix jshint 2015-06-17 08:26:50 +08:00			`if (listType !== nListType) {`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`y++;`
			`holder[y] = [];`
			`holder[y].type = nListType;`
			`listType = nListType;`
			`}`
			`holder[y].push(txt);`
			`}`
			`for (i = 0; i < holder.length; ++i) {`
			`res += '<' + holder[i].type + '>\n';`
			`for (var ii = 0; ii < holder[i].length; ++ii) {`
			`if (holder[i].length > 1 && ii === holder[i].length - 1 && !cthulhu.test(holder[i][ii - 1])) {`
			`//holder[i][ii] = holder[i][ii].replace(cthulhu, '');`
			`}`
			`res += holder[i][ii];`
			`}`
			`res += '</' + holder[i].type + '>\n';`
			`}`
			`return res;`
			`}`
chore(all): code style change 2015-01-19 19:37:21 +08:00
			`// attacklab: add sentinel to hack around khtml/safari bug:`
			`// http://bugs.webkit.org/show_bug.cgi?id=11231`
			`text += '~0';`

fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`// Re-usable pattern to match any entire ul or ol list:`
chore(all): code style change 2015-01-19 19:37:21 +08:00
			`/*`
			`var whole_list = /`
			`( // $1 = whole list`
			`( // $2`
			`[ ]{0,3} // attacklab: g_tab_width - 1`
			`([*+-]\|\d+[.]) // $3 = first list item marker`
			`[ \t]+`
			`)`
			`[^\r]+?`
			`( // $4`
			`~0 // sentinel for workaround; should be $`
			`\|`
			`\n{2,}`
			`(?=\S)`
			`(?! // Negative lookahead for another list item marker`
			`[ \t]*`
			`(?:[*+-]\|\d+[.])[ \t]+`
			`)`
			`)`
			`)/g`
			`*/`
			`var wholeList = /^(([ ]{0,3}([*+-]\|\d+[.])[ \t]+)[^\r]+?(~0\|\n{2,}(?=\S)(?![ \t]*(?:[*+-]\|\d+[.])[ \t]+)))/gm;`

			`if (globals.gListLevel) {`
			`text = text.replace(wholeList, function (wholeMatch, m1, m2) {`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`var listType = (m2.search(/[*+-]/g) > -1) ? 'ul' : 'ol',`
			`result = processListItems(m1);`
chore(all): code style change 2015-01-19 19:37:21 +08:00
			`// Turn double returns into triple returns, so that we can make a`
			`// paragraph for the last item in a list, if necessary:`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`//list = list.replace(/\n{2,}/g, '\n\n\n');`
			`//result = processListItems(list);`
chore(all): code style change 2015-01-19 19:37:21 +08:00
			// Trim any trailing whitespace, to put the closing `</$list_type>`
			`// up on the preceding line, to get it past the current stupid`
			`// HTML block parser. This is a hack to work around the terrible`
			`// hack that is the HTML block parser.`
			`result = result.replace(/\s+$/, '');`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`var splRes = result.split(spl);`
			`splRes.shift();`
			`result = splitConsecutiveLists(splRes, listType);`
chore(all): code style change 2015-01-19 19:37:21 +08:00			`return result;`
			`});`
			`} else {`
			`wholeList = /(\n\n\|^\n?)(([ ]{0,3}([*+-]\|\d+[.])[ \t]+)[^\r]+?(~0\|\n{2,}(?=\S)(?![ \t]*(?:[*+-]\|\d+[.])[ \t]+)))/g;`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`//wholeList = /(\n\n\|^\n?)( {0,3}([*+-]\|\d+\.)[ \t]+[\s\S]+?)(?=(~0)\|(\n\n(?!\t\| {2,}\| {0,3}([*+-]\|\d+\.)[ \t])))/g;`
chore(all): code style change 2015-01-19 19:37:21 +08:00
			`text = text.replace(wholeList, function (wholeMatch, m1, m2, m3) {`

			`// Turn double returns into triple returns, so that we can make a`
			`// paragraph for the last item in a list, if necessary:`
chore(): code style fix and tests fix due to code style changes 2015-01-19 20:04:22 +08:00			`var list = m2.replace(/\n{2,}/g, '\n\n\n'),`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`//var list = (m2.slice(-2) !== '~0') ? m2 + '\n' : m2, //add a newline after the list`
chore(): code style fix and tests fix due to code style changes 2015-01-19 20:04:22 +08:00			`listType = (m3.search(/[*+-]/g) > -1) ? 'ul' : 'ol',`
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`result = processListItems(list),`
			`splRes = result.split(spl);`
chore(all): code style change 2015-01-19 19:37:21 +08:00
fix(subParsers/lists.js): partial fix for odd behavior on multiple consecutive lists Consecutive lists we're previously being condensed into one unique list, with odd paragraph output. This fix correctly splits lists, but does not change the weird paragraph output closes #142 2015-06-13 21:59:14 +08:00			`splRes.shift();`
			`return m1 + splitConsecutiveLists(splRes, listType) + '\n';`
chore(all): code style change 2015-01-19 19:37:21 +08:00			`});`
			`}`

			`// attacklab: strip sentinel`
			`text = text.replace(/~0/, '');`

			`return text;`
Major code refactoring 2015-01-16 05:21:33 +08:00			`});`