From 12e80b7badbc09f75bfbee270dd13ee0f5bdd89c Mon Sep 17 00:00:00 2001 From: thepurpleblob Date: Tue, 21 Aug 2007 09:54:49 +0000 Subject: [PATCH] MDL-10928: Markdown library updated to latest version (Markdown Extra 1.1.4) --- lib/markdown.php | 343 +++++++++++++++++++++++++++++++------------------------ 1 file changed, 195 insertions(+), 148 deletions(-) diff --git a/lib/markdown.php b/lib/markdown.php index 0c2cfed85..6d43f8bca 100755 --- a/lib/markdown.php +++ b/lib/markdown.php @@ -12,8 +12,8 @@ # -define( 'MARKDOWN_VERSION', "1.0.1f" ); # Wed 7 Feb 2007 -define( 'MARKDOWNEXTRA_VERSION', "1.1.2" ); # Wed 7 Feb 2007 +define( 'MARKDOWN_VERSION', "1.0.1h" ); # Fri 3 Aug 2007 +define( 'MARKDOWNEXTRA_VERSION', "1.1.4" ); # Fri 3 Aug 2007 # @@ -71,7 +71,7 @@ function Markdown($text) { Plugin Name: Markdown Extra Plugin URI: http://www.michelf.com/projects/php-markdown/ Description: Markdown syntax allows you to write using an easy-to-read, easy-to-write plain text format. Based on the original Perl version by John Gruber. More... -Version: 1.1.2 +Version: 1.1.4 Author: Michel Fortin Author URI: http://www.michelf.com/ */ @@ -85,9 +85,11 @@ if (isset($wp_version)) { # - Run Markdown on excerpt, then remove all tags. # - Add paragraph tag around the excerpt, but remove it for the excerpt rss. if (MARKDOWN_WP_POSTS) { - remove_filter('the_content', 'wpautop'); - remove_filter('the_excerpt', 'wpautop'); + remove_filter('the_content', 'wpautop'); + remove_filter('the_content_rss', 'wpautop'); + remove_filter('the_excerpt', 'wpautop'); add_filter('the_content', 'Markdown', 6); + add_filter('the_content_rss', 'Markdown', 6); add_filter('get_the_excerpt', 'Markdown', 6); add_filter('get_the_excerpt', 'trim', 7); add_filter('the_excerpt', 'mdwp_add_p'); @@ -105,7 +107,7 @@ if (isset($wp_version)) { # - Scramble important tags before passing them to the kses filter. # - Run Markdown on excerpt then remove paragraph tags. if (MARKDOWN_WP_COMMENTS) { - remove_filter('comment_text', 'wpautop'); + remove_filter('comment_text', 'wpautop', 30); remove_filter('comment_text', 'make_clickable'); add_filter('pre_comment_content', 'Markdown', 6); add_filter('pre_comment_content', 'mdwp_hide_tags', 8); @@ -114,14 +116,12 @@ if (isset($wp_version)) { add_filter('get_comment_excerpt', 'Markdown', 6); add_filter('get_comment_excerpt', 'mdwp_strip_p', 7); - global $markdown_hidden_tags; - $markdown_hidden_tags = array( - '

' => md5('

'), '

' => md5('

'), - '
'	=> md5('
'),	'
'=> md5('
'), - '
    ' => md5('
      '), '
    ' => md5('
'), - ''), - '
  • ' => md5('
  • '), '
  • ' => md5(''), - ); + global $mdwp_hidden_tags, $mdwp_placeholders; + $mdwp_hidden_tags = explode(' ', + '

     
  • '); + $mdwp_placeholders = explode(' ', str_rot13( + 'pEj07ZbbBZ U1kqgh4w4p pre2zmeN6K QTi31t9pre ol0MP1jzJR '. + 'ML5IjmbRol ulANi1NsGY J7zRLJqPul liA8ctl16T K9nhooUHli')); } function mdwp_add_p($text) { @@ -135,14 +135,12 @@ if (isset($wp_version)) { function mdwp_strip_p($t) { return preg_replace('{}i', '', $t); } function mdwp_hide_tags($text) { - global $markdown_hidden_tags; - return str_replace(array_keys($markdown_hidden_tags), - array_values($markdown_hidden_tags), $text); + global $mdwp_hidden_tags, $mdwp_placeholders; + return str_replace($mdwp_hidden_tags, $mdwp_placeholders, $text); } function mdwp_show_tags($text) { - global $markdown_hidden_tags; - return str_replace(array_values($markdown_hidden_tags), - array_keys($markdown_hidden_tags), $text); + global $mdwp_hidden_tags, $mdwp_placeholders; + return str_replace($mdwp_placeholders, $mdwp_hidden_tags, $text); } } @@ -205,15 +203,22 @@ class Markdown_Parser { # Needed to insert a maximum bracked depth while converting to PHP. var $nested_brackets_depth = 6; var $nested_brackets; + + var $nested_url_parenthesis_depth = 4; + var $nested_url_parenthesis; # Table of hash values for escaped characters: var $escape_chars = '\`*_{}[]()>#+-.!'; - var $escape_table = array(); +// var $escape_table = array(); var $backslash_escape_table = array(); # Change to ">" for HTML output. var $empty_element_suffix = MARKDOWN_EMPTY_ELEMENT_SUFFIX; var $tab_width = MARKDOWN_TAB_WIDTH; + + # Change to `true` to disallow markup or entities. + var $no_markup = false; + var $no_entities = false; function Markdown_Parser() { @@ -225,12 +230,16 @@ class Markdown_Parser { $this->nested_brackets = str_repeat('(?>[^\[\]]+|\[', $this->nested_brackets_depth). str_repeat('\])*', $this->nested_brackets_depth); + + $this->nested_url_parenthesis = + str_repeat('(?>[^()\s]+|\(', $this->nested_url_parenthesis_depth). + str_repeat('(?>\)))*', $this->nested_url_parenthesis_depth); # Create an identical table but for escaped characters. foreach (preg_split('/(?!^|$)/', $this->escape_chars) as $char) { - $hash = md5($char); - $this->escape_table[$char] = $hash; - $this->backslash_escape_table["\\$char"] = $hash; + $entity = "&#". ord($char). ";"; +// $this->escape_table[$char] = $entity; + $this->backslash_escape_table["\\$char"] = $entity; } # Sort document, block, and span gamut in ascendent priority order. @@ -245,6 +254,9 @@ class Markdown_Parser { var $titles = array(); var $html_blocks = array(); var $html_hashes = array(); # Contains both blocks and span hashes. + + # Status flag to avoid invalid nesting. + var $in_anchor = false; function transform($text) { @@ -279,8 +291,8 @@ class Markdown_Parser { # Strip any lines consisting only of spaces and tabs. # This makes subsequent regexen easier to write, because we can # match consecutive blank lines with /\n+/ instead of something - # contorted like /[ \t]*\n+/ . - $text = preg_replace('/^[ \t]+$/m', '', $text); + # contorted like /[ ]*\n+/ . + $text = preg_replace('/^[ ]+$/m', '', $text); # Run document gamut methods. foreach ($this->document_gamut as $method => $priority) { @@ -295,7 +307,6 @@ class Markdown_Parser { "stripLinkDefinitions" => 20, "runBasicBlockGamut" => 30, - "unescapeSpecialChars" => 90, ); @@ -309,19 +320,19 @@ class Markdown_Parser { # Link defs are in the form: ^[id]: url "optional title" $text = preg_replace_callback('{ ^[ ]{0,'.$less_than_tab.'}\[(.+)\][ ]?: # id = $1 - [ \t]* + [ ]* \n? # maybe *one* newline - [ \t]* + [ ]* ? # url = $2 - [ \t]* + [ ]* \n? # maybe one newline - [ \t]* + [ ]* (?: (?<=\s) # lookbehind for whitespace ["(] (.*?) # title = $3 [")] - [ \t]* + [ ]* )? # title is optional (?:\n+|\Z) }xm', @@ -339,6 +350,8 @@ class Markdown_Parser { function hashHTMLBlocks($text) { + if ($this->no_markup) return $text; + $less_than_tab = $this->tab_width - 1; # Hashify HTML blocks: @@ -407,10 +420,10 @@ class Markdown_Parser { '.$attr.'>\n # attributes followed by > and \n '.$content.' # content, support nesting # the matching end tag - [ \t]* # trailing spaces/tabs + [ ]* # trailing spaces/tabs (?=\n+|\Z) # followed by a newline or end of document ) - }xm', + }xmi', array(&$this, '_hashHTMLBlocks_callback'), $text); @@ -424,10 +437,10 @@ class Markdown_Parser { '.$attr.'> # attributes followed by > '.$content.' # content, support nesting # the matching end tag - [ \t]* # trailing spaces/tabs + [ ]* # trailing spaces/tabs (?=\n+|\Z) # followed by a newline or end of document ) - }xm', + }xmi', array(&$this, '_hashHTMLBlocks_callback'), $text); @@ -445,10 +458,10 @@ class Markdown_Parser { \b # word break ([^<>])*? # /?> # the matching end tag - [ \t]* + [ ]* (?=\n{2,}|\Z) # followed by a blank line or end of document ) - }x', + }xi', array(&$this, '_hashHTMLBlocks_callback'), $text); @@ -464,7 +477,7 @@ class Markdown_Parser { (?s: ) - [ \t]* + [ ]* (?=\n{2,}|\Z) # followed by a blank line or end of document ) }x', @@ -485,7 +498,7 @@ class Markdown_Parser { .*? \2> ) - [ \t]* + [ ]* (?=\n{2,}|\Z) # followed by a blank line or end of document ) }x', @@ -512,25 +525,28 @@ class Markdown_Parser { $text = $this->unhash($text); # Then hash the block. - $key = md5($text); + $key = "B\x1A". md5($text); $this->html_hashes[$key] = $text; $this->html_blocks[$key] = $text; return $key; # String that will replace the tag. } - function hashSpan($text) { + function hashSpan($text, $word_separator = false) { # # Called whenever a tag must be hashed when a function insert a span-level # element in $text, it pass through this function and is automaticaly - # escaped, blocking invalid nested overlap. + # escaped, blocking invalid nested overlap. If optional argument + # $word_separator is true, surround the hash value by spaces. # # Swap back any tag hash found in $text so we do not have to `unhash` # multiple times at the end. $text = $this->unhash($text); # Then hash the span. - $key = md5($text); + $key = "S\x1A". md5($text); + if ($word_separator) $key = ":$key:"; + $this->html_hashes[$key] = $text; return $key; # String that will replace the span tag. } @@ -583,9 +599,9 @@ class Markdown_Parser { function doHorizontalRules($text) { # Do Horizontal Rules: return preg_replace( - array('{^[ ]{0,2}([ ]?\*[ ]?){3,}[ \t]*$}mx', - '{^[ ]{0,2}([ ]? -[ ]?){3,}[ \t]*$}mx', - '{^[ ]{0,2}([ ]? _[ ]?){3,}[ \t]*$}mx'), + array('{^[ ]{0,2}([ ]?\*[ ]?){3,}[ ]*$}mx', + '{^[ ]{0,2}([ ]? -[ ]?){3,}[ ]*$}mx', + '{^[ ]{0,2}([ ]? _[ ]?){3,}[ ]*$}mx'), "\n".$this->hashBlock("empty_element_suffix")."\n", $text); } @@ -642,15 +658,18 @@ class Markdown_Parser { # value; this is likely overkill, but it should prevent us from colliding # with the escape values by accident. # + if ($this->no_markup) return $text; + $tokens = $this->tokenizeHTML($text); $text = ''; # rebuild $text from the tokens foreach ($tokens as $cur_token) { if ($cur_token[0] == 'tag') { - $cur_token[1] = str_replace('\\', $this->escape_table['\\'], $cur_token[1]); - $cur_token[1] = str_replace(array('`'), $this->escape_table['`'], $cur_token[1]); - $cur_token[1] = str_replace('*', $this->escape_table['*'], $cur_token[1]); - $cur_token[1] = str_replace('_', $this->escape_table['_'], $cur_token[1]); +// $cur_token[1] = str_replace('\\', $this->escape_table['\\'], $cur_token[1]); +// $cur_token[1] = str_replace('`', $this->escape_table['`'], $cur_token[1]); +// $cur_token[1] = str_replace('*', $this->escape_table['*'], $cur_token[1]); +// $cur_token[1] = str_replace('_', $this->escape_table['_'], $cur_token[1]); + $cur_token[1] = $this->hashSpan($cur_token[1]); } $text .= $cur_token[1]; } @@ -662,6 +681,9 @@ class Markdown_Parser { # # Turn Markdown link shortcuts into XHTML tags. # + if ($this->in_anchor) return $text; + $this->in_anchor = true; + # # First, handle reference-style links: [link text] [id] # @@ -690,14 +712,18 @@ class Markdown_Parser { ('.$this->nested_brackets.') # link text = $2 \] \( # literal paren - [ \t]* - ? # href = $3 - [ \t]* - ( # $4 - ([\'"]) # quote char = $5 - (.*?) # Title = $6 - \5 # matching quote - [ \t]* # ignore any spaces/tabs between closing quote and ) + [ ]* + (?: + <(\S*)> # href = $3 + | + ('.$this->nested_url_parenthesis.') # href = $4 + ) + [ ]* + ( # $5 + ([\'"]) # quote char = $6 + (.*?) # Title = $7 + \6 # matching quote + [ ]* # ignore any spaces/tabs between closing quote and ) )? # title is optional \) ) @@ -718,6 +744,7 @@ class Markdown_Parser { // }xs', // array(&$this, '_doAnchors_reference_callback'), $text); + $this->in_anchor = false; return $text; } function _doAnchors_reference_callback($matches) { @@ -757,9 +784,9 @@ class Markdown_Parser { function _doAnchors_inline_callback($matches) { $whole_match = $matches[1]; $link_text = $this->runSpanGamut($matches[2]); - $url = $matches[3]; - $title =& $matches[6]; - + $url = $matches[3] == '' ? $matches[4] : $matches[3]; + $title =& $matches[7]; + $url = $this->encodeAmpsAndAngles($url); $result = "? # src url = $3 - [ \t]* - ( # $4 - ([\'"]) # quote char = $5 - (.*?) # title = $6 - \5 # matching quote - [ \t]* + [ ]* + (?: + <(\S*)> # src url = $3 + | + ('.$this->nested_url_parenthesis.') # src url = $4 + ) + [ ]* + ( # $5 + ([\'"]) # quote char = $6 + (.*?) # title = $7 + \6 # matching quote + [ ]* )? # title is optional \) ) @@ -857,8 +888,8 @@ class Markdown_Parser { function _doImages_inline_callback($matches) { $whole_match = $matches[1]; $alt_text = $matches[2]; - $url = $matches[3]; - $title =& $matches[6]; + $url = $matches[3] == '' ? $matches[4] : $matches[3]; + $title =& $matches[7]; $alt_text = str_replace('"', '"', $alt_text); $result = "\"$alt_text\"";encodeCode($this->outdent($codeblock)); - // $codeblock = $this->detab($codeblock); +// $codeblock = $this->detab($codeblock); # trim leading newlines and trailing whitespace $codeblock = preg_replace(array('/\A\n+/', '/\n+\z/'), '', $codeblock); @@ -1133,8 +1164,8 @@ class Markdown_Parser { } function _doCodeSpans_callback($matches) { $c = $matches[2]; - $c = preg_replace('/^[ \t]*/', '', $c); # leading whitespace - $c = preg_replace('/[ \t]*$/', '', $c); # trailing whitespace + $c = preg_replace('/^[ ]*/', '', $c); # leading whitespace + $c = preg_replace('/[ ]*$/', '', $c); # trailing whitespace $c = $this->encodeCode($c); return $this->hashSpan("$c"); } @@ -1173,13 +1204,13 @@ class Markdown_Parser { (?=\S) # Not followed by whitespace (?!\1\1) # or two others marker chars. ( # $2: Content - (?: + (?> [^*_]+? # Anthing not em markers. | # Balence any regular emphasis inside. \1 (?=\S) .+? (?<=\S) \1 | - (?! \1 ) . # Allow unbalenced * and _. + . # Allow unbalenced * and _. )+? ) (?<=\S) \1\1 # End mark not preceded by whitespace. @@ -1187,7 +1218,7 @@ class Markdown_Parser { array(&$this, '_doItalicAndBold_strong_callback'), $text); # Then : $text = preg_replace_callback( - '{ ( (?[ \t]? # ">" at the start of a line + ^[ ]*>[ ]? # ">" at the start of a line .+\n # rest of the first line (.+\n)* # subsequent consecutive lines \n* # blanks @@ -1222,7 +1253,7 @@ class Markdown_Parser { function _doBlockQuotes_callback($matches) { $bq = $matches[1]; # trim one level of quoting - trim whitespace-only lines - $bq = preg_replace(array('/^[ \t]*>[ \t]?/m', '/^[ \t]+$/m'), '', $bq); + $bq = preg_replace(array('/^[ ]*>[ ]?/m', '/^[ ]+$/m'), '', $bq); $bq = $this->runBlockGamut($bq); # recurse $bq = preg_replace('/^/m', " ", $bq); @@ -1256,7 +1287,7 @@ class Markdown_Parser { foreach ($grafs as $key => $value) { if (!isset( $this->html_blocks[$value] )) { $value = $this->runSpanGamut($value); - $value = preg_replace('/^([ \t]*)/', "

    ", $value); + $value = preg_replace('/^([ ]*)/', "

    ", $value); $value .= "

    "; $grafs[$key] = $this->unhash($value); } @@ -1315,6 +1346,11 @@ class Markdown_Parser { function encodeAmpsAndAngles($text) { # Smart processing for ampersands and angle brackets that need to be encoded. + if ($this->no_entities) { + $text = str_replace('&', '&', $text); + $text = str_replace('<', '<', $text); + return $text; + } # Ampersand-encoding based entirely on Nat Irons's Amputator MT plugin: # http://bumppo.net/projects/amputator/ @@ -1334,9 +1370,11 @@ class Markdown_Parser { # Returns: The string, with after processing the following backslash # escape sequences. # - # Must process escaped backslashes first. - return str_replace(array_keys($this->backslash_escape_table), - array_values($this->backslash_escape_table), $text); + # Must process escaped backslashes first (should be first in list). + foreach ($this->backslash_escape_table as $search => $replacement) { + $text = str_replace($search, $this->hashSpan($replacement), $text); + } + return $text; } @@ -1366,7 +1404,6 @@ class Markdown_Parser { } function _doAutoLinks_email_callback($matches) { $address = $matches[1]; - $address = $this->unescapeSpecialChars($address); $link = $this->encodeEmailAddress($address); return $this->hashSpan($link); } @@ -1413,15 +1450,6 @@ class Markdown_Parser { } - function unescapeSpecialChars($text) { - # - # Swap back in all the special characters we've hidden. - # - return str_replace(array_values($this->escape_table), - array_keys($this->escape_table), $text); - } - - function tokenizeHTML($str) { # # Parameter: String containing HTML + Markdown markup. @@ -1512,7 +1540,7 @@ class Markdown_Parser { # tab characters. Then we reconstruct every line by adding the # appropriate number of space between each blocks. - $strlen = $this->utf8_strlen; # best strlen function for UTF-8. + $strlen = $this->utf8_strlen; # strlen function for UTF-8. $lines = explode("\n", $text); $text = ""; @@ -1535,18 +1563,14 @@ class Markdown_Parser { function _initDetab() { # # Check for the availability of the function in the `utf8_strlen` property - # (probably `mb_strlen`). If the function is not available, create a + # (initially `mb_strlen`). If the function is not available, create a # function that will loosely count the number of UTF-8 characters with a # regular expression. # if (function_exists($this->utf8_strlen)) return; - $this->utf8_strlen = 'Markdown_UTF8_strlen'; - - if (function_exists($this->utf8_strlen)) return; - function Markdown_UTF8_strlen($text) { - return preg_match_all('/[\x00-\xBF]|[\xC0-\xFF][\x80-\xBF]*/', - $text, $m); - } + $this->utf8_strlen = create_function('$text', 'return preg_match_all( + "/[\\\\x00-\\\\xBF]|[\\\\xC0-\\\\xFF][\\\\x80-\\\\xBF]*/", + $text, $m);'); } @@ -1599,8 +1623,8 @@ class MarkdownExtra_Parser extends Markdown_Parser { "doDefLists" => 45, ); $this->span_gamut += array( - "doFootnotes" => 4, - "doAbbreviations" => 5, + "doFootnotes" => 5, + "doAbbreviations" => 70, ); parent::Markdown_Parser(); @@ -1614,6 +1638,9 @@ class MarkdownExtra_Parser extends Markdown_Parser { var $abbr_matches = array(); var $html_cleans = array(); + # Status flag to avoid invalid nesting. + var $in_footnote = false; + function transform($text) { # @@ -1727,7 +1754,7 @@ class MarkdownExtra_Parser extends Markdown_Parser { (?!\s)'.$enclosing_tag.' ) \s* # Whitespace. - (?: + (?> ".*?" | # Double quotes (can contain `>`) \'.*?\' | # Single quotes (can contain `>`) .+? # Anything but quotes and `>`. @@ -1763,8 +1790,9 @@ class MarkdownExtra_Parser extends Markdown_Parser { # If in Markdown span mode, add a empty-string span-level hash # after each newline to prevent triggering any block element. if ($span) { - $newline = $this->hashSpan("") . "\n"; - $parts[0] = str_replace("\n", $newline, $parts[0]); + $void = $this->hashSpan("", true) ; + $newline = $this->hashSpan("", true) . "\n"; + $parts[0] = $void . str_replace("\n", $newline, $parts[0]) . $void; } $parsed .= $parts[0]; # Text before current tag. @@ -1879,9 +1907,14 @@ class MarkdownExtra_Parser extends Markdown_Parser { \s* # Eat whitespace before the `markdown` attribute markdown \s*=\s* - (["\']) # $1: quote delimiter - (.*?) # $2: attribute value - \1 # matching delimiter + (?: + (["\']) # $1: quote delimiter + (.*?) # $2: attribute value + \1 # matching delimiter + | + ([^\s>]*) # $3: unquoted attribute value + ) + () # $4: make $3 always defined (avoid warnings) }xs'; # Regex to match any tag. @@ -1890,7 +1923,7 @@ class MarkdownExtra_Parser extends Markdown_Parser { ".*?" | # Double quotes (can contain `>`) \'.*?\' | # Single quotes (can contain `>`) .+? # Anything but quotes and `>`. @@ -1967,14 +2000,14 @@ class MarkdownExtra_Parser extends Markdown_Parser { # Check for `markdown="1"` attribute and handle it. # if ($md_attr && - preg_match($markdown_attr_match, $tag, $attr_matches) && - preg_match('/^1|block|span$/', $attr_matches[2])) + preg_match($markdown_attr_match, $tag, $attr_m) && + preg_match('/^1|block|span$/', $attr_m[2] . $attr_m[3])) { # Remove `markdown` attribute from opening tag. $tag = preg_replace($markdown_attr_match, '', $tag); # Check if text inside this tag must be parsed in span mode. - $this->mode = $attr_matches[2]; + $this->mode = $attr_m[2] . $attr_m[3]; $span_mode = $this->mode == 'span' || $this->mode != 'block' && preg_match("{^<(?:$this->contain_span_tags)\b}", $tag); @@ -2033,7 +2066,7 @@ class MarkdownExtra_Parser extends Markdown_Parser { $text = $this->unhash($text); # Then hash the tag. - $key = md5($text); + $key = "C\x1A". md5($text); $this->html_cleans[$key] = $text; $this->html_hashes[$key] = $text; return $key; # String that will replace the clean tag. @@ -2052,10 +2085,10 @@ class MarkdownExtra_Parser extends Markdown_Parser { # -------- # $text = preg_replace_callback( - '{ (^.+?) (?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? [ \t]*\n=+[ \t]*\n+ }mx', + '{ (^.+?) (?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? [ ]*\n=+[ ]*\n+ }mx', array(&$this, '_doHeaders_callback_setext_h1'), $text); $text = preg_replace_callback( - '{ (^.+?) (?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? [ \t]*\n-+[ \t]*\n+ }mx', + '{ (^.+?) (?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? [ ]*\n-+[ ]*\n+ }mx', array(&$this, '_doHeaders_callback_setext_h2'), $text); # atx-style headers: @@ -2067,12 +2100,12 @@ class MarkdownExtra_Parser extends Markdown_Parser { # $text = preg_replace_callback('{ ^(\#{1,6}) # $1 = string of #\'s - [ \t]* + [ ]* (.+?) # $2 = Header text - [ \t]* + [ ]* \#* # optional closing #\'s (not counted) (?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? # id attribute - [ \t]* + [ ]* \n+ }xm', array(&$this, '_doHeaders_callback_atx'), $text); @@ -2368,14 +2401,14 @@ class MarkdownExtra_Parser extends Markdown_Parser { (?=\S) # Not followed by whitespace (?!__) # or two others marker chars. ( # $2: Content - (?: + (?> [^_]+? # Anthing not em markers. | # Balence any regular _ emphasis inside. (? [^*]+? # Anthing not em markers. | # Balence any regular * emphasis inside. \* (?=\S) (.+?) (?<=\S) \* + | + \* # Allow unbalenced as last resort. )+? ) (?<=\S) \*\* # End mark not preceded by whitespace. @@ -2401,7 +2436,7 @@ class MarkdownExtra_Parser extends Markdown_Parser { # Then : $text = preg_replace_callback(array( '{ ( (?html_blocks[$block_key]) && !isset($this->html_cleans[$clean_key])); @@ -2461,7 +2496,7 @@ class MarkdownExtra_Parser extends Markdown_Parser { # Link defs are in the form: [^id]: url "optional title" $text = preg_replace_callback('{ ^[ ]{0,'.$less_than_tab.'}\[\^(.+?)\][ ]?: # note_id = $1 - [ \t]* + [ ]* \n? # maybe *one* newline ( # text = $2 (no blank lines allowed) (?: @@ -2479,7 +2514,7 @@ class MarkdownExtra_Parser extends Markdown_Parser { return $text; } function _stripFootnotes_callback($matches) { - $note_id = $matches[1]; + $note_id = $this->fn_id_prefix . $matches[1]; $this->footnotes[$note_id] = $this->outdent($matches[2]); return ''; # String that will replace the block } @@ -2490,7 +2525,9 @@ class MarkdownExtra_Parser extends Markdown_Parser { # Replace footnote references in $text [^id] with a special text-token # which will be can be # - $text = preg_replace('{\[\^(.+?)\]}', "a\0fn:\\1\0z", $text); + if (!$this->in_footnote && !$this->in_anchor) { + $text = preg_replace('{\[\^(.+?)\]}', "F\x1Afn:\\1\x1A:", $text); + } return $text; } @@ -2499,7 +2536,8 @@ class MarkdownExtra_Parser extends Markdown_Parser { # # Append footnote list to text. # - $text = preg_replace_callback('{a\0fn:(.*?)\0z}', + + $text = preg_replace_callback('{F\x1Afn:(.*?)\x1A:}', array(&$this, '_appendFootnotes_callback'), $text); if (!empty($this->footnotes_ordered)) { @@ -2523,6 +2561,8 @@ class MarkdownExtra_Parser extends Markdown_Parser { } $num = 0; + $this->in_footnote = true; + foreach ($this->footnotes_ordered as $note_id => $footnote) { $footnote .= "\n"; # Need to append newline before parsing. $footnote = $this->runBlockGamut("$footnote\n"); @@ -2542,10 +2582,10 @@ class MarkdownExtra_Parser extends Markdown_Parser { $text .= "\n\n"; } + $this->in_footnote = false; + $text .= "\n"; $text .= ""; - - $text = preg_replace('{a\{fn:(.*?)\}z}', '[^\\1]', $text); } return $text; } @@ -2589,8 +2629,7 @@ class MarkdownExtra_Parser extends Markdown_Parser { function stripAbbreviations($text) { # - # Strips abbreviations from text, stores the URLs and titles in - # hash references. + # Strips abbreviations from text, stores titles in hash references. # $less_than_tab = $this->tab_width - 1; @@ -2614,12 +2653,16 @@ class MarkdownExtra_Parser extends Markdown_Parser { function doAbbreviations($text) { # - # Replace footnote references in $text [^id] with a link to the footnote. + # Find defined abbreviations in text and wrap them in elements. # if ($this->abbr_matches) { - $regex = '{(?abbr_matches) .')(?!\w)}'; - - $text = preg_replace_callback($regex, + // cannot use the /x modifier because abbr_matches may + // contain spaces: + $text = preg_replace_callback('{'. + '(?abbr_matches) .')'. + '(?![\w\x1A])'. + '}', array(&$this, '_doAbbreviations_callback'), $text); } return $text; @@ -2686,6 +2729,10 @@ Version History See Readme file for details. +Extra 1.1.4 (3 Aug 2007): + +Extra 1.1.3 (3 Jul 2007): + Extra 1.1.2 (7 Feb 2007) Extra 1.1.1 (28 Dec 2006) -- 2.11.4.GIT