PHP Markdown Extra 1.1.3b1

2007-08-14 16:43:52 -04:00 · 2007-08-14 16:43:52 -04:00 · 2008178bc0
commit 2008178bc0
parent 128de3aa97
2 changed files with 229 additions and 168 deletions
--- a/Readme.text
+++ b/Readme.text
@ -1,7 +1,7 @@
 PHP Markdown Extra
 ==================

-Version 1.1.2 - Wed 7 Feb 2007
+Version 1.1.3b1 - Mon 21 May 2007

 by Michel Fortin
 <http://www.michelf.com/>
--- a/markdown.php
+++ b/markdown.php
@ -12,8 +12,8 @@
 #


-define( 'MARKDOWN_VERSION',       "1.0.1f" ); # Wed 7 Feb 2007
-define( 'MARKDOWNEXTRA_VERSION',  "1.1.2" );  # Wed 7 Feb 2007
+define( 'MARKDOWN_VERSION',       "1.0.2b8" ); # Mon 21 May 2007
+define( 'MARKDOWNEXTRA_VERSION',  "1.1.3b1" ); # Mon 21 May 2007


 #
@ -71,7 +71,7 @@ function Markdown($text) {
 Plugin Name: Markdown Extra
 Plugin URI: http://www.michelf.com/projects/php-markdown/
 Description: <a href="http://daringfireball.net/projects/markdown/syntax">Markdown syntax</a> allows you to write using an easy-to-read, easy-to-write plain text format. Based on the original Perl version by <a href="http://daringfireball.net/">John Gruber</a>. <a href="http://www.michelf.com/projects/php-markdown/">More...</a>
-Version: 1.1.2
+Version: 1.1.3
 Author: Michel Fortin
 Author URI: http://www.michelf.com/
 */
@ -85,9 +85,11 @@ if (isset($wp_version)) {
 	# - Run Markdown on excerpt, then remove all tags.
 	# - Add paragraph tag around the excerpt, but remove it for the excerpt rss.
 	if (MARKDOWN_WP_POSTS) {
-		remove_filter('the_content',  'wpautop');
-		remove_filter('the_excerpt',  'wpautop');
+		remove_filter('the_content',     'wpautop');
+        remove_filter('the_content_rss', 'wpautop');
+		remove_filter('the_excerpt',     'wpautop');
 		add_filter('the_content',     'Markdown', 6);
+        add_filter('the_content_rss', 'Markdown', 6);
 		add_filter('get_the_excerpt', 'Markdown', 6);
 		add_filter('get_the_excerpt', 'trim', 7);
 		add_filter('the_excerpt',     'mdwp_add_p');
@ -105,7 +107,7 @@ if (isset($wp_version)) {
 	# - Scramble important tags before passing them to the kses filter.
 	# - Run Markdown on excerpt then remove paragraph tags.
 	if (MARKDOWN_WP_COMMENTS) {
-		remove_filter('comment_text', 'wpautop');
+		remove_filter('comment_text', 'wpautop', 30);
 		remove_filter('comment_text', 'make_clickable');
 		add_filter('pre_comment_content', 'Markdown', 6);
 		add_filter('pre_comment_content', 'mdwp_hide_tags', 8);
@ -114,14 +116,12 @@ if (isset($wp_version)) {
 		add_filter('get_comment_excerpt', 'Markdown', 6);
 		add_filter('get_comment_excerpt', 'mdwp_strip_p', 7);
 	
-		global $markdown_hidden_tags;
-		$markdown_hidden_tags = array(
-			'<p>'	=> md5('<p>'),		'</p>'	=> md5('</p>'),
-			'<pre>'	=> md5('<pre>'),	'</pre>'=> md5('</pre>'),
-			'<ol>'	=> md5('<ol>'),		'</ol>'	=> md5('</ol>'),
-			'<ul>'	=> md5('<ul>'),		'</ul>'	=> md5('</ul>'),
-			'<li>'	=> md5('<li>'),		'</li>'	=> md5('</li>'),
-			);
+		global $wp_markdown_hidden;
+		$wp_markdown_hidden[1] =
+			'<p> </p> <pre> </pre> <ol> </ol> <ul> </ul> <li> </li>';
+		$wp_markdown_hidden[2] = explode(str_rot13(
+			'pEj07ZbbBZ U1kqgh4w4p pre2zmeN6K QTi31t9pre ol0MP1jzJR '.
+			'ML5IjmbRol ulANi1NsGY J7zRLJqPul liA8ctl16T K9nhooUHli'));
 	}
 	
 	function mdwp_add_p($text) {
@ -135,9 +135,9 @@ if (isset($wp_version)) {
 	function mdwp_strip_p($t) { return preg_replace('{</?p>}i', '', $t); }

 	function mdwp_hide_tags($text) {
-		global $markdown_hidden_tags;
-		return str_replace(array_keys($markdown_hidden_tags), 
-							array_values($markdown_hidden_tags), $text);
+		global $wp_markdown_hidden;
+		return str_replace(explode($wp_markdown_hidden), 
+							explode($wp_markdown_hidden), $text);
 	}
 	function mdwp_show_tags($text) {
 		global $markdown_hidden_tags;
@ -205,6 +205,9 @@ class Markdown_Parser {
 	# Needed to insert a maximum bracked depth while converting to PHP.
 	var $nested_brackets_depth = 6;
 	var $nested_brackets;
+	
+	var $nested_url_parenthesis_depth = 4;
+	var $nested_url_parenthesis;

 	# Table of hash values for escaped characters:
 	var $escape_chars = '\`*_{}[]()>#+-.!';
@ -225,12 +228,16 @@ class Markdown_Parser {
 		$this->nested_brackets = 
 			str_repeat('(?>[^\[\]]+|\[', $this->nested_brackets_depth).
 			str_repeat('\])*', $this->nested_brackets_depth);
+	
+		$this->nested_url_parenthesis = 
+			str_repeat('(?>[^()\s]+|\(', $this->nested_url_parenthesis_depth).
+			str_repeat('(?>\)))*', $this->nested_url_parenthesis_depth);
 		
 		# Create an identical table but for escaped characters.
 		foreach (preg_split('/(?!^|$)/', $this->escape_chars) as $char) {
-			$hash = md5($char);
-			$this->escape_table[$char] = $hash;
-			$this->backslash_escape_table["\\$char"] = $hash;
+			$entity = "&#". ord($char). ";";
+			$this->escape_table[$char] = $entity;
+			$this->backslash_escape_table["\\$char"] = $entity;
 		}
 		
 		# Sort document, block, and span gamut in ascendent priority order.
@ -245,6 +252,9 @@ class Markdown_Parser {
 	var $titles = array();
 	var $html_blocks = array();
 	var $html_hashes = array(); # Contains both blocks and span hashes.
+	
+	# Status flag to avoid invalid nesting.
+	var $in_anchor = false;


 	function transform($text) {
@ -279,8 +289,8 @@ class Markdown_Parser {
 		# Strip any lines consisting only of spaces and tabs.
 		# This makes subsequent regexen easier to write, because we can
 		# match consecutive blank lines with /\n+/ instead of something
-		# contorted like /[ \t]*\n+/ .
-		$text = preg_replace('/^[ \t]+$/m', '', $text);
+		# contorted like /[ ]*\n+/ .
+		$text = preg_replace('/^[ ]+$/m', '', $text);

 		# Run document gamut methods.
 		foreach ($this->document_gamut as $method => $priority) {
@ -295,7 +305,6 @@ class Markdown_Parser {
 		"stripLinkDefinitions" => 20,
 		
 		"runBasicBlockGamut"   => 30,
-		"unescapeSpecialChars" => 90,
 		);


@ -309,19 +318,19 @@ class Markdown_Parser {
 		# Link defs are in the form: ^[id]: url "optional title"
 		$text = preg_replace_callback('{
 							^[ ]{0,'.$less_than_tab.'}\[(.+)\][ ]?:	# id = $1
-							  [ \t]*
+							  [ ]*
 							  \n?				# maybe *one* newline
-							  [ \t]*
+							  [ ]*
 							<?(\S+?)>?			# url = $2
-							  [ \t]*
+							  [ ]*
 							  \n?				# maybe one newline
-							  [ \t]*
+							  [ ]*
 							(?:
 								(?<=\s)			# lookbehind for whitespace
 								["(]
 								(.*?)			# title = $3
 								[")]
-								[ \t]*
+								[ ]*
 							)?	# title is optional
 							(?:\n+|\Z)
 			}xm',
@ -407,7 +416,7 @@ class Markdown_Parser {
 						'.$attr.'>\n		# attributes followed by > and \n
 						'.$content.'		# content, support nesting
 						</\2>				# the matching end tag
-						[ \t]*				# trailing spaces/tabs
+						[ ]*				# trailing spaces/tabs
 						(?=\n+|\Z)	# followed by a newline or end of document
 					)
 			}xm',
@ -424,7 +433,7 @@ class Markdown_Parser {
 						'.$attr.'>			# attributes followed by >
 						'.$content.'		# content, support nesting
 						</\2>				# the matching end tag
-						[ \t]*				# trailing spaces/tabs
+						[ ]*				# trailing spaces/tabs
 						(?=\n+|\Z)	# followed by a newline or end of document
 					)
 			}xm',
@ -445,7 +454,7 @@ class Markdown_Parser {
 						\b					# word break
 						([^<>])*?			# 
 						/?>					# the matching end tag
-						[ \t]*
+						[ ]*
 						(?=\n{2,}|\Z)		# followed by a blank line or end of document
 					)
 			}x',
@ -464,7 +473,7 @@ class Markdown_Parser {
 					(?s:
 						<!-- .*? -->
 					)
-					[ \t]*
+					[ ]*
 					(?=\n{2,}|\Z)		# followed by a blank line or end of document
 				)
 			}x',
@ -485,7 +494,7 @@ class Markdown_Parser {
 						.*?
 						\2>
 					)
-					[ \t]*
+					[ ]*
 					(?=\n{2,}|\Z)		# followed by a blank line or end of document
 				)
 			}x',
@ -512,25 +521,28 @@ class Markdown_Parser {
 		$text = $this->unhash($text);
 		
 		# Then hash the block.
-		$key = md5($text);
+		$key = "B\x1A". md5($text);
 		$this->html_hashes[$key] = $text;
 		$this->html_blocks[$key] = $text;
 		return $key; # String that will replace the tag.
 	}


-	function hashSpan($text) {
+	function hashSpan($text, $word_separator = false) {
 	#
 	# Called whenever a tag must be hashed when a function insert a span-level 
 	# element in $text, it pass through this function and is automaticaly 
-	# escaped, blocking invalid nested overlap.
+	# escaped, blocking invalid nested overlap. If optional argument 
+	# $word_separator is true, surround the hash value by spaces.
 	#
 		# Swap back any tag hash found in $text so we do not have to `unhash`
 		# multiple times at the end.
 		$text = $this->unhash($text);
 		
 		# Then hash the span.
-		$key = md5($text);
+		$key = "S\x1A". md5($text);
+		if ($word_separator) $key = ":$key:";
+		
 		$this->html_hashes[$key] = $text;
 		return $key; # String that will replace the span tag.
 	}
@ -583,9 +595,9 @@ class Markdown_Parser {
 	function doHorizontalRules($text) {
 		# Do Horizontal Rules:
 		return preg_replace(
-			array('{^[ ]{0,2}([ ]?\*[ ]?){3,}[ \t]*$}mx',
-				  '{^[ ]{0,2}([ ]? -[ ]?){3,}[ \t]*$}mx',
-				  '{^[ ]{0,2}([ ]? _[ ]?){3,}[ \t]*$}mx'),
+			array('{^[ ]{0,2}([ ]?\*[ ]?){3,}[ ]*$}mx',
+				  '{^[ ]{0,2}([ ]? -[ ]?){3,}[ ]*$}mx',
+				  '{^[ ]{0,2}([ ]? _[ ]?){3,}[ ]*$}mx'),
 			"\n".$this->hashBlock("<hr$this->empty_element_suffix")."\n", 
 			$text);
 	}
@ -648,7 +660,7 @@ class Markdown_Parser {
 		foreach ($tokens as $cur_token) {
 			if ($cur_token[0] == 'tag') {
 				$cur_token[1] = str_replace('\\', $this->escape_table['\\'], $cur_token[1]);
-				$cur_token[1] = str_replace(array('`'), $this->escape_table['`'], $cur_token[1]);
+				$cur_token[1] = str_replace('`', $this->escape_table['`'], $cur_token[1]);
 				$cur_token[1] = str_replace('*', $this->escape_table['*'], $cur_token[1]);
 				$cur_token[1] = str_replace('_', $this->escape_table['_'], $cur_token[1]);
 			}
@ -662,6 +674,9 @@ class Markdown_Parser {
 	#
 	# Turn Markdown link shortcuts into XHTML <a> tags.
 	#
+		if ($this->in_anchor) return $text;
+		$this->in_anchor = true;
+		
 		#
 		# First, handle reference-style links: [link text] [id]
 		#
@ -690,14 +705,18 @@ class Markdown_Parser {
 				('.$this->nested_brackets.')	# link text = $2
 			  \]
 			  \(			# literal paren
-				[ \t]*
-				<?(.*?)>?	# href = $3
-				[ \t]*
-				(			# $4
-				  ([\'"])	# quote char = $5
-				  (.*?)		# Title = $6
-				  \5		# matching quote
-				  [ \t]*	# ignore any spaces/tabs between closing quote and )
+				[ ]*
+				(?:
+					<(\S*)>	# href = $3
+				|
+					('.$this->nested_url_parenthesis.')	# href = $4
+				)
+				[ ]*
+				(			# $5
+				  ([\'"])	# quote char = $6
+				  (.*?)		# Title = $7
+				  \6		# matching quote
+				  [ ]*	# ignore any spaces/tabs between closing quote and )
 				)?			# title is optional
 			  \)
 			)
@ -709,15 +728,16 @@ class Markdown_Parser {
 		# These must come last in case you've also got [link test][1]
 		# or [link test](/foo)
 		#
-//		$text = preg_replace_callback('{
-//			(					# wrap whole match in $1
-//			  \[
-//				([^\[\]]+)		# link text = $2; can\'t contain [ or ]
-//			  \]
-//			)
-//			}xs',
-//			array(&$this, '_doAnchors_reference_callback'), $text);
+		$text = preg_replace_callback('{
+			(					# wrap whole match in $1
+			  \[
+				([^\[\]]+)		# link text = $2; can\'t contain [ or ]
+			  \]
+			)
+			}xs',
+			array(&$this, '_doAnchors_reference_callback'), $text);

+		$this->in_anchor = false;
 		return $text;
 	}
 	function _doAnchors_reference_callback($matches) {
@ -757,9 +777,9 @@ class Markdown_Parser {
 	function _doAnchors_inline_callback($matches) {
 		$whole_match	=  $matches[1];
 		$link_text		=  $this->runSpanGamut($matches[2]);
-		$url			=  $matches[3];
-		$title			=& $matches[6];
-		
+		$url			=  $matches[3] == '' ? $matches[4] : $matches[3];
+		$title			=& $matches[7];
+
 		$url = $this->encodeAmpsAndAngles($url);

 		$result = "<a href=\"$url\"";
@ -811,14 +831,18 @@ class Markdown_Parser {
 			  \]
 			  \s?			# One optional whitespace character
 			  \(			# literal paren
-				[ \t]*
-				<?(\S+?)>?	# src url = $3
-				[ \t]*
-				(			# $4
-				  ([\'"])	# quote char = $5
-				  (.*?)		# title = $6
-				  \5		# matching quote
-				  [ \t]*
+				[ ]*
+				(?:
+					<(\S*)>	# src url = $3
+				|
+					('.$this->nested_url_parenthesis.')	# src url = $4
+				)
+				[ ]*
+				(			# $5
+				  ([\'"])	# quote char = $6
+				  (.*?)		# title = $7
+				  \6		# matching quote
+				  [ ]*
 				)?			# title is optional
 			  \)
 			)
@ -857,8 +881,8 @@ class Markdown_Parser {
 	function _doImages_inline_callback($matches) {
 		$whole_match	= $matches[1];
 		$alt_text		= $matches[2];
-		$url			= $matches[3];
-		$title			=& $matches[6];
+		$url			= $matches[3] == '' ? $matches[4] : $matches[3];
+		$title			=& $matches[7];

 		$alt_text = str_replace('"', '&quot;', $alt_text);
 		$result = "<img src=\"$url\" alt=\"$alt_text\"";
@ -880,9 +904,9 @@ class Markdown_Parser {
 		#	  Header 2
 		#	  --------
 		#
-		$text = preg_replace_callback('{ ^(.+)[ \t]*\n=+[ \t]*\n+ }mx',
+		$text = preg_replace_callback('{ ^(.+?)[ ]*\n=+[ ]*\n+ }mx',
 			array(&$this, '_doHeaders_callback_setext_h1'), $text);
-		$text = preg_replace_callback('{ ^(.+)[ \t]*\n-+[ \t]*\n+ }mx',
+		$text = preg_replace_callback('{ ^(.+?)[ ]*\n-+[ ]*\n+ }mx',
 			array(&$this, '_doHeaders_callback_setext_h2'), $text);

 		# atx-style headers:
@ -894,9 +918,9 @@ class Markdown_Parser {
 		#
 		$text = preg_replace_callback('{
 				^(\#{1,6})	# $1 = string of #\'s
-				[ \t]*
+				[ ]*
 				(.+?)		# $2 = Header text
-				[ \t]*
+				[ ]*
 				\#*			# optional closing #\'s (not counted)
 				\n+
 			}xm',
@ -939,7 +963,7 @@ class Markdown_Parser {
 				  (								# $2
 					[ ]{0,'.$less_than_tab.'}
 					('.$marker.')				# $3 = first list item marker
-					[ \t]+
+					[ ]+
 				  )
 				  (?s:.+?)
 				  (								# $4
@ -948,8 +972,8 @@ class Markdown_Parser {
 					  \n{2,}
 					  (?=\S)
 					  (?!						# Negative lookahead for another list item marker
-						[ \t]*
-						'.$marker.'[ \t]+
+						[ ]*
+						'.$marker.'[ ]+
 					  )
 				  )
 				)
@ -1029,11 +1053,11 @@ class Markdown_Parser {

 		$list_str = preg_replace_callback('{
 			(\n)?							# leading line = $1
-			(^[ \t]*)						# leading whitespace = $2
-			('.$marker_any.') [ \t]+		# list marker = $3
+			(^[ ]*)						# leading whitespace = $2
+			('.$marker_any.') [ ]+		# list marker = $3
 			((?s:.+?))						# list item text   = $4
 			(?:(\n+(?=\n))|\n)				# tailing blank line = $5
-			(?= \n* (\z | \2 ('.$marker_any.') [ \t]+))
+			(?= \n* (\z | \2 ('.$marker_any.') [ ]+))
 			}xm',
 			array(&$this, '_processListItems_callback'), $list_str);

@ -1084,7 +1108,7 @@ class Markdown_Parser {
 		$codeblock = $matches[1];

 		$codeblock = $this->encodeCode($this->outdent($codeblock));
-	//	$codeblock = $this->detab($codeblock);
+//		$codeblock = $this->detab($codeblock);
 		# trim leading newlines and trailing whitespace
 		$codeblock = preg_replace(array('/\A\n+/', '/\n+\z/'), '', $codeblock);

@ -1133,8 +1157,8 @@ class Markdown_Parser {
 	}
 	function _doCodeSpans_callback($matches) {
 		$c = $matches[2];
-		$c = preg_replace('/^[ \t]*/', '', $c); # leading whitespace
-		$c = preg_replace('/[ \t]*$/', '', $c); # trailing whitespace
+		$c = preg_replace('/^[ ]*/', '', $c); # leading whitespace
+		$c = preg_replace('/[ ]*$/', '', $c); # trailing whitespace
 		$c = $this->encodeCode($c);
 		return $this->hashSpan("<code>$c</code>");
 	}
@ -1173,13 +1197,13 @@ class Markdown_Parser {
 				(?=\S) 					# Not followed by whitespace 
 				(?!\1\1)				#   or two others marker chars.
 				(						# $2: Content
-					(?:
+					(?>
 						[^*_]+?			# Anthing not em markers.
 					|
 										# Balence any regular emphasis inside.
 						\1 (?=\S) .+? (?<=\S) \1
 					|
-						(?! \1 ) .		# Allow unbalenced * and _.
+						.				# Allow unbalenced * and _.
 					)+?
 				)
 				(?<=\S) \1\1			# End mark not preceded by whitespace.
@ -1187,7 +1211,7 @@ class Markdown_Parser {
 			array(&$this, '_doItalicAndBold_strong_callback'), $text);
 		# Then <em>:
 		$text = preg_replace_callback(
-			'{ ( (?<!\*)\* | (?<!_)_ ) (?=\S) (?! \1) (.+?) (?<=\S) \1 }sx',
+			'{ ( (?<!\*)\* | (?<!_)_ ) (?=\S) (?! \1) (.+?) (?<=\S)(?<!\s(?=\1).) \1 }sx',
 			array(&$this, '_doItalicAndBold_em_callback'), $text);

 		return $text;
@ -1208,7 +1232,7 @@ class Markdown_Parser {
 		$text = preg_replace_callback('/
 			  (								# Wrap whole match in $1
 				(
-				  ^[ \t]*>[ \t]?			# ">" at the start of a line
+				  ^[ ]*>[ ]?			# ">" at the start of a line
 					.+\n					# rest of the first line
 				  (.+\n)*					# subsequent consecutive lines
 				  \n*						# blanks
@ -1222,7 +1246,7 @@ class Markdown_Parser {
 	function _doBlockQuotes_callback($matches) {
 		$bq = $matches[1];
 		# trim one level of quoting - trim whitespace-only lines
-		$bq = preg_replace(array('/^[ \t]*>[ \t]?/m', '/^[ \t]+$/m'), '', $bq);
+		$bq = preg_replace(array('/^[ ]*>[ ]?/m', '/^[ ]+$/m'), '', $bq);
 		$bq = $this->runBlockGamut($bq);		# recurse

 		$bq = preg_replace('/^/m', "  ", $bq);
@ -1256,7 +1280,7 @@ class Markdown_Parser {
 		foreach ($grafs as $key => $value) {
 			if (!isset( $this->html_blocks[$value] )) {
 				$value = $this->runSpanGamut($value);
-				$value = preg_replace('/^([ \t]*)/', "<p>", $value);
+				$value = preg_replace('/^([ ]*)/', "<p>", $value);
 				$value .= "</p>";
 				$grafs[$key] = $this->unhash($value);
 			}
@ -1270,41 +1294,41 @@ class Markdown_Parser {
 			if (isset($this->html_blocks[$graf])) {
 				$block = $this->html_blocks[$graf];
 				$graf = $block;
-//				if (preg_match('{
-//					\A
-//					(							# $1 = <div> tag
-//					  <div  \s+
-//					  [^>]*
-//					  \b
-//					  markdown\s*=\s*  ([\'"])	#	$2 = attr quote char
-//					  1
-//					  \2
-//					  [^>]*
-//					  >
-//					)
-//					(							# $3 = contents
-//					.*
-//					)
-//					(</div>)					# $4 = closing tag
-//					\z
-//					}xs', $block, $matches))
-//				{
-//					list(, $div_open, , $div_content, $div_close) = $matches;
-//
-//					# We can't call Markdown(), because that resets the hash;
-//					# that initialization code should be pulled into its own sub, though.
-//					$div_content = $this->hashHTMLBlocks($div_content);
-//					
-//					# Run document gamut methods on the content.
-//					foreach ($this->document_gamut as $method => $priority) {
-//						$div_content = $this->$method($div_content);
-//					}
-//
-//					$div_open = preg_replace(
-//						'{\smarkdown\s*=\s*([\'"]).+?\1}', '', $div_open);
-//
-//					$graf = $div_open . "\n" . $div_content . "\n" . $div_close;
-//				}
+				if (preg_match('{
+					\A
+					(							# $1 = <div> tag
+					  <div  \s+
+					  [^>]*
+					  \b
+					  markdown\s*=\s*  ([\'"])	#	$2 = attr quote char
+					  1
+					  \2
+					  [^>]*
+					  >
+					)
+					(							# $3 = contents
+					.*
+					)
+					(</div>)					# $4 = closing tag
+					\z
+					}xs', $block, $matches))
+				{
+					list(, $div_open, , $div_content, $div_close) = $matches;
+
+					# We can't call Markdown(), because that resets the hash;
+					# that initialization code should be pulled into its own sub, though.
+					$div_content = $this->hashHTMLBlocks($div_content);
+					
+					# Run document gamut methods on the content.
+					foreach ($this->document_gamut as $method => $priority) {
+						$div_content = $this->$method($div_content);
+					}
+
+					$div_open = preg_replace(
+						'{\smarkdown\s*=\s*([\'"]).+?\1}', '', $div_open);
+
+					$graf = $div_open . "\n" . $div_content . "\n" . $div_close;
+				}
 				$grafs[$key] = $graf;
 			}
 		}
@ -1366,7 +1390,6 @@ class Markdown_Parser {
 	}
 	function _doAutoLinks_email_callback($matches) {
 		$address = $matches[1];
-		$address = $this->unescapeSpecialChars($address);
 		$link = $this->encodeEmailAddress($address);
 		return $this->hashSpan($link);
 	}
@ -1413,15 +1436,6 @@ class Markdown_Parser {
 	}


-	function unescapeSpecialChars($text) {
-	#
-	# Swap back in all the special characters we've hidden.
-	#
-		return str_replace(array_values($this->escape_table), 
-						   array_keys($this->escape_table), $text);
-	}
-
-
 	function tokenizeHTML($str) {
 	#
 	#   Parameter:  String containing HTML + Markdown markup.
@ -1599,8 +1613,8 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 			"doDefLists"         => 45,
 			);
 		$this->span_gamut += array(
-			"doFootnotes"        =>  4,
-			"doAbbreviations"    =>  5,
+			"doFootnotes"        => 5,
+			"doAbbreviations"    => 70,
 			);
 		
 		parent::Markdown_Parser();
@ -1614,6 +1628,9 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 	var $abbr_matches = array();
 	var $html_cleans = array();
 	
+	# Status flag to avoid invalid nesting.
+	var $in_footnote = false;
+	
 	
 	function transform($text) {
 	#
@ -1763,8 +1780,9 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 			# If in Markdown span mode, add a empty-string span-level hash 
 			# after each newline to prevent triggering any block element.
 			if ($span) {
-				$newline = $this->hashSpan("") . "\n";
-				$parts[0] = str_replace("\n", $newline, $parts[0]);
+				$void = $this->hashSpan("", true) ;
+				$newline = $this->hashSpan("", true) . "\n";
+				$parts[0] = $void . str_replace("\n", $newline, $parts[0]) . $void;
 			}
 			
 			$parsed .= $parts[0]; # Text before current tag.
@ -1879,9 +1897,14 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 				\s*			# Eat whitespace before the `markdown` attribute
 				markdown
 				\s*=\s*
-				(["\'])		# $1: quote delimiter		
-				(.*?)		# $2: attribute value
-				\1			# matching delimiter	
+				(?:
+					(["\'])		# $1: quote delimiter		
+					(.*?)		# $2: attribute value
+					\1			# matching delimiter	
+				|
+					([^\s>]*)	# $3: unquoted attribute value
+				)
+				()				# $4: make $3 always defined (avoid warnings)
 			}xs';
 		
 		# Regex to match any tag.
@ -1967,14 +1990,14 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 				# Check for `markdown="1"` attribute and handle it.
 				#
 				if ($md_attr && 
-					preg_match($markdown_attr_match, $tag, $attr_matches) &&
-					preg_match('/^1|block|span$/', $attr_matches[2]))
+					preg_match($markdown_attr_match, $tag, $attr_m) &&
+					preg_match('/^1|block|span$/', $attr_m[2] . $attr_m[3]))
 				{
 					# Remove `markdown` attribute from opening tag.
 					$tag = preg_replace($markdown_attr_match, '', $tag);
 					
 					# Check if text inside this tag must be parsed in span mode.
-					$this->mode = $attr_matches[2];
+					$this->mode = $attr_m[2] . $attr_m[3];
 					$span_mode = $this->mode == 'span' || $this->mode != 'block' &&
 						preg_match("{^<(?:$this->contain_span_tags)\b}", $tag);
 					
@ -2033,7 +2056,7 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 		$text = $this->unhash($text);
 		
 		# Then hash the tag.
-		$key = md5($text);
+		$key = "C\x1A". md5($text);
 		$this->html_cleans[$key] = $text;
 		$this->html_hashes[$key] = $text;
 		return $key; # String that will replace the clean tag.
@ -2052,10 +2075,10 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 		#	  --------
 		#
 		$text = preg_replace_callback(
-			'{ (^.+?) (?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? [ \t]*\n=+[ \t]*\n+ }mx',
+			'{ (^.+?) (?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? [ ]*\n=+[ ]*\n+ }mx',
 			array(&$this, '_doHeaders_callback_setext_h1'), $text);
 		$text = preg_replace_callback(
-			'{ (^.+?) (?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? [ \t]*\n-+[ \t]*\n+ }mx',
+			'{ (^.+?) (?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? [ ]*\n-+[ ]*\n+ }mx',
 			array(&$this, '_doHeaders_callback_setext_h2'), $text);

 		# atx-style headers:
@ -2067,12 +2090,12 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 		#
 		$text = preg_replace_callback('{
 				^(\#{1,6})	# $1 = string of #\'s
-				[ \t]*
+				[ ]*
 				(.+?)		# $2 = Header text
-				[ \t]*
+				[ ]*
 				\#*			# optional closing #\'s (not counted)
 				(?:[ ]+\{\#([-_:a-zA-Z0-9]+)\})? # id attribute
-				[ \t]*
+				[ ]*
 				\n+
 			}xm',
 			array(&$this, '_doHeaders_callback_atx'), $text);
@ -2368,14 +2391,14 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 				(?=\S) 					# Not followed by whitespace 
 				(?!__)					#   or two others marker chars.
 				(						# $2: Content
-					(?:
+					(?>
 						[^_]+?			# Anthing not em markers.
 					|
 										# Balence any regular _ emphasis inside.
 						(?<![a-zA-Z0-9]) _ (?=\S) (.+?) 
 						(?<=\S) _ (?![a-zA-Z0-9])
 					|
-						___+
+						_+				# Allow unbalenced as last resort.
 					)+?
 				)
 				(?<=\S) __				# End mark not preceded by whitespace.
@ -2387,11 +2410,13 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 				(?=\S) 					# Not followed by whitespace 
 				(?!\1)					#   or two others marker chars.
 				(						# $2: Content
-					(?:
+					(?>
 						[^*]+?			# Anthing not em markers.
 					|
 										# Balence any regular * emphasis inside.
 						\* (?=\S) (.+?) (?<=\S) \*
+					|
+						\*				# Allow unbalenced as last resort.
 					)+?
 				)
 				(?<=\S) \*\*			# End mark not preceded by whitespace.
@ -2401,7 +2426,7 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 		# Then <em>:
 		$text = preg_replace_callback(array(
 			'{ ( (?<![a-zA-Z0-9])(?<!_)_ ) (?=\S) (?! \1) (.+?) (?<=\S) \1(?![a-zA-Z0-9]) }sx',
-			'{ ( (?<!\*)\* ) (?=\S) (?! \1) (.+?) (?<=\S) \1 }sx',
+			'{ ( (?<!\*)\* ) (?=\S) (?! \1) (.+?) (?<=\S)(?<!\s\*) \1 }sx',
 			),
 			array(&$this, '_doItalicAndBold_em_callback'), $text);

@ -2428,7 +2453,7 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 			# Check if this should be enclosed in a paragraph.
 			# Clean tag hashes & block tag hashes are left alone.
 			$clean_key = $value;
-			$block_key = substr($value, 0, 32);
+			$block_key = substr($value, 0, 34);
 			
 			$is_p = (!isset($this->html_blocks[$block_key]) && 
 					 !isset($this->html_cleans[$clean_key]));
@ -2461,7 +2486,7 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 		# Link defs are in the form: [^id]: url "optional title"
 		$text = preg_replace_callback('{
 			^[ ]{0,'.$less_than_tab.'}\[\^(.+?)\][ ]?:	# note_id = $1
-			  [ \t]*
+			  [ ]*
 			  \n?					# maybe *one* newline
 			(						# text = $2 (no blank lines allowed)
 				(?:					
@ -2479,7 +2504,7 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 		return $text;
 	}
 	function _stripFootnotes_callback($matches) {
-		$note_id = $matches[1];
+		$note_id = $this->fn_id_prefix . $matches[1];
 		$this->footnotes[$note_id] = $this->outdent($matches[2]);
 		return ''; # String that will replace the block
 	}
@ -2490,7 +2515,9 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 	# Replace footnote references in $text [^id] with a special text-token 
 	# which will be can be
 	#
-		$text = preg_replace('{\[\^(.+?)\]}', "a\0fn:\\1\0z", $text);
+		if (!$this->in_footnote && !$this->in_anchor) {
+			$text = preg_replace('{\[\^(.+?)\]}', "F\x1Afn:\\1\x1A:", $text);
+		}
 		return $text;
 	}

@ -2499,7 +2526,8 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 	#
 	# Append footnote list to text.
 	#
-		$text = preg_replace_callback('{a\0fn:(.*?)\0z}', 
+	
+		$text = preg_replace_callback('{F\x1Afn:(.*?)\x1A:}', 
 			array(&$this, '_appendFootnotes_callback'), $text);
 	
 		if (!empty($this->footnotes_ordered)) {
@ -2523,6 +2551,8 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 			}
 			$num = 0;
 			
+			$this->in_footnote = true;
+			
 			foreach ($this->footnotes_ordered as $note_id => $footnote) {
 				$footnote .= "\n"; # Need to append newline before parsing.
 				$footnote = $this->runBlockGamut("$footnote\n");
@ -2542,10 +2572,10 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 				$text .= "</li>\n\n";
 			}
 			
+			$this->in_footnote = false;
+			
 			$text .= "</ol>\n";
 			$text .= "</div>";
-			
-			$text = preg_replace('{a\{fn:(.*?)\}z}', '[^\\1]', $text);
 		}
 		return $text;
 	}
@ -2589,8 +2619,7 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 	
 	function stripAbbreviations($text) {
 	#
-	# Strips abbreviations from text, stores the URLs and titles in
-	# hash references.
+	# Strips abbreviations from text, stores titles in hash references.
 	#
 		$less_than_tab = $this->tab_width - 1;

@ -2614,12 +2643,16 @@ class MarkdownExtra_Parser extends Markdown_Parser {
 	
 	function doAbbreviations($text) {
 	#
-	# Replace footnote references in $text [^id] with a link to the footnote.
+	# Find defined abbreviations in text and wrap them in <abbr> elements.
 	#
 		if ($this->abbr_matches) {
-			$regex = '{(?<!\w)(?:'. implode('|', $this->abbr_matches) .')(?!\w)}';
-	
-			$text = preg_replace_callback($regex, 
+			// cannot use the /x modifier because abbr_matches may 
+			// contain spaces:
+			$text = preg_replace_callback('{'.
+				'(?<![\w\x1A])'.
+				'(?:'. implode('|', $this->abbr_matches) .')'.
+				'(?![\w\x1A])'.
+				'}', 
 				array(&$this, '_doAbbreviations_callback'), $text);
 		}
 		return $text;
@ -2686,6 +2719,34 @@ Version History

 See Readme file for details.

+Extra 1.1.3b1 (21 May 2007):
+
+*	The markdown="" attribute now accepts unquoted values.
+
+*	Fixed an issue where underscore-emphasis didn't work when applied on the 
+	first or the last word of an element having the markdown="1" or 
+	markdown="span" attribute set unless there was some surrounding whitespace.
+	This didn't work:
+	
+		<p markdown="1">_Hello_ _world_</p>
+	
+	Now it does produce emphasis as expected.
+
+*	Fixed an issue preventing footnotes from working when the parser's 
+	footnote id prefix variable (fn_id_prefix) is not empty.
+
+*	Fixed a performance problem with the regular expression for strong 
+	emphasis introduced in version 1.1 could sometime be long to process, 
+	give slightly wrong results, and in some circumstances could remove 
+	entirely the content for a whole paragraph.
+
+*	Fixed an issue were abbreviations tags could be incorrectly added 
+	inside URLs and title of links.
+
+*	Placing footnote markers inside a link, resulting in two nested links, is 
+	no longer allowed.
+
+
 Extra 1.1.2 (7 Feb 2007)

 Extra 1.1.1 (28 Dec 2006)