Merge pull request #37 from hkdobrev/htmlspecialshars-utf8

Use UTF-8 encoding for htmlspecialchars. See #36 .
Prior to PHP 5.4.0 the default encoding for `htmlentities()` and `htmlspecialchars` is "ISO-8859-1". For PHP 5.4+ is "UTF-8". This ensures always the right encoding is used no matter the PHP version and the locale settings.
2023-08-10 21:13:06 +03:00 · 2013-11-22 13:23:21 -08:00 · 2013-11-22 23:06:20 +02:00 · 2013-11-22 21:57:21 +02:00 · 2013-11-22 11:21:38 -08:00 · 2013-11-22 23:05:26 +08:00
91 changed files with 748 additions and 739 deletions
--- a/.travis.yml
+++ b/.travis.yml
@ -4,8 +4,4 @@ php:
  - 5.5
  - 5.4
  - 5.3
-  - 5.2
-
-matrix:
-  allow_failures:
-    - php: 5.2
+  - 5.2
--- a/Parsedown.php
+++ b/Parsedown.php
@ -46,17 +46,17 @@ class Parsedown

 	function parse($text)
 	{
-		# Removes UTF-8 BOM and marker characters.
+		# removes UTF-8 BOM and marker characters
 		$text = preg_replace('{^\xEF\xBB\xBF|\x1A}', '', $text);

-		# Removes \r characters.
+		# removes \r characters
 		$text = str_replace("\r\n", "\n", $text);
 		$text = str_replace("\r", "\n", $text);

-		# Replaces tabs with spaces.
+		# replaces tabs with spaces
 		$text = str_replace("\t", '    ', $text);

-		# Encodes escape sequences.
+		# encodes escape sequences

 		if (strpos($text, '\\') !== FALSE)
 		{
@ -66,7 +66,7 @@ class Parsedown
 			{
 				if (strpos($text, $escape_sequence) !== FALSE)
 				{
-					$code = "\x1A".'\\'.$index;
+					$code = "\x1A".'\\'.$index.';';

 					$text = str_replace($escape_sequence, $code, $text);

@ -84,7 +84,7 @@ class Parsedown

 		$text = $this->parse_block_elements($lines);

-		# Decodes escape sequences (leaves out backslashes).
+		# decodes escape sequences

 		foreach ($this->escape_sequence_map as $code => $escape_sequence)
 		{
@ -110,28 +110,56 @@ class Parsedown

 		foreach ($lines as $line)
 		{
-			# Block-Level HTML
+			#
+			# fenced elements

-			if ($element['type'] === 'block' and ! isset($element['closed']))
+			switch ($element['type'])
 			{
-				if (preg_match('{<'.$element['subtype'].'>$}', $line)) # <open>
-				{
-					$element['depth']++;
-				}
+				case 'fenced_code_block':

-				if (preg_match('{</'.$element['subtype'].'>$}', $line)) # </close>
-				{
-					$element['depth'] > 0
-						? $element['depth']--
-						: $element['closed'] = true;
-				}
+					if ( ! isset($element['closed']))
+					{
+						if (preg_match('/^[ ]*'.$element['fence'][0].'{3,}[ ]*$/', $line))
+						{
+							$element['closed'] = true;
+						}
+						else
+						{
+							$element['text'] !== '' and $element['text'] .= "\n";

-				$element['text'] .= "\n".$line;
+							$element['text'] .= $line;
+						}

-				continue;
+						continue 2;
+					}
+
+					break;
+
+				case 'markup':
+
+					if ( ! isset($element['closed']))
+					{
+						if (preg_match('{<'.$element['subtype'].'>$}', $line)) # opening tag
+						{
+							$element['depth']++;
+						}
+
+						if (preg_match('{</'.$element['subtype'].'>$}', $line)) # closing tag
+						{
+							$element['depth'] > 0
+								? $element['depth']--
+								: $element['closed'] = true;
+						}
+
+						$element['text'] .= "\n".$line;
+
+						continue 2;
+					}
+
+					break;
 			}

-			# Empty
+			# *

 			if ($line === '')
 			{
@ -140,269 +168,330 @@ class Parsedown
 				continue;
 			}

-			# Lazy Blockquote
+			#
+			# composite elements

-			if ($element['type'] === 'blockquote' and ! isset($element['interrupted']))
+			switch ($element['type'])
 			{
-				$line = preg_replace('/^[ ]*>[ ]?/', '', $line);
+				case 'blockquote':

-				$element['lines'] []= $line;
-
-				continue;
-			}
-
-			# Lazy List Item
-
-			if ($element['type'] === 'li')
-			{
-				if (preg_match('/^([ ]{0,3})(\d+[.]|[*+-])[ ](.*)/', $line, $matches))
-				{
-					if ($element['indentation'] !== $matches[1])
+					if ( ! isset($element['interrupted']))
 					{
+						$line = preg_replace('/^[ ]*>[ ]?/', '', $line);
+
 						$element['lines'] []= $line;
+
+						continue 2;
+					}
+
+					break;
+
+				case 'li':
+
+					if (preg_match('/^([ ]{0,3})(\d+[.]|[*+-])[ ](.*)/', $line, $matches))
+					{
+						if ($element['indentation'] !== $matches[1])
+						{
+							$element['lines'] []= $line;
+						}
+						else
+						{
+							unset($element['last']);
+
+							$elements []= $element;
+
+							$element = array(
+								'type' => 'li',
+								'indentation' => $matches[1],
+								'last' => true,
+								'lines' => array(
+									preg_replace('/^[ ]{0,4}/', '', $matches[3]),
+								),
+							);
+						}
+
+						continue 2;
+					}
+
+					if (isset($element['interrupted']))
+					{
+						if ($line[0] === ' ')
+						{
+							$element['lines'] []= '';
+
+							$line = preg_replace('/^[ ]{0,4}/', '', $line);
+
+							$element['lines'] []= $line;
+
+							continue 2;
+						}
 					}
 					else
 					{
-						unset($element['last']);
+						$line = preg_replace('/^[ ]{0,4}/', '', $line);

+						$element['lines'] []= $line;
+
+						continue 2;
+					}
+
+					break;
+			}
+
+			#
+			# indentation sensitive types
+
+			$deindented_line = $line;
+
+			switch ($line[0])
+			{
+				case ' ':
+
+					# ~
+
+					$deindented_line = ltrim($line);
+
+					if ($deindented_line === '')
+					{
+						continue 2;
+					}
+
+					# code block
+
+					if (preg_match('/^[ ]{4}(.*)/', $line, $matches))
+					{
+						if ($element['type'] === 'code_block')
+						{
+							if (isset($element['interrupted']))
+							{
+								$element['text'] .= "\n";
+
+								unset ($element['interrupted']);
+							}
+
+							$element['text'] .= "\n".$matches[1];
+						}
+						else
+						{
+							$elements []= $element;
+
+							$element = array(
+								'type' => 'code_block',
+								'text' => $matches[1],
+							);
+						}
+
+						continue 2;
+					}
+
+					break;
+
+				case '#':
+
+					# atx heading (#)
+
+					if (preg_match('/^(#{1,6})[ ]*(.+?)[ ]*#*$/', $line, $matches))
+					{
+						$elements []= $element;
+
+						$level = strlen($matches[1]);
+
+						$element = array(
+							'type' => 'h.',
+							'text' => $matches[2],
+							'level' => $level,
+						);
+
+						continue 2;
+					}
+
+					break;
+
+				case '-':
+
+					# setext heading (---)
+
+					if ($line[0] === '-' and $element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[-]+[ ]*$/', $line))
+					{
+						$element['type'] = 'h.';
+						$element['level'] = 2;
+
+						continue 2;
+					}
+
+					break;
+
+				case '=':
+
+					# setext heading (===)
+
+					if ($line[0] === '=' and $element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[=]+[ ]*$/', $line))
+					{
+						$element['type'] = 'h.';
+						$element['level'] = 1;
+
+						continue 2;
+					}
+
+					break;
+			}
+
+			#
+			# indentation insensitive types
+
+			switch ($deindented_line[0])
+			{
+				case '<':
+
+					# self-closing tag
+
+					if (preg_match('{^<.+?/>$}', $deindented_line))
+					{
+						$elements []= $element;
+
+						$element = array(
+							'type' => '',
+							'text' => $deindented_line,
+						);
+
+						continue 2;
+					}
+
+					# opening tag
+
+					if (preg_match('{^<(\w+)(?:[ ].*?)?>}', $deindented_line, $matches))
+					{
+						$elements []= $element;
+
+						$element = array(
+							'type' => 'markup',
+							'subtype' => strtolower($matches[1]),
+							'text' => $deindented_line,
+							'depth' => 0,
+						);
+
+						preg_match('{</'.$matches[1].'>\s*$}', $deindented_line) and $element['closed'] = true;
+
+						continue 2;
+					}
+
+					break;
+
+				case '>':
+
+					# quote
+
+					if (preg_match('/^>[ ]?(.*)/', $deindented_line, $matches))
+					{
+						$elements []= $element;
+
+						$element = array(
+							'type' => 'blockquote',
+							'lines' => array(
+								$matches[1],
+							),
+						);
+
+						continue 2;
+					}
+
+					break;
+
+				case '[':
+
+					# reference
+
+					if (preg_match('/^\[(.+?)\]:[ ]*([^ ]+)/', $deindented_line, $matches))
+					{
+						$label = strtolower($matches[1]);
+
+						$this->reference_map[$label] = trim($matches[2], '<>');;
+
+						continue 2;
+					}
+
+					break;
+
+				case '`':
+				case '~':
+
+					# fenced code block
+
+					if (preg_match('/^([`]{3,}|[~]{3,})[ ]*(\S+)?[ ]*$/', $deindented_line, $matches))
+					{
+						$elements []= $element;
+
+						$element = array(
+							'type' => 'fenced_code_block',
+							'text' => '',
+							'fence' => $matches[1],
+						);
+
+						isset($matches[2]) and $element['language'] = $matches[2];
+
+						continue 2;
+					}
+
+					break;
+
+				case '*':
+				case '+':
+				case '-':
+				case '_':
+
+					# hr
+
+					if (preg_match('/^([-*_])([ ]{0,2}\1){2,}[ ]*$/', $deindented_line))
+					{
+						$elements []= $element;
+
+						$element = array(
+							'type' => 'hr',
+						);
+
+						continue 2;
+					}
+
+					# li
+
+					if (preg_match('/^([ ]*)[*+-][ ](.*)/', $line, $matches))
+					{
 						$elements []= $element;

 						$element = array(
 							'type' => 'li',
+							'ordered' => false,
 							'indentation' => $matches[1],
 							'last' => true,
 							'lines' => array(
-								preg_replace('/^[ ]{0,4}/', '', $matches[3]),
+								preg_replace('/^[ ]{0,4}/', '', $matches[2]),
 							),
 						);
+
+						continue 2;
 					}
-
-					continue;
-				}
-
-				if (isset($element['interrupted']))
-				{
-					if ($line[0] === ' ')
-					{
-						$element['lines'] []= '';
-
-						$line = preg_replace('/^[ ]{0,4}/', '', $line);;
-
-						$element['lines'] []= $line;
-
-						continue;
-					}
-				}
-				else
-				{
-					$line = preg_replace('/^[ ]{0,4}/', '', $line);;
-
-					$element['lines'] []= $line;
-
-					continue;
-				}
 			}

-			# Quick Paragraph
+			# li

-			if ($line[0] >= 'a' or $line[0] >= 'A' and $line[0] <= 'Z')
-			{
-				goto paragraph;
-			}
-
-			# Code Block
-
-			if ($line[0] === ' ' and preg_match('/^[ ]{4}(.*)/', $line, $matches))
-			{
-				if (trim($line) === '')
-				{
-					continue;
-				}
-
-				if ($element['type'] === 'code')
-				{
-					if (isset($element['interrupted']))
-					{
-						$element['text'] .= "\n";
-
-						unset ($element['interrupted']);
-					}
-
-					$element['text'] .= "\n".$matches[1];
-				}
-				else
-				{
-					$elements []= $element;
-
-					$element = array(
-						'type' => 'code',
-						'text' => $matches[1],
-					);
-				}
-
-				continue;
-			}
-
-			# Setext Header (---)
-
-			if ($line[0] === '-' and $element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[-]+[ ]*$/', $line))
-			{
-				$element['type'] = 'h.';
-				$element['level'] = 2;
-
-				continue;
-			}
-
-			# Atx Header (#)
-
-			if ($line[0] === '#' and preg_match('/^(#{1,6})[ ]*(.+?)[ ]*#*$/', $line, $matches))
-			{
-				$elements []= $element;
-
-				$level = strlen($matches[1]);
-
-				$element = array(
-					'type' => 'h.',
-					'text' => $matches[2],
-					'level' => $level,
-				);
-
-				continue;
-			}
-
-			# Setext Header (===)
-
-			if ($line[0] === '=' and $element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[=]+[ ]*$/', $line))
-			{
-				$element['type'] = 'h.';
-				$element['level'] = 1;
-
-				continue;
-			}
-
-			# ~
-
-			$pure_line = $line[0] !== ' ' ? $line : ltrim($line);
-
-			if ($pure_line === '')
-			{
-				continue;
-			}
-
-			# Link Reference
-
-			if ($pure_line[0] === '[' and preg_match('/^\[(.+?)\]:[ ]*([^ ]+)/', $pure_line, $matches))
-			{
-				$label = strtolower($matches[1]);
-				$url = trim($matches[2], '<>');
-
-				$this->reference_map[$label] = $url;
-
-				continue;
-			}
-
-			# Blockquote
-
-			if ($pure_line[0] === '>' and preg_match('/^>[ ]?(.*)/', $pure_line, $matches))
-			{
-				if ($element['type'] === 'blockquote')
-				{
-					if (isset($element['interrupted']))
-					{
-						$element['lines'] []= '';
-
-						unset($element['interrupted']);
-					}
-
-					$element['lines'] []= $matches[1];
-				}
-				else
-				{
-					$elements []= $element;
-
-					$element = array(
-						'type' => 'blockquote',
-						'lines' => array(
-							$matches[1],
-						),
-					);
-				}
-
-				continue;
-			}
-
-			# HTML
-
-			if ($pure_line[0] === '<')
-			{
-				# Block-Level HTML <self-closing/>
-
-				if (preg_match('{^<.+?/>$}', $pure_line))
-				{
-					$elements []= $element;
-
-					$element = array(
-						'type' => '',
-						'text' => $pure_line,
-					);
-
-					continue;
-				}
-
-				# Block-Level HTML <open>
-
-				if (preg_match('{^<(\w+)(?:[ ].*?)?>}', $pure_line, $matches))
-				{
-					$elements []= $element;
-
-					$element = array(
-						'type' => 'block',
-						'subtype' => strtolower($matches[1]),
-						'text' => $pure_line,
-						'depth' => 0,
-					);
-
-					preg_match('{</'.$matches[1].'>\s*$}', $pure_line) and $element['closed'] = true;
-
-					continue;
-				}
-			}
-
-			# Horizontal Rule
-
-			if (preg_match('/^([-*_])([ ]{0,2}\1){2,}[ ]*$/', $pure_line))
-			{
-				$elements []= $element;
-
-				$element = array(
-					'type' => 'hr',
-				);
-
-				continue;
-			}
-
-			# List Item
-
-			if (preg_match('/^([ ]*)(\d+[.]|[*+-])[ ](.*)/', $line, $matches))
+			if ($deindented_line[0] <= '9' and $deindented_line >= '0' and preg_match('/^([ ]*)\d+[.][ ](.*)/', $line, $matches))
 			{
 				$elements []= $element;

 				$element = array(
 					'type' => 'li',
-					'ordered' => isset($matches[2][1]),
+					'ordered' => true,
 					'indentation' => $matches[1],
 					'last' => true,
 					'lines' => array(
-						preg_replace('/^[ ]{0,4}/', '', $matches[3]),
+						preg_replace('/^[ ]{0,4}/', '', $matches[2]),
 					),
 				);

 				continue;
 			}

-			# ~
-
-			paragraph:
+			# paragraph

 			if ($element['type'] === 'p')
 			{
@ -432,7 +521,7 @@ class Parsedown

 		$elements []= $element;

-		array_shift($elements);
+		unset($elements[0]);

 		#
 		# ~
@ -440,10 +529,67 @@ class Parsedown

 		$markup = '';

-		foreach ($elements as $index => $element)
+		foreach ($elements as $element)
 		{
 			switch ($element['type'])
 			{
+				case 'p':
+
+					$text = $this->parse_span_elements($element['text']);
+
+					$text = preg_replace('/[ ]{2}\n/', '<br />'."\n", $text);
+
+					if ($context === 'li' and $markup === '')
+					{
+						if (isset($element['interrupted']))
+						{
+							$markup .= "\n".'<p>'.$text.'</p>'."\n";
+						}
+						else
+						{
+							$markup .= $text;
+						}
+					}
+					else
+					{
+						$markup .= '<p>'.$text.'</p>'."\n";
+					}
+
+					break;
+
+				case 'blockquote':
+
+					$text = $this->parse_block_elements($element['lines']);
+
+					$markup .= '<blockquote>'."\n".$text.'</blockquote>'."\n";
+
+					break;
+
+				case 'code_block':
+				case 'fenced_code_block':
+
+					$text = htmlspecialchars($element['text'], ENT_NOQUOTES, 'UTF-8');
+
+					strpos($text, "\x1A\\") !== FALSE and $text = strtr($text, $this->escape_sequence_map);
+
+					$markup .= '<pre><code>'.$text.'</code></pre>'."\n";
+
+					break;
+
+				case 'h.':
+
+					$text = $this->parse_span_elements($element['text']);
+
+					$markup .= '<h'.$element['level'].'>'.$text.'</h'.$element['level'].'>'."\n";
+
+					break;
+
+				case 'hr':
+
+					$markup .= '<hr />'."\n";
+
+					break;
+
 				case 'li':

 					if (isset($element['ordered'])) # first
@ -466,62 +612,6 @@ class Parsedown

 					break;

-				case 'p':
-
-					$text = $this->parse_inline_elements($element['text']);
-
-					$text = preg_replace('/[ ]{2}\n/', '<br />'."\n", $text);
-
-					if ($context === 'li' and $index === 0)
-					{
-						if (isset($element['interrupted']))
-						{
-							$markup .= "\n".'<p>'.$text.'</p>'."\n";
-						}
-						else
-						{
-							$markup .= $text;
-						}
-					}
-					else
-					{
-						$markup .= '<p>'.$text.'</p>'."\n";
-					}
-
-					break;
-
-				case 'code':
-
-					$text = htmlentities($element['text'], ENT_NOQUOTES);
-
-					strpos($text, "\x1A\\") !== FALSE and $text = strtr($text, $this->escape_sequence_map);
-
-					$markup .= '<pre><code>'.$text.'</code></pre>'."\n";
-
-					break;
-
-				case 'blockquote':
-
-					$text = $this->parse_block_elements($element['lines']);
-
-					$markup .= '<blockquote>'."\n".$text.'</blockquote>'."\n";
-
-					break;
-
-				case 'h.':
-
-					$text = $this->parse_inline_elements($element['text']);
-
-					$markup .= '<h'.$element['level'].'>'.$text.'</h'.$element['level'].'>'."\n";
-
-					break;
-
-				case 'hr':
-
-					$markup .= '<hr />'."\n";
-
-					break;
-
 				default:

 					$markup .= $element['text']."\n";
@ -531,32 +621,32 @@ class Parsedown
 		return $markup;
 	}

-	private function parse_inline_elements($text)
+	private function parse_span_elements($text)
 	{
 		$map = array();

 		$index = 0;

-		# Code Span
+		# code span

 		if (strpos($text, '`') !== FALSE and preg_match_all('/`(.+?)`/', $text, $matches, PREG_SET_ORDER))
 		{
 			foreach ($matches as $matches)
 			{
 				$element_text = $matches[1];
-				$element_text = htmlentities($element_text, ENT_NOQUOTES);
+				$element_text = htmlspecialchars($element_text, ENT_NOQUOTES, 'UTF-8');

-				# Decodes escape sequences.
+				# decodes escape sequences

 				$this->escape_sequence_map
 					and strpos($element_text, "\x1A") !== FALSE
 					and $element_text = strtr($element_text, $this->escape_sequence_map);

-				# Composes element.
+				# composes element

 				$element = '<code>'.$element_text.'</code>';

-				# Encodes element.
+				# encodes element

 				$code = "\x1A".'$'.$index;

@ -568,7 +658,7 @@ class Parsedown
 			}
 		}

-		# Inline Link / Image
+		# inline link or image

 		if (strpos($text, '](') !== FALSE and preg_match_all('/(!?)(\[((?:[^\[\]]|(?2))*)\])\((.*?)\)/', $text, $matches, PREG_SET_ORDER)) # inline
 		{
@ -584,7 +674,7 @@ class Parsedown
 				}
 				else
 				{
-					$element_text = $this->parse_inline_elements($matches[3]);
+					$element_text = $this->parse_span_elements($matches[3]);

 					$element = '<a href="'.$url.'">'.$element_text.'</a>';
 				}
@ -601,7 +691,7 @@ class Parsedown
 			}
 		}

-		# Reference(d) Link / Image
+		# reference link or image

 		if ($this->reference_map and strpos($text, '[') !== FALSE and preg_match_all('/(!?)\[(.+?)\](?:\n?[ ]?\[(.*?)\])?/ms', $text, $matches, PREG_SET_ORDER))
 		{
@ -625,7 +715,7 @@ class Parsedown
 					}
 					else # anchor
 					{
-						$element_text = $this->parse_inline_elements($matches[2]);
+						$element_text = $this->parse_span_elements($matches[2]);

 						$element = '<a href="'.$url.'">'.$element_text.'</a>';
 					}
@ -643,29 +733,35 @@ class Parsedown
 			}
 		}

-		# Automatic Links
-
-		if (strpos($text, '<') !== FALSE and preg_match_all('/<((https?|ftp|dict):[^\^\s]+?)>/i', $text, $matches, PREG_SET_ORDER))
+		if (strpos($text, '://') !== FALSE)
 		{
-			foreach ($matches as $matches)
+			switch (TRUE)
 			{
-				$url = $matches[1];
+				case preg_match_all('{<(https?:[/]{2}[^\s]+)>}i', $text, $matches, PREG_SET_ORDER):
+				case preg_match_all('{\b(https?:[/]{2}[^\s]+)\b}i', $text, $matches, PREG_SET_ORDER):

-				strpos($url, '&') !== FALSE and $url = preg_replace('/&(?!#?\w+;)/', '&amp;', $url);
+					foreach ($matches as $matches)
+					{
+						$url = $matches[1];

-				$element = '<a href=":href">:text</a>';
-				$element = str_replace(':text', $url, $element);
-				$element = str_replace(':href', $url, $element);
+						strpos($url, '&') !== FALSE and $url = preg_replace('/&(?!#?\w+;)/', '&amp;', $url);

-				# ~
+						$element = '<a href=":href">:text</a>';
+						$element = str_replace(':text', $url, $element);
+						$element = str_replace(':href', $url, $element);

-				$code = "\x1A".'$'.$index;
+						# ~

-				$text = str_replace($matches[0], $code, $text);
+						$code = "\x1A".'$'.$index;

-				$map[$code] = $element;
+						$text = str_replace($matches[0], $code, $text);

-				$index ++;
+						$map[$code] = $element;
+
+						$index ++;
+					}
+
+					break;
 			}
 		}

@ -676,10 +772,15 @@ class Parsedown

 		# ~

+		if (strpos($text, '~~') !== FALSE)
+		{
+			$text = preg_replace('/~~(?=\S)(.+?)(?<=\S)~~/s', '<del>$1</del>', $text);
+		}
+
 		if (strpos($text, '_') !== FALSE)
 		{
 			$text = preg_replace('/__(?=\S)(.+?)(?<=\S)__(?!_)/s', '<strong>$1</strong>', $text);
-			$text = preg_replace('/_(?=\S)(.+?)(?<=\S)_/s', '<em>$1</em>', $text);
+			$text = preg_replace('/\b_(?=\S)(.+?)(?<=\S)_\b/s', '<em>$1</em>', $text);
 		}

 		if (strpos($text, '*') !== FALSE)
@ -692,4 +793,4 @@ class Parsedown

 		return $text;
 	}
-}
+}
--- a/README.md
+++ b/README.md
@ -1,9 +1,8 @@
-## Parsedown PHP
+## Parsedown

-Parsedown is a parser for Markdown. It parses Markdown text the way people do. First, it divides texts into blocks. Then it looks at how these blocks start and how they relate to each other. Finally, it looks for special characters to identify inline elements. As a result, Parsedown is (super) fast, consistent and clean.
+Fast, consistent and easy to use [Markdown][1] parser for PHP.

-[Explorer (demo)](http://parsedown.org/explorer/)  
-[Tests](http://parsedown.org/tests/)
+[Home](http://parsedown.org) &middot; [Demo](http://parsedown.org/explorer/) &middot; [Tests](http://parsedown.org/tests/)

 ### Installation

@ -17,4 +16,6 @@ $text = 'Hello **Parsedown**!';
 $result = Parsedown::instance()->parse($text);

 echo $result; # prints: <p>Hello <strong>Parsedown</strong>!</p>
-```
+```
+
+[1]: http://daringfireball.net/projects/markdown/
--- a/tests/Test.php
+++ b/tests/Test.php
@ -5,7 +5,7 @@ include 'Parsedown.php';
 class Test extends PHPUnit_Framework_TestCase
 {
 	const provider_dir = 'data/';
-	
+
 	/**
 	 * @dataProvider provider
 	 */
@ -15,33 +15,41 @@ class Test extends PHPUnit_Framework_TestCase

 		$this->assertEquals($expected_markup, $actual_markup);
 	}
-	
+
 	function provider()
 	{
 		$provider = array();
-		
-		$DirectoryIterator = new DirectoryIterator(__DIR__ . '/' . self::provider_dir);
-		
+
+		$path = dirname(__FILE__).'/';
+
+		$DirectoryIterator = new DirectoryIterator($path . '/' . self::provider_dir);
+
 		foreach ($DirectoryIterator as $Item)
 		{
-			if ($Item->isFile() and $Item->getExtension() === 'md')
+			if ($Item->isFile())
 			{
+				$filename = $Item->getFilename();
+
+				$extension = pathinfo($filename, PATHINFO_EXTENSION);
+
+				if ($extension !== 'md')
+					continue;
+
 				$basename = $Item->getBasename('.md');
-				
-				$markdown = file_get_contents(__DIR__ . '/' . self::provider_dir . $basename . '.md');
-				
+
+				$markdown = file_get_contents($path . '/' . self::provider_dir . $basename . '.md');
+
 				if (!$markdown)
 					continue;
-				
-				$expected_markup = file_get_contents(__DIR__ . '/' . self::provider_dir . $basename . '.html');
+
+				$expected_markup = file_get_contents($path . '/' . self::provider_dir . $basename . '.html');
 				$expected_markup = str_replace("\r\n", "\n", $expected_markup);
 				$expected_markup = str_replace("\r", "\n", $expected_markup);
-				
+
 				$provider [] = array($markdown, $expected_markup);
 			}
 		}
-		
+
 		return $provider;
 	}
-}
-
+}
--- a/tests/data/atx_heading.html
+++ b/tests/data/atx_heading.html
@ -1,6 +1,7 @@
-<h1>This is an h1</h1>
-<h2>This is an h2</h2>
-<h3>This is an h3</h3>
-<h4>This is an h4</h4>
-<h5>This is an h5</h5>
-<h6>This is an h6</h6>
+<h1>h1</h1>
+<h2>h2</h2>
+<h3>h3</h3>
+<h4>h4</h4>
+<h5>h5</h5>
+<h6>h6</h6>
+<h1>closed h1</h1>
--- a/tests/data/atx_heading.md
+++ b/tests/data/atx_heading.md
@ -1,11 +1,13 @@
-# This is an h1
+# h1

-## This is an h2
+## h2

-### This is an h3
+### h3

-#### This is an h4
+#### h4

-##### This is an h5
+##### h5

-###### This is an h6
+###### h6
+
+# closed h1 #
--- a/tests/data/atx_heading_-_closed.html
+++ b/tests/data/atx_heading_-_closed.html
@ -1,6 +0,0 @@
-<h1>h1</h1>
-<h2>h2</h2>
-<h3>h3</h3>
-<h4>h4</h4>
-<h5>h5</h5>
-<h6>h6</h6>
--- a/tests/data/atx_heading_-_closed.md
+++ b/tests/data/atx_heading_-_closed.md
@ -1,11 +0,0 @@
-# h1 #
-
-## h2 ##
-
-### h3 ###
-
-#### h4 ####
-
-##### h5 #####
-
-###### h6 ######
--- a/tests/data/block-level_html.html
+++ b/tests/data/block-level_html.html
@ -0,0 +1,9 @@
+<div>content</div>
+<hr style="background: #eaa;" />
+<p>nested elements:</p>
+<div>
+parent
+<div>
+child
+</div>
+</div>
--- a/tests/data/block-level_html.md
+++ b/tests/data/block-level_html.md
@ -0,0 +1,12 @@
+<div>content</div>
+
+<hr style="background: #eaa;" />
+
+nested elements:
+
+<div>
+parent
+<div>
+child
+</div>
+</div>
--- a/tests/data/blockquote.html
+++ b/tests/data/blockquote.html
@ -1,9 +0,0 @@
-<p>Here's a blockquote:</p>
-<blockquote>
-<p>blockquote</p>
-</blockquote>
-<p>Here's one on multiple lines:</p>
-<blockquote>
-<p>line 1
-line 2</p>
-</blockquote>
--- a/tests/data/blockquote.md
+++ b/tests/data/blockquote.md
@ -1,8 +0,0 @@
-Here's a blockquote:
-
-> blockquote
-
-Here's one on multiple lines:
-
-> line 1
-> line 2
--- a/tests/data/blockquote_-_compound.html
+++ b/tests/data/blockquote_-_compound.html
@ -1,16 +0,0 @@
-<p>Here's one with multiple paragraphs:</p>
-<blockquote>
-<p>This is line one.</p>
-<p>This is line two.</p>
-</blockquote>
-<p>Here's one with multiple types of blocks:</p>
-<blockquote>
-<p>This is a quoted paragraph.</p>
-<ul>
-<li>This is a list item of a quoted list.</li>
-<li>This is another list item.</li>
-</ul>
-<blockquote>
-<p>This is a nested quote block.</p>
-</blockquote>
-</blockquote>
--- a/tests/data/blockquote_-_compound.md
+++ b/tests/data/blockquote_-_compound.md
@ -1,14 +0,0 @@
-Here's one with multiple paragraphs:
-
-> This is line one.
->
-> This is line two.
-
-Here's one with multiple types of blocks:
-
-> This is a quoted paragraph.
-> 
-> - This is a list item of a quoted list.
-> - This is another list item.
->
-> > This is a nested quote block.
--- a/tests/data/blockquote_-_lazy.html
+++ b/tests/data/blockquote_-_lazy.html
@ -1,11 +0,0 @@
-<p>Here's a lazy blockquote:</p>
-<blockquote>
-<p>line
-line</p>
-</blockquote>
-<p>Here's one with multiple lines:</p>
-<blockquote>
-<p>line
-line
-line</p>
-</blockquote>
--- a/tests/data/blockquote_-_lazy.md
+++ b/tests/data/blockquote_-_lazy.md
@ -1,10 +0,0 @@
-Here's a lazy blockquote:
-
-> line
-line
-
-Here's one with multiple lines:
-
-> line
-line
-line
--- a/tests/data/blockquote_-_whitespace.html
+++ b/tests/data/blockquote_-_whitespace.html
@ -1,12 +0,0 @@
-<p>Here's a blockquote with no space after the ">":</p>
-<blockquote>
-<p>blockquote</p>
-</blockquote>
-<p>Here's a blockquote with leading space:</p>
-<blockquote>
-<p>blockquote</p>
-</blockquote>
-<p>Here's a blockquote on the next line:</p>
-<blockquote>
-<p>blockquote</p>
-</blockquote>
--- a/tests/data/blockquote_-_whitespace.md
+++ b/tests/data/blockquote_-_whitespace.md
@ -1,10 +0,0 @@
-Here's a blockquote with no space after the ">":
-
->blockquote
-
-Here's a blockquote with leading space:
-
-   > blockquote
-
-Here's a blockquote on the next line:
-> blockquote
--- a/tests/data/code_block.html
+++ b/tests/data/code_block.html
@ -1,5 +1,8 @@
-<p>Here's a code block:</p>
 <pre><code>&lt;?php

 $message = 'Hello World!'; 
-echo $message;</code></pre>
+echo $message;</code></pre>
+<hr />
+<pre><code>&gt; not a quote 
+- not a list item
+[not a reference]: http://foo.com</code></pre>
--- a/tests/data/code_block.md
+++ b/tests/data/code_block.md
@ -1,6 +1,11 @@
-Here's a code block:
-
    <?php
    
    $message = 'Hello World!'; 
-    echo $message;
+    echo $message;
+
+---
+
+    > not a quote 
+    - not a list item
+    [not a reference]: http://foo.com
+    
--- a/tests/data/code_span.html
+++ b/tests/data/code_span.html
@ -1 +1 @@
-<p>This is a <code>code span</code>.</p>
+<p>a <code>code span</code></p>
--- a/tests/data/code_span.md
+++ b/tests/data/code_span.md
@ -1 +1 @@
-This is a `code span`.
+a `code span`
--- a/tests/data/compound_blockquote.html
+++ b/tests/data/compound_blockquote.html
@ -0,0 +1,9 @@
+<blockquote>
+<h2>header</h2>
+<p>paragraph</p>
+<ul>
+<li>li</li>
+</ul>
+<hr />
+<p>paragraph</p>
+</blockquote>
--- a/tests/data/compound_blockquote.md
+++ b/tests/data/compound_blockquote.md
@ -0,0 +1,10 @@
+> header
+> ------
+>
+> paragraph
+>
+> - li
+>
+> ---
+>
+> paragraph
--- a/tests/data/compound_list.html
+++ b/tests/data/compound_list.html
@ -0,0 +1,12 @@
+<ul>
+<li>
+<p>paragraph</p>
+<p>paragraph</p>
+</li>
+<li>
+<p>paragraph</p>
+<blockquote>
+<p>quote</p>
+</blockquote>
+</li>
+</ul>
--- a/tests/data/compound_list.md
+++ b/tests/data/compound_list.md
@ -0,0 +1,7 @@
+- paragraph
+
+  paragraph
+
+- paragraph
+
+  > quote
--- a/tests/data/emphasis_-_em_strong.html
+++ b/tests/data/emphasis_-_em_strong.html
--- a/tests/data/emphasis_-_em_strong.md
+++ b/tests/data/emphasis_-_em_strong.md
--- a/tests/data/emphasis.html
+++ b/tests/data/emphasis.html
@ -1,11 +1,6 @@
-<p>Here's <em>an emphasis</em>.</p>
-<p>A short one <em>a</em> <em>b</em> .</p>
-<p>Here's <strong>a strong one</strong>. </p>
-<p>Here's <em>one that uses underscores</em>. </p>
-<p>Here's <strong>a strong one that uses underscores</strong>.</p>
-<p>This is not _ one _ neither is * this * neither is _ this_ neither is _this _.</p>
-<p>An empty emphasis ** is not __ an emphasis.</p>
-<p>A <em>multi-line
+<p><em>underscore</em>, <em>asterisk</em>, <em>one two</em>, <em>three four</em>, <em>a</em>, <em>b</em></p>
+<p><em>multiline
 emphasis</em></p>
-<p>A <strong>multi-line
-strong emphasis</strong></p>
+<p>_ this _ is not an emphasis, neither is _ this_, _this _, or _this*</p>
+<p>this_is_not_an_emphasis</p>
+<p>an empty emphasis __ ** is not an emphasis</p>
--- a/tests/data/emphasis.md
+++ b/tests/data/emphasis.md
@ -1,19 +1,10 @@
-Here's *an emphasis*.
+_underscore_, *asterisk*, _one two_, *three four*, _a_, *b*

-A short one _a_ *b* .
+_multiline
+emphasis_

-Here's **a strong one**. 
+_ this _ is not an emphasis, neither is _ this_, _this _, or _this*

-Here's _one that uses underscores_. 
+this_is_not_an_emphasis

-Here's __a strong one that uses underscores__.
-
-This is not _ one _ neither is * this * neither is _ this_ neither is _this _.
-
-An empty emphasis ** is not __ an emphasis.
-
-A *multi-line
-emphasis*
-
-A **multi-line
-strong emphasis**
+an empty emphasis __ ** is not an emphasis
--- a/tests/data/escaping.html
+++ b/tests/data/escaping.html
@ -1,2 +1,4 @@
-<p>Here's an <em>emphasis</em> and here's an escaped *emphasis*. Here are also an escaped `code span`, an escaped [inline link](http://example.com) and an escaped <code>\*emphasis\*</code> inside of a code span.</p>
-<pre><code>An escaped \*emphasis\* inside of a code block.</code></pre>
+<p>escaped *emphasis*.</p>
+<p><code>escaped \*emphasis\* in a code span</code></p>
+<pre><code>escaped \*emphasis\* in a code block</code></pre>
+<p>\ ` * _ { } [ ] ( ) > # + - . !</p>
--- a/tests/data/escaping.md
+++ b/tests/data/escaping.md
@ -1,3 +1,7 @@
-Here's an *emphasis* and here's an escaped \*emphasis\*. Here are also an escaped \`code span\`, an escaped \[inline link](http://example.com) and an escaped `\*emphasis\*` inside of a code span.
+escaped \*emphasis\*.

-    An escaped \*emphasis\* inside of a code block.
+`escaped \*emphasis\* in a code span`
+
+    escaped \*emphasis\* in a code block
+
+\\ \` \* \_ \{ \} \[ \] \( \) \> \# \+ \- \. \!
--- a/tests/data/fenced_code_block.html
+++ b/tests/data/fenced_code_block.html
@ -0,0 +1,5 @@
+<pre><code>&lt;?php
+
+$message = 'fenced code block';
+echo $message;</code></pre>
+<pre><code>tilde</code></pre>
--- a/tests/data/fenced_code_block.md
+++ b/tests/data/fenced_code_block.md
@ -0,0 +1,10 @@
+```
+<?php
+
+$message = 'fenced code block';
+echo $message;
+```
+
+~~~
+tilde
+~~~
--- a/tests/data/horizontal_rule.html
+++ b/tests/data/horizontal_rule.html
@ -1,10 +1,5 @@
-<p>Dashes:</p>
 <hr />
 <hr />
 <hr />
-<p>Asterisks:</p>
 <hr />
-<p>Underscores:</p>
-<hr />
-<p>On the next line:</p>
 <hr />
--- a/tests/data/horizontal_rule.md
+++ b/tests/data/horizontal_rule.md
@ -1,18 +1,9 @@
-Dashes:
-
 ---

 - - -

   - - -

-Asterisks:
-
 ***

-Underscores:
-
-___
-
-On the next line:
 ___
--- a/tests/data/html.html
+++ b/tests/data/html.html
@ -1,15 +0,0 @@
-<p>A self-closing tag:</p>
-<hr/>
-<p>One with attributes:</p>
-<hr style="background: #eaa" />
-<p>A bare element:</p>
-<div>content</div>
-<p>One with attributes:</p>
-<a href="http://example.com">link</a>
-<p>Nested elements:</p>
-<div>
-parent
-<div>
-child
-</div>
-</div>
--- a/tests/data/html.md
+++ b/tests/data/html.md
@ -1,24 +0,0 @@
-A self-closing tag:
-
-<hr/>
-
-One with attributes:
-
-<hr style="background: #eaa" />
-
-A bare element:
-
-<div>content</div>
-
-One with attributes:
-
-<a href="http://example.com">link</a>
-
-Nested elements:
-
-<div>
-parent
-<div>
-child
-</div>
-</div>
--- a/tests/data/image_reference.html
+++ b/tests/data/image_reference.html
@ -0,0 +1 @@
+<p><img alt="Markdown Logo" src="/md.png"></p>
--- a/tests/data/image_reference.md
+++ b/tests/data/image_reference.md
@ -0,0 +1,3 @@
+![Markdown Logo][image]
+
+[image]: /md.png
--- a/tests/data/implicit_reference.html
+++ b/tests/data/implicit_reference.html
@ -0,0 +1,2 @@
+<p>an <a href="http://example.com">implicit</a> reference link</p>
+<p>an <a href="http://example.com">implicit</a> reference link with an empty link definition</p>
--- a/tests/data/implicit_reference.md
+++ b/tests/data/implicit_reference.md
@ -0,0 +1,5 @@
+an [implicit] reference link
+
+[implicit]: http://example.com
+
+an [implicit][] reference link with an empty link definition
--- a/tests/data/inline_link.html
+++ b/tests/data/inline_link.html
@ -1,2 +1,2 @@
-<p>Here's a <a href="http://example.com">link</a>.</p>
-<p>Here's one that is based on an image: <a href="http://daringfireball.net/projects/markdown/"><img alt="MD Logo" src="http://parsedown.org/md.png"></a>.</p>
+<p><a href="http://example.com">link</a></p>
+<p><a href="http://example.com"><img alt="MD Logo" src="http://parsedown.org/md.png"></a></p>
--- a/tests/data/inline_link.md
+++ b/tests/data/inline_link.md
@ -1,3 +1,3 @@
-Here's a [link](http://example.com).
+[link](http://example.com)

-Here's one that is based on an image: [![MD Logo](http://parsedown.org/md.png)](http://daringfireball.net/projects/markdown/).
+[![MD Logo](http://parsedown.org/md.png)](http://example.com)
--- a/tests/data/lazy_blockquote.html
+++ b/tests/data/lazy_blockquote.html
@ -0,0 +1,4 @@
+<blockquote>
+<p>quote
+the rest of it</p>
+</blockquote>
--- a/tests/data/lazy_blockquote.md
+++ b/tests/data/lazy_blockquote.md
@ -0,0 +1,2 @@
+> quote
+the rest of it
--- a/tests/data/lazy_list.html
+++ b/tests/data/lazy_list.html
@ -0,0 +1,4 @@
+<ul>
+<li>li
+the rest of it</li>
+</ul>
--- a/tests/data/lazy_list.md
+++ b/tests/data/lazy_list.md
@ -0,0 +1,2 @@
+- li
+the rest of it
--- a/tests/data/list.html
+++ b/tests/data/list.html
@ -1,5 +0,0 @@
-<p>Here's a list:</p>
-<ul>
-<li>li</li>
-<li>li</li>
-</ul>
--- a/tests/data/list.md
+++ b/tests/data/list.md
@ -1,4 +0,0 @@
-Here's a list:
-
- li
- li
--- a/tests/data/list_-_compound.html
+++ b/tests/data/list_-_compound.html
@ -1,13 +0,0 @@
-<p>Here's a compound list:</p>
-<ul>
-<li>
-<p>This is the first paragraph of the list item.</p>
-<p>This is the second one.</p>
-</li>
-<li>
-<p>This is another list item.</p>
-<blockquote>
-<p>This is a quote block that belongs to it.</p>
-</blockquote>
-</li>
-</ul>
--- a/tests/data/list_-_compound.md
+++ b/tests/data/list_-_compound.md
@ -1,9 +0,0 @@
-Here's a compound list:
-
- This is the first paragraph of the list item.
-
-  This is the second one.
-
- This is another list item.
-
-  > This is a quote block that belongs to it.
--- a/tests/data/list_-_lazy.html
+++ b/tests/data/list_-_lazy.html
@ -1,4 +0,0 @@
-<ul>
-<li>li
-more text</li>
-</ul>
--- a/tests/data/list_-_lazy.md
+++ b/tests/data/list_-_lazy.md
@ -1,2 +0,0 @@
- li
-more text
--- a/tests/data/list_-_ordered.html
+++ b/tests/data/list_-_ordered.html
@ -1,14 +0,0 @@
-<p>Here's a regular ordered list:</p>
-<ol>
-<li>one</li>
-<li>two</li>
-</ol>
-<p>Here's one with repeating numbers:</p>
-<ol>
-<li>one</li>
-<li>two</li>
-</ol>
-<p>Here's one with large numbers:</p>
-<ol>
-<li>one</li>
-</ol>
--- a/tests/data/list_-_ordered.md
+++ b/tests/data/list_-_ordered.md
@ -1,13 +0,0 @@
-Here's a regular ordered list:
-
-1. one
-2. two
-
-Here's one with repeating numbers:
-
-1. one
-1. two
-
-Here's one with large numbers:
-
-123. one
--- a/tests/data/list_-_sparse.html
+++ b/tests/data/list_-_sparse.html
@ -1,16 +0,0 @@
-<p>Here's a sparse list:</p>
-<ul>
-<li>
-<p>list item</p>
-</li>
-<li>another list item</li>
-</ul>
-<p>Here's one with an indented list item:</p>
-<ul>
-<li>
-<p>li</p>
-<ul>
-<li>li</li>
-</ul>
-</li>
-</ul>
--- a/tests/data/list_-_sparse.md
+++ b/tests/data/list_-_sparse.md
@ -1,11 +0,0 @@
-Here's a sparse list:
-
- list item
-
- another list item
-
-Here's one with an indented list item:
-
- li
-
-    - li
--- a/tests/data/list_-_unordered.md
+++ b/tests/data/list_-_unordered.md
@ -1,10 +0,0 @@
-Here's an unordered list:
-
- li
- li
-
-Here's one with mixed markers:
-
- li
-+ li
-* li
--- a/tests/data/list_-_whitespace.html
+++ b/tests/data/list_-_whitespace.html
@ -1,5 +0,0 @@
-<p>Here's one with white space around items:</p>
-<ul>
-<li>li  </li>
-<li>li  </li>
-</ul>
--- a/tests/data/list_-_whitespace.md
+++ b/tests/data/list_-_whitespace.md
@ -1,4 +0,0 @@
-Here's one with white space around items:
-
-  - li  
-  - li  
--- a/tests/data/ordered_list.html
+++ b/tests/data/ordered_list.html
@ -0,0 +1,13 @@
+<ol>
+<li>one</li>
+<li>two</li>
+</ol>
+<p>repeating numbers:</p>
+<ol>
+<li>one</li>
+<li>two</li>
+</ol>
+<p>large numbers:</p>
+<ol>
+<li>one</li>
+</ol>
--- a/tests/data/ordered_list.md
+++ b/tests/data/ordered_list.md
@ -0,0 +1,11 @@
+1. one
+2. two
+
+repeating numbers:
+
+1. one
+1. two
+
+large numbers:
+
+123. one
--- a/tests/data/reference_link.html
+++ b/tests/data/reference_link.html
@ -1,7 +0,0 @@
-<p>Here's a <a href="http://example.com">reference link</a>.</p>
-<p>Here's <a href="http://example.com">one</a> with a semantic name.</p>
-<p>Here's <a href="http://example.com">one</a> with an upper case label definition.</p>
-<p>Here's <a href="http://example.com">one</a> with definition name on the next line.</p>
-<p>Here's [one][404] with no definition.</p>
-<p>Here's a <a href="http://example.com">multiline
-one</a> defined on 2 lines.</p>
--- a/tests/data/reference_link.md
+++ b/tests/data/reference_link.md
@ -1,19 +0,0 @@
-Here's a [reference link][1].
-
-[1]: http://example.com
-
-Here's [one][website] with a semantic name.
-
-[website]: http://example.com
-
-Here's [one][case] with an upper case label definition.
-
-[CASE]: http://example.com
-
-Here's [one]
-[website] with definition name on the next line.
-
-Here's [one][404] with no definition.
-
-Here's a [multiline
-one][website] defined on 2 lines.
--- a/tests/data/reference_link_-_image.html
+++ b/tests/data/reference_link_-_image.html
@ -1 +0,0 @@
-<p>Here's an image: <img alt="Markdown Logo" src="/md.png"></p>
--- a/tests/data/reference_link_-_image.md
+++ b/tests/data/reference_link_-_image.md
@ -1,3 +0,0 @@
-Here's an image: ![Markdown Logo][image]
-
-[image]: /md.png
--- a/tests/data/reference_link_-_implicit.html
+++ b/tests/data/reference_link_-_implicit.html
@ -1,2 +0,0 @@
-<p>Here's an <a href="http://example.com">implicit</a> reference link.</p>
-<p>Here's an <a href="http://example.com">implicit</a> one with an empty link definition.</p>
--- a/tests/data/reference_link_-_implicit.md
+++ b/tests/data/reference_link_-_implicit.md
@ -1,5 +0,0 @@
-Here's an [implicit] reference link.
-
-[implicit]: http://example.com
-
-Here's an [implicit][] one with an empty link definition.
--- a/tests/data/reference_link_-_whitespace.html
+++ b/tests/data/reference_link_-_whitespace.html
@ -1 +0,0 @@
-<p>Here's a <a href="http://example.com">reference link</a> with a definition on the next line.</p>
--- a/tests/data/reference_link_-_whitespace.md
+++ b/tests/data/reference_link_-_whitespace.md
@ -1,2 +0,0 @@
-Here's a [reference link][2] with a definition on the next line.
-[2]: http://example.com
--- a/tests/data/simple_blockquote.html
+++ b/tests/data/simple_blockquote.html
@ -0,0 +1,11 @@
+<blockquote>
+<p>quote</p>
+</blockquote>
+<p>indented:</p>
+<blockquote>
+<p>quote</p>
+</blockquote>
+<p>no space after <code>&gt;</code>:</p>
+<blockquote>
+<p>quote</p>
+</blockquote>
--- a/tests/data/simple_blockquote.md
+++ b/tests/data/simple_blockquote.md
@ -0,0 +1,7 @@
+> quote
+
+indented:
+   > quote
+
+no space after `>`:
+>quote
--- a/tests/data/span-level_html.html
+++ b/tests/data/span-level_html.html
@ -0,0 +1,3 @@
+<p>an <b>important</b> <a href=''>link</a></p>
+<p>broken<br/>
+line</p>
--- a/tests/data/span-level_html.md
+++ b/tests/data/span-level_html.md
@ -0,0 +1,4 @@
+an <b>important</b> <a href=''>link</a>
+
+broken<br/>
+line
--- a/tests/data/span_level_html.html
+++ b/tests/data/span_level_html.html
@ -1 +0,0 @@
-<p>Here's an <b>important</b> <a href=''>link</a>.</p>
--- a/tests/data/span_level_html.md
+++ b/tests/data/span_level_html.md
@ -1 +0,0 @@
-Here's an <b>important</b> <a href=''>link</a>.
--- a/tests/data/sparse_list.html
+++ b/tests/data/sparse_list.html
@ -0,0 +1,15 @@
+<ul>
+<li>
+<p>li</p>
+</li>
+<li>li</li>
+</ul>
+<hr />
+<ul>
+<li>
+<p>li</p>
+<ul>
+<li>indented li</li>
+</ul>
+</li>
+</ul>
--- a/tests/data/sparse_list.md
+++ b/tests/data/sparse_list.md
@ -0,0 +1,9 @@
+- li
+
+- li
+
+---
+
+- li
+
+    - indented li
--- a/tests/data/special_characters.html
+++ b/tests/data/special_characters.html
@ -1,7 +1,8 @@
-<p>AT&amp;T has an ampersand in their name.</p>
-<p>AT&amp;T is another way to write it.</p>
-<p>This &amp; that.</p>
-<p>4 &lt; 5 and 6 > 5.</p>
-<p>Here's an autolink <a href="http://example.com/autolink?a=1&amp;b=2">http://example.com/autolink?a=1&amp;b=2</a></p>
-<p>Here's an inline <a href="/script?a=1&amp;b=2">link</a>.</p>
-<p>Here's a reference <a href="http://example.com/?a=1&amp;b=2">link</a> with an ampersand in the URL.</p>
+<p>AT&amp;T has an ampersand in their name</p>
+<pre><code>Let's play some cards ♠ ♣ ♥ ♦</code></pre>
+<p>AT&amp;T is another way to write it</p>
+<p>this &amp; that</p>
+<p>4 &lt; 5 and 6 > 5</p>
+<p><a href="http://example.com/autolink?a=1&amp;b=2">http://example.com/autolink?a=1&amp;b=2</a> </p>
+<p><a href="/script?a=1&amp;b=2">inline link</a></p>
+<p><a href="http://example.com/?a=1&amp;b=2">reference link</a></p>
--- a/tests/data/special_characters.md
+++ b/tests/data/special_characters.md
@ -1,15 +1,17 @@
-AT&T has an ampersand in their name.
+AT&T has an ampersand in their name

-AT&amp;T is another way to write it.
+    Let's play some cards ♠ ♣ ♥ ♦

-This & that.
+AT&T is another way to write it

-4 < 5 and 6 > 5.
+this & that

-Here's an autolink <http://example.com/autolink?a=1&b=2>
+4 < 5 and 6 > 5

-Here's an inline [link](/script?a=1&b=2).
+<http://example.com/autolink?a=1&b=2> 

-Here's a reference [link] [1] with an ampersand in the URL.
+[inline link](/script?a=1&b=2)
+
+[reference link][1]

 [1]: http://example.com/?a=1&b=2
--- a/tests/data/strikethrough.html
+++ b/tests/data/strikethrough.html
@ -0,0 +1,3 @@
+<p><del>strikethrough</del></p>
+<p>in the <del>middle</del> of a sentence</p>
+<p>in the middle of a w<del>or</del>d</p>
--- a/tests/data/strikethrough.md
+++ b/tests/data/strikethrough.md
@ -0,0 +1,5 @@
+~~strikethrough~~
+
+in the ~~middle~~ of a sentence
+
+in the middle of a w~~or~~d
--- a/tests/data/text_reference.html
+++ b/tests/data/text_reference.html
@ -0,0 +1,6 @@
+<p><a href="http://example.com">reference link</a></p>
+<p><a href="http://example.com">one</a> with a semantic name</p>
+<p>[one][404] with no definition</p>
+<p><a href="http://example.com">multiline
+one</a> defined on 2 lines</p>
+<p><a href="http://example.com">one</a> with an upper case label</p>
--- a/tests/data/text_reference.md
+++ b/tests/data/text_reference.md
@ -0,0 +1,16 @@
+[reference link][1]
+
+[1]: http://example.com
+
+[one][website] with a semantic name
+
+[website]: http://example.com
+
+[one][404] with no definition
+
+[multiline
+one][website] defined on 2 lines
+
+[one][label] with an upper case label
+
+[LABEL]: http://example.com
--- a/tests/data/list_-_unordered.html
+++ b/tests/data/list_-_unordered.html
@ -1,9 +1,8 @@
-<p>Here's an unordered list:</p>
 <ul>
 <li>li</li>
 <li>li</li>
 </ul>
-<p>Here's one with mixed markers:</p>
+<p>mixed markers:</p>
 <ul>
 <li>li</li>
 <li>li</li>
--- a/tests/data/unordered_list.md
+++ b/tests/data/unordered_list.md
@ -0,0 +1,8 @@
+- li
+- li
+
+mixed markers:
+
+* li
+ li
+- li
--- a/tests/data/url_autolinking.html
+++ b/tests/data/url_autolinking.html
@ -0,0 +1 @@
+<p>Here's an autolink <a href="http://example.com">http://example.com</a>.</p>
--- a/tests/data/url_autolinking.md
+++ b/tests/data/url_autolinking.md
@ -0,0 +1 @@
+Here's an autolink http://example.com.
--- a/tests/data/whitespace.html
+++ b/tests/data/whitespace.html
@ -1 +1 @@
-<pre><code>This text starts with a line that consists of 4 spaces and it ends with one. This is a code block to make sure that leading spaces don't get trimmed.</code></pre>
+<pre><code>code</code></pre>
--- a/tests/data/whitespace.md
+++ b/tests/data/whitespace.md
@ -1,5 +1,5 @@
    

-    This text starts with a line that consists of 4 spaces and it ends with one. This is a code block to make sure that leading spaces don't get trimmed.
+    code
Author	SHA1	Message	Date
Emanuil Rusev	f5451a9eff	Merge pull request #37 from hkdobrev/htmlspecialshars-utf8	2013-11-22 13:23:21 -08:00
Haralan Dobrev	849a89b121	Use UTF-8 encoding for htmlspecialchars. See #36 . Prior to PHP 5.4.0 the default encoding for `htmlentities()` and `htmlspecialchars` is "ISO-8859-1". For PHP 5.4+ is "UTF-8". This ensures always the right encoding is used no matter the PHP version and the locale settings.	2013-11-22 23:06:20 +02:00
Emanuil Rusev	28064a63b3	simplify encoding of special characters	2013-11-22 21:57:21 +02:00
Emanuil Rusev	800aac5b56	Merge pull request #36 from josephok/patch-1	2013-11-22 11:21:38 -08:00
josephok	b15d40e8a3	Update Parsedown.php Changes the htmlentities() to htmlspecialchars(). The htmlentities() has some problems encoding non-english words(like Chinese)	2013-11-22 23:05:26 +08:00
Emanuil Rusev	ddc5b7e2dd	implement URL auto-linking	2013-11-22 00:20:45 +02:00
Emanuil Rusev	5a563008aa	implement GFM strikethrough	2013-11-21 13:39:00 +02:00
Emanuil Rusev	b6f795962f	resolve #21	2013-11-21 00:59:30 +02:00
Emanuil Rusev	cdb2646063	update readme to match website	2013-11-20 23:10:03 +02:00
Emanuil Rusev	e3b8026e39	build should no longer allow failures	2013-11-18 22:39:44 +02:00
Emanuil Rusev	d96f668c42	update test case to make it run on PHP 5.2	2013-11-18 22:29:15 +02:00
Emanuil Rusev	96bf75bd91	remove goto to provide support for PHP 5.2	2013-11-18 21:42:00 +02:00
Emanuil Rusev	67b51794d8	implement fenced code block to resolve #2	2013-11-17 16:52:31 +02:00
Emanuil Rusev	a9d6232705	array_shift » unset to simplify code base and improve performance	2013-11-17 13:21:49 +02:00
Emanuil Rusev	b91629ad94	organize evaluation blocks into switch statements to improve code readability	2013-11-17 12:48:01 +02:00
Emanuil Rusev	24d300ea5d	$pure_line » $deindented_line	2013-11-17 01:52:40 +02:00
Emanuil Rusev	d54712b989	simplify comments	2013-11-17 01:52:40 +02:00
Emanuil Rusev	6ef043ba7d	arrange compile cases	2013-11-17 01:52:40 +02:00
Emanuil Rusev	fe27b70bdb	block » markup	2013-11-17 01:52:40 +02:00
Emanuil Rusev	18d3dbf4f6	simplify comments	2013-11-17 01:52:40 +02:00
Emanuil Rusev	4758f58f73	remove double semicolons	2013-11-17 01:52:40 +02:00
Emanuil Rusev	5fa3eb1b2f	parse_inline_elements » parse_span_elements to match the specs	2013-11-17 01:52:40 +02:00
Emanuil Rusev	38300323a6	simplify readme	2013-11-16 18:45:13 +02:00
Emanuil Rusev	96609329b9	improve readme	2013-11-16 09:51:01 +02:00
Emanuil Rusev	e497acb6dc	escape sequences with double digit codes do not get decoded properly	2013-11-16 02:05:31 +02:00
Emanuil Rusev	30e436ec7d	simplify tests	2013-11-16 02:05:31 +02:00
Emanuil Rusev	3972f18881	improve readme	2013-11-14 00:50:00 +02:00
Emanuil Rusev	4fb12be60a	improve introduction	2013-11-13 01:52:59 +02:00
Emanuil Rusev	f8b07611d3	homepage » home	2013-11-13 01:47:38 +02:00
Emanuil Rusev	21d7f75f5b	improve readme	2013-11-13 01:38:29 +02:00
				`@ -0,0 +1 @@`
				`<p><img alt="Markdown Logo" src="/md.png"></p>`
				`@ -1 +0,0 @@`
				`<p>Here's an image: <img alt="Markdown Logo" src="/md.png"></p>`
				`@ -1 +0,0 @@`
				`<p>Here's a <a href="http://example.com">reference link</a> with a definition on the next line.</p>`
				`@ -1 +0,0 @@`
				`<p>Here's an <b>important</b> <a href=''>link</a>.</p>`
				`@ -1 +0,0 @@`
				`Here's an <b>important</b> <a href=''>link</a>.`
				`@ -0,0 +1 @@`
				`<p>Here's an autolink <a href="http://example.com">http://example.com</a>.</p>`