1
0
mirror of https://github.com/erusev/parsedown.git synced 2023-08-10 21:13:06 +03:00

Compare commits

..

30 Commits
0.4.7 ... 0.7.1

Author SHA1 Message Date
f5451a9eff Merge pull request #37 from hkdobrev/htmlspecialshars-utf8 2013-11-22 13:23:21 -08:00
849a89b121 Use UTF-8 encoding for htmlspecialchars. See #36.
Prior to PHP 5.4.0 the default encoding for `htmlentities()`
and `htmlspecialchars` is "ISO-8859-1". For PHP 5.4+ is "UTF-8".

This ensures always the right encoding is used no matter the PHP version
and the locale settings.
2013-11-22 23:06:20 +02:00
28064a63b3 simplify encoding of special characters 2013-11-22 21:57:21 +02:00
800aac5b56 Merge pull request #36 from josephok/patch-1 2013-11-22 11:21:38 -08:00
b15d40e8a3 Update Parsedown.php
Changes the htmlentities() to htmlspecialchars(). The htmlentities() has some problems encoding non-english words(like Chinese)
2013-11-22 23:05:26 +08:00
ddc5b7e2dd implement URL auto-linking 2013-11-22 00:20:45 +02:00
5a563008aa implement GFM strikethrough 2013-11-21 13:39:00 +02:00
b6f795962f resolve #21 2013-11-21 00:59:30 +02:00
cdb2646063 update readme to match website 2013-11-20 23:10:03 +02:00
e3b8026e39 build should no longer allow failures 2013-11-18 22:39:44 +02:00
d96f668c42 update test case to make it run on PHP 5.2 2013-11-18 22:29:15 +02:00
96bf75bd91 remove goto to provide support for PHP 5.2 2013-11-18 21:42:00 +02:00
67b51794d8 implement fenced code block to resolve #2 2013-11-17 16:52:31 +02:00
a9d6232705 array_shift » unset to simplify code base and improve performance 2013-11-17 13:21:49 +02:00
b91629ad94 organize evaluation blocks into switch statements to improve code readability 2013-11-17 12:48:01 +02:00
24d300ea5d $pure_line » $deindented_line 2013-11-17 01:52:40 +02:00
d54712b989 simplify comments 2013-11-17 01:52:40 +02:00
6ef043ba7d arrange compile cases 2013-11-17 01:52:40 +02:00
fe27b70bdb block » markup 2013-11-17 01:52:40 +02:00
18d3dbf4f6 simplify comments 2013-11-17 01:52:40 +02:00
4758f58f73 remove double semicolons 2013-11-17 01:52:40 +02:00
5fa3eb1b2f parse_inline_elements » parse_span_elements to match the specs 2013-11-17 01:52:40 +02:00
38300323a6 simplify readme 2013-11-16 18:45:13 +02:00
96609329b9 improve readme 2013-11-16 09:51:01 +02:00
e497acb6dc escape sequences with double digit codes do not get decoded properly 2013-11-16 02:05:31 +02:00
30e436ec7d simplify tests 2013-11-16 02:05:31 +02:00
3972f18881 improve readme 2013-11-14 00:50:00 +02:00
4fb12be60a improve introduction 2013-11-13 01:52:59 +02:00
f8b07611d3 homepage » home 2013-11-13 01:47:38 +02:00
21d7f75f5b improve readme 2013-11-13 01:38:29 +02:00
91 changed files with 748 additions and 739 deletions

View File

@ -4,8 +4,4 @@ php:
- 5.5
- 5.4
- 5.3
- 5.2
matrix:
allow_failures:
- php: 5.2
- 5.2

View File

@ -46,17 +46,17 @@ class Parsedown
function parse($text)
{
# Removes UTF-8 BOM and marker characters.
# removes UTF-8 BOM and marker characters
$text = preg_replace('{^\xEF\xBB\xBF|\x1A}', '', $text);
# Removes \r characters.
# removes \r characters
$text = str_replace("\r\n", "\n", $text);
$text = str_replace("\r", "\n", $text);
# Replaces tabs with spaces.
# replaces tabs with spaces
$text = str_replace("\t", ' ', $text);
# Encodes escape sequences.
# encodes escape sequences
if (strpos($text, '\\') !== FALSE)
{
@ -66,7 +66,7 @@ class Parsedown
{
if (strpos($text, $escape_sequence) !== FALSE)
{
$code = "\x1A".'\\'.$index;
$code = "\x1A".'\\'.$index.';';
$text = str_replace($escape_sequence, $code, $text);
@ -84,7 +84,7 @@ class Parsedown
$text = $this->parse_block_elements($lines);
# Decodes escape sequences (leaves out backslashes).
# decodes escape sequences
foreach ($this->escape_sequence_map as $code => $escape_sequence)
{
@ -110,28 +110,56 @@ class Parsedown
foreach ($lines as $line)
{
# Block-Level HTML
#
# fenced elements
if ($element['type'] === 'block' and ! isset($element['closed']))
switch ($element['type'])
{
if (preg_match('{<'.$element['subtype'].'>$}', $line)) # <open>
{
$element['depth']++;
}
case 'fenced_code_block':
if (preg_match('{</'.$element['subtype'].'>$}', $line)) # </close>
{
$element['depth'] > 0
? $element['depth']--
: $element['closed'] = true;
}
if ( ! isset($element['closed']))
{
if (preg_match('/^[ ]*'.$element['fence'][0].'{3,}[ ]*$/', $line))
{
$element['closed'] = true;
}
else
{
$element['text'] !== '' and $element['text'] .= "\n";
$element['text'] .= "\n".$line;
$element['text'] .= $line;
}
continue;
continue 2;
}
break;
case 'markup':
if ( ! isset($element['closed']))
{
if (preg_match('{<'.$element['subtype'].'>$}', $line)) # opening tag
{
$element['depth']++;
}
if (preg_match('{</'.$element['subtype'].'>$}', $line)) # closing tag
{
$element['depth'] > 0
? $element['depth']--
: $element['closed'] = true;
}
$element['text'] .= "\n".$line;
continue 2;
}
break;
}
# Empty
# *
if ($line === '')
{
@ -140,269 +168,330 @@ class Parsedown
continue;
}
# Lazy Blockquote
#
# composite elements
if ($element['type'] === 'blockquote' and ! isset($element['interrupted']))
switch ($element['type'])
{
$line = preg_replace('/^[ ]*>[ ]?/', '', $line);
case 'blockquote':
$element['lines'] []= $line;
continue;
}
# Lazy List Item
if ($element['type'] === 'li')
{
if (preg_match('/^([ ]{0,3})(\d+[.]|[*+-])[ ](.*)/', $line, $matches))
{
if ($element['indentation'] !== $matches[1])
if ( ! isset($element['interrupted']))
{
$line = preg_replace('/^[ ]*>[ ]?/', '', $line);
$element['lines'] []= $line;
continue 2;
}
break;
case 'li':
if (preg_match('/^([ ]{0,3})(\d+[.]|[*+-])[ ](.*)/', $line, $matches))
{
if ($element['indentation'] !== $matches[1])
{
$element['lines'] []= $line;
}
else
{
unset($element['last']);
$elements []= $element;
$element = array(
'type' => 'li',
'indentation' => $matches[1],
'last' => true,
'lines' => array(
preg_replace('/^[ ]{0,4}/', '', $matches[3]),
),
);
}
continue 2;
}
if (isset($element['interrupted']))
{
if ($line[0] === ' ')
{
$element['lines'] []= '';
$line = preg_replace('/^[ ]{0,4}/', '', $line);
$element['lines'] []= $line;
continue 2;
}
}
else
{
unset($element['last']);
$line = preg_replace('/^[ ]{0,4}/', '', $line);
$element['lines'] []= $line;
continue 2;
}
break;
}
#
# indentation sensitive types
$deindented_line = $line;
switch ($line[0])
{
case ' ':
# ~
$deindented_line = ltrim($line);
if ($deindented_line === '')
{
continue 2;
}
# code block
if (preg_match('/^[ ]{4}(.*)/', $line, $matches))
{
if ($element['type'] === 'code_block')
{
if (isset($element['interrupted']))
{
$element['text'] .= "\n";
unset ($element['interrupted']);
}
$element['text'] .= "\n".$matches[1];
}
else
{
$elements []= $element;
$element = array(
'type' => 'code_block',
'text' => $matches[1],
);
}
continue 2;
}
break;
case '#':
# atx heading (#)
if (preg_match('/^(#{1,6})[ ]*(.+?)[ ]*#*$/', $line, $matches))
{
$elements []= $element;
$level = strlen($matches[1]);
$element = array(
'type' => 'h.',
'text' => $matches[2],
'level' => $level,
);
continue 2;
}
break;
case '-':
# setext heading (---)
if ($line[0] === '-' and $element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[-]+[ ]*$/', $line))
{
$element['type'] = 'h.';
$element['level'] = 2;
continue 2;
}
break;
case '=':
# setext heading (===)
if ($line[0] === '=' and $element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[=]+[ ]*$/', $line))
{
$element['type'] = 'h.';
$element['level'] = 1;
continue 2;
}
break;
}
#
# indentation insensitive types
switch ($deindented_line[0])
{
case '<':
# self-closing tag
if (preg_match('{^<.+?/>$}', $deindented_line))
{
$elements []= $element;
$element = array(
'type' => '',
'text' => $deindented_line,
);
continue 2;
}
# opening tag
if (preg_match('{^<(\w+)(?:[ ].*?)?>}', $deindented_line, $matches))
{
$elements []= $element;
$element = array(
'type' => 'markup',
'subtype' => strtolower($matches[1]),
'text' => $deindented_line,
'depth' => 0,
);
preg_match('{</'.$matches[1].'>\s*$}', $deindented_line) and $element['closed'] = true;
continue 2;
}
break;
case '>':
# quote
if (preg_match('/^>[ ]?(.*)/', $deindented_line, $matches))
{
$elements []= $element;
$element = array(
'type' => 'blockquote',
'lines' => array(
$matches[1],
),
);
continue 2;
}
break;
case '[':
# reference
if (preg_match('/^\[(.+?)\]:[ ]*([^ ]+)/', $deindented_line, $matches))
{
$label = strtolower($matches[1]);
$this->reference_map[$label] = trim($matches[2], '<>');;
continue 2;
}
break;
case '`':
case '~':
# fenced code block
if (preg_match('/^([`]{3,}|[~]{3,})[ ]*(\S+)?[ ]*$/', $deindented_line, $matches))
{
$elements []= $element;
$element = array(
'type' => 'fenced_code_block',
'text' => '',
'fence' => $matches[1],
);
isset($matches[2]) and $element['language'] = $matches[2];
continue 2;
}
break;
case '*':
case '+':
case '-':
case '_':
# hr
if (preg_match('/^([-*_])([ ]{0,2}\1){2,}[ ]*$/', $deindented_line))
{
$elements []= $element;
$element = array(
'type' => 'hr',
);
continue 2;
}
# li
if (preg_match('/^([ ]*)[*+-][ ](.*)/', $line, $matches))
{
$elements []= $element;
$element = array(
'type' => 'li',
'ordered' => false,
'indentation' => $matches[1],
'last' => true,
'lines' => array(
preg_replace('/^[ ]{0,4}/', '', $matches[3]),
preg_replace('/^[ ]{0,4}/', '', $matches[2]),
),
);
continue 2;
}
continue;
}
if (isset($element['interrupted']))
{
if ($line[0] === ' ')
{
$element['lines'] []= '';
$line = preg_replace('/^[ ]{0,4}/', '', $line);;
$element['lines'] []= $line;
continue;
}
}
else
{
$line = preg_replace('/^[ ]{0,4}/', '', $line);;
$element['lines'] []= $line;
continue;
}
}
# Quick Paragraph
# li
if ($line[0] >= 'a' or $line[0] >= 'A' and $line[0] <= 'Z')
{
goto paragraph;
}
# Code Block
if ($line[0] === ' ' and preg_match('/^[ ]{4}(.*)/', $line, $matches))
{
if (trim($line) === '')
{
continue;
}
if ($element['type'] === 'code')
{
if (isset($element['interrupted']))
{
$element['text'] .= "\n";
unset ($element['interrupted']);
}
$element['text'] .= "\n".$matches[1];
}
else
{
$elements []= $element;
$element = array(
'type' => 'code',
'text' => $matches[1],
);
}
continue;
}
# Setext Header (---)
if ($line[0] === '-' and $element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[-]+[ ]*$/', $line))
{
$element['type'] = 'h.';
$element['level'] = 2;
continue;
}
# Atx Header (#)
if ($line[0] === '#' and preg_match('/^(#{1,6})[ ]*(.+?)[ ]*#*$/', $line, $matches))
{
$elements []= $element;
$level = strlen($matches[1]);
$element = array(
'type' => 'h.',
'text' => $matches[2],
'level' => $level,
);
continue;
}
# Setext Header (===)
if ($line[0] === '=' and $element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[=]+[ ]*$/', $line))
{
$element['type'] = 'h.';
$element['level'] = 1;
continue;
}
# ~
$pure_line = $line[0] !== ' ' ? $line : ltrim($line);
if ($pure_line === '')
{
continue;
}
# Link Reference
if ($pure_line[0] === '[' and preg_match('/^\[(.+?)\]:[ ]*([^ ]+)/', $pure_line, $matches))
{
$label = strtolower($matches[1]);
$url = trim($matches[2], '<>');
$this->reference_map[$label] = $url;
continue;
}
# Blockquote
if ($pure_line[0] === '>' and preg_match('/^>[ ]?(.*)/', $pure_line, $matches))
{
if ($element['type'] === 'blockquote')
{
if (isset($element['interrupted']))
{
$element['lines'] []= '';
unset($element['interrupted']);
}
$element['lines'] []= $matches[1];
}
else
{
$elements []= $element;
$element = array(
'type' => 'blockquote',
'lines' => array(
$matches[1],
),
);
}
continue;
}
# HTML
if ($pure_line[0] === '<')
{
# Block-Level HTML <self-closing/>
if (preg_match('{^<.+?/>$}', $pure_line))
{
$elements []= $element;
$element = array(
'type' => '',
'text' => $pure_line,
);
continue;
}
# Block-Level HTML <open>
if (preg_match('{^<(\w+)(?:[ ].*?)?>}', $pure_line, $matches))
{
$elements []= $element;
$element = array(
'type' => 'block',
'subtype' => strtolower($matches[1]),
'text' => $pure_line,
'depth' => 0,
);
preg_match('{</'.$matches[1].'>\s*$}', $pure_line) and $element['closed'] = true;
continue;
}
}
# Horizontal Rule
if (preg_match('/^([-*_])([ ]{0,2}\1){2,}[ ]*$/', $pure_line))
{
$elements []= $element;
$element = array(
'type' => 'hr',
);
continue;
}
# List Item
if (preg_match('/^([ ]*)(\d+[.]|[*+-])[ ](.*)/', $line, $matches))
if ($deindented_line[0] <= '9' and $deindented_line >= '0' and preg_match('/^([ ]*)\d+[.][ ](.*)/', $line, $matches))
{
$elements []= $element;
$element = array(
'type' => 'li',
'ordered' => isset($matches[2][1]),
'ordered' => true,
'indentation' => $matches[1],
'last' => true,
'lines' => array(
preg_replace('/^[ ]{0,4}/', '', $matches[3]),
preg_replace('/^[ ]{0,4}/', '', $matches[2]),
),
);
continue;
}
# ~
paragraph:
# paragraph
if ($element['type'] === 'p')
{
@ -432,7 +521,7 @@ class Parsedown
$elements []= $element;
array_shift($elements);
unset($elements[0]);
#
# ~
@ -440,10 +529,67 @@ class Parsedown
$markup = '';
foreach ($elements as $index => $element)
foreach ($elements as $element)
{
switch ($element['type'])
{
case 'p':
$text = $this->parse_span_elements($element['text']);
$text = preg_replace('/[ ]{2}\n/', '<br />'."\n", $text);
if ($context === 'li' and $markup === '')
{
if (isset($element['interrupted']))
{
$markup .= "\n".'<p>'.$text.'</p>'."\n";
}
else
{
$markup .= $text;
}
}
else
{
$markup .= '<p>'.$text.'</p>'."\n";
}
break;
case 'blockquote':
$text = $this->parse_block_elements($element['lines']);
$markup .= '<blockquote>'."\n".$text.'</blockquote>'."\n";
break;
case 'code_block':
case 'fenced_code_block':
$text = htmlspecialchars($element['text'], ENT_NOQUOTES, 'UTF-8');
strpos($text, "\x1A\\") !== FALSE and $text = strtr($text, $this->escape_sequence_map);
$markup .= '<pre><code>'.$text.'</code></pre>'."\n";
break;
case 'h.':
$text = $this->parse_span_elements($element['text']);
$markup .= '<h'.$element['level'].'>'.$text.'</h'.$element['level'].'>'."\n";
break;
case 'hr':
$markup .= '<hr />'."\n";
break;
case 'li':
if (isset($element['ordered'])) # first
@ -466,62 +612,6 @@ class Parsedown
break;
case 'p':
$text = $this->parse_inline_elements($element['text']);
$text = preg_replace('/[ ]{2}\n/', '<br />'."\n", $text);
if ($context === 'li' and $index === 0)
{
if (isset($element['interrupted']))
{
$markup .= "\n".'<p>'.$text.'</p>'."\n";
}
else
{
$markup .= $text;
}
}
else
{
$markup .= '<p>'.$text.'</p>'."\n";
}
break;
case 'code':
$text = htmlentities($element['text'], ENT_NOQUOTES);
strpos($text, "\x1A\\") !== FALSE and $text = strtr($text, $this->escape_sequence_map);
$markup .= '<pre><code>'.$text.'</code></pre>'."\n";
break;
case 'blockquote':
$text = $this->parse_block_elements($element['lines']);
$markup .= '<blockquote>'."\n".$text.'</blockquote>'."\n";
break;
case 'h.':
$text = $this->parse_inline_elements($element['text']);
$markup .= '<h'.$element['level'].'>'.$text.'</h'.$element['level'].'>'."\n";
break;
case 'hr':
$markup .= '<hr />'."\n";
break;
default:
$markup .= $element['text']."\n";
@ -531,32 +621,32 @@ class Parsedown
return $markup;
}
private function parse_inline_elements($text)
private function parse_span_elements($text)
{
$map = array();
$index = 0;
# Code Span
# code span
if (strpos($text, '`') !== FALSE and preg_match_all('/`(.+?)`/', $text, $matches, PREG_SET_ORDER))
{
foreach ($matches as $matches)
{
$element_text = $matches[1];
$element_text = htmlentities($element_text, ENT_NOQUOTES);
$element_text = htmlspecialchars($element_text, ENT_NOQUOTES, 'UTF-8');
# Decodes escape sequences.
# decodes escape sequences
$this->escape_sequence_map
and strpos($element_text, "\x1A") !== FALSE
and $element_text = strtr($element_text, $this->escape_sequence_map);
# Composes element.
# composes element
$element = '<code>'.$element_text.'</code>';
# Encodes element.
# encodes element
$code = "\x1A".'$'.$index;
@ -568,7 +658,7 @@ class Parsedown
}
}
# Inline Link / Image
# inline link or image
if (strpos($text, '](') !== FALSE and preg_match_all('/(!?)(\[((?:[^\[\]]|(?2))*)\])\((.*?)\)/', $text, $matches, PREG_SET_ORDER)) # inline
{
@ -584,7 +674,7 @@ class Parsedown
}
else
{
$element_text = $this->parse_inline_elements($matches[3]);
$element_text = $this->parse_span_elements($matches[3]);
$element = '<a href="'.$url.'">'.$element_text.'</a>';
}
@ -601,7 +691,7 @@ class Parsedown
}
}
# Reference(d) Link / Image
# reference link or image
if ($this->reference_map and strpos($text, '[') !== FALSE and preg_match_all('/(!?)\[(.+?)\](?:\n?[ ]?\[(.*?)\])?/ms', $text, $matches, PREG_SET_ORDER))
{
@ -625,7 +715,7 @@ class Parsedown
}
else # anchor
{
$element_text = $this->parse_inline_elements($matches[2]);
$element_text = $this->parse_span_elements($matches[2]);
$element = '<a href="'.$url.'">'.$element_text.'</a>';
}
@ -643,29 +733,35 @@ class Parsedown
}
}
# Automatic Links
if (strpos($text, '<') !== FALSE and preg_match_all('/<((https?|ftp|dict):[^\^\s]+?)>/i', $text, $matches, PREG_SET_ORDER))
if (strpos($text, '://') !== FALSE)
{
foreach ($matches as $matches)
switch (TRUE)
{
$url = $matches[1];
case preg_match_all('{<(https?:[/]{2}[^\s]+)>}i', $text, $matches, PREG_SET_ORDER):
case preg_match_all('{\b(https?:[/]{2}[^\s]+)\b}i', $text, $matches, PREG_SET_ORDER):
strpos($url, '&') !== FALSE and $url = preg_replace('/&(?!#?\w+;)/', '&amp;', $url);
foreach ($matches as $matches)
{
$url = $matches[1];
$element = '<a href=":href">:text</a>';
$element = str_replace(':text', $url, $element);
$element = str_replace(':href', $url, $element);
strpos($url, '&') !== FALSE and $url = preg_replace('/&(?!#?\w+;)/', '&amp;', $url);
# ~
$element = '<a href=":href">:text</a>';
$element = str_replace(':text', $url, $element);
$element = str_replace(':href', $url, $element);
$code = "\x1A".'$'.$index;
# ~
$text = str_replace($matches[0], $code, $text);
$code = "\x1A".'$'.$index;
$map[$code] = $element;
$text = str_replace($matches[0], $code, $text);
$index ++;
$map[$code] = $element;
$index ++;
}
break;
}
}
@ -676,10 +772,15 @@ class Parsedown
# ~
if (strpos($text, '~~') !== FALSE)
{
$text = preg_replace('/~~(?=\S)(.+?)(?<=\S)~~/s', '<del>$1</del>', $text);
}
if (strpos($text, '_') !== FALSE)
{
$text = preg_replace('/__(?=\S)(.+?)(?<=\S)__(?!_)/s', '<strong>$1</strong>', $text);
$text = preg_replace('/_(?=\S)(.+?)(?<=\S)_/s', '<em>$1</em>', $text);
$text = preg_replace('/\b_(?=\S)(.+?)(?<=\S)_\b/s', '<em>$1</em>', $text);
}
if (strpos($text, '*') !== FALSE)
@ -692,4 +793,4 @@ class Parsedown
return $text;
}
}
}

View File

@ -1,9 +1,8 @@
## Parsedown PHP
## Parsedown
Parsedown is a parser for Markdown. It parses Markdown text the way people do. First, it divides texts into blocks. Then it looks at how these blocks start and how they relate to each other. Finally, it looks for special characters to identify inline elements. As a result, Parsedown is (super) fast, consistent and clean.
Fast, consistent and easy to use [Markdown][1] parser for PHP.
[Explorer (demo)](http://parsedown.org/explorer/)
[Tests](http://parsedown.org/tests/)
[Home](http://parsedown.org) &middot; [Demo](http://parsedown.org/explorer/) &middot; [Tests](http://parsedown.org/tests/)
### Installation
@ -17,4 +16,6 @@ $text = 'Hello **Parsedown**!';
$result = Parsedown::instance()->parse($text);
echo $result; # prints: <p>Hello <strong>Parsedown</strong>!</p>
```
```
[1]: http://daringfireball.net/projects/markdown/

View File

@ -5,7 +5,7 @@ include 'Parsedown.php';
class Test extends PHPUnit_Framework_TestCase
{
const provider_dir = 'data/';
/**
* @dataProvider provider
*/
@ -15,33 +15,41 @@ class Test extends PHPUnit_Framework_TestCase
$this->assertEquals($expected_markup, $actual_markup);
}
function provider()
{
$provider = array();
$DirectoryIterator = new DirectoryIterator(__DIR__ . '/' . self::provider_dir);
$path = dirname(__FILE__).'/';
$DirectoryIterator = new DirectoryIterator($path . '/' . self::provider_dir);
foreach ($DirectoryIterator as $Item)
{
if ($Item->isFile() and $Item->getExtension() === 'md')
if ($Item->isFile())
{
$filename = $Item->getFilename();
$extension = pathinfo($filename, PATHINFO_EXTENSION);
if ($extension !== 'md')
continue;
$basename = $Item->getBasename('.md');
$markdown = file_get_contents(__DIR__ . '/' . self::provider_dir . $basename . '.md');
$markdown = file_get_contents($path . '/' . self::provider_dir . $basename . '.md');
if (!$markdown)
continue;
$expected_markup = file_get_contents(__DIR__ . '/' . self::provider_dir . $basename . '.html');
$expected_markup = file_get_contents($path . '/' . self::provider_dir . $basename . '.html');
$expected_markup = str_replace("\r\n", "\n", $expected_markup);
$expected_markup = str_replace("\r", "\n", $expected_markup);
$provider [] = array($markdown, $expected_markup);
}
}
return $provider;
}
}
}

View File

@ -1,6 +1,7 @@
<h1>This is an h1</h1>
<h2>This is an h2</h2>
<h3>This is an h3</h3>
<h4>This is an h4</h4>
<h5>This is an h5</h5>
<h6>This is an h6</h6>
<h1>h1</h1>
<h2>h2</h2>
<h3>h3</h3>
<h4>h4</h4>
<h5>h5</h5>
<h6>h6</h6>
<h1>closed h1</h1>

View File

@ -1,11 +1,13 @@
# This is an h1
# h1
## This is an h2
## h2
### This is an h3
### h3
#### This is an h4
#### h4
##### This is an h5
##### h5
###### This is an h6
###### h6
# closed h1 #

View File

@ -1,6 +0,0 @@
<h1>h1</h1>
<h2>h2</h2>
<h3>h3</h3>
<h4>h4</h4>
<h5>h5</h5>
<h6>h6</h6>

View File

@ -1,11 +0,0 @@
# h1 #
## h2 ##
### h3 ###
#### h4 ####
##### h5 #####
###### h6 ######

View File

@ -0,0 +1,9 @@
<div>content</div>
<hr style="background: #eaa;" />
<p>nested elements:</p>
<div>
parent
<div>
child
</div>
</div>

View File

@ -0,0 +1,12 @@
<div>content</div>
<hr style="background: #eaa;" />
nested elements:
<div>
parent
<div>
child
</div>
</div>

View File

@ -1,9 +0,0 @@
<p>Here's a blockquote:</p>
<blockquote>
<p>blockquote</p>
</blockquote>
<p>Here's one on multiple lines:</p>
<blockquote>
<p>line 1
line 2</p>
</blockquote>

View File

@ -1,8 +0,0 @@
Here's a blockquote:
> blockquote
Here's one on multiple lines:
> line 1
> line 2

View File

@ -1,16 +0,0 @@
<p>Here's one with multiple paragraphs:</p>
<blockquote>
<p>This is line one.</p>
<p>This is line two.</p>
</blockquote>
<p>Here's one with multiple types of blocks:</p>
<blockquote>
<p>This is a quoted paragraph.</p>
<ul>
<li>This is a list item of a quoted list.</li>
<li>This is another list item.</li>
</ul>
<blockquote>
<p>This is a nested quote block.</p>
</blockquote>
</blockquote>

View File

@ -1,14 +0,0 @@
Here's one with multiple paragraphs:
> This is line one.
>
> This is line two.
Here's one with multiple types of blocks:
> This is a quoted paragraph.
>
> - This is a list item of a quoted list.
> - This is another list item.
>
> > This is a nested quote block.

View File

@ -1,11 +0,0 @@
<p>Here's a lazy blockquote:</p>
<blockquote>
<p>line
line</p>
</blockquote>
<p>Here's one with multiple lines:</p>
<blockquote>
<p>line
line
line</p>
</blockquote>

View File

@ -1,10 +0,0 @@
Here's a lazy blockquote:
> line
line
Here's one with multiple lines:
> line
line
line

View File

@ -1,12 +0,0 @@
<p>Here's a blockquote with no space after the ">":</p>
<blockquote>
<p>blockquote</p>
</blockquote>
<p>Here's a blockquote with leading space:</p>
<blockquote>
<p>blockquote</p>
</blockquote>
<p>Here's a blockquote on the next line:</p>
<blockquote>
<p>blockquote</p>
</blockquote>

View File

@ -1,10 +0,0 @@
Here's a blockquote with no space after the ">":
>blockquote
Here's a blockquote with leading space:
> blockquote
Here's a blockquote on the next line:
> blockquote

View File

@ -1,5 +1,8 @@
<p>Here's a code block:</p>
<pre><code>&lt;?php
$message = 'Hello World!';
echo $message;</code></pre>
echo $message;</code></pre>
<hr />
<pre><code>&gt; not a quote
- not a list item
[not a reference]: http://foo.com</code></pre>

View File

@ -1,6 +1,11 @@
Here's a code block:
<?php
$message = 'Hello World!';
echo $message;
echo $message;
---
> not a quote
- not a list item
[not a reference]: http://foo.com

View File

@ -1 +1 @@
<p>This is a <code>code span</code>.</p>
<p>a <code>code span</code></p>

View File

@ -1 +1 @@
This is a `code span`.
a `code span`

View File

@ -0,0 +1,9 @@
<blockquote>
<h2>header</h2>
<p>paragraph</p>
<ul>
<li>li</li>
</ul>
<hr />
<p>paragraph</p>
</blockquote>

View File

@ -0,0 +1,10 @@
> header
> ------
>
> paragraph
>
> - li
>
> ---
>
> paragraph

View File

@ -0,0 +1,12 @@
<ul>
<li>
<p>paragraph</p>
<p>paragraph</p>
</li>
<li>
<p>paragraph</p>
<blockquote>
<p>quote</p>
</blockquote>
</li>
</ul>

View File

@ -0,0 +1,7 @@
- paragraph
paragraph
- paragraph
> quote

View File

@ -1,11 +1,6 @@
<p>Here's <em>an emphasis</em>.</p>
<p>A short one <em>a</em> <em>b</em> .</p>
<p>Here's <strong>a strong one</strong>. </p>
<p>Here's <em>one that uses underscores</em>. </p>
<p>Here's <strong>a strong one that uses underscores</strong>.</p>
<p>This is not _ one _ neither is * this * neither is _ this_ neither is _this _.</p>
<p>An empty emphasis ** is not __ an emphasis.</p>
<p>A <em>multi-line
<p><em>underscore</em>, <em>asterisk</em>, <em>one two</em>, <em>three four</em>, <em>a</em>, <em>b</em></p>
<p><em>multiline
emphasis</em></p>
<p>A <strong>multi-line
strong emphasis</strong></p>
<p>_ this _ is not an emphasis, neither is _ this_, _this _, or _this*</p>
<p>this_is_not_an_emphasis</p>
<p>an empty emphasis __ ** is not an emphasis</p>

View File

@ -1,19 +1,10 @@
Here's *an emphasis*.
_underscore_, *asterisk*, _one two_, *three four*, _a_, *b*
A short one _a_ *b* .
_multiline
emphasis_
Here's **a strong one**.
_ this _ is not an emphasis, neither is _ this_, _this _, or _this*
Here's _one that uses underscores_.
this_is_not_an_emphasis
Here's __a strong one that uses underscores__.
This is not _ one _ neither is * this * neither is _ this_ neither is _this _.
An empty emphasis ** is not __ an emphasis.
A *multi-line
emphasis*
A **multi-line
strong emphasis**
an empty emphasis __ ** is not an emphasis

View File

@ -1,2 +1,4 @@
<p>Here's an <em>emphasis</em> and here's an escaped *emphasis*. Here are also an escaped `code span`, an escaped [inline link](http://example.com) and an escaped <code>\*emphasis\*</code> inside of a code span.</p>
<pre><code>An escaped \*emphasis\* inside of a code block.</code></pre>
<p>escaped *emphasis*.</p>
<p><code>escaped \*emphasis\* in a code span</code></p>
<pre><code>escaped \*emphasis\* in a code block</code></pre>
<p>\ ` * _ { } [ ] ( ) > # + - . !</p>

View File

@ -1,3 +1,7 @@
Here's an *emphasis* and here's an escaped \*emphasis\*. Here are also an escaped \`code span\`, an escaped \[inline link](http://example.com) and an escaped `\*emphasis\*` inside of a code span.
escaped \*emphasis\*.
An escaped \*emphasis\* inside of a code block.
`escaped \*emphasis\* in a code span`
escaped \*emphasis\* in a code block
\\ \` \* \_ \{ \} \[ \] \( \) \> \# \+ \- \. \!

View File

@ -0,0 +1,5 @@
<pre><code>&lt;?php
$message = 'fenced code block';
echo $message;</code></pre>
<pre><code>tilde</code></pre>

View File

@ -0,0 +1,10 @@
```
<?php
$message = 'fenced code block';
echo $message;
```
~~~
tilde
~~~

View File

@ -1,10 +1,5 @@
<p>Dashes:</p>
<hr />
<hr />
<hr />
<p>Asterisks:</p>
<hr />
<p>Underscores:</p>
<hr />
<p>On the next line:</p>
<hr />

View File

@ -1,18 +1,9 @@
Dashes:
---
- - -
- - -
Asterisks:
***
Underscores:
___
On the next line:
___

View File

@ -1,15 +0,0 @@
<p>A self-closing tag:</p>
<hr/>
<p>One with attributes:</p>
<hr style="background: #eaa" />
<p>A bare element:</p>
<div>content</div>
<p>One with attributes:</p>
<a href="http://example.com">link</a>
<p>Nested elements:</p>
<div>
parent
<div>
child
</div>
</div>

View File

@ -1,24 +0,0 @@
A self-closing tag:
<hr/>
One with attributes:
<hr style="background: #eaa" />
A bare element:
<div>content</div>
One with attributes:
<a href="http://example.com">link</a>
Nested elements:
<div>
parent
<div>
child
</div>
</div>

View File

@ -0,0 +1 @@
<p><img alt="Markdown Logo" src="/md.png"></p>

View File

@ -0,0 +1,3 @@
![Markdown Logo][image]
[image]: /md.png

View File

@ -0,0 +1,2 @@
<p>an <a href="http://example.com">implicit</a> reference link</p>
<p>an <a href="http://example.com">implicit</a> reference link with an empty link definition</p>

View File

@ -0,0 +1,5 @@
an [implicit] reference link
[implicit]: http://example.com
an [implicit][] reference link with an empty link definition

View File

@ -1,2 +1,2 @@
<p>Here's a <a href="http://example.com">link</a>.</p>
<p>Here's one that is based on an image: <a href="http://daringfireball.net/projects/markdown/"><img alt="MD Logo" src="http://parsedown.org/md.png"></a>.</p>
<p><a href="http://example.com">link</a></p>
<p><a href="http://example.com"><img alt="MD Logo" src="http://parsedown.org/md.png"></a></p>

View File

@ -1,3 +1,3 @@
Here's a [link](http://example.com).
[link](http://example.com)
Here's one that is based on an image: [![MD Logo](http://parsedown.org/md.png)](http://daringfireball.net/projects/markdown/).
[![MD Logo](http://parsedown.org/md.png)](http://example.com)

View File

@ -0,0 +1,4 @@
<blockquote>
<p>quote
the rest of it</p>
</blockquote>

View File

@ -0,0 +1,2 @@
> quote
the rest of it

View File

@ -0,0 +1,4 @@
<ul>
<li>li
the rest of it</li>
</ul>

2
tests/data/lazy_list.md Normal file
View File

@ -0,0 +1,2 @@
- li
the rest of it

View File

@ -1,5 +0,0 @@
<p>Here's a list:</p>
<ul>
<li>li</li>
<li>li</li>
</ul>

View File

@ -1,4 +0,0 @@
Here's a list:
- li
- li

View File

@ -1,13 +0,0 @@
<p>Here's a compound list:</p>
<ul>
<li>
<p>This is the first paragraph of the list item.</p>
<p>This is the second one.</p>
</li>
<li>
<p>This is another list item.</p>
<blockquote>
<p>This is a quote block that belongs to it.</p>
</blockquote>
</li>
</ul>

View File

@ -1,9 +0,0 @@
Here's a compound list:
- This is the first paragraph of the list item.
This is the second one.
- This is another list item.
> This is a quote block that belongs to it.

View File

@ -1,4 +0,0 @@
<ul>
<li>li
more text</li>
</ul>

View File

@ -1,2 +0,0 @@
- li
more text

View File

@ -1,14 +0,0 @@
<p>Here's a regular ordered list:</p>
<ol>
<li>one</li>
<li>two</li>
</ol>
<p>Here's one with repeating numbers:</p>
<ol>
<li>one</li>
<li>two</li>
</ol>
<p>Here's one with large numbers:</p>
<ol>
<li>one</li>
</ol>

View File

@ -1,13 +0,0 @@
Here's a regular ordered list:
1. one
2. two
Here's one with repeating numbers:
1. one
1. two
Here's one with large numbers:
123. one

View File

@ -1,16 +0,0 @@
<p>Here's a sparse list:</p>
<ul>
<li>
<p>list item</p>
</li>
<li>another list item</li>
</ul>
<p>Here's one with an indented list item:</p>
<ul>
<li>
<p>li</p>
<ul>
<li>li</li>
</ul>
</li>
</ul>

View File

@ -1,11 +0,0 @@
Here's a sparse list:
- list item
- another list item
Here's one with an indented list item:
- li
- li

View File

@ -1,10 +0,0 @@
Here's an unordered list:
- li
- li
Here's one with mixed markers:
- li
+ li
* li

View File

@ -1,5 +0,0 @@
<p>Here's one with white space around items:</p>
<ul>
<li>li </li>
<li>li </li>
</ul>

View File

@ -1,4 +0,0 @@
Here's one with white space around items:
- li
- li

View File

@ -0,0 +1,13 @@
<ol>
<li>one</li>
<li>two</li>
</ol>
<p>repeating numbers:</p>
<ol>
<li>one</li>
<li>two</li>
</ol>
<p>large numbers:</p>
<ol>
<li>one</li>
</ol>

View File

@ -0,0 +1,11 @@
1. one
2. two
repeating numbers:
1. one
1. two
large numbers:
123. one

View File

@ -1,7 +0,0 @@
<p>Here's a <a href="http://example.com">reference link</a>.</p>
<p>Here's <a href="http://example.com">one</a> with a semantic name.</p>
<p>Here's <a href="http://example.com">one</a> with an upper case label definition.</p>
<p>Here's <a href="http://example.com">one</a> with definition name on the next line.</p>
<p>Here's [one][404] with no definition.</p>
<p>Here's a <a href="http://example.com">multiline
one</a> defined on 2 lines.</p>

View File

@ -1,19 +0,0 @@
Here's a [reference link][1].
[1]: http://example.com
Here's [one][website] with a semantic name.
[website]: http://example.com
Here's [one][case] with an upper case label definition.
[CASE]: http://example.com
Here's [one]
[website] with definition name on the next line.
Here's [one][404] with no definition.
Here's a [multiline
one][website] defined on 2 lines.

View File

@ -1 +0,0 @@
<p>Here's an image: <img alt="Markdown Logo" src="/md.png"></p>

View File

@ -1,3 +0,0 @@
Here's an image: ![Markdown Logo][image]
[image]: /md.png

View File

@ -1,2 +0,0 @@
<p>Here's an <a href="http://example.com">implicit</a> reference link.</p>
<p>Here's an <a href="http://example.com">implicit</a> one with an empty link definition.</p>

View File

@ -1,5 +0,0 @@
Here's an [implicit] reference link.
[implicit]: http://example.com
Here's an [implicit][] one with an empty link definition.

View File

@ -1 +0,0 @@
<p>Here's a <a href="http://example.com">reference link</a> with a definition on the next line.</p>

View File

@ -1,2 +0,0 @@
Here's a [reference link][2] with a definition on the next line.
[2]: http://example.com

View File

@ -0,0 +1,11 @@
<blockquote>
<p>quote</p>
</blockquote>
<p>indented:</p>
<blockquote>
<p>quote</p>
</blockquote>
<p>no space after <code>&gt;</code>:</p>
<blockquote>
<p>quote</p>
</blockquote>

View File

@ -0,0 +1,7 @@
> quote
indented:
> quote
no space after `>`:
>quote

View File

@ -0,0 +1,3 @@
<p>an <b>important</b> <a href=''>link</a></p>
<p>broken<br/>
line</p>

View File

@ -0,0 +1,4 @@
an <b>important</b> <a href=''>link</a>
broken<br/>
line

View File

@ -1 +0,0 @@
<p>Here's an <b>important</b> <a href=''>link</a>.</p>

View File

@ -1 +0,0 @@
Here's an <b>important</b> <a href=''>link</a>.

View File

@ -0,0 +1,15 @@
<ul>
<li>
<p>li</p>
</li>
<li>li</li>
</ul>
<hr />
<ul>
<li>
<p>li</p>
<ul>
<li>indented li</li>
</ul>
</li>
</ul>

View File

@ -0,0 +1,9 @@
- li
- li
---
- li
- indented li

View File

@ -1,7 +1,8 @@
<p>AT&amp;T has an ampersand in their name.</p>
<p>AT&amp;T is another way to write it.</p>
<p>This &amp; that.</p>
<p>4 &lt; 5 and 6 > 5.</p>
<p>Here's an autolink <a href="http://example.com/autolink?a=1&amp;b=2">http://example.com/autolink?a=1&amp;b=2</a></p>
<p>Here's an inline <a href="/script?a=1&amp;b=2">link</a>.</p>
<p>Here's a reference <a href="http://example.com/?a=1&amp;b=2">link</a> with an ampersand in the URL.</p>
<p>AT&amp;T has an ampersand in their name</p>
<pre><code>Let's play some cards ♠ ♣ ♥ ♦</code></pre>
<p>AT&amp;T is another way to write it</p>
<p>this &amp; that</p>
<p>4 &lt; 5 and 6 > 5</p>
<p><a href="http://example.com/autolink?a=1&amp;b=2">http://example.com/autolink?a=1&amp;b=2</a> </p>
<p><a href="/script?a=1&amp;b=2">inline link</a></p>
<p><a href="http://example.com/?a=1&amp;b=2">reference link</a></p>

View File

@ -1,15 +1,17 @@
AT&T has an ampersand in their name.
AT&T has an ampersand in their name
AT&amp;T is another way to write it.
Let's play some cards ♠ ♣ ♥ ♦
This & that.
AT&T is another way to write it
4 < 5 and 6 > 5.
this & that
Here's an autolink <http://example.com/autolink?a=1&b=2>
4 < 5 and 6 > 5
Here's an inline [link](/script?a=1&b=2).
<http://example.com/autolink?a=1&b=2>
Here's a reference [link] [1] with an ampersand in the URL.
[inline link](/script?a=1&b=2)
[reference link][1]
[1]: http://example.com/?a=1&b=2

View File

@ -0,0 +1,3 @@
<p><del>strikethrough</del></p>
<p>in the <del>middle</del> of a sentence</p>
<p>in the middle of a w<del>or</del>d</p>

View File

@ -0,0 +1,5 @@
~~strikethrough~~
in the ~~middle~~ of a sentence
in the middle of a w~~or~~d

View File

@ -0,0 +1,6 @@
<p><a href="http://example.com">reference link</a></p>
<p><a href="http://example.com">one</a> with a semantic name</p>
<p>[one][404] with no definition</p>
<p><a href="http://example.com">multiline
one</a> defined on 2 lines</p>
<p><a href="http://example.com">one</a> with an upper case label</p>

View File

@ -0,0 +1,16 @@
[reference link][1]
[1]: http://example.com
[one][website] with a semantic name
[website]: http://example.com
[one][404] with no definition
[multiline
one][website] defined on 2 lines
[one][label] with an upper case label
[LABEL]: http://example.com

View File

@ -1,9 +1,8 @@
<p>Here's an unordered list:</p>
<ul>
<li>li</li>
<li>li</li>
</ul>
<p>Here's one with mixed markers:</p>
<p>mixed markers:</p>
<ul>
<li>li</li>
<li>li</li>

View File

@ -0,0 +1,8 @@
- li
- li
mixed markers:
* li
+ li
- li

View File

@ -0,0 +1 @@
<p>Here's an autolink <a href="http://example.com">http://example.com</a>.</p>

View File

@ -0,0 +1 @@
Here's an autolink http://example.com.

View File

@ -1 +1 @@
<pre><code>This text starts with a line that consists of 4 spaces and it ends with one. This is a code block to make sure that leading spaces don't get trimmed.</code></pre>
<pre><code>code</code></pre>

View File

@ -1,5 +1,5 @@
This text starts with a line that consists of 4 spaces and it ends with one. This is a code block to make sure that leading spaces don't get trimmed.
code