', '\#', '\+', '\-', '\.', '\!'); foreach ($escape_sequences as $index => $escape_sequence) { if (strpos($text, $escape_sequence) !== FALSE) { $code = "\x1A".'\\'.$index; $text = str_replace($escape_sequence, $code, $text); $this->escape_sequence_map[$code] = $escape_sequence; } } } # Extracts link references. if (preg_match_all('/^[ ]{0,3}\[(.+)\][ ]?:[ ]*\n?[ ]*(.+)$/m', $text, $matches, PREG_SET_ORDER)) { foreach ($matches as $matches) { $this->reference_map[strtolower($matches[1])] = $matches[2]; $text = str_replace($matches[0], '', $text); } } # ~ $text = preg_replace('/\n\s*\n/', "\n\n", $text); $text = trim($text, "\n"); $lines = explode("\n", $text); $text = $this->parse_block_elements($lines); # Decodes escape sequences (leaves out backslashes). foreach ($this->escape_sequence_map as $code => $escape_sequence) { $text = str_replace($code, $escape_sequence[1], $text); } $text = rtrim($text, "\n"); return $text; } # # Private Methods # private function parse_block_elements(array $lines, $context = '') { $elements = array(); $element = array( 'type' => '', ); foreach ($lines as $line) { # Empty if ($line === '') { $element['interrupted'] = true; $element['type'] === 'code' and $element['text'] .= "\n"; continue; } # Lazy Blockquote if ($element['type'] === 'blockquote' and ! isset($element['interrupted'])) { $line = preg_replace('/^[ ]*>[ ]?/', '', $line); $element['lines'] []= $line; continue; } # Lazy List Item if ($element['type'] === 'li') { if (preg_match('/^([ ]{0,3})(\d+[.]|[*+-])[ ](.*)/', $line, $matches)) { if ($element['indentation'] !== $matches[1]) { $element['lines'] []= $line; } else { unset($element['last']); $elements []= $element; $element = array( 'type' => 'li', 'indentation' => $matches[1], 'last' => true, 'lines' => array( preg_replace('/^[ ]{0,4}/', '', $matches[3]), ), ); } continue; } if (isset($element['interrupted'])) { if ($line[0] === ' ') { $element['lines'] []= ''; $line = preg_replace('/^[ ]{0,4}/', '', $line);; $element['lines'] []= $line; continue; } } else { $line = preg_replace('/^[ ]{0,4}/', '', $line);; $element['lines'] []= $line; continue; } } # Quick Paragraph if ($line[0] >= 'A' and $line['0'] !== '_') { goto paragraph; # trust me } # Setext Header (---) if ($element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[-]+[ ]*$/', $line)) { $element['type'] = 'h.'; $element['level'] = 2; continue; } # Horizontal Rule if (preg_match('/^[ ]{0,3}([-*_])([ ]{0,2}\1){2,}[ ]*$/', $line)) { $elements []= $element; $element = array( 'type' => 'hr', ); continue; } # List Item if (preg_match('/^([ ]{0,3})(\d+[.]|[*+-])[ ](.*)/', $line, $matches)) { $elements []= $element; $element = array( 'type' => 'li', 'ordered' => isset($matches[2][1]), 'indentation' => $matches[1], 'last' => true, 'lines' => array( preg_replace('/^[ ]{0,4}/', '', $matches[3]), ), ); continue; } # Code if (preg_match('/^[ ]{4}(.*)/', $line, $matches)) { if ($element['type'] === 'code') { $element['text'] .= "\n".$matches[1]; } else { $elements []= $element; $element = array( 'type' => 'code', 'text' => $matches[1], ); } continue; } # Atx Header (#) if ($line[0] === '#' and preg_match('/^(#{1,6})[ ]*(.+?)[ ]*#*$/', $line, $matches)) { $elements []= $element; $level = strlen($matches[1]); $element = array( 'type' => 'h.', 'text' => $matches[2], 'level' => $level, ); continue; } # Blockquote if (preg_match('/^[ ]*>[ ]?(.*)/', $line, $matches)) { if ($element['type'] === 'blockquote') { if (isset($element['interrupted'])) { $element['lines'] []= ''; unset($element['interrupted']); } $element['lines'] []= $matches[1]; } else { $elements []= $element; $element = array( 'type' => 'blockquote', 'lines' => array( $matches[1], ), ); } continue; } # Setext Header (===) if ($element['type'] === 'p' and ! isset($element['interrupted']) and preg_match('/^[=]+[ ]*$/', $line)) { $element['type'] = 'h.'; $element['level'] = 1; continue; } # ~ paragraph: if ($element['type'] === 'p') { if (isset($element['interrupted'])) { $elements []= $element; $element['text'] = $line; unset($element['interrupted']); } else { $element['text'] .= "\n".$line; } } else { $elements []= $element; $element = array( 'type' => 'p', 'text' => $line, ); } } $elements []= $element; array_shift($elements); # # ~ # $markup = ''; foreach ($elements as $index => $element) { switch ($element['type']) { case 'li': if (isset($element['ordered'])) # first { $list_type = $element['ordered'] ? 'ol' : 'ul'; $markup .= '<'.$list_type.'>'."\n"; } if (isset($element['interrupted']) and ! isset($element['last'])) { $element['lines'] []= ''; } $text = $this->parse_block_elements($element['lines'], 'li'); $markup .= '
'.$text.'
'."\n"; } else { $markup .= $text; } } else { $markup .= ''.$text.'
'."\n"; } break; case 'code': $text = rtrim($element['text'], "\n"); $text = htmlentities($text, ENT_NOQUOTES); strpos($text, "\x1A\\") !== FALSE and $text = strtr($text, $this->escape_sequence_map); $markup .= ''.$text.'
'."\n";
break;
case 'blockquote':
$text = $this->parse_block_elements($element['lines']);
$markup .= ''."\n".$text.''."\n"; break; case 'h.': $text = $this->parse_inline_elements($element['text']); $markup .= '
'.$element_text.'
';
# Encodes element.
$code = "\x1A".'$'.$index;
$text = str_replace($matches[0], $code, $text);
$map[$code] = $element;
$index ++;
}
}
# Inline Link / Image
if (strpos($text, '](') !== FALSE and preg_match_all('/(!?)(\[((?:[^][]+|(?2))*)\])\((.*?)\)/', $text, $matches, PREG_SET_ORDER)) # inline
{
foreach ($matches as $matches)
{
if ($matches[1]) # image
{
$element = '';
}
else
{
$element_text = $this->parse_inline_elements($matches[3]);
$element = ''.$element_text.'';
}
# ~
$code = "\x1A".'$'.$index;
$text = str_replace($matches[0], $code, $text);
$map[$code] = $element;
$index ++;
}
}
# Reference(d) Link / Image
if ($this->reference_map and strpos($text, '[') !== FALSE and preg_match_all('/(!?)\[(.+?)\](?:\n?[ ]?\[(.*?)\])?/ms', $text, $matches, PREG_SET_ORDER))
{
foreach ($matches as $matches)
{
$link_definition = isset($matches[3]) && $matches[3]
? $matches[3]
: $matches[2]; # implicit
$link_definition = strtolower($link_definition);
if (isset($this->reference_map[$link_definition]))
{
$url = $this->reference_map[$link_definition];
if ($matches[1]) # image
{
$element = '';
}
else # anchor
{
$element_text = $this->parse_inline_elements($matches[2]);
$element = ''.$element_text.'';
}
# ~
$code = "\x1A".'$'.$index;
$text = str_replace($matches[0], $code, $text);
$map[$code] = $element;
$index ++;
}
}
}
if (strpos($text, '<') !== FALSE and preg_match_all('/<((https?|ftp|dict):[^\^\s]+?)>/i', $text, $matches, PREG_SET_ORDER))
{
foreach ($matches as $matches)
{
$element = ':text';
$element = str_replace(':text', $matches[1], $element);
$element = str_replace(':href', $matches[1], $element);
# ~
$code = "\x1A".'$'.$index;
$text = str_replace($matches[0], $code, $text);
$map[$code] = $element;
$index ++;
}
}
if (strpos($text, '_') !== FALSE)
{
$text = preg_replace('/__(?=\S)(.+?)(?<=\S)__/', '$1', $text);
$text = preg_replace('/_(?=\S)(.+?)(?<=\S)_/', '$1', $text);
}
if (strpos($text, '*') !== FALSE)
{
$text = preg_replace('/\*\*(?=\S)(.+?)(?<=\S)\*\*/', '$1', $text);
$text = preg_replace('/\*(?=\S)(.+?)(?<=\S)\*/', '$1', $text);
}
$text = strtr($text, $map);
return $text;
}
}