123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526 |
- <?php
- #
- #
- # Parsedown Extra
- # https://github.com/erusev/parsedown-extra
- #
- # (c) Emanuil Rusev
- # http://erusev.com
- #
- # For the full license information, view the LICENSE file that was distributed
- # with this source code.
- #
- #
- class ParsedownExtra extends Parsedown
- {
- # ~
- const version = '0.7.0';
- # ~
- function __construct()
- {
- if (parent::version < '1.5.0')
- {
- throw new Exception('ParsedownExtra requires a later version of Parsedown');
- }
- $this->BlockTypes[':'] []= 'DefinitionList';
- $this->BlockTypes['*'] []= 'Abbreviation';
- # identify footnote definitions before reference definitions
- array_unshift($this->BlockTypes['['], 'Footnote');
- # identify footnote markers before before links
- array_unshift($this->InlineTypes['['], 'FootnoteMarker');
- }
- #
- # ~
- function text($text)
- {
- $markup = parent::text($text);
- # merge consecutive dl elements
- $markup = preg_replace('/<\/dl>\s+<dl>\s+/', '', $markup);
- # add footnotes
- if (isset($this->DefinitionData['Footnote']))
- {
- $Element = $this->buildFootnoteElement();
- $markup .= "\n" . $this->element($Element);
- }
- return $markup;
- }
- #
- # Blocks
- #
- #
- # Abbreviation
- protected function blockAbbreviation($Line)
- {
- if (preg_match('/^\*\[(.+?)\]:[ ]*(.+?)[ ]*$/', $Line['text'], $matches))
- {
- $this->DefinitionData['Abbreviation'][$matches[1]] = $matches[2];
- $Block = array(
- 'hidden' => true,
- );
- return $Block;
- }
- }
- #
- # Footnote
- protected function blockFootnote($Line)
- {
- if (preg_match('/^\[\^(.+?)\]:[ ]?(.*)$/', $Line['text'], $matches))
- {
- $Block = array(
- 'label' => $matches[1],
- 'text' => $matches[2],
- 'hidden' => true,
- );
- return $Block;
- }
- }
- protected function blockFootnoteContinue($Line, $Block)
- {
- if ($Line['text'][0] === '[' and preg_match('/^\[\^(.+?)\]:/', $Line['text']))
- {
- return;
- }
- if (isset($Block['interrupted']))
- {
- if ($Line['indent'] >= 4)
- {
- $Block['text'] .= "\n\n" . $Line['text'];
- return $Block;
- }
- }
- else
- {
- $Block['text'] .= "\n" . $Line['text'];
- return $Block;
- }
- }
- protected function blockFootnoteComplete($Block)
- {
- $this->DefinitionData['Footnote'][$Block['label']] = array(
- 'text' => $Block['text'],
- 'count' => null,
- 'number' => null,
- );
- return $Block;
- }
- #
- # Definition List
- protected function blockDefinitionList($Line, $Block)
- {
- if ( ! isset($Block) or isset($Block['type']))
- {
- return;
- }
- $Element = array(
- 'name' => 'dl',
- 'handler' => 'elements',
- 'text' => array(),
- );
- $terms = explode("\n", $Block['element']['text']);
- foreach ($terms as $term)
- {
- $Element['text'] []= array(
- 'name' => 'dt',
- 'handler' => 'line',
- 'text' => $term,
- );
- }
- $Block['element'] = $Element;
- $Block = $this->addDdElement($Line, $Block);
- return $Block;
- }
- protected function blockDefinitionListContinue($Line, array $Block)
- {
- if ($Line['text'][0] === ':')
- {
- $Block = $this->addDdElement($Line, $Block);
- return $Block;
- }
- else
- {
- if (isset($Block['interrupted']) and $Line['indent'] === 0)
- {
- return;
- }
- if (isset($Block['interrupted']))
- {
- $Block['dd']['handler'] = 'text';
- $Block['dd']['text'] .= "\n\n";
- unset($Block['interrupted']);
- }
- $text = substr($Line['body'], min($Line['indent'], 4));
- $Block['dd']['text'] .= "\n" . $text;
- return $Block;
- }
- }
- #
- # Header
- protected function blockHeader($Line)
- {
- $Block = parent::blockHeader($Line);
- if (preg_match('/[ #]*{('.$this->regexAttribute.'+)}[ ]*$/', $Block['element']['text'], $matches, PREG_OFFSET_CAPTURE))
- {
- $attributeString = $matches[1][0];
- $Block['element']['attributes'] = $this->parseAttributeData($attributeString);
- $Block['element']['text'] = substr($Block['element']['text'], 0, $matches[0][1]);
- }
- return $Block;
- }
- #
- # Markup
- protected function blockMarkupComplete($Block)
- {
- if ( ! isset($Block['void']))
- {
- $Block['markup'] = $this->processTag($Block['markup']);
- }
- return $Block;
- }
- #
- # Setext
- protected function blockSetextHeader($Line, array $Block = null)
- {
- $Block = parent::blockSetextHeader($Line, $Block);
- if (preg_match('/[ ]*{('.$this->regexAttribute.'+)}[ ]*$/', $Block['element']['text'], $matches, PREG_OFFSET_CAPTURE))
- {
- $attributeString = $matches[1][0];
- $Block['element']['attributes'] = $this->parseAttributeData($attributeString);
- $Block['element']['text'] = substr($Block['element']['text'], 0, $matches[0][1]);
- }
- return $Block;
- }
- #
- # Inline Elements
- #
- #
- # Footnote Marker
- protected function inlineFootnoteMarker($Excerpt)
- {
- if (preg_match('/^\[\^(.+?)\]/', $Excerpt['text'], $matches))
- {
- $name = $matches[1];
- if ( ! isset($this->DefinitionData['Footnote'][$name]))
- {
- return;
- }
- $this->DefinitionData['Footnote'][$name]['count'] ++;
- if ( ! isset($this->DefinitionData['Footnote'][$name]['number']))
- {
- $this->DefinitionData['Footnote'][$name]['number'] = ++ $this->footnoteCount; # » &
- }
- $Element = array(
- 'name' => 'sup',
- 'attributes' => array('id' => 'fnref'.$this->DefinitionData['Footnote'][$name]['count'].':'.$name),
- 'handler' => 'element',
- 'text' => array(
- 'name' => 'a',
- 'attributes' => array('href' => '#fn:'.$name, 'class' => 'footnote-ref'),
- 'text' => $this->DefinitionData['Footnote'][$name]['number'],
- ),
- );
- return array(
- 'extent' => strlen($matches[0]),
- 'element' => $Element,
- );
- }
- }
- private $footnoteCount = 0;
- #
- # Link
- protected function inlineLink($Excerpt)
- {
- $Link = parent::inlineLink($Excerpt);
- $remainder = substr($Excerpt['text'], $Link['extent']);
- if (preg_match('/^[ ]*{('.$this->regexAttribute.'+)}/', $remainder, $matches))
- {
- $Link['element']['attributes'] += $this->parseAttributeData($matches[1]);
- $Link['extent'] += strlen($matches[0]);
- }
- return $Link;
- }
- #
- # ~
- #
- protected function unmarkedText($text)
- {
- $text = parent::unmarkedText($text);
- if (isset($this->DefinitionData['Abbreviation']))
- {
- foreach ($this->DefinitionData['Abbreviation'] as $abbreviation => $meaning)
- {
- $pattern = '/\b'.preg_quote($abbreviation, '/').'\b/';
- $text = preg_replace($pattern, '<abbr title="'.$meaning.'">'.$abbreviation.'</abbr>', $text);
- }
- }
- return $text;
- }
- #
- # Util Methods
- #
- protected function addDdElement(array $Line, array $Block)
- {
- $text = substr($Line['text'], 1);
- $text = trim($text);
- unset($Block['dd']);
- $Block['dd'] = array(
- 'name' => 'dd',
- 'handler' => 'line',
- 'text' => $text,
- );
- if (isset($Block['interrupted']))
- {
- $Block['dd']['handler'] = 'text';
- unset($Block['interrupted']);
- }
- $Block['element']['text'] []= & $Block['dd'];
- return $Block;
- }
- protected function buildFootnoteElement()
- {
- $Element = array(
- 'name' => 'div',
- 'attributes' => array('class' => 'footnotes'),
- 'handler' => 'elements',
- 'text' => array(
- array(
- 'name' => 'hr',
- ),
- array(
- 'name' => 'ol',
- 'handler' => 'elements',
- 'text' => array(),
- ),
- ),
- );
- uasort($this->DefinitionData['Footnote'], 'self::sortFootnotes');
- foreach ($this->DefinitionData['Footnote'] as $definitionId => $DefinitionData)
- {
- if ( ! isset($DefinitionData['number']))
- {
- continue;
- }
- $text = $DefinitionData['text'];
- $text = parent::text($text);
- $numbers = range(1, $DefinitionData['count']);
- $backLinksMarkup = '';
- foreach ($numbers as $number)
- {
- $backLinksMarkup .= ' <a href="#fnref'.$number.':'.$definitionId.'" rev="footnote" class="footnote-backref">↩</a>';
- }
- $backLinksMarkup = substr($backLinksMarkup, 1);
- if (substr($text, - 4) === '</p>')
- {
- $backLinksMarkup = ' '.$backLinksMarkup;
- $text = substr_replace($text, $backLinksMarkup.'</p>', - 4);
- }
- else
- {
- $text .= "\n".'<p>'.$backLinksMarkup.'</p>';
- }
- $Element['text'][1]['text'] []= array(
- 'name' => 'li',
- 'attributes' => array('id' => 'fn:'.$definitionId),
- 'text' => "\n".$text."\n",
- );
- }
- return $Element;
- }
- # ~
- protected function parseAttributeData($attributeString)
- {
- $Data = array();
- $attributes = preg_split('/[ ]+/', $attributeString, - 1, PREG_SPLIT_NO_EMPTY);
- foreach ($attributes as $attribute)
- {
- if ($attribute[0] === '#')
- {
- $Data['id'] = substr($attribute, 1);
- }
- else # "."
- {
- $classes []= substr($attribute, 1);
- }
- }
- if (isset($classes))
- {
- $Data['class'] = implode(' ', $classes);
- }
- return $Data;
- }
- # ~
- protected function processTag($elementMarkup) # recursive
- {
- # http://stackoverflow.com/q/1148928/200145
- libxml_use_internal_errors(true);
- $DOMDocument = new DOMDocument;
- # http://stackoverflow.com/q/11309194/200145
- $elementMarkup = mb_convert_encoding($elementMarkup, 'HTML-ENTITIES', 'UTF-8');
- # http://stackoverflow.com/q/4879946/200145
- $DOMDocument->loadHTML($elementMarkup);
- $DOMDocument->removeChild($DOMDocument->doctype);
- $DOMDocument->replaceChild($DOMDocument->firstChild->firstChild->firstChild, $DOMDocument->firstChild);
- $elementText = '';
- if ($DOMDocument->documentElement->getAttribute('markdown') === '1')
- {
- foreach ($DOMDocument->documentElement->childNodes as $Node)
- {
- $elementText .= $DOMDocument->saveHTML($Node);
- }
- $DOMDocument->documentElement->removeAttribute('markdown');
- $elementText = "\n".$this->text($elementText)."\n";
- }
- else
- {
- foreach ($DOMDocument->documentElement->childNodes as $Node)
- {
- $nodeMarkup = $DOMDocument->saveHTML($Node);
- if ($Node instanceof DOMElement and ! in_array($Node->nodeName, $this->textLevelElements))
- {
- $elementText .= $this->processTag($nodeMarkup);
- }
- else
- {
- $elementText .= $nodeMarkup;
- }
- }
- }
- # because we don't want for markup to get encoded
- $DOMDocument->documentElement->nodeValue = 'placeholder\x1A';
- $markup = $DOMDocument->saveHTML($DOMDocument->documentElement);
- $markup = str_replace('placeholder\x1A', $elementText, $markup);
- return $markup;
- }
- # ~
- protected function sortFootnotes($A, $B) # callback
- {
- return $A['number'] - $B['number'];
- }
- #
- # Fields
- #
- protected $regexAttribute = '(?:[#.][-\w]+[ ]*)';
- }
|