123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129 |
- <?php
- /**
- * @copyright Copyright (c) 2014 Carsten Brandt
- * @license https://github.com/cebe/markdown/blob/master/LICENSE
- * @link https://github.com/cebe/markdown#readme
- */
- namespace cebe\markdown;
- /**
- * Markdown parser for the [initial markdown spec](http://daringfireball.net/projects/markdown/syntax).
- *
- * @author Carsten Brandt <mail@cebe.cc>
- */
- class Markdown extends Parser
- {
- // include block element parsing using traits
- use block\CodeTrait;
- use block\HeadlineTrait;
- use block\HtmlTrait {
- parseInlineHtml as private;
- }
- use block\ListTrait {
- // Check Ul List before headline
- identifyUl as protected identifyBUl;
- consumeUl as protected consumeBUl;
- }
- use block\QuoteTrait;
- use block\RuleTrait {
- // Check Hr before checking lists
- identifyHr as protected identifyAHr;
- consumeHr as protected consumeAHr;
- }
- // include inline element parsing using traits
- use inline\CodeTrait;
- use inline\EmphStrongTrait;
- use inline\LinkTrait;
- /**
- * @var boolean whether to format markup according to HTML5 spec.
- * Defaults to `false` which means that markup is formatted as HTML4.
- */
- public $html5 = false;
- /**
- * @var array these are "escapeable" characters. When using one of these prefixed with a
- * backslash, the character will be outputted without the backslash and is not interpreted
- * as markdown.
- */
- protected $escapeCharacters = [
- '\\', // backslash
- '`', // backtick
- '*', // asterisk
- '_', // underscore
- '{', '}', // curly braces
- '[', ']', // square brackets
- '(', ')', // parentheses
- '#', // hash mark
- '+', // plus sign
- '-', // minus sign (hyphen)
- '.', // dot
- '!', // exclamation mark
- '<', '>',
- ];
- /**
- * @inheritDoc
- */
- protected function prepare()
- {
- // reset references
- $this->references = [];
- }
- /**
- * Consume lines for a paragraph
- *
- * Allow headlines and code to break paragraphs
- */
- protected function consumeParagraph($lines, $current)
- {
- // consume until newline
- $content = [];
- for ($i = $current, $count = count($lines); $i < $count; $i++) {
- $line = $lines[$i];
- // a list may break a paragraph when it is inside of a list
- if (isset($this->context[1]) && $this->context[1] === 'list' && !ctype_alpha($line[0]) && (
- $this->identifyUl($line, $lines, $i) || $this->identifyOl($line, $lines, $i))) {
- break;
- }
- if ($line === '' || ltrim($line) === '' || $this->identifyHeadline($line, $lines, $i)) {
- break;
- } elseif ($line[0] === "\t" || $line[0] === " " && strncmp($line, ' ', 4) === 0) {
- // possible beginning of a code block
- // but check for continued inline HTML
- // e.g. <img src="file.jpg"
- // alt="some alt aligned with src attribute" title="some text" />
- if (preg_match('~<\w+([^>]+)$~s', implode("\n", $content))) {
- $content[] = $line;
- } else {
- break;
- }
- } else {
- $content[] = $line;
- }
- }
- $block = [
- 'paragraph',
- 'content' => $this->parseInline(implode("\n", $content)),
- ];
- return [$block, --$i];
- }
- /**
- * @inheritdocs
- *
- * Parses a newline indicated by two spaces on the end of a markdown line.
- */
- protected function renderText($text)
- {
- return str_replace(" \n", $this->html5 ? "<br>\n" : "<br />\n", $text[1]);
- }
- }
|