<?php
/**
 * @copyright Copyright (c) 2014 Carsten Brandt
 * @license https://github.com/cebe/markdown/blob/master/LICENSE
 * @link https://github.com/cebe/markdown#readme
 */

namespace cebe\markdown\latex;

use cebe\markdown\block\CodeTrait;
use cebe\markdown\block\HeadlineTrait;
use cebe\markdown\block\ListTrait;
use cebe\markdown\block\QuoteTrait;
use cebe\markdown\block\RuleTrait;
use cebe\markdown\inline\CodeTrait as InlineCodeTrait;
use cebe\markdown\inline\EmphStrongTrait;
use cebe\markdown\inline\LinkTrait;
use MikeVanRiel\TextToLatex;

/**
 * Markdown parser for the [initial markdown spec](http://daringfireball.net/projects/markdown/syntax).
 *
 * The render methods of this class produce LaTeX markup instead of HTML.
 *
 * @author Carsten Brandt <mail@cebe.cc>
 */
class Markdown extends \cebe\markdown\Parser
{
	// include block element parsing using traits
	use CodeTrait;
	use HeadlineTrait;
	use ListTrait {
		// Check Ul List before headline
		identifyUl as protected identifyBUl;
		consumeUl as protected consumeBUl;
	}
	use QuoteTrait;
	use RuleTrait {
		// Check Hr before checking lists
		identifyHr as protected identifyAHr;
		consumeHr as protected consumeAHr;
	}

	// include inline element parsing using traits
	use InlineCodeTrait;
	use EmphStrongTrait;
	use LinkTrait;

	/**
	 * @var string this string will be prefixed to all auto generated labels.
	 * This can be used to disambiguate labels when combining multiple markdown files into one document.
	 */
	public $labelPrefix = '';

	const LINK_STYLE_FOOTNOTE = 'footnote';
	const LINK_STYLE_HREF = 'href';

	/**
	 * @var string link style defines how links are rendered in LaTeX, there are two different options:
	 *
	 * - `footnote` (default) - render all links with a footnote, which contains the full URL of the link. This is good for printing the PDF.
	 * - `href` - render all links with a hyperref, similar to HTML, the link target is not visible in this case.
	 */
	public $linkStyle = self::LINK_STYLE_FOOTNOTE;

	/**
	 * @var array these are "escapeable" characters. When using one of these prefixed with a
	 * backslash, the character will be outputted without the backslash and is not interpreted
	 * as markdown.
	 */
	protected $escapeCharacters = [
		'\\', // backslash
		'`', // backtick
		'*', // asterisk
		'_', // underscore
		'{', '}', // curly braces
		'[', ']', // square brackets
		'(', ')', // parentheses
		'#', // hash mark
		'+', // plus sign
		'-', // minus sign (hyphen)
		'.', // dot
		'!', // exclamation mark
		'<', '>',
	];

	/**
	 * @inheritDoc
	 */
	protected function prepare()
	{
		// reset references
		$this->references = [];
	}

	/**
	 * Consume lines for a paragraph
	 *
	 * Allow headlines and code to break paragraphs
	 *
	 * @param string[] $lines all lines of the document being parsed.
	 * @param int $current index of the first line of the paragraph.
	 * @return array the paragraph block and the index of the last consumed line.
	 */
	protected function consumeParagraph($lines, $current)
	{
		$content = [];
		for ($i = $current, $count = count($lines); $i < $count; $i++) {
			$line = $lines[$i];

			// A blank line ends the paragraph. Compare against '' explicitly:
			// empty() would also treat a line consisting of "0" as blank.
			if ($line === '' || ltrim($line) === '') {
				break;
			}
			// a leading tab or four leading spaces end the paragraph (code indentation)
			if ($line[0] === "\t" || $line[0] === " " && strncmp($line, '    ', 4) === 0) {
				break;
			}
			// a headline ends the paragraph as well
			if ($this->identifyHeadline($line, $lines, $i)) {
				break;
			}

			$content[] = $line;
		}

		$block = [
			'paragraph',
			'content' => $this->parseInline(implode("\n", $content)),
		];
		// $i points at the first line that is not part of the paragraph
		return [$block, --$i];
	}


	// rendering adjusted for LaTeX output


	/**
	 * @inheritdoc
	 *
	 * A paragraph is terminated by an empty line in the LaTeX output.
	 */
	protected function renderParagraph($block)
	{
		return $this->renderAbsy($block['content']) . "\n\n";
	}

	/**
	 * @inheritdoc
	 *
	 * Wraps the rendered content in a `quote` environment.
	 */
	protected function renderQuote($block)
	{
		return '\begin{quote}' . $this->renderAbsy($block['content']) . "\\end{quote}\n";
	}

	/**
	 * @inheritdoc
	 *
	 * Renders a `lstlisting` environment, preceded by a `\lstset` that selects
	 * the block language (or resets it when the block has none).
	 */
	protected function renderCode($block)
	{
		$language = isset($block['language']) ? "\\lstset{language={$block['language']}}" : '\lstset{language={}}';

		// replace No-Break Space characters in code block, which do not render in LaTeX
		$content = $this->replaceNoBreakSpaces($block['content']);

		return "$language\\begin{lstlisting}\n{$content}\n\\end{lstlisting}\n";
	}

	/**
	 * @inheritdoc
	 *
	 * Ordered lists become `enumerate`, all other lists `itemize`.
	 */
	protected function renderList($block)
	{
		$type = ($block['list'] === 'ol') ? 'enumerate' : 'itemize';

		$output = "\\begin{{$type}}\n";
		foreach ($block['items'] as $itemLines) {
			$output .= '\item ' . $this->renderAbsy($itemLines) . "\n";
		}
		return "$output\\end{{$type}}\n";
	}

	/**
	 * @inheritdoc
	 *
	 * Levels 1 to 3 map to `\section`, `\subsection` and `\subsubsection`,
	 * every other level is rendered as `\paragraph`.
	 */
	protected function renderHeadline($block)
	{
		$content = $this->renderAbsy($block['content']);
		switch ($block['level']) {
			case 1:
				return "\\section{{$content}}\n";
			case 2:
				return "\\subsection{{$content}}\n";
			case 3:
				return "\\subsubsection{{$content}}\n";
			default:
				return "\\paragraph{{$content}}\n";
		}
	}

	/**
	 * @inheritdoc
	 *
	 * Renders a horizontal rule spanning the text width.
	 */
	protected function renderHr($block)
	{
		return "\n\\noindent\\rule{\\textwidth}{0.4pt}\n";
	}

	/**
	 * @inheritdoc
	 *
	 * URLs without a scheme (`://`) are rendered as `\hyperref` to a label in the document.
	 * All other URLs are rendered according to [[linkStyle]].
	 */
	protected function renderLink($block)
	{
		if (isset($block['refkey'])) {
			if (($ref = $this->lookupReference($block['refkey'])) !== false) {
				$block = array_merge($block, $ref);
			} else {
				// unknown reference, output the original markdown
				return $block['orig'];
			}
		}

		$url = $block['url'];
		$text = $this->renderAbsy($block['text']);

		if (strpos($url, '://') === false) {
			// consider all non absolute links as relative in the document
			// $title is ignored in this case.
			if (isset($url[0]) && $url[0] === '#') {
				$url = $this->labelPrefix . $url;
			}
			return '\hyperref[' . str_replace('#', '::', $url) . ']{' . $text . '}';
		}

		if ($this->linkStyle === self::LINK_STYLE_HREF) {
			return '\href{' . $this->escapeUrl($url) . '}{' . $text . '}';
		}

		// footnote style: link text followed by a footnote with optional title and the URL
		$title = empty($block['title']) ? '' : $this->escapeLatex($block['title']) . ': ';
		return $text . '\\footnote{' . $title . '\url{' . $this->escapeUrl($url) . '}}';
	}

	/**
	 * @inheritdoc
	 *
	 * Renders the image with `\includegraphics` scaled to the text width.
	 */
	protected function renderImage($block)
	{
		if (isset($block['refkey'])) {
			if (($ref = $this->lookupReference($block['refkey'])) !== false) {
				$block = array_merge($block, $ref);
			} else {
				// unknown reference, output the original markdown
				return $block['orig'];
			}
		}

		// TODO create figure with caption with title
		$replaces = [
			'%' => '\\%',
			'{' => '\\%7B',
			'}' => '\\%7D',
			'\\' => '\\\\',
			'#' => '\\#',
			'$' => '\\%24',
		];
		// strtr() replaces all keys in a single pass. str_replace() with arrays works
		// sequentially, so the backslash rule would double the backslashes that were
		// just inserted by the rules for '%', '{' and '}'.
		$url = strtr($block['url'], $replaces);

		return "\\noindent\\includegraphics[width=\\textwidth]{{$url}}";
	}

	/**
	 * Parses `<a name="..."></a>` tags as reference labels.
	 *
	 * The pattern accepts `a` and `span` tags carrying a `name` or `id` attribute.
	 *
	 * NOTE(review): this method has no `@marker` annotation, so it is presumably
	 * called from the `<` handling of one of the included traits - confirm.
	 *
	 * @param string $text the text to parse, starting at the `<` character.
	 * @return array the parsed element and the number of consumed characters.
	 */
	private function parseInlineHtml($text)
	{
		// convert a name markers to \labels
		if (strpos($text, '>') !== false
			&& preg_match('~^<((a|span)) (name|id)="(.*?)">.*?</\1>~i', $text, $matches)
		) {
			return [
				['label', 'name' => str_replace('#', '::', $this->labelPrefix . $matches[4])],
				strlen($matches[0])
			];
		}
		// not a label, treat the `<` as plain text
		return [['text', '<'], 1];
	}

	/**
	 * renders a reference label
	 */
	protected function renderLabel($block)
	{
		return "\\label{{$block['name']}}";
	}

	/**
	 * @inheritdoc
	 *
	 * Renders a `mailto:` link that shows the address itself.
	 */
	protected function renderEmail($block)
	{
		$email = $this->escapeUrl($block[1]);
		return "\\href{mailto:{$email}}{{$email}}";
	}

	/**
	 * @inheritdoc
	 */
	protected function renderUrl($block)
	{
		return '\url{' . $this->escapeUrl($block[1]) . '}';
	}

	/**
	 * @inheritdoc
	 *
	 * Renders the code with `\lstinline`, delimited by a character that does not occur in the code.
	 */
	protected function renderInlineCode($block)
	{
		// replace No-Break Space characters in inline code, which do not render in LaTeX
		$content = $this->replaceNoBreakSpaces($block[1]);
		// inline code is rendered on a single line
		$content = str_replace("\n", ' ', $content);

		// Use the first candidate that is not part of the code. `|` and the backtick
		// come first to keep the output of previous versions. If every candidate occurs
		// in the code, fall back to the backtick.
		$delimiter = '`';
		foreach (['|', '`', '!', '+', '/', '='] as $candidate) {
			if (strpos($content, $candidate) === false) {
				$delimiter = $candidate;
				break;
			}
		}

		return '\\lstinline' . $delimiter . $content . $delimiter;
	}

	/**
	 * @inheritdoc
	 */
	protected function renderStrong($block)
	{
		return '\textbf{' . $this->renderAbsy($block[1]) . '}';
	}

	/**
	 * @inheritdoc
	 */
	protected function renderEmph($block)
	{
		return '\textit{' . $this->renderAbsy($block[1]) . '}';
	}

	/**
	 * Parses escaped special characters.
	 * This allow a backslash to be interpreted as LaTeX
	 * @marker \
	 */
	protected function parseEscape($text)
	{
		if (isset($text[1]) && in_array($text[1], $this->escapeCharacters, true)) {
			if ($text[1] === '\\') {
				// an escaped backslash is rendered by renderBackslash()
				return [['backslash'], 2];
			}
			return [['text', $text[1]], 2];
		}
		// not an escape sequence, keep the backslash as text
		return [['text', $text[0]], 1];
	}

	/**
	 * Renders an escaped backslash as a single backslash character.
	 */
	protected function renderBackslash()
	{
		return '\\';
	}

	/**
	 * @var TextToLatex|null lazily created by [[escapeLatex()]].
	 */
	private $_escaper;

	/**
	 * Escape special characters in URLs
	 *
	 * Applies [[escapeLatex()]] and escapes `%` afterwards.
	 */
	protected function escapeUrl($string)
	{
		return str_replace('%', '\\%', $this->escapeLatex($string));
	}

	/**
	 * Escape special LaTeX characters
	 */
	protected function escapeLatex($string)
	{
		if ($this->_escaper === null) {
			$this->_escaper = new TextToLatex();
		}
		return $this->_escaper->convert($string);
	}

	/**
	 * Replaces No-Break Space (U+00A0) and Narrow No-Break Space (U+202F) with regular spaces.
	 *
	 * Works on the UTF-8 byte sequences of these characters, so the input is returned
	 * unchanged apart from the replacements even if it is not valid UTF-8.
	 *
	 * @param string $code the code to clean up.
	 * @return string the code with regular spaces.
	 */
	private function replaceNoBreakSpaces($code)
	{
		return str_replace(["\xC2\xA0", "\xE2\x80\xAF"], ' ', $code);
	}

	/**
	 * @inheritdoc
	 *
	 * Parses a newline indicated by two spaces on the end of a markdown line.
	 */
	protected function renderText($text)
	{
		$output = str_replace("  \n", "\\\\\n", $this->escapeLatex($text[1]));

		// support No-Break Space (U+00A0) in LaTeX
		$output = str_replace("\xC2\xA0", '~', $output);

		// support Narrow No-Break Space (U+202F) in LaTeX
		// http://unicode-table.com/en/202F/
		// http://tex.stackexchange.com/questions/76132/how-to-typeset-a-small-non-breaking-space
		$output = str_replace("\xE2\x80\xAF", '\nobreak\hspace{.16667em plus .08333em}', $output);

		return $output;
	}
}