path = $path; } /** * Retrieve doc as HTML converted from markdown files sorted by filename and the table of contents * * @return array * @throws DocException */ public function getDocAndToc() { $iter = new RecursiveIteratorIterator( new MarkdownFileIterator( new RecursiveDirectoryIterator($this->path) ) ); $fileInfos = iterator_to_array($iter); natcasesort($fileInfos); $cat = array(); $toc = array((object) array( 'level' => 0, 'item' => new Menu('doc') )); $itemPriority = 1; foreach ($fileInfos as $fileInfo) { try { $fileObject = $fileInfo->openFile(); } catch (RuntimeException $e) { throw new DocException($e->getMessage()); } if ($fileObject->flock(LOCK_SH) === false) { throw new DocException('Couldn\'t get the lock'); } $line = null; while (! $fileObject->eof()) { // Save last line for setext-style headers $lastLine = $line; $line = $fileObject->fgets(); $header = $this->extractHeader($line, $lastLine); if ($header !== null) { list($header, $level) = $header; $id = $this->extractHeaderId($header); $nofollow = false; $this->reduceToc($toc, $level); if ($id === null) { $path = array(); foreach (array_slice($toc, 1) as $entry) { $path[] = $entry->item->getTitle(); } $path[] = $header; $id = implode('-', $path); $nofollow = true; } $id = urlencode(str_replace('.', '.', strip_tags($id))); $item = end($toc)->item->addChild( $id, array( 'id' => $id, 'title' => $header, 'priority' => $itemPriority++, // Post-increment is on purpose 'nofollow' => $nofollow ) ); $toc[] = ((object) array( 'level' => $level, 'item' => $item )); $line = '' . PHP_EOL . $line; } $cat[] = $line; } $fileObject->flock(LOCK_UN); } $html = Parsedown::instance()->text(implode('', $cat)); $html = preg_replace_callback( '#
(.*?)\
#s', array($this, 'highlight'), $html ); return array($html, $toc[0]->item); } /** * Syntax highlighting for PHP code * * @param $match * * @return string */ protected function highlight($match) { return highlight_string(htmlspecialchars_decode($match[1]), true); } /** * Extract atx- or setext-style headers from the given lines * * @param string $line * @param string $lastLine * * @return array|null An array containing the header and the header level or null if there's nothing to extract */ protected function extractHeader($line, $lastLine) { if (! $line) { return null; } $header = null; if ($line && $line[0] === '#' && preg_match('/^#+/', $line, $match) === 1 ) { // Atx-style $level = strlen($match[0]); $header = trim(substr($line, $level)); if (! $header) { return null; } } elseif ( $line && ($line[0] === '=' || $line[0] === '-') && preg_match('/^[=-]+\s*$/', $line, $match) === 1 ) { // Setext $header = trim($lastLine); if (! $header) { return null; } if ($match[0][0] === '=') { $level = 1; } else { $level = 2; } } if ($header === null) { return null; } return array($header, $level); } /** * Extract header id in an a or a span tag * * @param string &$header * * @return id|null */ protected function extractHeaderId(&$header) { if ($header[0] === '<' && preg_match('#(?:<(?Pa|span) id="(?P.+)">)#u', $header, $match) ) { $header = str_replace($match[0], '', $header); return $match['id']; } return null; } /** * Reduce the toc to the given level * * @param array &$toc * @param int $level */ protected function reduceToc(array &$toc, $level) { while (end($toc)->level >= $level) { array_pop($toc); } } }