icingaweb2/modules/doc/library/Doc/DocParser.php

236 lines
7.4 KiB
PHP
Raw Normal View History

2013-10-16 14:45:23 +02:00
<?php
/* Icinga Web 2 | (c) 2013 Icinga Development Team | GPLv2+ */
2013-10-16 14:45:23 +02:00
namespace Icinga\Module\Doc;
use CachingIterator;
2016-03-30 15:29:50 +02:00
use RecursiveIteratorIterator;
2015-11-24 16:10:45 +01:00
use SplFileObject;
use SplStack;
use Icinga\Data\Tree\SimpleTree;
use Icinga\Exception\NotReadableError;
2015-11-24 16:10:45 +01:00
use Icinga\Util\DirectoryIterator;
use Icinga\Module\Doc\Exception\DocException;
2013-10-16 14:45:23 +02:00
/**
* Parser for documentation written in Markdown
2013-10-16 14:45:23 +02:00
*/
class DocParser
2013-10-16 14:45:23 +02:00
{
/**
* Internal identifier for Atx-style headers
*
* @var int
*/
const HEADER_ATX = 1;
/**
* Internal identifier for Setext-style headers
*
* @var int
*/
const HEADER_SETEXT = 2;
/**
* Path to the documentation
*
* @var string
*/
protected $path;
/**
* Iterator over documentation files
*
2015-11-24 16:10:45 +01:00
* @var DirectoryIterator
*/
protected $docIterator;
2013-10-16 14:45:23 +02:00
/**
* Create a new documentation parser for the given path
*
2014-12-09 14:24:11 +01:00
* @param string $path Path to the documentation
2013-10-16 14:45:23 +02:00
*
* @throws DocException If the documentation directory does not exist
* @throws NotReadableError If the documentation directory is not readable
*/
public function __construct($path)
{
2015-11-24 16:10:45 +01:00
if (! DirectoryIterator::isReadable($path)) {
throw new DocException(
2015-11-24 16:10:45 +01:00
mt('doc', 'Documentation directory \'%s\' is not readable'),
$path
);
}
$this->path = $path;
2016-03-30 15:29:50 +02:00
$this->docIterator = new DirectoryIterator($path, 'md', DirectoryIterator::FILES_FIRST);
}
/**
* Extract atx- or setext-style headers from the given lines
*
* @param string $line
* @param string $nextLine
*
* @return array|null An array containing the header and the header level or null if there's nothing to extract
*/
protected function extractHeader($line, $nextLine)
{
if (! $line) {
return null;
}
$header = null;
if ($line
&& $line[0] === '#'
&& preg_match('/^#+/', $line, $match) === 1
) {
// Atx
$level = strlen($match[0]);
$header = trim(substr($line, $level));
if (! $header) {
return null;
}
$headerStyle = static::HEADER_ATX;
} elseif ($nextLine
&& ($nextLine[0] === '=' || $nextLine[0] === '-')
&& preg_match('/^[=-]+\s*$/', $nextLine, $match) === 1
) {
// Setext
$header = trim($line);
if (! $header) {
return null;
}
if ($match[0][0] === '=') {
$level = 1;
} else {
$level = 2;
}
$headerStyle = static::HEADER_SETEXT;
}
if ($header === null) {
return null;
}
2017-07-28 10:20:18 +02:00
if (strpos($header, '<') !== false
&& preg_match('#(?:<(?P<tag>a|span) (?:id|name)="(?P<id>.+)"></(?P=tag)>)\s*#u', $header, $match)
) {
$header = str_replace($match[0], '', $header);
$id = $match['id'];
} else {
$id = null;
}
2016-03-30 15:29:50 +02:00
/** @noinspection PhpUndefinedVariableInspection */
return array($header, $id, $level, $headerStyle);
}
2016-03-30 15:29:50 +02:00
/**
* Generate unique section ID
*
* @param string $id
* @param string $filename
* @param SimpleTree $tree
*
* @return string
*/
protected function uuid($id, $filename, SimpleTree $tree)
{
$id = str_replace(' ', '-', $id);
if ($tree->getNode($id) === null) {
return $id;
2016-03-30 15:29:50 +02:00
}
$id = $id . '-' . md5($filename);
2016-03-30 15:29:50 +02:00
$offset = 0;
while ($tree->getNode($id)) {
if ($offset++ === 0) {
$id .= '-' . $offset;
} else {
$id = substr($id, 0, -1) . $offset;
}
}
return $id;
}
/**
* Get the documentation tree
*
* @return SimpleTree
*/
public function getDocTree()
{
$tree = new SimpleTree();
2016-03-30 15:29:50 +02:00
foreach (new RecursiveIteratorIterator($this->docIterator) as $filename) {
2015-11-24 16:10:45 +01:00
$file = new SplFileObject($filename);
$file->setFlags(SplFileObject::READ_AHEAD);
2015-08-10 13:23:14 +02:00
$stack = new SplStack();
$cachingIterator = new CachingIterator($file);
$insideFencedCodeBlock = false;
for ($cachingIterator->rewind(); $cachingIterator->valid(); $cachingIterator->next()) {
$line = $cachingIterator->current();
$header = null;
if (substr($line, 0, 3) === '```') {
$insideFencedCodeBlock = ! $insideFencedCodeBlock;
} elseif (! $insideFencedCodeBlock) {
$fileIterator = $cachingIterator->getInnerIterator();
$header = $this->extractHeader($line, $fileIterator->valid() ? $fileIterator->current() : null);
}
if ($header !== null) {
list($title, $id, $level, $headerStyle) = $header;
while (! $stack->isEmpty() && $stack->top()->getLevel() >= $level) {
$stack->pop();
}
if ($id === null) {
$path = array();
foreach ($stack as $section) {
/** @var $section DocSection */
$path[] = $section->getTitle();
}
$path[] = $title;
$id = implode('-', $path);
$noFollow = true;
} else {
$noFollow = false;
}
2016-03-30 15:29:50 +02:00
$id = $this->uuid($id, $filename, $tree);
$section = new DocSection();
$section
->setId($id)
->setTitle($title)
->setLevel($level)
->setNoFollow($noFollow);
if ($stack->isEmpty()) {
$section->setChapter($section);
$tree->addChild($section);
} else {
$section->setChapter($stack->bottom());
$tree->addChild($section, $stack->top());
}
$stack->push($section);
if ($headerStyle === static::HEADER_SETEXT) {
$cachingIterator->next();
continue;
}
} else {
if ($stack->isEmpty()) {
2015-08-10 13:23:14 +02:00
$title = ucfirst($file->getBasename('.' . pathinfo($file->getFilename(), PATHINFO_EXTENSION)));
2016-03-30 15:29:50 +02:00
$id = $this->uuid($title, $filename, $tree);
2015-08-10 13:23:14 +02:00
$section = new DocSection();
$section
->setId($id)
->setTitle($title)
->setLevel(1)
->setNoFollow(true);
$section->setChapter($section);
$tree->addChild($section);
$stack->push($section);
}
$stack->top()->appendContent($line);
}
}
}
return $tree;
2013-10-16 14:45:23 +02:00
}
}