mirror of
https://github.com/BookStackApp/BookStack.git
synced 2024-10-01 01:36:00 -04:00
db7b11fe93
Adds a thin wrapper for DOMDocument to simplify and align usage within all areas of BookStack. Also means we move away from old deprecated mb_convert_encoding usage. Closes #4638
97 lines
2.5 KiB
PHP
97 lines
2.5 KiB
PHP
<?php
|
|
|
|
namespace BookStack\References;
|
|
|
|
use BookStack\App\Model;
|
|
use BookStack\References\ModelResolvers\BookLinkModelResolver;
|
|
use BookStack\References\ModelResolvers\BookshelfLinkModelResolver;
|
|
use BookStack\References\ModelResolvers\ChapterLinkModelResolver;
|
|
use BookStack\References\ModelResolvers\CrossLinkModelResolver;
|
|
use BookStack\References\ModelResolvers\PageLinkModelResolver;
|
|
use BookStack\References\ModelResolvers\PagePermalinkModelResolver;
|
|
use BookStack\Util\HtmlDocument;
|
|
|
|
/**
 * Scans HTML content for anchor links and maps each link to a model
 * using the set of resolvers supplied at construction time.
 */
class CrossLinkParser
{
    /**
     * Resolvers consulted, in array order, when mapping a link to a model.
     *
     * @var CrossLinkModelResolver[]
     */
    protected array $modelResolvers;

    /**
     * @param CrossLinkModelResolver[] $modelResolvers Resolvers to try, in order, for each link.
     */
    public function __construct(array $modelResolvers)
    {
        $this->modelResolvers = $modelResolvers;
    }

    /**
     * Find every model referenced by a link within the provided HTML.
     * Results are de-duplicated on a "class:id" key, so a model linked
     * multiple times is only returned once.
     *
     * @return Model[]
     */
    public function extractLinkedModels(string $html): array
    {
        $uniqueModels = [];

        foreach ($this->getLinksFromContent($html) as $href) {
            $resolved = $this->linkToModel($href);
            if ($resolved === null) {
                // No resolver recognised this link; nothing to collect.
                continue;
            }

            $identity = get_class($resolved) . ':' . $resolved->id;
            $uniqueModels[$identity] = $resolved;
        }

        // Drop the de-duplication keys so callers receive a plain list.
        return array_values($uniqueModels);
    }

    /**
     * Collect the href attribute value of each anchor that has one
     * within the given HTML.
     *
     * @return string[]
     */
    protected function getLinksFromContent(string $html): array
    {
        $document = new HtmlDocument($html);
        $hrefs = [];

        /** @var \DOMElement $anchorNode */
        foreach ($document->queryXPath('//a[@href]') as $anchorNode) {
            $hrefs[] = $anchorNode->getAttribute('href');
        }

        return $hrefs;
    }

    /**
     * Run the link through this instance's resolvers, in order, and
     * provide the first model found. Gives null when no resolver matches.
     */
    protected function linkToModel(string $link): ?Model
    {
        $found = null;

        foreach ($this->modelResolvers as $candidateResolver) {
            $found = $candidateResolver->resolve($link);
            if ($found !== null) {
                // First successful resolver wins; later ones are not consulted.
                break;
            }
        }

        return $found;
    }

    /**
     * Build a parser pre-loaded with the resolvers for the default
     * BookStack entity link types. The permalink resolver is listed first,
     * followed by page, chapter, book and bookshelf link resolvers.
     */
    public static function createWithEntityResolvers(): self
    {
        $entityResolvers = [
            new PagePermalinkModelResolver(),
            new PageLinkModelResolver(),
            new ChapterLinkModelResolver(),
            new BookLinkModelResolver(),
            new BookshelfLinkModelResolver(),
        ];

        return new self($entityResolvers);
    }
}
|