X-Git-Url: http://git.shiar.net/minimedit.git/blobdiff_plain/1abb286e88defee799e43cdd296914f74f722bde..ea491f36c7f81ed231444ed5e4a76c52b03434ac:/article.inc.php diff --git a/article.inc.php b/article.inc.php index bc8dbff..93bbe3b 100644 --- a/article.inc.php +++ b/article.inc.php @@ -16,34 +16,70 @@ function showdate($parts) class ArchiveArticle { + public $raw, $title, $body; # file contents + public $meta = []; # head metadata properties + function __construct($path) { - $this->page = $path; - $this->link = preg_replace('{(?:/index)?\.html$}', '', $path); + $this->page = preg_replace('{^\.(?:/|$)}', '', $path); + $this->link = preg_replace('{(?:(?:/|^)index)?\.html$}', '', $this->page); + $this->raw($this->page); } - function __get($col) + function raw($page) { - return $this->$col = $this->$col(); # run method and cache - } + if (!file_exists($page)) { + return; + } + $this->raw = file_get_contents($page); - function file() - { - if (!file_exists($this->page)) return; - return fopen($this->page, 'r'); + if (preg_match_all('{ + \G \s* + }x', $this->raw, $meta)) { + $matchlen = array_sum(array_map('strlen', $meta[0])); + $this->raw = substr($this->raw, $matchlen); # delete matched contents + $this->meta = array_combine($meta[1], $meta[2]); # [property => content] + } + + // find significant contents + $this->body = preg_replace('{}s', '', $this->raw); + if (preg_match('{

(.*?)

\s*(.*)}s', $this->body, $titlematch)) { + list (, $this->title, $this->body) = $titlematch; + } } - function rawtitle() + function __get($col) { - return fgets($this->file); + return $this->$col = $this->$col(); # run method and cache } - function title() - { - return preg_replace('{

(.*)

\s*}', '\1', $this->rawtitle); + + function handler() + { + $path = $this->link; + $this->path = ''; + $this->restricted = FALSE; + while (TRUE) { + if (file_exists("$path/.private")) { + $this->restricted = $path; + } + + if (file_exists("$path/index.php")) { + return $path; + } + + $up = strrpos($path, '/'); + $this->path = substr($path, $up) . $this->path; + $path = substr($path, 0, $up); + if ($up === FALSE) { + break; + } + } + return; } + function safetitle() { - return trim(strip_tags($this->title)); + return trim($this->meta['og:title'] ?? strip_tags($this->title)); } function name() { @@ -74,16 +110,10 @@ class ArchiveArticle return showdate($this->dateparts); } - function body() - { - if (!$this->file) return; - $this->rawtitle; - return fread($this->file, filesize($this->page) ?: 1); - } function story() { if ( preg_match('{ - \n (?: < (?: p | figure [^>]* ) >\s* )+ (]*>) | \n + (?: < (?: p | figure [^>]* ) >\s* )+ (]*>) | \n }x', $this->body, $img, PREG_OFFSET_CAPTURE) ) { # strip part after matching divider (image) if (isset($img[1])) { @@ -94,13 +124,17 @@ class ArchiveArticle return $this->body; } - function raw() - { - return $this->rawtitle . $this->body; - } function teaser() { - if (preg_match('{

(.*?)

}s', $this->story, $bodyp)) { + if ($override = @$this->meta['og:description']) { + # prefer specific page description if found in metadata + return $override; + } + + # paragraph contents following the page header if any + if (preg_match('{ + \G (?> \s+ |
]*> | \[\[[^]]*\]\] )*

\s* (.*?)

+ }sx', $this->body, $bodyp, 0)) { return $bodyp[1]; } } @@ -113,6 +147,11 @@ class ArchiveArticle } function image() { + if ($override = @$this->meta['og:image']) { + # prefer specific page image if found in metadata + return $override; + } + if ( preg_match('/\bsrc="([^"]*)"/', $this->img, $src) ) { return $src[1]; } @@ -126,3 +165,41 @@ class ArchiveArticle ); } } + +class PageSearch +{ + function __construct($path = '.') + { + $this->iterator = new RecursiveCallbackFilterIterator( + new RecursiveDirectoryIterator($path), + function ($current) { + if ($current->getFilename()[0] === '.') { + # skip hidden files and directories + return FALSE; + } + if ($current->isLink()) { + # ignore symlinks, original contents only + return FALSE; + } + if ($current->isDir()) { + # traverse subdirectories unless untracked in any amount + return !file_exists("$current/.gitignore"); + } + # match **/*.html + return preg_match('/(?getFilename()); + } + ); + } + + function files() + { + # order alphabetically by link + $dir = iterator_to_array(new RecursiveIteratorIterator($this->iterator)); + array_walk($dir, function (&$row, $name) { + # prepare values for sorting (directory index first) + $row = preg_replace('{/index\.html$}', '', $name); + }); + asort($dir); + return $dir; + } +}