praiadeseselle/wire/modules/PagePathHistory.module

1197 lines
36 KiB
Text
Raw Normal View History

2022-03-08 15:55:41 +01:00
<?php namespace ProcessWire;
/**
* ProcessWire Page Path History
*
* Keeps track of past URLs where pages have lived and automatically 301 redirects
* to the new location whenever the past URL is accessed.
*
2023-03-10 19:41:40 +01:00
* ProcessWire 3.x, Copyright 2022 by Ryan Cramer
2022-03-08 15:55:41 +01:00
* https://processwire.com
*
* @method upgrade($fromVersion, $toVersion)
* @property int $minimumAge
2022-11-05 18:32:48 +01:00
* @property array|bool $rootSegments
2022-03-08 15:55:41 +01:00
*
*
*/
class PagePathHistory extends WireData implements Module, ConfigurableModule {
public static function getModuleInfo() {
return array(
'title' => 'Page Path History',
2022-11-05 18:32:48 +01:00
'version' => 8,
2023-03-10 19:41:40 +01:00
'summary' => "Keeps track of past URLs where pages have lived and automatically redirects (301 permanent) to the new location whenever the past URL is accessed.",
2022-03-08 15:55:41 +01:00
'singular' => true,
'autoload' => true,
2022-11-05 18:32:48 +01:00
);
2022-03-08 15:55:41 +01:00
}
/**
* Table created by this module
*
*/
const dbTableName = 'page_path_history';
/**
* Minimum age in seconds that a page must be before we'll bother remembering its previous path
*
*/
const minimumAge = 120;
/**
* Maximum segments to support in a redirect URL
*
* Used to place a limit on recursion and paths
*
*/
const maxSegments = 10;
/**
* PagePageHistory module/schema version
*
* @var int
*
*/
protected $version = 0;
/**
* Construct
*
*/
public function __construct() {
parent::__construct();
$this->set('minimumAge', self::minimumAge);
2022-11-05 18:32:48 +01:00
$this->set('rootSegments', false);
2022-03-08 15:55:41 +01:00
}
/**
* Initialize the hooks
*
*/
public function init() {
$this->pages->addHook('moved', $this, 'hookPageMoved');
$this->pages->addHook('renamed', $this, 'hookPageMoved');
$this->pages->addHook('deleted', $this, 'hookPageDeleted');
$this->addHook('ProcessPageView::pageNotFound', $this, 'hookPageNotFound');
$this->addHook('Page::addUrl', $this, 'hookPageAddUrl');
$this->addHook('Page::removeUrl', $this, 'hookPageRemoveUrl');
}
/**
* Get version of this module/schema
*
* @return int
*
*/
protected function getVersion() {
if($this->version) return $this->version;
2023-03-10 19:41:40 +01:00
$this->version = $this->wire()->modules->getModuleInfoProperty($this, 'version');
2022-03-08 15:55:41 +01:00
if(!$this->version) $this->version = 1;
return $this->version;
}
/**
* Whether or not to consider language_id in page_path_history module table
*
* @return Languages|bool Returns Languages object if yes, or boolean false if not
*
*/
protected function getLanguages() {
if($this->getVersion() < 2) return false;
2022-11-05 18:32:48 +01:00
$languages = $this->wire()->languages;
return $languages && $languages->hasPageNames() ? $languages : false;
2022-03-08 15:55:41 +01:00
}
/**
* Given a language ID, name or Language object, return Language object or NULL if not found
*
* @param int|string|Language $language
* @return Language|null
*
*/
protected function getLanguage($language) {
$languages = $this->getLanguages();
if(!$languages) return null;
if($language instanceof Page) {
// ok
} else if($language === 0) {
$language = $languages->getDefault();
2023-03-10 19:41:40 +01:00
} else if(is_int($language) || ctype_digit("$language")) {
2022-03-08 15:55:41 +01:00
$language = $languages->get((int) $language);
} else if(is_string($language) && $language) {
2023-03-10 19:41:40 +01:00
$language = $languages->get($this->wire()->sanitizer->pageNameUTF8($language));
2022-03-08 15:55:41 +01:00
}
if($language && !$language->id) $language = null;
return $language;
}
/**
* Set a history path for a page and delete any existing entries for pages current path
*
* @param Page $page
* @param string $path
* @param Language|int $language
* @return bool True on success, or false if path already consumed in history
*
*/
public function setPathHistory(Page $page, $path, $language = null) {
2023-03-10 19:41:40 +01:00
$database = $this->wire()->database;
2022-03-08 15:55:41 +01:00
$table = self::dbTableName;
$result = $this->addPathHistory($page, $path, $language);
if($result) {
// delete any possible entries that overlap with the $page current path since are no longer applicable
$query = $database->prepare("DELETE FROM $table WHERE path=:path LIMIT 1");
2022-11-05 18:32:48 +01:00
$query->bindValue(":path", rtrim($this->wire()->sanitizer->pagePathName($page->path, Sanitizer::toAscii), '/'));
2022-03-08 15:55:41 +01:00
$query->execute();
}
return $result;
}
/**
* Add a history path for a page
*
* @param Page $page
* @param string $path
* @param null|Language $language
* @return bool True if path was added, or false if it likely overlaps with an existing path
*
*/
public function addPathHistory(Page $page, $path, $language = null) {
2022-11-05 18:32:48 +01:00
$sanitizer = $this->wire()->sanitizer;
$database = $this->wire()->database;
$modules = $this->wire()->modules;
2022-03-08 15:55:41 +01:00
$table = self::dbTableName;
2022-11-05 18:32:48 +01:00
$path = $sanitizer->pagePathName('/' . trim($path, '/'), Sanitizer::toAscii);
2022-03-08 15:55:41 +01:00
$selector = "path=$path";
2022-11-05 18:32:48 +01:00
if($modules->isInstalled('PagePaths')) $selector .= ", id!=$page->id";
if($this->wire()->pages->count($selector)) return false;
2022-03-08 15:55:41 +01:00
$language = $this->getLanguage($language);
$sql = "INSERT INTO $table SET path=:path, pages_id=:pages_id, created=NOW()";
if($language) $sql .= ', language_id=:language_id';
$query = $database->prepare($sql);
$query->bindValue(":path", $path);
$query->bindValue(":pages_id", $page->id, \PDO::PARAM_INT);
if($language) $query->bindValue(':language_id', $language->id, \PDO::PARAM_INT);
try {
$result = $query->execute();
} catch(\Exception $e) {
// ignore the exception because it means there is already a past URL (duplicate)
$result = false;
}
2022-11-05 18:32:48 +01:00
$this->addRootSegment($path);
2022-03-08 15:55:41 +01:00
return $result;
}
/**
* Delete path entry for given page and path
*
* @param Page $page
* @param string $path
* @return int
*
*/
public function deletePathHistory(Page $page, $path) {
2022-11-05 18:32:48 +01:00
$database = $this->wire()->database;
2022-03-08 15:55:41 +01:00
$table = self::dbTableName;
2022-11-05 18:32:48 +01:00
$path = $this->wire()->sanitizer->pagePathName('/' . trim($path, '/'), Sanitizer::toAscii);
2022-03-08 15:55:41 +01:00
$sql = "DELETE FROM $table WHERE path=:path AND pages_id=:pages_id LIMIT 1";
$query = $database->prepare($sql);
$query->bindValue(':path', $path);
$query->bindValue(':pages_id', $page->id, \PDO::PARAM_INT);
$query->execute();
$cnt = $query->rowCount();
$query->closeCursor();
return $cnt;
}
/**
* Delete all path history for a given Page or for all pages
*
* @param Page|true $page If value of this param is boolean true (rather than Page), all paths for all pages are cleared
* @throws WireException if param $page is not of expected type (true or Page)
* @since 3.0.178
*
*/
public function deleteAllPathHistory($page) {
$database = $this->wire()->database;
if($page === true) {
$database->exec('DELETE FROM ' . self::dbTableName);
} else if($page instanceof Page && $page->id) {
$query = $database->prepare('DELETE FROM ' . self::dbTableName . ' WHERE pages_id=:pages_id');
$query->bindValue(':pages_id', $page->id, \PDO::PARAM_INT);
$query->execute();
} else {
throw new WireException("Invalid param: instance of Page or boolean true expected");
}
2022-11-05 18:32:48 +01:00
$this->rebuildRootSegments();
2022-03-08 15:55:41 +01:00
}
/**
* Get an array of all paths the given page has previously had, oldest to newest
*
* For the options argument:
* - Optionally specify a Language instance (or name or ID) to isolate results to a specific language.
* - Optionally specify boolean true to return verbose info.
*
* @param Page $page Page to retrieve paths for.
* @param Language|null|array|bool Specify an option below:
* - `language` (Language|int|string): Limit returned paths to this language. If none specified, then all languages are included.
* - `verbose` (bool): Return associative array for each path with additional info (date and language, if present).
* - `virtual` (bool): Return history that includes auto-determined virtual entries from parent history? (default=true)
* What this does is also include changes to parent pages that would affect overall URL to requested page.
* - Or you may specify the `language` option for the options argument.
* - Or you may specify boolean `true` for options argument as a shortcut for the `verbose` option.
* @return array of paths
*
*/
public function getPathHistory(Page $page, $options = array()) {
static $level = 0;
$level++;
$defaults = array(
'language' => !is_array($options) && !is_bool($options) ? $options : null,
'verbose' => is_bool($options) ? $options : false,
'virtual' => true,
);
2022-11-05 18:32:48 +01:00
$database = $this->wire()->database;
$sanitizer = $this->wire()->sanitizer;
$languages = $this->wire()->languages;
2022-03-08 15:55:41 +01:00
$paths = array();
$options = is_array($options) ? array_merge($defaults, $options) : $defaults;
if($this->getVersion() < 2) {
$options['language'] = null;
$allowLanguage = false;
} else {
2022-11-05 18:32:48 +01:00
$allowLanguage = $languages && $languages->hasPageNames();
2022-03-08 15:55:41 +01:00
}
$language = $options['language'] && $allowLanguage ? $this->getLanguage($options['language']) : null;
$finds = array('pages_id' => $page->id);
$selects = array('path');
$wheres = array();
if($options['verbose']) $selects[] = 'created';
if($options['verbose'] && $allowLanguage) $selects[] = 'language_id';
if($language) $finds['language_id'] = $language->isDefault() ? 0 : $language->id;
foreach($finds as $col => $value) {
$wheres[] = "$col=:$col";
}
$query = $database->prepare(
'SELECT ' . implode(', ', $selects) . ' FROM ' . self::dbTableName . ' ' .
'WHERE ' . implode(' AND ', $wheres) . ' ' .
"ORDER BY created"
);
foreach($finds as $col => $value) {
$query->bindValue(":$col", $value, \PDO::PARAM_INT);
}
try {
$query->execute();
/** @noinspection PhpAssignmentInConditionInspection */
while($row = $query->fetch(\PDO::FETCH_ASSOC)) {
$path = $sanitizer->pagePathName($row['path'], Sanitizer::toUTF8);
if($options['verbose']) {
$value = array('path' => $path);
$pathDate = $row['created'];
$value['date'] = $pathDate;
if($allowLanguage && isset($row['language_id'])) {
$pathLanguage = $this->getLanguage((int) $row['language_id']);
$value['language'] = $pathLanguage && $pathLanguage->id ? $pathLanguage : null;
}
} else {
$value = $path;
}
$paths[$path] = $value;
}
} catch(\Exception $e) {
2022-11-05 18:32:48 +01:00
if(!$this->checkTableSchema()) {
$this->error($e->getMessage(), Notice::superuser | Notice::log);
}
2022-03-08 15:55:41 +01:00
}
if($options['virtual']) {
// get changes to current and previous parents as well
foreach($paths as $value) {
$virtualPaths = $this->getVirtualHistory($page, $value, $options);
foreach($virtualPaths as $virtualPath => $virtualInfo) {
if(isset($paths[$virtualPath])) continue;
$paths[$virtualPath] = $virtualInfo;
}
}
if($level === 1 && $options['verbose']) {
$paths = $this->sortVerbosePathInfo($paths);
}
}
$level--;
return array_values($paths);
}
/**
* Sort verbose paths by date
*
* @param array $paths Verbose paths
* @param bool $newest Sort newest to oldest? Specify false so sort oldest to newest. (default=true)
* @return array
*
*/
protected function sortVerbosePathInfo(array $paths, $newest = true) {
$sortPaths = array();
foreach($paths as $value) {
$date = strtotime($value['date']);
while(isset($sortPaths[$date])) $date++;
$sortPaths[$date] = $value;
}
if($newest) {
krsort($sortPaths);
} else {
ksort($sortPaths);
}
return $sortPaths;
}
/**
* Get history which includes entries not actually in pages_paths table reflecting changes to parents
*
* @param Page $page
* @param string|array $path
* @param array $options
*
* @return array
*
*/
protected function getVirtualHistory(Page $page, $path, array $options) {
$paths = array();
$checkParents = array();
if(is_array($path)) {
// path is verbose info
$pathInfo = $path;
$path = $pathInfo['path'];
} else {
// path is string
$pathInfo = array('path');
}
// separate page name and parent path
$parts = explode('/', trim($path, '/'));
$pageName = array_pop($parts);
$parentPath = implode('/', $parts);
// if pages current parent is not homepage, include it
if($page->parent_id > 1) {
$checkParents[] = $page->parent;
}
// if historical parent path differs from pages current parent path, include it
if($parentPath === '' || $parentPath === '/') {
// historial parent is root/home
} else if($parentPath === trim($page->parent()->path(), '/')) {
// historial parent is the same as current parent
} else if($parentPath === trim($page->path(), '/')) {
// historial parent is the page itself
} else {
// historial parent may be one we want to check
$parent = $this->wire()->pages->get("/$parentPath");
if(!$parent->id) $parent = $this->getPage($parentPath);
// if parent from path is different from current page parent, include in our list of parents to check
if($parent->id > 1 && $parent->id != $page->parent_id && $parent->id != $page->id) {
$checkParents[] = $parent;
}
}
// get paths for each parent
foreach($checkParents as $parent) {
$parentPaths = $this->getVirtualHistoryParent($page, $pageName, $pathInfo, $parent, $options);
foreach($parentPaths as $parentPath => $parentInfo) {
if(!isset($paths[$parentPath])) {
$paths[$parentPath] = $parentInfo;
}
}
}
return $paths;
}
/**
* Get virtual history for page in context of a specific parent (companion to getVirtualHistory method)
*
* @param Page $page
* @param string $pageName Historical name (or same as page->name)
* @param array|string $pagePathInfo Path or pathInfo array
* @param Page $parent
* @param array $options
* @return array
*
*/
protected function getVirtualHistoryParent(Page $page, $pageName, array $pagePathInfo, Page $parent, array $options) {
$paths = array();
// get path history for this parent
$parentPaths = $this->getPathHistory($parent, $options);
// pageNamesDates is array of name => timestamp
$pageNamesDates = array(
$pageName => isset($pagePathInfo['date']) ? strtotime($pagePathInfo['date']) : 0
);
// if historical name differs from current name, include current name in pageNamesDates
if($page->name != $pageName) {
$pageNamesDates[$page->name] = $page->modified;
}
// iterate through each of the names this page has had, along with the date that it was changed to it
foreach($pageNamesDates as $name => $date) {
// iterate through all possible parent paths
foreach($parentPaths as $parentPathInfo) {
$parentPath = $options['verbose'] ? $parentPathInfo['path'] : $parentPathInfo;
// create path that is historical parent path plus current iteration of page name
$path = $parentPath . '/' . $name;
// if we've already got this path, skip it
if(isset($paths[$path])) continue;
// non-verbose mode only includes paths
if(empty($options['verbose'])) {
$paths[$path] = $path;
continue;
}
// if parent change date is older than page change date, then we can skip it
if(strtotime($parentPathInfo['date']) < $date) continue;
// if path is related to trash do not include it
if(strpos($path, '/trash/') === 0 || preg_match('!/\d+\.\d+\.\d+_[-_a-z0-9]+!', $path)) {
continue;
}
// create verbose info for this entry
$pathInfo = array(
'path' => $path,
'date' => $parentPathInfo['date'],
'virtual' => $parent->id
);
// if parent is specific to a language, include that info in the verbose value
if(isset($parentPathInfo['language'])) {
$pathInfo['language'] = $parentPathInfo['language'];
}
$paths[$path] = $pathInfo;
}
}
return $paths;
}
/**
2022-11-05 18:32:48 +01:00
* Get array of info about a path if it is in history
*
* If path is found in history, the returned array `id` value will be populated with a positive
* integer of the found page ID. If not found, it will be populated with integer 0.
*
* By default this method attempts to perform exact path matches only. To enable partial matches
* of paths that may be appended with additional URL segments, set the `allowUrlSegments` option
* to true. Note that it will only apply to matched pages that have templates allowing URL
* segments.
*
* Return array includes:
*
* - `id` (int): ID of matched page or 0 if no match.
* - `path` (string): Path that was matched.
* - `language_id` (int): ID of language for path, if applicable.
* - `templates_id` (int): ID of template for page that was matched.
* - `parent_id (int): ID of parent for page that was matched.
* - `status` (int): Status of the page that was matched.
* - `created` (string): Date that this entry was created (ISO-8601 date/time string).
* - `name` (string): Name of page that was matched in default language.
* - `urlSegmentStr` (string): Portion of path that was identified as URL segments (for partial match).
* - `matchType` (string): Contains value “exact” when exact match, “partial” when partial/URL segments
* match, or blank string when no match.
*
* Note that the `urlSegmentStr` and `matchType` properties may only be of interest if the
* given `allowUrlSegments` option is set to `true`.
*
* @param string $path
* @param array $options
* - `allowUrlSegments` (bool): Allow matching paths with URL segments? (default=false)
* When used, the `urlSegmentStr` return value property will be populated with slash
* separated URL segments that were not part of the matched path, and the `matchType`
* property will contain the value “partial”.
* @return array
* @since 3.0.186
2022-03-08 15:55:41 +01:00
*
2022-11-05 18:32:48 +01:00
*/
public function getPathInfo($path, array $options = array()) {
$defaults = array(
'allowUrlSegments' => false,
);
$options = array_merge($defaults, $options);
$sanitizer = $this->wire()->sanitizer;
$templates = $this->wire()->templates;
$database = $this->wire()->database;
$config = $this->wire()->config;
$table = self::dbTableName;
$path = '/' . trim($path, '/');
$originalPath = $path; // original path (without ascii conversion)
$namesUTF8 = $config->pageNameCharset === 'UTF8';
$result = array(
'id' => 0,
'path' => $path,
'language_id' => 0,
'templates_id' => 0,
'parent_id' => 0,
'created' => '',
'status' => 0,
'name' => '',
'matchType' => '',
'urlSegmentStr' => '',
);
if($namesUTF8) $path = $sanitizer->pagePathName($path, Sanitizer::toAscii);
$requestPath = $path; // path that was requested (with ascii conversion)
$wheres = array("$table.path=:path");
$binds['path'] = $requestPath;
if($options['allowUrlSegments']) {
$n = 0;
while(strlen($path)) {
$pos = strrpos($path, '/');
if(!$pos) break;
$path = substr($path, 0, $pos);
$wheres[] = "$table.path=:path$n";
$binds["path$n"] = rtrim($path, '/');
$n++;
}
}
$sql =
"SELECT $table.path AS path, $table.pages_id AS id, $table.created AS created, $table.language_id AS language_id, " .
"pages.templates_id AS templates_id, pages.parent_id AS parent_id, pages.status AS status, pages.name AS name " .
"FROM $table " .
"LEFT JOIN pages ON $table.pages_id=pages.id " .
"WHERE " . implode(' OR ', $wheres);
try {
$query = $database->prepare($sql);
foreach($binds as $bindKey => $bindValue) {
$query->bindValue(":$bindKey", $bindValue);
}
$query->execute();
$rowCount = $query->rowCount();
$query->closeCursor();
} catch(\Exception $e) {
if(!$this->checkTableSchema()) throw $e;
$rowCount = 0;
$query = null;
}
if(!$rowCount || $query) return $result;
$rows = array();
$pathCounts = array();
$matchRow = null;
while($row = $query->fetch(\PDO::FETCH_ASSOC)) {
$path = $row['path'];
if($path === $requestPath) {
// found exact match
$matchRow = $row;
break;
} else {
// path with urlSegments match
$rows[$path] = $row;
$pathCounts[$path] = substr_count($path, '/');
}
}
$query->closeCursor();
if($matchRow) {
// ok found
$result['matchType'] = 'exact';
2023-03-10 19:41:40 +01:00
} else {
2022-11-05 18:32:48 +01:00
// select from multiple matched rows (urlSegments mode only)
// order by quantity of slashes (most to least)
arsort($pathCounts);
// find first row that has a template allowing URL segments
foreach($pathCounts as $path => $count) {
$row = $rows[$path];
$template = $templates->get((int) $row['templates_id']);
if(!$template || !$template->urlSegments) continue;
$matchRow = $row;
$result['matchType'] = 'partial';
break;
}
}
if($matchRow) {
$result = array_merge($result, $matchRow);
}
// if no match return now
if(!$result['id']) return $result;
foreach($result as $key => $value) {
if($key === 'id' || $key === 'status' || strpos($key, '_id')) {
$result[$key] = (int) $value;
} else if($key === 'path' && $namesUTF8) {
$result['path'] = $sanitizer->pagePathName($value, Sanitizer::toUTF8);
} else if($key === 'name' && $namesUTF8) {
$result['name'] = $sanitizer->pageName($value, Sanitizer::toUTF8);
}
}
if($result['matchType'] === 'partial') {
$result['urlSegmentStr'] = trim(substr($originalPath, strlen($result['path'])+1), '/');
}
return $result;
}
/**
* Given a previously existing path, return the matching Page object or NullPage if not found.
*
* If the path is for a specific language, this method also sets a $page->_language property
* containing the Language object the path is for.
*
* @param string $path Historical path of page you want to retrieve
* @param int $level Recursion level for internal recursive use only
* @return Page|NullPage
*
*/
public function getPage($path, $level = 0) {
$pages = $this->wire()->pages;
$page = $pages->newNullPage();
$sanitizer = $this->wire()->sanitizer;
$languages = $this->getLanguages();
$database = $this->wire()->database;
$table = self::dbTableName;
$pathRemoved = '';
$cnt = 0;
if(!$level) {
$path = $sanitizer->pagePathName($path, Sanitizer::toAscii);
if(!$this->isRootSegment($path)) return $pages->newNullPage();
}
$path = '/' . trim($path, '/');
while(strlen($path) && !$page->id && $cnt < self::maxSegments) {
$sql = "SELECT pages_id ";
if($languages) $sql .= ", language_id ";
$sql .= "FROM $table WHERE path=:path";
$query = $database->prepare($sql);
$query->bindValue(":path", $path);
$error = false;
try {
$query->execute();
} catch(\Exception $e) {
if(strpos($e->getMessage(), '1054') !== false) $this->upgrade(1, 2);
$this->wire()->log->error('PagePathHistory::getPage() - ' . $e->getMessage());
$error = true;
}
if($error) break;
if($query->rowCount() > 0) {
// found a match
$row = $query->fetch(\PDO::FETCH_NUM);
$pages_id = (int) $row[0];
$language_id = $languages && isset($row[1]) ? $row[1] : 0;
$page = $this->pages->get((int) $pages_id);
if($language_id) $page->setQuietly("_language", $this->getLanguage($language_id));
} else {
// didn't find a match, we'll pop the last segment off and try again for the parent
$pos = strrpos($path, '/');
$pathRemoved = substr($path, $pos) . $pathRemoved;
$path = substr($path, 0, $pos);
}
$query->closeCursor();
$cnt++;
}
// if no page was found, then we can stop trying now
if(!$page->id) return $page;
if($cnt > 1) {
// a parent match was found if our counter is > 1
$parent = $page;
// use the new parent path and add the removed components back on to it
$path = rtrim($parent->path, '/') . $pathRemoved;
// see if it might exist at the new parent's URL
$page = $pages->getByPath($path, array(
'useHistory' => false,
'useLanguages' => $languages ? true : false
));
if($page->id) {
// found a page
$languagePageNames = $languages ? $languages->pageNames() : null;
if($languagePageNames) {
$language = $languagePageNames->getPagePathLanguage($path, $page);
if($language) $page->setQuietly('_language', $language);
}
} else if($level < self::maxSegments) {
// if not, then go recursive, trying again
$page = $this->getPage($path, $level + 1);
}
}
return $page;
}
/*** ROOT SEGMENTS ***********************************************************/
/**
* Get all root segments
*
* @return array
* @since 3.0.186
*
*/
public function getRootSegments() {
if(is_array($this->rootSegments)) return $this->rootSegments;
return $this->rebuildRootSegments();
}
/**
* Is/was given segment ever a root segment?
*
* @param string $segment Segment or path containing it (in ascii format)
* @return bool
* @since 3.0.186
*
*/
public function isRootSegment($segment) {
$segment = trim($segment, '/');
if(strpos($segment, '/')) list($segment,) = explode('/', $segment, 2);
$segments = $this->getRootSegments();
return in_array($segment, $segments, true);
}
/**
* Add a root segment
*
* @param string $segment May be a segment or path to extract it from (in ascii format)
* @return bool True if added, false if it was already present
* @since 3.0.186
*
*/
protected function addRootSegment($segment) {
$segment = trim($segment, '/');
if(strpos($segment, '/')) list($segment,) = explode('/', $segment, 2);
$rootSegments = $this->rootSegments;
if(!is_array($rootSegments)) $rootSegments = array();
if(in_array($segment, $rootSegments, true)) return false;
$rootSegments[] = $segment;
$this->rootSegments = $rootSegments;
$this->wire()->modules->saveConfig($this, 'rootSegments', $rootSegments);
return true;
}
/**
* Rebuild all root segments
*
* @return array
* @since 3.0.186
*
*/
protected function rebuildRootSegments() {
$segments = array();
$sql = 'SELECT path FROM ' . self::dbTableName;
$query = $this->wire()->database->prepare($sql);
$query->execute();
while($row = $query->fetch(\PDO::FETCH_NUM)) {
$path = trim($row[0], '/');
list($segment,) = explode('/', $path, 2);
$segments[$segment] = $segment;
}
$query->closeCursor();
$segments = array_values($segments);
$this->rootSegments = $segments;
$this->wire()->modules->saveConfig($this, 'rootSegments', $segments);
return $segments;
}
/*** HOOKS *******************************************************************/
/**
* Hook called when a page is moved or renamed
*
2022-03-08 15:55:41 +01:00
* @param HookEvent $event
*
*/
public function hookPageMoved(HookEvent $event) {
/** @var Page $page */
$page = $event->arguments[0];
/** @var Languages $languages */
$languages = $this->getLanguages();
$age = time() - $page->created;
2022-11-05 18:32:48 +01:00
if($page->template->name === 'admin' || $this->wire()->pages->cloning || $age < $this->minimumAge) return;
2022-03-08 15:55:41 +01:00
// note that the paths we store have no trailing slash
2022-11-05 18:32:48 +01:00
2022-03-08 15:55:41 +01:00
if($languages) {
$parent = $page->parent();
$parentPrevious = $page->parentPrevious;
if($parentPrevious && $parentPrevious->id == $parent->id) $parentPrevious = null;
foreach($languages as $language) {
/** @var Language $language */
if($language->isDefault()) continue;
$namePrevious = $page->get("-name$language");
if(!$namePrevious && !$parentPrevious) continue;
if(!$namePrevious) $namePrevious = $page->name;
$languages->setLanguage($language);
$pathPrevious = $parentPrevious ? $parentPrevious->path() : $page->parent()->path();
$pathPrevious = rtrim($pathPrevious, '/') . "/$namePrevious";
$this->setPathHistory($page, $pathPrevious, $language->id);
$languages->unsetLanguage();
}
}
if(!$page->namePrevious) {
// abort saving a former URL if it looks like there isn't going to be one
if(!$page->parentPrevious || $page->parentPrevious->id == $page->parent->id) return;
}
if($page->parentPrevious) {
// if former or current parent is in trash, then don't bother saving redirects
2022-11-05 18:32:48 +01:00
if($page->parentPrevious->isTrash() || $page->parent->isTrash()) return;
2022-03-08 15:55:41 +01:00
// the start of our redirect URL will be the previous parent's URL
$path = $page->parentPrevious->path;
} else {
// the start of our redirect URL will be the current parent's URL (i.e. name changed)
$path = $page->parent->path;
}
if($page->namePrevious) {
$path = rtrim($path, '/') . '/' . $page->namePrevious;
} else {
$path = rtrim($path, '/') . '/' . $page->name;
}
2022-11-05 18:32:48 +01:00
// do not save paths that reference recovery format used by trash
// example: /blog/posts/5134.3096.83_page-name
if(strpos($path, '.') !== false && strpos($path, '_') !== false) {
if(preg_match('!/\d+\.\d+\.\d+_!', $path)) return;
}
// do not save paths that match any untitled page name
// example: /blog/posts/untitled-123123
$untitled = $this->wire()->pages->names()->untitledPageName();
if(strpos($path, $untitled) !== false) {
if(preg_match('!/' . preg_quote($untitled) . '[-]!', $path)) return;
}
2022-03-08 15:55:41 +01:00
if($languages) $languages->setDefault();
$this->setPathHistory($page, $path);
if($languages) $languages->unsetDefault();
}
/**
* Hook called upon 404 from ProcessPageView::pageNotFound
2022-11-05 18:32:48 +01:00
*
2022-03-08 15:55:41 +01:00
* @param HookEvent $event
*
*/
public function hookPageNotFound(HookEvent $event) {
2022-11-05 18:32:48 +01:00
2022-03-08 15:55:41 +01:00
/** @var Page $page */
$page = $event->arguments(0);
/** @var Wire404Exception $exception */
2022-11-05 18:32:48 +01:00
$exception = $event->arguments(4);
2022-03-08 15:55:41 +01:00
// If there is a page object set, then it means the 404 was triggered
// by the user not having access to it, or by the $page's template
// throwing a 404 exception. In either case, we don't want to do a
// redirect if there is a $page since any 404 is intentional there.
if($page && $page->id) {
// it did resolve to a Page: maybe a front-end 404
if(!$exception) {
// pageNotFound was called without an Exception
return;
} else if($exception->getCode() == Wire404Exception::codeFunction) {
// the wire404() function was called: allow PagePathHistory
} else if($exception->getMessage() === "1") {
// also allow PagePathHistory to operate when: throw new WireException(true);
} else {
// likely user didn't have access or intentional 404 that should not redirect
return;
2022-11-05 18:32:48 +01:00
}
2022-03-08 15:55:41 +01:00
}
2022-11-05 18:32:48 +01:00
2022-03-08 15:55:41 +01:00
$languages = $this->getLanguages();
2022-11-05 18:32:48 +01:00
$languagePageNames = $languages ? $languages->pageNames() : null;
if($languagePageNames) {
2022-03-08 15:55:41 +01:00
// the LanguageSupportPageNames may change the original requested path, so we ask it for the original
2022-11-05 18:32:48 +01:00
$path = $languagePageNames->getRequestPath();
$path = $path ? $this->wire()->sanitizer->pagePathName($path) : $event->arguments(1);
2022-03-08 15:55:41 +01:00
} else {
$path = $event->arguments(1);
}
2022-11-05 18:32:48 +01:00
2022-03-08 15:55:41 +01:00
$page = $this->getPage($path);
2022-11-05 18:32:48 +01:00
2022-03-08 15:55:41 +01:00
if($page->id && $page->viewable()) {
// if a page was found, redirect to it...
$language = $page->get('_language');
if($language && $languages) {
// ...optionally for a specific language
if($page->get("status$language")) {
$languages->setLanguage($language);
}
}
$this->session->redirect($page->url);
}
}
/**
* When a page is deleted, remove it from our redirects list as well
*
* @param HookEvent $event
*
*/
public function hookPageDeleted(HookEvent $event) {
$page = $event->arguments[0];
2022-11-05 18:32:48 +01:00
$database = $this->wire()->database;
$table = self::dbTableName;
$query = $database->prepare("DELETE FROM $table WHERE pages_id=:pages_id");
2022-03-08 15:55:41 +01:00
$query->bindValue(":pages_id", $page->id, \PDO::PARAM_INT);
$query->execute();
}
/**
* Implementation for $page->addUrl($url, [$language]) method
*
* @param HookEvent $event
*
*/
public function hookPageAddUrl(HookEvent $event) {
/** @var Page $page */
$page = $event->object;
/** @var string $url */
$url = $event->arguments(0);
/** @var Language|null $language */
$language = $event->arguments(1);
$event->return = $this->addPathHistory($page, $this->urlToPath($url), $language);
}
/**
* Implementation for $page->removeUrl($url, [$language]) method
*
* @param HookEvent $event
*
*/
public function hookPageRemoveUrl(HookEvent $event) {
/** @var page $page */
$page = $event->object;
/** @var string $url */
$url = $event->arguments(0);
$event->return = (bool) $this->deletePathHistory($page, $this->urlToPath($url));
}
2022-11-05 18:32:48 +01:00
/*** MODULE ******************************************************************/
2022-03-08 15:55:41 +01:00
/**
* Given URL that may include a root subdirectory, convert it to path relative to root subdirectory
*
* @param string $url
* @return string
*
*/
protected function urlToPath($url) {
2022-11-05 18:32:48 +01:00
$rootUrl = $this->wire()->config->urls->root;
2022-03-08 15:55:41 +01:00
if(strlen($rootUrl) > 1 && strpos($url, $rootUrl) === 0) {
$path = substr($url, strlen($rootUrl) - 1);
} else {
$path = $url;
}
return $path;
}
/**
2022-11-05 18:32:48 +01:00
* Check table schema and update as needed
*
* @return bool True if schema updated, false if not
2022-03-08 15:55:41 +01:00
*
*/
2022-11-05 18:32:48 +01:00
protected function checkTableSchema() {
$database = $this->wire()->database;
$table = self::dbTableName;
$updated = false;
if(!$database->columnExists($table, 'language_id')) {
try {
$database->exec("ALTER TABLE $table ADD language_id INT UNSIGNED DEFAULT 0");
$this->message("Added 'language_id' column to table $table", Notice::debug);
$updated = true;
} catch(\Exception $e) {
$this->error($e->getMessage(), Notice::superuser | Notice::log);
}
}
2022-03-08 15:55:41 +01:00
2022-11-05 18:32:48 +01:00
return $updated;
}
2022-03-08 15:55:41 +01:00
2022-11-05 18:32:48 +01:00
/**
* Install
*
*/
public function ___install() {
$database = $this->wire()->database;
$len = $database->getMaxIndexLength();
$table = self::dbTableName;
if($database->tableExists($table)) {
$this->checkTableSchema();
return;
}
2022-03-08 15:55:41 +01:00
2022-11-05 18:32:48 +01:00
$sql =
"CREATE TABLE $table (" .
"path VARCHAR($len) NOT NULL, " .
"pages_id INT UNSIGNED NOT NULL, " .
"language_id INT UNSIGNED DEFAULT 0, " . // v2
"created TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP, " .
"PRIMARY KEY path (path), " .
"INDEX pages_id (pages_id), " .
"INDEX created (created) " .
") ENGINE={$this->config->dbEngine} DEFAULT CHARSET={$this->config->dbCharset}";
2022-03-08 15:55:41 +01:00
2022-11-05 18:32:48 +01:00
$database->exec($sql);
2022-03-08 15:55:41 +01:00
}
/**
* Uninstall
*
*/
public function ___uninstall() {
2022-11-05 18:32:48 +01:00
$this->wire()->database->query("DROP TABLE " . self::dbTableName);
2022-03-08 15:55:41 +01:00
}
/**
* Upgrade PagePathHistory module schema
*
* @param int $fromVersion
* @param int $toVersion
*
*/
public function ___upgrade($fromVersion, $toVersion) {
2022-11-05 18:32:48 +01:00
if($this->checkTableSchema()) {
if($fromVersion != $toVersion) $this->message("PagePathHistory v$fromVersion => v$toVersion");
2022-03-08 15:55:41 +01:00
}
2022-11-05 18:32:48 +01:00
$this->rebuildRootSegments();
2022-03-08 15:55:41 +01:00
}
/**
* Module config
*
* @param InputfieldWrapper $inputfields
*
*/
public function getModuleConfigInputfields(InputfieldWrapper $inputfields) {
$modules = $this->wire()->modules;
/** @var InputfieldInteger $f */
$f = $modules->get('InputfieldInteger');
$f->attr('name', 'minimumAge');
$f->label = $this->_('Minimum age (seconds)');
$f->description = $this->_('Start recording history for a page this many seconds after it has been created. At least 2 or more seconds recommended.');
$f->notes = sprintf($this->_('Default: %s'), self::minimumAge);
$f->val((int) $this->minimumAge);
$f->required = true;
$inputfields->add($f);
$query = $this->wire()->database->query('SELECT COUNT(*) FROM ' . self::dbTableName);
$numPaths = (int) $query->fetchColumn();
$query->closeCursor();
if($numPaths) {
$input = $this->wire()->input;
$deleteNow = $input->post('_deleteAll') && $input->post('_deleteAllConfirm') === "$numPaths";
if($deleteNow) {
$this->deleteAllPathHistory(true);
$inputfields->message(sprintf($this->_('Deleted %d historical page paths'), $numPaths));
$numPaths = 0;
}
/** @var InputfieldCheckbox $f */
$f = $modules->get('InputfieldCheckbox');
$f->attr('name', '_deleteAll');
$f->attr('value', 1);
$f->label = $this->_('Delete all page path history?');
$f->description = sprintf($this->_('There are currently %d historical page paths in the database.'), $numPaths);
$f->collapsed = Inputfield::collapsedYes;
$inputfields->add($f);
/** @var InputfieldCheckbox $f */
$f = $modules->get('InputfieldCheckbox');
$f->attr('name', '_deleteAllConfirm');
$f->attr('value', 1);
$f->label = $this->_('Are you sure?');
$f->description = $this->_('This information is used for automatic redirects and more. It cannot be recovered once deleted. Check the box to confirm you really want to do this.');
$f->showIf = '_deleteAll=1';
$f->val($numPaths);
$inputfields->add($f);
}
}
}