dokuwiki/inc/pageutils.php

b625487dSandi<?php
a5752066Sjpedryc
b625487dSandi/**
b625487dSandi * Utilities for handling pagenames
b625487dSandi *
b625487dSandi * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
b625487dSandi * @author     Andreas Gohr <andi@splitbrain.org>
1380fc45SAndreas Gohr * @todo       Combine similar functions like {wiki,media,meta}FN()
b625487dSandi */
d4f83172SAndreas Gohr
24870174SAndreas Gohruse dokuwiki\Utf8\PhpString;
24870174SAndreas Gohruse dokuwiki\Utf8\Clean;
24870174SAndreas Gohruse dokuwiki\File\Resolver;
24870174SAndreas Gohruse dokuwiki\Extension\Event;
0c3a5702SAndreas Gohruse dokuwiki\ChangeLog\MediaChangeLog;
0c3a5702SAndreas Gohruse dokuwiki\ChangeLog\PageChangeLog;
2cd6cc0aSAndreas Gohruse dokuwiki\File\MediaResolver;
2cd6cc0aSAndreas Gohruse dokuwiki\File\PageResolver;
0c3a5702SAndreas Gohr
/**
 * Fetch an ID from the request
 *
 * Reads the ID from the request variable named by $param. When that is
 * empty and userewrite is set to 2, the ID is extracted from the request
 * URI (or PATH_INFO) instead.
 *
 * An ID ending in a namespace separator (':' or, with useslash, '/') is
 * resolved to a page inside that namespace. When the current action is
 * 'show', a redirect to the resolved page is issued through send_redirect().
 *
 * For $param='id' $conf['start'] is returned if no id was found.
 * If the second parameter is true (default) the ID is cleaned.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param string $param  the $_REQUEST variable name, default 'id'
 * @param bool   $clean  if true, ID is cleaned
 * @return string
 */
function getID($param = 'id', $clean = true)
{
    /** @var Input $INPUT */
    global $INPUT;
    global $conf;
    global $ACT;

    $id = $INPUT->str($param);

    // construct page id from request URI
    // Compare against the empty string instead of using empty(): "0" is a
    // valid page id and must not be replaced by whatever the URI yields.
    if ((string) $id === '' && $conf['userewrite'] == 2) {
        $request = $INPUT->server->str('REQUEST_URI');
        $script = '';

        // get the script URL
        if ($conf['basedir']) {
            // everything but the page dispatcher lives below lib/exe/
            $relpath = '';
            if ($param != 'id') {
                $relpath = 'lib/exe/';
            }
            $script = $conf['basedir'] . $relpath .
                PhpString::basename($INPUT->server->str('SCRIPT_FILENAME'));
        } elseif ($INPUT->server->str('PATH_INFO')) {
            // PATH_INFO already excludes the script part, so $script stays empty
            $request = $INPUT->server->str('PATH_INFO');
        } elseif ($INPUT->server->str('SCRIPT_NAME')) {
            $script = $INPUT->server->str('SCRIPT_NAME');
        } elseif ($INPUT->server->str('DOCUMENT_ROOT') && $INPUT->server->str('SCRIPT_FILENAME')) {
            // derive the script URL by cutting the document root off the file path
            $script = preg_replace(
                '/^' . preg_quote($INPUT->server->str('DOCUMENT_ROOT'), '/') . '/',
                '',
                $INPUT->server->str('SCRIPT_FILENAME')
            );
            $script = '/' . $script;
        }

        // clean script and request (fixes a windows problem)
        $script  = preg_replace('/\/\/+/', '/', $script);
        $request = preg_replace('/\/\/+/', '/', $request);

        // remove script URL and query string to gain the id
        if (preg_match('/^' . preg_quote($script, '/') . '(.*)/', $request, $match)) {
            $id = preg_replace('/\?.*/', '', $match[1]);
        }
        $id = urldecode($id);
        // strip leading slashes
        $id = preg_replace('!^/+!', '', $id);
    }

    // Namespace autolinking from URL
    if (str_ends_with($id, ':') || ($conf['useslash'] && str_ends_with($id, '/'))) {
        if (page_exists($id . $conf['start'])) {
            // start page inside namespace
            $id .= $conf['start'];
        } elseif (page_exists($id . noNS(cleanID($id)))) {
            // page named like the NS inside the NS
            $id .= noNS(cleanID($id));
        } elseif (page_exists($id)) {
            // page like namespace exists
            $id = substr($id, 0, -1);
        } else {
            // fall back to default
            $id .= $conf['start'];
        }
        if (isset($ACT) && $ACT === 'show') {
            // keep all other query parameters, only the id is replaced
            $urlParameters = $_GET;
            if (isset($urlParameters['id'])) {
                unset($urlParameters['id']);
            }
            send_redirect(wl($id, $urlParameters, true, '&'));
        }
    }
    if ($clean) $id = cleanID($id);
    if ($id === '' && $param == 'id') $id = $conf['start'];

    return $id;
}
b625487dSandi
/**
 * Remove unwanted chars from ID
 *
 * Lowercases the ID, normalises the namespace separators, optionally
 * romanizes/deaccents it (depending on $conf['deaccent'] or $ascii), strips
 * special characters and collapses repeated or dangling separators.
 *
 * Results of non-ASCII-forced calls are memoized in the global
 * $cache_cleanid, keyed by the raw ID.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param  string  $raw_id    The pageid to clean
 * @param  boolean $ascii     Force ASCII
 * @return string cleaned id
 */
function cleanID($raw_id, $ascii = false)
{
    global $conf;
    global $cache_cleanid;
    static $sepcharpat = null;

    $cacheKey = (string) $raw_id;

    // serve from the memory cache when possible (forced ASCII is never cached)
    if (!$ascii && isset($cache_cleanid[$cacheKey])) {
        return $cache_cleanid[$cacheKey];
    }

    $sepchar = $conf['sepchar'];
    if ($sepcharpat === null) {
        // the pattern is built on first use only and then reused
        $sepcharpat = '#\\' . $sepchar . '+#';
    }

    $id = PhpString::strtolower(trim($cacheKey));

    // alternative namespace separators: ';' always maps to ':', '/' maps to
    // ':' only when useslash is enabled and to the separator char otherwise
    $slashTarget = $conf['useslash'] ? ':' : $sepchar;
    $id = strtr($id, ';/', ':' . $slashTarget);

    if ($conf['deaccent'] == 2 || $ascii) {
        $id = Clean::romanize($id);
    }
    if ($conf['deaccent'] || $ascii) {
        $id = Clean::deaccent($id, -1);
    }

    // remove specials
    $id = Clean::stripspecials($id, $sepchar, '\*');

    if ($ascii) {
        $id = Clean::strip($id);
    }

    // clean up: collapse separator runs and colon runs, trim the edges and
    // remove separators directly next to a colon
    $id = preg_replace($sepcharpat, $sepchar, $id);
    $id = preg_replace('#:+#', ':', $id);
    $id = trim($id, ':._-');
    $id = preg_replace('#:[:\._\-]+#', ':', $id);
    $id = preg_replace('#[:\._\-]+:#', ':', $id);

    if (!$ascii) {
        $cache_cleanid[$cacheKey] = $id;
    }
    return $id;
}
b625487dSandi
/**
 * Return the namespace part of a wiki ID
 *
 * The namespace is everything in front of the last colon.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param string $id
 * @return string|false the namespace part or false if the given ID has no namespace (root)
 */
function getNS($id)
{
    $id = (string) $id;
    $lastColon = strrpos($id, ':');

    return $lastColon === false ? false : substr($id, 0, $lastColon);
}
b625487dSandi
/**
 * Returns the ID without the namespace
 *
 * Everything after the last colon is returned. A value without any colon is
 * handed back untouched, so non-string input such as false keeps its type.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param string $id
 * @return string
 */
function noNS($id)
{
    // Cast for the lookup only: passing null to strrpos() is deprecated as of
    // PHP 8.1. getNS() applies the same cast.
    $pos = strrpos((string) $id, ':');
    if ($pos === false) {
        // return the original value, not the cast one
        return $id;
    }
    return substr((string) $id, $pos + 1);
}
1a84a0f3SAnika Henke
/**
 * Returns the current namespace
 *
 * This is the innermost namespace of the ID: the namespace part is
 * determined with getNS() and its last segment is taken with noNS().
 *
 * @author Nathan Fritz <fritzn@crown.edu>
 *
 * @param string $id
 * @return string|false false is passed through when the ID has no namespace
 */
function curNS($id)
{
    $namespace = getNS($id);

    return noNS($namespace);
}
1a84a0f3SAnika Henke
/**
 * Returns the ID without the namespace or current namespace for 'start' pages
 *
 * When the page name is empty or equals $conf['start'], the name of the
 * innermost namespace is used instead. If there is no such namespace either,
 * $conf['start'] is returned.
 *
 * @author Nathan Fritz <fritzn@crown.edu>
 *
 * @param string $id
 * @return string
 */
function noNSorNS($id)
{
    global $conf;

    $name = noNS($id);
    $needsNamespace = ($name === $conf['start'] || $name === false || $name === '');
    if (!$needsNamespace) {
        return $name;
    }

    $name = curNS($id);
    if ($name === false || $name === '') {
        // neither a usable page name nor a namespace
        return $conf['start'];
    }

    return $name;
}
4ceab83fSAndreas Gohr
/**
 * Creates a XHTML valid linkid from a given headline title
 *
 * The title is cleaned like a page ID, colons and dots are removed and
 * leading digits, underscores and dashes are stripped. If nothing is left,
 * 'section' plus the digits of the headline is used.
 *
 * When $check is an array, the returned ID is made unique against it by
 * appending a counter, and the ID is appended to $check.
 *
 * @param string  $title   The headline title
 * @param array|bool   $check   Existing IDs
 * @return string the title
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 */
function sectionID($title, &$check)
{
    $cleaned  = str_replace([':', '.'], '', cleanID($title));
    $stripped = ltrim($cleaned, '0123456789_-');

    $title = empty($stripped)
        ? 'section' . preg_replace('/[^0-9]+/', '', $cleaned) // keep numbers from headline
        : $stripped;

    if (!is_array($check)) {
        return $title;
    }

    // append 1, 2, 3, ... until the ID is not in use yet
    $unique = $title;
    for ($counter = 1; in_array($unique, $check); $counter++) {
        $unique = $title . $counter;
    }
    $check[] = $unique;

    return $unique;
}
4ceab83fSAndreas Gohr
/**
 * Wiki page existence check
 *
 * Parameters as for wikiFN. Anything from the first '#' on is ignored.
 * When both a revision and $date_at are given, the revision is first mapped
 * through PageChangeLog::getLastRevisionAt().
 *
 * @author Chris Smith <chris@jalakai.co.uk>
 *
 * @param string $id page id
 * @param string|int $rev empty or revision timestamp
 * @param bool $clean flag indicating that $id should be cleaned (see wikiFN as well)
 * @param bool $date_at
 * @return bool exists?
 */
function page_exists($id, $rev = '', $clean = true, $date_at = false)
{
    // only the part in front of a section anchor identifies the page (#3608)
    [$id] = explode('#', $id, 2);

    if ($rev !== '' && $date_at) {
        $changelog = new PageChangeLog($id);
        $resolved  = $changelog->getLastRevisionAt($rev);
        if ($resolved !== false) {
            $rev = $resolved;
        }
    }

    $path = wikiFN($id, $rev, $clean);
    return file_exists($path);
}
103c256aSChris Smith
/**
 * Media existence check
 *
 * When both a revision and $date_at are given, the revision is first mapped
 * through MediaChangeLog::getLastRevisionAt().
 *
 * @param string $id media id
 * @param string|int $rev empty or revision timestamp
 * @param bool $clean flag indicating that $id should be cleaned (see mediaFN as well)
 * @param bool $date_at
 * @return bool exists?
 */
function media_exists($id, $rev = '', $clean = true, $date_at = false)
{
    $lookupByDate = ($rev !== '' && $date_at);
    if ($lookupByDate) {
        $resolved = (new MediaChangeLog($id))->getLastRevisionAt($rev);
        if ($resolved !== false) {
            $rev = $resolved;
        }
    }

    $path = mediaFN($id, $rev, $clean);
    return file_exists($path);
}
5c844bb3SAndreas Gohr
/**
 * Returns the full path to the datafile specified by ID and optional revision
 *
 * The filename is encoded through utf8_encodeFN(). Computed paths are
 * memoized per ID and revision in the global $cache_wikifn.
 *
 * @param  $raw_id  string   id of wikipage
 * @param  $rev     int|string   page revision, empty string for current
 * @param  $clean   bool     flag indicating that $raw_id should be cleaned.  Only set to false
 *                           when $id is guaranteed to have been cleaned already.
 * @return string full path
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 */
function wikiFN($raw_id, $rev = '', $clean = true)
{
    global $conf;
    global $cache_wikifn;

    $id = $clean ? cleanID($raw_id) : $raw_id;
    $id = str_replace(':', '/', $id);

    if (isset($cache_wikifn[$id][$rev])) {
        return $cache_wikifn[$id][$rev];
    }

    if (empty($rev)) {
        // current version
        $fn = $conf['datadir'] . '/' . utf8_encodeFN($id) . '.txt';
    } else {
        // old revision
        $fn = $conf['olddir'] . '/' . utf8_encodeFN($id) . '.' . $rev . '.txt';
        if ($conf['compression']) {
            // Both compressions must stay readable, so prefer whichever file
            // exists. If none exists yet, take the configured extension.
            $suffix = '.' . $conf['compression'];
            foreach (['.gz', '.bz2'] as $known) {
                if (file_exists($fn . $known)) {
                    $suffix = $known;
                    break;
                }
            }
            $fn .= $suffix;
        }
    }

    $cache_wikifn[$id][$rev] = $fn;
    return $fn;
}
b625487dSandi
/**
 * Returns the full path to the file for locking the page while editing.
 *
 * The file name is the md5 hash of the cleaned page id plus '.lock'.
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 *
 * @param string $id page id
 * @return string full path
 */
function wikiLockFN($id)
{
    global $conf;

    $hash = md5(cleanID($id));
    return $conf['lockdir'] . '/' . $hash . '.lock';
}
c9b4bd1eSBen Coburn
c9b4bd1eSBen Coburn
/**
 * Returns the full path to the meta file specified by ID and extension
 *
 * The ID is cleaned and its namespaces become directories below
 * $conf['metadir'].
 *
 * @author Steven Danz <steven-danz@kc.rr.com>
 *
 * @param string $id   page id
 * @param string $ext  file extension
 * @return string full path
 */
function metaFN($id, $ext)
{
    global $conf;

    $relative = str_replace(':', '/', cleanID($id));
    return $conf['metadir'] . '/' . utf8_encodeFN($relative) . $ext;
}
b158d625SSteven Danz
/**
 * Returns the full path to the media's meta file specified by ID and extension
 *
 * The ID is cleaned and its namespaces become directories below
 * $conf['mediametadir'].
 *
 * @author Kate Arzamastseva <pshns@ukr.net>
 *
 * @param string $id   media id
 * @param string $ext  extension of media
 * @return string
 */
function mediaMetaFN($id, $ext)
{
    global $conf;

    $relative = str_replace(':', '/', cleanID($id));
    return $conf['mediametadir'] . '/' . utf8_encodeFN($relative) . $ext;
}
e4f389efSKate Arzamastseva
/**
 * Returns an array of full paths to all metafiles of a given ID
 *
 * @author Esther Brunner <esther@kaffeehaus.ch>
 * @author Michael Hamann <michael@content-space.de>
 *
 * @param string $id page id
 * @return array
 */
function metaFiles($id)
{
    $basename = metaFN($id, '');

    // GLOB_MARK appends a slash to directories, which the filter below rejects
    $found = glob($basename . '.*', GLOB_MARK);
    if (!$found) {
        return [];
    }

    // Keep only "<basename>.<ext>": this drops files like foo.bar.meta when
    // $id == 'foo'.
    $onlyDirectExtensions = '/^' . preg_quote($basename, '/') . '\.[^.\/]*$/u';
    return preg_grep($onlyDirectExtensions, $found);
}
e1f3d9e1SEsther Brunner
/**
 * Returns the full path to the mediafile specified by ID
 *
 * The filename is encoded through utf8_encodeFN(). For an old revision the
 * path lies below $conf['mediaolddir'] and the integer revision is inserted
 * in front of the file extension.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @author Kate Arzamastseva <pshns@ukr.net>
 *
 * @param string     $id  media id
 * @param string|int $rev empty string or revision timestamp
 * @param bool $clean
 *
 * @return string full path
 */
function mediaFN($id, $rev = '', $clean = true)
{
    global $conf;

    if ($clean) {
        $id = cleanID($id);
    }
    $id = str_replace(':', '/', $id);

    if (empty($rev)) {
        return $conf['mediadir'] . '/' . utf8_encodeFN($id);
    }

    // NOTE(review): element 0 of mimetype() is used as the file extension
    // here - confirm against mimetype()
    $mime      = mimetype($id);
    $extension = $mime[0];
    // cut off the extension together with its leading dot
    $name = substr($id, 0, -(strlen($extension) + 1));

    return $conf['mediaolddir'] . '/' . utf8_encodeFN($name . '.' . ((int) $rev) . '.' . $extension);
}
b625487dSandi
/**
 * Returns the full filepath to a localized file
 *
 * Looked up in this order: the local override below DOKU_CONF, the bundled
 * file for the configured language, and finally the English file (which is
 * returned without an existence check).
 *
 * @param  string $id  The id of the local file
 * @param  string $ext The file extension (usually txt)
 * @return string full filepath to localized file
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 */
function localeFN($id, $ext = 'txt')
{
    global $conf;

    $name = $id . '.' . $ext;

    $override = DOKU_CONF . 'lang/' . $conf['lang'] . '/' . $name;
    if (file_exists($override)) {
        return $override;
    }

    $bundled = DOKU_INC . 'inc/lang/' . $conf['lang'] . '/' . $name;
    if (file_exists($bundled)) {
        return $bundled;
    }

    // fall back to english
    return DOKU_INC . 'inc/lang/en/' . $name;
}
b625487dSandi
/**
 * Resolve relative paths in IDs
 *
 * Do not call directly, use resolve_mediaid or resolve_pageid
 * instead
 *
 * Partly based on a cleanPath function found at
 * http://php.net/manual/en/function.realpath.php#57016
 *
 * @deprecated 2020-09-30
 * @param string $ns     namespace which is context of id
 * @param string $id     relative id
 * @param bool   $clean  flag indicating that id should be cleaned
 * @return string
 */
function resolve_id($ns, $id, $clean = true)
{
    global $conf;
    dbg_deprecated(Resolver::class . ' and its children');

    // some pre cleaning for useslash:
    if ($conf['useslash']) {
        $id = str_replace('/', ':', $id);
    }

    $isRelative = $id && $id[0] == '.';

    if ($isRelative) {
        // normalize initial dots without a colon
        $id = preg_replace('/^((\.+:)*)(\.+)(?=[^:\.])/', '\1\3:', $id);
        // prepend the current namespace
        $id = $ns . ':' . $id;

        // cleanup relatives by walking the segments and keeping a stack
        $segments = explode(':', $id);
        $stack    = [];
        if (!$segments[0]) {
            // keep a leading colon
            $stack[] = '';
        }
        foreach ($segments as $segment) {
            if ($segment == '..') {
                // Go one level up. If there is nothing left to pop (or we are
                // already above the root), remember the '..' instead.
                if (end($stack) == '..' || !array_pop($stack)) {
                    $stack[] = '..';
                }
            } elseif ($segment && $segment != '.') {
                $stack[] = $segment;
            }
        }
        if (!end($segments)) {
            // keep a trailing colon
            $stack[] = '';
        }
        $id = implode(':', $stack);
    } elseif ($ns !== false && strpos($id, ':') === false) {
        // if link contains no namespace, add current namespace (if any)
        $id = $ns . ':' . $id;
    }

    return $clean ? cleanID($id) : $id;
}
c4e0e4a1SAndreas Gohr
/**
 * Returns a full media id
 *
 * Thin wrapper around MediaResolver. The result is written back to the
 * reference parameters.
 *
 * @param string $ns namespace which is context of id
 * @param string &$media (reference) relative media id, updated to resolved id
 * @param bool &$exists (reference) updated with existence of media
 * @param int|string $rev
 * @param bool $date_at
 * @deprecated 2020-09-30
 */
function resolve_mediaid($ns, &$media, &$exists, $rev = '', $date_at = false)
{
    dbg_deprecated(MediaResolver::class);

    // the resolver expects a context id, so a dummy name is placed in $ns
    $context = $ns . ':deprecated';
    $media   = (new MediaResolver($context))->resolveId($media, $rev, $date_at);
    $exists  = media_exists($media, $rev, false, $date_at);
}
b625487dSandi
/**
 * Returns a full page id
 *
 * Thin wrapper around PageResolver. The result is written back to the
 * reference parameters.
 *
 * @deprecated 2020-09-30
 * @param string $ns namespace which is context of id
 * @param string &$page (reference) relative page id, updated to resolved id
 * @param bool &$exists (reference) updated with existence of the page
 * @param string $rev
 * @param bool $date_at
 */
function resolve_pageid($ns, &$page, &$exists, $rev = '', $date_at = false)
{
    global $ID;

    dbg_deprecated(PageResolver::class);

    // Usually $ns is the namespace of the current page, so the page itself
    // serves as context. A dummy id inside $ns is used only when a different
    // context namespace was given.
    $context = (getNS($ID) == $ns) ? $ID : $ns . ':deprecated';

    $page   = (new PageResolver($context))->resolveId($page, $rev, $date_at);
    $exists = page_exists($page, $rev, false, $date_at);
}
b625487dSandi
/**
 * Returns the name of a cachefile from given data
 *
 * The file lives in a subdirectory of $conf['cachedir'] named after the
 * first character of the md5 hash. The needed directory is created by this
 * function (via io_makeFileDir())!
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param string $data  This data is used to create a unique md5 name
 * @param string $ext   This is appended to the filename if given
 * @return string       The filename of the cachefile
 */
function getCacheName($data, $ext = '')
{
    global $conf;

    $hash   = md5($data);
    $bucket = substr($hash, 0, 1);
    $file   = $conf['cachedir'] . '/' . $bucket . '/' . $hash . $ext;

    io_makeFileDir($file);
    return $file;
}
98407a7aSandi
/**
 * Checks a pageid against $conf['hidepages']
 *
 * The decision is made through the PAGEUTILS_ID_HIDEPAGE event, with
 * _isHiddenPage() as its default action.
 *
 * @author Andreas Gohr <gohr@cosmocode.de>
 *
 * @param string $id page id
 * @return bool
 */
function isHiddenPage($id)
{
    $eventData = [
        'id' => $id,
        'hidden' => false,
    ];
    Event::createAndTrigger('PAGEUTILS_ID_HIDEPAGE', $eventData, '_isHiddenPage');

    return $eventData['hidden'];
}
fb55b51eSDominik Eckelmann
/**
 * Callback that checks if a page is hidden
 *
 * Sets $data['hidden'] to true when ':' . $data['id'] matches the regular
 * expression in $conf['hidepages']. Nothing is changed when the page is
 * already marked hidden, no pattern is configured or the current action is
 * 'admin'.
 *
 * @param array $data event data    - see isHiddenPage()
 */
function _isHiddenPage(&$data)
{
    global $conf;
    global $ACT;

    $nothingToDo = $data['hidden'] || empty($conf['hidepages']) || $ACT == 'admin';
    if ($nothingToDo) {
        return;
    }

    $pattern = '/' . $conf['hidepages'] . '/ui';
    if (preg_match($pattern, ':' . $data['id'])) {
        $data['hidden'] = true;
    }
}
0dc92c6fSAndreas Gohr
/**
 * Reverse of isHiddenPage
 *
 * @author Andreas Gohr <gohr@cosmocode.de>
 *
 * @param string $id page id
 * @return bool true when isHiddenPage() does not report the page as hidden
 */
function isVisiblePage($id)
{
    $hidden = isHiddenPage($id);

    return !$hidden;
}
0dc92c6fSAndreas Gohr
/**
 * Format an id for output to a user
 *
 * Namespaces are denoted by a trailing ":*". The root namespace is
 * "*". Output is escaped.
 *
 * @author Adrian Lang <lang@cosmocode.de>
 *
 * @param string $id page id
 * @return string
 */
function prettyprint_id($id)
{
    $id = (string) $id;

    // Test for the empty string rather than falsiness: "0" is a valid page id
    // and must not be shown as the root namespace.
    if ($id === '' || $id === ':') {
        return '*';
    }
    if (str_ends_with($id, ':')) {
        $id .= '*';
    }
    return hsc($id);
}
f03fd957SAndreas Gohr
/**
 * Encode a UTF-8 filename to use on any filesystem
 *
 * Uses the 'fnencode' option to determine the encoding: 'utf-8' leaves the
 * name untouched, 'safe' delegates to SafeFN, anything else URL-encodes the
 * name while keeping slashes.
 *
 * When the second parameter is true, a name consisting only of ASCII
 * letters, digits and the characters / _ - . % is returned unchanged.
 * This makes it safe to run the function multiple times on the same string
 * (default is true).
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @see    urlencode
 *
 * @param string $file file name
 * @param bool   $safe if true, only encoded when other characters are detected
 * @return string
 */
function utf8_encodeFN($file, $safe = true)
{
    global $conf;
    $mode = $conf['fnencode'];

    if ($mode == 'utf-8') {
        return $file;
    }

    $looksEncoded = $safe && preg_match('#^[a-zA-Z0-9/_\-\.%]+$#', $file);
    if ($looksEncoded) {
        return $file;
    }

    if ($mode == 'safe') {
        return SafeFN::encode($file);
    }

    // URL encoding, but directory separators have to survive
    return str_replace('%2F', '/', urlencode($file));
}
f03fd957SAndreas Gohr
/**
 * Decode a filename back to UTF-8
 *
 * Uses the 'fnencode' option to determine the encoding: 'utf-8' leaves the
 * name untouched, 'safe' delegates to SafeFN, anything else URL-decodes it.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @see    urldecode
 *
 * @param string $file file name
 * @return string
 */
function utf8_decodeFN($file)
{
    global $conf;

    switch ($conf['fnencode']) {
        case 'utf-8':
            return $file;
        case 'safe':
            return SafeFN::decode($file);
        default:
            return urldecode($file);
    }
}
f03fd957SAndreas Gohr
/**
 * Find a page in the current namespace (determined from $ID) or any
 * higher namespace that can be accessed by the current user,
 * this condition can be overridden by an optional parameter.
 *
 * The namespaces are tried from the innermost one up to the root.
 *
 * Used for sidebars, but can be used for other stuff as well
 *
 * @todo   add event hook
 *
 * @param  string $page the pagename you're looking for
 * @param bool $useacl only return pages readable by the current user, false to ignore ACLs
 * @return false|string the full page id of the found page, false if none
 */
function page_findnearest($page, $useacl = true)
{
    global $ID;

    if ((string) $page === '') {
        return false;
    }

    $ns = getNS($ID);
    while (true) {
        $candidate = cleanID($ns . ':' . $page);
        if (page_exists($candidate) && (!$useacl || auth_quickaclcheck($candidate) >= AUTH_READ)) {
            return $candidate;
        }

        if ($ns === false) {
            // the root namespace was the last one to try
            break;
        }
        $ns = getNS($ns);
    }

    return false;
}