<?php
/**
 * Utilities for handling pagenames
 *
 * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
 * @author     Andreas Gohr <andi@splitbrain.org>
 * @todo       Combine similar functions like {wiki,media,meta}FN()
 */

/**
 * Fetch an ID from the request
 *
 * Uses either the standard $_REQUEST variable or extracts it from
 * the full request URI when userewrite is set to 2
 *
 * For $param='id' $conf['start'] is returned if no id was found.
 * If the second parameter is true (default) the ID is cleaned.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  string  $param  Name of the request parameter holding the ID
 * @param  boolean $clean  Run the result through cleanID()
 * @return string  The ID found, or $conf['start'] for an empty 'id'
 */
function getID($param='id',$clean=true){
  global $conf;

  // the parameter may be missing entirely - don't trigger a notice then
  $id = isset($_REQUEST[$param]) ? $_REQUEST[$param] : null;

  //construct page id from request URI
  if(empty($id) && $conf['userewrite'] == 2){
    //get the script URL
    if($conf['basedir']){
      $relpath = '';
      if($param != 'id') {
        $relpath = 'lib/exe/';
      }
      $script = $conf['basedir'].$relpath.basename($_SERVER['SCRIPT_FILENAME']);
    }elseif($_SERVER['DOCUMENT_ROOT'] && $_SERVER['SCRIPT_FILENAME']){
      $script = preg_replace ('/^'.preg_quote($_SERVER['DOCUMENT_ROOT'],'/').'/','',
                              $_SERVER['SCRIPT_FILENAME']);
      $script = '/'.$script;
    }else{
      $script = $_SERVER['SCRIPT_NAME'];
    }

    //clean script and request (fixes a windows problem)
    $script  = preg_replace('/\/\/+/','/',$script);
    $request = preg_replace('/\/\/+/','/',$_SERVER['REQUEST_URI']);

    //remove script URL and Querystring to gain the id
    if(preg_match('/^'.preg_quote($script,'/').'(.*)/',$request, $match)){
      $id = preg_replace ('/\?.*/','',$match[1]);
    }
    // $id is still null when the request did not match the script URL
    $id = urldecode((string) $id);
    //strip leading slashes
    $id = preg_replace('!^/+!','',$id);
  }
  if($clean) $id = cleanID($id);
  if(empty($id) && $param=='id') $id = $conf['start'];

  return $id;
}

/**
 * Remove unwanted chars from ID
 *
 * Cleans a given ID to only use allowed characters. Depending on
 * $conf['deaccent'] (or when $ascii is set) accented characters are
 * romanized and/or converted to unaccented ones
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  string  $id    The pageid to clean
 * @param  boolean $ascii Force ASCII
 * @return string  The cleaned ID
 */
function cleanID($id,$ascii=false){
  global $conf;
  global $lang;
  static $sepcharpat = null;

  $sepchar = $conf['sepchar'];
  if($sepcharpat === null){
    // build the pattern only once per request; quote the separator so it is
    // always matched literally
    $sepcharpat = '#'.preg_quote($sepchar,'#').'+#';
  }

  // callers may hand in null/false (e.g. getNS() of a root page)
  $id = trim((string) $id);
  $id = utf8_strtolower($id);

  //alternative namespace separator
  $id = strtr($id,';',':');
  if($conf['useslash']){
    $id = strtr($id,'/',':');
  }else{
    $id = strtr($id,'/',$sepchar);
  }

  if($conf['deaccent'] == 2 || $ascii) $id = utf8_romanize($id);
  if($conf['deaccent'] || $ascii) $id = utf8_deaccent($id,-1);

  //remove specials
  $id = utf8_stripspecials($id,$sepchar,'\*');

  if($ascii) $id = utf8_strip($id);

  //clean up: collapse repeated separators and colons, then strip
  //separator-like characters from the ends and after each colon
  $id = preg_replace($sepcharpat,$sepchar,$id);
  $id = preg_replace('#:+#',':',$id);
  $id = trim($id,':._-');
  $id = preg_replace('#:[:\._\-]+#',':',$id);

  return($id);
}

/**
 * Return namespacepart of a wiki ID
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  string $id
 * @return string|false Everything before the last colon, false if the
 *                      ID contains no colon
 */
function getNS($id){
  $pos = strrpos($id,':');
  if($pos!==false){
    return substr($id,0,$pos);
  }
  return false;
}

/**
 * Returns the ID without the namespace
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  string $id
 * @return string Everything after the last colon
 */
function noNS($id){
  return preg_replace('/.*:/','',$id);
}

/**
 * returns the full path to the datafile specified by ID and
 * optional revision
 *
 * The filename is URL encoded to protect Unicode chars
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  string $id  The page ID (is cleaned here)
 * @param  string $rev Revision; when given the path points into
 *                     $conf['olddir'] instead of $conf['datadir']
 * @return string
 */
function wikiFN($id,$rev=''){
  global $conf;
  $id = cleanID($id);
  $id = str_replace(':','/',$id);
  if(empty($rev)){
    $fn = $conf['datadir'].'/'.utf8_encodeFN($id).'.txt';
  }else{
    $fn = $conf['olddir'].'/'.utf8_encodeFN($id).'.'.$rev.'.txt';
    if($conf['usegzip'] && !@file_exists($fn)){
      //return gzip if enabled and plaintext doesn't exist
      $fn .= '.gz';
    }
  }
  return $fn;
}

/**
 * Returns the full path to the file for locking the page while editing.
 *
 * The lock file is named after the SHA1 hash of the cleaned ID.
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 * @param  string $id
 * @return string
 */
function wikiLockFN($id) {
  global $conf;
  return $conf['lockdir'].'/'.sha1(cleanID($id)).'.lock';
}


/**
 * returns the full path to the meta file specified by ID and extension
 *
 * The filename is URL encoded to protect Unicode chars
 *
 * @author Steven Danz <steven-danz@kc.rr.com>
 * @param  string $id  The page ID (is cleaned here)
 * @param  string $ext Appended verbatim to the encoded filename
 * @return string
 */
function metaFN($id,$ext){
  global $conf;
  $id = cleanID($id);
  $id = str_replace(':','/',$id);
  $fn = $conf['metadir'].'/'.utf8_encodeFN($id).$ext;
  return $fn;
}

/**
 * returns an array of full paths to all metafiles of a given ID
 *
 * All non-directory entries of the namespace's meta directory whose
 * name starts with "<pagename>." are returned.
 *
 * @author Esther Brunner <esther@kaffeehaus.ch>
 * @param  string $id
 * @return array  List of file paths, empty if the directory can't be opened
 */
function metaFiles($id){
  $name   = noNS($id);
  // metaFN() returns the directory without a trailing slash for namespaced
  // ids but with one for root pages - normalize to exactly one slash
  $dir    = rtrim(metaFN(getNS($id),''),'/').'/';
  $files  = array();

  $dh = @opendir($dir);
  if(!$dh) return $files;
  while(($file = readdir($dh)) !== false){
    if(strpos($file,$name.'.') === 0 && !is_dir($dir.$file))
      $files[] = $dir.$file;
  }
  closedir($dh);

  return $files;
}

/**
 * returns the full path to the mediafile specified by ID
 *
 * The filename is URL encoded to protect Unicode chars
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  string $id The media ID (is cleaned here)
 * @return string
 */
function mediaFN($id){
  global $conf;
  $id = cleanID($id);
  $id = str_replace(':','/',$id);
  $fn = $conf['mediadir'].'/'.utf8_encodeFN($id);
  return $fn;
}

/**
 * Returns the full filepath to a localized textfile if local
 * version isn't found the english one is returned
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  string $id Base name of the text file (without .txt)
 * @return string
 */
function localeFN($id){
  global $conf;
  $file = DOKU_INC.'inc/lang/'.$conf['lang'].'/'.$id.'.txt';
  if(!@file_exists($file)){
    //fall back to english
    $file = DOKU_INC.'inc/lang/en/'.$id.'.txt';
  }
  return $file;
}

/**
 * Resolve relative paths in IDs
 *
 * Do not call directly use resolve_mediaid or resolve_pageid
 * instead
 *
 * Partly based on a cleanPath function found at
 * http://www.php.net/manual/en/function.realpath.php#57016
 *
 * @author <bart at mediawave dot nl>
 * @param  string|false $ns    The current namespace, false for none
 * @param  string       $id    The (possibly relative) ID
 * @param  boolean      $clean Run the result through cleanID()
 * @return string
 */
function resolve_id($ns,$id,$clean=true){
  // if the id starts with a dot we need to handle the
  // relative stuff
  if($id !== '' && $id[0] == '.'){
    // normalize initial dots without a colon
    $id = preg_replace('/^(\.+)(?=[^:\.])/','\1:',$id);
    // prepend the current namespace
    $id = $ns.':'.$id;

    // cleanup relatives
    // Segments are compared against '' explicitly so that a namespace
    // literally named "0" is not mistaken for an empty segment.
    $result = array();
    $pathA  = explode(':', $id);
    if ($pathA[0] === '') $result[] = '';
    foreach ($pathA AS $key => $dir) {
      if ($dir == '..') {
        if (end($result) == '..') {
          $result[] = '..';
        } else {
          // go one level up; if there was nothing (or only the leading
          // empty marker) to remove, keep the '..'
          $popped = array_pop($result);
          if ($popped === null || $popped === '') {
            $result[] = '..';
          }
        }
      } elseif ($dir !== '' && $dir != '.') {
        $result[] = $dir;
      }
    }
    // keep a trailing colon (namespace link)
    if (end($pathA) === '') $result[] = '';
    $id = implode(':', $result);
  }elseif($ns !== false && strpos($id,':') === false){
    //if link contains no namespace. add current namespace (if any)
    $id = $ns.':'.$id;
  }

  if($clean) $id = cleanID($id);
  return $id;
}

/**
 * Returns a full media id
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  string|false $ns      The current namespace
 * @param  string       &$page   Media ID, replaced by the resolved one
 * @param  boolean      &$exists Set to whether the media file exists
 */
function resolve_mediaid($ns,&$page,&$exists){
  $page   = resolve_id($ns,$page);
  $file   = mediaFN($page);
  $exists = @file_exists($file);
}

/**
 * Returns a full page id
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  string|false $ns      The current namespace
 * @param  string       &$page   Page ID (may carry a #hash), replaced by
 *                               the resolved and cleaned one
 * @param  boolean      &$exists Set to whether the resolved page exists
 */
function resolve_pageid($ns,&$page,&$exists){
  global $conf;
  $exists = false;

  //keep hashlink if exists then clean both parts
  //(pad so that $hash is defined when the link has no '#')
  list($page,$hash) = array_pad(explode('#',$page,2),2,'');
  $hash = cleanID($hash);
  $page = resolve_id($ns,$page,false); // resolve but don't clean, yet

  // get filename (calls clean itself)
  $file = wikiFN($page);

  // if ends with colon we have a namespace link
  if(substr($page,-1) == ':'){
    if(@file_exists(wikiFN($page.$conf['start']))){
      // start page inside namespace
      $page = $page.$conf['start'];
      $exists = true;
    }elseif(@file_exists(wikiFN($page.noNS(cleanID($page))))){
      // page named like the NS inside the NS
      $page = $page.noNS(cleanID($page));
      $exists = true;
    }elseif(@file_exists(wikiFN($page))){
      // page like namespace exists - keep $page as is
      $exists = true;
    }else{
      // fall back to default
      $page = $page.$conf['start'];
    }
  }else{
    //check alternative plural/nonplural form
    if(!@file_exists($file)){
      if( $conf['autoplural'] ){
        if(substr($page,-1) == 's'){
          $try = substr($page,0,-1);
        }else{
          $try = $page.'s';
        }
        if(@file_exists(wikiFN($try))){
          $page   = $try;
          $exists = true;
        }
      }
    }else{
      $exists = true;
    }
  }

  // now make sure we have a clean page
  $page = cleanID($page);

  //add hash if any
  if(!empty($hash)) $page .= '#'.$hash;
}

/**
 * Returns the name of a cachefile from given data
 *
 * The needed directory is created by this function!
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param string $data  This data is used to create a unique md5 name
 * @param string $ext   This is appended to the filename if given
 * @return string       The filename of the cachefile
 */
function getCacheName($data,$ext=''){
  global $conf;
  $md5  = md5($data);
  // first hex digit of the hash is used as subdirectory
  $file = $conf['cachedir'].'/'.$md5[0].'/'.$md5.$ext;
  io_makeFileDir($file);
  return $file;
}

/**
 * Checks a pageid against $conf['hidepages']
 *
 * $conf['hidepages'] is used as a (case insensitive, UTF-8) regular
 * expression and matched against the ID prefixed with a colon.
 *
 * @author Andreas Gohr <gohr@cosmocode.de>
 * @param  string $id
 * @return boolean
 */
function isHiddenPage($id){
  global $conf;
  if(empty($conf['hidepages'])) return false;

  if(preg_match('/'.$conf['hidepages'].'/ui',':'.$id)){
    return true;
  }
  return false;
}

/**
 * Reverse of isHiddenPage
 *
 * @author Andreas Gohr <gohr@cosmocode.de>
 * @param  string $id
 * @return boolean
 */
function isVisiblePage($id){
  return !isHiddenPage($id);
}

/**
 * Checks and sets HTTP headers for conditional HTTP requests
 *
 * Always sends Last-Modified and ETag headers. If the client sent
 * If-Modified-Since and/or If-None-Match and all headers sent match, a
 * 304 status is sent and the script exits. Otherwise the function returns.
 *
 * @author Simon Willison <swillison@gmail.com>
 * @link   http://simon.incutio.com/archive/2003/04/23/conditionalGet
 * @param  int $timestamp Unix timestamp of the last modification
 */
function http_conditionalRequest($timestamp){
  // A PHP implementation of conditional get, see
  //   http://fishbowl.pastiche.org/archives/001132.html
  // HTTP dates must be expressed in GMT, so format with gmdate() instead of
  // relabeling a local time as GMT
  $last_modified = gmdate('D, d M Y H:i:s', $timestamp).' GMT';
  $etag = '"'.md5($last_modified).'"';
  // Send the headers
  header("Last-Modified: $last_modified");
  header("ETag: $etag");
  // See if the client has provided the required headers
  $if_modified_since = isset($_SERVER['HTTP_IF_MODIFIED_SINCE']) ?
      stripslashes($_SERVER['HTTP_IF_MODIFIED_SINCE']) :
      false;
  $if_none_match = isset($_SERVER['HTTP_IF_NONE_MATCH']) ?
      stripslashes($_SERVER['HTTP_IF_NONE_MATCH']) :
      false;
  if (!$if_modified_since && !$if_none_match) {
    return;
  }
  // At least one of the headers is there - check them
  if ($if_none_match && $if_none_match != $etag) {
    return; // etag is there but doesn't match
  }
  if ($if_modified_since && $if_modified_since != $last_modified) {
    return; // if-modified-since is there but doesn't match
  }
  // Nothing has changed since their last request - serve a 304 and exit
  header('HTTP/1.0 304 Not Modified');
  exit;
}

//Setup VIM: ex: et ts=2 enc=utf-8 :