xref: /dokuwiki/inc/pageutils.php (revision 6de3759a1b7a74492845c76e1f0bd1078e2220c7)
1b625487dSandi<?php
2b625487dSandi/**
3b625487dSandi * Utilities for handling pagenames
4b625487dSandi *
5b625487dSandi * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
6b625487dSandi * @author     Andreas Gohr <andi@splitbrain.org>
71380fc45SAndreas Gohr * @todo       Combine similar functions like {wiki,media,meta}FN()
8b625487dSandi */
9b625487dSandi
106c7843b5Sandi/**
11*6de3759aSAndreas Gohr * Fetch the an ID from request
126c7843b5Sandi *
136c7843b5Sandi * Uses either standard $_REQUEST variable or extracts it from
146c7843b5Sandi * the full request URI when userewrite is set to 2
156c7843b5Sandi *
16*6de3759aSAndreas Gohr * Returns $conf['start'] if no id was found and $param is 'id'
176c7843b5Sandi *
186c7843b5Sandi * @author Andreas Gohr <andi@splitbrain.org>
196c7843b5Sandi */
20*6de3759aSAndreas Gohrfunction getID($param='id'){
216c7843b5Sandi  global $conf;
226c7843b5Sandi
23*6de3759aSAndreas Gohr  $id = cleanID($_REQUEST[$param]);
246c7843b5Sandi
256c7843b5Sandi  //construct page id from request URI
266c7843b5Sandi  if(empty($id) && $conf['userewrite'] == 2){
276c7843b5Sandi    //get the script URL
286c7843b5Sandi    if($conf['basedir']){
29*6de3759aSAndreas Gohr      $script = $conf['basedir'].basedir($_SERVER['SCRIPT_FILENAME']);
306c7843b5Sandi    }elseif($_SERVER['DOCUMENT_ROOT'] && $_SERVER['SCRIPT_FILENAME']){
316c7843b5Sandi      $script = preg_replace ('/^'.preg_quote($_SERVER['DOCUMENT_ROOT'],'/').'/','',
326c7843b5Sandi                              $_SERVER['SCRIPT_FILENAME']);
336c7843b5Sandi      $script = '/'.$script;
346c7843b5Sandi    }else{
356c7843b5Sandi      $script = $_SERVER['SCRIPT_NAME'];
366c7843b5Sandi    }
376c7843b5Sandi
3852339126Sandi    //clean script and request (fixes a windows problem)
3952339126Sandi    $script  = preg_replace('/\/\/+/','/',$script);
4052339126Sandi    $request = preg_replace('/\/\/+/','/',$_SERVER['REQUEST_URI']);
4152339126Sandi
426c7843b5Sandi    //remove script URL and Querystring to gain the id
4352339126Sandi    if(preg_match('/^'.preg_quote($script,'/').'(.*)/',$request, $match)){
446c7843b5Sandi      $id = preg_replace ('/\?.*/','',$match[1]);
456c7843b5Sandi    }
46*6de3759aSAndreas Gohr    $id = urldecode($id);
476c7843b5Sandi    $id = cleanID($id);
486c7843b5Sandi  }
49*6de3759aSAndreas Gohr  if(empty($id) && $param='id') $id = $conf['start'];
506c7843b5Sandi
516c7843b5Sandi  return $id;
526c7843b5Sandi}
53b625487dSandi
54b625487dSandi/**
55b625487dSandi * Remove unwanted chars from ID
56b625487dSandi *
57b625487dSandi * Cleans a given ID to only use allowed characters. Accented characters are
58b625487dSandi * converted to unaccented ones
59b625487dSandi *
60b625487dSandi * @author Andreas Gohr <andi@splitbrain.org>
61b625487dSandi */
62b625487dSandifunction cleanID($id){
63b625487dSandi  global $conf;
64b625487dSandi  global $lang;
65b625487dSandi  $id = trim($id);
66b625487dSandi  $id = utf8_strtolower($id);
67b625487dSandi
68b625487dSandi  //alternative namespace seperator
69b625487dSandi  $id = strtr($id,';',':');
70b625487dSandi  if($conf['useslash']){
71b625487dSandi    $id = strtr($id,'/',':');
72b625487dSandi  }else{
73b625487dSandi    $id = strtr($id,'/','_');
74b625487dSandi  }
75b625487dSandi
76b625487dSandi  if($conf['deaccent']) $id = utf8_deaccent($id,-1);
77b625487dSandi
78b625487dSandi  //remove specials
795c812709Sandi  $id = utf8_stripspecials($id,'_');
80b625487dSandi
81b625487dSandi  //clean up
8206bd9a88Sandi  $id = preg_replace('#_+#','_',$id);
83b625487dSandi  $id = preg_replace('#:+#',':',$id);
84b625487dSandi  $id = trim($id,':._-');
85b625487dSandi  $id = preg_replace('#:[:\._\-]+#',':',$id);
86b625487dSandi
87b625487dSandi  return($id);
88b625487dSandi}
89b625487dSandi
90b625487dSandi/**
91b625487dSandi * Return namespacepart of a wiki ID
92b625487dSandi *
93b625487dSandi * @author Andreas Gohr <andi@splitbrain.org>
94b625487dSandi */
95b625487dSandifunction getNS($id){
96b625487dSandi if(strpos($id,':')!==false){
97b625487dSandi   return substr($id,0,strrpos($id,':'));
98b625487dSandi }
99b625487dSandi return false;
100b625487dSandi}
101b625487dSandi
102b625487dSandi/**
103b625487dSandi * Returns the ID without the namespace
104b625487dSandi *
105b625487dSandi * @author Andreas Gohr <andi@splitbrain.org>
106b625487dSandi */
107b625487dSandifunction noNS($id){
108b625487dSandi  return preg_replace('/.*:/','',$id);
109b625487dSandi}
110b625487dSandi
111b625487dSandi/**
112b625487dSandi * returns the full path to the datafile specified by ID and
113b625487dSandi * optional revision
114b625487dSandi *
115b625487dSandi * The filename is URL encoded to protect Unicode chars
116b625487dSandi *
117b625487dSandi * @author Andreas Gohr <andi@splitbrain.org>
118b625487dSandi */
119b625487dSandifunction wikiFN($id,$rev=''){
120b625487dSandi  global $conf;
121b625487dSandi  $id = cleanID($id);
122b625487dSandi  $id = str_replace(':','/',$id);
123b625487dSandi  if(empty($rev)){
124b625487dSandi    $fn = $conf['datadir'].'/'.utf8_encodeFN($id).'.txt';
125b625487dSandi  }else{
126b625487dSandi    $fn = $conf['olddir'].'/'.utf8_encodeFN($id).'.'.$rev.'.txt';
127b625487dSandi    if($conf['usegzip'] && !@file_exists($fn)){
128b625487dSandi      //return gzip if enabled and plaintext doesn't exist
129b625487dSandi      $fn .= '.gz';
130b625487dSandi    }
131b625487dSandi  }
132b625487dSandi  return $fn;
133b625487dSandi}
134b625487dSandi
135b625487dSandi/**
1361380fc45SAndreas Gohr * returns the full path to the meta file specified by ID and extension
137b158d625SSteven Danz *
138b158d625SSteven Danz * The filename is URL encoded to protect Unicode chars
139b158d625SSteven Danz *
140b158d625SSteven Danz * @author Steven Danz <steven-danz@kc.rr.com>
141b158d625SSteven Danz */
1421380fc45SAndreas Gohrfunction metaFN($id,$ext){
143b158d625SSteven Danz  global $conf;
144b158d625SSteven Danz  $id = cleanID($id);
145b158d625SSteven Danz  $id = str_replace(':','/',$id);
1461380fc45SAndreas Gohr  $fn = $conf['metadir'].'/'.utf8_encodeFN($id).$ext;
147b158d625SSteven Danz  return $fn;
148b158d625SSteven Danz}
149b158d625SSteven Danz
150b158d625SSteven Danz/**
151b625487dSandi * returns the full path to the mediafile specified by ID
152b625487dSandi *
153b625487dSandi * The filename is URL encoded to protect Unicode chars
154b625487dSandi *
155b625487dSandi * @author Andreas Gohr <andi@splitbrain.org>
156b625487dSandi */
157b625487dSandifunction mediaFN($id){
158b625487dSandi  global $conf;
159b625487dSandi  $id = cleanID($id);
160b625487dSandi  $id = str_replace(':','/',$id);
161b625487dSandi    $fn = $conf['mediadir'].'/'.utf8_encodeFN($id);
162b625487dSandi  return $fn;
163b625487dSandi}
164b625487dSandi
165b625487dSandi/**
166b625487dSandi * Returns the full filepath to a localized textfile if local
167b625487dSandi * version isn't found the english one is returned
168b625487dSandi *
169b625487dSandi * @author Andreas Gohr <andi@splitbrain.org>
170b625487dSandi */
171b625487dSandifunction localeFN($id){
172b625487dSandi  global $conf;
173bc3b6aecSandi  $file = DOKU_INC.'inc/lang/'.$conf['lang'].'/'.$id.'.txt';
174b625487dSandi  if(!@file_exists($file)){
175b625487dSandi    //fall back to english
176bc3b6aecSandi    $file = DOKU_INC.'inc/lang/en/'.$id.'.txt';
177b625487dSandi  }
178b625487dSandi  return $file;
179b625487dSandi}
180b625487dSandi
181b625487dSandi/**
182b625487dSandi * Returns a full media id
183b625487dSandi *
184b625487dSandi * @author Andreas Gohr <andi@splitbrain.org>
185b625487dSandi */
18637e34a5eSandifunction resolve_mediaid($ns,&$page,&$exists){
187b625487dSandi  global $conf;
18837e34a5eSandi
189b625487dSandi  //if links starts with . add current namespace
190b625487dSandi  if($page{0} == '.'){
191b625487dSandi    $page = $ns.':'.substr($page,1);
192b625487dSandi  }
193b625487dSandi
194b625487dSandi  //if link contains no namespace. add current namespace (if any)
195b625487dSandi  if($ns !== false && strpos($page,':') === false){
196b625487dSandi    $page = $ns.':'.$page;
197b625487dSandi  }
198b625487dSandi
199b625487dSandi  $page   = cleanID($page);
200b625487dSandi  $file   = mediaFN($page);
201b625487dSandi  $exists = @file_exists($file);
202b625487dSandi}
203b625487dSandi
204b625487dSandi/**
205b625487dSandi * Returns a full page id
206b625487dSandi *
207b625487dSandi * @author Andreas Gohr <andi@splitbrain.org>
208b625487dSandi */
20937e34a5eSandifunction resolve_pageid($ns,&$page,&$exists){
210b625487dSandi  global $conf;
2110b7c14c2Sandi  $exists = false;
212b625487dSandi
213b625487dSandi  //if links starts with . add current namespace
214b625487dSandi  if($page{0} == '.'){
215b625487dSandi    $page = $ns.':'.substr($page,1);
216b625487dSandi  }
217b625487dSandi
218b625487dSandi  //if link contains no namespace. add current namespace (if any)
219b625487dSandi  if($ns !== false && strpos($page,':') === false){
220b625487dSandi    $page = $ns.':'.$page;
221b625487dSandi  }
222b625487dSandi
223b625487dSandi  //keep hashlink if exists then clean both parts
224b625487dSandi  list($page,$hash) = split('#',$page,2);
225b625487dSandi  $page = cleanID($page);
226b625487dSandi  $hash = cleanID($hash);
227b625487dSandi
228b625487dSandi  $file = wikiFN($page);
229b625487dSandi
230b625487dSandi  //check alternative plural/nonplural form
231b625487dSandi  if(!@file_exists($file)){
232b625487dSandi    if( $conf['autoplural'] ){
233b625487dSandi      if(substr($page,-1) == 's'){
234b625487dSandi        $try = substr($page,0,-1);
235b625487dSandi      }else{
236b625487dSandi        $try = $page.'s';
237b625487dSandi      }
238b625487dSandi      if(@file_exists(wikiFN($try))){
239b625487dSandi        $page   = $try;
240b625487dSandi        $exists = true;
241b625487dSandi      }
242b625487dSandi    }
243b625487dSandi  }else{
244b625487dSandi    $exists = true;
245b625487dSandi  }
246b625487dSandi
247b625487dSandi  //add hash if any
248b2d7d3f2Sandi  if(!empty($hash)) $page .= '#'.$hash;
249b625487dSandi}
250b625487dSandi
25198407a7aSandi/**
25298407a7aSandi * Returns the name of a cachefile from given data
25398407a7aSandi *
25498407a7aSandi * The needed directory is created by this function!
25598407a7aSandi *
25698407a7aSandi * @author Andreas Gohr <andi@splitbrain.org>
25798407a7aSandi *
25898407a7aSandi * @param string $data  This data is used to create a unique md5 name
25998407a7aSandi * @param string $ext   This is appended to the filename if given
26098407a7aSandi * @return string       The filename of the cachefile
26198407a7aSandi */
26298407a7aSandifunction getCacheName($data,$ext=''){
26398407a7aSandi  global $conf;
26498407a7aSandi  $md5  = md5($data);
26598407a7aSandi  $file = $conf['cachedir'].'/'.$md5{0}.'/'.$md5.$ext;
26698407a7aSandi  io_makeFileDir($file);
26798407a7aSandi  return $file;
26898407a7aSandi}
26998407a7aSandi
270b625487dSandi//Setup VIM: ex: et ts=2 enc=utf-8 :
271