xref: /dokuwiki/inc/pageutils.php (revision 5c8127091e246636c7d712a1db509d596708a532)
1b625487dSandi<?php
2b625487dSandi/**
3b625487dSandi * Utilities for handling pagenames
4b625487dSandi *
5b625487dSandi * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
6b625487dSandi * @author     Andreas Gohr <andi@splitbrain.org>
7b625487dSandi */
8b625487dSandi
/**
 * Fetch the pageid
 *
 * Reads the id from the standard $_REQUEST variable. When that yields
 * nothing and userewrite is set to 2, the id is extracted from the request
 * URI instead, by stripping the script URL from its start and dropping the
 * query string.
 *
 * Returns $conf['start'] if no id was found.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @return string the cleaned page id
 */
function getID(){
  global $conf;

  // a missing or non-string (e.g. id[]=x) parameter counts as "no id given"
  $id = '';
  if(isset($_REQUEST['id']) && !is_array($_REQUEST['id'])){
    $id = $_REQUEST['id'];
  }
  $id = cleanID($id);

  //construct page id from request URI
  if(empty($id) && $conf['userewrite'] == 2){
    //get the script URL
    if(!empty($conf['basedir'])){
      $script = $conf['basedir'].DOKU_SCRIPT;
    }elseif(!empty($_SERVER['DOCUMENT_ROOT']) && !empty($_SERVER['SCRIPT_FILENAME'])){
      // script path relative to the document root, with a leading slash
      $script = preg_replace ('/^'.preg_quote($_SERVER['DOCUMENT_ROOT'],'/').'/','',
                              $_SERVER['SCRIPT_FILENAME']);
      $script = '/'.$script;
    }else{
      $script = $_SERVER['SCRIPT_NAME'];
    }

    //remove script URL and Querystring to gain the id
    $uri = isset($_SERVER['REQUEST_URI']) ? $_SERVER['REQUEST_URI'] : '';
    if(preg_match('/^'.preg_quote($script,'/').'(.*)/', $uri, $match)){
      $id = preg_replace ('/\?.*/','',$match[1]);
    }
    $id = cleanID($id);
  }
  if(empty($id)) $id = $conf['start'];

  return $id;
}
48b625487dSandi
/**
 * Remove unwanted chars from ID
 *
 * Normalizes a given ID: it is trimmed and lowercased, ';' is turned into
 * the namespace separator ':' and '/' into ':' or '_' depending on
 * $conf['useslash']. If $conf['deaccent'] is set the ID is passed through
 * utf8_deaccent(). The ID is then handed to utf8_stripspecials() with '_'
 * as the replacement argument and finally tidied up: runs of '_' and ':'
 * are collapsed and separator characters (':', '.', '_', '-') are removed
 * from both ends of the ID and from both sides of every namespace colon.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param  string $id the raw ID
 * @return string     the cleaned ID
 */
function cleanID($id){
  global $conf;
  $id = trim($id);
  $id = utf8_strtolower($id);

  //alternative namespace separator
  $id = strtr($id,';',':');
  if($conf['useslash']){
    $id = strtr($id,'/',':');
  }else{
    $id = strtr($id,'/','_');
  }

  if($conf['deaccent']) $id = utf8_deaccent($id,-1);

  //remove specials
  $id = utf8_stripspecials($id,'_');

  //clean up
  $id = preg_replace('#_+#','_',$id);
  $id = preg_replace('#:+#',':',$id);
  $id = trim($id,':._-');
  //no separator chars directly after a namespace colon ...
  $id = preg_replace('#:[:\._\-]+#',':',$id);
  //... nor directly in front of one, so every part is trimmed on both sides
  $id = preg_replace('#[:\._\-]+:#',':',$id);

  return($id);
}
84b625487dSandi
/**
 * Return namespacepart of a wiki ID
 *
 * The namespace is everything in front of the last colon. An ID without
 * any colon has no namespace.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param  string $id the wiki ID
 * @return string|false the namespace part, false if the ID contains no colon
 */
function getNS($id){
  $lastColon = strrpos($id,':');
  if($lastColon === false){
    return false;
  }
  return substr($id,0,$lastColon);
}
96b625487dSandi
/**
 * Returns the ID without the namespace
 *
 * Everything up to and including the last colon is stripped. An ID without
 * a colon is returned unchanged.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param  string $id the wiki ID
 * @return string     the ID with the namespace part removed
 */
function noNS($id){
  // greedy match: swallows everything through the last colon
  $nsPrefix = '/.*:/';
  $name     = preg_replace($nsPrefix,'',$id);
  return $name;
}
105b625487dSandi
/**
 * returns the full path to the datafile specified by ID and
 * optional revision
 *
 * Without a revision the file is looked up below $conf['datadir'], with a
 * revision below $conf['olddir'] using a '.<rev>.txt' suffix. For revisions
 * '.gz' is appended when $conf['usegzip'] is set and the plain text file
 * does not exist.
 *
 * The filename is passed through utf8_encodeFN(), which is meant to
 * URL encode it to protect Unicode chars
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param  string $id  the page ID
 * @param  string $rev optional revision, empty for the current version
 * @return string      path of the data file
 */
function wikiFN($id,$rev=''){
  global $conf;
  // namespaces map to directories
  $path = str_replace(':','/',cleanID($id));

  //current version
  if(empty($rev)){
    return $conf['datadir'].'/'.utf8_encodeFN($path).'.txt';
  }

  //old revision
  $old = $conf['olddir'].'/'.utf8_encodeFN($path).'.'.$rev.'.txt';
  if($conf['usegzip'] && !@file_exists($old)){
    //return gzip if enabled and plaintext doesn't exist
    $old .= '.gz';
  }
  return $old;
}
129b625487dSandi
/**
 * returns the full path to the mediafile specified by ID
 *
 * The ID is cleaned, its namespace colons are turned into directory
 * separators and the result is placed below $conf['mediadir'].
 *
 * The filename is passed through utf8_encodeFN(), which is meant to
 * URL encode it to protect Unicode chars
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param  string $id the media ID
 * @return string     path of the media file
 */
function mediaFN($id){
  global $conf;
  // namespaces map to directories
  $path = str_replace(':','/',cleanID($id));
  return $conf['mediadir'].'/'.utf8_encodeFN($path);
}
144b625487dSandi
/**
 * Returns the full filepath to a localized textfile if local
 * version isn't found the english one is returned
 *
 * The file is looked up as ./lang/<$conf['lang']>/<id>.txt; the english
 * path is returned without checking that it exists.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param  string $id name of the text file without the .txt extension
 * @return string     relative path to the text file
 */
function localeFN($id){
  global $conf;
  $localized = './lang/'.$conf['lang'].'/'.$id.'.txt';
  if(@file_exists($localized)){
    return $localized;
  }
  //fall back to english
  return './lang/en/'.$id.'.txt';
}
160b625487dSandi
/**
 * Returns a full media id
 *
 * Nothing is returned directly: the resolved, cleaned ID is written back
 * to $page and $exists is set to whether the matching media file exists.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param string|false $ns     current namespace, false if there is none
 * @param string       $page   media ID to resolve, replaced by the full ID
 * @param bool         $exists set to true if the media file exists
 */
function resolve_mediaid($ns,&$page,&$exists){
  //if links starts with . add current namespace
  //(substr() instead of an offset access so an empty ID raises no notice)
  if(substr($page,0,1) === '.'){
    $page = $ns.':'.substr($page,1);
  }

  //if link contains no namespace. add current namespace (if any)
  if($ns !== false && strpos($page,':') === false){
    $page = $ns.':'.$page;
  }

  $page   = cleanID($page);
  $file   = mediaFN($page);
  $exists = @file_exists($file);
}
183b625487dSandi
/**
 * Returns a full page id
 *
 * Nothing is returned directly: the resolved, cleaned ID (including a
 * cleaned '#hash' part if one was given) is written back to $page and
 * $exists is set to whether a matching page file exists. If the page does
 * not exist and $conf['autoplural'] is set, the ID with a trailing 's'
 * added or removed is tried as well and used when that file exists.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @param string|false $ns     current namespace, false if there is none
 * @param string       $page   page ID to resolve, replaced by the full ID
 * @param bool         $exists set to true if the page file exists
 */
function resolve_pageid($ns,&$page,&$exists){
  global $conf;

  //if links starts with . add current namespace
  //(substr() instead of an offset access so an empty ID raises no notice)
  if(substr($page,0,1) === '.'){
    $page = $ns.':'.substr($page,1);
  }

  //if link contains no namespace. add current namespace (if any)
  if($ns !== false && strpos($page,':') === false){
    $page = $ns.':'.$page;
  }

  //keep hashlink if exists then clean both parts
  //(padded so list() always receives two elements when there is no '#')
  list($page,$hash) = array_pad(explode('#',$page,2),2,'');
  $page = cleanID($page);
  $hash = cleanID($hash);

  $file = wikiFN($page);

  $exists = false;

  //check alternative plural/nonplural form
  if(!@file_exists($file)){
    if( $conf['autoplural'] ){
      if(substr($page,-1) == 's'){
        $try = substr($page,0,-1);
      }else{
        $try = $page.'s';
      }
      if(@file_exists(wikiFN($try))){
        $page   = $try;
        $exists = true;
      }
    }
  }else{
    $exists = true;
  }

  //add hash if any
  if(!empty($hash)) $page .= '#'.$hash;
}
231b625487dSandi
232b625487dSandi//Setup VIM: ex: et ts=2 enc=utf-8 :
233