xref: /dokuwiki/inc/parserutils.php (revision 1094c7983299907018a4a7ee455bf3a6ce743ece)
1c112d578Sandi<?php
2c112d578Sandi/**
3c112d578Sandi * Utilities for collecting data from config files
4c112d578Sandi *
5c112d578Sandi * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
6c112d578Sandi * @author     Harry Fuecks <hfuecks@gmail.com>
7c112d578Sandi * @author     Andreas Gohr <andi@splitbrain.org>
8c112d578Sandi */
9c112d578Sandi
10c112d578Sandi  if(!defined('DOKU_INC')) define('DOKU_INC',realpath(dirname(__FILE__).'/../').'/');
11c112d578Sandi
12c112d578Sandi  require_once(DOKU_INC.'inc/confutils.php');
13c112d578Sandi  require_once(DOKU_INC.'inc/pageutils.php');
14c112d578Sandi
/**
 * Renders a wiki page (optionally an old revision of it) as XHTML.
 *
 * The global $ID is overwritten with $id because it is needed for parsing.
 * Old revisions are always parsed from scratch, the current revision goes
 * through p_cached_xhtml().
 *
 * When the page file does not exist and $excuse is true, the localized
 * 'norev' text (a revision was requested) or 'newpage' text (no revision)
 * is returned instead. With $excuse false an empty string is returned.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 */
function p_wiki_xhtml($id, $rev='', $excuse=true){
  $file = wikiFN($id,$rev);

  // the page id has to be in the global $ID while parsing
  global $ID;
  $ID = $id;

  if(@file_exists($file)){
    if($rev){
      // old revisions are never cached
      return p_render('xhtml',p_get_instructions(io_readfile($file)));
    }
    return p_cached_xhtml($file);
  }

  // nothing to render - explain why, if the caller wants that
  if(!$excuse) return '';
  return p_locale_xhtml($rev ? 'norev' : 'newpage');
}
47c112d578Sandi
/**
 * Returns the XHTML for the localized text with the given id
 *
 * The file name is resolved through localeFN() and rendered (with caching)
 * by p_cached_xhtml().
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 */
function p_locale_xhtml($id){
  return p_cached_xhtml(localeFN($id));
}
58c112d578Sandi
/**
 * Returns the XHTML rendering of the given file, using a cache file
 *
 * The cache file lives below $conf['datadir']/_cache/xhtml/ and is named
 * after the md5 of the source path, HTTP host and server port. It is only
 * used when it is newer than the source and than everything else that
 * influences the output; otherwise the file is rendered again and the
 * cache file is rewritten.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 */
function p_cached_xhtml($file){
  global $conf;

  $purge = $conf['datadir'].'/_cache/purgefile';
  $cache = $conf['datadir'].'/_cache/xhtml/'
         . md5($file.$_SERVER['HTTP_HOST'].$_SERVER['SERVER_PORT']);

  // modification time of the cache file (false when there is none)
  $cachetime = @filemtime($cache);

  // basic requirements: the source exists, the cache is newer than the
  // source, it has not exceeded its maximum age and no purge was requested
  $usecache = @file_exists($file)
              && $cachetime > @filemtime($file)
              && ((time() - $cachetime) < $conf['cachetime'])
              && !isset($_REQUEST['purge']);

  if($usecache){
    // the cache also has to be newer than each of these files
    $depends = array(
      $purge,                              // the purgefile
      DOKU_INC.'conf/dokuwiki.php',        // the config file
      DOKU_INC.'conf/local.php',           // the local config file
      DOKU_INC.'inc/parser/xhtml.php',     // the renderer
      DOKU_INC.'inc/parser/parser.php',    // the parser
      DOKU_INC.'inc/parser/handler.php',   // the handler
    );
    foreach($depends as $depend){
      if(!($cachetime > @filemtime($depend))){
        $usecache = false;
        break;
      }
    }
  }

  if(!$usecache){
    // render from the (possibly cached) instructions and refresh the cache
    $parsed = p_render('xhtml', p_cached_instructions($file));
    io_saveFile($cache,$parsed);

    /* FIXME add nocache directive handling like this:
    if($parser['cache']){
      io_saveFile($cache,$parsed); //save cachefile
      $parsed .= "\n<!-- no cachefile used, but created -->\n";
    }else{
      @unlink($cache); //try to delete cachefile
      $parsed .= "\n<!-- no cachefile used, caching forbidden -->\n";
    }
    */

    return $parsed."\n<!-- no cachefile used, but created -->\n";
  }

  // the cache is good - hand it out
  return io_readfile($cache)."\n<!-- cachefile $cache used -->\n";
}
107c112d578Sandi
/**
 * Returns the render instructions for a file
 *
 * Uses and creates a serialized cache file below
 * $conf['datadir']/_cache/instructions/.
 *
 * With $cacheonly set, nothing is parsed: the cached instructions are
 * returned when a readable cache file exists, NULL otherwise (no freshness
 * checks are done in this mode).
 *
 * Without $cacheonly, the cache is used when it is newer than the source,
 * the config files, the parser and the handler and no purge was requested;
 * otherwise the source is parsed and the cache rewritten. NULL is returned
 * when the source file does not exist.
 *
 * A cache file that can not be unserialized into an array (for example a
 * truncated file) is treated like a missing cache instead of handing the
 * broken value to the caller.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 */
function p_cached_instructions($file,$cacheonly=false){
  global $conf;
  $cache  = $conf['datadir'].'/_cache/instructions/';
  $cache .= md5($file.$_SERVER['HTTP_HOST'].$_SERVER['SERVER_PORT']);

  // modification time of the cache file (false when there is none)
  $cachetime = @filemtime($cache);

  // cache forced?
  if($cacheonly){
    if(!$cachetime) return NULL;
    // unserialize() yields false on damaged data - report that as "no cache"
    $ins = @unserialize(io_readfile($cache));
    return is_array($ins) ? $ins : NULL;
  }

  // without a source there is nothing to return
  if(!@file_exists($file)) return NULL;

  if( $cachetime > @filemtime($file)                                  // cache is fresh
      && !isset($_REQUEST['purge'])                                   // no purge param was set
      && ($cachetime > @filemtime(DOKU_INC.'conf/dokuwiki.php'))      // newer than the config file
      && ($cachetime > @filemtime(DOKU_INC.'conf/local.php'))         // newer than the local config file
      && ($cachetime > @filemtime(DOKU_INC.'inc/parser/parser.php'))  // newer than the parser
      && ($cachetime > @filemtime(DOKU_INC.'inc/parser/handler.php')))// newer than the handler
  {
    // well then use the cache - unless it turns out to be damaged
    $ins = @unserialize(io_readfile($cache));
    if(is_array($ins)) return $ins;
  }

  // no usable cache - do some work
  $ins = p_get_instructions(io_readfile($file));
  io_saveFile($cache,serialize($ins));
  return $ins;
}
151c112d578Sandi
/**
 * Turns wiki text into a list of instructions
 *
 * Sets up a Doku_Parser with a Doku_Handler, registers the syntax modes
 * and returns whatever the parser's parse() method produces for $text.
 * The CamelCase link mode is only registered when $conf['camelcase'] is
 * set.
 *
 * @author Harry Fuecks <hfuecks@gmail.com>
 * @author Andreas Gohr <andi@splitbrain.org>
 */
function p_get_instructions($text){
  global $conf;

  require_once DOKU_INC . 'inc/parser/parser.php';

  // Create the parser and attach the handler.
  // Plain "new" is used on purpose: assigning the result of new by
  // reference ("=& new") is a parse error in PHP 7 and later.
  $Parser = new Doku_Parser();
  $Parser->Handler = new Doku_Handler();

  // Load all the modes (registration order is kept as it was)
  $Parser->addMode('listblock',new Doku_Parser_Mode_ListBlock());
  $Parser->addMode('preformatted',new Doku_Parser_Mode_Preformatted());
  $Parser->addMode('notoc',new Doku_Parser_Mode_NoToc());
  $Parser->addMode('header',new Doku_Parser_Mode_Header());
  $Parser->addMode('table',new Doku_Parser_Mode_Table());

  // all simple inline formats share one mode class
  $formats = array (
      'strong', 'emphasis', 'underline', 'monospace',
      'subscript', 'superscript', 'deleted',
  );
  foreach ( $formats as $format ) {
      $Parser->addMode($format,new Doku_Parser_Mode_Formatting($format));
  }

  $Parser->addMode('linebreak',new Doku_Parser_Mode_Linebreak());
  $Parser->addMode('footnote',new Doku_Parser_Mode_Footnote());
  $Parser->addMode('hr',new Doku_Parser_Mode_HR());

  $Parser->addMode('unformatted',new Doku_Parser_Mode_Unformatted());
  $Parser->addMode('php',new Doku_Parser_Mode_PHP());
  $Parser->addMode('html',new Doku_Parser_Mode_HTML());
  $Parser->addMode('code',new Doku_Parser_Mode_Code());
  $Parser->addMode('file',new Doku_Parser_Mode_File());
  $Parser->addMode('quote',new Doku_Parser_Mode_Quote());

  // these modes are fed with the keys of the configured replacement tables
  $Parser->addMode('smiley',new Doku_Parser_Mode_Smiley(array_keys(getSmileys())));
  $Parser->addMode('acronym',new Doku_Parser_Mode_Acronym(array_keys(getAcronyms())));
  #$Parser->addMode('wordblock',new Doku_Parser_Mode_Wordblock(getBadWords()));
  $Parser->addMode('entity',new Doku_Parser_Mode_Entity(array_keys(getEntities())));

  $Parser->addMode('multiplyentity',new Doku_Parser_Mode_MultiplyEntity());
  $Parser->addMode('quotes',new Doku_Parser_Mode_Quotes());

  if($conf['camelcase']){
    $Parser->addMode('camelcaselink',new Doku_Parser_Mode_CamelCaseLink());
  }

  $Parser->addMode('internallink',new Doku_Parser_Mode_InternalLink());
  $Parser->addMode('rss',new Doku_Parser_Mode_RSS());
  $Parser->addMode('media',new Doku_Parser_Mode_Media());
  $Parser->addMode('externallink',new Doku_Parser_Mode_ExternalLink());
  $Parser->addMode('emaillink',new Doku_Parser_Mode_EmailLink());
  $Parser->addMode('windowssharelink',new Doku_Parser_Mode_WindowsShareLink());
  //$Parser->addMode('filelink',new Doku_Parser_Mode_FileLink()); //FIXME ???
  $Parser->addMode('eol',new Doku_Parser_Mode_Eol());

  // Do the parsing
  $p    = $Parser->parse($text);
#  dbg($p);
  return $p;
}
221c112d578Sandi
/**
 * Renders a list of instructions to the specified output mode
 *
 * The renderer is loaded from inc/parser/$mode.php and has to be a class
 * named Doku_Renderer_$mode. Each instruction is a pair of
 * (renderer method name, argument list) and is executed against the
 * renderer in order; the renderer's accumulated ->doc is returned.
 *
 * Returns an empty string when $instructions is NULL, and null (after
 * reporting through msg()) when no renderer for $mode can be loaded.
 *
 * NOTE(review): $mode becomes part of an include path - the callers in
 * this file only pass the literal 'xhtml'; confirm no caller passes
 * user input.
 *
 * @author Harry Fuecks <hfuecks@gmail.com>
 * @author Andreas Gohr <andi@splitbrain.org>
 */
function p_render($mode,$instructions){
  if(is_null($instructions)) return '';

  // Locate the renderer
  $rfile = DOKU_INC."inc/parser/$mode.php";
  if(!@file_exists($rfile)){
    msg("No renderer for $mode found",-1);
    return null;
  }

  require_once $rfile;
  $rclass = "Doku_Renderer_$mode";
  // the file may exist without declaring the expected class
  if(!class_exists($rclass)){
    msg("No renderer for $mode found",-1);
    return null;
  }

  // Plain "new" is used on purpose: assigning the result of new by
  // reference ("=& new") is a parse error in PHP 7 and later.
  $Renderer = new $rclass();

  $Renderer->smileys = getSmileys();
  $Renderer->entities = getEntities();
  $Renderer->acronyms = getAcronyms();
  $Renderer->interwiki = getInterwiki();
  #$Renderer->badwords = getBadWords();

  // Loop through the instructions
  foreach ( $instructions as $instruction ) {
      // Execute the callback against the Renderer
      call_user_func_array(array(&$Renderer, $instruction[0]),$instruction[1]);
  }

  // Return the output
  return $Renderer->doc;
}
255c112d578Sandi
/**
 * Gets the first heading from a file
 *
 * Only the cached instructions of the page are consulted (the page is
 * never parsed here). Returns the first argument of the first 'header'
 * instruction, or NULL when the page does not exist, no cached
 * instructions are available, or the page has no header.
 *
 * @author Jan Decaluwe <jan@jandecaluwe.com>
 */
function p_get_first_heading($id){
  $file = wikiFN($id);
  if(!@file_exists($file)) return NULL;

  // cache-only lookup: yields NULL when there is no instruction cache yet,
  // which must not be fed to foreach
  $instructions = p_cached_instructions($file,true);
  if(!is_array($instructions)) return NULL;

  foreach ( $instructions as $instruction ) {
    if ($instruction[0] == 'header') {
      return $instruction[1][0];
    }
  }
  return NULL;
}
273bb0a59d4Sjan
274c112d578Sandi//Setup VIM: ex: et ts=2 enc=utf-8 :
275