xref: /dokuwiki/feed.php (revision 4c3263af6652b0a479e2c742914eb67a7929b9b9)
1<?php
2/**
3 * XML feed export
4 *
5 * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
6 * @author     Andreas Gohr <andi@splitbrain.org>
7 *
8 * @global array $conf
9 * @global Input $INPUT
10 */
11
if(!defined('DOKU_INC')) define('DOKU_INC', dirname(__FILE__).'/');
require_once(DOKU_INC.'inc/init.php');

// close session
session_write_close();

// get params
$opt = rss_parseOptions();

// the feed is dynamic - we need a cache for each combo of options and user
// (but most people just use the default feed so it's still effective)
// REMOTE_USER may be missing from $_SERVER, treat that as an empty user name
$key   = join('', array_values($opt)).(isset($_SERVER['REMOTE_USER']) ? $_SERVER['REMOTE_USER'] : '');
$cache = new cache($key, '.feed');

// prepare cache depends
$depends['files'] = getConfigFiles('main');
$depends['age']   = $conf['rss_update'];
$depends['purge'] = $INPUT->bool('purge');

// check cacheage and deliver if nothing has changed since last
// time or the update interval has not passed, also handles conditional requests
// NOTE(review): $opt['mime_type'] is computed by rss_parseOptions() but the
// Content-Type below is always application/xml - confirm this is intended
header('Cache-Control: must-revalidate, post-check=0, pre-check=0');
header('Pragma: public');
header('Content-Type: application/xml; charset=utf-8');
header('X-Robots-Tag: noindex');
if($cache->useCache($depends)) {
    http_conditionalRequest($cache->_time);
    if($conf['allowdebug']) header("X-CacheUsed: $cache->cache");
    print $cache->retrieveCache();
    exit;
} else {
    http_conditionalRequest(time());
}

// create new feed
$rss                 = new DokuWikiFeedCreator();
$rss->title          = $conf['title'].(($opt['namespace']) ? ' '.$opt['namespace'] : '');
$rss->link           = DOKU_URL;
$rss->syndicationURL = DOKU_URL.'feed.php';
$rss->cssStyleSheet  = DOKU_URL.'lib/exe/css.php?s=feed';

$image        = new FeedImage();
$image->title = $conf['title'];
$image->url   = tpl_getMediaFile(array(':wiki:favicon.ico', ':favicon.ico', 'images/favicon.ico'), true);
$image->link  = DOKU_URL;
$rss->image   = $image;

// collect the feed data: built-in modes map to a function in this file,
// any other mode is offered to plugins through the FEED_MODE_UNKNOWN event
$data  = null;
$modes = array(
    'list'   => 'rssListNamespace',
    'search' => 'rssSearch',
    'recent' => 'rssRecentChanges'
);
if(isset($modes[$opt['feed_mode']])) {
    $data = $modes[$opt['feed_mode']]($opt);
} else {
    $eventData = array(
        'opt'  => &$opt,
        'data' => &$data,
    );
    $event     = new Doku_Event('FEED_MODE_UNKNOWN', $eventData);
    if($event->advise_before(true)) {
        // the default action was not prevented: report the unknown mode and stop
        echo sprintf('<error>Unknown feed mode %s</error>', hsc($opt['feed_mode']));
        exit;
    }
    $event->advise_after();
}

rss_buildItems($rss, $data, $opt);
$feed = $rss->createFeed($opt['feed_type'], 'utf-8');

// save cachefile
$cache->storeCache($feed);

// finally deliver
print $feed;
89
90// ---------------------------------------------------------------- //
91
/**
 * Get URL parameters and config options and return an initialized option array
 *
 * Each option is read from the request through the global Input object and
 * falls back to a default (mostly taken from the configuration). The requested
 * feed type is mapped to the 'feed_type' and 'mime_type' options. Before the
 * options are returned, they are passed by reference to the
 * FEED_OPTS_POSTPROCESS event.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 *
 * @return array the feed options, keyed by option name
 */
function rss_parseOptions() {
    global $conf;
    global $INPUT;

    $opt = array();

    // option name => array(Input accessor method, request parameter, default value)
    $params = array(
        // Basic feed properties
        // Plugins may probably want to add new values to these
        // properties for implementing own feeds

        // One of: list, search, recent
        'feed_mode'    => array('str', 'mode', 'recent'),
        // One of: diff, page, rev, current
        'link_to'      => array('str', 'linkto', $conf['rss_linkto']),
        // One of: abstract, diff, htmldiff, html
        'item_content' => array('str', 'content', $conf['rss_content']),

        // Special feed properties
        // These are only used by certain feed_modes

        // String, used for feed title, in list and rc mode
        'namespace'    => array('str', 'ns', null),
        // Positive integer, only used in rc mode
        'items'        => array('int', 'num', $conf['recent']),
        // Boolean, only used in rc mode
        'show_minor'   => array('bool', 'minor', false),
        // String, only used in search mode
        'search_query' => array('str', 'q', null),
        // One of: pages, media, both
        'content_type' => array('str', 'view', $conf['rss_media'])
    );

    foreach($params as $name => $val) {
        list($method, $param, $default) = $val;
        // call the accessor through a plain variable: "$INPUT->$val[0](...)" is
        // read as "($INPUT->$val)[0](...)" by PHP 7 and later and fails there
        $opt[$name] = $INPUT->$method($param, $default, true);
    }

    $opt['items']      = max(0, (int) $opt['items']);
    $opt['show_minor'] = (bool) $opt['show_minor'];

    $opt['guardmail'] = ($conf['mailguard'] != '' && $conf['mailguard'] != 'none');

    $type = valid_input_set(
        'type', array(
                     'rss', 'rss2', 'atom', 'atom1', 'rss1',
                     'default' => $conf['rss_type']
                ),
        $_REQUEST
    );
    switch($type) {
        case 'rss':
            $opt['feed_type'] = 'RSS0.91';
            $opt['mime_type'] = 'text/xml';
            break;
        case 'rss2':
            $opt['feed_type'] = 'RSS2.0';
            $opt['mime_type'] = 'text/xml';
            break;
        case 'atom':
            $opt['feed_type'] = 'ATOM0.3';
            $opt['mime_type'] = 'application/xml';
            break;
        case 'atom1':
            $opt['feed_type'] = 'ATOM1.0';
            $opt['mime_type'] = 'application/atom+xml';
            break;
        default:
            // 'rss1' and anything unexpected
            $opt['feed_type'] = 'RSS1.0';
            $opt['mime_type'] = 'application/xml';
    }

    $eventData = array(
        'opt' => &$opt,
    );
    trigger_event('FEED_OPTS_POSTPROCESS', $eventData);
    return $opt;
}
173
/**
 * Add the given data items to a feed object
 *
 * Each entry of $data is either an array describing a page or media file
 * (keys read here: id, media, date, sum, user, ip) or just a plain ID. For each
 * entry a FeedItem with date, title, link, content, author and category is
 * built according to the feed options.
 *
 * The whole processing is wrapped in the FEED_DATA_PROCESS event and skipped
 * when its default action is prevented. Each visible item is handed to the
 * FEED_ITEM_ADD event and is only added to the feed when that event's default
 * action is not prevented.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  FeedCreator $rss the FeedCreator Object
 * @param  array       $data the items to add
 * @param  array       $opt  the feed options
 */
function rss_buildItems(&$rss, &$data, $opt) {
    global $conf;
    global $lang;
    /* @var auth_basic $auth */
    global $auth;

    $eventData = array(
        'rss'  => &$rss,
        'data' => &$data,
        'opt'  => &$opt,
    );
    $event     = new Doku_Event('FEED_DATA_PROCESS', $eventData);
    // $data may still be null when no feed mode filled it - nothing to iterate then
    if($event->advise_before(false) && (is_array($data) || $data instanceof Traversable)) {
        foreach($data as $ditem) {
            if(!is_array($ditem)) {
                // not an array? then only a list of IDs was given
                $ditem = array('id' => $ditem);
            }

            $item    = new FeedItem();
            $id      = $ditem['id'];
            // the optional fields are missing when only an ID was given
            $isMedia = !empty($ditem['media']);
            $ip      = isset($ditem['ip']) ? $ditem['ip'] : '';
            if(!$isMedia) {
                $meta = p_get_metadata($id);
            } else {
                $meta = array();
            }

            // add date: prefer the given date, then the file time, then the metadata
            if(!empty($ditem['date'])) {
                $date = $ditem['date'];
            } elseif($isMedia) {
                $date = @filemtime(mediaFN($id));
            } elseif(@file_exists(wikiFN($id))) {
                $date = @filemtime(wikiFN($id));
            } elseif(!empty($meta['date']['modified'])) {
                $date = $meta['date']['modified'];
            } else {
                $date = 0;
            }
            if($date) $item->date = date('r', $date);

            // add title
            if($conf['useheading'] && !empty($meta['title'])) {
                $item->title = $meta['title'];
            } else {
                $item->title = $ditem['id'];
            }
            if($conf['rss_show_summary'] && !empty($ditem['sum'])) {
                $item->title .= ' - '.strip_tags($ditem['sum']);
            }

            // add item link
            switch($opt['link_to']) {
                case 'page':
                    if($isMedia) {
                        $item->link = media_managerURL(
                            array(
                                 'image' => $id,
                                 'ns'    => getNS($id),
                                 'rev'   => $date
                            ), '&', true
                        );
                    } else {
                        $item->link = wl($id, 'rev='.$date, true, '&');
                    }
                    break;
                case 'rev':
                    if($isMedia) {
                        $item->link = media_managerURL(
                            array(
                                 'image'       => $id,
                                 'ns'          => getNS($id),
                                 'rev'         => $date,
                                 'tab_details' => 'history'
                            ), '&', true
                        );
                    } else {
                        $item->link = wl($id, 'do=revisions&rev='.$date, true, '&');
                    }
                    break;
                case 'current':
                    if($isMedia) {
                        $item->link = media_managerURL(
                            array(
                                 'image' => $id,
                                 'ns'    => getNS($id)
                            ), '&', true
                        );
                    } else {
                        $item->link = wl($id, '', true, '&');
                    }
                    break;
                case 'diff':
                default:
                    if($isMedia) {
                        $item->link = media_managerURL(
                            array(
                                 'image'       => $id,
                                 'ns'          => getNS($id),
                                 'rev'         => $date,
                                 'tab_details' => 'history',
                                 'mediado'     => 'diff'
                            ), '&', true
                        );
                    } else {
                        $item->link = wl($id, 'rev='.$date.'&do=diff', true, '&');
                    }
            }

            // add item content
            switch($opt['item_content']) {
                case 'diff':
                case 'htmldiff':
                    if($isMedia) {
                        // show previews of the last revision and the current file side by side
                        $medialog = new MediaChangeLog($id);
                        $revs  = $medialog->getRevisions(0, 1);
                        $rev   = isset($revs[0]) ? $revs[0] : null;
                        $src_r = '';
                        $src_l = '';

                        if($size = media_image_preview_size($id, false, new JpegMeta(mediaFN($id)), 300)) {
                            $more  = 'w='.$size[0].'&h='.$size[1].'&t='.@filemtime(mediaFN($id));
                            $src_r = ml($id, $more);
                        }
                        if($rev && $size = media_image_preview_size($id, $rev, new JpegMeta(mediaFN($id, $rev)), 300)) {
                            $more  = 'rev='.$rev.'&w='.$size[0].'&h='.$size[1];
                            $src_l = ml($id, $more);
                        }
                        $content = '';
                        if($src_r) {
                            $content = '<table>';
                            $content .= '<tr><th width="50%">'.$rev.'</th>';
                            $content .= '<th width="50%">'.$lang['current'].'</th></tr>';
                            $content .= '<tr align="center"><td><img src="'.$src_l.'" alt="" /></td><td>';
                            $content .= '<img src="'.$src_r.'" alt="'.hsc($id).'" /></td></tr>';
                            $content .= '</table>';
                        }

                    } else {
                        require_once(DOKU_INC.'inc/DifferenceEngine.php');
                        $pagelog = new PageChangeLog($id);
                        $revs = $pagelog->getRevisions(0, 1);
                        $rev  = isset($revs[0]) ? $revs[0] : null;

                        if($rev) {
                            $df = new Diff(explode("\n", rawWiki($id, $rev)),
                                           explode("\n", rawWiki($id, '')));
                        } else {
                            // no older revision: diff against an empty page
                            $df = new Diff(array(''),
                                           explode("\n", rawWiki($id, '')));
                        }

                        if($opt['item_content'] == 'htmldiff') {
                            // note: no need to escape diff output, TableDiffFormatter provides 'safe' html
                            $tdf     = new TableDiffFormatter();
                            $content = '<table>';
                            $content .= '<tr><th colspan="2" width="50%">'.$rev.'</th>';
                            $content .= '<th colspan="2" width="50%">'.$lang['current'].'</th></tr>';
                            $content .= $tdf->format($df);
                            $content .= '</table>';
                        } else {
                            // note: diff output must be escaped, UnifiedDiffFormatter provides plain text
                            $udf     = new UnifiedDiffFormatter();
                            $content = "<pre>\n".hsc($udf->format($df))."\n</pre>";
                        }
                    }
                    break;
                case 'html':
                    if($isMedia) {
                        if($size = media_image_preview_size($id, false, new JpegMeta(mediaFN($id)))) {
                            $more    = 'w='.$size[0].'&h='.$size[1].'&t='.@filemtime(mediaFN($id));
                            $src     = ml($id, $more);
                            $content = '<img src="'.$src.'" alt="'.hsc($id).'" />';
                        } else {
                            $content = '';
                        }
                    } else {
                        // render the current page when the date is the file's own
                        // modification time, otherwise the revision of that date
                        if(@filemtime(wikiFN($id)) === $date) {
                            $content = p_wiki_xhtml($id, '', false);
                        } else {
                            $content = p_wiki_xhtml($id, $date, false);
                        }
                        // no TOC in feeds
                        $content = preg_replace('/(<!-- TOC START -->).*(<!-- TOC END -->)/s', '', $content);

                        // add alignment for images
                        $content = preg_replace('/(<img .*?class="medialeft")/s', '\\1 align="left"', $content);
                        $content = preg_replace('/(<img .*?class="mediaright")/s', '\\1 align="right"', $content);

                        // make URLs work when canonical is not set, regexp instead of rerendering!
                        if(!$conf['canonical']) {
                            $base    = preg_quote(DOKU_REL, '/');
                            $content = preg_replace('/(<a href|<img src)="('.$base.')/s', '$1="'.DOKU_URL, $content);
                        }
                    }

                    break;
                case 'abstract':
                default:
                    if($isMedia) {
                        if($size = media_image_preview_size($id, false, new JpegMeta(mediaFN($id)))) {
                            $more    = 'w='.$size[0].'&h='.$size[1].'&t='.@filemtime(mediaFN($id));
                            $src     = ml($id, $more);
                            $content = '<img src="'.$src.'" alt="'.hsc($id).'" />';
                        } else {
                            $content = '';
                        }
                    } else {
                        $content = isset($meta['description']['abstract']) ? $meta['description']['abstract'] : '';
                    }
            }
            $item->description = $content; //FIXME a plugin hook here could be senseful

            // add user
            # FIXME should the user be pulled from metadata as well?
            $user         = isset($ditem['user']) ? $ditem['user'] : '';
            $item->author = '';
            if($user && $conf['useacl'] && $auth) {
                $userInfo = $auth->getUserData($user);
                if($userInfo && $conf['showuseras'] == 'username') {
                    $item->author = $userInfo['name'];
                } else {
                    $item->author = $user;
                }
                if($userInfo && !$opt['guardmail']) {
                    $item->authorEmail = $userInfo['mail'];
                } else {
                    //cannot obfuscate because some RSS readers may check validity
                    $item->authorEmail = $user.'@'.$ip;
                }
            } elseif($user) {
                // this happens when no ACL but some Apache auth is used
                $item->author      = $user;
                $item->authorEmail = $user.'@'.$ip;
            } else {
                $item->authorEmail = 'anonymous@'.$ip;
            }

            // add category
            if(isset($meta['subject'])) {
                $item->category = $meta['subject'];
            } else {
                $cat = getNS($id);
                if($cat) $item->category = $cat;
            }

            // Add only visible items
            if(isVisiblePage($id)) {
                // finally add the item to the feed object, after handing it to registered plugins
                $evdata = array(
                    'item'  => &$item,
                    'opt'   => &$opt,
                    'ditem' => &$ditem,
                    'rss'   => &$rss
                );
                $evt    = new Doku_Event('FEED_ITEM_ADD', $evdata);
                if($evt->advise_before()) {
                    $rss->addItem($item);
                }
                $evt->advise_after(); // for completeness
            }
        }
    }
    $event->advise_after();
}
454
/**
 * Fetch the recent changes for the feed
 *
 * Deleted entries are always skipped and minor changes are skipped unless the
 * 'show_minor' option is set. When media revisions are enabled in the
 * configuration, the 'content_type' option selects media changes ('media')
 * or a mix of page and media changes ('both').
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  array $opt the feed options
 * @return mixed the result of getRecents() for the given options
 */
function rssRecentChanges($opt) {
    global $conf;

    // collect all flags that apply, they are summed up below
    $parts = array(RECENTS_SKIP_DELETED);
    if(!$opt['show_minor']) {
        $parts[] = RECENTS_SKIP_MINORS;
    }
    if($opt['content_type'] == 'media' && $conf['mediarevisions']) {
        $parts[] = RECENTS_MEDIA_CHANGES;
    }
    if($opt['content_type'] == 'both' && $conf['mediarevisions']) {
        $parts[] = RECENTS_MEDIA_PAGES_MIXED;
    }

    return getRecents(0, $opt['items'], $opt['namespace'], array_sum($parts));
}
470
/**
 * Collect all pages of a namespace for the feed
 *
 * The namespace option is cleaned and converted to a directory path below the
 * data directory, which is then searched with the 'search_list' callback.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  array $opt the feed options, 'namespace' is read
 * @return array the items collected by search()
 */
function rssListNamespace($opt) {
    require_once(DOKU_INC.'inc/search.php');
    global $conf;

    // turn the namespace into a path relative to the data directory
    $ns = ':'.cleanID($opt['namespace']);
    $ns = str_replace(':', '/', $ns);

    // search() fills $data by reference
    $data = array();
    search($data, $conf['datadir'], 'search_list', '', $ns);

    return $data;
}
489
/**
 * Run a full text search and return the matching page IDs for the feed
 *
 * An empty 'search_query' option yields an empty result without loading
 * the fulltext library.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @param  array $opt the feed options, 'search_query' is read
 * @return array list of the keys of the ft_pageSearch() result
 */
function rssSearch($opt) {
    $query = $opt['search_query'];
    if(!$query) {
        return array();
    }

    require_once(DOKU_INC.'inc/fulltext.php');

    // only the result keys are of interest, the second argument is just
    // the variable ft_pageSearch() is called with and is not used here
    return array_keys(ft_pageSearch($query, $terms));
}
504
505//Setup VIM: ex: et ts=4 :
506