xref: /dokuwiki/inc/changelog.php (revision 33f552fab34c9ddcc3b647aedcc86a6209c708af)
1<?php
2/**
3 * Changelog handling functions
4 *
5 * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
6 * @author     Andreas Gohr <andi@splitbrain.org>
7 */
8
// Constants for the known core changelog line types.
// Use these in place of bare string literals for more readable code.
// Each value is the single character stored in the "type" field of a changelog line.
define('DOKU_CHANGE_TYPE_CREATE',       'C'); // creation
define('DOKU_CHANGE_TYPE_EDIT',         'E'); // regular edit (default type of the add*LogEntry functions)
define('DOKU_CHANGE_TYPE_MINOR_EDIT',   'e'); // minor edit (can be filtered with RECENTS_SKIP_MINORS)
define('DOKU_CHANGE_TYPE_DELETE',       'D'); // deletion
define('DOKU_CHANGE_TYPE_REVERT',       'R'); // revert to an older revision
16
/**
 * Parses a changelog line into its components
 *
 * A changelog line consists of tab separated fields in the order
 * date, ip, type, id, user, sum, extra and is normally terminated
 * by a newline. Fields missing at the end of a short line are
 * returned as null (the extra field as an empty string).
 *
 * @param string $line  a single changelog line
 * @return array|false  associative array with the keys date, ip, type,
 *                      id, user, sum and extra or false when the line
 *                      contains no tab at all
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function parseChangelogLine($line) {
    // strip the line ending first, otherwise it would stay attached to the
    // last field of a line that has less than seven fields
    $tmp = explode("\t", rtrim((string)$line, "\n"));
    if (count($tmp) < 2) { return false; }

    // pad short lines so that reading the fixed offsets below never
    // triggers an undefined offset notice
    $tmp = array_pad($tmp, 7, null);

    $info = array();
    $info['date']  = (int)$tmp[0]; // unix timestamp
    $info['ip']    = $tmp[1]; // IPv4 address (127.0.0.1)
    $info['type']  = $tmp[2]; // log line type
    $info['id']    = $tmp[3]; // page id
    $info['user']  = $tmp[4]; // user name
    $info['sum']   = $tmp[5]; // edit summary (or action reason)
    $info['extra'] = (string)$tmp[6]; // extra data (varies by line type)
    return $info;
}
36
/**
 * Adds an entry to the changelog and saves the metadata for the page
 *
 * The same log line is appended to the page's own changelog and to the
 * global changelog. Unless the change is a deletion, the page metadata
 * (creation/modification date, creator, contributors, last_change) is
 * updated as well.
 *
 * @param int    $date      Timestamp of the change, the current time is used when empty
 * @param String $id        Name of the affected page
 * @param String $type      Type of the change see DOKU_CHANGE_TYPE_*
 * @param String $summary   Summary of the change (tabs and newlines are removed,
 *                          truncated to 255 characters)
 * @param mixed  $extra     In case of a revert the revision (timestamp) of the reverted page
 * @param array  $flags     Additional flags in a key value array.
 *                             Available flags:
 *                             - ExternalEdit - mark as an external edit. The entry is then
 *                               logged with the IP 127.0.0.1 and an empty user name.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @author Esther Brunner <wikidesign@gmail.com>
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function addLogEntry($date, $id, $type=DOKU_CHANGE_TYPE_EDIT, $summary='', $extra='', $flags=null){
    global $conf, $INFO;

    // check for special flags as keys
    if (!is_array($flags)) { $flags = array(); }
    $flagExternalEdit = isset($flags['ExternalEdit']);

    $id = cleanid($id);
    $file = wikiFN($id);
    $created = @filectime($file);
    $minor = ($type===DOKU_CHANGE_TYPE_MINOR_EDIT);
    $wasRemoved = ($type===DOKU_CHANGE_TYPE_DELETE);

    if(!$date) $date = time(); //use current time if none supplied

    if ($flagExternalEdit) {
        // external edits are not attributed to the current request
        $remote = '127.0.0.1';
        $user   = '';
    } else {
        $remote = clientIP(true);
        // REMOTE_USER is not set for anonymous requests, log an empty user then
        $user   = isset($_SERVER['REMOTE_USER']) ? $_SERVER['REMOTE_USER'] : '';
    }

    // tabs and newlines are the field and line separators of the changelog
    $strip = array("\t", "\n");
    $logline = array(
            'date'  => $date,
            'ip'    => $remote,
            'type'  => str_replace($strip, '', $type),
            'id'    => $id,
            'user'  => $user,
            'sum'   => utf8_substr(str_replace($strip, '', $summary),0,255),
            'extra' => str_replace($strip, '', $extra)
            );

    // update metadata
    if (!$wasRemoved) {
        $oldmeta = p_read_metadata($id);
        $meta    = array();
        if (!$INFO['exists'] && empty($oldmeta['persistent']['date']['created'])){ // newly created
            $meta['date']['created'] = $created;
            if ($user){
                $meta['creator'] = $INFO['userinfo']['name'];
                $meta['user']    = $user;
            }
        } elseif (!$INFO['exists'] && !empty($oldmeta['persistent']['date']['created'])) { // re-created / restored
            $meta['date']['created']  = $oldmeta['persistent']['date']['created'];
            $meta['date']['modified'] = $created; // use the files ctime here
            $meta['creator'] = $oldmeta['persistent']['creator'];
            if ($user) $meta['contributor'][$user] = $INFO['userinfo']['name'];
        } elseif (!$minor) {   // non-minor modification
            $meta['date']['modified'] = $date;
            if ($user) $meta['contributor'][$user] = $INFO['userinfo']['name'];
        }
        $meta['last_change'] = $logline;
        p_set_metadata($id, $meta);
    }

    // add changelog lines
    $logline = implode("\t", $logline)."\n";
    io_saveFile(metaFN($id,'.changes'),$logline,true); //page changelog
    io_saveFile($conf['changelog'],$logline,true); //global changelog cache
}
109
/**
 * Adds an entry to the media changelog
 *
 * The same log line is appended to the global media changelog and to
 * the changelog of the media file itself.
 *
 * @param int    $date      Timestamp of the change, the current time is used when empty
 * @param String $id        Name of the affected media file
 * @param String $type      Type of the change see DOKU_CHANGE_TYPE_*
 * @param String $summary   Summary of the change (tabs and newlines are removed,
 *                          truncated to 255 characters)
 * @param mixed  $extra     Extra data stored with the log line
 * @param array  $flags     Accepted for signature parity with addLogEntry(),
 *                          not evaluated by this function
 *
 * @author Michael Hamann <michael@content-space.de>
 * @author Andreas Gohr <andi@splitbrain.org>
 * @author Esther Brunner <wikidesign@gmail.com>
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function addMediaLogEntry($date, $id, $type=DOKU_CHANGE_TYPE_EDIT, $summary='', $extra='', $flags=null){
    global $conf;

    $id = cleanid($id);

    if(!$date) $date = time(); //use current time if none supplied
    $remote = clientIP(true);
    // REMOTE_USER is not set for anonymous requests, log an empty user then
    $user   = isset($_SERVER['REMOTE_USER']) ? $_SERVER['REMOTE_USER'] : '';

    // tabs and newlines are the field and line separators of the changelog
    $strip = array("\t", "\n");
    $logline = array(
            'date'  => $date,
            'ip'    => $remote,
            'type'  => str_replace($strip, '', $type),
            'id'    => $id,
            'user'  => $user,
            'sum'   => utf8_substr(str_replace($strip, '', $summary),0,255),
            'extra' => str_replace($strip, '', $extra)
            );

    // add changelog lines
    $logline = implode("\t", $logline)."\n";
    io_saveFile($conf['media_changelog'],$logline,true); //global media changelog cache
    io_saveFile(mediaMetaFN($id,'.changes'),$logline,true); //media file's changelog
}
143
/**
 * returns an array of recently changed files using the
 * changelog
 *
 * The following constants can be used to control which changes are
 * included. Add them together as needed.
 *
 * RECENTS_SKIP_DELETED   - don't include deleted pages
 * RECENTS_SKIP_MINORS    - don't include minor changes
 * RECENTS_SKIP_SUBSPACES - don't include subspaces
 * RECENTS_MEDIA_CHANGES  - return media changes instead of page changes
 * RECENTS_MEDIA_PAGES_MIXED  - return both media changes and page changes
 *
 * Each returned entry is a parsed changelog line as accepted by
 * _handleRecent() (including the 'perms' key set there). Entries that
 * come from the media changelog additionally carry 'media' => true.
 * The newest change comes first. A missing or unreadable changelog
 * is treated like an empty one.
 *
 * @param int    $first   number of first entry returned (for paginating)
 * @param int    $num     return $num entries
 * @param string $ns      restrict to given namespace
 * @param int    $flags   see above
 * @return array recently changed files
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 * @author Kate Arzamastseva <pshns@ukr.net>
 */
function getRecents($first,$num,$ns='',$flags=0){
    global $conf;
    $recent = array();
    $count  = 0;

    if(!$num)
        return $recent;

    // read all recent changes. (kept short)
    if ($flags & RECENTS_MEDIA_CHANGES) {
        $lines = @file($conf['media_changelog']);
    } else {
        $lines = @file($conf['changelog']);
    }
    // file() returns false on failure, count() must only see arrays
    if (!is_array($lines)) { $lines = array(); }
    $lines_position = count($lines)-1;
    $media_lines_position = 0;
    $media_lines = array();

    if ($flags & RECENTS_MEDIA_PAGES_MIXED) {
        $media_lines = @file($conf['media_changelog']);
        if (!is_array($media_lines)) { $media_lines = array(); }
        $media_lines_position = count($media_lines)-1;
    }

    $seen = array(); // caches seen lines, _handleRecent() skips them

    // pending candidates of both changelogs, false means "fetch the next one"
    $rec = false;
    $media_rec = false;

    // handle lines, both changelogs are walked from their end (newest entry)
    while ($lines_position >= 0 || (($flags & RECENTS_MEDIA_PAGES_MIXED) && $media_lines_position >=0)) {
        if (empty($rec) && $lines_position >= 0) {
            $rec = _handleRecent(@$lines[$lines_position], $ns, $flags, $seen);
            if (!$rec) {
                $lines_position --;
                continue;
            }
        }
        if (($flags & RECENTS_MEDIA_PAGES_MIXED) && empty($media_rec) && $media_lines_position >= 0) {
            $media_rec = _handleRecent(@$media_lines[$media_lines_position], $ns, $flags | RECENTS_MEDIA_CHANGES, $seen);
            if (!$media_rec) {
                $media_lines_position --;
                continue;
            }
        }
        // in mixed mode take the newer of the two pending candidates; an
        // exhausted side evaluates to a null date here, hence the @
        if (($flags & RECENTS_MEDIA_PAGES_MIXED) && @$media_rec['date'] >= @$rec['date']) {
            $media_lines_position--;
            $x = $media_rec;
            $x['media'] = true;
            $media_rec = false;
        } else {
            $lines_position--;
            $x = $rec;
            if ($flags & RECENTS_MEDIA_CHANGES) $x['media'] = true;
            $rec = false;
        }
        if(--$first >= 0) continue; // skip first entries
        $recent[] = $x;
        $count++;
        // break when we have enough entries
        if($count >= $num){ break; }
    }
    return $recent;
}
226
/**
 * returns an array of files changed since a given time using the
 * changelog
 *
 * The following constants can be used to control which changes are
 * included. Add them together as needed.
 *
 * RECENTS_SKIP_DELETED   - don't include deleted pages
 * RECENTS_SKIP_MINORS    - don't include minor changes
 * RECENTS_SKIP_SUBSPACES - don't include subspaces
 * RECENTS_MEDIA_CHANGES  - return media changes instead of page changes
 *
 * The changelog is scanned from its end; scanning stops at the first
 * accepted entry that is older than $from. The result is ordered from
 * oldest to newest.
 *
 * @param int    $from    date of the oldest entry to return
 * @param int    $to      date of the newest entry to return (for pagination, optional)
 * @param string $ns      restrict to given namespace (optional)
 * @param int    $flags   see above (optional)
 * @return array of files
 *
 * @author Michael Hamann <michael@content-space.de>
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function getRecentsSince($from,$to=null,$ns='',$flags=0){
    global $conf;
    $matches = array();

    // an inverted time window can not contain anything
    if ($to && $to < $from) {
        return $matches;
    }

    // pick the changelog to read. (kept short)
    $logfile = ($flags & RECENTS_MEDIA_CHANGES) ? $conf['media_changelog'] : $conf['changelog'];
    $entries = @file($logfile);
    if (!$entries) {
        return $matches;
    }

    $seen = array(); // caches seen lines, _handleRecent() skips them

    // walk the list backwards, i.e. newest entry first
    for ($pos = count($entries)-1; $pos >= 0; $pos--) {
        $rec = _handleRecent($entries[$pos], $ns, $flags, $seen);
        if ($rec === false) {
            continue;
        }
        // everything further up is older than the requested window
        if (!($rec['date'] >= $from)) {
            break;
        }
        // newer than the window: skip it but keep looking
        if ($to && !($rec['date'] <= $to)) {
            continue;
        }
        $matches[] = $rec;
    }

    return array_reverse($matches);
}
284
/**
 * Internal function used by getRecents
 *
 * don't call directly
 *
 * Parses one changelog line and decides whether it belongs into the
 * list of recent changes. Returns the parsed line extended by the
 * 'perms' key on success, false when the line has to be skipped.
 * Ids that passed the "seen" and "minor" checks are recorded in $seen
 * so that older lines of the same id are skipped later on.
 *
 * @see getRecents()
 * @author Andreas Gohr <andi@splitbrain.org>
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function _handleRecent($line,$ns,$flags,&$seen){
    // nothing to do for empty lines
    if (empty($line)) { return false; }

    // split the line into parts
    $entry = parseChangelogLine($line);
    if ($entry === false) { return false; }
    $id = $entry['id'];

    // a newer line of this id was handled already
    if (isset($seen[$id])) { return false; }

    // minor edits are dropped on request (without marking the id as seen)
    $isMinor = ($entry['type'] === DOKU_CHANGE_TYPE_MINOR_EDIT);
    if ($isMinor && ($flags & RECENTS_SKIP_MINORS)) { return false; }

    // from here on older lines of the same id are ignored
    $seen[$id] = 1;

    // hidden pages never show up
    if (isHiddenPage($id)) { return false; }

    // the id has to live below the requested namespace
    if ($ns && strpos($id, $ns.':') !== 0) { return false; }

    // optionally it has to live directly in that namespace
    if (($flags & RECENTS_SKIP_SUBSPACES) && getNS($id) != $ns) { return false; }

    // check ACL: media is checked on its namespace, pages on their own id
    $isMedia = ($flags & RECENTS_MEDIA_CHANGES);
    $aclTarget = $isMedia ? getNS($id).':*' : $id;
    $entry['perms'] = auth_quickaclcheck($aclTarget);
    if ($entry['perms'] < AUTH_READ) { return false; }

    // optionally require that the file still exists
    if ($flags & RECENTS_SKIP_DELETED) {
        $path = $isMedia ? mediaFN($id) : wikiFN($id);
        if (!@file_exists($path)) { return false; }
    }

    return $entry;
}
335
/**
 * Get the changelog information for a specific page id
 * and revision (timestamp). Adjacent changelog lines
 * are optimistically parsed and cached to speed up
 * consecutive calls to getRevisionInfo. For large
 * changelog files, only the chunk containing the
 * requested changelog line is read.
 *
 * @param string $id          page (or media file) id
 * @param int    $rev         revision timestamp, negative values are treated as 0
 * @param int    $chunk_size  maximum number of bytes to read at once, 0 reads the whole file
 * @param bool   $media       look into the media changelog instead of the page changelog
 * @return array|bool         the parsed changelog line or false when the changelog
 *                            or the revision can not be found
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 * @author Kate Arzamastseva <pshns@ukr.net>
 */
function getRevisionInfo($id, $rev, $chunk_size=8192, $media=false) {
    global $cache_revinfo;
    $cache =& $cache_revinfo;
    if (!isset($cache[$id])) { $cache[$id] = array(); }
    $rev = max($rev, 0);

    // check if it's already in the memory cache
    if (isset($cache[$id][$rev])) {
        return $cache[$id][$rev];
    }

    if ($media) {
        $file = mediaMetaFN($id, '.changes');
    } else {
        $file = metaFN($id, '.changes');
    }
    if (!@file_exists($file)) { return false; }
    if (filesize($file)<$chunk_size || $chunk_size==0) {
        // read whole file
        $lines = file($file);
        if ($lines===false) { return false; }
    } else {
        // read by chunk
        $fp = fopen($file, 'rb'); // "file pointer"
        if ($fp===false) { return false; }
        $head = 0;
        fseek($fp, 0, SEEK_END);
        $tail = ftell($fp);

        // find chunk: binary search on line starts until the window
        // between $head and $tail is not larger than $chunk_size
        while ($tail-$head>$chunk_size) {
            $finger = $head+(int)floor(($tail-$head)/2.0);
            fseek($fp, $finger);
            fgets($fp); // slip the finger forward to a new line
            $finger = ftell($fp);
            // the window can not be narrowed any further
            if ($finger==$head || $finger==$tail) { break; }
            $tmp = parseChangelogLine(fgets($fp)); // then read at that location
            // an unparsable line is treated as "not newer than $rev"
            $finger_rev = ($tmp===false) ? 0 : $tmp['date'];
            if ($finger_rev>$rev) {
                $tail = $finger;
            } else {
                $head = $finger;
            }
        }

        if ($tail-$head<1) {
            // could not find chunk, assume requested rev is missing
            fclose($fp);
            return false;
        }

        // read chunk
        $chunk = '';
        $chunk_size = max($tail-$head, 0); // found chunk size
        $got = 0;
        fseek($fp, $head);
        while ($got<$chunk_size && !feof($fp)) {
            $tmp = @fread($fp, max($chunk_size-$got, 0));
            if ($tmp===false) { break; } //error state
            $got += strlen($tmp);
            $chunk .= $tmp;
        }
        $lines = explode("\n", $chunk);
        array_pop($lines); // remove trailing newline
        fclose($fp);
    }

    // parse and cache changelog lines
    foreach ($lines as $value) {
        $tmp = parseChangelogLine($value);
        if ($tmp!==false) {
            $cache[$id][$tmp['date']] = $tmp;
        }
    }
    if (!isset($cache[$id][$rev])) { return false; }
    return $cache[$id][$rev];
}
427
/**
 * Return a list of page revisions numbers
 * Does not guarantee that the revision exists in the attic,
 * only that a line with the date exists in the changelog.
 * By default the current revision is skipped.
 *
 * id:    the page of interest
 * first: skip the first n changelog lines
 * num:   number of revisions to return
 *
 * The current revision is automatically skipped when the page exists.
 * See $INFO['meta']['last_change'] for the current revision.
 * A negative first is treated as 0 and disables that automatic skip.
 *
 * For efficiency, the log lines are parsed and cached for later
 * calls to getRevisionInfo. Large changelog files are read
 * backwards in chunks until the requested number of changelog
 * lines are received.
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 * @author Kate Arzamastseva <pshns@ukr.net>
 */
function getRevisions($id, $first, $num, $chunk_size=8192, $media=false) {
    global $cache_revinfo;
    $cache =& $cache_revinfo;
    if (!isset($cache[$id])) { $cache[$id] = array(); }

    $revs  = array();
    $lines = array();
    $count = 0;
    $file  = $media ? mediaMetaFN($id, '.changes') : metaFN($id, '.changes');

    $num = max($num, 0);
    if ($num == 0) { return $revs; }

    $chunk_size = max($chunk_size, 0);
    if ($first < 0) {
        $first = 0;
    } else {
        // skip current revision if the page (or media file) exists
        $current = $media ? mediaFN($id) : wikiFN($id);
        if (@file_exists($current)) {
            $first = max($first+1, 0);
        }
    }

    if (!@file_exists($file)) { return $revs; }

    if (filesize($file)<$chunk_size || $chunk_size==0) {
        // small changelog: read it completely
        $lines = file($file);
        if ($lines === false) { return $revs; }
    } else {
        // large changelog: collect lines from the end of the file
        $handle = fopen($file, 'rb');
        if ($handle === false) { return $revs; }
        fseek($handle, 0, SEEK_END);
        $tail = ftell($handle);

        $wanted = $num+$first; // lines needed to serve the request
        $finger = max($tail-$chunk_size, 0);
        while ($count < $wanted) {
            fseek($handle, $finger);
            $nl = $finger;
            if ($finger > 0) {
                fgets($handle); // slip the finger forward to a new line
                $nl = ftell($handle);
            }

            // was the chunk big enough? if not, take another bite
            if ($nl > 0 && $tail <= $nl) {
                $finger = max($finger-$chunk_size, 0);
                continue;
            }
            $finger = $nl;

            // read everything between the finger and the tail
            $read_size = max($tail-$finger, 0);
            $chunk = '';
            $got = 0;
            while ($got < $read_size && !feof($handle)) {
                $piece = @fread($handle, max($read_size-$got, 0));
                if ($piece === false) { break; } //error state
                $got += strlen($piece);
                $chunk .= $piece;
            }
            $found = explode("\n", $chunk);
            array_pop($found); // remove trailing newline

            // older lines go in front of what was collected so far
            $count += count($found);
            $lines = array_merge($found, $lines);

            // the start of the file has been reached
            if ($finger == 0) { break; }

            // next chunk ends where this one started
            $tail = $finger;
            $finger = max($tail-$chunk_size, 0);
        }
        fclose($handle);
    }

    // skip parsing extra lines
    $num = max(min(count($lines)-$first, $num), 0);
    $total = count($lines);
    if ($num > 0) {
        if ($first > 0) {
            $lines = array_slice($lines, max($total-$first-$num, 0), $num);
        } else if ($first == 0) {
            $lines = array_slice($lines, max($total-$num, 0));
        }
    } else if ($first > 0 && $num == 0) {
        $lines = array_slice($lines, 0, max($total-$first, 0));
    }

    // handle lines in reverse order, newest revision first
    foreach (array_reverse($lines) as $line) {
        $info = parseChangelogLine($line);
        if ($info === false) { continue; }
        $cache[$id][$info['date']] = $info;
        $revs[] = $info['date'];
    }

    return $revs;
}
547
548
549