<?php
/**
 * Changelog handling functions
 *
 * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
 * @author     Andreas Gohr <andi@splitbrain.org>
 */

// Constants for known core changelog line types.
// Use these in place of string literals for more readable code.
define('DOKU_CHANGE_TYPE_CREATE',       'C');
define('DOKU_CHANGE_TYPE_EDIT',         'E');
define('DOKU_CHANGE_TYPE_MINOR_EDIT',   'e');
define('DOKU_CHANGE_TYPE_DELETE',       'D');
define('DOKU_CHANGE_TYPE_REVERT',       'R');

/**
 * Parses a changelog line into its components
 *
 * A changelog line consists of tab separated fields in the order
 * date, ip, type, id, user, sum, extra. Lines with fewer than two fields
 * are rejected. Lines with two to six fields are accepted and the missing
 * fields are returned as empty strings.
 *
 * @param string $line a single changelog line (a trailing newline is ignored)
 * @return array|bool  associative array with the keys date, ip, type, id,
 *                     user, sum and extra - or false if the line could not
 *                     be parsed
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function parseChangelogLine($line) {
    // strip the line terminator first so it never ends up in the last field
    $tmp = explode("\t", rtrim((string) $line, "\n"));
    if (count($tmp) < 2) { return false; }

    // short (truncated/legacy) lines must not trigger undefined offset errors
    $tmp = array_pad($tmp, 7, '');

    return array(
        'date'  => (int) $tmp[0],          // unix timestamp
        'ip'    => $tmp[1],                // IPv4 address (127.0.0.1)
        'type'  => $tmp[2],                // log line type
        'id'    => $tmp[3],                // page id
        'user'  => $tmp[4],                // user name
        'sum'   => $tmp[5],                // edit summary (or action reason)
        'extra' => rtrim($tmp[6], "\n"),   // extra data (varies by line type)
    );
}

/**
 * Adds an entry to the changelog and saves the metadata for the page
 *
 * The entry is written to the page's own changelog and to the global
 * changelog configured in $conf['changelog']. Unless the change is a
 * deletion, the page metadata (creation/modification date, creator,
 * contributor, last_change) is updated as well.
 *
 * @param int    $date    Timestamp of the change (current time is used if empty)
 * @param String $id      Name of the affected page
 * @param String $type    Type of the change see DOKU_CHANGE_TYPE_*
 * @param String $summary Summary of the change
 * @param mixed  $extra   In case of a revert the revision (timestamp) of the reverted page
 * @param array  $flags   Additional flags in a key value array.
 *                        Available flags:
 *                        - ExternalEdit - mark as an external edit.
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @author Esther Brunner <wikidesign@gmail.com>
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function addLogEntry($date, $id, $type=DOKU_CHANGE_TYPE_EDIT, $summary='', $extra='', $flags=null){
    global $conf, $INFO;

    // check for special flags as keys
    if (!is_array($flags)) { $flags = array(); }
    $flagExternalEdit = isset($flags['ExternalEdit']);

    $id = cleanid($id);
    $file = wikiFN($id);
    $created = @filectime($file);
    $minor = ($type===DOKU_CHANGE_TYPE_MINOR_EDIT);
    $wasRemoved = ($type===DOKU_CHANGE_TYPE_DELETE);

    if(!$date) $date = time(); //use current time if none supplied

    if ($flagExternalEdit) {
        // external edits are not attributed to the current request
        $remote = '127.0.0.1';
        $user   = '';
    } else {
        $remote = clientIP(true);
        // REMOTE_USER is not set for anonymous requests
        $user   = isset($_SERVER['REMOTE_USER']) ? $_SERVER['REMOTE_USER'] : '';
    }

    // tabs and newlines are field/record separators and must not occur in values
    $strip = array("\t", "\n");
    $logline = array(
        'date'  => $date,
        'ip'    => $remote,
        'type'  => str_replace($strip, '', $type),
        'id'    => $id,
        'user'  => $user,
        'sum'   => utf8_substr(str_replace($strip, '', $summary),0,255),
        'extra' => str_replace($strip, '', $extra)
    );

    // update metadata
    if (!$wasRemoved) {
        $oldmeta = p_read_metadata($id);
        $meta    = array();
        if (!$INFO['exists'] && empty($oldmeta['persistent']['date']['created'])){ // newly created
            $meta['date']['created'] = $created;
            if ($user){
                $meta['creator'] = $INFO['userinfo']['name'];
                $meta['user']    = $user;
            }
        } elseif (!$INFO['exists'] && !empty($oldmeta['persistent']['date']['created'])) { // re-created / restored
            $meta['date']['created']  = $oldmeta['persistent']['date']['created'];
            $meta['date']['modified'] = $created; // use the files ctime here
            $meta['creator'] = $oldmeta['persistent']['creator'];
            if ($user) $meta['contributor'][$user] = $INFO['userinfo']['name'];
        } elseif (!$minor) {   // non-minor modification
            $meta['date']['modified'] = $date;
            if ($user) $meta['contributor'][$user] = $INFO['userinfo']['name'];
        }
        $meta['last_change'] = $logline;
        p_set_metadata($id, $meta);
    }

    // add changelog lines
    $logline = implode("\t", $logline)."\n";
    io_saveFile(metaFN($id,'.changes'),$logline,true); //page changelog
    io_saveFile($conf['changelog'],$logline,true); //global changelog cache
}

/**
 * Adds an entry to the media changelog
 *
 * The entry is written to the global media changelog configured in
 * $conf['media_changelog'] and to the media file's own changelog.
 *
 * @param int    $date    Timestamp of the change (current time is used if empty)
 * @param String $id      Name of the affected media file
 * @param String $type    Type of the change see DOKU_CHANGE_TYPE_*
 * @param String $summary Summary of the change
 * @param mixed  $extra   Extra data stored with the log line
 * @param array  $flags   Accepted for symmetry with addLogEntry(); currently unused
 *
 * @author Michael Hamann <michael@content-space.de>
 * @author Andreas Gohr <andi@splitbrain.org>
 * @author Esther Brunner <wikidesign@gmail.com>
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function addMediaLogEntry($date, $id, $type=DOKU_CHANGE_TYPE_EDIT, $summary='', $extra='', $flags=null){
    global $conf;

    $id = cleanid($id);

    if(!$date) $date = time(); //use current time if none supplied
    $remote = clientIP(true);
    // REMOTE_USER is not set for anonymous requests
    $user   = isset($_SERVER['REMOTE_USER']) ? $_SERVER['REMOTE_USER'] : '';

    // tabs and newlines are field/record separators and must not occur in values
    $strip = array("\t", "\n");
    $logline = array(
        'date'  => $date,
        'ip'    => $remote,
        'type'  => str_replace($strip, '', $type),
        'id'    => $id,
        'user'  => $user,
        'sum'   => utf8_substr(str_replace($strip, '', $summary),0,255),
        'extra' => str_replace($strip, '', $extra)
    );

    // add changelog lines
    $logline = implode("\t", $logline)."\n";
    io_saveFile($conf['media_changelog'],$logline,true); //global media changelog cache
    io_saveFile(mediaMetaFN($id,'.changes'),$logline,true); //media file's changelog
}

/**
 * Returns an array of recently changed files using the
 * changelog
 *
 * The following constants can be used to control which changes are
 * included. Add them together as needed.
 *
 * RECENTS_SKIP_DELETED   - don't include deleted pages
 * RECENTS_SKIP_MINORS    - don't include minor changes
 * RECENTS_SKIP_SUBSPACES - don't include subspaces
 * RECENTS_MEDIA_CHANGES  - return media changes instead of page changes
 * RECENTS_MEDIA_PAGES_MIXED  - return both media changes and page changes
 *
 * @param int    $first   number of first entry returned (for paginating)
 * @param int    $num     return $num entries
 * @param string $ns      restrict to given namespace
 * @param int    $flags   see above
 * @return array recently changed files, newest first; media entries carry
 *               an additional 'media' => true element
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 * @author Kate Arzamastseva <pshns@ukr.net>
 */
function getRecents($first,$num,$ns='',$flags=0){
    global $conf;
    $recent = array();
    $count  = 0;

    if(!$num)
        return $recent;

    $mixed = (bool) ($flags & RECENTS_MEDIA_PAGES_MIXED);

    // read all recent changes. (kept short)
    if ($flags & RECENTS_MEDIA_CHANGES) {
        $lines = @file($conf['media_changelog']);
    } else {
        $lines = @file($conf['changelog']);
    }
    // a missing/unreadable changelog is treated like an empty one
    if ($lines === false) { $lines = array(); }
    $lines_position = count($lines)-1;

    $media_lines_position = 0;
    $media_lines = array();
    if ($mixed) {
        $media_lines = @file($conf['media_changelog']);
        if ($media_lines === false) { $media_lines = array(); }
        $media_lines_position = count($media_lines)-1;
    }

    $seen = array(); // caches seen lines, _handleRecent() skips them

    // the next candidate of each log, false while none has been fetched
    $rec       = false;
    $media_rec = false;

    // handle lines - both logs are walked backwards (newest entry first)
    while ($lines_position >= 0 || ($mixed && $media_lines_position >= 0)) {
        if (!$rec && $lines_position >= 0) {
            $rec = _handleRecent($lines[$lines_position], $ns, $flags, $seen);
            if (!$rec) {
                $lines_position--;
                continue;
            }
        }
        if ($mixed && !$media_rec && $media_lines_position >= 0) {
            $media_rec = _handleRecent($media_lines[$media_lines_position], $ns, $flags | RECENTS_MEDIA_CHANGES, $seen);
            if (!$media_rec) {
                $media_lines_position--;
                continue;
            }
        }

        // in mixed mode emit the newer of both candidates, media wins a tie
        if ($mixed && $media_rec && (!$rec || $media_rec['date'] >= $rec['date'])) {
            $media_lines_position--;
            $x = $media_rec;
            $x['media'] = true;
            $media_rec = false;
        } else {
            $lines_position--;
            $x = $rec;
            if ($flags & RECENTS_MEDIA_CHANGES) $x['media'] = true;
            $rec = false;
        }

        if(--$first >= 0) continue; // skip first entries
        $recent[] = $x;
        $count++;
        // break when we have enough entries
        if($count >= $num){ break; }
    }
    return $recent;
}

/**
 * Returns an array of files changed since a given time using the
 * changelog
 *
 * The following constants can be used to control which changes are
 * included. Add them together as needed.
 *
 * RECENTS_SKIP_DELETED   - don't include deleted pages
 * RECENTS_SKIP_MINORS    - don't include minor changes
 * RECENTS_SKIP_SUBSPACES - don't include subspaces
 * RECENTS_MEDIA_CHANGES  - return media changes instead of page changes
 *
 * @param int    $from    date of the oldest entry to return
 * @param int    $to      date of the newest entry to return (for pagination, optional)
 * @param string $ns      restrict to given namespace (optional)
 * @param int    $flags   see above (optional)
 * @return array of files, oldest first
 *
 * @author Michael Hamann <michael@content-space.de>
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function getRecentsSince($from,$to=null,$ns='',$flags=0){
    global $conf;
    $recent = array();

    if($to && $to < $from)
        return $recent;

    // read all recent changes. (kept short)
    if ($flags & RECENTS_MEDIA_CHANGES) {
        $lines = @file($conf['media_changelog']);
    } else {
        $lines = @file($conf['changelog']);
    }
    if(!$lines) return $recent;

    // we start searching at the end of the list
    $lines = array_reverse($lines);

    // handle lines
    $seen = array(); // caches seen lines, _handleRecent() skips them

    foreach($lines as $line){
        $rec = _handleRecent($line, $ns, $flags, $seen);
        if($rec === false) continue;

        // the first accepted entry older than $from ends the search
        if ($rec['date'] < $from) break;

        if (!$to || $rec['date'] <= $to) {
            $recent[] = $rec;
        }
    }

    return array_reverse($recent);
}

/**
 * Internal function used by getRecents
 *
 * Parses a changelog line and applies the filters selected by $flags and
 * $ns. Accepted entries get an additional 'perms' element holding the
 * result of the ACL check.
 *
 * don't call directly
 *
 * @param string $line   changelog line
 * @param string $ns     restrict to given namespace
 * @param int    $flags  flags to control which changes are included, see getRecents()
 * @param array  $seen   ids of entries handled so far, updated by this function
 * @return array|bool    the parsed entry or false if the line is to be skipped
 *
 * @see getRecents()
 * @author Andreas Gohr <andi@splitbrain.org>
 * @author Ben Coburn <btcoburn@silicodon.net>
 */
function _handleRecent($line,$ns,$flags,&$seen){
    if(empty($line)) return false;   //skip empty lines

    // split the line into parts
    $recent = parseChangelogLine($line);
    if ($recent===false) { return false; }

    // skip seen ones
    if(isset($seen[$recent['id']])) return false;

    // skip minors (without marking the id as seen, so an older
    // non-minor change of the same id can still be reported)
    if($recent['type']===DOKU_CHANGE_TYPE_MINOR_EDIT && ($flags & RECENTS_SKIP_MINORS)) return false;

    // remember in seen to skip additional sights
    $seen[$recent['id']] = 1;

    // check if it's a hidden page
    if(isHiddenPage($recent['id'])) return false;

    // filter namespace
    if (($ns) && (strpos($recent['id'],$ns.':') !== 0)) return false;

    // exclude subnamespaces
    // (the comparison is intentionally loose, getNS() may not return a string)
    if (($flags & RECENTS_SKIP_SUBSPACES) && (getNS($recent['id']) != $ns)) return false;

    // check ACL
    if ($flags & RECENTS_MEDIA_CHANGES) {
        $recent['perms'] = auth_quickaclcheck(getNS($recent['id']).':*');
    } else {
        $recent['perms'] = auth_quickaclcheck($recent['id']);
    }
    if ($recent['perms'] < AUTH_READ) return false;

    // check existence
    if($flags & RECENTS_SKIP_DELETED){
        $fn = (($flags & RECENTS_MEDIA_CHANGES) ? mediaFN($recent['id']) : wikiFN($recent['id']));
        if(!@file_exists($fn)) return false;
    }

    return $recent;
}

/**
 * Get the changelog information for a specific page id
 * and revision (timestamp). Adjacent changelog lines
 * are optimistically parsed and cached to speed up
 * consecutive calls to getRevisionInfo. For large
 * changelog files, only the chunk containing the
 * requested changelog line is read.
 *
 * @param string $id          page or media id
 * @param int    $rev         revision (timestamp) to look up
 * @param int    $chunk_size  files smaller than this (or any file when 0) are
 *                            read as a whole, larger ones are searched by chunk
 * @param bool   $media       look up the media changelog instead of the page changelog
 * @return array|bool         the parsed changelog line or false if it was not found
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 * @author Kate Arzamastseva <pshns@ukr.net>
 */
function getRevisionInfo($id, $rev, $chunk_size=8192, $media=false) {
    global $cache_revinfo;
    $cache =& $cache_revinfo;
    if (!isset($cache[$id])) { $cache[$id] = array(); }
    $rev = max($rev, 0);

    // check if it's already in the memory cache
    if (isset($cache[$id][$rev])) {
        return $cache[$id][$rev];
    }

    if ($media) {
        $file = mediaMetaFN($id, '.changes');
    } else {
        $file = metaFN($id, '.changes');
    }
    if (!@file_exists($file)) { return false; }
    if (filesize($file)<$chunk_size || $chunk_size==0) {
        // read whole file
        $lines = file($file);
        if ($lines===false) { return false; }
    } else {
        // read by chunk
        $fp = fopen($file, 'rb'); // "file pointer"
        if ($fp===false) { return false; }
        $head = 0;
        fseek($fp, 0, SEEK_END);
        $tail = ftell($fp);
        $finger = 0;
        $finger_rev = 0;

        // find chunk - binary search over the file, which is ordered by date
        while ($tail-$head>$chunk_size) {
            $finger = (int) ($head+floor(($tail-$head)/2.0));
            fseek($fp, $finger);
            fgets($fp); // slip the finger forward to a new line
            $finger = ftell($fp);
            $tmp = fgets($fp); // then read at that location
            $tmp = parseChangelogLine($tmp);
            // an unparsable line is treated as "not newer than $rev"
            $finger_rev = ($tmp !== false) ? $tmp['date'] : 0;
            if ($finger==$head || $finger==$tail) { break; }
            if ($finger_rev>$rev) {
                $tail = $finger;
            } else {
                $head = $finger;
            }
        }

        if ($tail-$head<1) {
            // could not find chunk, assume requested rev is missing
            fclose($fp);
            return false;
        }

        // read chunk
        $chunk = '';
        $chunk_size = max($tail-$head, 0); // found chunk size
        $got = 0;
        fseek($fp, $head);
        while ($got<$chunk_size && !feof($fp)) {
            $tmp = @fread($fp, max($chunk_size-$got, 0));
            if ($tmp===false) { break; } //error state
            $got += strlen($tmp);
            $chunk .= $tmp;
        }
        $lines = explode("\n", $chunk);
        array_pop($lines); // remove trailing newline
        fclose($fp);
    }

    // parse and cache changelog lines
    foreach ($lines as $value) {
        $tmp = parseChangelogLine($value);
        if ($tmp!==false) {
            $cache[$id][$tmp['date']] = $tmp;
        }
    }
    if (!isset($cache[$id][$rev])) { return false; }
    return $cache[$id][$rev];
}

/**
 * Return a list of page revisions numbers
 * Does not guarantee that the revision exists in the attic,
 * only that a line with the date exists in the changelog.
 * By default the current revision is skipped.
 *
 * The current revision is automatically skipped when the page exists.
 * See $INFO['meta']['last_change'] for the current revision.
 *
 * For efficiency, the log lines are parsed and cached for later
 * calls to getRevisionInfo. Large changelog files are read
 * backwards in chunks until the requested number of changelog
 * lines are received.
 *
 * @param string $id          the page (or media file) of interest
 * @param int    $first       skip the first n changelog lines
 * @param int    $num         number of revisions to return
 * @param int    $chunk_size  files smaller than this (or any file when 0) are
 *                            read as a whole, larger ones are read in chunks
 * @param bool   $media       use the media changelog instead of the page changelog
 * @return array              list of revision timestamps, newest first
 *
 * @author Ben Coburn <btcoburn@silicodon.net>
 * @author Kate Arzamastseva <pshns@ukr.net>
 */
function getRevisions($id, $first, $num, $chunk_size=8192, $media=false) {
    global $cache_revinfo;
    $cache =& $cache_revinfo;
    if (!isset($cache[$id])) { $cache[$id] = array(); }

    $revs = array();
    $lines = array();
    $count  = 0;
    if ($media) {
        $file = mediaMetaFN($id, '.changes');
    } else {
        $file = metaFN($id, '.changes');
    }
    $num = max($num, 0);
    if ($num == 0) { return $revs; }

    $chunk_size = max($chunk_size, 0);
    if ($first<0) {
        $first = 0;
    } else if ((!$media && @file_exists(wikiFN($id))) || ($media && @file_exists(mediaFN($id)))) {
        // skip current revision if the page exists
        $first = max($first+1, 0);
    }

    if (!@file_exists($file)) { return $revs; }
    if (filesize($file)<$chunk_size || $chunk_size==0) {
        // read whole file
        $lines = file($file);
        if ($lines===false) { return $revs; }
    } else {
        // read chunks backwards
        $fp = fopen($file, 'rb'); // "file pointer"
        if ($fp===false) { return $revs; }
        fseek($fp, 0, SEEK_END);
        $tail = ftell($fp);

        // chunk backwards
        $finger = max($tail-$chunk_size, 0);
        while ($count<$num+$first) {
            fseek($fp, $finger);
            $nl = $finger;
            if ($finger>0) {
                fgets($fp); // slip the finger forward to a new line
                $nl = ftell($fp);
            }

            // was the chunk big enough? if not, take another bite
            if($nl > 0 && $tail <= $nl){
                $finger = max($finger-$chunk_size, 0);
                continue;
            }else{
                $finger = $nl;
            }

            // read chunk
            $chunk = '';
            $read_size = max($tail-$finger, 0); // found chunk size
            $got = 0;
            while ($got<$read_size && !feof($fp)) {
                $tmp = @fread($fp, max($read_size-$got, 0));
                if ($tmp===false) { break; } //error state
                $got += strlen($tmp);
                $chunk .= $tmp;
            }
            $tmp = explode("\n", $chunk);
            array_pop($tmp); // remove trailing newline

            // combine with previous chunk
            $count += count($tmp);
            $lines = array_merge($tmp, $lines);

            // next chunk
            if ($finger==0) { break; } // already read all the lines
            else {
                $tail = $finger;
                $finger = max($tail-$chunk_size, 0);
            }
        }
        fclose($fp);
    }

    // skip parsing extra lines
    $num = max(min(count($lines)-$first, $num), 0);
    if      ($first>0 && $num>0)  { $lines = array_slice($lines, max(count($lines)-$first-$num, 0), $num); }
    else if ($first>0 && $num==0) { $lines = array_slice($lines, 0, max(count($lines)-$first, 0)); }
    else if ($first==0 && $num>0) { $lines = array_slice($lines, max(count($lines)-$num, 0)); }

    // handle lines in reverse order
    for ($i = count($lines)-1; $i >= 0; $i--) {
        $tmp = parseChangelogLine($lines[$i]);
        if ($tmp!==false) {
            $cache[$id][$tmp['date']] = $tmp;
            $revs[] = $tmp['date'];
        }
    }

    return $revs;
}