<?php

namespace dokuwiki\ChangeLog;

use dokuwiki\Logger;

/**
 * ChangeLog Prototype; methods for handling changelog
 *
 * Low level helpers such as readloglines(), readAdjacentChunk(), getNewlinepointer(),
 * parseLogLine(), setChunkSize() and getChangelogFilename() are not defined in this class;
 * presumably they are provided by ChangeLogTrait.
 */
abstract class ChangeLog
{
    use ChangeLogTrait;

    /** @var string id of the page or media file this changelog belongs to */
    protected $id;
    /** @var false|int current revision identifier; unset until determined, false if item never existed */
    protected $currentRevision;
    /** @var array revision info cache, shared by reference with the global $cache_revinfo */
    protected $cache = [];

    /**
     * Constructor
     *
     * @param string $id page id
     * @param int $chunk_size maximum block size read from file
     */
    public function __construct($id, $chunk_size = 8192)
    {
        global $cache_revinfo;

        // all instances share one cache pool, keyed by id and then by revision date
        $this->cache =& $cache_revinfo;
        if (!isset($this->cache[$id])) {
            $this->cache[$id] = [];
        }

        $this->id = $id;
        $this->setChunkSize($chunk_size);
    }

    /**
     * Returns path to current page/media
     *
     * NOTE(review): getCurrentRevisionInfo() calls this method with a revision timestamp
     * argument, so implementations presumably accept an optional $rev parameter - confirm
     * against the subclasses before tightening this signature.
     *
     * @return string path to file
     */
    abstract protected function getFilename();

    /**
     * Check whether given revision is the current page
     *
     * @param int $rev timestamp of current page
     * @return bool true if $rev is current revision, otherwise false
     */
    public function isCurrentRevision($rev)
    {
        return $rev == $this->currentRevision();
    }

    /**
     * Checks if the revision is last revision
     *
     * The comparison is strict, so $rev has to be of the same type as the value
     * returned by lastRevision().
     *
     * @param int $rev revision timestamp
     * @return bool true if $rev is last revision, otherwise false
     */
    public function isLastRevision($rev = null)
    {
        return $rev === $this->lastRevision();
    }

    /**
     * Return the current revision identifier
     *
     * The "current" revision means current version of the page or media file. It is either
     * identical with or newer than the "last" revision, that depends on whether the file
     * has been modified, created or deleted outside of DokuWiki.
     * The value of identifier can be determined by timestamp as far as the file exists,
     * otherwise it must be assigned larger than any other revisions to keep them sortable.
     *
     * @return int|false revision timestamp
     */
    public function currentRevision()
    {
        if (!isset($this->currentRevision)) {
            // set ChangeLog::currentRevision property
            $this->getCurrentRevisionInfo();
        }
        return $this->currentRevision;
    }

    /**
     * Return the last revision identifier, date value of the last entry of the changelog
     *
     * @return int|false revision timestamp, false when no revision could be read
     */
    public function lastRevision()
    {
        $revs = $this->getRevisions(-1, 1);
        return empty($revs) ? false : $revs[0];
    }

    /**
     * Save revision info to the cache pool
     *
     * An already cached entry for the same date is kept, it is never overwritten.
     *
     * @param array $info Revision info structure
     * @return bool true when $info is an array (and thus considered cached), otherwise false
     */
    protected function cacheRevisionInfo($info)
    {
        if (!is_array($info)) return false;
        $this->cache[$this->id][$info['date']] ??= $info;
        return true;
    }

    /**
     * Get the changelog information for a specific revision (timestamp)
     *
     * Adjacent changelog lines are optimistically parsed and cached to speed up
     * consecutive calls to getRevisionInfo. For large changelog files, only the chunk
     * containing the requested changelog line is read.
     *
     * @param int $rev revision timestamp
     * @param bool $retrieveCurrentRevInfo allows to skip for getting other revision info in the
     *                                     getCurrentRevisionInfo() where $currentRevision is not yet determined
     * @return bool|array false or array with entries:
     *      - date:  unix timestamp
     *      - ip:    IPv4 address (127.0.0.1)
     *      - type:  log line type
     *      - id:    page id
     *      - user:  user name
     *      - sum:   edit summary (or action reason)
     *      - extra: extra data (varies by line type)
     *      - sizechange: change of filesize
     *
     * @author Ben Coburn <btcoburn@silicodon.net>
     * @author Kate Arzamastseva <pshns@ukr.net>
     */
    public function getRevisionInfo($rev, $retrieveCurrentRevInfo = true)
    {
        $rev = max(0, $rev);
        if (!$rev) return false;

        //ensure the external edits are cached as well
        if (!isset($this->currentRevision) && $retrieveCurrentRevInfo) {
            $this->getCurrentRevisionInfo();
        }

        // check if it's already in the memory cache
        if (isset($this->cache[$this->id]) && isset($this->cache[$this->id][$rev])) {
            return $this->cache[$this->id][$rev];
        }

        //read lines from changelog
        [$fp, $lines] = $this->readloglines($rev);
        if ($fp) {
            fclose($fp);
        }
        if (empty($lines)) return false;

        // parse and cache changelog lines
        foreach ($lines as $value) {
            $info = static::parseLogLine($value);
            $this->cacheRevisionInfo($info);
        }
        if (!isset($this->cache[$this->id][$rev])) {
            return false;
        }
        return $this->cache[$this->id][$rev];
    }

    /**
     * Return a list of page revisions numbers
     *
     * Does not guarantee that the revision exists in the attic,
     * only that a line with the date exists in the changelog.
     * By default the current revision is skipped.
     *
     * The current revision is automatically skipped when the page exists.
     * See $INFO['meta']['last_change'] for the current revision.
     * A negative $first lets read the current revision too.
     *
     * For efficiency, the log lines are parsed and cached for later
     * calls to getRevisionInfo. Large changelog files are read
     * backwards in chunks until the requested number of changelog
     * lines are received.
     *
     * @param int $first skip the first n changelog lines
     * @param int $num number of revisions to return
     * @return array with the revision timestamps, newest first
     *
     * @author Ben Coburn <btcoburn@silicodon.net>
     * @author Kate Arzamastseva <pshns@ukr.net>
     */
    public function getRevisions($first, $num)
    {
        $revs = [];
        $lines = [];
        $count = 0;

        $logfile = $this->getChangelogFilename();
        if (!file_exists($logfile)) return $revs;

        $num = max($num, 0);
        if ($num == 0) {
            return $revs;
        }

        if ($first < 0) {
            $first = 0;
        } else {
            $fileLastMod = $this->getFilename();
            if (file_exists($fileLastMod) && $this->isLastRevision(filemtime($fileLastMod))) {
                // skip last revision if the page exists
                $first = max($first + 1, 0);
            }
        }

        if (filesize($logfile) < $this->chunk_size || $this->chunk_size == 0) {
            // read whole file
            $lines = file($logfile);
            if ($lines === false) {
                return $revs;
            }
        } else {
            // read chunks backwards
            $fp = fopen($logfile, 'rb'); // "file pointer"
            if ($fp === false) {
                return $revs;
            }
            fseek($fp, 0, SEEK_END);
            $tail = ftell($fp);

            // chunk backwards
            $finger = max($tail - $this->chunk_size, 0);
            while ($count < $num + $first) {
                $nl = $this->getNewlinepointer($fp, $finger);

                // was the chunk big enough? if not, take another bite
                if ($nl > 0 && $tail <= $nl) {
                    $finger = max($finger - $this->chunk_size, 0);
                    continue;
                } else {
                    $finger = $nl;
                }

                // read chunk
                $chunk = '';
                $read_size = max($tail - $finger, 0); // found chunk size
                $got = 0;
                while ($got < $read_size && !feof($fp)) {
                    $tmp = @fread($fp, max(min($this->chunk_size, $read_size - $got), 0));
                    if ($tmp === false) {
                        break;
                    } //error state
                    $got += strlen($tmp);
                    $chunk .= $tmp;
                }
                $tmp = explode("\n", $chunk);
                array_pop($tmp); // remove trailing newline

                // combine with previous chunk
                $count += count($tmp);
                $lines = [...$tmp, ...$lines];

                // next chunk
                if ($finger == 0) {
                    break; // already read all the lines
                } else {
                    $tail = $finger;
                    $finger = max($tail - $this->chunk_size, 0);
                }
            }
            fclose($fp);
        }

        // skip parsing extra lines
        $num = max(min(count($lines) - $first, $num), 0);
        if ($first > 0 && $num > 0) {
            $lines = array_slice($lines, max(count($lines) - $first - $num, 0), $num);
        } elseif ($first > 0 && $num == 0) {
            $lines = array_slice($lines, 0, max(count($lines) - $first, 0));
        } elseif ($first == 0 && $num > 0) {
            $lines = array_slice($lines, max(count($lines) - $num, 0));
        }

        // handle lines in reverse order
        for ($i = count($lines) - 1; $i >= 0; $i--) {
            $info = static::parseLogLine($lines[$i]);
            if ($this->cacheRevisionInfo($info)) {
                $revs[] = $info['date'];
            }
        }

        return $revs;
    }

    /**
     * Get the nth revision left or right-hand side for a specific page id and revision (timestamp)
     *
     * For large changelog files, only the chunk containing the
     * reference revision $rev is read and sometimes a next chunk.
     *
     * Adjacent changelog lines are optimistically parsed and cached to speed up
     * consecutive calls to getRevisionInfo.
     *
     * @param int $rev revision timestamp used as start date
     *    (doesn't need to be exact revision number)
     * @param int $direction give position of returned revision with respect to $rev;
     *    positive=next, negative=prev
     * @return bool|int
     *      timestamp of the requested revision
     *      otherwise false
     */
    public function getRelativeRevision($rev, $direction)
    {
        $rev = max($rev, 0);
        $direction = (int)$direction;

        //no direction given or last rev, so no follow-up
        if (!$direction || ($direction > 0 && $this->isCurrentRevision($rev))) {
            return false;
        }

        //get lines from changelog
        [$fp, $lines, $head, $tail, $eof] = $this->readloglines($rev);
        if (empty($lines)) {
            // do not leak the file pointer that may have been opened for chunked reading
            if ($fp) {
                fclose($fp);
            }
            return false;
        }

        // look for revisions later/earlier than $rev, when found count till the wanted revision is reached
        // also parse and cache changelog lines for getRevisionInfo().
        $revCounter = 0;
        $relativeRev = false;
        $checkOtherChunk = true; //always runs once
        while (!$relativeRev && $checkOtherChunk) {
            $info = [];
            //parse in normal or reverse order
            $count = count($lines);
            if ($direction > 0) {
                $start = 0;
                $step = 1;
            } else {
                $start = $count - 1;
                $step = -1;
            }
            for ($i = $start; $i >= 0 && $i < $count; $i += $step) {
                $info = static::parseLogLine($lines[$i]);
                if ($this->cacheRevisionInfo($info)) {
                    //look for revs older/earlier then reference $rev and select $direction-th one
                    if (($direction > 0 && $info['date'] > $rev) || ($direction < 0 && $info['date'] < $rev)) {
                        $revCounter++;
                        if ($revCounter == abs($direction)) {
                            $relativeRev = $info['date'];
                        }
                    }
                }
            }

            //true when $rev is found, but not the wanted follow-up.
            // $info holds the last parsed line and may be a non-array when that line could not
            // be parsed; "?? null" keeps the comparison result but avoids an offset warning
            $checkOtherChunk = $fp
                && (($info['date'] ?? null) == $rev || ($revCounter > 0 && !$relativeRev))
                && (!($tail == $eof && $direction > 0) && !($head == 0 && $direction < 0));

            if ($checkOtherChunk) {
                [$lines, $head, $tail] = $this->readAdjacentChunk($fp, $head, $tail, $direction);

                if (empty($lines)) break;
            }
        }
        if ($fp) {
            fclose($fp);
        }

        return $relativeRev;
    }

    /**
     * Returns revisions around rev1 and rev2
     * When available it returns $max entries for each revision
     *
     * @param int $rev1 oldest revision timestamp
     * @param int $rev2 newest revision timestamp (0 looks up last revision)
     * @param int $max maximum number of revisions returned
     * @return array with two arrays with revisions surrounding rev1 respectively rev2
     */
    public function getRevisionsAround($rev1, $rev2, $max = 50)
    {
        // force an odd number so that the reference revision can sit in the middle
        $max = (int) (abs($max) / 2) * 2 + 1;
        $rev1 = max($rev1, 0);
        $rev2 = max($rev2, 0);

        if ($rev2) {
            if ($rev2 < $rev1) {
                $rev = $rev2;
                $rev2 = $rev1;
                $rev1 = $rev;
            }
        } else {
            //empty right side means a removed page. Look up last revision.
            $rev2 = $this->currentRevision();
        }
        //collect revisions around rev2
        [$revs2, $allRevs, $fp, $lines, $head, $tail] = $this->retrieveRevisionsAround($rev2, $max);

        if (empty($revs2)) {
            if ($fp) {
                fclose($fp);
            }
            return [[], []];
        }

        //collect revisions around rev1
        $index = array_search($rev1, $allRevs, true);
        if ($index === false) {
            //no overlapping revisions
            [$revs1, , $fpRev1] = $this->retrieveRevisionsAround($rev1, $max);
            if ($fpRev1) {
                fclose($fpRev1);
            }
            if (empty($revs1)) $revs1 = [];
        } else {
            //revisions overlaps, reuse revisions around rev2
            $lastRev = array_pop($allRevs); //keep last entry that could be external edit
            $revs1 = $allRevs;
            while ($head > 0) {
                for ($i = count($lines) - 1; $i >= 0; $i--) {
                    $info = static::parseLogLine($lines[$i]);
                    if ($this->cacheRevisionInfo($info)) {
                        $revs1[] = $info['date'];
                        $index++;

                        if ($index > (int) ($max / 2)) break 2;
                    }
                }

                [$lines, $head, $tail] = $this->readAdjacentChunk($fp, $head, $tail, -1);
            }
            sort($revs1);
            $revs1[] = $lastRev; //push back last entry

            //return wanted selection
            $revs1 = array_slice($revs1, max($index - (int) ($max / 2), 0), $max);
        }

        // the pointer handed over by retrieveRevisionsAround() is no longer needed
        if ($fp) {
            fclose($fp);
        }

        return [array_reverse($revs1), array_reverse($revs2)];
    }

    /**
     * Return an existing revision for a specific date which is
     * the current one or younger or equal then the date
     *
     * @param number $date_at timestamp
     * @return string|int|false '' for the current revision, the timestamp of the matching
     *                          older revision, or false when no such revision was found
     */
    public function getLastRevisionAt($date_at)
    {
        $fileLastMod = $this->getFilename();
        //requested date_at(timestamp) younger or equal then modified_time($this->id) => load current
        if (file_exists($fileLastMod) && $date_at >= @filemtime($fileLastMod)) {
            return '';
        } elseif ($rev = $this->getRelativeRevision($date_at + 1, -1)) {
            //+1 to get also the requested date revision
            return $rev;
        } else {
            return false;
        }
    }

    /**
     * Collect the $max revisions near to the timestamp $rev
     *
     * Ideally, half of retrieved timestamps are older than $rev, another half are newer.
     * The returned array $requestedRevs may not contain the reference timestamp $rev
     * when it does not match any revision value recorded in changelog.
     *
     * When false is returned, the file pointer has already been closed by this method.
     *
     * @param int $rev revision timestamp
     * @param int $max maximum number of revisions to be returned
     * @return bool|array
     *     return array with entries:
     *       - $requestedRevs: array of with $max revision timestamps
     *       - $revs: all parsed revision timestamps
     *       - $fp: file pointer only defined for chunk reading, needs closing.
     *       - $lines: non-parsed changelog lines before the parsed revisions
     *       - $head: position of first read changelog line
     *       - $lastTail: position of end of last read changelog line
     *     otherwise false
     */
    protected function retrieveRevisionsAround($rev, $max)
    {
        $revs = [];
        $afterCount = 0;
        $beforeCount = 0;

        //get lines from changelog
        [$fp, $lines, $startHead, $startTail, $eof] = $this->readloglines($rev);
        if (empty($lines)) {
            // the caller gets no handle back on failure, so close it here
            if ($fp) {
                fclose($fp);
            }
            return false;
        }

        //parse changelog lines in chunk, and read forward more chunks until $max/2 is reached
        $head = $startHead;
        $tail = $startTail;
        while (count($lines) > 0) {
            foreach ($lines as $line) {
                $info = static::parseLogLine($line);
                if ($this->cacheRevisionInfo($info)) {
                    $revs[] = $info['date'];
                    if ($info['date'] >= $rev) {
                        //count revs after reference $rev
                        $afterCount++;
                        if ($afterCount == 1) $beforeCount = count($revs);
                    }
                    //enough revs after reference $rev?
                    if ($afterCount > (int) ($max / 2)) break 2;
                }
            }
            //retrieve next chunk
            [$lines, $head, $tail] = $this->readAdjacentChunk($fp, $head, $tail, 1);
        }
        $lastTail = $tail;

        // add a possible revision of external edit, create or deletion
        if (
            $lastTail == $eof && $afterCount <= (int) ($max / 2) &&
            count($revs) && !$this->isCurrentRevision($revs[count($revs) - 1])
        ) {
            $revs[] = $this->currentRevision;
            $afterCount++;
        }

        if ($afterCount == 0) {
            //given timestamp $rev is newer than the most recent line in chunk
            if ($fp) {
                fclose($fp);
            }
            return false; //FIXME: or proceed to collect older revisions?
        }

        //read more chunks backward until $max/2 is reached and total number of revs is equal to $max
        $lines = [];
        $i = 0;
        $head = $startHead;
        $tail = $startTail;
        while ($head > 0) {
            [$lines, $head, $tail] = $this->readAdjacentChunk($fp, $head, $tail, -1);

            for ($i = count($lines) - 1; $i >= 0; $i--) {
                $info = static::parseLogLine($lines[$i]);
                if ($this->cacheRevisionInfo($info)) {
                    $revs[] = $info['date'];
                    $beforeCount++;
                    //enough revs before reference $rev?
                    if ($beforeCount > max((int) ($max / 2), $max - $afterCount)) break 2;
                }
            }
        }
        //keep only non-parsed lines
        $lines = array_slice($lines, 0, $i);

        sort($revs);

        //trunk desired selection
        $requestedRevs = array_slice($revs, -$max, $max);

        return [$requestedRevs, $revs, $fp, $lines, $head, $lastTail];
    }

    /**
     * Get the current revision information, considering external edit, create or deletion
     *
     * When the file has not been modified since its last revision, the information of the last
     * change that had already been recorded in the changelog is returned as current change info.
     * Otherwise, the change information since the last revision caused outside DokuWiki
     * should be returned, which is referred as "external revision".
     *
     * The change date of the file can be determined by timestamp as far as the file exists,
     * however this is not possible when the file has already been deleted outside of DokuWiki.
     * In such case we assign 1 sec before current time() for the external deletion.
     * As a result, the value of current revision identifier may change each time because:
     *   1) the file has again been modified outside of DokuWiki, or
     *   2) the value is essentially volatile for deleted but once existed files.
     *
     * @return bool|array false when page had never existed or array with entries:
     *      - date:  revision identifier (timestamp or last revision +1)
     *      - ip:    IPv4 address (127.0.0.1)
     *      - type:  log line type
     *      - id:    id of page or media
     *      - user:  user name
     *      - sum:   edit summary (or action reason)
     *      - extra: extra data (varies by line type)
     *      - sizechange: change of filesize
     *      - timestamp: unix timestamp or false (key set only for external edit occurred)
     *
     * @author  Satoshi Sahara <sahara.satoshi@gmail.com>
     */
    public function getCurrentRevisionInfo()
    {
        global $lang;

        if (isset($this->currentRevision)) return $this->getRevisionInfo($this->currentRevision);

        // get revision id from the item file timestamp and changelog
        $fileLastMod = $this->getFilename();
        $fileRev = @filemtime($fileLastMod); // false when the file not exist
        $lastRev = $this->lastRevision();    // false when no changelog

        if (!$fileRev && !$lastRev) {                // has never existed
            $this->currentRevision = false;
            return false;
        } elseif ($fileRev === $lastRev) {           // not external edit
            $this->currentRevision = $lastRev;
            return $this->getRevisionInfo($lastRev);
        }

        if (!$fileRev && $lastRev) {                 // item file does not exist
            // check consistency against changelog
            // ("?? null" tolerates a false result without raising an offset warning)
            $revInfo = $this->getRevisionInfo($lastRev, false);
            if (($revInfo['type'] ?? null) == DOKU_CHANGE_TYPE_DELETE) {
                $this->currentRevision = $lastRev;
                return $revInfo;
            }

            // externally deleted, set revision date as late as possible
            $revInfo = [
                'date' => max($lastRev + 1, time() - 1), // 1 sec before now or new page save
                'ip'   => '127.0.0.1',
                'type' => DOKU_CHANGE_TYPE_DELETE,
                'id'   => $this->id,
                'user' => '',
                'sum'  => $lang['deleted'].' - '.$lang['external_edit'].' ('.$lang['unknowndate'].')',
                'extra' => '',
                'sizechange' => -io_getSizeFile($this->getFilename($lastRev)),
                'timestamp' => false,
            ];
        } else {                                     // item file exists, with timestamp $fileRev
            // here, file timestamp $fileRev is different with last revision timestamp $lastRev in changelog
            $isJustCreated = $lastRev === false || (
                $fileRev > $lastRev &&
                ($this->getRevisionInfo($lastRev, false)['type'] ?? null) == DOKU_CHANGE_TYPE_DELETE
            );
            $filesize_new = filesize($this->getFilename());
            $filesize_old = $isJustCreated ? 0 : io_getSizeFile($this->getFilename($lastRev));
            $sizechange = $filesize_new - $filesize_old;

            if ($isJustCreated) {
                $timestamp = $fileRev;
                $sum = $lang['created'].' - '.$lang['external_edit'];
            } elseif ($fileRev > $lastRev) {
                $timestamp = $fileRev;
                $sum = $lang['external_edit'];
            } else {
                // $fileRev is older than $lastRev, that is erroneous/incorrect occurrence.
                $msg = "Warning: current file modification time is older than last revision date";
                $details = 'File revision: '.$fileRev.' '.dformat($fileRev, "%Y-%m-%d %H:%M:%S")."\n"
                          .'Last revision: '.$lastRev.' '.dformat($lastRev, "%Y-%m-%d %H:%M:%S");
                Logger::error($msg, $details, $this->getFilename());
                $timestamp = false;
                $sum = $lang['external_edit'].' ('.$lang['unknowndate'].')';
            }

            // externally created or edited
            $revInfo = [
                'date' => $timestamp ?: $lastRev + 1,
                'ip'   => '127.0.0.1',
                'type' => $isJustCreated ? DOKU_CHANGE_TYPE_CREATE : DOKU_CHANGE_TYPE_EDIT,
                'id'   => $this->id,
                'user' => '',
                'sum'  => $sum,
                'extra' => '',
                'sizechange' => $sizechange,
                'timestamp' => $timestamp,
            ];
        }

        // cache current revision information of external edition
        $this->currentRevision = $revInfo['date'];
        $this->cache[$this->id][$this->currentRevision] = $revInfo;
        return $this->getRevisionInfo($this->currentRevision);
    }

    /**
     * Mechanism to trace no-actual external current revision
     *
     * A revision identifier newer than the last changelog entry is replaced by the
     * current revision identifier; any other value is passed through unchanged.
     *
     * @param int $rev
     * @return int|false $rev itself, or the current revision identifier
     */
    public function traceCurrentRevision($rev)
    {
        if ($rev > $this->lastRevision()) {
            $rev = $this->currentRevision();
        }
        return $rev;
    }
}