cache =& $cache_revinfo; if (!isset($this->cache[$id])) { $this->cache[$id] = array(); } $this->id = $id; $this->setChunkSize($chunk_size); // set property currentRevision and cache prior to getRevisionInfo($currentRev) call $this->getCurrentRevisionInfo(); } /** * Set chunk size for file reading * Chunk size zero let read whole file at once * * @param int $chunk_size maximum block size read from file */ public function setChunkSize($chunk_size) { if (!is_numeric($chunk_size)) $chunk_size = 0; $this->chunk_size = (int)max($chunk_size, 0); } /** * Returns path to changelog * * @return string path to file */ abstract protected function getChangelogFilename(); /** * Returns path to current page/media * * @return string path to file */ abstract protected function getFilename(); /** * Save revision info to the cache pool * * @return bool */ protected function saveRevisionInfo($info) { if (!is_array($info)) return false; //$this->cache[$this->id][$info['date']] ??= $info; // since php 7.4 $this->cache[$this->id][$info['date']] = $this->cache[$this->id][$info['date']] ?? $info; return true; } /** * Get the changelog information for a specific page id and revision (timestamp) * * Adjacent changelog lines are optimistically parsed and cached to speed up * consecutive calls to getRevisionInfo. For large changelog files, only the chunk * containing the requested changelog line is read. * * @param int $rev revision timestamp * @return bool|array false or array with entries: * - date: unix timestamp * - ip: IPv4 address (127.0.0.1) * - type: log line type * - id: page id * - user: user name * - sum: edit summary (or action reason) * - extra: extra data (varies by line type) * - sizechange: change of filesize * * @author Ben Coburn * @author Kate Arzamastseva */ public function getRevisionInfo($rev) { $rev = max(0, $rev); if (!$rev) return false; // check if it's already in the memory cache if (isset($this->cache[$this->id]) && isset($this->cache[$this->id][$rev])) { return $this->cache[$this->id][$rev]; } //read lines from changelog list($fp, $lines) = $this->readloglines($rev); if ($fp) { fclose($fp); } if (empty($lines)) return false; // parse and cache changelog lines foreach ($lines as $value) { $info = parseChangelogLine($value); $this->saveRevisionInfo($info); } if (!isset($this->cache[$this->id][$rev])) { return false; } return $this->cache[$this->id][$rev]; } /** * Return a list of page revisions numbers * * Does not guarantee that the revision exists in the attic, * only that a line with the date exists in the changelog. * By default the current revision is skipped. * * The current revision is automatically skipped when the page exists. * See $INFO['meta']['last_change'] for the current revision. * A negative $first let read the current revision too. * * For efficiency, the log lines are parsed and cached for later * calls to getRevisionInfo. Large changelog files are read * backwards in chunks until the requested number of changelog * lines are recieved. * * @param int $first skip the first n changelog lines * @param int $num number of revisions to return * @return array with the revision timestamps * * @author Ben Coburn * @author Kate Arzamastseva */ public function getRevisions($first, $num) { $revs = array(); $lines = array(); $count = 0; $num = max($num, 0); if ($num == 0) { return $revs; } if ($first < 0) { $first = 0; } else { if (file_exists($this->getFilename()) && !$this->isExternalEdition()) { // skip current revision if the page exist and not external edition $first = max($first + 1, 0); } } $file = $this->getChangelogFilename(); if (!file_exists($file)) { return $revs; } if (filesize($file) < $this->chunk_size || $this->chunk_size == 0) { // read whole file $lines = file($file); if ($lines === false) { return $revs; } } else { // read chunks backwards $fp = fopen($file, 'rb'); // "file pointer" if ($fp === false) { return $revs; } fseek($fp, 0, SEEK_END); $tail = ftell($fp); // chunk backwards $finger = max($tail - $this->chunk_size, 0); while ($count < $num + $first) { $nl = $this->getNewlinepointer($fp, $finger); // was the chunk big enough? if not, take another bite if ($nl > 0 && $tail <= $nl) { $finger = max($finger - $this->chunk_size, 0); continue; } else { $finger = $nl; } // read chunk $chunk = ''; $read_size = max($tail - $finger, 0); // found chunk size $got = 0; while ($got < $read_size && !feof($fp)) { $tmp = @fread($fp, max(min($this->chunk_size, $read_size - $got), 0)); if ($tmp === false) { break; } //error state $got += strlen($tmp); $chunk .= $tmp; } $tmp = explode("\n", $chunk); array_pop($tmp); // remove trailing newline // combine with previous chunk $count += count($tmp); $lines = array_merge($tmp, $lines); // next chunk if ($finger == 0) { break; } else { // already read all the lines $tail = $finger; $finger = max($tail - $this->chunk_size, 0); } } fclose($fp); } // skip parsing extra lines $num = max(min(count($lines) - $first, $num), 0); if ($first > 0 && $num > 0) { $lines = array_slice($lines, max(count($lines) - $first - $num, 0), $num); } else { if ($first > 0 && $num == 0) { $lines = array_slice($lines, 0, max(count($lines) - $first, 0)); } elseif ($first == 0 && $num > 0) { $lines = array_slice($lines, max(count($lines) - $num, 0)); } } // handle lines in reverse order for ($i = count($lines) - 1; $i >= 0; $i--) { $info = parseChangelogLine($lines[$i]); if ($this->saveRevisionInfo($info)) { $revs[] = $info['date']; } } return $revs; } /** * Get the nth revision left or right handside for a specific page id and revision (timestamp) * * For large changelog files, only the chunk containing the * reference revision $rev is read and sometimes a next chunck. * * Adjacent changelog lines are optimistically parsed and cached to speed up * consecutive calls to getRevisionInfo. * * @param int $rev revision timestamp used as startdate (doesn't need to be revisionnumber) * @param int $direction give position of returned revision with respect to $rev; positive=next, negative=prev * @return bool|int * timestamp of the requested revision * otherwise false */ public function getRelativeRevision($rev, $direction) { $rev = max($rev, 0); $direction = (int)$direction; //no direction given or last rev, so no follow-up if (!$direction || ($direction > 0 && $this->isCurrentRevision($rev))) { return false; } //get lines from changelog list($fp, $lines, $head, $tail, $eof) = $this->readloglines($rev); if (empty($lines)) return false; // look for revisions later/earlier than $rev, when founded count till the wanted revision is reached // also parse and cache changelog lines for getRevisionInfo(). $revcounter = 0; $relativerev = false; $checkotherchunck = true; //always runs once while (!$relativerev && $checkotherchunck) { $info = array(); //parse in normal or reverse order $count = count($lines); if ($direction > 0) { $start = 0; $step = 1; } else { $start = $count - 1; $step = -1; } for ($i = $start; $i >= 0 && $i < $count; $i = $i + $step) { $info = parseChangelogLine($lines[$i]); if ($this->saveRevisionInfo($info)) { //look for revs older/earlier then reference $rev and select $direction-th one if (($direction > 0 && $info['date'] > $rev) || ($direction < 0 && $info['date'] < $rev)) { $revcounter++; if ($revcounter == abs($direction)) { $relativerev = $info['date']; } } } } //true when $rev is found, but not the wanted follow-up. $checkotherchunck = $fp && ($info['date'] == $rev || ($revcounter > 0 && !$relativerev)) && !(($tail == $eof && $direction > 0) || ($head == 0 && $direction < 0)); if ($checkotherchunck) { list($lines, $head, $tail) = $this->readAdjacentChunk($fp, $head, $tail, $direction); if (empty($lines)) break; } } if ($fp) { fclose($fp); } return $relativerev; } /** * Returns revisions around rev1 and rev2 * When available it returns $max entries for each revision * * @param int $rev1 oldest revision timestamp * @param int $rev2 newest revision timestamp (0 looks up last revision) * @param int $max maximum number of revisions returned * @return array with two arrays with revisions surrounding rev1 respectively rev2 */ public function getRevisionsAround($rev1, $rev2, $max = 50) { $max = intval(abs($max) / 2) * 2 + 1; $rev1 = max($rev1, 0); $rev2 = max($rev2, 0); if ($rev2) { if ($rev2 < $rev1) { $rev = $rev2; $rev2 = $rev1; $rev1 = $rev; } } else { //empty right side means a removed page. Look up last revision. $rev2 = $this->currentRevision(); } //collect revisions around rev2 list($revs2, $allrevs, $fp, $lines, $head, $tail) = $this->retrieveRevisionsAround($rev2, $max); if (empty($revs2)) return array(array(), array()); //collect revisions around rev1 $index = array_search($rev1, $allrevs); if ($index === false) { //no overlapping revisions list($revs1, , , , ,) = $this->retrieveRevisionsAround($rev1, $max); if (empty($revs1)) $revs1 = array(); } else { //revisions overlaps, reuse revisions around rev2 $lastrev = array_pop($allrevs); //keep last entry that could be external edit $revs1 = $allrevs; while ($head > 0) { for ($i = count($lines) - 1; $i >= 0; $i--) { $info = parseChangelogLine($lines[$i]); if ($this->saveRevisionInfo($info)) { $revs1[] = $info['date']; $index++; if ($index > intval($max / 2)) break 2; } } list($lines, $head, $tail) = $this->readAdjacentChunk($fp, $head, $tail, -1); } sort($revs1); $revs1[] = $lastrev; //push back last entry //return wanted selection $revs1 = array_slice($revs1, max($index - intval($max / 2), 0), $max); } return array(array_reverse($revs1), array_reverse($revs2)); } /** * Checks if the ID has old revisons * @return boolean */ public function hasRevisions() { $file = $this->getChangelogFilename(); return file_exists($file); } /** * Returns lines from changelog. * If file larger than $chuncksize, only chunck is read that could contain $rev. * * When reference timestamp $rev is outside time range of changelog, readloglines() will return * lines in first or last chunk, but they obviously does not contain $rev. * * @param int $rev revision timestamp * @return array|false * if success returns array(fp, array(changeloglines), $head, $tail, $eof) * where fp only defined for chuck reading, needs closing. * otherwise false */ protected function readloglines($rev) { $file = $this->getChangelogFilename(); if (!file_exists($file)) { return false; } $fp = null; $head = 0; $tail = 0; $eof = 0; if (filesize($file) < $this->chunk_size || $this->chunk_size == 0) { // read whole file $lines = file($file); if ($lines === false) { return false; } } else { // read by chunk $fp = fopen($file, 'rb'); // "file pointer" if ($fp === false) { return false; } $head = 0; fseek($fp, 0, SEEK_END); $eof = ftell($fp); $tail = $eof; // find chunk while ($tail - $head > $this->chunk_size) { $finger = $head + intval(($tail - $head) / 2); $finger = $this->getNewlinepointer($fp, $finger); $tmp = fgets($fp); if ($finger == $head || $finger == $tail) { break; } $info = parseChangelogLine($tmp); $finger_rev = $info['date']; if ($finger_rev > $rev) { $tail = $finger; } else { $head = $finger; } } if ($tail - $head < 1) { // cound not find chunk, assume requested rev is missing fclose($fp); return false; } $lines = $this->readChunk($fp, $head, $tail); } return array( $fp, $lines, $head, $tail, $eof, ); } /** * Read chunk and return array with lines of given chunck. * Has no check if $head and $tail are really at a new line * * @param resource $fp resource filepointer * @param int $head start point chunck * @param int $tail end point chunck * @return array lines read from chunck */ protected function readChunk($fp, $head, $tail) { $chunk = ''; $chunk_size = max($tail - $head, 0); // found chunk size $got = 0; fseek($fp, $head); while ($got < $chunk_size && !feof($fp)) { $tmp = @fread($fp, max(min($this->chunk_size, $chunk_size - $got), 0)); if ($tmp === false) { //error state break; } $got += strlen($tmp); $chunk .= $tmp; } $lines = explode("\n", $chunk); array_pop($lines); // remove trailing newline return $lines; } /** * Set pointer to first new line after $finger and return its position * * @param resource $fp filepointer * @param int $finger a pointer * @return int pointer */ protected function getNewlinepointer($fp, $finger) { fseek($fp, $finger); $nl = $finger; if ($finger > 0) { fgets($fp); // slip the finger forward to a new line $nl = ftell($fp); } return $nl; } /** * Check whether given revision is the current page * * @param int $rev timestamp of current page * @return bool true if $rev is current revision, otherwise false */ public function isCurrentRevision($rev) { return $rev == $this->currentRevision(); } /** * Return an existing revision for a specific date which is * the current one or younger or equal then the date * * @param number $date_at timestamp * @return string revision ('' for current) */ public function getLastRevisionAt($date_at) { //requested date_at(timestamp) younger or equal then modified_time($this->id) => load current if (file_exists($this->getFilename()) && $date_at >= @filemtime($this->getFilename())) { return ''; } else { if ($rev = $this->getRelativeRevision($date_at + 1, -1)) { //+1 to get also the requested date revision return $rev; } else { return false; } } } /** * Returns the next lines of the changelog of the chunck before head or after tail * * @param resource $fp filepointer * @param int $head position head of last chunk * @param int $tail position tail of last chunk * @param int $direction positive forward, negative backward * @return array with entries: * - $lines: changelog lines of readed chunk * - $head: head of chunk * - $tail: tail of chunk */ protected function readAdjacentChunk($fp, $head, $tail, $direction) { if (!$fp) return array(array(), $head, $tail); if ($direction > 0) { //read forward $head = $tail; $tail = $head + intval($this->chunk_size * (2 / 3)); $tail = $this->getNewlinepointer($fp, $tail); } else { //read backward $tail = $head; $head = max($tail - $this->chunk_size, 0); while (true) { $nl = $this->getNewlinepointer($fp, $head); // was the chunk big enough? if not, take another bite if ($nl > 0 && $tail <= $nl) { $head = max($head - $this->chunk_size, 0); } else { $head = $nl; break; } } } //load next chunck $lines = $this->readChunk($fp, $head, $tail); return array($lines, $head, $tail); } /** * Collect the $max revisions near to the timestamp $rev * * Ideally, half of retrieved timestamps are older than $rev, another half are newer. * The returned array $requestedrevs may not contain the reference timestamp $rev * when it does not match any revision value recorded in changelog. * * @param int $rev revision timestamp * @param int $max maximum number of revisions to be returned * @return bool|array * return array with entries: * - $requestedrevs: array of with $max revision timestamps * - $revs: all parsed revision timestamps * - $fp: filepointer only defined for chuck reading, needs closing. * - $lines: non-parsed changelog lines before the parsed revisions * - $head: position of first readed changelogline * - $lasttail: position of end of last readed changelogline * otherwise false */ protected function retrieveRevisionsAround($rev, $max) { $revs = array(); $aftercount = $beforecount = 0; //get lines from changelog list($fp, $lines, $starthead, $starttail, $eof) = $this->readloglines($rev); if (empty($lines)) return false; //parse changelog lines in chunk, and read forward more chunks until $max/2 is reached $head = $starthead; $tail = $starttail; while (count($lines) > 0) { foreach ($lines as $line) { $info = parseChangelogLine($line); if ($this->saveRevisionInfo($info)) { $revs[] = $info['date']; if ($info['date'] >= $rev) { //count revs after reference $rev $aftercount++; if ($aftercount == 1) $beforecount = count($revs); } //enough revs after reference $rev? if ($aftercount > intval($max / 2)) break 2; } } //retrieve next chunk list($lines, $head, $tail) = $this->readAdjacentChunk($fp, $head, $tail, 1); } $lasttail = $tail; // add a possible revision of external edit, create or deletion if ($lasttail == $eof && $aftercount <= intval($max / 2) && $this->isExternalEdition()) { $revs[] = $this->currentRevision; $aftercount++; } if ($aftercount == 0) { //given timestamp $rev is newer than the most recent line in chunk return false; //FIXME: or proceed to collect older revisions? } //read more chunks backward until $max/2 is reached and total number of revs is equal to $max $lines = array(); $i = 0; if ($aftercount > 0) { $head = $starthead; $tail = $starttail; while ($head > 0) { list($lines, $head, $tail) = $this->readAdjacentChunk($fp, $head, $tail, -1); for ($i = count($lines) - 1; $i >= 0; $i--) { $info = parseChangelogLine($lines[$i]); if ($this->saveRevisionInfo($info)) { $revs[] = $info['date']; $beforecount++; //enough revs before reference $rev? if ($beforecount > max(intval($max / 2), $max - $aftercount)) break 2; } } } } //keep only non-parsed lines $lines = array_slice($lines, 0, $i); sort($revs); //trunk desired selection $requestedrevs = array_slice($revs, -$max, $max); return array($requestedrevs, $revs, $fp, $lines, $head, $lasttail); } /** * Get the current revision information, considering external edit, create or deletion * * The "current" revison is the last timestamp of the page in the context of changelog. * However it is often recognised that is in sight now from the DokuWiki user perspective. * The current page is accessible without any revision identifier (eg. doku.php?id=foo), * but it has unique modification time of the source txt file and kept in changelog. * When the page is deleted by saving blank text in the DokuWiki editor, the deletion * time is to be kept as its revision identifier in the changelog. * * External edit will break consistency between the file and changelog. A page source * file might be modified, created or deleted without using DokuWiki editor, instead * by accessing direct to the file stored in data directory via server console. * Such editions are never recorded in changelog. However after external file edit, * now we can see new "current" content of the edited page! * * A tentative revision should be assigned for the external edition to handle whole * revisions successfully in DokuWiki revision list and diff view interface. * As far as the source file of the edition exists, a unique revision can be decided * using function filemtime(), but it could be unknown if the foo.txt file had deleted * or moved to foo.bak file. * In such case, we assume unknown revision as "last timestamp in chagelog" +1 * to ensure that current one should be newer than any revisions in changelog. * Another case of external edit: when foo.bak file moved back to foo.txt, the current * one could become older than latest timestamp in changelog. In this case, we should * assume the revison as "last timestamp in chagelog" +1, instead of its timestamp. * * @return bool|array false when page had never existed or array with entries: * - date: revision identifier (timestamp or last revision +1) * - ip: IPv4 address (127.0.0.1) * - type: log line type * - id: id of page or media * - user: user name * - sum: edit summary (or action reason) * - extra: extra data (varies by line type) * - sizechange: change of filesize * - timestamp: timestamp or 'unknown' (key set only for external edition) * * @author Satoshi Sahara */ public function getCurrentRevisionInfo() { global $lang; if (isset($this->currentRevision)) return $this->getRevisionInfo($this->currentRevision); // get revision id from the item file timestamp and chagelog $fileRev = @filemtime($this->getFilename()); // false when the file not exist $lastRev = @$this->getRevisions(-1, 1)[0]; // null when failed if (!$fileRev && $lastRev === null) { // has never existed return false; } elseif ($fileRev === $lastRev) { // not external edit $this->currentRevision = $lastRev; $this->cache[$this->id][$this->currentRevision] += [ 'current' => true, ]; return $this->getRevisionInfo($this->currentRevision); } if (!$fileRev && $lastRev) { // item file does not exist // check consistency against changelog $revInfo = $this->getRevisionInfo($lastRev); if ($revInfo['type'] == DOKU_CHANGE_TYPE_DELETE) { $this->currentRevision = $lastRev; $this->cache[$this->id][$this->currentRevision] += [ 'current' => true, ]; return $this->getRevisionInfo($this->currentRevision); } // externally deleted $revInfo = [ 'date' => $lastRev +1, 'ip' => '127.0.0.1', 'type' => DOKU_CHANGE_TYPE_DELETE, 'id' => $this->id, 'user' => '', 'sum' => $lang['deleted'] .' - '. $lang['external_edit'], 'extra' => '', 'sizechange' => -io_getSizeFile($this->getFilename($lastRev)), 'current' => true, 'timestamp' => 'unknown', ]; } elseif ($fileRev) { // item file exist // here, file timestamp is different with last revision in changelog $isJustCreated = is_null($lastRev) || ( $fileRev > $lastRev && $this->getRevisionInfo($lastRev)['type'] == DOKU_CHANGE_TYPE_DELETE ); $filesize_new = filesize($this->getFilename()); $filesize_old = $isJustCreated ? 0 : io_getSizeFile($this->getFilename($lastRev)); $sizechange = $filesize_new - $filesize_old; if ($isJustCreated) { // lastRev is null $rev = $timestamp = $fileRev; $sum = $lang['created'] .' - '. $lang['external_edit']; } elseif ($fileRev > $lastRev) { $rev = $timestamp = $fileRev; $sum = $lang['external_edit']; } else { // $fileRev is older than $lastRev, externally reverted an old file $rev = max($fileRev, $lastRev +1); $timestamp = 'unknown'; $sum = $lang['external_edit']; } // externally created or edited $revInfo = [ 'date' => $rev, 'ip' => '127.0.0.1', 'type' => $isJustCreated ? DOKU_CHANGE_TYPE_CREATE : DOKU_CHANGE_TYPE_EDIT, 'id' => $this->id, 'user' => '', 'sum' => $sum, 'extra' => '', 'sizechange' => $sizechange, 'current' => true, 'timestamp' => $timestamp, ]; } // cache current revision information of external edition $this->currentRevision = $revInfo['date']; $this->cache[$this->id][$this->currentRevision] = $revInfo; return $this->getRevisionInfo($this->currentRevision); } /** * Checks if the revision is external edition * @return boolean */ public function isExternalEdition($rev =null) { if ($rev === 'current' || $rev === null) { $revInfo = $this->getCurrentRevisionInfo(); } elseif (is_int($rev)) { $revInfo = $this->getRevisionInfo($rev); } elseif (is_array($rev)) { $revInfo = $rev; } return array_key_exists('timestamp', $revInfo); } /** * Return the current revision identifer * @return int|false */ public function currentRevision() { if (!isset($this->currentRevision)) { // set ChangeLog::currentRevision property $this->getCurrentRevisionInfo(); } return $this->currentRevision; } }