<?php

namespace dokuwiki\Search;

use dokuwiki\Extension\Event;
use dokuwiki\Search\MetadataIndex;
use dokuwiki\Search\QueryParser;

/**
 * Class DokuWiki Metadata Search
 *
 * Static helpers that answer questions from the metadata index: which pages
 * link to a page, which pages use a media file, and which pages match a
 * page name / title query.
 *
 * @license GPL 2 (http://www.gnu.org/licenses/gpl.html)
 * @author Andreas Gohr <andi@splitbrain.org>
 */
class MetadataSearch
{
    /**
     * Metadata Search constructor. prevent direct object creation
     */
    protected function __construct() {}

    /**
     * Returns the backlinks for a given page
     *
     * Uses the metadata index.
     *
     * @param string $id           The id for which links shall be returned
     * @param bool   $ignore_perms Ignore the fact that pages are hidden or read-protected
     * @return array The pages that contain links to the given page
     */
    public static function backlinks($id, $ignore_perms = false)
    {
        $MetadataIndex = MetadataIndex::getInstance();
        $result = $MetadataIndex->lookupKey('relation_references', $id);

        return self::filterAccessiblePages($result, $ignore_perms);
    }

    /**
     * Returns the pages that use a given media file
     *
     * Uses the relation media metadata property and the metadata index.
     *
     * Note that before 2013-07-31 the second parameter was the maximum number
     * of results and permissions were ignored. That's why the parameter is now
     * checked to be explicitly set to true (with type bool) in order to be
     * compatible with older uses of the function.
     *
     * @param string $id           The media id to look for
     * @param bool   $ignore_perms Ignore hidden pages and acls (optional, default: false)
     * @return array A list of pages that use the given media file
     */
    public static function mediause($id, $ignore_perms = false)
    {
        $MetadataIndex = MetadataIndex::getInstance();
        $result = $MetadataIndex->lookupKey('relation_media', $id);

        return self::filterAccessiblePages($result, $ignore_perms);
    }

    /**
     * Drops pages the current user may not see and pages that do not exist,
     * then returns the remaining page ids sorted and re-indexed.
     *
     * Permission checks are skipped only when $ignore_perms is exactly
     * boolean true; the existence check is always applied.
     *
     * @param array $pages        page ids as returned by the index lookup
     * @param bool  $ignore_perms skip hidden-page and ACL checks when strictly true
     * @return array
     */
    private static function filterAccessiblePages($pages, $ignore_perms)
    {
        if (!count($pages)) return $pages;

        foreach (array_keys($pages) as $idx) {
            $page = $pages[$idx];

            // check ACL permissions
            $denied = $ignore_perms !== true
                && (isHiddenPage($page) || auth_quickaclcheck($page) < AUTH_READ);

            if ($denied || !page_exists($page, '', false)) {
                unset($pages[$idx]);
            }
        }

        sort($pages);
        return $pages;
    }

    /**
     * Quicksearch for pagenames
     *
     * By default it only matches the pagename and ignores the namespace.
     * This can be changed with the second parameter.
     * The third parameter allows to search in titles as well.
     *
     * The function always returns titles as well
     *
     * @triggers SEARCH_QUERY_PAGELOOKUP
     * @author   Andreas Gohr <andi@splitbrain.org>
     * @author   Adrian Lang <lang@cosmocode.de>
     *
     * @param string     $id       page id
     * @param bool       $in_ns    match against namespace as well?
     * @param bool       $in_title search in title?
     * @param int|string $after    only show results with mtime after this date,
     *                             accepts timestamp or strtotime arguments
     * @param int|string $before   only show results with mtime before this date,
     *                             accepts timestamp or strtotime arguments
     *
     * @return string[]
     */
    public static function pageLookup($id, $in_ns = false, $in_title = false, $after = null, $before = null)
    {
        $data = [
            'id' => $id,
            'in_ns' => $in_ns,
            'in_title' => $in_title,
            'after' => $after,
            'before' => $before
        ];
        $data['has_titles'] = true; // for plugin backward compatibility check
        $action = static::class.'::pageLookupCallBack';
        return Event::createAndTrigger('SEARCH_QUERY_PAGELOOKUP', $data, $action);
    }

    /**
     * Returns list of pages as array(pageid => First Heading)
     *
     * Default action of the SEARCH_QUERY_PAGELOOKUP event.
     *
     * @param array $data event data
     * @return string[]
     */
    public static function pageLookupCallBack(&$data)
    {
        // split out original parameters
        $id = $data['id'];
        $parsedQuery = QueryParser::convert($id);

        // a namespace given in the query restricts the results to that namespace
        $ns = null;
        if (count($parsedQuery['ns']) > 0) {
            $ns = cleanID($parsedQuery['ns'][0]) . ':';
            $id = implode(' ', $parsedQuery['highlight']);
        }

        $in_ns    = $data['in_ns'];
        $in_title = $data['in_title'];
        $cleaned  = cleanID($id);

        $pages = [];
        if ($id !== '' && $cleaned !== '') {
            $MetadataIndex = MetadataIndex::getInstance();
            $page_idx = $MetadataIndex->getPages();
            foreach ($page_idx as $p_id) {
                if ((strpos($in_ns ? $p_id : noNSorNS($p_id), $cleaned) !== false)) {
                    if (!isset($pages[$p_id])) {
                        $pages[$p_id] = p_get_first_heading($p_id, METADATA_DONT_RENDER);
                    }
                }
            }
            if ($in_title) {
                // The comparison helper is protected, so a 'Class::method'
                // string would only be callable from within this class
                // hierarchy. A closure created here stays callable from
                // any scope.
                // NOTE(review): assumes lookupKey() accepts any callable - confirm.
                $func = function ($search, $title) {
                    return static::pageLookupTitleCompare($search, $title);
                };
                foreach ($MetadataIndex->lookupKey('title', $id, $func) as $p_id) {
                    if (!isset($pages[$p_id])) {
                        $pages[$p_id] = p_get_first_heading($p_id, METADATA_DONT_RENDER);
                    }
                }
            }
        }

        if ($ns !== null) {
            foreach (array_keys($pages) as $p_id) {
                if (strpos($p_id, $ns) !== 0) {
                    unset($pages[$p_id]);
                }
            }
        }

        // discard hidden pages
        // discard nonexistent pages
        // check ACL permissions
        foreach (array_keys($pages) as $idx) {
            if (!isVisiblePage($idx) || !page_exists($idx) || auth_quickaclcheck($idx) < AUTH_READ) {
                unset($pages[$idx]);
            }
        }

        $pages = static::filterResultsByTime($pages, $data['after'], $data['before']);

        uksort($pages, static::class.'::pagesorter');
        return $pages;
    }

    /**
     * Tiny helper function for comparing the searched title with the title
     * from the search index. This function is a wrapper around stripos with
     * adapted argument order and return value.
     *
     * @param string $search searched title
     * @param string $title  title from index
     * @return bool
     */
    protected static function pageLookupTitleCompare($search, $title)
    {
        return stripos($title, $search) !== false;
    }

    /**
     * Sort pages based on their namespace level first, then on their string
     * values. This makes higher hierarchy pages rank higher than lower hierarchy
     * pages.
     *
     * @param string $a
     * @param string $b
     * @return int Returns < 0 if $a is less than $b; > 0 if $a is greater than $b,
     *             and 0 if they are equal.
     */
    protected static function pagesorter($a, $b)
    {
        // the number of ':' separators orders ids exactly like the number of id parts
        $ac = substr_count($a, ':');
        $bc = substr_count($b, ':');
        if ($ac < $bc) {
            return -1;
        } elseif ($ac > $bc) {
            return 1;
        }
        return strcmp($a, $b);
    }

    /**
     * Removes all results whose page file was modified outside the given
     * time window. An empty bound (null, false, '', 0) is not applied.
     *
     * @param array      $results search results in the form pageid => value
     * @param int|string $after   only returns results with mtime after this date,
     *                            accepts timestamp or strtotime arguments
     * @param int|string $before  only returns results with mtime before this date,
     *                            accepts timestamp or strtotime arguments
     *
     * @return array
     */
    protected static function filterResultsByTime(array $results, $after, $before)
    {
        if ($after || $before) {
            $after  = self::toTimestamp($after);
            $before = self::toTimestamp($before);

            foreach ($results as $id => $value) {
                $mTime = filemtime(wikiFN($id));
                if ($after && $after > $mTime) {
                    unset($results[$id]);
                    continue;
                }
                if ($before && $before < $mTime) {
                    unset($results[$id]);
                }
            }
        }
        return $results;
    }

    /**
     * Normalises a time bound to a Unix timestamp.
     *
     * Integers are returned unchanged. Empty bounds yield false without
     * calling strtotime(), because passing null to strtotime() is deprecated
     * as of PHP 8.1. Everything else is parsed by strtotime().
     *
     * @param int|string|null $time
     * @return int|false timestamp, or false when unset or unparsable
     */
    private static function toTimestamp($time)
    {
        if (is_int($time)) return $time;
        if ($time === null || $time === false || $time === '') return false;
        return strtotime($time);
    }
}