124c3e0d2SAndreas Gohr#!/usr/bin/php 224c3e0d2SAndreas Gohr<?php 378ba70a7Schrisif ('cli' != php_sapi_name()) die(); 424c3e0d2SAndreas Gohr 550b78159SElan Ruusamäeini_set('memory_limit','128M'); 624c3e0d2SAndreas Gohrif(!defined('DOKU_INC')) define('DOKU_INC',realpath(dirname(__FILE__).'/../').'/'); 724c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/init.php'); 824c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/common.php'); 924c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/pageutils.php'); 1024c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/search.php'); 1124c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/indexer.php'); 123a50618cSgweissbachrequire_once(DOKU_INC.'inc/auth.php'); 1324c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/cliopts.php'); 1424c3e0d2SAndreas Gohrsession_write_close(); 1524c3e0d2SAndreas Gohr 1624c3e0d2SAndreas Gohr// handle options 17981f048aSGabriel Birke$short_opts = 'hcuq'; 18981f048aSGabriel Birke$long_opts = array('help', 'clear', 'update', 'quiet'); 1924c3e0d2SAndreas Gohr$OPTS = Doku_Cli_Opts::getOptions(__FILE__,$short_opts,$long_opts); 2024c3e0d2SAndreas Gohrif ( $OPTS->isError() ) { 2124c3e0d2SAndreas Gohr fwrite( STDERR, $OPTS->getMessage() . "\n"); 2224c3e0d2SAndreas Gohr _usage(); 2324c3e0d2SAndreas Gohr exit(1); 2424c3e0d2SAndreas Gohr} 2524c3e0d2SAndreas Gohr$CLEAR = false; 26981f048aSGabriel Birke$QUIET = false; 27*9b41be24STom N Harris$INDEXER = null; 2824c3e0d2SAndreas Gohrforeach ($OPTS->options as $key => $val) { 2924c3e0d2SAndreas Gohr switch ($key) { 3024c3e0d2SAndreas Gohr case 'h': 3124c3e0d2SAndreas Gohr case 'help': 3224c3e0d2SAndreas Gohr _usage(); 3324c3e0d2SAndreas Gohr exit; 3424c3e0d2SAndreas Gohr case 'c': 3524c3e0d2SAndreas Gohr case 'clear': 3624c3e0d2SAndreas Gohr $CLEAR = true; 3724c3e0d2SAndreas Gohr break; 38981f048aSGabriel Birke case 'q': 39981f048aSGabriel Birke case 'quiet': 40981f048aSGabriel Birke $QUIET = true; 41981f048aSGabriel Birke break; 4224c3e0d2SAndreas Gohr } 4324c3e0d2SAndreas Gohr} 4424c3e0d2SAndreas Gohr 4524c3e0d2SAndreas Gohr#------------------------------------------------------------------------------ 4624c3e0d2SAndreas Gohr# Action 4724c3e0d2SAndreas Gohr 4824c3e0d2SAndreas Gohrif($CLEAR) _clearindex(); 4924c3e0d2SAndreas Gohr_update(); 5024c3e0d2SAndreas Gohr 5124c3e0d2SAndreas Gohr 5224c3e0d2SAndreas Gohr 5324c3e0d2SAndreas Gohr#------------------------------------------------------------------------------ 5424c3e0d2SAndreas Gohr 5524c3e0d2SAndreas Gohrfunction _usage() { 5624c3e0d2SAndreas Gohr print "Usage: indexer.php <options> 5724c3e0d2SAndreas Gohr 5824c3e0d2SAndreas Gohr Updates the searchindex by indexing all new or changed pages 5924c3e0d2SAndreas Gohr when the -c option is given the index is cleared first. 6024c3e0d2SAndreas Gohr 6124c3e0d2SAndreas Gohr OPTIONS 6224c3e0d2SAndreas Gohr -h, --help show this help and exit 6324c3e0d2SAndreas Gohr -c, --clear clear the index before updating 64981f048aSGabriel Birke -q, --quiet don't produce any output 6524c3e0d2SAndreas Gohr"; 6624c3e0d2SAndreas Gohr} 6724c3e0d2SAndreas Gohr 6824c3e0d2SAndreas Gohrfunction _update(){ 6924c3e0d2SAndreas Gohr global $conf; 70*9b41be24STom N Harris global $INDEXER; 71*9b41be24STom N Harris 72*9b41be24STom N Harris $INDEXER = idx_get_indexer(); 73a0c5c349STom N Harris 7424c3e0d2SAndreas Gohr $data = array(); 75981f048aSGabriel Birke _quietecho("Searching pages... "); 769df39f14SRoland Alder search($data,$conf['datadir'],'search_allpages',array('skipacl' => true)); 77981f048aSGabriel Birke _quietecho(count($data)." pages found.\n"); 7824c3e0d2SAndreas Gohr 7924c3e0d2SAndreas Gohr foreach($data as $val){ 8024c3e0d2SAndreas Gohr _index($val['id']); 8124c3e0d2SAndreas Gohr } 8224c3e0d2SAndreas Gohr} 8324c3e0d2SAndreas Gohr 8424c3e0d2SAndreas Gohrfunction _index($id){ 85*9b41be24STom N Harris global $INDEXER; 8624c3e0d2SAndreas Gohr global $CLEAR; 87*9b41be24STom N Harris global $QUIET; 8824c3e0d2SAndreas Gohr 8924c3e0d2SAndreas Gohr // if not cleared only update changed and new files 9024c3e0d2SAndreas Gohr if(!$CLEAR){ 9166b95544STom N Harris $idxtag = metaFN($id,'.indexed'); 9266b95544STom N Harris if(@file_exists($idxtag)){ 937c2ef4e8STom N Harris if(io_readFile($idxtag) == idx_get_version()){ 94*9b41be24STom N Harris $last = @filemtime($idxtag); 9524c3e0d2SAndreas Gohr if($last > @filemtime(wikiFN($id))) return; 9624c3e0d2SAndreas Gohr } 9766b95544STom N Harris } 9866b95544STom N Harris } 9924c3e0d2SAndreas Gohr 100981f048aSGabriel Birke _quietecho("$id... "); 101*9b41be24STom N Harris $body = ''; 102*9b41be24STom N Harris $data = array($id, $body); 103*9b41be24STom N Harris $evt = new Doku_Event('INDEXER_PAGE_ADD', $data); 104*9b41be24STom N Harris if ($evt->advise_before()) $data[1] = $data[1] . " " . rawWiki($id); 105*9b41be24STom N Harris $evt->advise_after(); 106*9b41be24STom N Harris unset($evt); 107*9b41be24STom N Harris list($id,$body) = $data; 108*9b41be24STom N Harris $said = false; 109*9b41be24STom N Harris while(true) { 110*9b41be24STom N Harris $result = $INDEXER->addPageWords($id, $body); 111*9b41be24STom N Harris if ($result == "locked") { 112*9b41be24STom N Harris if($said){ 113*9b41be24STom N Harris _quietecho("."); 114*9b41be24STom N Harris }else{ 115*9b41be24STom N Harris _quietecho("Waiting for lockfile (max. 5 min)"); 116*9b41be24STom N Harris $said = true; 117*9b41be24STom N Harris } 118*9b41be24STom N Harris sleep(15); 119*9b41be24STom N Harris } else { 120*9b41be24STom N Harris break; 121*9b41be24STom N Harris } 122*9b41be24STom N Harris } 123*9b41be24STom N Harris if ($result) 1247c2ef4e8STom N Harris io_saveFile(metaFN($id,'.indexed'), idx_get_version()); 125981f048aSGabriel Birke _quietecho("done.\n"); 12624c3e0d2SAndreas Gohr} 12724c3e0d2SAndreas Gohr 12824c3e0d2SAndreas Gohr/** 12924c3e0d2SAndreas Gohr * lock the indexer system 13024c3e0d2SAndreas Gohr */ 13124c3e0d2SAndreas Gohrfunction _lock(){ 13224c3e0d2SAndreas Gohr global $conf; 13324c3e0d2SAndreas Gohr $lock = $conf['lockdir'].'/_indexer.lock'; 13424c3e0d2SAndreas Gohr $said = false; 13544881d27STroels Liebe Bentsen while(!@mkdir($lock, $conf['dmode'])){ 13624c3e0d2SAndreas Gohr if(time()-@filemtime($lock) > 60*5){ 13724c3e0d2SAndreas Gohr // looks like a stale lock - remove it 13824c3e0d2SAndreas Gohr @rmdir($lock); 13924c3e0d2SAndreas Gohr }else{ 14024c3e0d2SAndreas Gohr if($said){ 141981f048aSGabriel Birke _quietecho("."); 14224c3e0d2SAndreas Gohr }else{ 143981f048aSGabriel Birke _quietecho("Waiting for lockfile (max. 5 min)"); 14424c3e0d2SAndreas Gohr $said = true; 14524c3e0d2SAndreas Gohr } 14624c3e0d2SAndreas Gohr sleep(15); 14724c3e0d2SAndreas Gohr } 14824c3e0d2SAndreas Gohr } 1491ca31cfeSAndreas Gohr if($conf['dperm']) chmod($lock, $conf['dperm']); 150981f048aSGabriel Birke if($said) _quietecho("\n"); 15124c3e0d2SAndreas Gohr} 15224c3e0d2SAndreas Gohr 15324c3e0d2SAndreas Gohr/** 15424c3e0d2SAndreas Gohr * unlock the indexer sytem 15524c3e0d2SAndreas Gohr */ 15624c3e0d2SAndreas Gohrfunction _unlock(){ 15724c3e0d2SAndreas Gohr global $conf; 15824c3e0d2SAndreas Gohr $lock = $conf['lockdir'].'/_indexer.lock'; 15924c3e0d2SAndreas Gohr @rmdir($lock); 16024c3e0d2SAndreas Gohr} 16124c3e0d2SAndreas Gohr 16224c3e0d2SAndreas Gohr/** 16324c3e0d2SAndreas Gohr * Clear all index files 16424c3e0d2SAndreas Gohr */ 16524c3e0d2SAndreas Gohrfunction _clearindex(){ 16624c3e0d2SAndreas Gohr global $conf; 16724c3e0d2SAndreas Gohr _lock(); 168981f048aSGabriel Birke _quietecho("Clearing index... "); 16966b95544STom N Harris io_saveFile($conf['indexdir'].'/page.idx',''); 170*9b41be24STom N Harris //io_saveFile($conf['indexdir'].'/title.idx',''); 17166b95544STom N Harris $dir = @opendir($conf['indexdir']); 17266b95544STom N Harris if($dir!==false){ 17366b95544STom N Harris while(($f = readdir($dir)) !== false){ 17466b95544STom N Harris if(substr($f,-4)=='.idx' && 17566b95544STom N Harris (substr($f,0,1)=='i' || substr($f,0,1)=='w')) 17666b95544STom N Harris @unlink($conf['indexdir']."/$f"); 17766b95544STom N Harris } 17866b95544STom N Harris } 179*9b41be24STom N Harris @unlink($conf['indexdir'].'/lengths.idx'); 180981f048aSGabriel Birke _quietecho("done.\n"); 18124c3e0d2SAndreas Gohr _unlock(); 18224c3e0d2SAndreas Gohr} 18324c3e0d2SAndreas Gohr 184981f048aSGabriel Birkefunction _quietecho($msg) { 185981f048aSGabriel Birke global $QUIET; 186981f048aSGabriel Birke if(!$QUIET) echo $msg; 187981f048aSGabriel Birke} 188981f048aSGabriel Birke 18924c3e0d2SAndreas Gohr//Setup VIM: ex: et ts=2 enc=utf-8 : 190