xref: /dokuwiki/bin/indexer.php (revision 9b41be2446ea725a496f34b28ac4db84bece57c9)
124c3e0d2SAndreas Gohr#!/usr/bin/php
224c3e0d2SAndreas Gohr<?php
378ba70a7Schrisif ('cli' != php_sapi_name()) die();
424c3e0d2SAndreas Gohr
550b78159SElan Ruusamäeini_set('memory_limit','128M');
624c3e0d2SAndreas Gohrif(!defined('DOKU_INC')) define('DOKU_INC',realpath(dirname(__FILE__).'/../').'/');
724c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/init.php');
824c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/common.php');
924c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/pageutils.php');
1024c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/search.php');
1124c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/indexer.php');
123a50618cSgweissbachrequire_once(DOKU_INC.'inc/auth.php');
1324c3e0d2SAndreas Gohrrequire_once(DOKU_INC.'inc/cliopts.php');
1424c3e0d2SAndreas Gohrsession_write_close();
1524c3e0d2SAndreas Gohr
1624c3e0d2SAndreas Gohr// handle options
17981f048aSGabriel Birke$short_opts = 'hcuq';
18981f048aSGabriel Birke$long_opts  = array('help', 'clear', 'update', 'quiet');
1924c3e0d2SAndreas Gohr$OPTS = Doku_Cli_Opts::getOptions(__FILE__,$short_opts,$long_opts);
2024c3e0d2SAndreas Gohrif ( $OPTS->isError() ) {
2124c3e0d2SAndreas Gohr    fwrite( STDERR, $OPTS->getMessage() . "\n");
2224c3e0d2SAndreas Gohr    _usage();
2324c3e0d2SAndreas Gohr    exit(1);
2424c3e0d2SAndreas Gohr}
2524c3e0d2SAndreas Gohr$CLEAR = false;
26981f048aSGabriel Birke$QUIET = false;
27*9b41be24STom N Harris$INDEXER = null;
2824c3e0d2SAndreas Gohrforeach ($OPTS->options as $key => $val) {
2924c3e0d2SAndreas Gohr    switch ($key) {
3024c3e0d2SAndreas Gohr        case 'h':
3124c3e0d2SAndreas Gohr        case 'help':
3224c3e0d2SAndreas Gohr            _usage();
3324c3e0d2SAndreas Gohr            exit;
3424c3e0d2SAndreas Gohr        case 'c':
3524c3e0d2SAndreas Gohr        case 'clear':
3624c3e0d2SAndreas Gohr            $CLEAR = true;
3724c3e0d2SAndreas Gohr            break;
38981f048aSGabriel Birke        case 'q':
39981f048aSGabriel Birke        case 'quiet':
40981f048aSGabriel Birke            $QUIET = true;
41981f048aSGabriel Birke            break;
4224c3e0d2SAndreas Gohr    }
4324c3e0d2SAndreas Gohr}
4424c3e0d2SAndreas Gohr
4524c3e0d2SAndreas Gohr#------------------------------------------------------------------------------
4624c3e0d2SAndreas Gohr# Action
4724c3e0d2SAndreas Gohr
4824c3e0d2SAndreas Gohrif($CLEAR) _clearindex();
4924c3e0d2SAndreas Gohr_update();
5024c3e0d2SAndreas Gohr
5124c3e0d2SAndreas Gohr
5224c3e0d2SAndreas Gohr
5324c3e0d2SAndreas Gohr#------------------------------------------------------------------------------
5424c3e0d2SAndreas Gohr
5524c3e0d2SAndreas Gohrfunction _usage() {
5624c3e0d2SAndreas Gohr    print "Usage: indexer.php <options>
5724c3e0d2SAndreas Gohr
5824c3e0d2SAndreas Gohr    Updates the searchindex by indexing all new or changed pages
5924c3e0d2SAndreas Gohr    when the -c option is given the index is cleared first.
6024c3e0d2SAndreas Gohr
6124c3e0d2SAndreas Gohr    OPTIONS
6224c3e0d2SAndreas Gohr        -h, --help     show this help and exit
6324c3e0d2SAndreas Gohr        -c, --clear    clear the index before updating
64981f048aSGabriel Birke        -q, --quiet    don't produce any output
6524c3e0d2SAndreas Gohr";
6624c3e0d2SAndreas Gohr}
6724c3e0d2SAndreas Gohr
6824c3e0d2SAndreas Gohrfunction _update(){
6924c3e0d2SAndreas Gohr    global $conf;
70*9b41be24STom N Harris    global $INDEXER;
71*9b41be24STom N Harris
72*9b41be24STom N Harris    $INDEXER = idx_get_indexer();
73a0c5c349STom N Harris
7424c3e0d2SAndreas Gohr    $data = array();
75981f048aSGabriel Birke    _quietecho("Searching pages... ");
769df39f14SRoland Alder    search($data,$conf['datadir'],'search_allpages',array('skipacl' => true));
77981f048aSGabriel Birke    _quietecho(count($data)." pages found.\n");
7824c3e0d2SAndreas Gohr
7924c3e0d2SAndreas Gohr    foreach($data as $val){
8024c3e0d2SAndreas Gohr        _index($val['id']);
8124c3e0d2SAndreas Gohr    }
8224c3e0d2SAndreas Gohr}
8324c3e0d2SAndreas Gohr
8424c3e0d2SAndreas Gohrfunction _index($id){
85*9b41be24STom N Harris    global $INDEXER;
8624c3e0d2SAndreas Gohr    global $CLEAR;
87*9b41be24STom N Harris    global $QUIET;
8824c3e0d2SAndreas Gohr
8924c3e0d2SAndreas Gohr    // if not cleared only update changed and new files
9024c3e0d2SAndreas Gohr    if(!$CLEAR){
9166b95544STom N Harris        $idxtag = metaFN($id,'.indexed');
9266b95544STom N Harris        if(@file_exists($idxtag)){
937c2ef4e8STom N Harris            if(io_readFile($idxtag) == idx_get_version()){
94*9b41be24STom N Harris                $last = @filemtime($idxtag);
9524c3e0d2SAndreas Gohr                if($last > @filemtime(wikiFN($id))) return;
9624c3e0d2SAndreas Gohr            }
9766b95544STom N Harris        }
9866b95544STom N Harris    }
9924c3e0d2SAndreas Gohr
100981f048aSGabriel Birke    _quietecho("$id... ");
101*9b41be24STom N Harris    $body = '';
102*9b41be24STom N Harris    $data = array($id, $body);
103*9b41be24STom N Harris    $evt = new Doku_Event('INDEXER_PAGE_ADD', $data);
104*9b41be24STom N Harris    if ($evt->advise_before()) $data[1] = $data[1] . " " . rawWiki($id);
105*9b41be24STom N Harris    $evt->advise_after();
106*9b41be24STom N Harris    unset($evt);
107*9b41be24STom N Harris    list($id,$body) = $data;
108*9b41be24STom N Harris    $said = false;
109*9b41be24STom N Harris    while(true) {
110*9b41be24STom N Harris        $result = $INDEXER->addPageWords($id, $body);
111*9b41be24STom N Harris        if ($result == "locked") {
112*9b41be24STom N Harris            if($said){
113*9b41be24STom N Harris                _quietecho(".");
114*9b41be24STom N Harris            }else{
115*9b41be24STom N Harris                _quietecho("Waiting for lockfile (max. 5 min)");
116*9b41be24STom N Harris                $said = true;
117*9b41be24STom N Harris            }
118*9b41be24STom N Harris            sleep(15);
119*9b41be24STom N Harris        } else {
120*9b41be24STom N Harris            break;
121*9b41be24STom N Harris        }
122*9b41be24STom N Harris    }
123*9b41be24STom N Harris    if ($result)
1247c2ef4e8STom N Harris        io_saveFile(metaFN($id,'.indexed'), idx_get_version());
125981f048aSGabriel Birke    _quietecho("done.\n");
12624c3e0d2SAndreas Gohr}
12724c3e0d2SAndreas Gohr
12824c3e0d2SAndreas Gohr/**
12924c3e0d2SAndreas Gohr * lock the indexer system
13024c3e0d2SAndreas Gohr */
13124c3e0d2SAndreas Gohrfunction _lock(){
13224c3e0d2SAndreas Gohr    global $conf;
13324c3e0d2SAndreas Gohr    $lock = $conf['lockdir'].'/_indexer.lock';
13424c3e0d2SAndreas Gohr    $said = false;
13544881d27STroels Liebe Bentsen    while(!@mkdir($lock, $conf['dmode'])){
13624c3e0d2SAndreas Gohr        if(time()-@filemtime($lock) > 60*5){
13724c3e0d2SAndreas Gohr            // looks like a stale lock - remove it
13824c3e0d2SAndreas Gohr            @rmdir($lock);
13924c3e0d2SAndreas Gohr        }else{
14024c3e0d2SAndreas Gohr            if($said){
141981f048aSGabriel Birke                _quietecho(".");
14224c3e0d2SAndreas Gohr            }else{
143981f048aSGabriel Birke                _quietecho("Waiting for lockfile (max. 5 min)");
14424c3e0d2SAndreas Gohr                $said = true;
14524c3e0d2SAndreas Gohr            }
14624c3e0d2SAndreas Gohr            sleep(15);
14724c3e0d2SAndreas Gohr        }
14824c3e0d2SAndreas Gohr    }
1491ca31cfeSAndreas Gohr    if($conf['dperm']) chmod($lock, $conf['dperm']);
150981f048aSGabriel Birke    if($said) _quietecho("\n");
15124c3e0d2SAndreas Gohr}
15224c3e0d2SAndreas Gohr
15324c3e0d2SAndreas Gohr/**
15424c3e0d2SAndreas Gohr * unlock the indexer sytem
15524c3e0d2SAndreas Gohr */
15624c3e0d2SAndreas Gohrfunction _unlock(){
15724c3e0d2SAndreas Gohr    global $conf;
15824c3e0d2SAndreas Gohr    $lock = $conf['lockdir'].'/_indexer.lock';
15924c3e0d2SAndreas Gohr    @rmdir($lock);
16024c3e0d2SAndreas Gohr}
16124c3e0d2SAndreas Gohr
16224c3e0d2SAndreas Gohr/**
16324c3e0d2SAndreas Gohr * Clear all index files
16424c3e0d2SAndreas Gohr */
16524c3e0d2SAndreas Gohrfunction _clearindex(){
16624c3e0d2SAndreas Gohr    global $conf;
16724c3e0d2SAndreas Gohr    _lock();
168981f048aSGabriel Birke    _quietecho("Clearing index... ");
16966b95544STom N Harris    io_saveFile($conf['indexdir'].'/page.idx','');
170*9b41be24STom N Harris    //io_saveFile($conf['indexdir'].'/title.idx','');
17166b95544STom N Harris    $dir = @opendir($conf['indexdir']);
17266b95544STom N Harris    if($dir!==false){
17366b95544STom N Harris        while(($f = readdir($dir)) !== false){
17466b95544STom N Harris            if(substr($f,-4)=='.idx' &&
17566b95544STom N Harris               (substr($f,0,1)=='i' || substr($f,0,1)=='w'))
17666b95544STom N Harris                @unlink($conf['indexdir']."/$f");
17766b95544STom N Harris        }
17866b95544STom N Harris    }
179*9b41be24STom N Harris    @unlink($conf['indexdir'].'/lengths.idx');
180981f048aSGabriel Birke    _quietecho("done.\n");
18124c3e0d2SAndreas Gohr    _unlock();
18224c3e0d2SAndreas Gohr}
18324c3e0d2SAndreas Gohr
184981f048aSGabriel Birkefunction _quietecho($msg) {
185981f048aSGabriel Birke    global $QUIET;
186981f048aSGabriel Birke    if(!$QUIET) echo $msg;
187981f048aSGabriel Birke}
188981f048aSGabriel Birke
18924c3e0d2SAndreas Gohr//Setup VIM: ex: et ts=2 enc=utf-8 :
190