xref: /dokuwiki/inc/parser/parser.php (revision 702eb8985f33ca5781d2da5cedd9d6a4b9c6a030)
10cecf9d5Sandi<?php
20cecf9d5Sandi
30cecf9d5Sandiif(!defined('DOKU_INC')) define('DOKU_INC',realpath(dirname(__FILE__).'/../../').'/');
40cecf9d5Sandi
50cecf9d5Sandirequire_once DOKU_INC . 'inc/parser/lexer.php';
60cecf9d5Sandirequire_once DOKU_INC . 'inc/parser/handler.php';
70cecf9d5Sandi
80cecf9d5Sandi//-------------------------------------------------------------------
90cecf9d5Sandi
100cecf9d5Sandi/**
110cecf9d5Sandi* Sets up the Lexer with modes and points it to the Handler
120cecf9d5Sandi* For an intro to the Lexer see: wiki:parser
130cecf9d5Sandi*/
140cecf9d5Sandiclass Doku_Parser {
150cecf9d5Sandi
160cecf9d5Sandi    var $Handler;
170cecf9d5Sandi
180cecf9d5Sandi    var $Lexer;
190cecf9d5Sandi
200cecf9d5Sandi    var $modes = array();
210cecf9d5Sandi
220cecf9d5Sandi    var $connected = FALSE;
230cecf9d5Sandi
24b7c441b9SHarry Fuecks    function addBaseMode(& $BaseMode) {
25b7c441b9SHarry Fuecks        $this->modes['base'] = & $BaseMode;
260cecf9d5Sandi        if ( !$this->Lexer ) {
270cecf9d5Sandi            $this->Lexer = & new Doku_Lexer($this->Handler,'base', TRUE);
280cecf9d5Sandi        }
290cecf9d5Sandi        $this->modes['base']->Lexer = & $this->Lexer;
300cecf9d5Sandi    }
310cecf9d5Sandi
320cecf9d5Sandi    /**
330cecf9d5Sandi    * PHP preserves order of associative elements
340cecf9d5Sandi    * Mode sequence is important
350cecf9d5Sandi    */
360cecf9d5Sandi    function addMode($name, & $Mode) {
370cecf9d5Sandi        if ( !isset($this->modes['base']) ) {
38b7c441b9SHarry Fuecks            $this->addBaseMode(new Doku_Parser_Mode_Base());
390cecf9d5Sandi        }
400cecf9d5Sandi        $Mode->Lexer = & $this->Lexer;
410cecf9d5Sandi        $this->modes[$name] = & $Mode;
420cecf9d5Sandi    }
430cecf9d5Sandi
440cecf9d5Sandi    function connectModes() {
450cecf9d5Sandi
460cecf9d5Sandi        if ( $this->connected ) {
470cecf9d5Sandi            return;
480cecf9d5Sandi        }
490cecf9d5Sandi
500cecf9d5Sandi        foreach ( array_keys($this->modes) as $mode ) {
510cecf9d5Sandi
520cecf9d5Sandi            // Base isn't connected to anything
530cecf9d5Sandi            if ( $mode == 'base' ) {
540cecf9d5Sandi                continue;
550cecf9d5Sandi            }
560cecf9d5Sandi
570cecf9d5Sandi            $this->modes[$mode]->preConnect();
580cecf9d5Sandi
590cecf9d5Sandi            foreach ( array_keys($this->modes) as $cm ) {
600cecf9d5Sandi
610cecf9d5Sandi                if ( $this->modes[$cm]->accepts($mode) ) {
620cecf9d5Sandi                    $this->modes[$mode]->connectTo($cm);
630cecf9d5Sandi                }
640cecf9d5Sandi
650cecf9d5Sandi            }
660cecf9d5Sandi
670cecf9d5Sandi            $this->modes[$mode]->postConnect();
680cecf9d5Sandi        }
690cecf9d5Sandi
700cecf9d5Sandi        $this->connected = TRUE;
710cecf9d5Sandi    }
720cecf9d5Sandi
730cecf9d5Sandi    function parse($doc) {
740cecf9d5Sandi        if ( $this->Lexer ) {
750cecf9d5Sandi            $this->connectModes();
760cecf9d5Sandi            // Normalize CRs and pad doc
770cecf9d5Sandi            $doc = "\n".str_replace("\r\n","\n",$doc)."\n";
780cecf9d5Sandi            $this->Lexer->parse($doc);
79433bef32Sandi            $this->Handler->_finalize();
800cecf9d5Sandi            return $this->Handler->calls;
810cecf9d5Sandi        } else {
820cecf9d5Sandi            return FALSE;
830cecf9d5Sandi        }
840cecf9d5Sandi    }
850cecf9d5Sandi
860cecf9d5Sandi}
870cecf9d5Sandi
880cecf9d5Sandi//-------------------------------------------------------------------
890cecf9d5Sandi/**
900cecf9d5Sandi * This class and all the subclasses below are
910cecf9d5Sandi * used to reduce the effort required to register
920cecf9d5Sandi * modes with the Lexer. For performance these
930cecf9d5Sandi * could all be eliminated later perhaps, or
940cecf9d5Sandi * the Parser could be serialized to a file once
950cecf9d5Sandi * all modes are registered
96*702eb898Sandi *
97*702eb898Sandi * @author Harry Fuecks <harryf@gmail.com>
980cecf9d5Sandi*/
990cecf9d5Sandiclass Doku_Parser_Mode {
1000cecf9d5Sandi
1010cecf9d5Sandi    var $Lexer;
1020cecf9d5Sandi
1030cecf9d5Sandi    var $allowedModes = array();
1040cecf9d5Sandi
1050cecf9d5Sandi    // Called before any calls to connectTo
1060cecf9d5Sandi    function preConnect() {}
1070cecf9d5Sandi
1080cecf9d5Sandi    function connectTo($mode) {}
1090cecf9d5Sandi
1100cecf9d5Sandi    // Called after all calls to connectTo
1110cecf9d5Sandi    function postConnect() {}
1120cecf9d5Sandi
1130cecf9d5Sandi    function accepts($mode) {
1140cecf9d5Sandi        return in_array($mode, $this->allowedModes );
1150cecf9d5Sandi    }
1160cecf9d5Sandi
1170cecf9d5Sandi}
1180cecf9d5Sandi
1190cecf9d5Sandi//-------------------------------------------------------------------
1200cecf9d5Sandiclass Doku_Parser_Mode_Base extends Doku_Parser_Mode {
1210cecf9d5Sandi
1220cecf9d5Sandi    function Doku_Parser_Mode_Base() {
1230cecf9d5Sandi
1240cecf9d5Sandi        $this->allowedModes = array_merge (
1250cecf9d5Sandi                Doku_Parser_BlockContainers(),
1260cecf9d5Sandi                Doku_Parser_BaseOnly(),
1270cecf9d5Sandi                Doku_Parser_Paragraphs(),
1280cecf9d5Sandi                Doku_Parser_Formatting(),
1290cecf9d5Sandi                Doku_Parser_Substition(),
1300cecf9d5Sandi                Doku_Parser_Protected(),
1310cecf9d5Sandi                Doku_Parser_Disabled()
1320cecf9d5Sandi            );
1330cecf9d5Sandi    }
1340cecf9d5Sandi}
1350cecf9d5Sandi
1360cecf9d5Sandi//-------------------------------------------------------------------
1370cecf9d5Sandiclass Doku_Parser_Mode_Footnote extends Doku_Parser_Mode {
1380cecf9d5Sandi
1390cecf9d5Sandi    function Doku_Parser_Mode_Footnote() {
1400cecf9d5Sandi
1410cecf9d5Sandi        $this->allowedModes = array_merge (
1420cecf9d5Sandi                Doku_Parser_BlockContainers(),
1430cecf9d5Sandi                Doku_Parser_Formatting(),
1440cecf9d5Sandi                Doku_Parser_Substition(),
1450cecf9d5Sandi                Doku_Parser_Protected(),
1460cecf9d5Sandi                Doku_Parser_Disabled()
1470cecf9d5Sandi            );
1480cecf9d5Sandi
1490cecf9d5Sandi    }
1500cecf9d5Sandi
1510cecf9d5Sandi    function connectTo($mode) {
1520cecf9d5Sandi        $this->Lexer->addEntryPattern(
1530cecf9d5Sandi            '\x28\x28(?=.*\x29\x29)',$mode,'footnote'
1540cecf9d5Sandi            );
1550cecf9d5Sandi    }
1560cecf9d5Sandi
1570cecf9d5Sandi    function postConnect() {
1580cecf9d5Sandi        $this->Lexer->addExitPattern(
1590cecf9d5Sandi            '\x29\x29','footnote'
1600cecf9d5Sandi            );
1610cecf9d5Sandi
1620cecf9d5Sandi    }
1630cecf9d5Sandi
1640cecf9d5Sandi}
1650cecf9d5Sandi
1660cecf9d5Sandi//-------------------------------------------------------------------
1670cecf9d5Sandiclass Doku_Parser_Mode_Header extends Doku_Parser_Mode {
1680cecf9d5Sandi
1690cecf9d5Sandi    function preConnect() {
170506ae684Sandi        //we're not picky about the closing ones, two are enough
1710cecf9d5Sandi
1720cecf9d5Sandi        // Header 1 is special case - match 6 or more
1730cecf9d5Sandi        $this->Lexer->addSpecialPattern(
1746f0c5dbfSandi                            '[ \t]*={6,}[^\n]+={2,}[ \t]*(?=\n)',
1750cecf9d5Sandi                            'base',
1760cecf9d5Sandi                            'header'
1770cecf9d5Sandi                        );
1780cecf9d5Sandi
1790cecf9d5Sandi        // For the rest, match exactly
1800cecf9d5Sandi        for ( $i = 5; $i > 1; $i--) {
1810cecf9d5Sandi            $this->Lexer->addSpecialPattern(
1826f0c5dbfSandi                                '[ \t]*={'.$i.'}[^\n]+={2,}[ \t]*(?=\n)',
1830cecf9d5Sandi                                'base',
1840cecf9d5Sandi                                'header'
1850cecf9d5Sandi                            );
1860cecf9d5Sandi        }
1870cecf9d5Sandi    }
1880cecf9d5Sandi
1890cecf9d5Sandi}
1900cecf9d5Sandi
1910cecf9d5Sandi//-------------------------------------------------------------------
1920cecf9d5Sandiclass Doku_Parser_Mode_NoToc extends Doku_Parser_Mode {
1930cecf9d5Sandi
1940cecf9d5Sandi    function connectTo($mode) {
1950cecf9d5Sandi        $this->Lexer->addSpecialPattern('~~NOTOC~~',$mode,'notoc');
1960cecf9d5Sandi    }
1970cecf9d5Sandi
1980cecf9d5Sandi}
1990cecf9d5Sandi
2000cecf9d5Sandi//-------------------------------------------------------------------
2010cecf9d5Sandiclass Doku_Parser_Mode_Linebreak extends Doku_Parser_Mode {
2020cecf9d5Sandi
2030cecf9d5Sandi    function connectTo($mode) {
2040cecf9d5Sandi        $this->Lexer->addSpecialPattern('\x5C{2}\s',$mode,'linebreak');
2050cecf9d5Sandi    }
2060cecf9d5Sandi}
2070cecf9d5Sandi
2080cecf9d5Sandi//-------------------------------------------------------------------
2090cecf9d5Sandiclass Doku_Parser_Mode_Eol extends Doku_Parser_Mode {
2100cecf9d5Sandi
2110cecf9d5Sandi    function connectTo($mode) {
2120cecf9d5Sandi        $badModes = array('listblock','table');
2130cecf9d5Sandi        if ( in_array($mode, $badModes) ) {
2140cecf9d5Sandi            return;
2150cecf9d5Sandi        }
2160cecf9d5Sandi        $this->Lexer->addSpecialPattern('\n',$mode,'eol');
2170cecf9d5Sandi    }
2180cecf9d5Sandi}
2190cecf9d5Sandi
2200cecf9d5Sandi//-------------------------------------------------------------------
2210cecf9d5Sandiclass Doku_Parser_Mode_HR extends Doku_Parser_Mode {
2220cecf9d5Sandi
2230cecf9d5Sandi    function connectTo($mode) {
2246f0c5dbfSandi        $this->Lexer->addSpecialPattern('\n[ \t]*-{4,}[ \t]*(?=\n)',$mode,'hr');
2250cecf9d5Sandi    }
2260cecf9d5Sandi
2270cecf9d5Sandi}
2280cecf9d5Sandi
2290cecf9d5Sandi//-------------------------------------------------------------------
2300cecf9d5Sandiclass Doku_Parser_Mode_Formatting extends Doku_Parser_Mode {
2310cecf9d5Sandi
2320cecf9d5Sandi    var $type;
2330cecf9d5Sandi
2340cecf9d5Sandi    var $formatting = array (
2350cecf9d5Sandi        'strong' => array (
2360cecf9d5Sandi            'entry'=>'\*\*(?=.*\*\*)',
2370cecf9d5Sandi            'exit'=>'\*\*',
2380cecf9d5Sandi            ),
2390cecf9d5Sandi
2400cecf9d5Sandi        'emphasis'=> array (
2410cecf9d5Sandi            'entry'=>'//(?=.*//)',
2420cecf9d5Sandi            'exit'=>'//',
2430cecf9d5Sandi            ),
2440cecf9d5Sandi
2450cecf9d5Sandi        'underline'=> array (
2460cecf9d5Sandi            'entry'=>'__(?=.*__)',
2470cecf9d5Sandi            'exit'=>'__',
2480cecf9d5Sandi            ),
2490cecf9d5Sandi
2500cecf9d5Sandi        'monospace'=> array (
2510cecf9d5Sandi            'entry'=>'\x27\x27(?=.*\x27\x27)',
2520cecf9d5Sandi            'exit'=>'\x27\x27',
2530cecf9d5Sandi            ),
2540cecf9d5Sandi
2550cecf9d5Sandi        'subscript'=> array (
2560cecf9d5Sandi            'entry'=>'<sub>(?=.*\x3C/sub\x3E)',
2570cecf9d5Sandi            'exit'=>'</sub>',
2580cecf9d5Sandi            ),
2590cecf9d5Sandi
2600cecf9d5Sandi        'superscript'=> array (
2610cecf9d5Sandi            'entry'=>'<sup>(?=.*\x3C/sup\x3E)',
2620cecf9d5Sandi            'exit'=>'</sup>',
2630cecf9d5Sandi            ),
2640cecf9d5Sandi
2650cecf9d5Sandi        'deleted'=> array (
2660cecf9d5Sandi            'entry'=>'<del>(?=.*\x3C/del\x3E)',
2670cecf9d5Sandi            'exit'=>'</del>',
2680cecf9d5Sandi            ),
2690cecf9d5Sandi        );
2700cecf9d5Sandi
2710cecf9d5Sandi    function Doku_Parser_Mode_Formatting($type) {
2720cecf9d5Sandi
2730cecf9d5Sandi        if ( !array_key_exists($type, $this->formatting) ) {
2740cecf9d5Sandi            trigger_error('Invalid formatting type '.$type, E_USER_WARNING);
2750cecf9d5Sandi        }
2760cecf9d5Sandi
2770cecf9d5Sandi        $this->type = $type;
2780cecf9d5Sandi
2790cecf9d5Sandi        $this->allowedModes = array_merge (
2800cecf9d5Sandi                Doku_Parser_Formatting($type),
2810cecf9d5Sandi                Doku_Parser_Substition(),
2820cecf9d5Sandi                Doku_Parser_Disabled()
2830cecf9d5Sandi            );
2840cecf9d5Sandi
2850cecf9d5Sandi    }
2860cecf9d5Sandi
2870cecf9d5Sandi    function connectTo($mode) {
2880cecf9d5Sandi
2890cecf9d5Sandi        // Can't nest formatting in itself
2900cecf9d5Sandi        if ( $mode == $this->type ) {
2910cecf9d5Sandi            return;
2920cecf9d5Sandi        }
2930cecf9d5Sandi
2940cecf9d5Sandi        $this->Lexer->addEntryPattern(
2950cecf9d5Sandi                $this->formatting[$this->type]['entry'],
2960cecf9d5Sandi                $mode,
2970cecf9d5Sandi                $this->type
2980cecf9d5Sandi            );
2990cecf9d5Sandi    }
3000cecf9d5Sandi
3010cecf9d5Sandi    function postConnect() {
3020cecf9d5Sandi
3030cecf9d5Sandi        $this->Lexer->addExitPattern(
3040cecf9d5Sandi            $this->formatting[$this->type]['exit'],
3050cecf9d5Sandi            $this->type
3060cecf9d5Sandi            );
3070cecf9d5Sandi
3080cecf9d5Sandi    }
3090cecf9d5Sandi}
3100cecf9d5Sandi
3110cecf9d5Sandi//-------------------------------------------------------------------
3120cecf9d5Sandiclass Doku_Parser_Mode_ListBlock extends Doku_Parser_Mode {
3130cecf9d5Sandi
3140cecf9d5Sandi    function Doku_Parser_Mode_ListBlock() {
3150cecf9d5Sandi
3160cecf9d5Sandi        $this->allowedModes = array_merge (
3170cecf9d5Sandi                Doku_Parser_Formatting(),
3180cecf9d5Sandi                Doku_Parser_Substition(),
3190cecf9d5Sandi                Doku_Parser_Disabled()
3200cecf9d5Sandi            );
321*702eb898Sandi
3220cecf9d5Sandi        $this->allowedModes[] = 'footnote';
3230cecf9d5Sandi        $this->allowedModes[] = 'preformatted';
3240cecf9d5Sandi        $this->allowedModes[] = 'unformatted';
325*702eb898Sandi        $this->allowedModes[] = 'html';
326*702eb898Sandi        $this->allowedModes[] = 'php';
327*702eb898Sandi        $this->allowedModes[] = 'code';
328*702eb898Sandi        $this->allowedModes[] = 'file';
3290cecf9d5Sandi    }
3300cecf9d5Sandi
3310cecf9d5Sandi    function connectTo($mode) {
3320cecf9d5Sandi        $this->Lexer->addEntryPattern('\n {2,}[\-\*]',$mode,'listblock');
3330cecf9d5Sandi        $this->Lexer->addEntryPattern('\n\t{1,}[\-\*]',$mode,'listblock');
3340cecf9d5Sandi
3350cecf9d5Sandi        $this->Lexer->addPattern('\n {2,}[\-\*]','listblock');
3360cecf9d5Sandi        $this->Lexer->addPattern('\n\t{1,}[\-\*]','listblock');
3370cecf9d5Sandi
3380cecf9d5Sandi    }
3390cecf9d5Sandi
3400cecf9d5Sandi    function postConnect() {
3410cecf9d5Sandi        $this->Lexer->addExitPattern('\n','listblock');
3420cecf9d5Sandi    }
3430cecf9d5Sandi}
3440cecf9d5Sandi
3450cecf9d5Sandi//-------------------------------------------------------------------
3460cecf9d5Sandiclass Doku_Parser_Mode_Table extends Doku_Parser_Mode {
3470cecf9d5Sandi
3480cecf9d5Sandi    function Doku_Parser_Mode_Table() {
3490cecf9d5Sandi
3500cecf9d5Sandi        $this->allowedModes = array_merge (
3510cecf9d5Sandi                Doku_Parser_Formatting(),
3520cecf9d5Sandi                Doku_Parser_Substition(),
3530cecf9d5Sandi                Doku_Parser_Disabled()
3540cecf9d5Sandi            );
3550cecf9d5Sandi        $this->allowedModes[] = 'footnote';
3560cecf9d5Sandi        $this->allowedModes[] = 'preformatted';
3570cecf9d5Sandi        $this->allowedModes[] = 'unformatted';
3580cecf9d5Sandi    }
3590cecf9d5Sandi
3600cecf9d5Sandi    function connectTo($mode) {
3610cecf9d5Sandi        $this->Lexer->addEntryPattern('\n\^',$mode,'table');
3620cecf9d5Sandi        $this->Lexer->addEntryPattern('\n\|',$mode,'table');
3630cecf9d5Sandi    }
3640cecf9d5Sandi
3650cecf9d5Sandi    function postConnect() {
3660cecf9d5Sandi        $this->Lexer->addPattern('\n\^','table');
3670cecf9d5Sandi        $this->Lexer->addPattern('\n\|','table');
3680cecf9d5Sandi        $this->Lexer->addPattern(' {2,}','table');
3690cecf9d5Sandi        $this->Lexer->addPattern('\^','table');
3700cecf9d5Sandi        $this->Lexer->addPattern('\|','table');
3710cecf9d5Sandi        $this->Lexer->addExitPattern('\n','table');
3720cecf9d5Sandi    }
3730cecf9d5Sandi}
3740cecf9d5Sandi
3750cecf9d5Sandi//-------------------------------------------------------------------
3760cecf9d5Sandiclass Doku_Parser_Mode_Unformatted extends Doku_Parser_Mode {
3770cecf9d5Sandi
3780cecf9d5Sandi    function connectTo($mode) {
3790cecf9d5Sandi        $this->Lexer->addEntryPattern('<nowiki>(?=.*\x3C/nowiki\x3E)',$mode,'unformatted');
3800cecf9d5Sandi        $this->Lexer->addEntryPattern('%%(?=.*%%)',$mode,'unformattedalt');
3810cecf9d5Sandi    }
3820cecf9d5Sandi
3830cecf9d5Sandi    function postConnect() {
3840cecf9d5Sandi        $this->Lexer->addExitPattern('</nowiki>','unformatted');
3850cecf9d5Sandi        $this->Lexer->addExitPattern('%%','unformattedalt');
3860cecf9d5Sandi        $this->Lexer->mapHandler('unformattedalt','unformatted');
3870cecf9d5Sandi    }
3880cecf9d5Sandi
3890cecf9d5Sandi}
3900cecf9d5Sandi
3910cecf9d5Sandi//-------------------------------------------------------------------
3920cecf9d5Sandiclass Doku_Parser_Mode_PHP extends Doku_Parser_Mode {
3930cecf9d5Sandi
3940cecf9d5Sandi    function connectTo($mode) {
3950cecf9d5Sandi        $this->Lexer->addEntryPattern('<php>(?=.*\x3C/php\x3E)',$mode,'php');
3960cecf9d5Sandi    }
3970cecf9d5Sandi
3980cecf9d5Sandi    function postConnect() {
3990cecf9d5Sandi        $this->Lexer->addExitPattern('</php>','php');
4000cecf9d5Sandi    }
4010cecf9d5Sandi
4020cecf9d5Sandi}
4030cecf9d5Sandi
4040cecf9d5Sandi//-------------------------------------------------------------------
4050cecf9d5Sandiclass Doku_Parser_Mode_HTML extends Doku_Parser_Mode {
4060cecf9d5Sandi
4070cecf9d5Sandi    function connectTo($mode) {
4080cecf9d5Sandi        $this->Lexer->addEntryPattern('<html>(?=.*\x3C/html\x3E)',$mode,'html');
4090cecf9d5Sandi    }
4100cecf9d5Sandi
4110cecf9d5Sandi    function postConnect() {
4120cecf9d5Sandi        $this->Lexer->addExitPattern('</html>','html');
4130cecf9d5Sandi    }
4140cecf9d5Sandi
4150cecf9d5Sandi}
4160cecf9d5Sandi
4170cecf9d5Sandi//-------------------------------------------------------------------
4180cecf9d5Sandiclass Doku_Parser_Mode_Preformatted extends Doku_Parser_Mode {
4190cecf9d5Sandi
4200cecf9d5Sandi    function connectTo($mode) {
4210cecf9d5Sandi        // Has hard coded awareness of lists...
4220cecf9d5Sandi        $this->Lexer->addEntryPattern('\n  (?![\*\-])',$mode,'preformatted');
4230cecf9d5Sandi        $this->Lexer->addEntryPattern('\n\t(?![\*\-])',$mode,'preformatted');
4240cecf9d5Sandi
4250cecf9d5Sandi        // How to effect a sub pattern with the Lexer!
4260cecf9d5Sandi        $this->Lexer->addPattern('\n  ','preformatted');
4270cecf9d5Sandi        $this->Lexer->addPattern('\n\t','preformatted');
4280cecf9d5Sandi
4290cecf9d5Sandi    }
4300cecf9d5Sandi
4310cecf9d5Sandi    function postConnect() {
4320cecf9d5Sandi        $this->Lexer->addExitPattern('\n','preformatted');
4330cecf9d5Sandi    }
4340cecf9d5Sandi
4350cecf9d5Sandi}
4360cecf9d5Sandi
4370cecf9d5Sandi//-------------------------------------------------------------------
4380cecf9d5Sandiclass Doku_Parser_Mode_Code extends Doku_Parser_Mode {
4390cecf9d5Sandi
4400cecf9d5Sandi    function connectTo($mode) {
4410cecf9d5Sandi        $this->Lexer->addEntryPattern('<code(?=.*\x3C/code\x3E)',$mode,'code');
4420cecf9d5Sandi    }
4430cecf9d5Sandi
4440cecf9d5Sandi    function postConnect() {
4450cecf9d5Sandi        $this->Lexer->addExitPattern('</code>','code');
4460cecf9d5Sandi    }
4470cecf9d5Sandi
4480cecf9d5Sandi}
4490cecf9d5Sandi
4500cecf9d5Sandi//-------------------------------------------------------------------
4510cecf9d5Sandiclass Doku_Parser_Mode_File extends Doku_Parser_Mode {
4520cecf9d5Sandi
4530cecf9d5Sandi    function connectTo($mode) {
4540cecf9d5Sandi        $this->Lexer->addEntryPattern('<file>(?=.*\x3C/file\x3E)',$mode,'file');
4550cecf9d5Sandi    }
4560cecf9d5Sandi
4570cecf9d5Sandi    function postConnect() {
4580cecf9d5Sandi        $this->Lexer->addExitPattern('</file>','file');
4590cecf9d5Sandi    }
4600cecf9d5Sandi
4610cecf9d5Sandi}
4620cecf9d5Sandi
4630cecf9d5Sandi//-------------------------------------------------------------------
4640cecf9d5Sandiclass Doku_Parser_Mode_Quote extends Doku_Parser_Mode {
4650cecf9d5Sandi
4660cecf9d5Sandi    function Doku_Parser_Mode_Quote() {
4670cecf9d5Sandi
4680cecf9d5Sandi        $this->allowedModes = array_merge (
4690cecf9d5Sandi                Doku_Parser_Formatting(),
4700cecf9d5Sandi                Doku_Parser_Substition(),
4710cecf9d5Sandi                Doku_Parser_Disabled()
4720cecf9d5Sandi            );
4730cecf9d5Sandi            $this->allowedModes[] = 'footnote';
4740cecf9d5Sandi            $this->allowedModes[] = 'preformatted';
4750cecf9d5Sandi            $this->allowedModes[] = 'unformatted';
4760cecf9d5Sandi    }
4770cecf9d5Sandi
4780cecf9d5Sandi    function connectTo($mode) {
4790cecf9d5Sandi        $this->Lexer->addEntryPattern('\n>{1,}',$mode,'quote');
4800cecf9d5Sandi    }
4810cecf9d5Sandi
4820cecf9d5Sandi    function postConnect() {
4830cecf9d5Sandi        $this->Lexer->addPattern('\n>{1,}','quote');
4840cecf9d5Sandi        $this->Lexer->addExitPattern('\n','quote');
4850cecf9d5Sandi    }
4860cecf9d5Sandi
4870cecf9d5Sandi}
4880cecf9d5Sandi
4890cecf9d5Sandi//-------------------------------------------------------------------
4900cecf9d5Sandiclass Doku_Parser_Mode_Acronym extends Doku_Parser_Mode {
4910cecf9d5Sandi    // A list
4920cecf9d5Sandi    var $acronyms = array();
4930cecf9d5Sandi    var $pattern = '';
4940cecf9d5Sandi
4950cecf9d5Sandi    function Doku_Parser_Mode_Acronym($acronyms) {
4960cecf9d5Sandi        $this->acronyms = $acronyms;
4970cecf9d5Sandi    }
4980cecf9d5Sandi
4990cecf9d5Sandi    function preConnect() {
5000cecf9d5Sandi        $sep = '';
5010cecf9d5Sandi        foreach ( $this->acronyms as $acronym ) {
5020cecf9d5Sandi            $this->pattern .= $sep.'(?<=\b)'.Doku_Lexer_Escape($acronym).'(?=\b)';
5030cecf9d5Sandi            $sep = '|';
5040cecf9d5Sandi        }
5050cecf9d5Sandi    }
5060cecf9d5Sandi
5070cecf9d5Sandi    function connectTo($mode) {
5080cecf9d5Sandi        if ( strlen($this->pattern) > 0 ) {
5090cecf9d5Sandi            $this->Lexer->addSpecialPattern($this->pattern,$mode,'acronym');
5100cecf9d5Sandi        }
5110cecf9d5Sandi    }
5120cecf9d5Sandi
5130cecf9d5Sandi}
5140cecf9d5Sandi
5150cecf9d5Sandi//-------------------------------------------------------------------
5160cecf9d5Sandiclass Doku_Parser_Mode_Smiley extends Doku_Parser_Mode {
5170cecf9d5Sandi    // A list
5180cecf9d5Sandi    var $smileys = array();
5190cecf9d5Sandi    var $pattern = '';
5200cecf9d5Sandi
5210cecf9d5Sandi    function Doku_Parser_Mode_Smiley($smileys) {
5220cecf9d5Sandi        $this->smileys = $smileys;
5230cecf9d5Sandi    }
5240cecf9d5Sandi
5250cecf9d5Sandi    function preConnect() {
5260cecf9d5Sandi        $sep = '';
5270cecf9d5Sandi        foreach ( $this->smileys as $smiley ) {
5280cecf9d5Sandi            $this->pattern .= $sep.Doku_Lexer_Escape($smiley);
5290cecf9d5Sandi            $sep = '|';
5300cecf9d5Sandi        }
5310cecf9d5Sandi    }
5320cecf9d5Sandi
5330cecf9d5Sandi    function connectTo($mode) {
5340cecf9d5Sandi        if ( strlen($this->pattern) > 0 ) {
5350cecf9d5Sandi            $this->Lexer->addSpecialPattern($this->pattern,$mode,'smiley');
5360cecf9d5Sandi        }
5370cecf9d5Sandi    }
5380cecf9d5Sandi
5390cecf9d5Sandi}
5400cecf9d5Sandi
5410cecf9d5Sandi//-------------------------------------------------------------------
5420cecf9d5Sandiclass Doku_Parser_Mode_Wordblock extends Doku_Parser_Mode {
5430cecf9d5Sandi    // A list
5440cecf9d5Sandi    var $badwords = array();
5450cecf9d5Sandi    var $pattern = '';
5460cecf9d5Sandi
5470cecf9d5Sandi    function Doku_Parser_Mode_Wordblock($badwords) {
5480cecf9d5Sandi        $this->badwords = $badwords;
5490cecf9d5Sandi    }
5500cecf9d5Sandi
5510cecf9d5Sandi    function preConnect() {
5520cecf9d5Sandi
5530cecf9d5Sandi        if ( count($this->badwords) == 0 ) {
5540cecf9d5Sandi            return;
5550cecf9d5Sandi        }
5560cecf9d5Sandi
5570cecf9d5Sandi        $sep = '';
5580cecf9d5Sandi        foreach ( $this->badwords as $badword ) {
5590cecf9d5Sandi            $this->pattern .= $sep.'(?<=\b)(?i)'.Doku_Lexer_Escape($badword).'(?-i)(?=\b)';
5600cecf9d5Sandi            $sep = '|';
5610cecf9d5Sandi        }
5620cecf9d5Sandi
5630cecf9d5Sandi    }
5640cecf9d5Sandi
5650cecf9d5Sandi    function connectTo($mode) {
5660cecf9d5Sandi        if ( strlen($this->pattern) > 0 ) {
5670cecf9d5Sandi            $this->Lexer->addSpecialPattern($this->pattern,$mode,'wordblock');
5680cecf9d5Sandi        }
5690cecf9d5Sandi    }
5700cecf9d5Sandi
5710cecf9d5Sandi}
5720cecf9d5Sandi
5730cecf9d5Sandi//-------------------------------------------------------------------
5740cecf9d5Sandi/**
5754de671bcSandi* @TODO Quotes and 640x480 are not supported - just straight replacements here
5760cecf9d5Sandi*/
5770cecf9d5Sandiclass Doku_Parser_Mode_Entity extends Doku_Parser_Mode {
5780cecf9d5Sandi    // A list
5790cecf9d5Sandi    var $entities = array();
5800cecf9d5Sandi    var $pattern = '';
5810cecf9d5Sandi
5820cecf9d5Sandi    function Doku_Parser_Mode_Entity($entities) {
5830cecf9d5Sandi        $this->entities = $entities;
5840cecf9d5Sandi    }
5850cecf9d5Sandi
5860cecf9d5Sandi    function preConnect() {
5870cecf9d5Sandi        $sep = '';
5880cecf9d5Sandi        foreach ( $this->entities as $entity ) {
5890cecf9d5Sandi            $this->pattern .= $sep.Doku_Lexer_Escape($entity);
5900cecf9d5Sandi            $sep = '|';
5910cecf9d5Sandi        }
5920cecf9d5Sandi    }
5930cecf9d5Sandi
5940cecf9d5Sandi    function connectTo($mode) {
5950cecf9d5Sandi        if ( strlen($this->pattern) > 0 ) {
5960cecf9d5Sandi            $this->Lexer->addSpecialPattern($this->pattern,$mode,'entity');
5970cecf9d5Sandi        }
5980cecf9d5Sandi    }
5990cecf9d5Sandi
6000cecf9d5Sandi}
6010cecf9d5Sandi
6020cecf9d5Sandi//-------------------------------------------------------------------
6030cecf9d5Sandi// Implements the 640x480 replacement
6040cecf9d5Sandiclass Doku_Parser_Mode_MultiplyEntity extends Doku_Parser_Mode {
6050cecf9d5Sandi
6060cecf9d5Sandi    function connectTo($mode) {
6070cecf9d5Sandi
6080cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6090cecf9d5Sandi                    '(?<=\b)\d+[x|X]\d+(?=\b)',$mode,'multiplyentity'
6100cecf9d5Sandi                );
6110cecf9d5Sandi
6120cecf9d5Sandi    }
6130cecf9d5Sandi
6140cecf9d5Sandi}
6150cecf9d5Sandi
6160cecf9d5Sandi//-------------------------------------------------------------------
6170cecf9d5Sandiclass Doku_Parser_Mode_Quotes extends Doku_Parser_Mode {
6180cecf9d5Sandi
6190cecf9d5Sandi    function connectTo($mode) {
6200cecf9d5Sandi
6210cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6220cecf9d5Sandi                    '(?<=\s)\'(?=\S)',$mode,'singlequoteopening'
6230cecf9d5Sandi                );
6240cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6254de671bcSandi                    '(?<=^|\S)\'',$mode,'singlequoteclosing'
6260cecf9d5Sandi                );
6270cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6284de671bcSandi                    '(?<=^|\s)"(?=\S)',$mode,'doublequoteopening'
6290cecf9d5Sandi                );
6300cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6310cecf9d5Sandi                    '(?<=\S)"',$mode,'doublequoteclosing'
6320cecf9d5Sandi                );
6330cecf9d5Sandi
6340cecf9d5Sandi    }
6350cecf9d5Sandi
6360cecf9d5Sandi}
6370cecf9d5Sandi
6380cecf9d5Sandi//-------------------------------------------------------------------
6390cecf9d5Sandiclass Doku_Parser_Mode_CamelCaseLink extends Doku_Parser_Mode {
6400cecf9d5Sandi
6410cecf9d5Sandi    function connectTo($mode) {
6420cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6430cecf9d5Sandi                '\b[A-Z]+[a-z]+[A-Z][A-Za-z]*\b',$mode,'camelcaselink'
6440cecf9d5Sandi            );
6450cecf9d5Sandi    }
6460cecf9d5Sandi
6470cecf9d5Sandi}
6480cecf9d5Sandi
6490cecf9d5Sandi//-------------------------------------------------------------------
6500cecf9d5Sandiclass Doku_Parser_Mode_InternalLink extends Doku_Parser_Mode {
6510cecf9d5Sandi
6520cecf9d5Sandi    function connectTo($mode) {
6530cecf9d5Sandi        // Word boundaries?
6540cecf9d5Sandi        $this->Lexer->addSpecialPattern("\[\[[^\]]+?\]\]",$mode,'internallink');
6550cecf9d5Sandi    }
6560cecf9d5Sandi
6570cecf9d5Sandi}
6580cecf9d5Sandi
6590cecf9d5Sandi//-------------------------------------------------------------------
6600cecf9d5Sandiclass Doku_Parser_Mode_Media extends Doku_Parser_Mode {
6610cecf9d5Sandi
6620cecf9d5Sandi    function connectTo($mode) {
6630cecf9d5Sandi        // Word boundaries?
6640cecf9d5Sandi        $this->Lexer->addSpecialPattern("\{\{[^\}]+\}\}",$mode,'media');
6650cecf9d5Sandi    }
6660cecf9d5Sandi
6670cecf9d5Sandi}
6680cecf9d5Sandi
6690cecf9d5Sandi//-------------------------------------------------------------------
670b625487dSandiclass Doku_Parser_Mode_RSS extends Doku_Parser_Mode {
671b625487dSandi
672b625487dSandi    function connectTo($mode) {
673b625487dSandi        $this->Lexer->addSpecialPattern("\{\{rss>[^\}]+\}\}",$mode,'rss');
674b625487dSandi    }
675b625487dSandi
676b625487dSandi}
677b625487dSandi
678b625487dSandi//-------------------------------------------------------------------
6790cecf9d5Sandiclass Doku_Parser_Mode_ExternalLink extends Doku_Parser_Mode {
6800cecf9d5Sandi    var $schemes = array('http','https','telnet','gopher','wais','ftp','ed2k','irc');
6810cecf9d5Sandi    var $patterns = array();
6820cecf9d5Sandi
6830cecf9d5Sandi    function preConnect() {
6840cecf9d5Sandi
6850cecf9d5Sandi        $ltrs = '\w';
6860cecf9d5Sandi        $gunk = '/\#~:.?+=&%@!\-';
6870cecf9d5Sandi        $punc = '.:?\-;,';
6880cecf9d5Sandi        $host = $ltrs.$punc;
6890cecf9d5Sandi        $any  = $ltrs.$gunk.$punc;
6900cecf9d5Sandi
6910cecf9d5Sandi        foreach ( $this->schemes as $scheme ) {
6926f0c5dbfSandi            $this->patterns[] = '\b(?i)'.$scheme.'(?-i)://['.$any.']+?(?=['.$punc.']*[^'.$any.'])';
6930cecf9d5Sandi        }
6940cecf9d5Sandi
6956f0c5dbfSandi        $this->patterns[] = '\b(?i)www?(?-i)\.['.$host.']+?\.['.$host.']+?['.$any.']+?(?=['.$punc.']*[^'.$any.'])';
6966f0c5dbfSandi        $this->patterns[] = '\b(?i)ftp?(?-i)\.['.$host.']+?\.['.$host.']+?['.$any.']+?(?=['.$punc.']*[^'.$any.'])';
6970cecf9d5Sandi
6980cecf9d5Sandi    }
6990cecf9d5Sandi
7000cecf9d5Sandi    function connectTo($mode) {
7010cecf9d5Sandi        foreach ( $this->patterns as $pattern ) {
7020cecf9d5Sandi            $this->Lexer->addSpecialPattern($pattern,$mode,'externallink');
7030cecf9d5Sandi        }
7040cecf9d5Sandi    }
7050cecf9d5Sandi
7060cecf9d5Sandi}
7070cecf9d5Sandi
7080cecf9d5Sandi//-------------------------------------------------------------------
7090cecf9d5Sandiclass Doku_Parser_Mode_FileLink extends Doku_Parser_Mode {
7100cecf9d5Sandi
7110cecf9d5Sandi    var $pattern;
7120cecf9d5Sandi
7130cecf9d5Sandi    function preConnect() {
7140cecf9d5Sandi
7150cecf9d5Sandi        $ltrs = '\w';
7160cecf9d5Sandi        $gunk = '/\#~:.?+=&%@!\-';
7170cecf9d5Sandi        $punc = '.:?\-;,';
7180cecf9d5Sandi        $host = $ltrs.$punc;
7190cecf9d5Sandi        $any  = $ltrs.$gunk.$punc;
7200cecf9d5Sandi
7210cecf9d5Sandi        $this->pattern = '\b(?i)file(?-i)://['.$any.']+?['.
7220cecf9d5Sandi            $punc.']*[^'.$any.']';
7230cecf9d5Sandi    }
7240cecf9d5Sandi
7250cecf9d5Sandi    function connectTo($mode) {
7260cecf9d5Sandi        $this->Lexer->addSpecialPattern(
7270cecf9d5Sandi            $this->pattern,$mode,'filelink');
7280cecf9d5Sandi    }
7290cecf9d5Sandi
7300cecf9d5Sandi
7310cecf9d5Sandi}
7320cecf9d5Sandi
7330cecf9d5Sandi//-------------------------------------------------------------------
7340cecf9d5Sandiclass Doku_Parser_Mode_WindowsShareLink extends Doku_Parser_Mode {
7350cecf9d5Sandi
7360cecf9d5Sandi    var $pattern;
7370cecf9d5Sandi
7380cecf9d5Sandi    function preConnect() {
7390cecf9d5Sandi
7400cecf9d5Sandi        $ltrs = '\w';
7410cecf9d5Sandi        $gunk = '/\#~:.?+=&%@!\-';
7420cecf9d5Sandi        $punc = '.:?\-;,';
7430cecf9d5Sandi        $host = $ltrs.$punc;
7440cecf9d5Sandi        $any  = $ltrs.$gunk.$punc;
7450cecf9d5Sandi
7460cecf9d5Sandi        $this->pattern = "[$gunk$punc\s]\\\\\\\\[$host]+?\\\\[$any]+?[$punc]*[^$any]";
7470cecf9d5Sandi    }
7480cecf9d5Sandi
7490cecf9d5Sandi    function connectTo($mode) {
7500cecf9d5Sandi        $this->Lexer->addSpecialPattern(
7510cecf9d5Sandi            $this->pattern,$mode,'windowssharelink');
7520cecf9d5Sandi    }
7530cecf9d5Sandi
7540cecf9d5Sandi
7550cecf9d5Sandi}
7560cecf9d5Sandi
7570cecf9d5Sandi//-------------------------------------------------------------------
75871352defSandiclass Doku_Parser_Mode_EmailLink extends Doku_Parser_Mode {
7590cecf9d5Sandi
7600cecf9d5Sandi    function connectTo($mode) {
7610cecf9d5Sandi    //<([\w0-9\-_.]+?)@([\w\-]+\.([\w\-\.]+\.)*[\w]+)>
76271352defSandi        $this->Lexer->addSpecialPattern("<[\w0-9\-_.]+?@[\w\-]+\.[\w\-\.]+\.*[\w]+>",$mode,'emaillink');
7630cecf9d5Sandi    }
7640cecf9d5Sandi
7650cecf9d5Sandi}
7660cecf9d5Sandi
7670cecf9d5Sandi//-------------------------------------------------------------------
7680cecf9d5Sandi// Help fns to keep mode lists - used to make it easier to populate
7690cecf9d5Sandi// the list of modes another mode accepts
7700cecf9d5Sandi
7710cecf9d5Sandi// Can contain many other modes
7720cecf9d5Sandi// E.g. a footnote can containing formatting etc.
7730cecf9d5Sandifunction Doku_Parser_BlockContainers() {
7740cecf9d5Sandi    $modes = array(
7750cecf9d5Sandi        'footnote', 'listblock', 'table','quote',
7760cecf9d5Sandi        // hr breaks the principle but HRs should not be used in tables / lists
7770cecf9d5Sandi        // so put it here
7780cecf9d5Sandi        'hr',
7790cecf9d5Sandi    );
7800cecf9d5Sandi    return $modes;
7810cecf9d5Sandi}
7820cecf9d5Sandi
7830cecf9d5Sandi// Used to mark paragraph boundaries
7840cecf9d5Sandifunction Doku_Parser_Paragraphs() {
7850cecf9d5Sandi    $modes = array(
7860cecf9d5Sandi        'eol'
7870cecf9d5Sandi    );
7880cecf9d5Sandi    return $modes;
7890cecf9d5Sandi}
7900cecf9d5Sandi
7910cecf9d5Sandi// Can only be used by the base mode
7920cecf9d5Sandifunction Doku_Parser_BaseOnly() {
7930cecf9d5Sandi    $modes = array(
7940cecf9d5Sandi        'header'
7950cecf9d5Sandi    );
7960cecf9d5Sandi    return $modes;
7970cecf9d5Sandi}
7980cecf9d5Sandi
7990cecf9d5Sandi// "Styling" modes that format text.
8000cecf9d5Sandifunction Doku_Parser_Formatting($remove = '') {
8010cecf9d5Sandi    $modes = array(
8020cecf9d5Sandi        'strong', 'emphasis', 'underline', 'monospace',
8030cecf9d5Sandi        'subscript', 'superscript', 'deleted',
8040cecf9d5Sandi        );
8050cecf9d5Sandi    $key = array_search($remove, $modes);
8060cecf9d5Sandi    if ( is_int($key) ) {
8070cecf9d5Sandi        unset($modes[$key]);
8080cecf9d5Sandi    }
8090cecf9d5Sandi
8100cecf9d5Sandi    return $modes;
8110cecf9d5Sandi}
8120cecf9d5Sandi
8130cecf9d5Sandi// Modes where the token is simply replaced - contain no
8140cecf9d5Sandi// other modes
8150cecf9d5Sandifunction Doku_Parser_Substition() {
8160cecf9d5Sandi    $modes = array(
8170cecf9d5Sandi        'acronym','smiley','wordblock','entity','camelcaselink',
81871352defSandi        'internallink','media','externallink','linebreak','emaillink',
8190cecf9d5Sandi        'windowssharelink','filelink','notoc','multiplyentity',
820f1cf0e10Sandi        'quotes','rss',
8210cecf9d5Sandi    );
8220cecf9d5Sandi    return $modes;
8230cecf9d5Sandi}
8240cecf9d5Sandi
8250cecf9d5Sandi// Modes which have a start and end token but inside which
8260cecf9d5Sandi// no other modes should be applied
8270cecf9d5Sandifunction Doku_Parser_Protected() {
8280cecf9d5Sandi    $modes = array(
8290cecf9d5Sandi        'preformatted','code','file',
8300cecf9d5Sandi        'php','html','quote',
8310cecf9d5Sandi    );
8320cecf9d5Sandi    return $modes;
8330cecf9d5Sandi}
8340cecf9d5Sandi
8350cecf9d5Sandi// Disable wiki markup inside this mode
8360cecf9d5Sandifunction Doku_Parser_Disabled() {
8370cecf9d5Sandi    $modes = array(
8380cecf9d5Sandi        'unformatted'
8390cecf9d5Sandi    );
8400cecf9d5Sandi    return $modes;
8410cecf9d5Sandi}
8420cecf9d5Sandi
843340756e4Sandi
844b625487dSandi//Setup VIM: ex: et ts=4 enc=utf-8 :
845