xref: /dokuwiki/inc/parser/parser.php (revision 4de671bc5e749ac76ad85252df59feb45c749eab)
10cecf9d5Sandi<?php
20cecf9d5Sandi
30cecf9d5Sandiif(!defined('DOKU_INC')) define('DOKU_INC',realpath(dirname(__FILE__).'/../../').'/');
40cecf9d5Sandi
50cecf9d5Sandirequire_once DOKU_INC . 'inc/parser/lexer.php';
60cecf9d5Sandirequire_once DOKU_INC . 'inc/parser/handler.php';
70cecf9d5Sandi
80cecf9d5Sandi//-------------------------------------------------------------------
90cecf9d5Sandi
100cecf9d5Sandi/**
110cecf9d5Sandi* Sets up the Lexer with modes and points it to the Handler
120cecf9d5Sandi* For an intro to the Lexer see: wiki:parser
130cecf9d5Sandi*/
140cecf9d5Sandiclass Doku_Parser {
150cecf9d5Sandi
160cecf9d5Sandi    var $Handler;
170cecf9d5Sandi
180cecf9d5Sandi    var $Lexer;
190cecf9d5Sandi
200cecf9d5Sandi    var $modes = array();
210cecf9d5Sandi
220cecf9d5Sandi    var $connected = FALSE;
230cecf9d5Sandi
24b7c441b9SHarry Fuecks    function addBaseMode(& $BaseMode) {
25b7c441b9SHarry Fuecks        $this->modes['base'] = & $BaseMode;
260cecf9d5Sandi        if ( !$this->Lexer ) {
270cecf9d5Sandi            $this->Lexer = & new Doku_Lexer($this->Handler,'base', TRUE);
280cecf9d5Sandi        }
290cecf9d5Sandi        $this->modes['base']->Lexer = & $this->Lexer;
300cecf9d5Sandi    }
310cecf9d5Sandi
320cecf9d5Sandi    /**
330cecf9d5Sandi    * PHP preserves order of associative elements
340cecf9d5Sandi    * Mode sequence is important
350cecf9d5Sandi    */
360cecf9d5Sandi    function addMode($name, & $Mode) {
370cecf9d5Sandi        if ( !isset($this->modes['base']) ) {
38b7c441b9SHarry Fuecks            $this->addBaseMode(new Doku_Parser_Mode_Base());
390cecf9d5Sandi        }
400cecf9d5Sandi        $Mode->Lexer = & $this->Lexer;
410cecf9d5Sandi        $this->modes[$name] = & $Mode;
420cecf9d5Sandi    }
430cecf9d5Sandi
440cecf9d5Sandi    function connectModes() {
450cecf9d5Sandi
460cecf9d5Sandi        if ( $this->connected ) {
470cecf9d5Sandi            return;
480cecf9d5Sandi        }
490cecf9d5Sandi
500cecf9d5Sandi        foreach ( array_keys($this->modes) as $mode ) {
510cecf9d5Sandi
520cecf9d5Sandi            // Base isn't connected to anything
530cecf9d5Sandi            if ( $mode == 'base' ) {
540cecf9d5Sandi                continue;
550cecf9d5Sandi            }
560cecf9d5Sandi
570cecf9d5Sandi            $this->modes[$mode]->preConnect();
580cecf9d5Sandi
590cecf9d5Sandi            foreach ( array_keys($this->modes) as $cm ) {
600cecf9d5Sandi
610cecf9d5Sandi                if ( $this->modes[$cm]->accepts($mode) ) {
620cecf9d5Sandi                    $this->modes[$mode]->connectTo($cm);
630cecf9d5Sandi                }
640cecf9d5Sandi
650cecf9d5Sandi            }
660cecf9d5Sandi
670cecf9d5Sandi            $this->modes[$mode]->postConnect();
680cecf9d5Sandi        }
690cecf9d5Sandi
700cecf9d5Sandi        $this->connected = TRUE;
710cecf9d5Sandi    }
720cecf9d5Sandi
730cecf9d5Sandi    function parse($doc) {
740cecf9d5Sandi        if ( $this->Lexer ) {
750cecf9d5Sandi            $this->connectModes();
760cecf9d5Sandi            // Normalize CRs and pad doc
770cecf9d5Sandi            $doc = "\n".str_replace("\r\n","\n",$doc)."\n";
780cecf9d5Sandi            $this->Lexer->parse($doc);
790cecf9d5Sandi            $this->Handler->__finalize();
800cecf9d5Sandi            return $this->Handler->calls;
810cecf9d5Sandi        } else {
820cecf9d5Sandi            return FALSE;
830cecf9d5Sandi        }
840cecf9d5Sandi    }
850cecf9d5Sandi
860cecf9d5Sandi}
870cecf9d5Sandi
880cecf9d5Sandi//-------------------------------------------------------------------
890cecf9d5Sandi/**
900cecf9d5Sandi* This class and all the subclasses below are
910cecf9d5Sandi* used to reduce the effort required to register
920cecf9d5Sandi* modes with the Lexer. For performance these
930cecf9d5Sandi* could all be eliminated later perhaps, or
940cecf9d5Sandi* the Parser could be serialized to a file once
950cecf9d5Sandi* all modes are registered
960cecf9d5Sandi*/
970cecf9d5Sandiclass Doku_Parser_Mode {
980cecf9d5Sandi
990cecf9d5Sandi    var $Lexer;
1000cecf9d5Sandi
1010cecf9d5Sandi    var $allowedModes = array();
1020cecf9d5Sandi
1030cecf9d5Sandi    // Called before any calls to connectTo
1040cecf9d5Sandi    function preConnect() {}
1050cecf9d5Sandi
1060cecf9d5Sandi    function connectTo($mode) {}
1070cecf9d5Sandi
1080cecf9d5Sandi    // Called after all calls to connectTo
1090cecf9d5Sandi    function postConnect() {}
1100cecf9d5Sandi
1110cecf9d5Sandi    function accepts($mode) {
1120cecf9d5Sandi        return in_array($mode, $this->allowedModes );
1130cecf9d5Sandi    }
1140cecf9d5Sandi
1150cecf9d5Sandi}
1160cecf9d5Sandi
1170cecf9d5Sandi//-------------------------------------------------------------------
1180cecf9d5Sandiclass Doku_Parser_Mode_Base extends Doku_Parser_Mode {
1190cecf9d5Sandi
1200cecf9d5Sandi    function Doku_Parser_Mode_Base() {
1210cecf9d5Sandi
1220cecf9d5Sandi        $this->allowedModes = array_merge (
1230cecf9d5Sandi                Doku_Parser_BlockContainers(),
1240cecf9d5Sandi                Doku_Parser_BaseOnly(),
1250cecf9d5Sandi                Doku_Parser_Paragraphs(),
1260cecf9d5Sandi                Doku_Parser_Formatting(),
1270cecf9d5Sandi                Doku_Parser_Substition(),
1280cecf9d5Sandi                Doku_Parser_Protected(),
1290cecf9d5Sandi                Doku_Parser_Disabled()
1300cecf9d5Sandi            );
1310cecf9d5Sandi    }
1320cecf9d5Sandi}
1330cecf9d5Sandi
1340cecf9d5Sandi//-------------------------------------------------------------------
1350cecf9d5Sandiclass Doku_Parser_Mode_Footnote extends Doku_Parser_Mode {
1360cecf9d5Sandi
1370cecf9d5Sandi    function Doku_Parser_Mode_Footnote() {
1380cecf9d5Sandi
1390cecf9d5Sandi        $this->allowedModes = array_merge (
1400cecf9d5Sandi                Doku_Parser_BlockContainers(),
1410cecf9d5Sandi                Doku_Parser_Formatting(),
1420cecf9d5Sandi                Doku_Parser_Substition(),
1430cecf9d5Sandi                Doku_Parser_Protected(),
1440cecf9d5Sandi                Doku_Parser_Disabled()
1450cecf9d5Sandi            );
1460cecf9d5Sandi
1470cecf9d5Sandi    }
1480cecf9d5Sandi
1490cecf9d5Sandi    function connectTo($mode) {
1500cecf9d5Sandi        $this->Lexer->addEntryPattern(
1510cecf9d5Sandi            '\x28\x28(?=.*\x29\x29)',$mode,'footnote'
1520cecf9d5Sandi            );
1530cecf9d5Sandi    }
1540cecf9d5Sandi
1550cecf9d5Sandi    function postConnect() {
1560cecf9d5Sandi        $this->Lexer->addExitPattern(
1570cecf9d5Sandi            '\x29\x29','footnote'
1580cecf9d5Sandi            );
1590cecf9d5Sandi
1600cecf9d5Sandi    }
1610cecf9d5Sandi
1620cecf9d5Sandi}
1630cecf9d5Sandi
1640cecf9d5Sandi//-------------------------------------------------------------------
1650cecf9d5Sandiclass Doku_Parser_Mode_Header extends Doku_Parser_Mode {
1660cecf9d5Sandi
1670cecf9d5Sandi    function preConnect() {
1680cecf9d5Sandi
1690cecf9d5Sandi        // Header 1 is special case - match 6 or more
1700cecf9d5Sandi        $this->Lexer->addSpecialPattern(
1710cecf9d5Sandi                            '[ \t]*={6,}[^\n]+={6,}[ \t]*\n',
1720cecf9d5Sandi                            'base',
1730cecf9d5Sandi                            'header'
1740cecf9d5Sandi                        );
1750cecf9d5Sandi
1760cecf9d5Sandi        // For the rest, match exactly
1770cecf9d5Sandi        for ( $i = 5; $i > 1; $i--) {
1780cecf9d5Sandi            $this->Lexer->addSpecialPattern(
1790cecf9d5Sandi                                '[ \t]*={'.$i.'}[^\n]+={'.$i.'}[ \t]*\n',
1800cecf9d5Sandi                                'base',
1810cecf9d5Sandi                                'header'
1820cecf9d5Sandi                            );
1830cecf9d5Sandi        }
1840cecf9d5Sandi    }
1850cecf9d5Sandi
1860cecf9d5Sandi}
1870cecf9d5Sandi
1880cecf9d5Sandi//-------------------------------------------------------------------
1890cecf9d5Sandiclass Doku_Parser_Mode_NoToc extends Doku_Parser_Mode {
1900cecf9d5Sandi
1910cecf9d5Sandi    function connectTo($mode) {
1920cecf9d5Sandi        $this->Lexer->addSpecialPattern('~~NOTOC~~',$mode,'notoc');
1930cecf9d5Sandi    }
1940cecf9d5Sandi
1950cecf9d5Sandi}
1960cecf9d5Sandi
1970cecf9d5Sandi//-------------------------------------------------------------------
1980cecf9d5Sandiclass Doku_Parser_Mode_Linebreak extends Doku_Parser_Mode {
1990cecf9d5Sandi
2000cecf9d5Sandi    function connectTo($mode) {
2010cecf9d5Sandi        $this->Lexer->addSpecialPattern('\x5C{2}\s',$mode,'linebreak');
2020cecf9d5Sandi    }
2030cecf9d5Sandi}
2040cecf9d5Sandi
2050cecf9d5Sandi//-------------------------------------------------------------------
2060cecf9d5Sandiclass Doku_Parser_Mode_Eol extends Doku_Parser_Mode {
2070cecf9d5Sandi
2080cecf9d5Sandi    function connectTo($mode) {
2090cecf9d5Sandi        $badModes = array('listblock','table');
2100cecf9d5Sandi        if ( in_array($mode, $badModes) ) {
2110cecf9d5Sandi            return;
2120cecf9d5Sandi        }
2130cecf9d5Sandi        $this->Lexer->addSpecialPattern('\n',$mode,'eol');
2140cecf9d5Sandi    }
2150cecf9d5Sandi}
2160cecf9d5Sandi
2170cecf9d5Sandi//-------------------------------------------------------------------
2180cecf9d5Sandiclass Doku_Parser_Mode_HR extends Doku_Parser_Mode {
2190cecf9d5Sandi
2200cecf9d5Sandi    function connectTo($mode) {
2210cecf9d5Sandi        $this->Lexer->addSpecialPattern('\n[ \t]*-{4,}[ \t]*\n',$mode,'hr');
2220cecf9d5Sandi    }
2230cecf9d5Sandi
2240cecf9d5Sandi}
2250cecf9d5Sandi
2260cecf9d5Sandi//-------------------------------------------------------------------
2270cecf9d5Sandiclass Doku_Parser_Mode_Formatting extends Doku_Parser_Mode {
2280cecf9d5Sandi
2290cecf9d5Sandi    var $type;
2300cecf9d5Sandi
2310cecf9d5Sandi    var $formatting = array (
2320cecf9d5Sandi        'strong' => array (
2330cecf9d5Sandi            'entry'=>'\*\*(?=.*\*\*)',
2340cecf9d5Sandi            'exit'=>'\*\*',
2350cecf9d5Sandi            ),
2360cecf9d5Sandi
2370cecf9d5Sandi        'emphasis'=> array (
2380cecf9d5Sandi            'entry'=>'//(?=.*//)',
2390cecf9d5Sandi            'exit'=>'//',
2400cecf9d5Sandi            ),
2410cecf9d5Sandi
2420cecf9d5Sandi        'underline'=> array (
2430cecf9d5Sandi            'entry'=>'__(?=.*__)',
2440cecf9d5Sandi            'exit'=>'__',
2450cecf9d5Sandi            ),
2460cecf9d5Sandi
2470cecf9d5Sandi        'monospace'=> array (
2480cecf9d5Sandi            'entry'=>'\x27\x27(?=.*\x27\x27)',
2490cecf9d5Sandi            'exit'=>'\x27\x27',
2500cecf9d5Sandi            ),
2510cecf9d5Sandi
2520cecf9d5Sandi        'subscript'=> array (
2530cecf9d5Sandi            'entry'=>'<sub>(?=.*\x3C/sub\x3E)',
2540cecf9d5Sandi            'exit'=>'</sub>',
2550cecf9d5Sandi            ),
2560cecf9d5Sandi
2570cecf9d5Sandi        'superscript'=> array (
2580cecf9d5Sandi            'entry'=>'<sup>(?=.*\x3C/sup\x3E)',
2590cecf9d5Sandi            'exit'=>'</sup>',
2600cecf9d5Sandi            ),
2610cecf9d5Sandi
2620cecf9d5Sandi        'deleted'=> array (
2630cecf9d5Sandi            'entry'=>'<del>(?=.*\x3C/del\x3E)',
2640cecf9d5Sandi            'exit'=>'</del>',
2650cecf9d5Sandi            ),
2660cecf9d5Sandi        );
2670cecf9d5Sandi
2680cecf9d5Sandi    function Doku_Parser_Mode_Formatting($type) {
2690cecf9d5Sandi
2700cecf9d5Sandi        if ( !array_key_exists($type, $this->formatting) ) {
2710cecf9d5Sandi            trigger_error('Invalid formatting type '.$type, E_USER_WARNING);
2720cecf9d5Sandi        }
2730cecf9d5Sandi
2740cecf9d5Sandi        $this->type = $type;
2750cecf9d5Sandi
2760cecf9d5Sandi        $this->allowedModes = array_merge (
2770cecf9d5Sandi                Doku_Parser_Formatting($type),
2780cecf9d5Sandi                Doku_Parser_Substition(),
2790cecf9d5Sandi                Doku_Parser_Disabled()
2800cecf9d5Sandi            );
2810cecf9d5Sandi
2820cecf9d5Sandi    }
2830cecf9d5Sandi
2840cecf9d5Sandi    function connectTo($mode) {
2850cecf9d5Sandi
2860cecf9d5Sandi        // Can't nest formatting in itself
2870cecf9d5Sandi        if ( $mode == $this->type ) {
2880cecf9d5Sandi            return;
2890cecf9d5Sandi        }
2900cecf9d5Sandi
2910cecf9d5Sandi        $this->Lexer->addEntryPattern(
2920cecf9d5Sandi                $this->formatting[$this->type]['entry'],
2930cecf9d5Sandi                $mode,
2940cecf9d5Sandi                $this->type
2950cecf9d5Sandi            );
2960cecf9d5Sandi    }
2970cecf9d5Sandi
2980cecf9d5Sandi    function postConnect() {
2990cecf9d5Sandi
3000cecf9d5Sandi        $this->Lexer->addExitPattern(
3010cecf9d5Sandi            $this->formatting[$this->type]['exit'],
3020cecf9d5Sandi            $this->type
3030cecf9d5Sandi            );
3040cecf9d5Sandi
3050cecf9d5Sandi    }
3060cecf9d5Sandi}
3070cecf9d5Sandi
3080cecf9d5Sandi//-------------------------------------------------------------------
3090cecf9d5Sandiclass Doku_Parser_Mode_ListBlock extends Doku_Parser_Mode {
3100cecf9d5Sandi
3110cecf9d5Sandi    function Doku_Parser_Mode_ListBlock() {
3120cecf9d5Sandi
3130cecf9d5Sandi        $this->allowedModes = array_merge (
3140cecf9d5Sandi                Doku_Parser_Formatting(),
3150cecf9d5Sandi                Doku_Parser_Substition(),
3160cecf9d5Sandi                Doku_Parser_Disabled()
3170cecf9d5Sandi            );
3180cecf9d5Sandi        $this->allowedModes[] = 'footnote';
3190cecf9d5Sandi        $this->allowedModes[] = 'preformatted';
3200cecf9d5Sandi        $this->allowedModes[] = 'unformatted';
3210cecf9d5Sandi
3220cecf9d5Sandi    }
3230cecf9d5Sandi
3240cecf9d5Sandi    function connectTo($mode) {
3250cecf9d5Sandi        $this->Lexer->addEntryPattern('\n {2,}[\-\*]',$mode,'listblock');
3260cecf9d5Sandi        $this->Lexer->addEntryPattern('\n\t{1,}[\-\*]',$mode,'listblock');
3270cecf9d5Sandi
3280cecf9d5Sandi        $this->Lexer->addPattern('\n {2,}[\-\*]','listblock');
3290cecf9d5Sandi        $this->Lexer->addPattern('\n\t{1,}[\-\*]','listblock');
3300cecf9d5Sandi
3310cecf9d5Sandi    }
3320cecf9d5Sandi
3330cecf9d5Sandi    function postConnect() {
3340cecf9d5Sandi        $this->Lexer->addExitPattern('\n','listblock');
3350cecf9d5Sandi    }
3360cecf9d5Sandi}
3370cecf9d5Sandi
3380cecf9d5Sandi//-------------------------------------------------------------------
3390cecf9d5Sandiclass Doku_Parser_Mode_Table extends Doku_Parser_Mode {
3400cecf9d5Sandi
3410cecf9d5Sandi    function Doku_Parser_Mode_Table() {
3420cecf9d5Sandi
3430cecf9d5Sandi        $this->allowedModes = array_merge (
3440cecf9d5Sandi                Doku_Parser_Formatting(),
3450cecf9d5Sandi                Doku_Parser_Substition(),
3460cecf9d5Sandi                Doku_Parser_Disabled()
3470cecf9d5Sandi            );
3480cecf9d5Sandi        $this->allowedModes[] = 'footnote';
3490cecf9d5Sandi        $this->allowedModes[] = 'preformatted';
3500cecf9d5Sandi        $this->allowedModes[] = 'unformatted';
3510cecf9d5Sandi    }
3520cecf9d5Sandi
3530cecf9d5Sandi    function connectTo($mode) {
3540cecf9d5Sandi        $this->Lexer->addEntryPattern('\n\^',$mode,'table');
3550cecf9d5Sandi        $this->Lexer->addEntryPattern('\n\|',$mode,'table');
3560cecf9d5Sandi    }
3570cecf9d5Sandi
3580cecf9d5Sandi    function postConnect() {
3590cecf9d5Sandi        $this->Lexer->addPattern('\n\^','table');
3600cecf9d5Sandi        $this->Lexer->addPattern('\n\|','table');
3610cecf9d5Sandi        $this->Lexer->addPattern(' {2,}','table');
3620cecf9d5Sandi        $this->Lexer->addPattern('\^','table');
3630cecf9d5Sandi        $this->Lexer->addPattern('\|','table');
3640cecf9d5Sandi        $this->Lexer->addExitPattern('\n','table');
3650cecf9d5Sandi    }
3660cecf9d5Sandi}
3670cecf9d5Sandi
3680cecf9d5Sandi//-------------------------------------------------------------------
3690cecf9d5Sandiclass Doku_Parser_Mode_Unformatted extends Doku_Parser_Mode {
3700cecf9d5Sandi
3710cecf9d5Sandi    function connectTo($mode) {
3720cecf9d5Sandi        $this->Lexer->addEntryPattern('<nowiki>(?=.*\x3C/nowiki\x3E)',$mode,'unformatted');
3730cecf9d5Sandi        $this->Lexer->addEntryPattern('%%(?=.*%%)',$mode,'unformattedalt');
3740cecf9d5Sandi    }
3750cecf9d5Sandi
3760cecf9d5Sandi    function postConnect() {
3770cecf9d5Sandi        $this->Lexer->addExitPattern('</nowiki>','unformatted');
3780cecf9d5Sandi        $this->Lexer->addExitPattern('%%','unformattedalt');
3790cecf9d5Sandi        $this->Lexer->mapHandler('unformattedalt','unformatted');
3800cecf9d5Sandi    }
3810cecf9d5Sandi
3820cecf9d5Sandi}
3830cecf9d5Sandi
3840cecf9d5Sandi//-------------------------------------------------------------------
3850cecf9d5Sandiclass Doku_Parser_Mode_PHP extends Doku_Parser_Mode {
3860cecf9d5Sandi
3870cecf9d5Sandi    function connectTo($mode) {
3880cecf9d5Sandi        $this->Lexer->addEntryPattern('<php>(?=.*\x3C/php\x3E)',$mode,'php');
3890cecf9d5Sandi    }
3900cecf9d5Sandi
3910cecf9d5Sandi    function postConnect() {
3920cecf9d5Sandi        $this->Lexer->addExitPattern('</php>','php');
3930cecf9d5Sandi    }
3940cecf9d5Sandi
3950cecf9d5Sandi}
3960cecf9d5Sandi
3970cecf9d5Sandi//-------------------------------------------------------------------
3980cecf9d5Sandiclass Doku_Parser_Mode_HTML extends Doku_Parser_Mode {
3990cecf9d5Sandi
4000cecf9d5Sandi    function connectTo($mode) {
4010cecf9d5Sandi        $this->Lexer->addEntryPattern('<html>(?=.*\x3C/html\x3E)',$mode,'html');
4020cecf9d5Sandi    }
4030cecf9d5Sandi
4040cecf9d5Sandi    function postConnect() {
4050cecf9d5Sandi        $this->Lexer->addExitPattern('</html>','html');
4060cecf9d5Sandi    }
4070cecf9d5Sandi
4080cecf9d5Sandi}
4090cecf9d5Sandi
4100cecf9d5Sandi//-------------------------------------------------------------------
4110cecf9d5Sandiclass Doku_Parser_Mode_Preformatted extends Doku_Parser_Mode {
4120cecf9d5Sandi
4130cecf9d5Sandi    function connectTo($mode) {
4140cecf9d5Sandi        // Has hard coded awareness of lists...
4150cecf9d5Sandi        $this->Lexer->addEntryPattern('\n  (?![\*\-])',$mode,'preformatted');
4160cecf9d5Sandi        $this->Lexer->addEntryPattern('\n\t(?![\*\-])',$mode,'preformatted');
4170cecf9d5Sandi
4180cecf9d5Sandi        // How to effect a sub pattern with the Lexer!
4190cecf9d5Sandi        $this->Lexer->addPattern('\n  ','preformatted');
4200cecf9d5Sandi        $this->Lexer->addPattern('\n\t','preformatted');
4210cecf9d5Sandi
4220cecf9d5Sandi    }
4230cecf9d5Sandi
4240cecf9d5Sandi    function postConnect() {
4250cecf9d5Sandi        $this->Lexer->addExitPattern('\n','preformatted');
4260cecf9d5Sandi    }
4270cecf9d5Sandi
4280cecf9d5Sandi}
4290cecf9d5Sandi
4300cecf9d5Sandi//-------------------------------------------------------------------
4310cecf9d5Sandiclass Doku_Parser_Mode_Code extends Doku_Parser_Mode {
4320cecf9d5Sandi
4330cecf9d5Sandi    function connectTo($mode) {
4340cecf9d5Sandi        $this->Lexer->addEntryPattern('<code(?=.*\x3C/code\x3E)',$mode,'code');
4350cecf9d5Sandi    }
4360cecf9d5Sandi
4370cecf9d5Sandi    function postConnect() {
4380cecf9d5Sandi        $this->Lexer->addExitPattern('</code>','code');
4390cecf9d5Sandi    }
4400cecf9d5Sandi
4410cecf9d5Sandi}
4420cecf9d5Sandi
4430cecf9d5Sandi//-------------------------------------------------------------------
4440cecf9d5Sandiclass Doku_Parser_Mode_File extends Doku_Parser_Mode {
4450cecf9d5Sandi
4460cecf9d5Sandi    function connectTo($mode) {
4470cecf9d5Sandi        $this->Lexer->addEntryPattern('<file>(?=.*\x3C/file\x3E)',$mode,'file');
4480cecf9d5Sandi    }
4490cecf9d5Sandi
4500cecf9d5Sandi    function postConnect() {
4510cecf9d5Sandi        $this->Lexer->addExitPattern('</file>','file');
4520cecf9d5Sandi    }
4530cecf9d5Sandi
4540cecf9d5Sandi}
4550cecf9d5Sandi
4560cecf9d5Sandi//-------------------------------------------------------------------
4570cecf9d5Sandiclass Doku_Parser_Mode_Quote extends Doku_Parser_Mode {
4580cecf9d5Sandi
4590cecf9d5Sandi    function Doku_Parser_Mode_Quote() {
4600cecf9d5Sandi
4610cecf9d5Sandi        $this->allowedModes = array_merge (
4620cecf9d5Sandi                Doku_Parser_Formatting(),
4630cecf9d5Sandi                Doku_Parser_Substition(),
4640cecf9d5Sandi                Doku_Parser_Disabled()
4650cecf9d5Sandi            );
4660cecf9d5Sandi            $this->allowedModes[] = 'footnote';
4670cecf9d5Sandi            $this->allowedModes[] = 'preformatted';
4680cecf9d5Sandi            $this->allowedModes[] = 'unformatted';
4690cecf9d5Sandi    }
4700cecf9d5Sandi
4710cecf9d5Sandi    function connectTo($mode) {
4720cecf9d5Sandi        $this->Lexer->addEntryPattern('\n>{1,}',$mode,'quote');
4730cecf9d5Sandi    }
4740cecf9d5Sandi
4750cecf9d5Sandi    function postConnect() {
4760cecf9d5Sandi        $this->Lexer->addPattern('\n>{1,}','quote');
4770cecf9d5Sandi        $this->Lexer->addExitPattern('\n','quote');
4780cecf9d5Sandi    }
4790cecf9d5Sandi
4800cecf9d5Sandi}
4810cecf9d5Sandi
4820cecf9d5Sandi//-------------------------------------------------------------------
4830cecf9d5Sandiclass Doku_Parser_Mode_Acronym extends Doku_Parser_Mode {
4840cecf9d5Sandi    // A list
4850cecf9d5Sandi    var $acronyms = array();
4860cecf9d5Sandi    var $pattern = '';
4870cecf9d5Sandi
4880cecf9d5Sandi    function Doku_Parser_Mode_Acronym($acronyms) {
4890cecf9d5Sandi        $this->acronyms = $acronyms;
4900cecf9d5Sandi    }
4910cecf9d5Sandi
4920cecf9d5Sandi    function preConnect() {
4930cecf9d5Sandi        $sep = '';
4940cecf9d5Sandi        foreach ( $this->acronyms as $acronym ) {
4950cecf9d5Sandi            $this->pattern .= $sep.'(?<=\b)'.Doku_Lexer_Escape($acronym).'(?=\b)';
4960cecf9d5Sandi            $sep = '|';
4970cecf9d5Sandi        }
4980cecf9d5Sandi    }
4990cecf9d5Sandi
5000cecf9d5Sandi    function connectTo($mode) {
5010cecf9d5Sandi        if ( strlen($this->pattern) > 0 ) {
5020cecf9d5Sandi            $this->Lexer->addSpecialPattern($this->pattern,$mode,'acronym');
5030cecf9d5Sandi        }
5040cecf9d5Sandi    }
5050cecf9d5Sandi
5060cecf9d5Sandi}
5070cecf9d5Sandi
5080cecf9d5Sandi//-------------------------------------------------------------------
5090cecf9d5Sandiclass Doku_Parser_Mode_Smiley extends Doku_Parser_Mode {
5100cecf9d5Sandi    // A list
5110cecf9d5Sandi    var $smileys = array();
5120cecf9d5Sandi    var $pattern = '';
5130cecf9d5Sandi
5140cecf9d5Sandi    function Doku_Parser_Mode_Smiley($smileys) {
5150cecf9d5Sandi        $this->smileys = $smileys;
5160cecf9d5Sandi    }
5170cecf9d5Sandi
5180cecf9d5Sandi    function preConnect() {
5190cecf9d5Sandi        $sep = '';
5200cecf9d5Sandi        foreach ( $this->smileys as $smiley ) {
5210cecf9d5Sandi            $this->pattern .= $sep.Doku_Lexer_Escape($smiley);
5220cecf9d5Sandi            $sep = '|';
5230cecf9d5Sandi        }
5240cecf9d5Sandi    }
5250cecf9d5Sandi
5260cecf9d5Sandi    function connectTo($mode) {
5270cecf9d5Sandi        if ( strlen($this->pattern) > 0 ) {
5280cecf9d5Sandi            $this->Lexer->addSpecialPattern($this->pattern,$mode,'smiley');
5290cecf9d5Sandi        }
5300cecf9d5Sandi    }
5310cecf9d5Sandi
5320cecf9d5Sandi}
5330cecf9d5Sandi
5340cecf9d5Sandi//-------------------------------------------------------------------
5350cecf9d5Sandiclass Doku_Parser_Mode_Wordblock extends Doku_Parser_Mode {
5360cecf9d5Sandi    // A list
5370cecf9d5Sandi    var $badwords = array();
5380cecf9d5Sandi    var $pattern = '';
5390cecf9d5Sandi
5400cecf9d5Sandi    function Doku_Parser_Mode_Wordblock($badwords) {
5410cecf9d5Sandi        $this->badwords = $badwords;
5420cecf9d5Sandi    }
5430cecf9d5Sandi
5440cecf9d5Sandi    function preConnect() {
5450cecf9d5Sandi
5460cecf9d5Sandi        if ( count($this->badwords) == 0 ) {
5470cecf9d5Sandi            return;
5480cecf9d5Sandi        }
5490cecf9d5Sandi
5500cecf9d5Sandi        $sep = '';
5510cecf9d5Sandi        foreach ( $this->badwords as $badword ) {
5520cecf9d5Sandi            $this->pattern .= $sep.'(?<=\b)(?i)'.Doku_Lexer_Escape($badword).'(?-i)(?=\b)';
5530cecf9d5Sandi            $sep = '|';
5540cecf9d5Sandi        }
5550cecf9d5Sandi
5560cecf9d5Sandi    }
5570cecf9d5Sandi
5580cecf9d5Sandi    function connectTo($mode) {
5590cecf9d5Sandi        if ( strlen($this->pattern) > 0 ) {
5600cecf9d5Sandi            $this->Lexer->addSpecialPattern($this->pattern,$mode,'wordblock');
5610cecf9d5Sandi        }
5620cecf9d5Sandi    }
5630cecf9d5Sandi
5640cecf9d5Sandi}
5650cecf9d5Sandi
5660cecf9d5Sandi//-------------------------------------------------------------------
5670cecf9d5Sandi/**
568*4de671bcSandi* @TODO Quotes and 640x480 are not supported - just straight replacements here
5690cecf9d5Sandi*/
5700cecf9d5Sandiclass Doku_Parser_Mode_Entity extends Doku_Parser_Mode {
5710cecf9d5Sandi    // A list
5720cecf9d5Sandi    var $entities = array();
5730cecf9d5Sandi    var $pattern = '';
5740cecf9d5Sandi
5750cecf9d5Sandi    function Doku_Parser_Mode_Entity($entities) {
5760cecf9d5Sandi        $this->entities = $entities;
5770cecf9d5Sandi    }
5780cecf9d5Sandi
5790cecf9d5Sandi    function preConnect() {
5800cecf9d5Sandi        $sep = '';
5810cecf9d5Sandi        foreach ( $this->entities as $entity ) {
5820cecf9d5Sandi            $this->pattern .= $sep.Doku_Lexer_Escape($entity);
5830cecf9d5Sandi            $sep = '|';
5840cecf9d5Sandi        }
5850cecf9d5Sandi    }
5860cecf9d5Sandi
5870cecf9d5Sandi    function connectTo($mode) {
5880cecf9d5Sandi        if ( strlen($this->pattern) > 0 ) {
5890cecf9d5Sandi            $this->Lexer->addSpecialPattern($this->pattern,$mode,'entity');
5900cecf9d5Sandi        }
5910cecf9d5Sandi    }
5920cecf9d5Sandi
5930cecf9d5Sandi}
5940cecf9d5Sandi
5950cecf9d5Sandi//-------------------------------------------------------------------
5960cecf9d5Sandi// Implements the 640x480 replacement
5970cecf9d5Sandiclass Doku_Parser_Mode_MultiplyEntity extends Doku_Parser_Mode {
5980cecf9d5Sandi
5990cecf9d5Sandi    function connectTo($mode) {
6000cecf9d5Sandi
6010cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6020cecf9d5Sandi                    '(?<=\b)\d+[x|X]\d+(?=\b)',$mode,'multiplyentity'
6030cecf9d5Sandi                );
6040cecf9d5Sandi
6050cecf9d5Sandi    }
6060cecf9d5Sandi
6070cecf9d5Sandi}
6080cecf9d5Sandi
6090cecf9d5Sandi//-------------------------------------------------------------------
6100cecf9d5Sandiclass Doku_Parser_Mode_Quotes extends Doku_Parser_Mode {
6110cecf9d5Sandi
6120cecf9d5Sandi    function connectTo($mode) {
6130cecf9d5Sandi
6140cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6150cecf9d5Sandi                    '(?<=\s)\'(?=\S)',$mode,'singlequoteopening'
6160cecf9d5Sandi                );
6170cecf9d5Sandi        $this->Lexer->addSpecialPattern(
618*4de671bcSandi                    '(?<=^|\S)\'',$mode,'singlequoteclosing'
6190cecf9d5Sandi                );
6200cecf9d5Sandi        $this->Lexer->addSpecialPattern(
621*4de671bcSandi                    '(?<=^|\s)"(?=\S)',$mode,'doublequoteopening'
6220cecf9d5Sandi                );
6230cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6240cecf9d5Sandi                    '(?<=\S)"',$mode,'doublequoteclosing'
6250cecf9d5Sandi                );
6260cecf9d5Sandi
6270cecf9d5Sandi    }
6280cecf9d5Sandi
6290cecf9d5Sandi}
6300cecf9d5Sandi
6310cecf9d5Sandi//-------------------------------------------------------------------
6320cecf9d5Sandiclass Doku_Parser_Mode_CamelCaseLink extends Doku_Parser_Mode {
6330cecf9d5Sandi
6340cecf9d5Sandi    function connectTo($mode) {
6350cecf9d5Sandi        $this->Lexer->addSpecialPattern(
6360cecf9d5Sandi                '\b[A-Z]+[a-z]+[A-Z][A-Za-z]*\b',$mode,'camelcaselink'
6370cecf9d5Sandi            );
6380cecf9d5Sandi    }
6390cecf9d5Sandi
6400cecf9d5Sandi}
6410cecf9d5Sandi
6420cecf9d5Sandi//-------------------------------------------------------------------
6430cecf9d5Sandiclass Doku_Parser_Mode_InternalLink extends Doku_Parser_Mode {
6440cecf9d5Sandi
6450cecf9d5Sandi    function connectTo($mode) {
6460cecf9d5Sandi        // Word boundaries?
6470cecf9d5Sandi        $this->Lexer->addSpecialPattern("\[\[[^\]]+?\]\]",$mode,'internallink');
6480cecf9d5Sandi    }
6490cecf9d5Sandi
6500cecf9d5Sandi}
6510cecf9d5Sandi
6520cecf9d5Sandi//-------------------------------------------------------------------
6530cecf9d5Sandiclass Doku_Parser_Mode_Media extends Doku_Parser_Mode {
6540cecf9d5Sandi
6550cecf9d5Sandi    function connectTo($mode) {
6560cecf9d5Sandi        // Word boundaries?
6570cecf9d5Sandi        $this->Lexer->addSpecialPattern("\{\{[^\}]+\}\}",$mode,'media');
6580cecf9d5Sandi    }
6590cecf9d5Sandi
6600cecf9d5Sandi}
6610cecf9d5Sandi
6620cecf9d5Sandi//-------------------------------------------------------------------
6630cecf9d5Sandiclass Doku_Parser_Mode_ExternalLink extends Doku_Parser_Mode {
6640cecf9d5Sandi    var $schemes = array('http','https','telnet','gopher','wais','ftp','ed2k','irc');
6650cecf9d5Sandi    var $patterns = array();
6660cecf9d5Sandi
6670cecf9d5Sandi    function preConnect() {
6680cecf9d5Sandi
6690cecf9d5Sandi        $ltrs = '\w';
6700cecf9d5Sandi        $gunk = '/\#~:.?+=&%@!\-';
6710cecf9d5Sandi        $punc = '.:?\-;,';
6720cecf9d5Sandi        $host = $ltrs.$punc;
6730cecf9d5Sandi        $any  = $ltrs.$gunk.$punc;
6740cecf9d5Sandi
6750cecf9d5Sandi        foreach ( $this->schemes as $scheme ) {
6760cecf9d5Sandi            $this->patterns[] = '\b(?i)'.$scheme.'(?-i)://['.$any.']+?['.$punc.']*[^'.$any.']';
6770cecf9d5Sandi        }
6780cecf9d5Sandi
6790cecf9d5Sandi        $this->patterns[] = '\b(?i)www?(?-i)\.['.$host.']+?\.['.$host.']+?['.$any.']+?['.$punc.']*[^'.$any.']';
6800cecf9d5Sandi        $this->patterns[] = '\b(?i)ftp?(?-i)\.['.$host.']+?\.['.$host.']+?['.$any.']+?['.$punc.']*[^'.$any.']';
6810cecf9d5Sandi
6820cecf9d5Sandi    }
6830cecf9d5Sandi
6840cecf9d5Sandi    function connectTo($mode) {
6850cecf9d5Sandi        foreach ( $this->patterns as $pattern ) {
6860cecf9d5Sandi            $this->Lexer->addSpecialPattern($pattern,$mode,'externallink');
6870cecf9d5Sandi        }
6880cecf9d5Sandi    }
6890cecf9d5Sandi
6900cecf9d5Sandi}
6910cecf9d5Sandi
6920cecf9d5Sandi//-------------------------------------------------------------------
6930cecf9d5Sandiclass Doku_Parser_Mode_FileLink extends Doku_Parser_Mode {
6940cecf9d5Sandi
6950cecf9d5Sandi    var $pattern;
6960cecf9d5Sandi
6970cecf9d5Sandi    function preConnect() {
6980cecf9d5Sandi
6990cecf9d5Sandi        $ltrs = '\w';
7000cecf9d5Sandi        $gunk = '/\#~:.?+=&%@!\-';
7010cecf9d5Sandi        $punc = '.:?\-;,';
7020cecf9d5Sandi        $host = $ltrs.$punc;
7030cecf9d5Sandi        $any  = $ltrs.$gunk.$punc;
7040cecf9d5Sandi
7050cecf9d5Sandi        $this->pattern = '\b(?i)file(?-i)://['.$any.']+?['.
7060cecf9d5Sandi            $punc.']*[^'.$any.']';
7070cecf9d5Sandi    }
7080cecf9d5Sandi
7090cecf9d5Sandi    function connectTo($mode) {
7100cecf9d5Sandi        $this->Lexer->addSpecialPattern(
7110cecf9d5Sandi            $this->pattern,$mode,'filelink');
7120cecf9d5Sandi    }
7130cecf9d5Sandi
7140cecf9d5Sandi
7150cecf9d5Sandi}
7160cecf9d5Sandi
7170cecf9d5Sandi//-------------------------------------------------------------------
7180cecf9d5Sandiclass Doku_Parser_Mode_WindowsShareLink extends Doku_Parser_Mode {
7190cecf9d5Sandi
7200cecf9d5Sandi    var $pattern;
7210cecf9d5Sandi
7220cecf9d5Sandi    function preConnect() {
7230cecf9d5Sandi
7240cecf9d5Sandi        $ltrs = '\w';
7250cecf9d5Sandi        $gunk = '/\#~:.?+=&%@!\-';
7260cecf9d5Sandi        $punc = '.:?\-;,';
7270cecf9d5Sandi        $host = $ltrs.$punc;
7280cecf9d5Sandi        $any  = $ltrs.$gunk.$punc;
7290cecf9d5Sandi
7300cecf9d5Sandi        $this->pattern = "[$gunk$punc\s]\\\\\\\\[$host]+?\\\\[$any]+?[$punc]*[^$any]";
7310cecf9d5Sandi    }
7320cecf9d5Sandi
7330cecf9d5Sandi    function connectTo($mode) {
7340cecf9d5Sandi        $this->Lexer->addSpecialPattern(
7350cecf9d5Sandi            $this->pattern,$mode,'windowssharelink');
7360cecf9d5Sandi    }
7370cecf9d5Sandi
7380cecf9d5Sandi
7390cecf9d5Sandi}
7400cecf9d5Sandi
7410cecf9d5Sandi//-------------------------------------------------------------------
7420cecf9d5Sandiclass Doku_Parser_Mode_Email extends Doku_Parser_Mode {
7430cecf9d5Sandi
7440cecf9d5Sandi    function connectTo($mode) {
7450cecf9d5Sandi    //<([\w0-9\-_.]+?)@([\w\-]+\.([\w\-\.]+\.)*[\w]+)>
7460cecf9d5Sandi        $this->Lexer->addSpecialPattern("<[\w0-9\-_.]+?@[\w\-]+\.[\w\-\.]+\.*[\w]+>",$mode,'email');
7470cecf9d5Sandi    }
7480cecf9d5Sandi
7490cecf9d5Sandi}
7500cecf9d5Sandi
7510cecf9d5Sandi//-------------------------------------------------------------------
7520cecf9d5Sandi// Help fns to keep mode lists - used to make it easier to populate
7530cecf9d5Sandi// the list of modes another mode accepts
7540cecf9d5Sandi
7550cecf9d5Sandi// Can contain many other modes
7560cecf9d5Sandi// E.g. a footnote can containing formatting etc.
7570cecf9d5Sandifunction Doku_Parser_BlockContainers() {
7580cecf9d5Sandi    $modes = array(
7590cecf9d5Sandi        'footnote', 'listblock', 'table','quote',
7600cecf9d5Sandi        // hr breaks the principle but HRs should not be used in tables / lists
7610cecf9d5Sandi        // so put it here
7620cecf9d5Sandi        'hr',
7630cecf9d5Sandi    );
7640cecf9d5Sandi    return $modes;
7650cecf9d5Sandi}
7660cecf9d5Sandi
7670cecf9d5Sandi// Used to mark paragraph boundaries
7680cecf9d5Sandifunction Doku_Parser_Paragraphs() {
7690cecf9d5Sandi    $modes = array(
7700cecf9d5Sandi        'eol'
7710cecf9d5Sandi    );
7720cecf9d5Sandi    return $modes;
7730cecf9d5Sandi}
7740cecf9d5Sandi
7750cecf9d5Sandi// Can only be used by the base mode
7760cecf9d5Sandifunction Doku_Parser_BaseOnly() {
7770cecf9d5Sandi    $modes = array(
7780cecf9d5Sandi        'header'
7790cecf9d5Sandi    );
7800cecf9d5Sandi    return $modes;
7810cecf9d5Sandi}
7820cecf9d5Sandi
7830cecf9d5Sandi// "Styling" modes that format text.
7840cecf9d5Sandifunction Doku_Parser_Formatting($remove = '') {
7850cecf9d5Sandi    $modes = array(
7860cecf9d5Sandi        'strong', 'emphasis', 'underline', 'monospace',
7870cecf9d5Sandi        'subscript', 'superscript', 'deleted',
7880cecf9d5Sandi        );
7890cecf9d5Sandi    $key = array_search($remove, $modes);
7900cecf9d5Sandi    if ( is_int($key) ) {
7910cecf9d5Sandi        unset($modes[$key]);
7920cecf9d5Sandi    }
7930cecf9d5Sandi
7940cecf9d5Sandi    return $modes;
7950cecf9d5Sandi}
7960cecf9d5Sandi
7970cecf9d5Sandi// Modes where the token is simply replaced - contain no
7980cecf9d5Sandi// other modes
7990cecf9d5Sandifunction Doku_Parser_Substition() {
8000cecf9d5Sandi    $modes = array(
8010cecf9d5Sandi        'acronym','smiley','wordblock','entity','camelcaselink',
8020cecf9d5Sandi        'internallink','media','externallink','linebreak','email',
8030cecf9d5Sandi        'windowssharelink','filelink','notoc','multiplyentity',
8040cecf9d5Sandi        'quotes',
8050cecf9d5Sandi
8060cecf9d5Sandi    );
8070cecf9d5Sandi    return $modes;
8080cecf9d5Sandi}
8090cecf9d5Sandi
8100cecf9d5Sandi// Modes which have a start and end token but inside which
8110cecf9d5Sandi// no other modes should be applied
8120cecf9d5Sandifunction Doku_Parser_Protected() {
8130cecf9d5Sandi    $modes = array(
8140cecf9d5Sandi        'preformatted','code','file',
8150cecf9d5Sandi        'php','html','quote',
8160cecf9d5Sandi    );
8170cecf9d5Sandi    return $modes;
8180cecf9d5Sandi}
8190cecf9d5Sandi
8200cecf9d5Sandi// Disable wiki markup inside this mode
8210cecf9d5Sandifunction Doku_Parser_Disabled() {
8220cecf9d5Sandi    $modes = array(
8230cecf9d5Sandi        'unformatted'
8240cecf9d5Sandi    );
8250cecf9d5Sandi    return $modes;
8260cecf9d5Sandi}
8270cecf9d5Sandi
8280cecf9d5Sandi?>
829