16980370bSSascha Leib<?php 26980370bSSascha Leib 36980370bSSascha Leibuse dokuwiki\Extension\EventHandler; 46980370bSSascha Leibuse dokuwiki\Extension\Event; 55fbe88f7SSascha Leibuse dokuwiki\Logger; 66980370bSSascha Leib 76980370bSSascha Leib/** 87bd08c30SSascha Leib * Action Component for the Bot Monitoring Plugin 96980370bSSascha Leib * 106980370bSSascha Leib * @license GPL 3 (http://www.gnu.org/licenses/gpl.html) 116980370bSSascha Leib * @author Sascha Leib <sascha.leib(at)kolmio.com> 126980370bSSascha Leib */ 136980370bSSascha Leib 147bd08c30SSascha Leibclass action_plugin_botmon extends DokuWiki_Action_Plugin { 156980370bSSascha Leib 166980370bSSascha Leib /** 176980370bSSascha Leib * Registers a callback functions 186980370bSSascha Leib * 196980370bSSascha Leib * @param EventHandler $controller DokuWiki's event controller object 206980370bSSascha Leib * @return void 216980370bSSascha Leib */ 226980370bSSascha Leib public function register(EventHandler $controller) { 235f2c1759SSascha Leib 24e56d7b71SSascha Leib global $ACT; 25e56d7b71SSascha Leib 26d49ab213SSascha Leib // initialize the session id and type with random data: 27d49ab213SSascha Leib $this->sessionId = rand(1000000, 9999999); 28d49ab213SSascha Leib $this->sessionType = 'rnd'; 29d49ab213SSascha Leib 305f2c1759SSascha Leib // insert header data into the page: 31d49ab213SSascha Leib if ($ACT == 'show' || $ACT == 'edit' || $ACT == 'media') { 326980370bSSascha Leib $controller->register_hook('TPL_METAHEADER_OUTPUT', 'BEFORE', $this, 'insertHeader'); 33d49ab213SSascha Leib 34d49ab213SSascha Leib // Override the page rendering, if a captcha needs to be displayed: 35d49ab213SSascha Leib $controller->register_hook('TPL_ACT_RENDER', 'BEFORE', $this, 'showCaptcha'); 36d49ab213SSascha Leib 37e56d7b71SSascha Leib } else if ($ACT == 'admin' && isset($_REQUEST['page']) && $_REQUEST['page'] == 'botmon') { 38e56d7b71SSascha Leib $controller->register_hook('TPL_METAHEADER_OUTPUT', 'BEFORE', $this, 'insertAdminHeader'); 39e56d7b71SSascha Leib } 405f2c1759SSascha Leib 41d49ab213SSascha Leib // also show a captcha before the image preview 42d49ab213SSascha Leib $controller->register_hook('TPL_IMG_DISPLAY', 'BEFORE', $this, 'showImageCaptcha'); 43f5f4ca13SSascha Leib 445f2c1759SSascha Leib // write to the log after the page content was displayed: 455f2c1759SSascha Leib $controller->register_hook('TPL_CONTENT_DISPLAY', 'AFTER', $this, 'writeServerLog'); 465f2c1759SSascha Leib 476980370bSSascha Leib } 486980370bSSascha Leib 49b148c85eSSascha Leib /* session information */ 50f6a7ebc1SSascha Leib private $sessionId = null; 51f6a7ebc1SSascha Leib private $sessionType = ''; 522c641262SSascha Leib private $showCaptcha = '-'; 53b148c85eSSascha Leib 546980370bSSascha Leib /** 556980370bSSascha Leib * Inserts tracking code to the page header 56e56d7b71SSascha Leib * (only called on 'show' actions) 576980370bSSascha Leib * 586980370bSSascha Leib * @param Event $event event object by reference 596980370bSSascha Leib * @return void 606980370bSSascha Leib */ 616980370bSSascha Leib public function insertHeader(Event $event, $param) { 626980370bSSascha Leib 636980370bSSascha Leib global $INFO; 646980370bSSascha Leib 65b148c85eSSascha Leib // populate the session id and type: 66b148c85eSSascha Leib $this->getSessionInfo(); 67b148c85eSSascha Leib 686980370bSSascha Leib // build the tracker code: 69d49ab213SSascha Leib $code = $this->getBMHeader(); 706980370bSSascha Leib 715f2c1759SSascha Leib // add the deferred script loader:: 72e56d7b71SSascha Leib $code .= DOKU_TAB . DOKU_TAB . "addEventListener('DOMContentLoaded', function(){" . NL; 73e56d7b71SSascha Leib $code .= DOKU_TAB . DOKU_TAB . DOKU_TAB . "const e=document.createElement('script');" . NL; 74e56d7b71SSascha Leib $code .= DOKU_TAB . DOKU_TAB . DOKU_TAB . "e.async=true;e.defer=true;" . NL; 75e56d7b71SSascha Leib $code .= DOKU_TAB . DOKU_TAB . DOKU_TAB . "e.src='".DOKU_BASE."lib/plugins/botmon/client.js';" . NL; 76e56d7b71SSascha Leib $code .= DOKU_TAB . DOKU_TAB . DOKU_TAB . "document.getElementsByTagName('head')[0].appendChild(e);" . NL; 77e56d7b71SSascha Leib $code .= DOKU_TAB . DOKU_TAB . "});"; 785f2c1759SSascha Leib $event->data['script'][] = ['_data' => $code]; 79451abfadSSascha Leib } 80451abfadSSascha Leib 81d49ab213SSascha Leib /* create the BM object code for insertion into a script element: */ 82d49ab213SSascha Leib private function getBMHeader() { 83d49ab213SSascha Leib 84d49ab213SSascha Leib // build the tracker code: 85d49ab213SSascha Leib $code = DOKU_TAB . DOKU_TAB . "document._botmon = {t0: Date.now(), session: " . json_encode($this->sessionId) . ", seed: " . json_encode($this->getConf('captchaSeed')) . ", ip: " . json_encode($_SERVER['REMOTE_ADDR']) . "};" . NL; 86d49ab213SSascha Leib 87d49ab213SSascha Leib // is there a user logged in? 88d49ab213SSascha Leib $username = ( !empty($INFO['userinfo']) && !empty($INFO['userinfo']['name']) ? $INFO['userinfo']['name'] : ''); 89d49ab213SSascha Leib if ($username) { 90d49ab213SSascha Leib $code .= DOKU_TAB . DOKU_TAB . 'document._botmon.user = "' . $username . '";'. NL; 91d49ab213SSascha Leib } 92d49ab213SSascha Leib 93d49ab213SSascha Leib return $code; 94d49ab213SSascha Leib 95d49ab213SSascha Leib } 96d49ab213SSascha Leib 97451abfadSSascha Leib /** 98e56d7b71SSascha Leib * Inserts tracking code to the page header 99e56d7b71SSascha Leib * (only called on 'show' actions) 100e56d7b71SSascha Leib * 101e56d7b71SSascha Leib * @param Event $event event object by reference 102e56d7b71SSascha Leib * @return void 103e56d7b71SSascha Leib */ 104e56d7b71SSascha Leib public function insertAdminHeader(Event $event, $param) { 105e56d7b71SSascha Leib 106e56d7b71SSascha Leib $event->data['link'][] = ['rel' => 'stylesheet', 'href' => DOKU_BASE.'lib/plugins/botmon/admin.css', 'defer' => 'defer']; 1070edf1a56SSascha Leib $event->data['script'][] = ['src' => DOKU_BASE.'lib/plugins/botmon/admin.js', 'defer' => 'defer', '_data' => '']; 108e56d7b71SSascha Leib } 109e56d7b71SSascha Leib 110e56d7b71SSascha Leib /** 111451abfadSSascha Leib * Writes data to the server log. 112451abfadSSascha Leib * 113451abfadSSascha Leib * @return void 114451abfadSSascha Leib */ 1155f2c1759SSascha Leib public function writeServerLog(Event $event, $param) { 116451abfadSSascha Leib 117451abfadSSascha Leib global $conf; 118451abfadSSascha Leib global $INFO; 119091b5998SSascha Leib 1205f2c1759SSascha Leib // is there a user logged in? 1215f2c1759SSascha Leib $username = ( !empty($INFO['userinfo']) && !empty($INFO['userinfo']['name']) 1225f2c1759SSascha Leib ? $INFO['userinfo']['name'] : ''); 1235f2c1759SSascha Leib 124b2e3bd8bSSascha Leib // clean the page ID 125b2e3bd8bSSascha Leib $pageId = preg_replace('/[\x00-\x1F]/', "\u{FFFD}", $INFO['id'] ?? ''); 126b2e3bd8bSSascha Leib 127451abfadSSascha Leib // create the log array: 128cf9f7fe8SSascha Leib $logArr = Array( 129f5f4ca13SSascha Leib $_SERVER['REMOTE_ADDR'], /* remote IP */ 130b2e3bd8bSSascha Leib $pageId, /* page ID */ 131b148c85eSSascha Leib $this->sessionId, /* Session ID */ 132b148c85eSSascha Leib $this->sessionType, /* session ID type */ 1335f2c1759SSascha Leib $username, /* user name */ 1342f2bc93aSSascha Leib $_SERVER['HTTP_USER_AGENT'] ?? '', /* User agent */ 135451abfadSSascha Leib $_SERVER['HTTP_REFERER'] ?? '', /* HTTP Referrer */ 136451abfadSSascha Leib substr($conf['lang'],0,2), /* page language */ 137a93de874SSascha Leib implode(',', array_unique(array_map( function($it) { return substr(trim($it),0,2); }, explode(',',trim($_SERVER['HTTP_ACCEPT_LANGUAGE'], " \t;,*"))))), /* accepted client languages */ 1382c641262SSascha Leib $this->getCountryCode(), /* GeoIP country code */ 139d49ab213SSascha Leib $this->showCaptcha /* show captcha? */ 140d49ab213SSascha Leib ); 141cf9f7fe8SSascha Leib 142cf9f7fe8SSascha Leib //* create the log line */ 1434cddc661SSascha Leib $filename = __DIR__ .'/logs/' . gmdate('Y-m-d') . '.srv.txt'; /* use GMT date for filename */ 144cf9f7fe8SSascha Leib $logline = gmdate('Y-m-d H:i:s'); /* use GMT time for log entries */ 145cf9f7fe8SSascha Leib foreach ($logArr as $tab) { 146cf9f7fe8SSascha Leib $logline .= "\t" . $tab; 147cf9f7fe8SSascha Leib }; 148cf9f7fe8SSascha Leib 149cf9f7fe8SSascha Leib /* write the log line to the file */ 150cf9f7fe8SSascha Leib $logfile = fopen($filename, 'a'); 151cf9f7fe8SSascha Leib if (!$logfile) die(); 152cf9f7fe8SSascha Leib if (fwrite($logfile, $logline . "\n") === false) { 153cf9f7fe8SSascha Leib fclose($logfile); 154cf9f7fe8SSascha Leib die(); 1556980370bSSascha Leib } 156cf9f7fe8SSascha Leib 157cf9f7fe8SSascha Leib /* Done */ 158cf9f7fe8SSascha Leib fclose($logfile); 159cf9f7fe8SSascha Leib } 160b148c85eSSascha Leib 1615f2c1759SSascha Leib private function getCountryCode() { 1625f2c1759SSascha Leib 163f5f4ca13SSascha Leib $country = ( $_SERVER['REMOTE_ADDR'] == '127.0.0.1' ? 'local' : 'ZZ' ); // default if no geoip is available! 1645f2c1759SSascha Leib 1655f2c1759SSascha Leib $lib = $this->getConf('geoiplib'); /* which library to use? (can only be phpgeoip or disabled) */ 1665f2c1759SSascha Leib 1675f2c1759SSascha Leib try { 1685f2c1759SSascha Leib 1695f2c1759SSascha Leib // use GeoIP module? 1705f2c1759SSascha Leib if ($lib == 'phpgeoip' && extension_loaded('geoip') && geoip_db_avail(GEOIP_COUNTRY_EDITION)) { // Use PHP GeoIP module 1715f2c1759SSascha Leib $result = geoip_country_code_by_name($_SERVER['REMOTE_ADDR']); 1725f2c1759SSascha Leib $country = ($result ? $result : $country); 1735f2c1759SSascha Leib } 1745f2c1759SSascha Leib } catch (Exception $e) { 1755f2c1759SSascha Leib Logger::error('BotMon Plugin: GeoIP Error', $e->getMessage()); 1765f2c1759SSascha Leib } 1775f2c1759SSascha Leib 1785f2c1759SSascha Leib return $country; 1795f2c1759SSascha Leib } 1805f2c1759SSascha Leib 181b148c85eSSascha Leib private function getSessionInfo() { 182b148c85eSSascha Leib 183b148c85eSSascha Leib // what is the session identifier? 184b148c85eSSascha Leib if (isset($_SESSION)) { 185b148c85eSSascha Leib $sesKeys = array_keys($_SESSION); /* DokuWiki Session ID preferred */ 186b148c85eSSascha Leib foreach ($sesKeys as $key) { 187b148c85eSSascha Leib if (substr($key, 0, 2) == 'DW') { 188b148c85eSSascha Leib $this->sessionId = $key; 189b148c85eSSascha Leib $this->sessionType = 'dw'; 190b148c85eSSascha Leib return; 191b148c85eSSascha Leib } 192b148c85eSSascha Leib } 193b148c85eSSascha Leib } 194f6a7ebc1SSascha Leib if (!$this->sessionId) { /* no DokuWiki Session ID, try PHP session ID */ 195b148c85eSSascha Leib $this->sessionId = session_id(); 196b148c85eSSascha Leib $this->sessionType = 'php'; 197b148c85eSSascha Leib } 198f5f4ca13SSascha Leib if (!$this->sessionId) { /* no PHP session ID, try IP address */ 199f5f4ca13SSascha Leib $this->sessionId = $_SERVER['REMOTE_ADDR']; 200b148c85eSSascha Leib $this->sessionType = 'ip'; 201b148c85eSSascha Leib } 202b148c85eSSascha Leib } 203f5f4ca13SSascha Leib 204f5f4ca13SSascha Leib public function showCaptcha(Event $event) { 205f5f4ca13SSascha Leib 20612993035SSascha Leib $useCaptcha = $this->getConf('useCaptcha'); 207f5f4ca13SSascha Leib 208d49ab213SSascha Leib $cCode = '-'; 209d49ab213SSascha Leib if ($useCaptcha !== 'disabled') { 210d49ab213SSascha Leib if ($this->captchaWhitelisted()) { 211d49ab213SSascha Leib $cCode = 'W'; // whitelisted 212d49ab213SSascha Leib } elseif ($this->hasCaptchaCookie()) { 213d49ab213SSascha Leib $cCode = 'N'; // user already has a cookie 214d49ab213SSascha Leib } else { 215d49ab213SSascha Leib $cCode = 'Y'; // show the captcha 2162c641262SSascha Leib 2172c641262SSascha Leib 21812993035SSascha Leib echo '<h1 class="sectionedit1">'; tpl_pagetitle(); echo "</h1>\n"; // always show the original page title 219f5f4ca13SSascha Leib $event->preventDefault(); // don't show normal content 22012993035SSascha Leib switch ($useCaptcha) { 22112993035SSascha Leib case 'blank': 22212993035SSascha Leib $this->insertBlankBox(); // show dada filler instead of text 22312993035SSascha Leib break; 22412993035SSascha Leib case 'dada': 22512993035SSascha Leib $this->insertDadaFiller(); // show dada filler instead of text 22612993035SSascha Leib break; 22712993035SSascha Leib } 228f5f4ca13SSascha Leib $this->insertCaptchaLoader(); // and load the captcha 229f5f4ca13SSascha Leib } 230f5f4ca13SSascha Leib } 231d49ab213SSascha Leib $this->showCaptcha = $cCode; // store the captcha code for the logfile 232d49ab213SSascha Leib 233d49ab213SSascha Leib } 234f5f4ca13SSascha Leib 235d49ab213SSascha Leib public function showImageCaptcha(Event $event, $param) { 236d49ab213SSascha Leib 237d49ab213SSascha Leib $useCaptcha = $this->getConf('useCaptcha'); 238d49ab213SSascha Leib 239d49ab213SSascha Leib echo '<script>' . $this->getBMHeader($event, $param) . '</script>'; 240d49ab213SSascha Leib 241d49ab213SSascha Leib $cCode = '-'; 242d49ab213SSascha Leib if ($useCaptcha !== 'disabled') { 243d49ab213SSascha Leib if ($this->captchaWhitelisted()) { 244d49ab213SSascha Leib $cCode = 'W'; // whitelisted 245d49ab213SSascha Leib } 246d49ab213SSascha Leib elseif ($this->hasCaptchaCookie()) { 247d49ab213SSascha Leib $cCode = 'N'; // user already has a cookie 248d49ab213SSascha Leib } 249d49ab213SSascha Leib else { 250d49ab213SSascha Leib $cCode = 'Y'; // show the captcha 251d49ab213SSascha Leib 252d49ab213SSascha Leib echo '<svg width="100%" height="100%" viewBox="0 0 800 400" version="1.1" xmlns="http://www.w3.org/2000/svg"><path d="M1,1l798,398" style="fill:none;stroke:#f00;stroke-width:1px;"/><path d="M1,399l798,-398" style="fill:none;stroke:#f00;stroke-width:1px;"/><rect x="1" y="1" width="798" height="398" style="fill:none;stroke:#000;stroke-width:1px;"/></svg>'; // placeholder image 253d49ab213SSascha Leib $event->preventDefault(); // don't show normal content 254d49ab213SSascha Leib 255d49ab213SSascha Leib // TODO Insert dummy image 256d49ab213SSascha Leib $this->insertCaptchaLoader(); // and load the captcha 257d49ab213SSascha Leib } 258d49ab213SSascha Leib }; 259d49ab213SSascha Leib 260d49ab213SSascha Leib $this->showCaptcha = $cCode; // store the captcha code for the logfile 261d49ab213SSascha Leib } 262d49ab213SSascha Leib 263d49ab213SSascha Leib private function hasCaptchaCookie() { 264f5f4ca13SSascha Leib 265cdc02cd4SSascha Leib $cookieVal = isset($_COOKIE['DWConfirm']) ? $_COOKIE['DWConfirm'] : null; 266f5f4ca13SSascha Leib 267cdc02cd4SSascha Leib $today = substr((new DateTime())->format('c'), 0, 10); 26812993035SSascha Leib 269cdc02cd4SSascha Leib $raw = $this->getConf('captchaSeed') . '|' . $_SERVER['SERVER_NAME'] . '|' . $_SERVER['REMOTE_ADDR'] . '|' . $today; 270cdc02cd4SSascha Leib $expected = hash('sha256', $raw); 27112993035SSascha Leib 272cdc02cd4SSascha Leib //echo '<ul><li>cookie: ' . $cookieVal . '</li><li>expected: ' . $expected . '</li><li>matches: ' .($cookieVal == $expected ? 'true' : 'false') . '</li></ul>'; 273cdc02cd4SSascha Leib 274d49ab213SSascha Leib return $cookieVal == $expected; 275f5f4ca13SSascha Leib } 276f5f4ca13SSascha Leib 2772c641262SSascha Leib // check if the visitor's IP is on a whitelist: 2782c641262SSascha Leib private function captchaWhitelisted() { 2792c641262SSascha Leib 2802c641262SSascha Leib // normalise IP address: 2812c641262SSascha Leib $ip = inet_pton($_SERVER['REMOTE_ADDR']); 2822c641262SSascha Leib 2832c641262SSascha Leib // find which file to open: 2842c641262SSascha Leib $prefixes = ['user', 'default']; 2852c641262SSascha Leib foreach ($prefixes as $pre) { 2862c641262SSascha Leib $filename = __DIR__ .'/config/' . $pre . '-whitelist.txt'; 2872c641262SSascha Leib if (file_exists($filename)) { 2882c641262SSascha Leib break; 2892c641262SSascha Leib } 2902c641262SSascha Leib } 2912c641262SSascha Leib 2922c641262SSascha Leib if (file_exists($filename)) { 2932c641262SSascha Leib $lines = file($filename, FILE_SKIP_EMPTY_LINES); 2942c641262SSascha Leib foreach ($lines as $line) { 2952c641262SSascha Leib if (trim($line) !== '' && !str_starts_with($line, '#')) { 2962c641262SSascha Leib $col = explode("\t", $line); 2972c641262SSascha Leib if (count($col) >= 2) { 2982c641262SSascha Leib $from = inet_pton($col[0]); 2992c641262SSascha Leib $to = inet_pton($col[1]); 3002c641262SSascha Leib 3012c641262SSascha Leib if ($ip >= $from && $ip <= $to) { 302d49ab213SSascha Leib return true; /* IP whitelisted */ 3032c641262SSascha Leib } 3042c641262SSascha Leib } 3052c641262SSascha Leib } 3062c641262SSascha Leib } 3072c641262SSascha Leib } 308d49ab213SSascha Leib return false; /* IP not found in whitelist */ 3092c641262SSascha Leib } 3102c641262SSascha Leib 311f5f4ca13SSascha Leib private function insertCaptchaLoader() { 312*620d9253SSascha Leib 31312993035SSascha Leib echo '<script>' . NL; 31412993035SSascha Leib 31512993035SSascha Leib // add the deferred script loader:: 31612993035SSascha Leib echo DOKU_TAB . "addEventListener('DOMContentLoaded', function(){" . NL; 31712993035SSascha Leib echo DOKU_TAB . DOKU_TAB . "const cj=document.createElement('script');" . NL; 31812993035SSascha Leib echo DOKU_TAB . DOKU_TAB . "cj.async=true;cj.defer=true;cj.type='text/javascript';" . NL; 31912993035SSascha Leib echo DOKU_TAB . DOKU_TAB . "cj.src='".DOKU_BASE."lib/plugins/botmon/captcha.js';" . NL; 32012993035SSascha Leib echo DOKU_TAB . DOKU_TAB . "document.getElementsByTagName('head')[0].appendChild(cj);" . NL; 32112993035SSascha Leib echo DOKU_TAB . "});"; 322*620d9253SSascha Leib 323*620d9253SSascha Leib // add the locales for the captcha: 324*620d9253SSascha Leib echo DOKU_TAB . '$BMLocales = {' . NL; 325*620d9253SSascha Leib echo DOKU_TAB . DOKU_TAB . '"dlgTitle": ' . json_encode($this->getLang('bm_dlgTitle')) . ',' . NL; 326*620d9253SSascha Leib echo DOKU_TAB . DOKU_TAB . '"dlgSubtitle": ' . json_encode($this->getLang('bm_dlgSubtitle')) . ',' . NL; 327*620d9253SSascha Leib echo DOKU_TAB . DOKU_TAB . '"dlgConfirm": ' . json_encode($this->getLang('bm_dlgConfirm')) . ',' . NL; 328*620d9253SSascha Leib echo DOKU_TAB . DOKU_TAB . '"dlgChecking": ' . json_encode($this->getLang('bm_dlgChecking')) . ',' . NL; 329*620d9253SSascha Leib echo DOKU_TAB . DOKU_TAB . '"dlgLoading": ' . json_encode($this->getLang('bm_dlgLoading')) . ',' . NL; 330*620d9253SSascha Leib echo DOKU_TAB . DOKU_TAB . '"dlgError": ' . json_encode($this->getLang('bm_dlgError')) . ',' . NL; 331*620d9253SSascha Leib echo DOKU_TAB . '};' . NL; 332*620d9253SSascha Leib 33312993035SSascha Leib echo '</script>' . NL; 334f5f4ca13SSascha Leib 335f5f4ca13SSascha Leib } 336f5f4ca13SSascha Leib 33712993035SSascha Leib // inserts a blank box to ensure there is enough space for the captcha: 33812993035SSascha Leib private function insertBlankBox() { 33912993035SSascha Leib 34012993035SSascha Leib echo '<p style="min-height: 100px;"> </p>'; 34112993035SSascha Leib } 34212993035SSascha Leib 34312993035SSascha Leib /* Generates a few paragraphs of Dada text to show instead of the article content */ 344f5f4ca13SSascha Leib private function insertDadaFiller() { 345f5f4ca13SSascha Leib 34612993035SSascha Leib global $conf; 34712993035SSascha Leib global $TOC; 34812993035SSascha Leib global $ID; 349f5f4ca13SSascha Leib 35012993035SSascha Leib // list of languages to search for the wordlist 35112993035SSascha Leib $langs = array_unique([$conf['lang'], 'la']); 352f5f4ca13SSascha Leib 35312993035SSascha Leib // find path to the first available wordlist: 35412993035SSascha Leib foreach ($langs as $lang) { 35512993035SSascha Leib $filename = __DIR__ .'/lang/' . $lang . '/wordlist.txt'; /* language-specific wordlist */ 35612993035SSascha Leib if (file_exists($filename)) { 35712993035SSascha Leib break; 35812993035SSascha Leib } 35912993035SSascha Leib } 360f5f4ca13SSascha Leib 36112993035SSascha Leib // load the wordlist file: 36212993035SSascha Leib if (file_exists($filename)) { 36312993035SSascha Leib $words = array(); 36412993035SSascha Leib $totalWeight = 0; 36512993035SSascha Leib $lines = file($filename, FILE_SKIP_EMPTY_LINES); 36612993035SSascha Leib foreach ($lines as $line) { 36712993035SSascha Leib $arr = explode("\t", $line); 36812993035SSascha Leib $arr[1] = ( count($arr) > 1 ? (int) trim($arr[1]) : 1 ); 36912993035SSascha Leib $totalWeight += (int) $arr[1]; 37012993035SSascha Leib array_push($words, $arr); 37112993035SSascha Leib } 37212993035SSascha Leib } else { 37312993035SSascha Leib echo '<script> console.log("Can’t generate filler text: wordlist file not found!"); </script>'; 37412993035SSascha Leib return; 37512993035SSascha Leib } 376f5f4ca13SSascha Leib 37712993035SSascha Leib // If a TOC exists, use it for the headlines: 37812993035SSascha Leib if(is_array($TOC)) { 37912993035SSascha Leib $toc = $TOC; 38012993035SSascha Leib } else { 38112993035SSascha Leib $meta = p_get_metadata($ID, '', METADATA_RENDER_USING_CACHE); 38212993035SSascha Leib //$tocok = (isset($meta['internal']['toc']) ? $meta['internal']['toc'] : $tocok = true); 38312993035SSascha Leib $toc = isset($meta['description']['tableofcontents']) ? $meta['description']['tableofcontents'] : null; 38412993035SSascha Leib } 38512993035SSascha Leib if (!$toc) { // no TOC, generate my own: 38612993035SSascha Leib $hlCount = mt_rand(0, (int) $conf['tocminheads']); 38712993035SSascha Leib $toc = array(); 38812993035SSascha Leib for ($i=0; $i<$hlCount; $i++) { 38912993035SSascha Leib array_push($toc, $this->dadaMakeHeadline($words, $totalWeight)); // $toc 39012993035SSascha Leib } 39112993035SSascha Leib } 39212993035SSascha Leib 39312993035SSascha Leib // if H1 heading is not in the TOC, add a chappeau section: 39412993035SSascha Leib $chapeauCount = mt_rand(1, 3); 39512993035SSascha Leib if ((int) $conf['toptoclevel'] > 1) { 39612993035SSascha Leib echo "<div class=\"level1\">\n"; 39712993035SSascha Leib for ($i=0; $i<$chapeauCount; $i++) { 39812993035SSascha Leib echo $this->dadaMakeParagraph($words, $totalWeight); 39912993035SSascha Leib } 40012993035SSascha Leib echo "</div>\n"; 40112993035SSascha Leib } 40212993035SSascha Leib 40312993035SSascha Leib // text sections for each sub-headline: 40412993035SSascha Leib foreach ($toc as $hl) { 40512993035SSascha Leib echo $this->dadaMakeSection($words, $totalWeight, $hl); 40612993035SSascha Leib } 40712993035SSascha Leib } 40812993035SSascha Leib 40912993035SSascha Leib private function dadaMakeSection($words, $totalWeight, $hl) { 41012993035SSascha Leib 41112993035SSascha Leib global $conf; 41212993035SSascha Leib 41312993035SSascha Leib // how many paragraphs? 41412993035SSascha Leib $paragraphCount = mt_rand(1, 4); 41512993035SSascha Leib 41612993035SSascha Leib // section level 41712993035SSascha Leib $topTocLevel = (int) $conf['toptoclevel']; 41812993035SSascha Leib $secLevel = $hl['level'] + 1;; 41912993035SSascha Leib 42012993035SSascha Leib // return value: 42112993035SSascha Leib $sec = ""; 42212993035SSascha Leib 42312993035SSascha Leib // make a headline: 42412993035SSascha Leib if ($topTocLevel > 1 || $secLevel > 1) { 42512993035SSascha Leib $sec .= "<h{$secLevel} id=\"{$hl['hid']}\">{$hl['title']}</h{$secLevel}>\n"; 42612993035SSascha Leib } 42712993035SSascha Leib 42812993035SSascha Leib // add the paragraphs: 42912993035SSascha Leib $sec .= "<div class=\"level{$secLevel}\">\n"; 43012993035SSascha Leib for ($i=0; $i<$paragraphCount; $i++) { 43112993035SSascha Leib $sec .= $this->dadaMakeParagraph($words, $totalWeight); 43212993035SSascha Leib } 43312993035SSascha Leib $sec .= "</div>\n"; 43412993035SSascha Leib 43512993035SSascha Leib return $sec; 43612993035SSascha Leib } 43712993035SSascha Leib 43812993035SSascha Leib private function dadaMakeHeadline($words, $totalWeight) { 43912993035SSascha Leib 44012993035SSascha Leib // how many words to generate? 44112993035SSascha Leib $wordCount = mt_rand(2, 5); 44212993035SSascha Leib 44312993035SSascha Leib // function returns an array: 44412993035SSascha Leib $r = Array(); 44512993035SSascha Leib 44612993035SSascha Leib // generate the headline: 44712993035SSascha Leib $hlArr = array(); 44812993035SSascha Leib for ($i=0; $i<$wordCount; $i++) { 44912993035SSascha Leib array_push($hlArr, $this->dadaSelectRandomWord($words, $totalWeight)); 45012993035SSascha Leib } 45112993035SSascha Leib 45212993035SSascha Leib $r['title'] = ucfirst(implode(' ', $hlArr)); 45312993035SSascha Leib 45412993035SSascha Leib $r['hid'] = preg_replace('/[^\w\d\-]+/i', '_', strtolower($r['title'])); 45512993035SSascha Leib $r['type'] = 'ul'; // always ul! 45612993035SSascha Leib $r['level'] = 1; // always level 1 for now 45712993035SSascha Leib 45812993035SSascha Leib return $r; 45912993035SSascha Leib } 46012993035SSascha Leib 46112993035SSascha Leib private function dadaMakeParagraph($words, $totalWeight) { 46212993035SSascha Leib 46312993035SSascha Leib // how many words to generate? 46412993035SSascha Leib $sentenceCount = mt_rand(2, 5); 46512993035SSascha Leib 46612993035SSascha Leib $paragraph = array(); 46712993035SSascha Leib for ($i=0; $i<$sentenceCount; $i++) { 46812993035SSascha Leib array_push($paragraph, $this->dadaMakeSentence($words, $totalWeight)); 46912993035SSascha Leib } 47012993035SSascha Leib 47112993035SSascha Leib return "<p>\n" . implode(' ', $paragraph) . "\n</p>\n"; 47212993035SSascha Leib 47312993035SSascha Leib } 47412993035SSascha Leib 47512993035SSascha Leib private function dadaMakeSentence($words, $totalWeight) { 47612993035SSascha Leib 47712993035SSascha Leib // how many words to generate? 47812993035SSascha Leib $wordCount = mt_rand(4, 20); 47912993035SSascha Leib 48012993035SSascha Leib // generate the sentence: 48112993035SSascha Leib $sentence = array(); 48212993035SSascha Leib for ($i=0; $i<$wordCount; $i++) { 48312993035SSascha Leib array_push($sentence, $this->dadaSelectRandomWord($words, $totalWeight)); 48412993035SSascha Leib } 48512993035SSascha Leib 48612993035SSascha Leib return ucfirst(implode(' ', $sentence)) . '.'; 48712993035SSascha Leib 48812993035SSascha Leib } 48912993035SSascha Leib 49012993035SSascha Leib private function dadaSelectRandomWord($list, $totalWeight) { 49112993035SSascha Leib 49212993035SSascha Leib // get a random selection: 49312993035SSascha Leib $rand = mt_rand(0, $totalWeight); 49412993035SSascha Leib 49512993035SSascha Leib // match the selection to the weighted list: 49612993035SSascha Leib $cumulativeWeight = 0; 49712993035SSascha Leib for ($i=0; $i<count($list); $i++) { 49812993035SSascha Leib $cumulativeWeight += $list[$i][1]; 49912993035SSascha Leib if ($cumulativeWeight >= $rand) { 50012993035SSascha Leib return $list[$i][0]; 50112993035SSascha Leib } 50212993035SSascha Leib } 50312993035SSascha Leib return '***'; 504f5f4ca13SSascha Leib } 505f5f4ca13SSascha Leib 5066980370bSSascha Leib}