xref: /plugin/botmon/action.php (revision d49ab21345bfb6cded26d15d08eeffa4cb39f627)
16980370bSSascha Leib<?php
26980370bSSascha Leib
36980370bSSascha Leibuse dokuwiki\Extension\EventHandler;
46980370bSSascha Leibuse dokuwiki\Extension\Event;
55fbe88f7SSascha Leibuse dokuwiki\Logger;
66980370bSSascha Leib
76980370bSSascha Leib/**
87bd08c30SSascha Leib * Action Component for the Bot Monitoring Plugin
96980370bSSascha Leib *
106980370bSSascha Leib * @license	GPL 3 (http://www.gnu.org/licenses/gpl.html)
116980370bSSascha Leib * @author	 Sascha Leib <sascha.leib(at)kolmio.com>
126980370bSSascha Leib */
136980370bSSascha Leib
147bd08c30SSascha Leibclass action_plugin_botmon extends DokuWiki_Action_Plugin {
156980370bSSascha Leib
166980370bSSascha Leib	/**
176980370bSSascha Leib	 * Registers a callback functions
186980370bSSascha Leib	 *
196980370bSSascha Leib	 * @param EventHandler $controller DokuWiki's event controller object
206980370bSSascha Leib	 * @return void
216980370bSSascha Leib	 */
226980370bSSascha Leib	public function register(EventHandler $controller) {
235f2c1759SSascha Leib
24e56d7b71SSascha Leib		global $ACT;
25e56d7b71SSascha Leib
26*d49ab213SSascha Leib		// initialize the session id and type with random data:
27*d49ab213SSascha Leib		$this->sessionId = rand(1000000, 9999999);
28*d49ab213SSascha Leib		$this->sessionType = 'rnd';
29*d49ab213SSascha Leib
305f2c1759SSascha Leib		// insert header data into the page:
31*d49ab213SSascha Leib		if ($ACT == 'show' || $ACT == 'edit' || $ACT == 'media') {
326980370bSSascha Leib			$controller->register_hook('TPL_METAHEADER_OUTPUT', 'BEFORE', $this, 'insertHeader');
33*d49ab213SSascha Leib
34*d49ab213SSascha Leib			// Override the page rendering, if a captcha needs to be displayed:
35*d49ab213SSascha Leib			$controller->register_hook('TPL_ACT_RENDER', 'BEFORE', $this, 'showCaptcha');
36*d49ab213SSascha Leib
37e56d7b71SSascha Leib		} else if ($ACT == 'admin' && isset($_REQUEST['page']) && $_REQUEST['page'] == 'botmon') {
38e56d7b71SSascha Leib			$controller->register_hook('TPL_METAHEADER_OUTPUT', 'BEFORE', $this, 'insertAdminHeader');
39e56d7b71SSascha Leib		}
405f2c1759SSascha Leib
41*d49ab213SSascha Leib		// also show a captcha before the image preview
42*d49ab213SSascha Leib		$controller->register_hook('TPL_IMG_DISPLAY', 'BEFORE', $this, 'showImageCaptcha');
43f5f4ca13SSascha Leib
445f2c1759SSascha Leib		// write to the log after the page content was displayed:
455f2c1759SSascha Leib		$controller->register_hook('TPL_CONTENT_DISPLAY', 'AFTER', $this, 'writeServerLog');
465f2c1759SSascha Leib
476980370bSSascha Leib	}
486980370bSSascha Leib
49b148c85eSSascha Leib	/* session information */
50f6a7ebc1SSascha Leib	private $sessionId = null;
51f6a7ebc1SSascha Leib	private $sessionType = '';
522c641262SSascha Leib	private $showCaptcha = '-';
53b148c85eSSascha Leib
546980370bSSascha Leib	/**
556980370bSSascha Leib	 * Inserts tracking code to the page header
56e56d7b71SSascha Leib	 * (only called on 'show' actions)
576980370bSSascha Leib	 *
586980370bSSascha Leib	 * @param Event $event event object by reference
596980370bSSascha Leib	 * @return void
606980370bSSascha Leib	 */
616980370bSSascha Leib	public function insertHeader(Event $event, $param) {
626980370bSSascha Leib
636980370bSSascha Leib		global $INFO;
646980370bSSascha Leib
65b148c85eSSascha Leib		// populate the session id and type:
66b148c85eSSascha Leib		$this->getSessionInfo();
67b148c85eSSascha Leib
686980370bSSascha Leib		// build the tracker code:
69*d49ab213SSascha Leib		$code = $this->getBMHeader();
706980370bSSascha Leib
715f2c1759SSascha Leib		// add the deferred script loader::
72e56d7b71SSascha Leib		$code .= DOKU_TAB . DOKU_TAB . "addEventListener('DOMContentLoaded', function(){" . NL;
73e56d7b71SSascha Leib		$code .= DOKU_TAB . DOKU_TAB . DOKU_TAB . "const e=document.createElement('script');" . NL;
74e56d7b71SSascha Leib		$code .= DOKU_TAB . DOKU_TAB . DOKU_TAB . "e.async=true;e.defer=true;" . NL;
75e56d7b71SSascha Leib		$code .= DOKU_TAB . DOKU_TAB . DOKU_TAB . "e.src='".DOKU_BASE."lib/plugins/botmon/client.js';" . NL;
76e56d7b71SSascha Leib		$code .= DOKU_TAB . DOKU_TAB . DOKU_TAB . "document.getElementsByTagName('head')[0].appendChild(e);" . NL;
77e56d7b71SSascha Leib		$code .= DOKU_TAB . DOKU_TAB . "});";
785f2c1759SSascha Leib		$event->data['script'][] = ['_data' => $code];
79451abfadSSascha Leib	}
80451abfadSSascha Leib
81*d49ab213SSascha Leib	/* create the BM object code for insertion into a script element: */
82*d49ab213SSascha Leib	private function getBMHeader() {
83*d49ab213SSascha Leib
84*d49ab213SSascha Leib		// build the tracker code:
85*d49ab213SSascha Leib		$code = DOKU_TAB . DOKU_TAB . "document._botmon = {t0: Date.now(), session: " . json_encode($this->sessionId) . ", seed: " . json_encode($this->getConf('captchaSeed')) . ", ip: " . json_encode($_SERVER['REMOTE_ADDR']) . "};" . NL;
86*d49ab213SSascha Leib
87*d49ab213SSascha Leib		// is there a user logged in?
88*d49ab213SSascha Leib		$username = ( !empty($INFO['userinfo']) && !empty($INFO['userinfo']['name']) ?  $INFO['userinfo']['name'] : '');
89*d49ab213SSascha Leib		if ($username) {
90*d49ab213SSascha Leib			$code .= DOKU_TAB . DOKU_TAB . 'document._botmon.user = "' . $username . '";'. NL;
91*d49ab213SSascha Leib		}
92*d49ab213SSascha Leib
93*d49ab213SSascha Leib		return $code;
94*d49ab213SSascha Leib
95*d49ab213SSascha Leib	}
96*d49ab213SSascha Leib
97451abfadSSascha Leib	/**
98e56d7b71SSascha Leib	 * Inserts tracking code to the page header
99e56d7b71SSascha Leib	 * (only called on 'show' actions)
100e56d7b71SSascha Leib	 *
101e56d7b71SSascha Leib	 * @param Event $event event object by reference
102e56d7b71SSascha Leib	 * @return void
103e56d7b71SSascha Leib	 */
104e56d7b71SSascha Leib	public function insertAdminHeader(Event $event, $param) {
105e56d7b71SSascha Leib
106e56d7b71SSascha Leib		$event->data['link'][] = ['rel' => 'stylesheet', 'href' => DOKU_BASE.'lib/plugins/botmon/admin.css', 'defer' => 'defer'];
1070edf1a56SSascha Leib		$event->data['script'][] = ['src' => DOKU_BASE.'lib/plugins/botmon/admin.js', 'defer' => 'defer', '_data' => ''];
108e56d7b71SSascha Leib	}
109e56d7b71SSascha Leib
110e56d7b71SSascha Leib	/**
111451abfadSSascha Leib	 * Writes data to the server log.
112451abfadSSascha Leib	 *
113451abfadSSascha Leib	 * @return void
114451abfadSSascha Leib	 */
1155f2c1759SSascha Leib	public function writeServerLog(Event $event, $param) {
116451abfadSSascha Leib
117451abfadSSascha Leib		global $conf;
118451abfadSSascha Leib		global $INFO;
119091b5998SSascha Leib
1205f2c1759SSascha Leib		// is there a user logged in?
1215f2c1759SSascha Leib		$username = ( !empty($INFO['userinfo']) && !empty($INFO['userinfo']['name'])
1225f2c1759SSascha Leib					?  $INFO['userinfo']['name'] : '');
1235f2c1759SSascha Leib
124b2e3bd8bSSascha Leib		// clean the page ID
125b2e3bd8bSSascha Leib		$pageId = preg_replace('/[\x00-\x1F]/', "\u{FFFD}", $INFO['id'] ?? '');
126b2e3bd8bSSascha Leib
127451abfadSSascha Leib		// create the log array:
128cf9f7fe8SSascha Leib		$logArr = Array(
129f5f4ca13SSascha Leib			$_SERVER['REMOTE_ADDR'], /* remote IP */
130b2e3bd8bSSascha Leib			$pageId, /* page ID */
131b148c85eSSascha Leib			$this->sessionId, /* Session ID */
132b148c85eSSascha Leib			$this->sessionType, /* session ID type */
1335f2c1759SSascha Leib			$username, /* user name */
1342f2bc93aSSascha Leib			$_SERVER['HTTP_USER_AGENT'] ?? '', /* User agent */
135451abfadSSascha Leib			$_SERVER['HTTP_REFERER'] ?? '', /* HTTP Referrer */
136451abfadSSascha Leib			substr($conf['lang'],0,2), /* page language */
137a93de874SSascha Leib			implode(',', array_unique(array_map( function($it) { return substr(trim($it),0,2); }, explode(',',trim($_SERVER['HTTP_ACCEPT_LANGUAGE'], " \t;,*"))))), /* accepted client languages */
1382c641262SSascha Leib			$this->getCountryCode(), /* GeoIP country code */
139*d49ab213SSascha Leib			$this->showCaptcha /* show captcha? */
140*d49ab213SSascha Leib		);
141cf9f7fe8SSascha Leib
142cf9f7fe8SSascha Leib		//* create the log line */
1434cddc661SSascha Leib		$filename = __DIR__ .'/logs/' . gmdate('Y-m-d') . '.srv.txt'; /* use GMT date for filename */
144cf9f7fe8SSascha Leib		$logline = gmdate('Y-m-d H:i:s'); /* use GMT time for log entries */
145cf9f7fe8SSascha Leib		foreach ($logArr as $tab) {
146cf9f7fe8SSascha Leib			$logline .= "\t" . $tab;
147cf9f7fe8SSascha Leib		};
148cf9f7fe8SSascha Leib
149cf9f7fe8SSascha Leib		/* write the log line to the file */
150cf9f7fe8SSascha Leib		$logfile = fopen($filename, 'a');
151cf9f7fe8SSascha Leib		if (!$logfile) die();
152cf9f7fe8SSascha Leib		if (fwrite($logfile, $logline . "\n") === false) {
153cf9f7fe8SSascha Leib			fclose($logfile);
154cf9f7fe8SSascha Leib			die();
1556980370bSSascha Leib		}
156cf9f7fe8SSascha Leib
157cf9f7fe8SSascha Leib		/* Done */
158cf9f7fe8SSascha Leib		fclose($logfile);
159cf9f7fe8SSascha Leib	}
160b148c85eSSascha Leib
1615f2c1759SSascha Leib	private function getCountryCode() {
1625f2c1759SSascha Leib
163f5f4ca13SSascha Leib		$country = ( $_SERVER['REMOTE_ADDR'] == '127.0.0.1' ? 'local' : 'ZZ' ); // default if no geoip is available!
1645f2c1759SSascha Leib
1655f2c1759SSascha Leib		$lib = $this->getConf('geoiplib'); /* which library to use? (can only be phpgeoip or disabled) */
1665f2c1759SSascha Leib
1675f2c1759SSascha Leib		try {
1685f2c1759SSascha Leib
1695f2c1759SSascha Leib			// use GeoIP module?
1705f2c1759SSascha Leib			if ($lib == 'phpgeoip' && extension_loaded('geoip') && geoip_db_avail(GEOIP_COUNTRY_EDITION)) { // Use PHP GeoIP module
1715f2c1759SSascha Leib				$result = geoip_country_code_by_name($_SERVER['REMOTE_ADDR']);
1725f2c1759SSascha Leib				$country = ($result ? $result : $country);
1735f2c1759SSascha Leib			}
1745f2c1759SSascha Leib		} catch (Exception $e) {
1755f2c1759SSascha Leib			Logger::error('BotMon Plugin: GeoIP Error', $e->getMessage());
1765f2c1759SSascha Leib		}
1775f2c1759SSascha Leib
1785f2c1759SSascha Leib		return $country;
1795f2c1759SSascha Leib	}
1805f2c1759SSascha Leib
181b148c85eSSascha Leib	private function getSessionInfo() {
182b148c85eSSascha Leib
183b148c85eSSascha Leib		// what is the session identifier?
184b148c85eSSascha Leib		if (isset($_SESSION)) {
185b148c85eSSascha Leib			$sesKeys = array_keys($_SESSION); /* DokuWiki Session ID preferred */
186b148c85eSSascha Leib			foreach ($sesKeys as $key) {
187b148c85eSSascha Leib				if (substr($key, 0, 2) == 'DW') {
188b148c85eSSascha Leib					$this->sessionId = $key;
189b148c85eSSascha Leib					$this->sessionType = 'dw';
190b148c85eSSascha Leib					return;
191b148c85eSSascha Leib				}
192b148c85eSSascha Leib			}
193b148c85eSSascha Leib		}
194f6a7ebc1SSascha Leib		if (!$this->sessionId) { /* no DokuWiki Session ID, try PHP session ID */
195b148c85eSSascha Leib			$this->sessionId = session_id();
196b148c85eSSascha Leib			$this->sessionType = 'php';
197b148c85eSSascha Leib		}
198f5f4ca13SSascha Leib		if (!$this->sessionId) { /* no PHP session ID, try IP address */
199f5f4ca13SSascha Leib			$this->sessionId = $_SERVER['REMOTE_ADDR'];
200b148c85eSSascha Leib			$this->sessionType = 'ip';
201b148c85eSSascha Leib		}
202b148c85eSSascha Leib	}
203f5f4ca13SSascha Leib
204f5f4ca13SSascha Leib	public function showCaptcha(Event $event) {
205f5f4ca13SSascha Leib
20612993035SSascha Leib		$useCaptcha = $this->getConf('useCaptcha');
207f5f4ca13SSascha Leib
208*d49ab213SSascha Leib		$cCode = '-';
209*d49ab213SSascha Leib		if ($useCaptcha !== 'disabled') {
210*d49ab213SSascha Leib			if ($this->captchaWhitelisted()) {
211*d49ab213SSascha Leib				$cCode = 'W'; // whitelisted
212*d49ab213SSascha Leib			} elseif ($this->hasCaptchaCookie()) {
213*d49ab213SSascha Leib				$cCode  = 'N'; // user already has a cookie
214*d49ab213SSascha Leib			} else {
215*d49ab213SSascha Leib				$cCode  = 'Y'; // show the captcha
2162c641262SSascha Leib
2172c641262SSascha Leib
21812993035SSascha Leib				echo '<h1 class="sectionedit1">'; tpl_pagetitle(); echo "</h1>\n"; // always show the original page title
219f5f4ca13SSascha Leib				$event->preventDefault(); // don't show normal content
22012993035SSascha Leib				switch ($useCaptcha) {
22112993035SSascha Leib					case 'blank':
22212993035SSascha Leib						$this->insertBlankBox();  // show dada filler instead of text
22312993035SSascha Leib						break;
22412993035SSascha Leib					case 'dada':
22512993035SSascha Leib						$this->insertDadaFiller();  // show dada filler instead of text
22612993035SSascha Leib						break;
22712993035SSascha Leib				}
228f5f4ca13SSascha Leib				$this->insertCaptchaLoader(); // and load the captcha
229f5f4ca13SSascha Leib			}
230f5f4ca13SSascha Leib		}
231*d49ab213SSascha Leib		$this->showCaptcha = $cCode; // store the captcha code for the logfile
232*d49ab213SSascha Leib
233*d49ab213SSascha Leib	}
234f5f4ca13SSascha Leib
235*d49ab213SSascha Leib	public function showImageCaptcha(Event $event, $param) {
236*d49ab213SSascha Leib
237*d49ab213SSascha Leib		$useCaptcha = $this->getConf('useCaptcha');
238*d49ab213SSascha Leib
239*d49ab213SSascha Leib		echo '<script>' . $this->getBMHeader($event, $param) . '</script>';
240*d49ab213SSascha Leib
241*d49ab213SSascha Leib		$cCode = '-';
242*d49ab213SSascha Leib		if ($useCaptcha !== 'disabled') {
243*d49ab213SSascha Leib			if ($this->captchaWhitelisted()) {
244*d49ab213SSascha Leib				$cCode = 'W'; // whitelisted
245*d49ab213SSascha Leib			}
246*d49ab213SSascha Leib			elseif ($this->hasCaptchaCookie()) {
247*d49ab213SSascha Leib				$cCode  = 'N'; // user already has a cookie
248*d49ab213SSascha Leib			}
249*d49ab213SSascha Leib			else {
250*d49ab213SSascha Leib				$cCode  = 'Y'; // show the captcha
251*d49ab213SSascha Leib
252*d49ab213SSascha Leib				echo '<svg width="100%" height="100%" viewBox="0 0 800 400" version="1.1" xmlns="http://www.w3.org/2000/svg"><path d="M1,1l798,398" style="fill:none;stroke:#f00;stroke-width:1px;"/><path d="M1,399l798,-398" style="fill:none;stroke:#f00;stroke-width:1px;"/><rect x="1" y="1" width="798" height="398" style="fill:none;stroke:#000;stroke-width:1px;"/></svg>'; // placeholder image
253*d49ab213SSascha Leib				$event->preventDefault(); // don't show normal content
254*d49ab213SSascha Leib
255*d49ab213SSascha Leib				// TODO Insert dummy image
256*d49ab213SSascha Leib				$this->insertCaptchaLoader(); // and load the captcha
257*d49ab213SSascha Leib			}
258*d49ab213SSascha Leib		};
259*d49ab213SSascha Leib
260*d49ab213SSascha Leib		$this->showCaptcha = $cCode; // store the captcha code for the logfile
261*d49ab213SSascha Leib	}
262*d49ab213SSascha Leib
263*d49ab213SSascha Leib	private function hasCaptchaCookie() {
264f5f4ca13SSascha Leib
265cdc02cd4SSascha Leib		$cookieVal = isset($_COOKIE['DWConfirm']) ? $_COOKIE['DWConfirm'] : null;
266f5f4ca13SSascha Leib
267cdc02cd4SSascha Leib		$today = substr((new DateTime())->format('c'), 0, 10);
26812993035SSascha Leib
269cdc02cd4SSascha Leib		$raw = $this->getConf('captchaSeed') . '|' . $_SERVER['SERVER_NAME'] . '|' . $_SERVER['REMOTE_ADDR'] . '|' . $today;
270cdc02cd4SSascha Leib		$expected = hash('sha256', $raw);
27112993035SSascha Leib
272cdc02cd4SSascha Leib		//echo '<ul><li>cookie: ' . $cookieVal . '</li><li>expected: ' . $expected . '</li><li>matches: ' .($cookieVal == $expected ? 'true' : 'false') . '</li></ul>';
273cdc02cd4SSascha Leib
274*d49ab213SSascha Leib		return $cookieVal == $expected;
275f5f4ca13SSascha Leib	}
276f5f4ca13SSascha Leib
2772c641262SSascha Leib	// check if the visitor's IP is on a whitelist:
2782c641262SSascha Leib	private function captchaWhitelisted() {
2792c641262SSascha Leib
2802c641262SSascha Leib		// normalise IP address:
2812c641262SSascha Leib		$ip = inet_pton($_SERVER['REMOTE_ADDR']);
2822c641262SSascha Leib
2832c641262SSascha Leib		// find which file to open:
2842c641262SSascha Leib		$prefixes = ['user', 'default'];
2852c641262SSascha Leib		foreach ($prefixes as $pre) {
2862c641262SSascha Leib			$filename = __DIR__ .'/config/' . $pre . '-whitelist.txt';
2872c641262SSascha Leib			if (file_exists($filename)) {
2882c641262SSascha Leib				break;
2892c641262SSascha Leib			}
2902c641262SSascha Leib		}
2912c641262SSascha Leib
2922c641262SSascha Leib		if (file_exists($filename)) {
2932c641262SSascha Leib			$lines = file($filename, FILE_SKIP_EMPTY_LINES);
2942c641262SSascha Leib			foreach ($lines as $line) {
2952c641262SSascha Leib				if (trim($line) !== '' && !str_starts_with($line, '#')) {
2962c641262SSascha Leib					$col = explode("\t", $line);
2972c641262SSascha Leib					if (count($col) >= 2) {
2982c641262SSascha Leib						$from = inet_pton($col[0]);
2992c641262SSascha Leib						$to = inet_pton($col[1]);
3002c641262SSascha Leib
3012c641262SSascha Leib						if ($ip >= $from && $ip <= $to) {
302*d49ab213SSascha Leib							return true; /* IP whitelisted */
3032c641262SSascha Leib						}
3042c641262SSascha Leib					}
3052c641262SSascha Leib				}
3062c641262SSascha Leib			}
3072c641262SSascha Leib		}
308*d49ab213SSascha Leib		return false; /* IP not found in whitelist */
3092c641262SSascha Leib	}
3102c641262SSascha Leib
311f5f4ca13SSascha Leib	private function insertCaptchaLoader() {
31212993035SSascha Leib		echo '<script>' . NL;
31312993035SSascha Leib
31412993035SSascha Leib		// add the deferred script loader::
31512993035SSascha Leib		echo  DOKU_TAB . "addEventListener('DOMContentLoaded', function(){" . NL;
31612993035SSascha Leib		echo  DOKU_TAB . DOKU_TAB . "const cj=document.createElement('script');" . NL;
31712993035SSascha Leib		echo  DOKU_TAB . DOKU_TAB . "cj.async=true;cj.defer=true;cj.type='text/javascript';" . NL;
31812993035SSascha Leib		echo  DOKU_TAB . DOKU_TAB . "cj.src='".DOKU_BASE."lib/plugins/botmon/captcha.js';" . NL;
31912993035SSascha Leib		echo  DOKU_TAB . DOKU_TAB . "document.getElementsByTagName('head')[0].appendChild(cj);" . NL;
32012993035SSascha Leib		echo  DOKU_TAB . "});";
32112993035SSascha Leib		echo '</script>' . NL;
322f5f4ca13SSascha Leib
323f5f4ca13SSascha Leib	}
324f5f4ca13SSascha Leib
32512993035SSascha Leib	// inserts a blank box to ensure there is enough space for the captcha:
32612993035SSascha Leib	private function insertBlankBox() {
32712993035SSascha Leib
32812993035SSascha Leib		echo '<p style="min-height: 100px;">&nbsp;</p>';
32912993035SSascha Leib	}
33012993035SSascha Leib
33112993035SSascha Leib	/* Generates a few paragraphs of Dada text to show instead of the article content */
332f5f4ca13SSascha Leib	private function insertDadaFiller() {
333f5f4ca13SSascha Leib
33412993035SSascha Leib		global $conf;
33512993035SSascha Leib		global $TOC;
33612993035SSascha Leib		global $ID;
337f5f4ca13SSascha Leib
33812993035SSascha Leib		// list of languages to search for the wordlist
33912993035SSascha Leib		$langs = array_unique([$conf['lang'], 'la']);
340f5f4ca13SSascha Leib
34112993035SSascha Leib		// find path to the first available wordlist:
34212993035SSascha Leib		foreach ($langs as $lang) {
34312993035SSascha Leib			$filename = __DIR__ .'/lang/' . $lang . '/wordlist.txt'; /* language-specific wordlist */
34412993035SSascha Leib			if (file_exists($filename)) {
34512993035SSascha Leib				break;
34612993035SSascha Leib			}
34712993035SSascha Leib		}
348f5f4ca13SSascha Leib
34912993035SSascha Leib		// load the wordlist file:
35012993035SSascha Leib		if (file_exists($filename)) {
35112993035SSascha Leib			$words = array();
35212993035SSascha Leib			$totalWeight = 0;
35312993035SSascha Leib			$lines = file($filename, FILE_SKIP_EMPTY_LINES);
35412993035SSascha Leib			foreach ($lines as $line) {
35512993035SSascha Leib				$arr = explode("\t", $line);
35612993035SSascha Leib				$arr[1] = ( count($arr) > 1 ? (int) trim($arr[1]) : 1 );
35712993035SSascha Leib				$totalWeight += (int) $arr[1];
35812993035SSascha Leib				array_push($words, $arr);
35912993035SSascha Leib			}
36012993035SSascha Leib		} else {
36112993035SSascha Leib			echo '<script> console.log("Can’t generate filler text: wordlist file not found!"); </script>';
36212993035SSascha Leib			return;
36312993035SSascha Leib		}
364f5f4ca13SSascha Leib
36512993035SSascha Leib		// If a TOC exists, use it for the headlines:
36612993035SSascha Leib		if(is_array($TOC)) {
36712993035SSascha Leib			$toc = $TOC;
36812993035SSascha Leib		} else {
36912993035SSascha Leib			$meta = p_get_metadata($ID, '', METADATA_RENDER_USING_CACHE);
37012993035SSascha Leib			//$tocok = (isset($meta['internal']['toc']) ? $meta['internal']['toc'] : $tocok = true);
37112993035SSascha Leib			$toc = isset($meta['description']['tableofcontents']) ? $meta['description']['tableofcontents'] : null;
37212993035SSascha Leib		}
37312993035SSascha Leib		if (!$toc) { // no TOC, generate my own:
37412993035SSascha Leib			$hlCount = mt_rand(0, (int) $conf['tocminheads']);
37512993035SSascha Leib			$toc = array();
37612993035SSascha Leib			for ($i=0; $i<$hlCount; $i++) {
37712993035SSascha Leib				array_push($toc, $this->dadaMakeHeadline($words, $totalWeight)); // $toc
37812993035SSascha Leib			}
37912993035SSascha Leib		}
38012993035SSascha Leib
38112993035SSascha Leib		// if H1 heading is not in the TOC, add a chappeau section:
38212993035SSascha Leib		$chapeauCount = mt_rand(1, 3);
38312993035SSascha Leib		if ((int) $conf['toptoclevel'] > 1) {
38412993035SSascha Leib			echo "<div class=\"level1\">\n";
38512993035SSascha Leib			for ($i=0; $i<$chapeauCount; $i++) {
38612993035SSascha Leib				echo $this->dadaMakeParagraph($words, $totalWeight);
38712993035SSascha Leib			}
38812993035SSascha Leib			echo "</div>\n";
38912993035SSascha Leib		}
39012993035SSascha Leib
39112993035SSascha Leib		//  text sections for each sub-headline:
39212993035SSascha Leib		foreach ($toc as $hl) {
39312993035SSascha Leib			echo $this->dadaMakeSection($words, $totalWeight, $hl);
39412993035SSascha Leib		}
39512993035SSascha Leib	}
39612993035SSascha Leib
39712993035SSascha Leib	private function dadaMakeSection($words, $totalWeight, $hl) {
39812993035SSascha Leib
39912993035SSascha Leib		global $conf;
40012993035SSascha Leib
40112993035SSascha Leib		// how many paragraphs?
40212993035SSascha Leib		$paragraphCount = mt_rand(1, 4);
40312993035SSascha Leib
40412993035SSascha Leib		// section level
40512993035SSascha Leib		$topTocLevel = (int) $conf['toptoclevel'];
40612993035SSascha Leib		$secLevel = $hl['level'] + 1;;
40712993035SSascha Leib
40812993035SSascha Leib		// return value:
40912993035SSascha Leib		$sec = "";
41012993035SSascha Leib
41112993035SSascha Leib		// make a headline:
41212993035SSascha Leib		if ($topTocLevel > 1 || $secLevel > 1) {
41312993035SSascha Leib			$sec .= "<h{$secLevel} id=\"{$hl['hid']}\">{$hl['title']}</h{$secLevel}>\n";
41412993035SSascha Leib		}
41512993035SSascha Leib
41612993035SSascha Leib		// add the paragraphs:
41712993035SSascha Leib		$sec .= "<div class=\"level{$secLevel}\">\n";
41812993035SSascha Leib		for ($i=0; $i<$paragraphCount; $i++) {
41912993035SSascha Leib			$sec .= $this->dadaMakeParagraph($words, $totalWeight);
42012993035SSascha Leib		}
42112993035SSascha Leib		$sec .= "</div>\n";
42212993035SSascha Leib
42312993035SSascha Leib		return $sec;
42412993035SSascha Leib	}
42512993035SSascha Leib
42612993035SSascha Leib	private function dadaMakeHeadline($words, $totalWeight) {
42712993035SSascha Leib
42812993035SSascha Leib		// how many words to generate?
42912993035SSascha Leib		$wordCount = mt_rand(2, 5);
43012993035SSascha Leib
43112993035SSascha Leib		// function returns an array:
43212993035SSascha Leib		$r = Array();
43312993035SSascha Leib
43412993035SSascha Leib		// generate the headline:
43512993035SSascha Leib		$hlArr = array();
43612993035SSascha Leib		for ($i=0; $i<$wordCount; $i++) {
43712993035SSascha Leib			array_push($hlArr, $this->dadaSelectRandomWord($words, $totalWeight));
43812993035SSascha Leib		}
43912993035SSascha Leib
44012993035SSascha Leib		$r['title'] =  ucfirst(implode(' ', $hlArr));
44112993035SSascha Leib
44212993035SSascha Leib		$r['hid'] = preg_replace('/[^\w\d\-]+/i', '_', strtolower($r['title']));
44312993035SSascha Leib		$r['type'] = 'ul'; // always ul!
44412993035SSascha Leib		$r['level'] = 1; // always level 1 for now
44512993035SSascha Leib
44612993035SSascha Leib		return $r;
44712993035SSascha Leib	}
44812993035SSascha Leib
44912993035SSascha Leib	private function dadaMakeParagraph($words, $totalWeight) {
45012993035SSascha Leib
45112993035SSascha Leib		// how many words to generate?
45212993035SSascha Leib		$sentenceCount = mt_rand(2, 5);
45312993035SSascha Leib
45412993035SSascha Leib		$paragraph = array();
45512993035SSascha Leib		for ($i=0; $i<$sentenceCount; $i++) {
45612993035SSascha Leib			array_push($paragraph, $this->dadaMakeSentence($words, $totalWeight));
45712993035SSascha Leib		}
45812993035SSascha Leib
45912993035SSascha Leib		return "<p>\n" . implode(' ', $paragraph) . "\n</p>\n";
46012993035SSascha Leib
46112993035SSascha Leib	}
46212993035SSascha Leib
46312993035SSascha Leib	private function dadaMakeSentence($words, $totalWeight) {
46412993035SSascha Leib
46512993035SSascha Leib		// how many words to generate?
46612993035SSascha Leib		$wordCount = mt_rand(4, 20);
46712993035SSascha Leib
46812993035SSascha Leib		// generate the sentence:
46912993035SSascha Leib		$sentence = array();
47012993035SSascha Leib		for ($i=0; $i<$wordCount; $i++) {
47112993035SSascha Leib			array_push($sentence, $this->dadaSelectRandomWord($words, $totalWeight));
47212993035SSascha Leib		}
47312993035SSascha Leib
47412993035SSascha Leib		return ucfirst(implode(' ', $sentence)) . '.';
47512993035SSascha Leib
47612993035SSascha Leib	}
47712993035SSascha Leib
47812993035SSascha Leib	private function dadaSelectRandomWord($list, $totalWeight) {
47912993035SSascha Leib
48012993035SSascha Leib		// get a random selection:
48112993035SSascha Leib		$rand = mt_rand(0, $totalWeight);
48212993035SSascha Leib
48312993035SSascha Leib		// match the selection to the weighted list:
48412993035SSascha Leib		$cumulativeWeight = 0;
48512993035SSascha Leib		for ($i=0; $i<count($list); $i++) {
48612993035SSascha Leib			$cumulativeWeight += $list[$i][1];
48712993035SSascha Leib			if ($cumulativeWeight >= $rand) {
48812993035SSascha Leib				return $list[$i][0];
48912993035SSascha Leib			}
49012993035SSascha Leib		}
49112993035SSascha Leib		return '***';
492f5f4ca13SSascha Leib	}
493f5f4ca13SSascha Leib
4946980370bSSascha Leib}