<?php

namespace dokuwiki\Utf8;

/**
 * DokuWiki sort functions
 *
 * When the "intl" extension is available, all sorts are done using a collator.
 * Otherwise, primitive PHP functions are called.
 *
 * The collator is created using the locale given in $conf['lang'].
 * It always uses case insensitive "natural" ordering in its collation.
 * The fallback solution uses the primitive PHP functions that return almost the same results
 * when the input is text with only [A-Za-z0-9] characters.
 *
 * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
 * @author     Moisés Braga Ribeiro <moisesbr@gmail.com>
 * @author     Andreas Gohr <andi@splitbrain.org>
 */
class Sort
{
    /** @var \Collator[] language specific collators, usually only one */
    protected static $collators = [];

    /** @var bool should the intl extension be used if available? For testing only */
    protected static $useIntl = true;

    /**
     * Initialization of a collator using $conf['lang'] as the locale.
     * The initialization is done only once per locale; the instance is cached in self::$collators.
     * The collation takes "natural ordering" into account, that is, "page 2" is before "page 10".
     *
     * @return \Collator|null Returns a configured collator, or null if the intl collator is disabled,
     *                        unavailable or cannot be created.
     *
     * @author Moisés Braga Ribeiro <moisesbr@gmail.com>
     */
    protected static function getCollator()
    {
        global $conf;
        $lc = $conf['lang'];

        // check if intl extension is available (and not switched off through useIntl())
        if (!self::$useIntl || !class_exists('\Collator')) {
            return null;
        }

        // load collator if not available yet
        if (!isset(self::$collators[$lc])) {
            $collator = \Collator::create($lc);
            if (!isset($collator)) return null; // check needed as stated in the docs
            // numeric collation is what makes "page 2" sort before "page 10"
            $collator->setAttribute(\Collator::NUMERIC_COLLATION, \Collator::ON);
            dbglog('Collator created with locale "' . $lc . '": numeric collation on, ' .
                'valid locale "' . $collator->getLocale(\Locale::VALID_LOCALE) . '", ' .
                'actual locale "' . $collator->getLocale(\Locale::ACTUAL_LOCALE) . '"');
            self::$collators[$lc] = $collator;
        }

        return self::$collators[$lc];
    }

    /**
     * Compare two strings with the given collator, always yielding an integer.
     *
     * Collator::compare() is documented to return false on failure (e.g. when an argument
     * cannot be converted for collation). A boolean must neither be returned from strcmp()
     * nor from a sort callback, so strnatcasecmp() is used whenever the collator is missing
     * or reports a failure.
     *
     * @param \Collator|null $collator The collator to use, or null to use the fallback directly.
     * @param string $str1 The first string.
     * @param string $str2 The second string.
     * @return int Returns < 0 if $str1 is less than $str2; > 0 if $str1 is greater than $str2, and 0 if they are equal.
     */
    protected static function compareUsing($collator, $str1, $str2)
    {
        if ($collator !== null) {
            $result = $collator->compare($str1, $str2);
            if ($result !== false) {
                return $result;
            }
        }

        return strnatcasecmp($str1, $str2);
    }

    /**
     * Enable or disable the use of the "intl" extension collator.
     * This is used for testing and should not be used in normal code.
     *
     * @param bool $use
     *
     * @author Andreas Gohr <andi@splitbrain.org>
     */
    public static function useIntl($use = true)
    {
        self::$useIntl = $use;
    }

    /**
     * Drop-in replacement for strcmp(), strcasecmp(), strnatcmp() and strnatcasecmp().
     * It uses a collator-based comparison, or strnatcasecmp() as a fallback.
     * The fallback is also used when the collator itself fails to compare the two strings.
     *
     * @param string $str1 The first string.
     * @param string $str2 The second string.
     * @return int Returns < 0 if $str1 is less than $str2; > 0 if $str1 is greater than $str2, and 0 if they are equal.
     *
     * @author Moisés Braga Ribeiro <moisesbr@gmail.com>
     */
    public static function strcmp($str1, $str2)
    {
        return self::compareUsing(self::getCollator(), $str1, $str2);
    }

    /**
     * Drop-in replacement for sort().
     * It uses a collator-based sort, or sort() with flags SORT_NATURAL and SORT_FLAG_CASE as a fallback.
     *
     * @param array $array The input array.
     * @return bool Returns true on success or false on failure.
     *
     * @author Moisés Braga Ribeiro <moisesbr@gmail.com>
     */
    public static function sort(&$array)
    {
        $collator = self::getCollator();
        if (isset($collator)) {
            return $collator->sort($array);
        } else {
            return sort($array, SORT_NATURAL | SORT_FLAG_CASE);
        }
    }

    /**
     * Drop-in replacement for ksort().
     * It uses a collator-based sort, or ksort() with flags SORT_NATURAL and SORT_FLAG_CASE as a fallback.
     *
     * @param array $array The input array.
     * @return bool Returns true on success or false on failure.
     *
     * @author Moisés Braga Ribeiro <moisesbr@gmail.com>
     */
    public static function ksort(&$array)
    {
        $collator = self::getCollator();
        if (isset($collator)) {
            // the collator has no key sort of its own, so compare the keys through a callback
            // that is guaranteed to return an integer
            return uksort($array, static function ($key1, $key2) use ($collator) {
                return self::compareUsing($collator, $key1, $key2);
            });
        } else {
            return ksort($array, SORT_NATURAL | SORT_FLAG_CASE);
        }
    }

    /**
     * Drop-in replacement for asort(), natsort() and natcasesort().
     * It uses a collator-based sort, or asort() with flags SORT_NATURAL and SORT_FLAG_CASE as a fallback.
     *
     * @param array $array The input array.
     * @return bool Returns true on success or false on failure.
     *
     * @author Moisés Braga Ribeiro <moisesbr@gmail.com>
     */
    public static function asort(&$array)
    {
        $collator = self::getCollator();
        if (isset($collator)) {
            return $collator->asort($array);
        } else {
            return asort($array, SORT_NATURAL | SORT_FLAG_CASE);
        }
    }

    /**
     * Drop-in replacement for asort(), natsort() and natcasesort() when the parameter is an array of filenames.
     * Filenames may not be equal to page names, depending on the setting in $conf['fnencode'],
     * so the correct behavior is to sort page names and reflect this sorting in the filename array.
     *
     * Each filename is passed through utf8_decodeFN() before it is compared; the array itself
     * keeps its original (encoded) values and its keys.
     *
     * @param array $array The input array.
     * @return bool Returns true on success or false on failure.
     *
     * @author Moisés Braga Ribeiro <moisesbr@gmail.com>
     * @author Andreas Gohr <andi@splitbrain.org>
     */
    public static function asortFN(&$array)
    {
        // look the collator up once instead of once per comparison
        $collator = self::getCollator();

        return uasort($array, static function ($fn1, $fn2) use ($collator) {
            return self::compareUsing($collator, utf8_decodeFN($fn1), utf8_decodeFN($fn2));
        });
    }
}