combo/ComboStrap/StringUtility.php

37748cd8SNickeau<?php
37748cd8SNickeau
37748cd8SNickeaunamespace ComboStrap;
37748cd8SNickeau
/**
 * Class StringUtility
 * @package ComboStrap
 *
 * A collection of static, byte-oriented string helpers
 * (truncation, trimming of a given prefix/suffix, word counting, normalization for comparison, ...)
 */
class StringUtility
{

    /**
     * The suffix appended by {@link StringUtility::truncateString()} when the text is cut
     */
    const TRUNCATE_SUFFIX = ' ...';

    /**
     * Generate a text with a max length of $length (in bytes)
     * and add ` ...` at the end if the text was above this length
     *
     * When $length is too small to hold the suffix, the text is simply cut at $length
     * (without suffix) in order to never return more than $length bytes.
     *
     * @param string $myString - the text to truncate
     * @param int $length - the maximal length in bytes
     * @return string
     */
    public static function truncateString($myString, $length): string
    {

        if (strlen($myString) <= $length) {
            return $myString;
        }

        // The historical formula (one byte less than the maximum) is kept for backward compatibility
        $keptLength = ($length - 1) - strlen(self::TRUNCATE_SUFFIX);
        if ($keptLength < 0) {
            // A negative length would be interpreted by substr as `count from the end`
            // and may return a string longer than the original one
            return self::cutBytes($myString, max(0, (int)$length));
        }
        return self::cutBytes($myString, $keptLength) . self::TRUNCATE_SUFFIX;

    }

    /**
     * Return the first $byteLength bytes of the string without
     * cutting a multi-byte UTF-8 character in the middle (when the mbstring extension is available)
     *
     * @param string $string
     * @param int $byteLength - a positive number of bytes
     * @return string
     */
    private static function cutBytes($string, $byteLength): string
    {
        if ($byteLength <= 0) {
            return '';
        }
        if (function_exists('mb_strcut')) {
            return mb_strcut($string, 0, $byteLength, 'UTF-8');
        }
        return (string)substr($string, 0, $byteLength);
    }

    /**
     * @param $string
     * @return string - the string without any line feed character (`\n`)
     * Used to compare strings without worrying about the end of line
     */
    public static function normalized($string)
    {
        return str_replace("\n", "", $string);
    }

    /**
     * Test if the needle is present in the haystack
     * @param $needle - the searched string
     * @param $haystack - the string to search in
     * @return bool - true if the needle was found
     */
    public static function contain($needle, $haystack)
    {
        return strpos($haystack, $needle) !== false;
    }

    /**
     * Return a string representation of a value
     * @param mixed $value
     * @return string - the value itself if it's already a string, otherwise its `var_export` representation
     */
    public static function toString($value)
    {
        /**
         * No transformation if it's a string
         * var_export below is not idempotent
         * ie \ would become \\
         */
        if (is_string($value)) {
            return $value;
        }

        $exported = var_export($value, true);

        // Delete the enclosing single quotes if var_export has added them
        $lastCharacterIndex = strlen($exported) - 1;
        if ($exported[0] === "'" && $exported[$lastCharacterIndex] === "'") {
            $exported = substr($exported, 1, strlen($exported) - 2);
        }
        return $exported;

    }

    /**
     * Add an EOL ({@link DOKU_LF}) if not present at the end of the string
     * @param string $doc - the document, modified in place
     */
    public static function addEolCharacterIfNotPresent(&$doc)
    {
        // substr and not an offset access because an offset access
        // on an empty string raises a warning
        if (substr($doc, -1) !== DOKU_LF) {
            $doc .= DOKU_LF;
        }
    }

    /**
     * Delete the string from the end
     * This is used generally to delete the previous opening tag of an header or a blockquote
     *
     * Note that the document is always trimmed, even if the string was not found at the end
     *
     * @param string $doc - the document, modified in place
     * @param string $string - the string to delete from the end
     */
    public static function rtrim(&$doc, $string)
    {

        /**
         * We trim because in the process, we may get extra {@link DOKU_LF} at the end
         */
        $doc = trim($doc);
        $string = trim($string);
        $suffixStart = strlen($doc) - strlen($string);
        if (substr($doc, $suffixStart) === $string) {
            $doc = substr($doc, 0, $suffixStart);
        }

    }

    /**
     * Delete the string from the beginning
     * This is used to delete a tag for instance
     *
     * Note that the document is always trimmed, even if the string was not found at the beginning
     *
     * @param string $doc - the document, modified in place
     * @param string $string - the string to delete from the beginning
     */
    public static function ltrim(&$doc, $string)
    {

        $doc = trim($doc);
        $string = trim($string);
        $prefixLength = strlen($string);
        if (substr($doc, 0, $prefixLength) === $string) {
            $doc = substr($doc, $prefixLength);
        }

    }

    /**
     * The word count does not take into account
     * words with non-words characters such as < =
     * Therefore the node <node> and attribute name=value are not taken in the count
     * @param $text
     * @return int the number of words
     */
    public static function getWordCount($text)
    {
        /**
         * Delete the frontmatter
         */
        $text = preg_replace("/^---(json)?$.*^---$/Ums", "", $text);
        /**
         * New line for node
         * (to separate a node from the words next to it)
         */
        $text = str_replace("<", "\n<", $text);
        $text = str_replace(">", ">\n", $text);
        // \s shorthand for whitespace
        // | the table and links are separated with a |
        // / to take into account expression such as and/or
        // /u for unicode support (https://www.php.net/manual/en/reference.pcre.pattern.modifiers.php)
        $wordSeparator = '/[\s|\/]/u';
        $tokens = preg_split($wordSeparator, $text);
        // An array callable and not the string `self::isWord`
        // because this string form is deprecated since PHP 8.2
        $words = array_filter($tokens, [self::class, 'isWord']);
        return count($words);
    }

    /**
     * Normalize a text for comparison:
     * every run of whitespace characters (space, tab, end of line, ...)
     * is replaced by one single space and the result is trimmed
     *
     * @param string $expected
     * @return string
     */
    public static function normalize($expected)
    {
        // One pass: a run of any length collapses to a single space
        $expected = preg_replace('/\s+/', ' ', $expected);
        return trim($expected);

    }

    /**
     * @param $text
     * @return bool - true if the text is made only of word characters (and of the extra characters allowed below)
     */
    public static function isWord($text)
    {
        /**
         * An explicit test and not `empty`
         * because `empty` is true for the string `0` that is a valid word
         */
        if ($text === null || $text === false || $text === '') {
            return false;
        }
        /**
         * We also allow `-` minus
         *
         * And because otherwise the words are not counted:
         *   * `'` (used to highlight words)
         *   * `[]` used in links
         *   * `,` used at the end of a sentence
         */
        $preg_match = preg_match("/^[\w\-'\]\[,]*$/u", $text);
        return $preg_match == 1;
    }

    /**
     * Test if the subject matches a regular expression
     *
     * @param string $subject
     * @param string $pattern - a PCRE pattern without delimiters. It is enclosed as-is between `/`;
     *                          a `/` inside the pattern must therefore be escaped by the caller
     * @return bool
     */
    public static function match($subject, $pattern)
    {
        return preg_match("/$pattern/", $subject) === 1;
    }

    /**
     * Test if the string ends with the suffix
     * (The name is kept for backward compatibility)
     *
     * @param string $string
     * @param string $suffix
     * @return bool
     */
    public static function endWiths($string, $suffix)
    {
        // The last occurrence of the suffix must start exactly where a suffix would start
        $suffixStartPosition = strlen($string) - strlen($suffix);
        return strrpos($string, $suffix) === $suffixStartPosition;
    }

    /**
     * Split a string on a delimiter and trim each part
     *
     * @param string $string
     * @param string $delimiter
     * @return string[]
     */
    public static function explodeAndTrim($string, $delimiter = ",")
    {
        return array_map('trim', explode($delimiter, $string));
    }

    /**
     * @param string $haystack
     * @param string $needle
     * @return int|false - the position of the last occurrence of the needle or false if not found
     */
    public static function lastIndexOf($haystack, $needle)
    {
        /**
         * strRpos
         * and not strpos
         */
        return strrpos($haystack, $needle);
    }

    /**
     * Test if the string starts with the prefix
     * (The name is kept for backward compatibility)
     *
     * @param string $string
     * @param string $prefix
     * @return bool
     */
    public static function startWiths($string, $prefix)
    {
        /**
         * A comparison of the first bytes and not strrpos:
         * strrpos returns the position of the LAST occurrence and
         * would return false when the prefix is also present later in the string
         */
        return strncmp($string, $prefix, strlen($prefix)) === 0;
    }

}