= 0 && \mb_strpos($haystack, $needle, $temp) !== false)) { return true; } } return false; }

    /**
     * Makes first letter of a multi byte string upper case.
     *
     * Only the first character is converted, the remainder is appended untouched.
     * An empty string results in an empty string.
     *
     * @param string $string string to upper case first letter
     *
     * @return string multi byte string with first character as upper case
     *
     * @since 1.0.0
     */
    public static function mb_ucfirst(string $string) : string
    {
        // Omitting the length makes mb_substr() return everything from the second character on.
        return \mb_strtoupper(\mb_substr($string, 0, 1)) . \mb_substr($string, 1);
    }

    /**
     * Makes first letter of a multi byte string lower case.
     *
     * Only the first character is converted, the remainder is appended untouched.
     * An empty string results in an empty string.
     *
     * @param string $string string to lower case first letter
     *
     * @return string multi byte string with first character as lower case
     *
     * @since 1.0.0
     */
    public static function mb_lcfirst(string $string) : string
    {
        // Omitting the length makes mb_substr() return everything from the second character on.
        return \mb_strtolower(\mb_substr($string, 0, 1)) . \mb_substr($string, 1);
    }

    /**
     * Trim multi byte characters from a multi byte string.
     *
     * With the default character list the call is delegated to trim() and therefore
     * strips trim()'s default character set. For any other list exactly the listed
     * characters are stripped from both ends of the string.
     *
     * @param string $string   multi byte string to trim multi byte characters from
     * @param string $charlist Multi byte character list used for trimming (an empty list leaves the string untouched)
     *
     * @return string trimmed multi byte string (empty string if the regular expression fails, e.g. on invalid UTF-8)
     *
     * @since 1.0.0
     */
    public static function mb_trim(string $string, string $charlist = ' ') : string
    {
        if ($charlist === ' ') {
            return \trim($string);
        }

        // Nothing to strip. An empty list would also produce a mis-parsed character class.
        if ($charlist === '') {
            return $string;
        }

        // The same class is used on both sides so that leading and trailing trimming agree.
        $class = '[' . \preg_quote($charlist, '/') . ']+';

        // \A and \z anchor at the absolute start/end; "$" would also match in front of a trailing newline.
        return \preg_replace('/\A' . $class . '|' . $class . '\z/us', '', $string) ?? '';
    }

    /**
     * Trim multi byte characters from the right of a multi byte string.
*
     * With the default character list the call is delegated to rtrim(). For any other
     * list exactly the listed characters are stripped from the very end of the string.
     *
     * @param string $string   multi byte string to trim multi byte characters from
     * @param string $charlist Multi byte character list used for trimming (an empty list leaves the string untouched)
     *
     * @return string trimmed multi byte string (empty string if the regular expression fails, e.g. on invalid UTF-8)
     *
     * @since 1.0.0
     */
    public static function mb_rtrim(string $string, string $charlist = ' ') : string
    {
        if ($charlist === ' ') {
            return \rtrim($string);
        }

        // Nothing to strip. An empty list would build an unterminated character class.
        if ($charlist === '') {
            return $string;
        }

        // \z anchors at the absolute end; "$" would also match in front of a trailing newline.
        return \preg_replace('/[' . \preg_quote($charlist, '/') . ']+\z/us', '', $string) ?? '';
    }

    /**
     * Trim multi byte characters from the left of a multi byte string.
     *
     * With the default character list the call is delegated to ltrim(). For any other
     * list exactly the listed characters are stripped from the start of the string.
     *
     * @param string $string   multi byte string to trim multi byte characters from
     * @param string $charlist Multi byte character list used for trimming (an empty list leaves the string untouched)
     *
     * @return string trimmed multi byte string (empty string if the regular expression fails, e.g. on invalid UTF-8)
     *
     * @since 1.0.0
     */
    public static function mb_ltrim(string $string, string $charlist = ' ') : string
    {
        if ($charlist === ' ') {
            return \ltrim($string);
        }

        // Nothing to strip. An empty list would build an unterminated character class.
        if ($charlist === '') {
            return $string;
        }

        return \preg_replace('/\A[' . \preg_quote($charlist, '/') . ']+/us', '', $string) ?? '';
    }

    /**
     * Calculate string entropy
     *
     * Sums -p * log2(p) over the relative frequency p of every distinct character
     * reported by mb_count_chars(). An empty string has an entropy of 0.0.
     *
     * @param string $value string to analyze
     *
     * @return float
     *
     * @since 1.0.0
     */
    public static function mb_entropy(string $value) : float
    {
        $countChars = self::mb_count_chars($value);

        // The total is taken from the counts themselves so the frequencies always add up to 1,
        // independent of the configured internal mbstring encoding.
        $size    = \array_sum($countChars);
        $log2    = \log(2);
        $entropy = 0.0;

        foreach ($countChars as $v) {
            $p        = $v / $size;
            $entropy -= $p * \log($p) / $log2;
        }

        return $entropy;
    }

    /**
     * Count chars of utf-8 string.
*
     * @param string $input string to count chars
     *
     * @return array number of occurrences indexed by character, in order of first appearance
     *
     * @since 1.0.0
     */
    public static function mb_count_chars(string $input) : array
    {
        $counts = [];
        $length = \mb_strlen($input, 'UTF-8');

        for ($index = 0; $index < $length; ++$index) {
            $symbol          = \mb_substr($input, $index, 1, 'UTF-8');
            $counts[$symbol] = ($counts[$symbol] ?? 0) + 1;
        }

        return $counts;
    }

    /**
     * Find the utf-8 character boundary in front of an offset
     *
     * Looks for a "=" followed by two hex digits within the bytes directly in front of
     * the offset and moves the offset back so it does not end up inside such a sequence.
     * NOTE(review): this looks like it expects quoted-printable encoded text - confirm against callers.
     *
     * @param string $text   To search for utf-8 boundary
     * @param int    $offset Search offset
     *
     * @return int adjusted offset
     *
     * @since 1.0.0
     */
    public static function utf8CharBoundary(string $text, int $offset = 0) : int
    {
        $lookBack = 3;
        $boundary = $offset;

        while (true) {
            $start  = $boundary - $lookBack;
            $tail   = \substr($text, $start, $lookBack);
            $marker = \strpos($tail, '=');

            // No encoded byte within the inspected window, the offset can be used as is.
            if ($marker === false) {
                return $boundary;
            }

            $byte = \hexdec(\substr($text, $start + $marker + 1, 2));

            // 128-191: treated as a byte from the middle of a sequence, widen the window and retry.
            if ($byte >= 128 && $byte < 192) {
                $lookBack += 3;

                continue;
            }

            // 192 and above always moves the offset in front of the marker,
            // values below 128 only if the marker is not at the start of the window.
            if ($byte >= 192 || $marker > 0) {
                $boundary -= $lookBack - $marker;
            }

            return $boundary;
        }
    }

    /**
     * Check whether a string contains multi byte characters
     *
     * The string is considered multi byte if it has more bytes than characters in the given charset.
     *
     * @param string $text    Text to check
     * @param string $charset Charset to check
     *
     * @return bool
     *
     * @since 1.0.0
     */
    public static function hasMultiBytes(string $text, string $charset = CharsetType::UTF_8) : bool
    {
        $characters = \mb_strlen($text, $charset);
        $bytes      = \strlen($text);

        return $bytes > $characters;
    }
}