isophonics-drupal-site: core/lib/Drupal/Component/Utility/Unicode.php comparison

comparison core/lib/Drupal/Component/Utility/Unicode.php @ 17:129ea1e6d783

Update, including to Drupal core 8.6.10

author	Chris Cannam
date	Thu, 28 Feb 2019 13:21:36 +0000
parents	1fec387a4317
children

comparison

equal deleted inserted replaced

-:c2387f117808
+:129ea1e6d783
 * Indicates an error during check for PHP unicode support.
 */
 const STATUS_ERROR = -1;
 /**
-* Holds the multibyte capabilities of the current environment.
-*
-* @var int
-*/
-protected static $status = 0;
-/**
 * Gets the current status of unicode/multibyte support on this environment.
 *
 * @return int
 *   The status of multibyte support. It can be one of:
 *   - \Drupal\Component\Utility\Unicode::STATUS_MULTIBYTE
 *     Standard PHP (emulated) unicode support.
 *   - \Drupal\Component\Utility\Unicode::STATUS_ERROR
 *     An error occurred. No unicode support.
 */
 public static function getStatus() {
-return static::$status;
+switch (static::check()) {
+case 'mb_strlen':
+return Unicode::STATUS_SINGLEBYTE;
+case '':
+return Unicode::STATUS_MULTIBYTE;
+}
+return Unicode::STATUS_ERROR;
 }
 /**
 * Sets the value for multibyte support status for the current environment.
 *
 *   - \Drupal\Component\Utility\Unicode::STATUS_ERROR
 *     An error occurred. No unicode support.
 *
 * @param int $status
 *   The new status of multibyte support.
+*
+* @deprecated in Drupal 8.6.0 and will be removed before Drupal 9.0.0. In
+*   Drupal 9 there will be no way to set the status and in Drupal 8 this
+*   ability has been removed because mb_*() functions are supplied using
+*   Symfony's polyfill.
+*
+* @see https://www.drupal.org/node/2850048
 */
 public static function setStatus($status) {
-if (!in_array($status, [static::STATUS_SINGLEBYTE, static::STATUS_MULTIBYTE, static::STATUS_ERROR])) {
+@trigger_error('\Drupal\Component\Utility\Unicode::setStatus() is deprecated in Drupal 8.6.0 and will be removed before Drupal 9.0.0. In Drupal 9 there will be no way to set the status and in Drupal 8 this ability has been removed because mb_*() functions are supplied using Symfony\'s polyfill. See https://www.drupal.org/node/2850048.', E_USER_DEPRECATED);
-throw new \InvalidArgumentException('Invalid status value for unicode support.');
-}
-static::$status = $status;
 }
 /**
 * Checks for Unicode support in PHP and sets the proper settings if possible.
 *
 * @return string
 *   A string identifier of a failed multibyte extension check, if any.
 *   Otherwise, an empty string.
 */
 public static function check() {
+// Set appropriate configuration.
+mb_internal_encoding('utf-8');
+mb_language('uni');
 // Check for mbstring extension.
-if (!function_exists('mb_strlen')) {
+if (!extension_loaded('mbstring')) {
-static::$status = static::STATUS_SINGLEBYTE;
 return 'mb_strlen';
 }
 // Check mbstring configuration.
 if (ini_get('mbstring.func_overload') != 0) {
-static::$status = static::STATUS_ERROR;
 return 'mbstring.func_overload';
 }
 if (ini_get('mbstring.encoding_translation') != 0) {
-static::$status = static::STATUS_ERROR;
 return 'mbstring.encoding_translation';
 }
 // mbstring.http_input and mbstring.http_output are deprecated and empty by
 // default in PHP 5.6.
 if (version_compare(PHP_VERSION, '5.6.0') == -1) {
 if (ini_get('mbstring.http_input') != 'pass') {
-static::$status = static::STATUS_ERROR;
 return 'mbstring.http_input';
 }
 if (ini_get('mbstring.http_output') != 'pass') {
-static::$status = static::STATUS_ERROR;
 return 'mbstring.http_output';
 }
 }
-// Set appropriate configuration.
-mb_internal_encoding('utf-8');
-mb_language('uni');
-static::$status = static::STATUS_MULTIBYTE;
 return '';
 }
 /**
 * Decodes UTF byte-order mark (BOM) into the encoding's name.
 *
 * @return string|bool
 *   Converted data or FALSE.
 */
 public static function convertToUtf8($data, $encoding) {
-if (function_exists('iconv')) {
+return @iconv($encoding, 'utf-8', $data);
-return @iconv($encoding, 'utf-8', $data);
-}
-elseif (function_exists('mb_convert_encoding')) {
-return @mb_convert_encoding($data, 'utf-8', $encoding);
-}
-elseif (function_exists('recode_string')) {
-return @recode_string($encoding . '..utf-8', $data);
-}
-// Cannot convert.
-return FALSE;
 }
 /**
 * Truncates a UTF-8-encoded string safely to a number of bytes.
 *
 * @param string $text
 *   The string to run the operation on.
 *
 * @return int
 *   The length of the string.
+*
+* @deprecated in Drupal 8.6.0, will be removed before Drupal 9.0.0. Use
+*   mb_strlen() instead.
+*
+* @see https://www.drupal.org/node/2850048
 */
 public static function strlen($text) {
-if (static::getStatus() == static::STATUS_MULTIBYTE) {
+@trigger_error('\Drupal\Component\Utility\Unicode::strlen() is deprecated in Drupal 8.6.0 and will be removed before Drupal 9.0.0. Use mb_strlen() instead. See https://www.drupal.org/node/2850048.', E_USER_DEPRECATED);
 return mb_strlen($text);
-}
-else {
-// Do not count UTF-8 continuation bytes.
-return strlen(preg_replace("/[\x80-\xBF]/", '', $text));
-}
 }
 /**
 * Converts a UTF-8 string to uppercase.
 *
 * @param string $text
 *   The string to run the operation on.
 *
 * @return string
 *   The string in uppercase.
+*
+* @deprecated in Drupal 8.6.0, will be removed before Drupal 9.0.0. Use
+*   mb_strtoupper() instead.
+*
+* @see https://www.drupal.org/node/2850048
 */
 public static function strtoupper($text) {
-if (static::getStatus() == static::STATUS_MULTIBYTE) {
+@trigger_error('\Drupal\Component\Utility\Unicode::strtoupper() is deprecated in Drupal 8.6.0 and will be removed before Drupal 9.0.0. Use mb_strtoupper() instead. See https://www.drupal.org/node/2850048.', E_USER_DEPRECATED);
 return mb_strtoupper($text);
-}
-else {
-// Use C-locale for ASCII-only uppercase.
-$text = strtoupper($text);
-// Case flip Latin-1 accented letters.
-$text = preg_replace_callback('/\xC3[\xA0-\xB6\xB8-\xBE]/', '\Drupal\Component\Utility\Unicode::caseFlip', $text);
-return $text;
-}
 }
 /**
 * Converts a UTF-8 string to lowercase.
 *
 * @param string $text
 *   The string to run the operation on.
 *
 * @return string
 *   The string in lowercase.
+*
+* @deprecated in Drupal 8.6.0, will be removed before Drupal 9.0.0. Use
+*   mb_strtolower() instead.
+*
+* @see https://www.drupal.org/node/2850048
 */
 public static function strtolower($text) {
-if (static::getStatus() == static::STATUS_MULTIBYTE) {
+@trigger_error('\Drupal\Component\Utility\Unicode::strtolower() is deprecated in Drupal 8.6.0 and will be removed before Drupal 9.0.0. Use mb_strtolower() instead. See https://www.drupal.org/node/2850048.', E_USER_DEPRECATED);
 return mb_strtolower($text);
-}
-else {
-// Use C-locale for ASCII-only lowercase.
-$text = strtolower($text);
-// Case flip Latin-1 accented letters.
-$text = preg_replace_callback('/\xC3[\x80-\x96\x98-\x9E]/', '\Drupal\Component\Utility\Unicode::caseFlip', $text);
-return $text;
-}
 }
 /**
 * Capitalizes the first character of a UTF-8 string.
 *
 *
 * @return string
 *   The string with the first character as uppercase.
 */
 public static function ucfirst($text) {
-return static::strtoupper(static::substr($text, 0, 1)) . static::substr($text, 1);
+return mb_strtoupper(mb_substr($text, 0, 1)) . mb_substr($text, 1);
 }
 /**
 * Converts the first character of a UTF-8 string to lowercase.
 *
 *
 * @ingroup php_wrappers
 */
 public static function lcfirst($text) {
 // Note: no mbstring equivalent!
-return static::strtolower(static::substr($text, 0, 1)) . static::substr($text, 1);
+return mb_strtolower(mb_substr($text, 0, 1)) . mb_substr($text, 1);
 }
 /**
 * Capitalizes the first character of each word in a UTF-8 string.
 *
 * @ingroup php_wrappers
 */
 public static function ucwords($text) {
 $regex = '/(^|[' . static::PREG_CLASS_WORD_BOUNDARY . '])([^' . static::PREG_CLASS_WORD_BOUNDARY . '])/u';
 return preg_replace_callback($regex, function (array $matches) {
-return $matches[1] . Unicode::strtoupper($matches[2]);
+return $matches[1] . mb_strtoupper($matches[2]);
 }, $text);
 }
 /**
 * Cuts off a piece of a string based on character indices and counts.
 * @param int $length
 *   The number of characters to read.
 *
 * @return string
 *   The shortened string.
+*
+* @deprecated in Drupal 8.6.0, will be removed before Drupal 9.0.0. Use
+*   mb_substr() instead.
+*
+* @see https://www.drupal.org/node/2850048
 */
 public static function substr($text, $start, $length = NULL) {
-if (static::getStatus() == static::STATUS_MULTIBYTE) {
+@trigger_error('\Drupal\Component\Utility\Unicode::substr() is deprecated in Drupal 8.6.0 and will be removed before Drupal 9.0.0. Use mb_substr() instead. See https://www.drupal.org/node/2850048.', E_USER_DEPRECATED);
-return $length === NULL ? mb_substr($text, $start) : mb_substr($text, $start, $length);
+return mb_substr($text, $start, $length);
-}
-else {
-$strlen = strlen($text);
-// Find the starting byte offset.
-$bytes = 0;
-if ($start > 0) {
-// Count all the characters except continuation bytes from the start
-// until we have found $start characters or the end of the string.
-$bytes = -1; $chars = -1;
-while ($bytes < $strlen - 1 && $chars < $start) {
-$bytes++;
-$c = ord($text[$bytes]);
-if ($c < 0x80 || $c >= 0xC0) {
-$chars++;
-}
-}
-}
-elseif ($start < 0) {
-// Count all the characters except continuation bytes from the end
-// until we have found abs($start) characters.
-$start = abs($start);
-$bytes = $strlen; $chars = 0;
-while ($bytes > 0 && $chars < $start) {
-$bytes--;
-$c = ord($text[$bytes]);
-if ($c < 0x80 || $c >= 0xC0) {
-$chars++;
-}
-}
-}
-$istart = $bytes;
-// Find the ending byte offset.
-if ($length === NULL) {
-$iend = $strlen;
-}
-elseif ($length > 0) {
-// Count all the characters except continuation bytes from the starting
-// index until we have found $length characters or reached the end of
-// the string, then backtrace one byte.
-$iend = $istart - 1;
-$chars = -1;
-$last_real = FALSE;
-while ($iend < $strlen - 1 && $chars < $length) {
-$iend++;
-$c = ord($text[$iend]);
-$last_real = FALSE;
-if ($c < 0x80 || $c >= 0xC0) {
-$chars++;
-$last_real = TRUE;
-}
-}
-// Backtrace one byte if the last character we found was a real
-// character and we don't need it.
-if ($last_real && $chars >= $length) {
-$iend--;
-}
-}
-elseif ($length < 0) {
-// Count all the characters except continuation bytes from the end
-// until we have found abs($start) characters, then backtrace one byte.
-$length = abs($length);
-$iend = $strlen; $chars = 0;
-while ($iend > 0 && $chars < $length) {
-$iend--;
-$c = ord($text[$iend]);
-if ($c < 0x80 || $c >= 0xC0) {
-$chars++;
-}
-}
-// Backtrace one byte if we are not at the beginning of the string.
-if ($iend > 0) {
-$iend--;
-}
-}
-else {
-// $length == 0, return an empty string.
-return '';
-}
-return substr($text, $istart, max(0, $iend - $istart + 1));
-}
 }
 /**
 * Truncates a UTF-8-encoded string safely to a number of characters.
 *
 public static function truncate($string, $max_length, $wordsafe = FALSE, $add_ellipsis = FALSE, $min_wordsafe_length = 1) {
 $ellipsis = '';
 $max_length = max($max_length, 0);
 $min_wordsafe_length = max($min_wordsafe_length, 0);
-if (static::strlen($string) <= $max_length) {
+if (mb_strlen($string) <= $max_length) {
 // No truncation needed, so don't add ellipsis, just return.
 return $string;
 }
 if ($add_ellipsis) {
 // Truncate ellipsis in case $max_length is small.
-$ellipsis = static::substr('…', 0, $max_length);
+$ellipsis = mb_substr('…', 0, $max_length);
-$max_length -= static::strlen($ellipsis);
+$max_length -= mb_strlen($ellipsis);
 $max_length = max($max_length, 0);
 }
 if ($max_length <= $min_wordsafe_length) {
 // Do not attempt word-safe if lengths are bad.
 $found = preg_match('/^(.{' . $min_wordsafe_length . ',' . $max_length . '})[' . Unicode::PREG_CLASS_WORD_BOUNDARY . ']/us', $string, $matches);
 if ($found) {
 $string = $matches[1];
 }
 else {
-$string = static::substr($string, 0, $max_length);
+$string = mb_substr($string, 0, $max_length);
 }
 }
 else {
-$string = static::substr($string, 0, $max_length);
+$string = mb_substr($string, 0, $max_length);
 }
 if ($add_ellipsis) {
 // If we're adding an ellipsis, remove any trailing periods.
 $string = rtrim($string, '.');
 * @return int
 *   Returns < 0 if $str1 is less than $str2; > 0 if $str1 is greater than
 *   $str2, and 0 if they are equal.
 */
 public static function strcasecmp($str1, $str2) {
-return strcmp(static::strtoupper($str1), static::strtoupper($str2));
+return strcmp(mb_strtoupper($str1), mb_strtoupper($str2));
 }
 /**
 * Encodes MIME/HTTP headers that contain incorrectly encoded characters.
 *
 *
 * @return int|false
 *   The position where $needle occurs in $haystack, always relative to the
 *   beginning (independent of $offset), or FALSE if not found. Note that
 *   a return value of 0 is not the same as FALSE.
+*
+* @deprecated in Drupal 8.6.0, will be removed before Drupal 9.0.0. Use
+*   mb_strpos() instead.
+*
+* @see https://www.drupal.org/node/2850048
 */
 public static function strpos($haystack, $needle, $offset = 0) {
-if (static::getStatus() == static::STATUS_MULTIBYTE) {
+@trigger_error('\Drupal\Component\Utility\Unicode::strpos() is deprecated in Drupal 8.6.0 and will be removed before Drupal 9.0.0. Use mb_strpos() instead. See https://www.drupal.org/node/2850048.', E_USER_DEPRECATED);
 return mb_strpos($haystack, $needle, $offset);
-}
-else {
-// Remove Unicode continuation characters, to be compatible with
-// Unicode::strlen() and Unicode::substr().
-$haystack = preg_replace("/[\x80-\xBF]/", '', $haystack);
-$needle = preg_replace("/[\x80-\xBF]/", '', $needle);
-return strpos($haystack, $needle, $offset);
-}
 }
 }

Mercurial > hg > isophonics-drupal-site

comparison core/lib/Drupal/Component/Utility/Unicode.php @ 17:129ea1e6d783