pictcode / lib / Cake / I18n / Multibyte.php @ 1368d528
履歴 | 表示 | アノテート | ダウンロード (25.107 KB)
| 1 |
<?php
|
|---|---|
| 2 |
/**
|
| 3 |
* Multibyte handling methods.
|
| 4 |
*
|
| 5 |
* CakePHP(tm) : Rapid Development Framework (http://cakephp.org)
|
| 6 |
* Copyright (c) Cake Software Foundation, Inc. (http://cakefoundation.org)
|
| 7 |
*
|
| 8 |
* Licensed under The MIT License
|
| 9 |
* For full copyright and license information, please see the LICENSE.txt
|
| 10 |
* Redistributions of files must retain the above copyright notice.
|
| 11 |
*
|
| 12 |
* @copyright Copyright (c) Cake Software Foundation, Inc. (http://cakefoundation.org)
|
| 13 |
* @link http://cakephp.org CakePHP(tm) Project
|
| 14 |
* @package Cake.I18n
|
| 15 |
* @since CakePHP(tm) v 1.2.0.6833
|
| 16 |
* @license http://www.opensource.org/licenses/mit-license.php MIT License
|
| 17 |
*/
|
| 18 |
|
| 19 |
/**
|
| 20 |
* Multibyte handling methods.
|
| 21 |
*
|
| 22 |
* @package Cake.I18n
|
| 23 |
*/
|
| 24 |
class Multibyte { |
| 25 |
|
| 26 |
/**
|
| 27 |
* Holds the case folding values
|
| 28 |
*
|
| 29 |
* @var array
|
| 30 |
*/
|
| 31 |
protected static $_caseFold = array(); |
| 32 |
|
| 33 |
/**
|
| 34 |
* Holds an array of Unicode code point ranges
|
| 35 |
*
|
| 36 |
* @var array
|
| 37 |
*/
|
| 38 |
protected static $_codeRange = array(); |
| 39 |
|
| 40 |
/**
|
| 41 |
* Holds the current code point range
|
| 42 |
*
|
| 43 |
* @var string|null
|
| 44 |
*/
|
| 45 |
protected static $_table = null; |
| 46 |
|
| 47 |
/**
 * Converts a UTF-8 encoded string into an array of decimal code points.
 *
 * Bytes below 128 are emitted as-is. A byte of 128 or above starts (or
 * continues) a sequence whose expected length is chosen from the first byte
 * of that sequence: 2 bytes below 224, 3 bytes below 240, 4 bytes otherwise.
 * A sequence that is still incomplete when the string ends is dropped.
 *
 * @param string $string String to convert.
 * @return array List of integer code points, one entry per decoded character.
 */
public static function utf8($string) {
    $map = array();

    $values = array();
    $find = 1;
    $length = strlen($string);

    for ($i = 0; $i < $length; $i++) {
        $value = ord($string[$i]);

        if ($value < 128) {
            $map[] = $value;
            continue;
        }

        if (empty($values)) {
            // The first byte of a sequence decides how many bytes to collect.
            if ($value < 224) {
                $find = 2;
            } elseif ($value < 240) {
                $find = 3;
            } else {
                $find = 4;
            }
        }
        $values[] = $value;

        if (count($values) !== $find) {
            continue;
        }

        if ($find === 4) {
            $map[] = (($values[0] % 8) * 262144) + (($values[1] % 64) * 4096) +
                (($values[2] % 64) * 64) + ($values[3] % 64);
        } elseif ($find === 3) {
            $map[] = (($values[0] % 16) * 4096) + (($values[1] % 64) * 64) + ($values[2] % 64);
        } else {
            $map[] = (($values[0] % 32) * 64) + ($values[1] % 64);
        }
        $values = array();
        $find = 1;
    }
    return $map;
}
| 85 |
|
| 86 |
/**
 * Converts an array of decimal code points back into a UTF-8 encoded string.
 *
 * Values below 128 become a single byte, values below 2048 two bytes,
 * values below 65536 three bytes and anything larger four bytes.
 *
 * @param array $array Values array.
 * @return string
 */
public static function ascii($array) {
    $ascii = '';

    foreach ($array as $utf8) {
        if ($utf8 < 128) {
            $ascii .= chr($utf8);
        } elseif ($utf8 < 2048) {
            $ascii .= chr(192 + ($utf8 >> 6));
            $ascii .= chr(128 + ($utf8 & 63));
        } elseif ($utf8 < 65536) {
            $ascii .= chr(224 + ($utf8 >> 12));
            $ascii .= chr(128 + (($utf8 >> 6) & 63));
            $ascii .= chr(128 + ($utf8 & 63));
        } else {
            // Supplementary planes need a four byte sequence.
            $ascii .= chr(240 + ($utf8 >> 18));
            $ascii .= chr(128 + (($utf8 >> 12) & 63));
            $ascii .= chr(128 + (($utf8 >> 6) & 63));
            $ascii .= chr(128 + ($utf8 & 63));
        }
    }
    return $ascii;
}
| 110 |
|
| 111 |
/**
 * Find position of first occurrence of a case-insensitive string.
 *
 * When $haystack contains no multibyte characters the native stripos() is
 * used. Otherwise both strings are upper-cased with Multibyte::strtoupper()
 * and the search is delegated to Multibyte::strpos().
 *
 * @param string $haystack The string from which to get the position of the first occurrence of $needle.
 * @param string $needle The string to find in $haystack.
 * @param int $offset The position in $haystack to start searching.
 * @return int|bool The numeric position of the first occurrence of $needle in the $haystack string,
 *    or false if $needle is not found.
 */
public static function stripos($haystack, $needle, $offset = 0) {
    if (!Multibyte::checkMultibyte($haystack)) {
        return stripos($haystack, $needle, $offset);
    }

    $upperHaystack = Multibyte::strtoupper($haystack);
    $upperNeedle = Multibyte::strtoupper($needle);

    return Multibyte::strpos($upperHaystack, $upperNeedle, $offset);
}
| 128 |
|
| 129 |
/**
 * Finds first occurrence of a string within another, case insensitive.
 *
 * The native stristr() is used when $haystack has no multibyte characters,
 * unless $part is requested on PHP older than 5.3, where the native function
 * lacks that argument. Otherwise both strings are upper-cased and compared
 * code point by code point; the returned portion is taken from the original,
 * unmodified $haystack.
 *
 * @param string $haystack The string from which to get the first occurrence of $needle.
 * @param string $needle The string to find in $haystack.
 * @param bool $part Determines which portion of $haystack this function returns.
 *    If set to true, it returns all of $haystack from the beginning to the first occurrence of $needle.
 *    If set to false, it returns all of $haystack from the first occurrence of $needle to the end,
 *    Default value is false.
 * @return string|bool The portion of $haystack, or false if $needle is not found.
 */
public static function stristr($haystack, $needle, $part = false) {
    $legacy = version_compare(PHP_VERSION, '5.3.0', '<');

    if (!($legacy && $part) && !Multibyte::checkMultibyte($haystack)) {
        if ($legacy) {
            return stristr($haystack, $needle);
        }
        return stristr($haystack, $needle, $part);
    }

    $check = Multibyte::utf8(Multibyte::strtoupper($haystack));
    $points = Multibyte::utf8($haystack);
    $needle = Multibyte::utf8(Multibyte::strtoupper($needle));
    $needleCount = count($needle);

    if ($needleCount === 0) {
        return false;
    }

    // Never start a comparison that would run past the end of either array.
    $last = min(count($check), count($points)) - $needleCount;

    for ($position = 0; $position <= $last; $position++) {
        if (array_slice($check, $position, $needleCount) !== $needle) {
            continue;
        }
        if ($part) {
            // A match at position 0 correctly yields an empty string here.
            return Multibyte::ascii(array_slice($points, 0, $position));
        }
        return Multibyte::ascii(array_slice($points, $position));
    }
    return false;
}
| 189 |
|
| 190 |
/**
 * Get string length.
 *
 * Strings without multibyte characters are measured with the native
 * strlen(); otherwise the number of decoded code points is returned.
 *
 * @param string $string The string being checked for length.
 * @return int The number of characters in string $string
 */
public static function strlen($string) {
    if (!Multibyte::checkMultibyte($string)) {
        return strlen($string);
    }
    $codePoints = Multibyte::utf8($string);

    return count($codePoints);
}
| 203 |
|
| 204 |
/**
 * Find position of first occurrence of a string.
 *
 * Falls back to the native strpos() when $haystack has no multibyte
 * characters. In the multibyte path positions are counted in characters,
 * an empty $needle is never found and a negative $offset is treated as 0.
 *
 * @param string $haystack The string being checked.
 * @param string $needle The string to find in $haystack.
 * @param int $offset The search offset. If it is not specified, 0 is used.
 * @return int|bool The numeric position of the first occurrence of $needle in the $haystack string.
 *    If $needle is not found, it returns false.
 */
public static function strpos($haystack, $needle, $offset = 0) {
    if (!Multibyte::checkMultibyte($haystack)) {
        return strpos($haystack, $needle, $offset);
    }

    $haystack = Multibyte::utf8($haystack);
    $needle = Multibyte::utf8($needle);
    $needleCount = count($needle);

    if ($needleCount === 0) {
        return false;
    }

    // Stop early enough that the needle always fits inside the haystack.
    $last = count($haystack) - $needleCount;

    for ($position = max(0, (int)$offset); $position <= $last; $position++) {
        if (array_slice($haystack, $position, $needleCount) === $needle) {
            return $position;
        }
    }
    return false;
}
| 246 |
|
| 247 |
/**
 * Finds the last occurrence of a string within another.
 *
 * Both strings are decoded to code points and the haystack is scanned from
 * the end towards the beginning, so the first hit is the last occurrence of
 * the complete $needle. An empty $needle is never found.
 *
 * @param string $haystack The string from which to get the last occurrence of $needle.
 * @param string $needle The string to find in $haystack.
 * @param bool $part Determines which portion of $haystack this function returns.
 *    If set to true, it returns all of $haystack from the beginning to the last occurrence of $needle.
 *    If set to false, it returns all of $haystack from the last occurrence of $needle to the end,
 *    Default value is false.
 * @return string|bool The portion of $haystack. or false if $needle is not found.
 */
public static function strrchr($haystack, $needle, $part = false) {
    $haystack = Multibyte::utf8($haystack);
    $needle = Multibyte::utf8($needle);
    $needleCount = count($needle);

    if ($needleCount === 0) {
        return false;
    }

    for ($position = count($haystack) - $needleCount; $position >= 0; $position--) {
        if (array_slice($haystack, $position, $needleCount) !== $needle) {
            continue;
        }
        if ($part) {
            return Multibyte::ascii(array_slice($haystack, 0, $position));
        }
        return Multibyte::ascii(array_slice($haystack, $position));
    }
    return false;
}
| 306 |
|
| 307 |
/**
 * Finds the last occurrence of a string within another, case insensitive.
 *
 * Both strings are upper-cased with Multibyte::strtoupper() for comparison
 * and the haystack is scanned from the end towards the beginning. The
 * returned portion is taken from the original, unmodified $haystack.
 * An empty $needle is never found.
 *
 * @param string $haystack The string from which to get the last occurrence of $needle.
 * @param string $needle The string to find in $haystack.
 * @param bool $part Determines which portion of $haystack this function returns.
 *    If set to true, it returns all of $haystack from the beginning to the last occurrence of $needle.
 *    If set to false, it returns all of $haystack from the last occurrence of $needle to the end,
 *    Default value is false.
 * @return string|bool The portion of $haystack. or false if $needle is not found.
 */
public static function strrichr($haystack, $needle, $part = false) {
    $check = Multibyte::utf8(Multibyte::strtoupper($haystack));
    $points = Multibyte::utf8($haystack);
    $needle = Multibyte::utf8(Multibyte::strtoupper($needle));
    $needleCount = count($needle);

    if ($needleCount === 0) {
        return false;
    }

    // Positions found in the folded copy are applied to the original code
    // points, so stay inside both arrays.
    $last = min(count($check), count($points)) - $needleCount;

    for ($position = $last; $position >= 0; $position--) {
        if (array_slice($check, $position, $needleCount) !== $needle) {
            continue;
        }
        if ($part) {
            return Multibyte::ascii(array_slice($points, 0, $position));
        }
        return Multibyte::ascii(array_slice($points, $position));
    }
    return false;
}
| 368 |
|
| 369 |
/**
 * Finds position of last occurrence of a string within another, case insensitive
 *
 * Falls back to the native strripos() when $haystack has no multibyte
 * characters. In the multibyte path both strings are upper-cased with
 * Multibyte::strtoupper() and positions are counted in characters of the
 * upper-cased haystack. A positive $offset skips that many characters from
 * the start; a negative $offset excludes matches starting after that many
 * characters from the end. An empty $needle is never found.
 *
 * @param string $haystack The string from which to get the position of the last occurrence of $needle.
 * @param string $needle The string to find in $haystack.
 * @param int $offset The position in $haystack to start searching.
 * @return int|bool The numeric position of the last occurrence of $needle in the $haystack string,
 *    or false if $needle is not found.
 */
public static function strripos($haystack, $needle, $offset = 0) {
    if (!Multibyte::checkMultibyte($haystack)) {
        return strripos($haystack, $needle, $offset);
    }

    $haystack = Multibyte::utf8(Multibyte::strtoupper($haystack));
    $haystackCount = count($haystack);
    $needle = Multibyte::utf8(Multibyte::strtoupper($needle));
    $needleCount = count($needle);

    if ($needleCount === 0) {
        return false;
    }

    $offset = (int)$offset;
    $first = ($offset > 0) ? $offset : 0;
    $last = $haystackCount - $needleCount;
    if ($offset < 0) {
        $last = min($last, $haystackCount + $offset);
    }

    // Scan backwards so the first hit is the last occurrence.
    for ($position = $last; $position >= $first; $position--) {
        if (array_slice($haystack, $position, $needleCount) === $needle) {
            return $position;
        }
    }
    return false;
}
| 418 |
|
| 419 |
/**
 * Find position of last occurrence of a string in a string.
 *
 * Falls back to the native strrpos() when $haystack has no multibyte
 * characters. In the multibyte path positions are counted in characters and
 * an empty $needle is never found.
 *
 * @param string $haystack The string being checked, for the last occurrence of $needle.
 * @param string $needle The string to find in $haystack.
 * @param int $offset May be specified to begin searching an arbitrary number of characters into the string.
 *    Negative values will stop searching at an arbitrary point prior to the end of the string.
 * @return int|bool The numeric position of the last occurrence of $needle in the $haystack string.
 *    If $needle is not found, it returns false.
 */
public static function strrpos($haystack, $needle, $offset = 0) {
    if (!Multibyte::checkMultibyte($haystack)) {
        return strrpos($haystack, $needle, $offset);
    }

    $haystack = Multibyte::utf8($haystack);
    $haystackCount = count($haystack);
    $needle = Multibyte::utf8($needle);
    $needleCount = count($needle);

    if ($needleCount === 0) {
        return false;
    }

    $offset = (int)$offset;
    // A positive offset moves the lower bound of the search window; a
    // negative offset lowers the highest position a match may start at.
    $first = ($offset > 0) ? $offset : 0;
    $last = $haystackCount - $needleCount;
    if ($offset < 0) {
        $last = min($last, $haystackCount + $offset);
    }

    // Scan backwards so the first hit is the last occurrence.
    for ($position = $last; $position >= $first; $position--) {
        if (array_slice($haystack, $position, $needleCount) === $needle) {
            return $position;
        }
    }
    return false;
}
| 468 |
|
| 469 |
/**
 * Finds first occurrence of a string within another
 *
 * The native strstr() is used when $haystack has no multibyte characters,
 * unless $part is requested on PHP older than 5.3, where the native function
 * lacks that argument. Otherwise the strings are compared code point by
 * code point. An empty $needle is never found in that path.
 *
 * @param string $haystack The string from which to get the first occurrence of $needle.
 * @param string $needle The string to find in $haystack
 * @param bool $part Determines which portion of $haystack this function returns.
 *    If set to true, it returns all of $haystack from the beginning to the first occurrence of $needle.
 *    If set to false, it returns all of $haystack from the first occurrence of $needle to the end,
 *    Default value is FALSE.
 * @return string|bool The portion of $haystack, or false if $needle is not found.
 */
public static function strstr($haystack, $needle, $part = false) {
    $legacy = version_compare(PHP_VERSION, '5.3.0', '<');

    if (!($legacy && $part) && !Multibyte::checkMultibyte($haystack)) {
        if ($legacy) {
            return strstr($haystack, $needle);
        }
        return strstr($haystack, $needle, $part);
    }

    $haystack = Multibyte::utf8($haystack);
    $needle = Multibyte::utf8($needle);
    $needleCount = count($needle);

    if ($needleCount === 0) {
        return false;
    }

    // Stop early enough that the needle always fits inside the haystack.
    $last = count($haystack) - $needleCount;

    for ($position = 0; $position <= $last; $position++) {
        if (array_slice($haystack, $position, $needleCount) !== $needle) {
            continue;
        }
        if ($part) {
            // A match at position 0 correctly yields an empty string here.
            return Multibyte::ascii(array_slice($haystack, 0, $position));
        }
        return Multibyte::ascii(array_slice($haystack, $position));
    }
    return false;
}
| 527 |
|
| 528 |
/**
 * Make a string lowercase
 *
 * Code points below 128 go through the native strtolower(). Every other
 * code point is looked up in the case folding tables by its upper-case
 * value and replaced with the first code point of the matching lower-case
 * entry; code points without an entry are copied unchanged.
 *
 * @param string $string The string being lowercased.
 * @return string with all alphabetic characters converted to lowercase.
 */
public static function strtolower($string) {
    $lowerCase = array();

    foreach (Multibyte::utf8($string) as $char) {
        if ($char < 128) {
            $lowerCase[] = ord(strtolower(chr($char)));
            continue;
        }

        $mapped = $char;
        foreach (static::_find($char, 'upper') as $fold) {
            // isset() replaces a count() on the integer code point, which
            // is an error on current PHP versions.
            if ($fold['upper'] == $char && isset($fold['lower'][0])) {
                $mapped = $fold['lower'][0];
                break;
            }
        }
        $lowerCase[] = $mapped;
    }
    return Multibyte::ascii($lowerCase);
}
| 571 |
|
| 572 |
/**
 * Make a string uppercase
 *
 * Code points below 128 go through the native strtoupper(). Every other
 * code point is looked up in the case folding tables by the first code
 * point of the lower-case entry. Entries whose lower-case form spans several
 * code points are matched against the following characters of the input;
 * the code points consumed that way are remembered in $replaced so they are
 * not emitted again as unmatched characters.
 *
 * @param string $string The string being uppercased.
 * @return string with all alphabetic characters converted to uppercase.
 */
public static function strtoupper($string) {
    $utf8Map = Multibyte::utf8($string);

    $length = count($utf8Map);
    $replaced = array();
    $upperCase = array();

    for ($i = 0; $i < $length; $i++) {
        $char = $utf8Map[$i];

        if ($char < 128) {
            $upperCase[] = ord(strtoupper(chr($char)));
            continue;
        }

        $matched = false;
        $keys = static::_find($char);
        $keyCount = count($keys);

        foreach ($keys as $key => $value) {
            $matched = false;
            $replace = 0;
            if ($length > 1 && count($keys[$key]['lower']) > 1) {
                // Multi code point lower-case form: compare with the input
                // starting at the current position.
                $count = count($keys[$key]['lower']);
                for ($ii = 0; $ii < $count; $ii++) {
                    // Look-ahead may run past the end of the input.
                    $nextChar = isset($utf8Map[$i + $ii]) ? $utf8Map[$i + $ii] : null;

                    if (isset($nextChar) && ($nextChar == $keys[$key]['lower'][$ii])) {
                        $replace++;
                    }
                }
                if ($replace == $count) {
                    $upperCase[] = $keys[$key]['upper'];
                    $replaced = array_merge($replaced, array_values($keys[$key]['lower']));
                    $matched = true;
                    break 1;
                }
            } elseif ($length > 1 && $keyCount > 1) {
                for ($ii = 1; $ii < $keyCount; $ii++) {
                    $nextChar = isset($utf8Map[$i + $ii - 1]) ? $utf8Map[$i + $ii - 1] : null;

                    if (in_array($nextChar, $keys[$ii]['lower'])) {
                        for ($jj = 0, $count = count($keys[$ii]['lower']); $jj < $count; $jj++) {
                            $nextChar = isset($utf8Map[$i + $jj]) ? $utf8Map[$i + $jj] : null;

                            if (isset($nextChar) && ($nextChar == $keys[$ii]['lower'][$jj])) {
                                $replace++;
                            }
                        }
                        if ($replace == $count) {
                            $upperCase[] = $keys[$ii]['upper'];
                            $replaced = array_merge($replaced, array_values($keys[$ii]['lower']));
                            $matched = true;
                            break 2;
                        }
                    }
                }
            }
            if ($keys[$key]['lower'][0] == $char) {
                $upperCase[] = $keys[$key]['upper'];
                $matched = true;
                break 1;
            }
        }

        if ($matched === false && !in_array($char, $replaced, true)) {
            $upperCase[] = $char;
        }
    }
    return Multibyte::ascii($upperCase);
}
| 659 |
|
| 660 |
/**
 * Count the number of substring occurrences
 *
 * Both strings are decoded to code points and occurrences are counted from
 * left to right without overlap: after a match the scan resumes behind the
 * matched needle. An empty $needle yields 0.
 *
 * @param string $haystack The string being checked.
 * @param string $needle The string being found.
 * @return int The number of times the $needle substring occurs in the $haystack string.
 */
public static function substrCount($haystack, $needle) {
    $haystack = Multibyte::utf8($haystack);
    $needle = Multibyte::utf8($needle);
    $needleCount = count($needle);

    if ($needleCount === 0) {
        return 0;
    }

    $count = 0;
    $position = 0;
    $last = count($haystack) - $needleCount;

    while ($position <= $last) {
        if (array_slice($haystack, $position, $needleCount) === $needle) {
            $count++;
            $position += $needleCount;
        } else {
            $position++;
        }
    }
    return $count;
}
| 694 |
|
| 695 |
/**
 * Get part of string
 *
 * Positions and lengths are counted in characters. Negative values follow
 * the array_slice() rules: a negative $start counts from the end of the
 * string and a negative $length stops that many characters before the end.
 *
 * @param string $string The string being checked.
 * @param int $start The first position used in $string.
 * @param int $length The maximum length of the returned string.
 * @return string The portion of $string specified by the $start and $length parameters.
 */
public static function substr($string, $start, $length = null) {
    if ($start === 0 && $length === null) {
        return $string;
    }

    $points = Multibyte::utf8($string);

    if ($length === null) {
        $slice = array_slice($points, (int)$start);
    } else {
        $slice = array_slice($points, (int)$start, (int)$length);
    }
    return Multibyte::ascii($slice);
}
| 725 |
|
| 726 |
/**
 * Prepare a string for mail transport, using the provided encoding
 *
 * Strings shorter than 75 bytes without multibyte characters are returned
 * untouched. Everything else is base64 encoded and wrapped in
 * "=?CHARSET?B?...?=" encoded words joined by $newline and a space. For
 * UTF-8 the input is cut before a lead byte so no character is split
 * across two encoded words.
 *
 * @param string $string value to encode
 * @param string $charset charset to use for encoding. When empty, the value
 *    of Configure::read('App.encoding') is used.
 * @param string $newline Newline string.
 * @return string
 */
public static function mimeEncode($string, $charset = null, $newline = "\r\n") {
    $needsEncoding = Multibyte::checkMultibyte($string) || strlen($string) >= 75;
    if (!$needsEncoding) {
        return $string;
    }

    if (empty($charset)) {
        $charset = Configure::read('App.encoding');
    }
    $charset = strtoupper($charset);

    $start = '=?' . $charset . '?B?';
    $end = '?=';
    $spacer = $end . $newline . ' ' . $start;

    // Room left for base64 data per encoded word, rounded down to a
    // multiple of four so every chunk is a complete base64 group.
    $length = 75 - strlen($start) - strlen($end);
    $length -= $length % 4;

    if ($charset !== 'UTF-8') {
        $encoded = chunk_split(base64_encode($string), $length, $spacer);
        $encoded = preg_replace('/' . preg_quote($spacer) . '$/', '', $encoded);

        return $start . $encoded . $end;
    }

    $parts = array();
    $maxchars = floor(($length * 3) / 4);

    while (strlen($string) > $maxchars) {
        $cut = (int)$maxchars;
        $byte = ord($string[$cut]);
        // Step back over continuation bytes (128-191) to a character start.
        while ($byte >= 128 && $byte <= 191) {
            $cut--;
            $byte = ord($string[$cut]);
        }
        $parts[] = base64_encode(substr($string, 0, $cut));
        $string = substr($string, $cut);
    }
    $parts[] = base64_encode($string);

    return $start . implode($spacer, $parts) . $end;
}
| 773 |
|
| 774 |
/**
 * Return the Code points range for Unicode characters
 *
 * Maps a code point to the name of the case folding table covering its
 * Unicode block, or false when no table covers it. Every block is checked
 * against both its lower and its upper bound, so code points lying between
 * two supported blocks are not attributed to a neighbouring table. The
 * result is also stored in static::$_codeRange under the code point.
 *
 * @param int $decimal Decimal value.
 * @return string|bool Table name, or false when no table covers $decimal.
 */
protected static function _codepoint($decimal) {
    $blocks = array(
        '0080_00ff' => array(128, 255), // Latin-1 Supplement
        '0100_017f' => array(256, 383), // Latin Extended-A
        '0180_024F' => array(384, 591), // Latin Extended-B
        '0250_02af' => array(592, 687), // IPA Extensions
        '0370_03ff' => array(880, 1023), // Greek and Coptic
        '0400_04ff' => array(1024, 1279), // Cyrillic
        '0500_052f' => array(1280, 1327), // Cyrillic Supplement
        '0530_058f' => array(1328, 1423), // Armenian
        '1e00_1eff' => array(7680, 7935), // Latin Extended Additional
        '1f00_1fff' => array(7936, 8191), // Greek Extended
        '2100_214f' => array(8448, 8527), // Letterlike Symbols
        '2150_218f' => array(8528, 8591), // Number Forms
        '2460_24ff' => array(9312, 9471), // Enclosed Alphanumerics
        '2c00_2c5f' => array(11264, 11359), // Glagolitic
        '2c60_2c7f' => array(11360, 11391), // Latin Extended-C
        '2c80_2cff' => array(11392, 11519), // Coptic
        'ff00_ffef' => array(65280, 65519), // Halfwidth and Fullwidth Forms
    );

    $return = false;
    foreach ($blocks as $name => $bounds) {
        if ($decimal >= $bounds[0] && $decimal <= $bounds[1]) {
            $return = $name;
            break;
        }
    }
    static::$_codeRange[$decimal] = $return;
    return $return;
}
| 821 |
|
| 822 |
/**
 * Find the related code folding values for $char
 *
 * Resolves the table name for $char through static::_codepoint() the first
 * time the code point is seen. The table is loaded through Configure and
 * kept in static::$_caseFold, so it is read only once per range instead of
 * once per distinct character.
 *
 * @param int $char decimal value of character
 * @param string $type Type 'lower' or 'upper'. Defaults to 'lower'.
 *    'lower' matches on the first code point of an entry's lower-case form,
 *    'upper' on the entry's upper-case code point.
 * @return array List of matching case folding entries, empty when none match.
 */
protected static function _find($char, $type = 'lower') {
    if (!isset(static::$_codeRange[$char])) {
        $range = static::_codepoint($char);
        if ($range === false) {
            return array();
        }
        if (!isset(static::$_caseFold[$range])) {
            if (!Configure::configured('_cake_core_')) {
                App::uses('PhpReader', 'Configure');
                Configure::config('_cake_core_', new PhpReader(CAKE . 'Config' . DS));
            }
            Configure::load('unicode' . DS . 'casefolding' . DS . $range, '_cake_core_');
            static::$_caseFold[$range] = Configure::read($range);
            // The table is only needed in the local cache, not in Configure.
            Configure::delete($range);
        }
    }

    if (!static::$_codeRange[$char]) {
        return array();
    }
    static::$_table = static::$_codeRange[$char];

    $found = array();
    if (empty(static::$_caseFold[static::$_table])) {
        return $found;
    }

    foreach (static::$_caseFold[static::$_table] as $fold) {
        if ($type === 'lower' && $fold[$type][0] === $char) {
            $found[] = $fold;
        } elseif ($type === 'upper' && $fold[$type] === $char) {
            $found[] = $fold;
        }
    }
    return $found;
}
| 860 |
|
| 861 |
/**
 * Check the $string for multibyte characters
 *
 * Scans the string byte by byte and reports true as soon as a byte with a
 * value greater than 128 is seen.
 *
 * @param string $string Value to test.
 * @return bool
 */
public static function checkMultibyte($string) {
    $bytes = strlen($string);
    $index = 0;

    while ($index < $bytes) {
        if (ord($string[$index]) > 128) {
            return true;
        }
        $index++;
    }
    return false;
}
| 878 |
|
| 879 |
} |