12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273 |
- <?php
- /**
- * UTF8::ord
- *
- * @package KO7
- *
- * @copyright (c) 2007-2016 Kohana Team
- * @copyright (c) since 2016 Koseven Team
- * @copyright (c) 2005 Harry Fuecks
- * @license http://www.gnu.org/licenses/old-licenses/lgpl-2.1.txt
- */
- function _ord($chr)
- {
- $ord0 = ord($chr);
- if ($ord0 >= 0 AND $ord0 <= 127)
- return $ord0;
- if ( ! isset($chr[1]))
- {
- throw new UTF8_Exception('Short sequence - at least 2 bytes expected, only 1 seen');
- }
- $ord1 = ord($chr[1]);
- if ($ord0 >= 192 AND $ord0 <= 223)
- return ($ord0 - 192) * 64 + ($ord1 - 128);
- if ( ! isset($chr[2]))
- {
- throw new UTF8_Exception('Short sequence - at least 3 bytes expected, only 2 seen');
- }
- $ord2 = ord($chr[2]);
- if ($ord0 >= 224 AND $ord0 <= 239)
- return ($ord0 - 224) * 4096 + ($ord1 - 128) * 64 + ($ord2 - 128);
- if ( ! isset($chr[3]))
- {
- throw new UTF8_Exception('Short sequence - at least 4 bytes expected, only 3 seen');
- }
- $ord3 = ord($chr[3]);
- if ($ord0 >= 240 AND $ord0 <= 247)
- return ($ord0 - 240) * 262144 + ($ord1 - 128) * 4096 + ($ord2-128) * 64 + ($ord3 - 128);
- if ( ! isset($chr[4]))
- {
- throw new UTF8_Exception('Short sequence - at least 5 bytes expected, only 4 seen');
- }
- $ord4 = ord($chr[4]);
- if ($ord0 >= 248 AND $ord0 <= 251)
- return ($ord0 - 248) * 16777216 + ($ord1-128) * 262144 + ($ord2 - 128) * 4096 + ($ord3 - 128) * 64 + ($ord4 - 128);
- if ( ! isset($chr[5]))
- {
- throw new UTF8_Exception('Short sequence - at least 6 bytes expected, only 5 seen');
- }
- if ($ord0 >= 252 AND $ord0 <= 253)
- return ($ord0 - 252) * 1073741824 + ($ord1 - 128) * 16777216 + ($ord2 - 128) * 262144 + ($ord3 - 128) * 4096 + ($ord4 - 128) * 64 + (ord($chr[5]) - 128);
- if ($ord0 >= 254 AND $ord0 <= 255)
- {
- throw new UTF8_Exception("Invalid UTF-8 with surrogate ordinal ':ordinal'", [
- ':ordinal' => $ord0,
- ]);
- }
- }
|