$code || $code >= 0x80) { return '{\\u' . $code . '}'; } if ($code == 123 || $code == 125 || $code == 92) { // open or close brace or backslash return '\\' . chr($code); } return chr($code); } protected function escapeMultibyteCharacter($code) { return '\\uc0{\\u' . $code . '}'; } /** * @see http://www.randomchaos.com/documents/?source=php_and_unicode * @param string $input */ protected function escapeSingleValue($input) { $escapedValue = ''; $numberOfBytes = 1; $bytes = array(); for ($i = 0; $i < strlen($input); ++$i) { $character = $input[$i]; $asciiCode = ord($character); if ($asciiCode < 128) { $escapedValue .= $this->escapeAsciiCharacter($asciiCode); } else { if (0 == count($bytes)) { if ($asciiCode < 224) { $numberOfBytes = 2; } elseif ($asciiCode < 240) { $numberOfBytes = 3; } elseif ($asciiCode < 248) { $numberOfBytes = 4; } } $bytes[] = $asciiCode; if ($numberOfBytes == count($bytes)) { if (4 == $numberOfBytes) { $multibyteCode = ($bytes[0] % 8) * 262144 + ($bytes[1] % 64) * 4096 + ($bytes[2] % 64) * 64 + ($bytes[3] % 64); } elseif (3 == $numberOfBytes) { $multibyteCode = ($bytes[0] % 16) * 4096 + ($bytes[1] % 64) * 64 + ($bytes[2] % 64); } else { $multibyteCode = ($bytes[0] % 32) * 64 + ($bytes[1] % 64); } if (65279 != $multibyteCode) { $escapedValue .= $multibyteCode < 128 ? $this->escapeAsciiCharacter($multibyteCode) : $this->escapeMultibyteCharacter($multibyteCode); } $numberOfBytes = 1; $bytes = array(); } } } return $escapedValue; } }