方法1
function unicode2utf8( $str )
{
$str = preg_replace_callback('/\\\\u([0-9a-f]{4})/i', array($this,'replace_unicode_escape_sequence'), $str);
return $str;
}
function replace_unicode_escape_sequence($match)
{
return mb_convert_encoding(pack('H*', $match[1]), 'UTF-8', 'UTF-16BE');
}
方法2
/**
* UNICODE 转 UTF8
* @param $str
* @param $code
* @return string
**/
function unicodeToUTF8($str, $code = 'UTF-8')
{
$str = str_replace('\u', '%u', $str);
$str = rawurldecode($str);
preg_match_all("/(?:%u.{4})|.{4};|&#\d+;|.+/U", $str, $r);
$ar = $r[0];
foreach ($ar as $k => $v)
{
if (substr($v, 0, 2) == "%u")
{
$ar[$k] = iconv("UCS-2", $code, pack("H4", substr($v, -4)));
}
elseif (substr($v, 0, 3) == "")
{
$ar[$k] = iconv("UCS-2", $code, pack("H4", substr($v, 3, -1)));
}
elseif (substr($v, 0, 2) == "&#")
{
echo substr($v, 2, -1) . " ";
$ar[$k] = iconv("UCS-2", $code, pack("n", substr($v, 2, -1)));
}
}
return join("", $ar);
}