这个类相当好用.作用么,PHP做JSON传递GBK字符,比如中文,日文,韩文神马的Unicode最合适不过了..
functiontoUtf8($ar)
{
foreach($aras$val){
$val=intval(substr($val,2),16);
if($val<0x7F){// 0000-007F
$c.=chr($val);
}elseif($val<0x800){// 0080-0800
$c.=chr(0xC0|($val/64));
$c.=chr(0x80|($val%64));
}else{// 0800-FFFF
$c.=chr(0xE0|(($val/64)/64));
$c.=chr(0x80|(($val/64)%64));
$c.=chr(0x80|($val%64));
}
}
return$c;
}
functionescape($string,$encoding='gb2312')
{
$return='';
for($x=0;$x<mb_strlen($string,$encoding);$x++){
$str=mb_substr($string,$x,1,$encoding);
if(strlen($str)>1){// 多字节字符
$return.='%u'.strtoupper(bin2hex(mb_convert_encoding($str,'UCS-2',$encoding)));
}else{
$return.='%'.strtoupper(bin2hex($str));
}
}
return$return;
}
functiongb2utf8($string,$encoding='utf-8',$from_encode='gb2312')
{
returnmb_convert_encoding($string,$encoding,$from_encode);
}
}
?>
google code 上找到的另外一个类似脚本
function<a href="/tag/PHP/" target="_blank" class="keywords">PHP</a>escape($str)
{
$sublen=strlen($str);
$retrunString="";
for($i=0;$i<$sublen;$i++)
{
if(ord($str[$i])>=127)
{
$tmpString=bin2hex(iconv("gbk","ucs-2",substr($str,$i,2)));
$tmpString=substr($tmpString,2,2).substr($tmpString,2);
$retrunString.="%u".$tmpString;
$i++;
}else{
$retrunString.="%".dechex(ord($str[$i]));
}
}
return$retrunString;
}
functionescape($str)
{
preg_match_all("/[\x80-\xff].|[\x01-\x7f]+/",$str,$r);
$ar=$r[0];
foreach($aras$k=>$v)
{
if(ord($v[0])<128)
$ar[$k]=rawurlencode($v);
else
$ar[$k]="%u".bin2hex(iconv("UTF-8","UCS-2",$v));
}
returnjoin("",$ar);
}
function<a href="/tag/PHP/" target="_blank" class="keywords">PHP</a>unescape($source)
{
$decodedStr="";
$pos=0;
$len=strlen($source);
while($pos<$len)
{
$charAt=substr($source,$pos,1);
if($charAt=='%')
{
$pos++;
$charAt=substr($source,1);
if($charAt=='u')
{
// we got a unicode character
$pos++;
$unicodeHexVal=substr($source,4);
$unicode=hexdec($unicodeHexVal);
$entity="&#".$unicode.';';
$decodedStr.=utf8_encode($entity);
$pos+=4;
}else{
// we have an escaped ascii character
$hexVal=substr($source,2);
$decodedStr.=chr(hexdec($hexVal));
$pos+=2;
}
}else{
$decodedStr.=$charAt;
$pos++;
}
}
return$decodedStr;
}
functionunescape($str)
{
$str=rawurldecode($str);
preg_match_all("/(?:%u.{4})|&#x.{4};|&#\d+;|.+/U",$r);
$ar=$r[0];
#print_r($ar);
foreach($aras$k=>$v)
{
if(substr($v,2)=="%u")
$ar[$k]=iconv("UCS-2","UTF-8",pack("H4",substr($v,-4)));
elseif(substr($v,3)=="&#x")
$ar[$k]=iconv("UCS-2",3,-1)));
elseif(substr($v,2)=="&#")
{
//echo substr($v,-1)."";
$ar[$k]=iconv("UCS-2",pack("n",-1)));
}
}
returnjoin("",$ar);
}
?>