javascript utf-8 url 编码 之 纯算法 解码 by shawl.qiu 2007-9-24
说明:
这个函数的用处在于: 当页面本身使用非 UTF-8 编码 (例如 GB2312), 而接收 request 时, 其他页面传递过来的却是 UTF-8 百分号编码 (percent-encoding) 的 URL,
这时就可以用这个函数以纯算法的方式把 URL 解码还原成原始字符, 它就大有作为了.
题外话, 最近在研究算法, 刚开始的时候是 hash function, 然后 发现得先学 二进制, 再后来发现得学习 base64, 然后发现得了解编码集, 然后.....
天呀...真个没得完...
shawl.qiu
2007-09-24
http://blog.csdn.net/btbtd
下载:
http://files.myopera.com/btbtd/javascript/function/fPEUtf8ToGb.7z
内容:
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<title>shawl.qiu template </title>
<style type="text/css">
/* <![CDATA[ */
/* ]]> */
</style>
<script type="text/javascript">
/*<![CDATA[*/
// Maximise the browser window; applied to Microsoft Internet Explorer only.
if (navigator.appName === "Microsoft Internet Explorer")
{
  // Park the window just beyond the top-left corner of the screen ...
  self.moveTo(-5, -5);
  // ... and size it slightly past the available screen area, so the result
  // is in fact a little larger than a normally maximised window.
  self.resizeTo(screen.availWidth + 8, screen.availHeight + 8);
}
/*]]>*/
</script>
</head>
<body>
<script type="text/javascript">
/*<![CDATA[*/
// Run the round-trip demo once for each built-in encoder. The work is wrapped
// in an immediately-invoked function so the loop variables stay local.
(function ()
{
  var aEncoder = [
    ["encodeURIComponent", encodeURIComponent],
    ["encodeURI", encodeURI]
  ];
  for (var iEnc = 0; iEnc < aEncoder.length; iEnc++)
  {
    fTestFunc(aEncoder[iEnc][0], aEncoder[iEnc][1]);
  }
})();
// PE = percent encoding
function fPEUtf8ToGb(sUtf8PE)
{ // shawl.qiu code, return string
  // Decodes a percent-encoded UTF-8 string (for example "%E6%90%9C") into
  // the characters it represents, using plain bit arithmetic only.
  //
  // sUtf8PE: string that may contain "%xx" escapes.
  // Returns: the decoded string.
  //   - Well-formed 2-, 3- and 4-byte UTF-8 sequences become one character
  //     (a surrogate pair for code points above U+FFFF).
  //   - Any other "%xx" escape becomes the single character with that byte
  //     value, so ASCII escapes such as "%20" or "%25" decode as usual.
  //   - A "%" that is not followed by two hex digits is copied unchanged.
  // The string is scanned once from left to right, so text produced by a
  // decoded escape is never decoded a second time ("%2541" gives "%41").
  if(sUtf8PE.indexOf("%")===-1) return sUtf8PE; // nothing to decode

  var rHexPair = /^[0-9a-fA-F]{2}$/;

  // Byte value of the "%xx" escape starting at iAt, or -1 when there is no
  // well-formed escape at that position.
  function fByteAt(iAt)
  {
    if(sUtf8PE.charAt(iAt)!=="%") return -1;
    var sHex = sUtf8PE.slice(iAt+1, iAt+3);
    return rHexPair.test(sHex) ? parseInt(sHex, 16) : -1;
  }

  var aOut = [];
  var iLen = sUtf8PE.length;
  var iPos = 0;
  while(iPos<iLen)
  {
    var iLead = fByteAt(iPos);
    if(iLead===-1)
    { // ordinary character, or a "%" that does not start an escape
      aOut.push(sUtf8PE.charAt(iPos));
      iPos+=1;
      continue;
    }

    // The lead byte fixes how many continuation bytes must follow, which
    // payload bits it carries, and the smallest code point that is allowed
    // to use this length (shorter encodings are rejected as overlong).
    var iExtra = 0;
    var iCode = 0;
    var iMin = 0;
    if(iLead>=0xC0 && iLead<=0xDF)
    {
      iExtra = 1; iCode = iLead & 0x1F; iMin = 0x80;
    }
    else if(iLead>=0xE0 && iLead<=0xEF)
    {
      iExtra = 2; iCode = iLead & 0x0F; iMin = 0x800;
    }
    else if(iLead>=0xF0 && iLead<=0xF7)
    {
      iExtra = 3; iCode = iLead & 0x07; iMin = 0x10000;
    }

    // Each continuation byte must look like 10xxxxxx and adds six bits.
    var bValid = iExtra>0;
    for(var k=1; bValid && k<=iExtra; k++)
    {
      var iNext = fByteAt(iPos+3*k);
      if(iNext>=0x80 && iNext<=0xBF) iCode = (iCode<<6) | (iNext & 0x3F);
      else bValid = false;
    }
    if(bValid && (iCode<iMin || iCode>0x10FFFF)) bValid = false;

    if(!bValid)
    { // single byte (ASCII, or a stray high byte): decode this escape alone
      aOut.push(String.fromCharCode(iLead));
      iPos+=3;
    }
    else
    {
      if(iCode<=0xFFFF)
      {
        aOut.push(String.fromCharCode(iCode));
      }
      else
      { // beyond the BMP: emit a UTF-16 surrogate pair
        iCode-=0x10000;
        aOut.push(String.fromCharCode(0xD800+(iCode>>10), 0xDC00+(iCode & 0x3FF)));
      }
      iPos+=3*(iExtra+1);
    }
  } // end while(iPos<iLen)
  return aOut.join("");
} // end function fPEUtf8ToGb(sUtf8PE)
// PE = percent encoding
function fGetUtf8PE(sUtf8PE) // %xx%xx%xx
{ // shawl.qiu code, return string
  // Decodes ONE percent-encoded UTF-8 sequence into the character it encodes.
  //
  // sUtf8PE: a single sequence such as "%E6%90%9C". Sequences of one to four
  //          bytes are accepted ("%41", "%C3%A9", "%E6%90%9C", "%F0%9F%98%80").
  // Returns: the decoded character (a surrogate pair for code points above
  //          U+FFFF). Input that is not one well-formed sequence is returned
  //          unchanged.
  //
  // The code point is assembled with bit arithmetic and String.fromCharCode.
  // unescape("%u"+hex) is avoided because it needs exactly four hex digits,
  // so it left code points below U+1000 undecoded.
  var rHexPair = /^[0-9a-fA-F]{2}$/;
  var aHex = sUtf8PE.replace(/^%/, "").split("%");
  var iCount = aHex.length;
  var aByte = [];
  for(var i=0; i<iCount; i++)
  {
    if(!rHexPair.test(aHex[i])) return sUtf8PE; // not a "%xx" escape
    aByte.push(parseInt(aHex[i], 16));
  } // end for(var i=0; i<iCount; i++)

  // The lead byte must announce exactly as many bytes as were supplied;
  // its remaining low bits are the top bits of the code point.
  var iLead = aByte[0];
  var iCode;
  if(iCount===1 && iLead<0x80) return String.fromCharCode(iLead);
  if(iCount===2 && iLead>=0xC0 && iLead<=0xDF) iCode = iLead & 0x1F;
  else if(iCount===3 && iLead>=0xE0 && iLead<=0xEF) iCode = iLead & 0x0F;
  else if(iCount===4 && iLead>=0xF0 && iLead<=0xF7) iCode = iLead & 0x07;
  else return sUtf8PE;

  // Every following byte must look like 10xxxxxx and contributes six bits.
  for(var k=1; k<iCount; k++)
  {
    if(aByte[k]<0x80 || aByte[k]>0xBF) return sUtf8PE;
    iCode = (iCode<<6) | (aByte[k] & 0x3F);
  } // end for(var k=1; k<iCount; k++)

  if(iCode>0x10FFFF) return sUtf8PE; // outside the Unicode range
  if(iCode<=0xFFFF) return String.fromCharCode(iCode);
  iCode-=0x10000; // beyond the BMP: build a UTF-16 surrogate pair
  return String.fromCharCode(0xD800+(iCode>>10), 0xDC00+(iCode & 0x3FF));
} // end function fGetUtf8PE(sUtf8PE)
function fTestFunc(sMsg, Func)
{
  // Demo driver: encodes a few sample strings with Func, decodes the result
  // again with fPEUtf8ToGb, and writes all three forms into the page with
  // document.write so the round trip can be checked by eye.
  //
  // sMsg: heading shown (in bold) above the results, e.g. the encoder's name.
  // Func: encoder taking a string and returning its percent-encoded form
  //       (encodeURIComponent or encodeURI in this page).
  var aSample = [
    "搜",
    "1923809=-02343+|+|_l'kl'k中是; 苯胺中kj",
    // the embedded double quotes must be escaped to keep the literal intact
    ")_()_(*(**(&*&(:J:KJuyjsdfj7867813dj|_)_09-090///|_+)_}\"L\":<>j"
  ];

  // "\n" only breaks lines in the generated markup to keep it readable.
  document.write("<p/>"+sMsg.bold()+":<p/> \n");
  for(var i=0, j=aSample.length; i<j; i++)
  {
    var sEncoded = Func(aSample[i]);
    var sDecoded = fPEUtf8ToGb(sEncoded);
    document.write("Test String: "+aSample[i]+"<br/>\n");
    document.write(" Encoding: "+sEncoded+"<br/>\n");
    document.write("<p/> Decoding: "+sDecoded+"<hr/>\n\n");
    //----------------------------------
  } // end for(var i=0, j=aSample.length; i<j; i++)
}
/*]]>*/
</script>
</body>
</html>
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<title>shawl.qiu template </title>
<style type="text/css">
/* <![CDATA[ */
/* ]]> */
</style>
<script type="text/javascript">
/*<![CDATA[*/
// Maximise the browser window; applied to Microsoft Internet Explorer only.
if (navigator.appName === "Microsoft Internet Explorer")
{
  // Park the window just beyond the top-left corner of the screen ...
  self.moveTo(-5, -5);
  // ... and size it slightly past the available screen area, so the result
  // is in fact a little larger than a normally maximised window.
  self.resizeTo(screen.availWidth + 8, screen.availHeight + 8);
}
/*]]>*/
</script>
</head>
<body>
<script type="text/javascript">
/*<![CDATA[*/
// Run the round-trip demo once for each built-in encoder. The work is wrapped
// in an immediately-invoked function so the loop variables stay local.
(function ()
{
  var aEncoder = [
    ["encodeURIComponent", encodeURIComponent],
    ["encodeURI", encodeURI]
  ];
  for (var iEnc = 0; iEnc < aEncoder.length; iEnc++)
  {
    fTestFunc(aEncoder[iEnc][0], aEncoder[iEnc][1]);
  }
})();
// PE = percent encoding
function fPEUtf8ToGb(sUtf8PE)
{ // shawl.qiu code, return string
  // Decodes a percent-encoded UTF-8 string (for example "%E6%90%9C") into
  // the characters it represents, using plain bit arithmetic only.
  //
  // sUtf8PE: string that may contain "%xx" escapes.
  // Returns: the decoded string.
  //   - Well-formed 2-, 3- and 4-byte UTF-8 sequences become one character
  //     (a surrogate pair for code points above U+FFFF).
  //   - Any other "%xx" escape becomes the single character with that byte
  //     value, so ASCII escapes such as "%20" or "%25" decode as usual.
  //   - A "%" that is not followed by two hex digits is copied unchanged.
  // The string is scanned once from left to right, so text produced by a
  // decoded escape is never decoded a second time ("%2541" gives "%41").
  if(sUtf8PE.indexOf("%")===-1) return sUtf8PE; // nothing to decode

  var rHexPair = /^[0-9a-fA-F]{2}$/;

  // Byte value of the "%xx" escape starting at iAt, or -1 when there is no
  // well-formed escape at that position.
  function fByteAt(iAt)
  {
    if(sUtf8PE.charAt(iAt)!=="%") return -1;
    var sHex = sUtf8PE.slice(iAt+1, iAt+3);
    return rHexPair.test(sHex) ? parseInt(sHex, 16) : -1;
  }

  var aOut = [];
  var iLen = sUtf8PE.length;
  var iPos = 0;
  while(iPos<iLen)
  {
    var iLead = fByteAt(iPos);
    if(iLead===-1)
    { // ordinary character, or a "%" that does not start an escape
      aOut.push(sUtf8PE.charAt(iPos));
      iPos+=1;
      continue;
    }

    // The lead byte fixes how many continuation bytes must follow, which
    // payload bits it carries, and the smallest code point that is allowed
    // to use this length (shorter encodings are rejected as overlong).
    var iExtra = 0;
    var iCode = 0;
    var iMin = 0;
    if(iLead>=0xC0 && iLead<=0xDF)
    {
      iExtra = 1; iCode = iLead & 0x1F; iMin = 0x80;
    }
    else if(iLead>=0xE0 && iLead<=0xEF)
    {
      iExtra = 2; iCode = iLead & 0x0F; iMin = 0x800;
    }
    else if(iLead>=0xF0 && iLead<=0xF7)
    {
      iExtra = 3; iCode = iLead & 0x07; iMin = 0x10000;
    }

    // Each continuation byte must look like 10xxxxxx and adds six bits.
    var bValid = iExtra>0;
    for(var k=1; bValid && k<=iExtra; k++)
    {
      var iNext = fByteAt(iPos+3*k);
      if(iNext>=0x80 && iNext<=0xBF) iCode = (iCode<<6) | (iNext & 0x3F);
      else bValid = false;
    }
    if(bValid && (iCode<iMin || iCode>0x10FFFF)) bValid = false;

    if(!bValid)
    { // single byte (ASCII, or a stray high byte): decode this escape alone
      aOut.push(String.fromCharCode(iLead));
      iPos+=3;
    }
    else
    {
      if(iCode<=0xFFFF)
      {
        aOut.push(String.fromCharCode(iCode));
      }
      else
      { // beyond the BMP: emit a UTF-16 surrogate pair
        iCode-=0x10000;
        aOut.push(String.fromCharCode(0xD800+(iCode>>10), 0xDC00+(iCode & 0x3FF)));
      }
      iPos+=3*(iExtra+1);
    }
  } // end while(iPos<iLen)
  return aOut.join("");
} // end function fPEUtf8ToGb(sUtf8PE)
// PE = percent encoding
function fGetUtf8PE(sUtf8PE) // %xx%xx%xx
{ // shawl.qiu code, return string
  // Decodes ONE percent-encoded UTF-8 sequence into the character it encodes.
  //
  // sUtf8PE: a single sequence such as "%E6%90%9C". Sequences of one to four
  //          bytes are accepted ("%41", "%C3%A9", "%E6%90%9C", "%F0%9F%98%80").
  // Returns: the decoded character (a surrogate pair for code points above
  //          U+FFFF). Input that is not one well-formed sequence is returned
  //          unchanged.
  //
  // The code point is assembled with bit arithmetic and String.fromCharCode.
  // unescape("%u"+hex) is avoided because it needs exactly four hex digits,
  // so it left code points below U+1000 undecoded.
  var rHexPair = /^[0-9a-fA-F]{2}$/;
  var aHex = sUtf8PE.replace(/^%/, "").split("%");
  var iCount = aHex.length;
  var aByte = [];
  for(var i=0; i<iCount; i++)
  {
    if(!rHexPair.test(aHex[i])) return sUtf8PE; // not a "%xx" escape
    aByte.push(parseInt(aHex[i], 16));
  } // end for(var i=0; i<iCount; i++)

  // The lead byte must announce exactly as many bytes as were supplied;
  // its remaining low bits are the top bits of the code point.
  var iLead = aByte[0];
  var iCode;
  if(iCount===1 && iLead<0x80) return String.fromCharCode(iLead);
  if(iCount===2 && iLead>=0xC0 && iLead<=0xDF) iCode = iLead & 0x1F;
  else if(iCount===3 && iLead>=0xE0 && iLead<=0xEF) iCode = iLead & 0x0F;
  else if(iCount===4 && iLead>=0xF0 && iLead<=0xF7) iCode = iLead & 0x07;
  else return sUtf8PE;

  // Every following byte must look like 10xxxxxx and contributes six bits.
  for(var k=1; k<iCount; k++)
  {
    if(aByte[k]<0x80 || aByte[k]>0xBF) return sUtf8PE;
    iCode = (iCode<<6) | (aByte[k] & 0x3F);
  } // end for(var k=1; k<iCount; k++)

  if(iCode>0x10FFFF) return sUtf8PE; // outside the Unicode range
  if(iCode<=0xFFFF) return String.fromCharCode(iCode);
  iCode-=0x10000; // beyond the BMP: build a UTF-16 surrogate pair
  return String.fromCharCode(0xD800+(iCode>>10), 0xDC00+(iCode & 0x3FF));
} // end function fGetUtf8PE(sUtf8PE)
function fTestFunc(sMsg, Func)
{
  // Demo driver: encodes a few sample strings with Func, decodes the result
  // again with fPEUtf8ToGb, and writes all three forms into the page with
  // document.write so the round trip can be checked by eye.
  //
  // sMsg: heading shown (in bold) above the results, e.g. the encoder's name.
  // Func: encoder taking a string and returning its percent-encoded form
  //       (encodeURIComponent or encodeURI in this page).
  var aSample = [
    "搜",
    "1923809=-02343+|+|_l'kl'k中是; 苯胺中kj",
    // the embedded double quotes must be escaped to keep the literal intact
    ")_()_(*(**(&*&(:J:KJuyjsdfj7867813dj|_)_09-090///|_+)_}\"L\":<>j"
  ];

  // "\n" only breaks lines in the generated markup to keep it readable.
  document.write("<p/>"+sMsg.bold()+":<p/> \n");
  for(var i=0, j=aSample.length; i<j; i++)
  {
    var sEncoded = Func(aSample[i]);
    var sDecoded = fPEUtf8ToGb(sEncoded);
    document.write("Test String: "+aSample[i]+"<br/>\n");
    document.write(" Encoding: "+sEncoded+"<br/>\n");
    document.write("<p/> Decoding: "+sDecoded+"<hr/>\n\n");
    //----------------------------------
  } // end for(var i=0, j=aSample.length; i<j; i++)
}
/*]]>*/
</script>
</body>
</html>