网络编程 
首页 > 网络编程 > 浏览文章

utf-8编码转换成gb2312

(编辑:jimmy 日期: 2024/11/16 浏览:3 次 )
[code]<script>  
function  chinesefromutf8url(strutf8)    
{  
           var  bstr  =  "";  
           var  noffset  =  0; 
 //  processing  point  on  strutf8               
           if(  strutf8  ==  ""  )  
               return  "";                 
           strutf8  =  strutf8.tolowercase();  
           noffset  =  strutf8.indexof("%e");  
           if(  noffset  ==  -1  )  
               return  strutf8;  

           while(  noffset  !=  -1  )  
           {  
               bstr  +=  strutf8.substr(0,  noffset);  
               strutf8  =  strutf8.substr(noffset,  strutf8.length  -  noffset);  
               if(  strutf8  ==  ""    ¦  ¦  strutf8.length  <  9  )      //  bad  string  
                   return  bstr;  

               bstr  +=  utf8codetochinesechar(strutf8.substr(0,  9));  
               strutf8  =  strutf8.substr(9,  strutf8.length  -  9);  
               noffset  =  strutf8.indexof("%e");  
           }  

           return  bstr  +  strutf8;  
}  

function  unicodefromutf8(strutf8)    
{  
           var  bstr  =  "";  
           var  ntotalchars  =  strutf8.length;            //  total  chars  to  be  processed.  
           var  noffset  =  0;                                                            //  processing  point  on  strutf8  
           var  nremainingbytes  =  ntotalchars;            //  how  many  bytes  left  to  be  converted  
           var  noutputposition  =  0;  
           var  icode,  icode1,  icode2;                                    //  the  value  of  the  unicode.  

           while  (noffset  <  ntotalchars)  
           {  
                       icode  =  strutf8.charcodeat(noffset);  
                       if  ((icode  &  0x80)  ==  0)                                    //  1  byte.  
                       {  
                                   if  (  nremainingbytes  <  1  )                        //  not  enough  data  
                                               break;  

                                   bstr  +=  string.fromcharcode(icode  &  0x7f);  
                                   noffset  ++;  
                                   nremainingbytes  -=  1;  
                       }  
                       else  if  ((icode  &  0xe0)  ==  0xc0)            //  2  bytes  
                       {  
                                   icode1  =    strutf8.charcodeat(noffset  +  1);  
                                   if  (  nremainingbytes  <  2    ¦  ¦                                    //  not  enough  data  
                                                 (icode1  &  0xc0)  !=  0x80  )                        //  invalid  pattern  
                                   {  
                                               break;  
                                   }  

                                   bstr  +=  string.fromcharcode(((icode  &  0x3f)  <<  6)    ¦  (              icode1  &  0x3f));  
                                   noffset  +=  2;  
                                   nremainingbytes  -=  2;  
                       }  
                       else  if  ((icode  &  0xf0)  ==  0xe0)            //  3  bytes  
                       {  
                                   icode1  =    strutf8.charcodeat(noffset  +  1);  
                                   icode2  =    strutf8.charcodeat(noffset  +  2);  
                                   if  (  nremainingbytes  <  3    ¦  ¦                                    //  not  enough  data  
                                                 (icode1  &  0xc0)  !=  0x80    ¦  ¦                        //  invalid  pattern  
                                                 (icode2  &  0xc0)  !=  0x80  )  
                                   {  
                                               break;  
                                   }  

                                   bstr  +=  string.fromcharcode(((icode  &  0x0f)  <<  12)    ¦    
                                                           ((icode1  &  0x3f)  <<    6)    ¦  
                                                           (icode2  &  0x3f));  
                                   noffset  +=  3;  
                                   nremainingbytes  -=  3;  
                       }  
                       else                                                                                                //  4  or  more  bytes  --  unsupported  
                                   break;  
           }  

           if  (nremainingbytes  !=  0)  
           {  
                       //  bad  utf8  string.  
                       return  "";  
           }  

           return  bstr;  
}  

function  utf8codetochinesechar(strutf8)  
{  
   var  icode,  icode1,  icode2;  
   icode  =  parseint("0x"  +  strutf8.substr(1,  2));  
   icode1  =  parseint("0x"  +  strutf8.substr(4,  2));  
   icode2  =  parseint("0x"  +  strutf8.substr(7,  2));  

   return  string.fromcharcode(((icode  &  0x0f)  <<  12)    ¦    
                                                           ((icode1  &  0x3f)  <<    6)    ¦  
                                                           (icode2  &  0x3f));  
}  
alert(chinesefromutf8url("%e6%b5%8b%e8%af%95"))  
</script>[code]
上一篇:Utf-8和Gb2312乱码问题的终结
下一篇:UTF-8编码第1/2页
一句话新闻
微软与英特尔等合作伙伴联合定义“AI PC”:键盘需配有Copilot物理按键
几个月来,英特尔、微软、AMD和其它厂商都在共同推动“AI PC”的想法,朝着更多的AI功能迈进。在近日,英特尔在台北举行的开发者活动中,也宣布了关于AI PC加速计划、新的PC开发者计划和独立硬件供应商计划。
在此次发布会上,英特尔还发布了全新的全新的酷睿Ultra Meteor Lake NUC开发套件,以及联合微软等合作伙伴联合定义“AI PC”的定义标准。