use utf8;
use Encode;
use URI::Escape;
# Unicode escape (%uXXXX) -> UTF-8 encoding, shown as uppercase hex.
$str = '%u6536';
# Swap every %uXXXX escape for the character at that code point.
$str =~ s{%u([0-9a-fA-F]{4})}{chr hex $1}ge;
# Serialize the character string into UTF-8 octets.
$str = Encode::encode('utf8', $str);
# Hex-dump the octets in uppercase, one line.
print uc(unpack 'H*', $str) . "\n";
# Unicode escape (%uXXXX) -> GB2312 encoding, shown as uppercase hex.
$str = '%u6536';
# Expand each %uXXXX escape into the character it names.
$str =~ s{%u([0-9a-fA-F]{4})}{chr(hex($1))}ge;
# Re-encode the character string as GB2312 octets.
$str = Encode::encode('gb2312', $str);
# Print the octets as one uppercase hex string.
my $gb2312_hex = unpack 'H*', $str;
print uc($gb2312_hex), "\n";
# Chinese text -> percent-escaped UTF-8 (uri_escape_utf8 encodes the
# characters as UTF-8 first, then escapes the resulting bytes).
my $str = '中文';
print uri_escape_utf8($str) . "\n";
# Percent-escaped UTF-8 -> Chinese text.
# Build the escaped form first, then reverse it; uri_unescape only undoes the
# %XX escapes, so what gets printed is the unescaped byte sequence.
my $utf8_str = uri_escape_utf8('中文');
printf "%s\n", uri_unescape($utf8_str);
# Chinese text -> Perl's Unicode code points, printed as lowercase hex.
# NOTE(review): with `use utf8` in effect the string literal assigned to $str
# is presumably already a character string, in which case this decode leaves
# it untouched -- confirm before removing the call.
utf8::decode($str);
# One element per character of $str.
@chars = split //, $str;
# Emit the code points space-separated on a single line. The original passed
# "\n" as an extra printf argument that the "%x " format never consumed, so no
# line break was ever written; terminate the line explicitly instead.
printf "%x ", ord($_) for @chars;
print "\n";
# 从中文得到标准unicode
$str = '中文';
map { print "\\u", sprintf( "%x", $_ ) ,"
perl 转化 utf8/unicode/gb2312
最新推荐文章于 2021-05-19 18:49:42 发布
这篇博客展示了如何使用Perl进行不同字符编码之间的转换,包括从Unicode到UTF8,从Unicode到GB2312,从中文到UTF8,从UTF8编码到中文,以及从中文到Perl Unicode码点和标准Unicode转义的转换。主要涉及的函数有`encode`、`uri_escape_utf8`、`uri_unescape`和正则表达式操作。
摘要由CSDN通过智能技术生成