⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 encoding.t

📁 source of perl for linux application,
💻 T
字号:
#!./perl -wBEGIN {    chdir 't' if -d 't';    @INC = '../lib';    no warnings; # Need global -w flag for later tests, but don't want this    # to warn here:    push @INC, "::lib:$MacPerl::Architecture:" if $^O eq 'MacOS';    unless (find PerlIO::Layer 'perlio') {	print "1..0 # Skip: not perlio\n";	exit 0;    }    unless (eval { require Encode } ) {	print "1..0 # Skip: not Encode\n";	exit 0;    }}print "1..15\n";my $grk = "grk$$";my $utf = "utf$$";my $fail1 = "fa$$";my $fail2 = "fb$$";my $russki = "koi8r$$";my $threebyte = "3byte$$";if (open(GRK, ">$grk")) {    binmode(GRK, ":bytes");    # alpha beta gamma in ISO 8859-7    print GRK "\xe1\xe2\xe3";    close GRK or die "Could not close: $!";}{    open(my $i,'<:encoding(iso-8859-7)',$grk);    print "ok 1\n";    open(my $o,'>:utf8',$utf);    print "ok 2\n";    print $o readline($i);    print "ok 3\n";    close($o) or die "Could not close: $!";    close($i);}if (open(UTF, "<$utf")) {    binmode(UTF, ":bytes");    if (ord('A') == 193) { # EBCDIC	# alpha beta gamma in UTF-EBCDIC Unicode (0x3b1 0x3b2 0x3b3)	print "not " unless <UTF> eq "\xb4\x58\xb4\x59\xb4\x62";    } else {	# alpha beta gamma in UTF-8 Unicode (0x3b1 0x3b2 0x3b3)	print "not " unless <UTF> eq "\xce\xb1\xce\xb2\xce\xb3";    }    print "ok 4\n";    close UTF;}{    use Encode;    open(my $i,'<:utf8',$utf);    print "ok 5\n";    open(my $o,'>:encoding(iso-8859-7)',$grk);    print "ok 6\n";    print $o readline($i);    print "ok 7\n";    close($o) or die "Could not close: $!";    close($i);}if (open(GRK, "<$grk")) {    binmode(GRK, ":bytes");    print "not " unless <GRK> eq "\xe1\xe2\xe3";    print "ok 8\n";    close GRK;}$SIG{__WARN__} = sub {$warn .= $_[0]};if (open(FAIL, ">:encoding(NoneSuch)", $fail1)) {    print "not ok 9 # Open should fail\n";} else {    print "ok 9\n";}if (!defined $warn) {    print "not ok 10 # warning is undef\n";} elsif ($warn =~ /^Cannot find encoding "NoneSuch" at/) {    print "ok 10\n";} else {    print "not ok 10 # warning is '$warn'";}if (open(RUSSKI, ">$russki")) {    print RUSSKI "\x3c\x3f\x78";    close RUSSKI or die "Could not close: $!";    open(RUSSKI, "$russki");    binmode(RUSSKI, ":raw");    my $buf1;    read(RUSSKI, $buf1, 1);    # eof(RUSSKI);    binmode(RUSSKI, ":encoding(koi8-r)");    my $buf2;    read(RUSSKI, $buf2, 1);    my $offset = tell(RUSSKI);    if (ord($buf1) == 0x3c &&	ord($buf2) == (ord('A') == 193) ? 0x6f : 0x3f &&	$offset == 2) {	print "ok 11\n";    } else {	printf "not ok 11 # [%s] [%s] %d\n",	       join(" ", unpack("H*", $buf1)),	       join(" ", unpack("H*", $buf2)), $offset;    }    close(RUSSKI);} else {    print "not ok 11 # open failed: $!\n";}undef $warn;# Check there is no Use of uninitialized value in concatenation (.) warning# due to the way @latin2iso_num was used to make aliases.if (open(FAIL, ">:encoding(latin42)", $fail2)) {    print "not ok 12 # Open should fail\n";} else {    print "ok 12\n";}if (!defined $warn) {    print "not ok 13 # warning is undef\n";} elsif ($warn =~ /^Cannot find encoding "latin42" at.*line \d+\.$/) {    print "ok 13\n";} else {    print "not ok 13 # warning is: \n";    $warn =~ s/^/# /mg;    print "$warn";}# Create a string of chars that are 3 bytes in UTF-8 my $str = "\x{1f80}" x 2048;# Write them to a fileopen(F,'>:utf8',$threebyte) || die "Cannot open $threebyte:$!";print F $str;close(F);# Read file back as UTF-8 open(F,'<:encoding(utf-8)',$threebyte) || die "Cannot open $threebyte:$!";my $dstr = <F>;close(F);print "not " unless ($dstr eq $str);print "ok 14\n";# Try decoding some bad stuffopen(F,'>:raw',$threebyte) || die "Cannot open $threebyte:$!";if (ord('A') == 193) { # EBCDIC    print F "foo\x8c\x80\x80\x80bar\n\x80foo\n";} else {    print F "foo\xF0\x80\x80\x80bar\n\x80foo\n";}close(F);open(F,'<:encoding(utf-8)',$threebyte) || die "Cannot open $threebyte:$!";$dstr = join(":", <F>);close(F);if (ord('A') == 193) { # EBCDIC    print "not " unless $dstr eq "foo\\x8C\\x80\\x80\\x80bar\n:\\x80foo\n";} else {    print "not " unless $dstr eq "foo\\xF0\\x80\\x80\\x80bar\n:\\x80foo\n";}print "ok 15\n";END {    1 while unlink($grk, $utf, $fail1, $fail2, $russki, $threebyte);}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -