PERLCN(1) Perl Programmers Reference Guide PERLCN(1)
NAME
perlcn - 简体中文 Perl 指南
DESCRIPTION
欢迎来到 Perl 的天地!
从 5.8.0 版开始, Perl 具备了完善的 Unicode (统一码) 支援,
也连带支援了许多拉丁语系以外的编码方式; CJK (中日韩)
便是其中的一部份. Unicode 是国际性的标准, 试图涵
盖世界上所有的字符: 西方世界, 东方世界,
以及两者间的一切 (希腊文, 叙利亚文, 亚拉伯文, 希伯来文,
印度文, 印地安文, 等等). 它也容纳了多种作业系统与平台 (如 PC
及麦金塔).
Perl 本身以 Unicode 进行操作. 这表示 Perl
内部的字符串数据可用 Unicode 表示; Perl 的函式与算符
(例如正规表示式比对) 也能对 Unicode 进行操作.
在输入及输出时, 为了处理以 Unicode
之前的编码方式存放的数据, Perl 提供了 Encode 这个模块,
可以让你轻易地读取及写入旧有的编码数据.
Encode 延伸模块支援下列简体中文的编码方式 ('gb2312' 表示
'euc-cn'):
euc-cn Unix 延伸字符集, 也就是俗称的国标码
gb2312-raw 未经处理的 (低比特) GB2312 字符表
gb12345 未经处理的中国用繁体中文编码
iso-ir-165 GB2312 + GB6345 + GB8565 + 新增字符
cp936 字码页 936, 也可以用 'GBK' (扩充国标码) 指明
hz 7 比特逸出式 GB2312 编码
举例来说, 将 EUC-CN 编码的档案转成 Unicode, 祗需键入下列指令:
perl -Mencoding=euc-cn,STDOUT,utf8 -pe1 < file.euc-cn > file.utf8
Perl 也内附了 "piconv", 一支完全以 Perl 写成的字符转换工具程序,
用法如下:
piconv -f euc-cn -t utf8 < file.euc-cn > file.utf8
piconv -f utf8 -t euc-cn < file.utf8 > file.euc-cn
另外, 利用 encoding 模块, 你可以轻易写出以字符为单位的程序码,
如下所示:
#!/usr/bin/env perl
# 启动 euc-cn 字串解析; 标准输出入及标准错误都设为 euc-cn 编码
use encoding 'euc-cn', STDIN => 'euc-cn', STDOUT => 'euc-cn';
print length("骆驼"); # 2 (双引号表示字符)
print length('骆驼'); # 4 (单引号表示字节)
print index("谆谆教诲", "蛔唤"); # -1 (不包含此子字符串)
print index('谆谆教诲', '蛔唤'); # 1 (从第二个字节开始)
在最后一列例子里, "谆" 的第二个字节与 "谆"
的第一个字节结合成 EUC-CN 码的 "蛔"; "谆" 的第二个字节则与
"教" 的第一个字节结合成 "唤". 这解决了以前 EUC-CN
码比对处理上常见的问题.
额外的中文编码
如果需要更多的中文编码, 可以从 CPAN (http://www.cpan.org/) 下载
Encode::HanExtra 模块. 它目前提供下列编码方式:
gb18030 扩充过的国标码, 包含繁体中文
另外, Encode::HanConvert 模块则提供了简繁转换用的两种编码:
big5-simp Big5 繁体中文与 Unicode 简体中文互转
gbk-trad GBK 简体中文与 Unicode 繁体中文互转
若想在 GBK 与 Big5 之间互转, 请参考该模块内附的 b2g.pl 与
g2b.pl 两支程序, 或在程序内使用下列写法:
use Encode::HanConvert;
$euccn = big5_to_gb($big5); # 从 Big5 转为 GBK
$big5 = gb_to_big5($euccn); # 从 GBK 转为 Big5
进一步的信息
请参考 Perl 内附的大量说明文件 (不幸全是用英文写的),
来学习更多关于 Perl 的知识, 以及 Unicode 的使用方式. 不过,
外部的资源相当丰富:
提供 Perl 资源的网址
Perl 的首页 (由欧莱礼公司维护)
Perl 综合典藏网 (Comprehensive Perl Archive Network)
Perl 邮递论坛一览
学习 Perl 的网址
简体中文版的欧莱礼 Perl 书籍
Perl 使用者集会
中国 Perl 推广组一览
Unicode 相关网址
Unicode 学术学会 (Unicode 标准的制定者)
Unix/Linux 上的 UTF-8 及 Unicode 答客问
SEE ALSO
Encode, Encode::CN, encoding, perluniintro, perlunicode
AUTHORS
Jarkko Hietaniemi
Autrijus Tang (唐宗汉)
perl v5.8.6 2004-11-05 PERLCN(1)
|