Unicode::Japanese::JA(3pm) User Contributed Perl Documentation Unicode::Japanese::JA(3pm)
NAME
Unicode::Japanese::JA - Japanese character encoding conversion (Japanese-language documentation)
use Unicode::Japanese;
use Unicode::Japanese qw(unijp);
# convert utf8 -> sjis
print Unicode::Japanese->new($str)->sjis;
print unijp($str)->sjis; # same as above.
# convert sjis -> utf8
print Unicode::Japanese->new($str,'sjis')->get;
# convert sjis (imode_EMOJI) -> utf8
print Unicode::Japanese->new($str,'sjis-imode')->get;
# convert zenkaku (utf8) -> hankaku (utf8)
print Unicode::Japanese->new($str)->z2h->get;
Unicode::Japanese
o Unicode::Japanese UTF-8
o XS / XS No-XS (Japanese.pm )
o
o (DoCoMo i-mode, KDDI AU, Softbank Mobile, ASTEL dot-i) Unicode DB
o
o SJIS MS-CP932 Unicode
o Unicode -> SJISEUC-JP/JIS SJIS &#dddd; Unicode '?'. , , '?'.
o Perl-5.8.0 , utf8 . utf-8 `' utf8() , utf-8 `' getu() .
get() utf-8 `' ().
sjis(), jis(), utf8(), etc.. . new, set, getcode , utf8-flaged/bytes .
o perl 5.10.x, 5.8.x, etc. (5.004 ).
o (OK) C . XS Pure Perl . C , Unicode::Japanese Pure Perl .
o (OK) Test.pm Test::More.
.
$s = Unicode::Japanese->new($str [, $icode [, $encode]])
Unicode::Japanese
"set"
$s = unijp($str [, $icode [, $encode]])
Unicode::Japanese->new(...) .
$s->set($str [, $icode [, $encode]])
$str:
$icode: 'utf8'
$encode:
UTF-8
:
auto
utf8 ucs2 ucs4
utf16-be utf16-le utf16
utf32-be utf32-le utf32
sjis cp932 euc euc-jp jis
sjis-imode sjis-imode1 sjis-imode2
utf8-imode utf8-imode1 utf8-imode2
sjis-doti sjis-doti1
sjis-jsky sjis-jsky1 sjis-jsky2
jis-jsky jis-jsky1 jis-jsky2
utf8-jsky utf8-jsky1 utf8-jsky2
sjis-au sjis-au1 sjis-au2
jis-au jis-au1 jis-au2
sjis-icon-au sjis-icon-au1 sjis-icon-au2
euc-icon-au euc-icon-au1 euc-icon-au2
jis-icon-au jis-icon-au1 jis-icon-au2
utf8-icon-au utf8-icon-au1 utf8-icon-au2
ascii binary
( .)
'auto' 'auto' getcode()
'base64' base64 base64 Unicode::Japanese
'binary'
sjis-imode, sjis-doti &#dddd;
sjis, utf8 sjis sjis-au, sjis-doti sjis-au
$str = $s->get
$str: (UTF-8)
UTF-8
`' , .
utf8() , getu() .
$str = $s->getu
$str: (UTF-8)
UTF-8
Perl-5.8.0 , utf-8 utf-8 .
$code = $s->getcode($str)
$str:
$code:
($str)
, ,
(PurePerl)
1. UTF-32 BOM utf32
2. UTF-16 BOM utf16
3. UTF-32BE utf32-be
4. UTF-32LE utf32-le
5. ESC 8 ascii ESC ASCII (0x00-0x1F 0x7F) ascii
6. JIS jis
7. J-PHONE sjis-jsky
8. EUC-JP euc
9. SJIS sjis
10. SJIS au sjis-au
11. SJIS i-mode sjis-imode
12. SJIS dot-i sjis-doti
13. UTF-8 utf8
14. unknown
(XS)
1. UTF-32 BOM utf32
2. UTF-16 BOM utf16
3. , .
ascii / euc / sjis / jis / utf8 / utf32-be / utf32-le / sjis-jsky / sjis-imode /
sjis-au / sjis-doti
4. , , .
utf32-be / utf32-le / ascii / jis / euc / sjis / sjis-jsky / sjis-imode / sjis-au
/ sjis-doti / utf8
5. unknown
o UTF-8 SJIS
o UCS2
o UTF-16 BOM
o
&#dddd;
XSPurePerl, , . , sjis, PurePerlsjis XS. sjis-jsky. , , euc-jp, .
$code = $s->getcodelist($str)
$str:
$code:
($str)
getcode , .
$str = $s->conv($ocode, $encode)
$ocode: ()
utf8 ucs2 ucs4 utf16
sjis cp932 euc euc-jp jis
sjis-imode sjis-imode1 sjis-imode2
utf8-imode utf8-imode1 utf8-imode2
sjis-doti sjis-doti1
sjis-jsky sjis-jsky1 sjis-jsky2
jis-jsky jis-jsky1 jis-jsky2
utf8-jsky utf8-jsky1 utf8-jsky2
sjis-au sjis-au1 sjis-au2
jis-au jis-au1 jis-au2
sjis-icon-au sjis-icon-au1 sjis-icon-au2
euc-icon-au euc-icon-au1 euc-icon-au2
jis-icon-au jis-icon-au1 jis-icon-au2
utf8-icon-au utf8-icon-au1 utf8-icon-au2
binary
( .)
$encode:
$str:
'base64' base64 base64
perl-5.8.0 , utf-8 .
$s->tag2bin
&#dddd;
$s->z2h
$s->h2z
$s->hira2kata
$s->kata2hira
$str = $s->jis
$str: JIS
JIS (ISO-2022-JP)
$str = $s->euc
$str: euc-jp
EUC-JP
$str = $s->utf8
$str: utf-8
UTF-8
perl-5.8.0 , .
$str = $s->ucs2
$str: ucs2
UCS2
$str = $s->ucs4
$str: ucs4
UCS4
$str = $s->utf16
$str: utf-16
UTF-16 BOM
$str = $s->sjis
$str: sjis
SJIS (MS-CP932)
$str = $s->sjis_imode
$str: sjis/imode
i-mode SJIS imode.
$str = $s->sjis_imode1
$str: sjis/imode
i-mode SJIS .
$str = $s->sjis_imode2
$str: sjis/imode
i-mode SJIS , .
$str = $s->sjis_doti
$str: sjis/dot-i
dot-i SJIS
$str = $s->sjis_jsky
$str: sjis/j-sky
j-sky SJIS j-sky(VERSION 0.15 , jsky2).
$str = $s->sjis_jsky1
$str: sjis/j-sky
j-sky SJIS Page 13 .
$str = $s->sjis_jsky2
$str: sjis/j-sky
j-sky SJIS Page 16 .
$str = $s->sjis_icon_au
$str: sjis/AU icon
AU SJIS
$str_arrayref = $s->strcut($len)
$len: ()
$str_arrayref:
$len()
, utf-8 utf-8.
$len = $s->strlen
$len:
UTF-8 length() 3 SJIS 2
$s->join_csv(@values);
@values:
CSV ("\n")
@values = $s->split_csv;
@values:
CSV ("\n")
binary utf-8 . binary .
+---------------+----+-----+-------+
|encoding | in | out | guess |
+---------------+----+-----+-------+
|auto : OK : -- | ----- |
+---------------+----+-----+-------+
|utf8 : OK : OK | OK |
|ucs2 : OK : OK | ----- |
|ucs4 : OK : OK | ----- |
|utf16-be : OK : -- | ----- |
|utf16-le : OK : -- | ----- |
|utf16 : OK : OK | OK(#) |
|utf32-be : OK : -- | OK |
|utf32-le : OK : -- | OK |
|utf32 : OK : -- | OK(#) |
+---------------+----+-----+-------+
|sjis : OK : OK | OK |
|cp932 : OK : OK | ----- |
|euc : OK : OK | OK |
|euc-jp : OK : OK | ----- |
|jis : OK : OK | OK |
+---------------+----+-----+-------+
|sjis-imode : OK : OK | OK |
|sjis-imode1 : OK : OK | ----- |
|sjis-imode2 : OK : OK | ----- |
|utf8-imode : OK : OK | ----- |
|utf8-imode1 : OK : OK | ----- |
|utf8-imode2 : OK : OK | ----- |
+---------------+----+-----+-------+
|sjis-doti : OK : OK | OK |
|sjis-doti1 : OK : OK | ----- |
+---------------+----+-----+-------+
|sjis-jsky : OK : OK | OK |
|sjis-jsky1 : OK : OK | ----- |
|sjis-jsky2 : OK : OK | ----- |
|jis-jsky : OK : OK | ----- |
|jis-jsky1 : OK : OK | ----- |
|jis-jsky2 : OK : OK | ----- |
|utf8-jsky : OK : OK | ----- |
|utf8-jsky1 : OK : OK | ----- |
|utf8-jsky2 : OK : OK | ----- |
+---------------+----+-----+-------+
|sjis-au : OK : OK | OK |
|sjis-au1 : OK : OK | ----- |
|sjis-au2 : OK : OK | ----- |
|jis-au : OK : OK | ----- |
|jis-au1 : OK : OK | ----- |
|jis-au2 : OK : OK | ----- |
|sjis-icon-au : OK : OK | ----- |
|sjis-icon-au1 : OK : OK | ----- |
|sjis-icon-au2 : OK : OK | ----- |
|euc-icon-au : OK : OK | ----- |
|euc-icon-au1 : OK : OK | ----- |
|euc-icon-au2 : OK : OK | ----- |
|jis-icon-au : OK : OK | ----- |
|jis-icon-au1 : OK : OK | ----- |
|jis-icon-au2 : OK : OK | ----- |
|utf8-icon-au : OK : OK | ----- |
|utf8-icon-au1 : OK : OK | ----- |
|utf8-icon-au2 : OK : OK | ----- |
+---------------+----+-----+-------+
|ascii : OK : -- | OK |
|binary : OK : OK | ----- |
+---------------+----+-----+-------+
(#): guessed when it has bom.
1. utf32 (#)
2. utf16 (#)
3. utf32-be
4. utf32-le
5. ascii
6. jis
7. sjis-jsky (pp)
8. euc
9. sjis
10. sjis-jsky (xs)
11. sjis-au
12. sjis-imode
13. sjis-doti
14. utf8
15. unknown
DESCRIPTION OF UNICODE MAPPING
Unicode
Shift_JIS
MS-CP932 Unicode URL
<ftp://ftp.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/WINDOWS/CP932.TXT>
Unicode SJIS &#dddd; ?
SJIS ?
EUC-JP/ISO-2022-JP
SJISUnicode SJIS
DoCoMo i-mode
F800 - F9FF U+0FF800 - U+0FF9FF
ASTEL dot-i
F000 - F4FF U+0FF000 - U+0FF4FF
J-PHONE J-SKY
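A J-SKY emoji sequence is "\e\$", then byte 1, then one or more byte 2 values, then "\x0f"; when consecutive emoji share the same byte 1, only their byte 2 values need to be written.
Treating each byte 1 / byte 2 pair as 1 character, 4500 - 47FF is mapped to U+0FFB00 - U+0FFDFF.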
Unicode::Japanese Unicode J-SKY 1
AU
U+0FF500 - U+0FF6FF
PurePerl mode
use Unicode::Japanese qw(PurePerl);
use 'PurePerl' , XS.
"bug-unicode-japanese at rt.cpan.org" .
<http://rt.cpan.org/NoAuth/ReportBug.html?Queue=Unicode-Japanese>. web . , .
o EUC-JPJIS SJIS UTF-8 SJIS
o XSEUC-JPSJIS() \e EUC-JPSJIS
o Japanese.pm FTP ASCII
perldoc .
perldoc Unicode::Japanese
, :
o AnnoCPAN: Annotated CPAN documentation
<http://annocpan.org/dist/Unicode-Japanese>
o CPAN Ratings
<http://cpanratings.perl.org/d/Unicode-Japanese>
o RT: CPAN's request tracker
<http://rt.cpan.org/NoAuth/Bugs.html?Dist=Unicode-Japanese>
o Search CPAN
<http://search.cpan.org/dist/Unicode-Japanese>
CREDITS
Thanks very much to:
NAKAYAMA Nao
SUGIURA Tatsuki & Debian JP Project
Copyright 2001-2008 SANO Taku (SAWATARI Mikage) and YAMASHINA Hio, all rights reserved.
Perl .
perl v5.34.0 2022-02-06 Unicode::Japanese::JA(3pm)
Generated by $Id: phpMan.php,v 4.55 2007/09/05 04:42:51 chedong Exp $ Author: Che Dong
On Apache
Under GNU General Public License
2025-11-21 17:34 @216.73.216.164 CrawledBy Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; ClaudeBot/1.0; +claudebot@anthropic.com)