177 lines
5.0 KiB
Perl
177 lines
5.0 KiB
Perl
#
|
||
# $Id: H2Z.pm,v 2.2 2006/06/03 20:28:48 dankogai Exp $
|
||
#
|
||
|
||
package Encode::JP::H2Z;
|
||
|
||
use strict;
|
||
use warnings;
|
||
|
||
our $RCSID = q$Id: H2Z.pm,v 2.2 2006/06/03 20:28:48 dankogai Exp $;
|
||
our $VERSION = do { my @r = ( q$Revision: 2.2 $ =~ /\d+/g ); sprintf "%d." . "%02d" x $#r, @r };
|
||
|
||
use Encode::CJKConstants qw(:all);
|
||
|
||
use vars qw(%_D2Z $_PAT_D2Z
|
||
%_Z2D $_PAT_Z2D
|
||
%_H2Z $_PAT_H2Z
|
||
%_Z2H $_PAT_Z2H);
|
||
|
||
%_H2Z = (
|
||
"\x8e\xa1" => "\xa1\xa3", #。
|
||
"\x8e\xa2" => "\xa1\xd6", #「
|
||
"\x8e\xa3" => "\xa1\xd7", #」
|
||
"\x8e\xa4" => "\xa1\xa2", #、
|
||
"\x8e\xa5" => "\xa1\xa6", #・
|
||
"\x8e\xa6" => "\xa5\xf2", #ヲ
|
||
"\x8e\xa7" => "\xa5\xa1", #ァ
|
||
"\x8e\xa8" => "\xa5\xa3", #ィ
|
||
"\x8e\xa9" => "\xa5\xa5", #ゥ
|
||
"\x8e\xaa" => "\xa5\xa7", #ェ
|
||
"\x8e\xab" => "\xa5\xa9", #ォ
|
||
"\x8e\xac" => "\xa5\xe3", #ャ
|
||
"\x8e\xad" => "\xa5\xe5", #ュ
|
||
"\x8e\xae" => "\xa5\xe7", #ョ
|
||
"\x8e\xaf" => "\xa5\xc3", #ッ
|
||
"\x8e\xb0" => "\xa1\xbc", #ー
|
||
"\x8e\xb1" => "\xa5\xa2", #ア
|
||
"\x8e\xb2" => "\xa5\xa4", #イ
|
||
"\x8e\xb3" => "\xa5\xa6", #ウ
|
||
"\x8e\xb4" => "\xa5\xa8", #エ
|
||
"\x8e\xb5" => "\xa5\xaa", #オ
|
||
"\x8e\xb6" => "\xa5\xab", #カ
|
||
"\x8e\xb7" => "\xa5\xad", #キ
|
||
"\x8e\xb8" => "\xa5\xaf", #ク
|
||
"\x8e\xb9" => "\xa5\xb1", #ケ
|
||
"\x8e\xba" => "\xa5\xb3", #コ
|
||
"\x8e\xbb" => "\xa5\xb5", #サ
|
||
"\x8e\xbc" => "\xa5\xb7", #シ
|
||
"\x8e\xbd" => "\xa5\xb9", #ス
|
||
"\x8e\xbe" => "\xa5\xbb", #セ
|
||
"\x8e\xbf" => "\xa5\xbd", #ソ
|
||
"\x8e\xc0" => "\xa5\xbf", #タ
|
||
"\x8e\xc1" => "\xa5\xc1", #チ
|
||
"\x8e\xc2" => "\xa5\xc4", #ツ
|
||
"\x8e\xc3" => "\xa5\xc6", #テ
|
||
"\x8e\xc4" => "\xa5\xc8", #ト
|
||
"\x8e\xc5" => "\xa5\xca", #ナ
|
||
"\x8e\xc6" => "\xa5\xcb", #ニ
|
||
"\x8e\xc7" => "\xa5\xcc", #ヌ
|
||
"\x8e\xc8" => "\xa5\xcd", #ネ
|
||
"\x8e\xc9" => "\xa5\xce", #ノ
|
||
"\x8e\xca" => "\xa5\xcf", #ハ
|
||
"\x8e\xcb" => "\xa5\xd2", #ヒ
|
||
"\x8e\xcc" => "\xa5\xd5", #フ
|
||
"\x8e\xcd" => "\xa5\xd8", #ヘ
|
||
"\x8e\xce" => "\xa5\xdb", #ホ
|
||
"\x8e\xcf" => "\xa5\xde", #マ
|
||
"\x8e\xd0" => "\xa5\xdf", #ミ
|
||
"\x8e\xd1" => "\xa5\xe0", #ム
|
||
"\x8e\xd2" => "\xa5\xe1", #メ
|
||
"\x8e\xd3" => "\xa5\xe2", #モ
|
||
"\x8e\xd4" => "\xa5\xe4", #ヤ
|
||
"\x8e\xd5" => "\xa5\xe6", #ユ
|
||
"\x8e\xd6" => "\xa5\xe8", #ヨ
|
||
"\x8e\xd7" => "\xa5\xe9", #ラ
|
||
"\x8e\xd8" => "\xa5\xea", #リ
|
||
"\x8e\xd9" => "\xa5\xeb", #ル
|
||
"\x8e\xda" => "\xa5\xec", #レ
|
||
"\x8e\xdb" => "\xa5\xed", #ロ
|
||
"\x8e\xdc" => "\xa5\xef", #ワ
|
||
"\x8e\xdd" => "\xa5\xf3", #ン
|
||
"\x8e\xde" => "\xa1\xab", #゛
|
||
"\x8e\xdf" => "\xa1\xac", #゜
|
||
);
|
||
|
||
%_D2Z = (
|
||
"\x8e\xb6\x8e\xde" => "\xa5\xac", #ガ
|
||
"\x8e\xb7\x8e\xde" => "\xa5\xae", #ギ
|
||
"\x8e\xb8\x8e\xde" => "\xa5\xb0", #グ
|
||
"\x8e\xb9\x8e\xde" => "\xa5\xb2", #ゲ
|
||
"\x8e\xba\x8e\xde" => "\xa5\xb4", #ゴ
|
||
"\x8e\xbb\x8e\xde" => "\xa5\xb6", #ザ
|
||
"\x8e\xbc\x8e\xde" => "\xa5\xb8", #ジ
|
||
"\x8e\xbd\x8e\xde" => "\xa5\xba", #ズ
|
||
"\x8e\xbe\x8e\xde" => "\xa5\xbc", #ゼ
|
||
"\x8e\xbf\x8e\xde" => "\xa5\xbe", #ゾ
|
||
"\x8e\xc0\x8e\xde" => "\xa5\xc0", #ダ
|
||
"\x8e\xc1\x8e\xde" => "\xa5\xc2", #ヂ
|
||
"\x8e\xc2\x8e\xde" => "\xa5\xc5", #ヅ
|
||
"\x8e\xc3\x8e\xde" => "\xa5\xc7", #デ
|
||
"\x8e\xc4\x8e\xde" => "\xa5\xc9", #ド
|
||
"\x8e\xca\x8e\xde" => "\xa5\xd0", #バ
|
||
"\x8e\xcb\x8e\xde" => "\xa5\xd3", #ビ
|
||
"\x8e\xcc\x8e\xde" => "\xa5\xd6", #ブ
|
||
"\x8e\xcd\x8e\xde" => "\xa5\xd9", #ベ
|
||
"\x8e\xce\x8e\xde" => "\xa5\xdc", #ボ
|
||
"\x8e\xca\x8e\xdf" => "\xa5\xd1", #パ
|
||
"\x8e\xcb\x8e\xdf" => "\xa5\xd4", #ピ
|
||
"\x8e\xcc\x8e\xdf" => "\xa5\xd7", #プ
|
||
"\x8e\xcd\x8e\xdf" => "\xa5\xda", #ペ
|
||
"\x8e\xce\x8e\xdf" => "\xa5\xdd", #ポ
|
||
"\x8e\xb3\x8e\xde" => "\xa5\xf4", #ヴ
|
||
);
|
||
|
||
# init only once;
|
||
|
||
#$_PAT_D2Z = join("|", keys %_D2Z);
|
||
#$_PAT_H2Z = join("|", keys %_H2Z);
|
||
|
||
%_Z2H = reverse %_H2Z;
|
||
%_Z2D = reverse %_D2Z;
|
||
|
||
#$_PAT_Z2H = join("|", keys %_Z2H);
|
||
#$_PAT_Z2D = join("|", keys %_Z2D);
|
||
|
||
sub h2z {
|
||
no warnings qw(uninitialized);
|
||
my $r_str = shift;
|
||
my ($keep_dakuten) = @_;
|
||
my $n = 0;
|
||
unless ($keep_dakuten) {
|
||
$n = (
|
||
$$r_str =~ s(
|
||
($RE{EUC_KANA}
|
||
(?:\x8e[\xde\xdf])?)
|
||
){
|
||
my $str = $1;
|
||
$_D2Z{$str} || $_H2Z{$str} ||
|
||
# in case dakuten and handakuten are side-by-side!
|
||
$_H2Z{substr($str,0,2)} . $_H2Z{substr($str,2,2)};
|
||
}eogx
|
||
);
|
||
}
|
||
else {
|
||
$n = (
|
||
$$r_str =~ s(
|
||
($RE{EUC_KANA})
|
||
){
|
||
$_H2Z{$1};
|
||
}eogx
|
||
);
|
||
}
|
||
$n;
|
||
}
|
||
|
||
sub z2h {
|
||
my $r_str = shift;
|
||
my $n = (
|
||
$$r_str =~ s(
|
||
($RE{EUC_C}|$RE{EUC_0212}|$RE{EUC_KANA})
|
||
){
|
||
$_Z2D{$1} || $_Z2H{$1} || $1;
|
||
}eogx
|
||
);
|
||
$n;
|
||
}
|
||
|
||
1;
|
||
__END__
|
||
|
||
|
||
=head1 NAME
|
||
|
||
Encode::JP::H2Z -- internally used by Encode::JP::2022_JP*
|
||
|
||
=cut
|