Files
server/usr/lib/x86_64-linux-gnu/perl/5.38.2/Encode/JP/H2Z.pm
2026-01-07 20:52:11 +01:00

177 lines
5.0 KiB
Perl
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
#
# $Id: H2Z.pm,v 2.2 2006/06/03 20:28:48 dankogai Exp $
#
package Encode::JP::H2Z;
use strict;
use warnings;
our $RCSID = q$Id: H2Z.pm,v 2.2 2006/06/03 20:28:48 dankogai Exp $;
our $VERSION = do { my @r = ( q$Revision: 2.2 $ =~ /\d+/g ); sprintf "%d." . "%02d" x $#r, @r };
use Encode::CJKConstants qw(:all);
use vars qw(%_D2Z $_PAT_D2Z
%_Z2D $_PAT_Z2D
%_H2Z $_PAT_H2Z
%_Z2H $_PAT_Z2H);
%_H2Z = (
"\x8e\xa1" => "\xa1\xa3", #。
"\x8e\xa2" => "\xa1\xd6", #「
"\x8e\xa3" => "\xa1\xd7", #」
"\x8e\xa4" => "\xa1\xa2", #、
"\x8e\xa5" => "\xa1\xa6", #・
"\x8e\xa6" => "\xa5\xf2", #ヲ
"\x8e\xa7" => "\xa5\xa1", #ァ
"\x8e\xa8" => "\xa5\xa3", #ィ
"\x8e\xa9" => "\xa5\xa5", #ゥ
"\x8e\xaa" => "\xa5\xa7", #ェ
"\x8e\xab" => "\xa5\xa9", #ォ
"\x8e\xac" => "\xa5\xe3", #ャ
"\x8e\xad" => "\xa5\xe5", #ュ
"\x8e\xae" => "\xa5\xe7", #ョ
"\x8e\xaf" => "\xa5\xc3", #ッ
"\x8e\xb0" => "\xa1\xbc", #ー
"\x8e\xb1" => "\xa5\xa2", #ア
"\x8e\xb2" => "\xa5\xa4", #イ
"\x8e\xb3" => "\xa5\xa6", #ウ
"\x8e\xb4" => "\xa5\xa8", #エ
"\x8e\xb5" => "\xa5\xaa", #オ
"\x8e\xb6" => "\xa5\xab", #カ
"\x8e\xb7" => "\xa5\xad", #キ
"\x8e\xb8" => "\xa5\xaf", #ク
"\x8e\xb9" => "\xa5\xb1", #ケ
"\x8e\xba" => "\xa5\xb3", #コ
"\x8e\xbb" => "\xa5\xb5", #サ
"\x8e\xbc" => "\xa5\xb7", #シ
"\x8e\xbd" => "\xa5\xb9", #ス
"\x8e\xbe" => "\xa5\xbb", #セ
"\x8e\xbf" => "\xa5\xbd", #ソ
"\x8e\xc0" => "\xa5\xbf", #タ
"\x8e\xc1" => "\xa5\xc1", #チ
"\x8e\xc2" => "\xa5\xc4", #ツ
"\x8e\xc3" => "\xa5\xc6", #テ
"\x8e\xc4" => "\xa5\xc8", #ト
"\x8e\xc5" => "\xa5\xca", #ナ
"\x8e\xc6" => "\xa5\xcb", #ニ
"\x8e\xc7" => "\xa5\xcc", #ヌ
"\x8e\xc8" => "\xa5\xcd", #ネ
"\x8e\xc9" => "\xa5\xce", #
"\x8e\xca" => "\xa5\xcf", #ハ
"\x8e\xcb" => "\xa5\xd2", #ヒ
"\x8e\xcc" => "\xa5\xd5", #フ
"\x8e\xcd" => "\xa5\xd8", #ヘ
"\x8e\xce" => "\xa5\xdb", #ホ
"\x8e\xcf" => "\xa5\xde", #マ
"\x8e\xd0" => "\xa5\xdf", #ミ
"\x8e\xd1" => "\xa5\xe0", #ム
"\x8e\xd2" => "\xa5\xe1", #メ
"\x8e\xd3" => "\xa5\xe2", #モ
"\x8e\xd4" => "\xa5\xe4", #ヤ
"\x8e\xd5" => "\xa5\xe6", #ユ
"\x8e\xd6" => "\xa5\xe8", #ヨ
"\x8e\xd7" => "\xa5\xe9", #ラ
"\x8e\xd8" => "\xa5\xea", #リ
"\x8e\xd9" => "\xa5\xeb", #ル
"\x8e\xda" => "\xa5\xec", #レ
"\x8e\xdb" => "\xa5\xed", #ロ
"\x8e\xdc" => "\xa5\xef", #ワ
"\x8e\xdd" => "\xa5\xf3", #ン
"\x8e\xde" => "\xa1\xab", #゛
"\x8e\xdf" => "\xa1\xac", #゜
);
%_D2Z = (
"\x8e\xb6\x8e\xde" => "\xa5\xac", #ガ
"\x8e\xb7\x8e\xde" => "\xa5\xae", #ギ
"\x8e\xb8\x8e\xde" => "\xa5\xb0", #グ
"\x8e\xb9\x8e\xde" => "\xa5\xb2", #ゲ
"\x8e\xba\x8e\xde" => "\xa5\xb4", #ゴ
"\x8e\xbb\x8e\xde" => "\xa5\xb6", #ザ
"\x8e\xbc\x8e\xde" => "\xa5\xb8", #ジ
"\x8e\xbd\x8e\xde" => "\xa5\xba", #ズ
"\x8e\xbe\x8e\xde" => "\xa5\xbc", #ゼ
"\x8e\xbf\x8e\xde" => "\xa5\xbe", #ゾ
"\x8e\xc0\x8e\xde" => "\xa5\xc0", #ダ
"\x8e\xc1\x8e\xde" => "\xa5\xc2", #ヂ
"\x8e\xc2\x8e\xde" => "\xa5\xc5", #ヅ
"\x8e\xc3\x8e\xde" => "\xa5\xc7", #デ
"\x8e\xc4\x8e\xde" => "\xa5\xc9", #ド
"\x8e\xca\x8e\xde" => "\xa5\xd0", #バ
"\x8e\xcb\x8e\xde" => "\xa5\xd3", #ビ
"\x8e\xcc\x8e\xde" => "\xa5\xd6", #ブ
"\x8e\xcd\x8e\xde" => "\xa5\xd9", #ベ
"\x8e\xce\x8e\xde" => "\xa5\xdc", #ボ
"\x8e\xca\x8e\xdf" => "\xa5\xd1", #パ
"\x8e\xcb\x8e\xdf" => "\xa5\xd4", #ピ
"\x8e\xcc\x8e\xdf" => "\xa5\xd7", #プ
"\x8e\xcd\x8e\xdf" => "\xa5\xda", #ペ
"\x8e\xce\x8e\xdf" => "\xa5\xdd", #ポ
"\x8e\xb3\x8e\xde" => "\xa5\xf4", #ヴ
);
# init only once;
#$_PAT_D2Z = join("|", keys %_D2Z);
#$_PAT_H2Z = join("|", keys %_H2Z);
%_Z2H = reverse %_H2Z;
%_Z2D = reverse %_D2Z;
#$_PAT_Z2H = join("|", keys %_Z2H);
#$_PAT_Z2D = join("|", keys %_Z2D);
sub h2z {
no warnings qw(uninitialized);
my $r_str = shift;
my ($keep_dakuten) = @_;
my $n = 0;
unless ($keep_dakuten) {
$n = (
$$r_str =~ s(
($RE{EUC_KANA}
(?:\x8e[\xde\xdf])?)
){
my $str = $1;
$_D2Z{$str} || $_H2Z{$str} ||
# in case dakuten and handakuten are side-by-side!
$_H2Z{substr($str,0,2)} . $_H2Z{substr($str,2,2)};
}eogx
);
}
else {
$n = (
$$r_str =~ s(
($RE{EUC_KANA})
){
$_H2Z{$1};
}eogx
);
}
$n;
}
sub z2h {
my $r_str = shift;
my $n = (
$$r_str =~ s(
($RE{EUC_C}|$RE{EUC_0212}|$RE{EUC_KANA})
){
$_Z2D{$1} || $_Z2H{$1} || $1;
}eogx
);
$n;
}
1;
__END__
=head1 NAME
Encode::JP::H2Z -- internally used by Encode::JP::2022_JP*
=cut