line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
# |
2
|
|
|
|
|
|
|
# $Id: H2Z.pm,v 2.2 2006/06/03 20:28:48 dankogai Exp $ |
3
|
|
|
|
|
|
|
# |
4
|
|
|
|
|
|
|
|
5
|
|
|
|
|
|
|
package Encode::JP::H2Z; |
6
|
|
|
|
|
|
|
|
7
|
7
|
|
|
7
|
|
53
|
use strict; |
|
7
|
|
|
|
|
21
|
|
|
7
|
|
|
|
|
244
|
|
8
|
7
|
|
|
7
|
|
47
|
use warnings; |
|
7
|
|
|
|
|
19
|
|
|
7
|
|
|
|
|
776
|
|
9
|
|
|
|
|
|
|
|
10
|
|
|
|
|
|
|
our $RCSID = q$Id: H2Z.pm,v 2.2 2006/06/03 20:28:48 dankogai Exp $; |
11
|
|
|
|
|
|
|
our $VERSION = do { my @r = ( q$Revision: 2.2 $ =~ /\d+/g ); sprintf "%d." . "%02d" x $#r, @r }; |
12
|
|
|
|
|
|
|
|
13
|
7
|
|
|
7
|
|
53
|
use Encode::CJKConstants qw(:all); |
|
7
|
|
|
|
|
16
|
|
|
7
|
|
|
|
|
1184
|
|
14
|
|
|
|
|
|
|
|
15
|
7
|
|
|
|
|
6167
|
use vars qw(%_D2Z $_PAT_D2Z |
16
|
|
|
|
|
|
|
%_Z2D $_PAT_Z2D |
17
|
|
|
|
|
|
|
%_H2Z $_PAT_H2Z |
18
|
7
|
|
|
7
|
|
53
|
%_Z2H $_PAT_Z2H); |
|
7
|
|
|
|
|
18
|
|
19
|
|
|
|
|
|
|
|
20
|
|
|
|
|
|
|
%_H2Z = ( |
21
|
|
|
|
|
|
|
"\x8e\xa1" => "\xa1\xa3", #。 |
22
|
|
|
|
|
|
|
"\x8e\xa2" => "\xa1\xd6", #「 |
23
|
|
|
|
|
|
|
"\x8e\xa3" => "\xa1\xd7", #」 |
24
|
|
|
|
|
|
|
"\x8e\xa4" => "\xa1\xa2", #、 |
25
|
|
|
|
|
|
|
"\x8e\xa5" => "\xa1\xa6", #・ |
26
|
|
|
|
|
|
|
"\x8e\xa6" => "\xa5\xf2", #ヲ |
27
|
|
|
|
|
|
|
"\x8e\xa7" => "\xa5\xa1", #ァ |
28
|
|
|
|
|
|
|
"\x8e\xa8" => "\xa5\xa3", #ィ |
29
|
|
|
|
|
|
|
"\x8e\xa9" => "\xa5\xa5", #ゥ |
30
|
|
|
|
|
|
|
"\x8e\xaa" => "\xa5\xa7", #ェ |
31
|
|
|
|
|
|
|
"\x8e\xab" => "\xa5\xa9", #ォ |
32
|
|
|
|
|
|
|
"\x8e\xac" => "\xa5\xe3", #ャ |
33
|
|
|
|
|
|
|
"\x8e\xad" => "\xa5\xe5", #ュ |
34
|
|
|
|
|
|
|
"\x8e\xae" => "\xa5\xe7", #ョ |
35
|
|
|
|
|
|
|
"\x8e\xaf" => "\xa5\xc3", #ッ |
36
|
|
|
|
|
|
|
"\x8e\xb0" => "\xa1\xbc", #ー |
37
|
|
|
|
|
|
|
"\x8e\xb1" => "\xa5\xa2", #ア |
38
|
|
|
|
|
|
|
"\x8e\xb2" => "\xa5\xa4", #イ |
39
|
|
|
|
|
|
|
"\x8e\xb3" => "\xa5\xa6", #ウ |
40
|
|
|
|
|
|
|
"\x8e\xb4" => "\xa5\xa8", #エ |
41
|
|
|
|
|
|
|
"\x8e\xb5" => "\xa5\xaa", #オ |
42
|
|
|
|
|
|
|
"\x8e\xb6" => "\xa5\xab", #カ |
43
|
|
|
|
|
|
|
"\x8e\xb7" => "\xa5\xad", #キ |
44
|
|
|
|
|
|
|
"\x8e\xb8" => "\xa5\xaf", #ク |
45
|
|
|
|
|
|
|
"\x8e\xb9" => "\xa5\xb1", #ケ |
46
|
|
|
|
|
|
|
"\x8e\xba" => "\xa5\xb3", #コ |
47
|
|
|
|
|
|
|
"\x8e\xbb" => "\xa5\xb5", #サ |
48
|
|
|
|
|
|
|
"\x8e\xbc" => "\xa5\xb7", #シ |
49
|
|
|
|
|
|
|
"\x8e\xbd" => "\xa5\xb9", #ス |
50
|
|
|
|
|
|
|
"\x8e\xbe" => "\xa5\xbb", #セ |
51
|
|
|
|
|
|
|
"\x8e\xbf" => "\xa5\xbd", #ソ |
52
|
|
|
|
|
|
|
"\x8e\xc0" => "\xa5\xbf", #タ |
53
|
|
|
|
|
|
|
"\x8e\xc1" => "\xa5\xc1", #チ |
54
|
|
|
|
|
|
|
"\x8e\xc2" => "\xa5\xc4", #ツ |
55
|
|
|
|
|
|
|
"\x8e\xc3" => "\xa5\xc6", #テ |
56
|
|
|
|
|
|
|
"\x8e\xc4" => "\xa5\xc8", #ト |
57
|
|
|
|
|
|
|
"\x8e\xc5" => "\xa5\xca", #ナ |
58
|
|
|
|
|
|
|
"\x8e\xc6" => "\xa5\xcb", #ニ |
59
|
|
|
|
|
|
|
"\x8e\xc7" => "\xa5\xcc", #ヌ |
60
|
|
|
|
|
|
|
"\x8e\xc8" => "\xa5\xcd", #ネ |
61
|
|
|
|
|
|
|
"\x8e\xc9" => "\xa5\xce", #ノ |
62
|
|
|
|
|
|
|
"\x8e\xca" => "\xa5\xcf", #ハ |
63
|
|
|
|
|
|
|
"\x8e\xcb" => "\xa5\xd2", #ヒ |
64
|
|
|
|
|
|
|
"\x8e\xcc" => "\xa5\xd5", #フ |
65
|
|
|
|
|
|
|
"\x8e\xcd" => "\xa5\xd8", #ヘ |
66
|
|
|
|
|
|
|
"\x8e\xce" => "\xa5\xdb", #ホ |
67
|
|
|
|
|
|
|
"\x8e\xcf" => "\xa5\xde", #マ |
68
|
|
|
|
|
|
|
"\x8e\xd0" => "\xa5\xdf", #ミ |
69
|
|
|
|
|
|
|
"\x8e\xd1" => "\xa5\xe0", #ム |
70
|
|
|
|
|
|
|
"\x8e\xd2" => "\xa5\xe1", #メ |
71
|
|
|
|
|
|
|
"\x8e\xd3" => "\xa5\xe2", #モ |
72
|
|
|
|
|
|
|
"\x8e\xd4" => "\xa5\xe4", #ヤ |
73
|
|
|
|
|
|
|
"\x8e\xd5" => "\xa5\xe6", #ユ |
74
|
|
|
|
|
|
|
"\x8e\xd6" => "\xa5\xe8", #ヨ |
75
|
|
|
|
|
|
|
"\x8e\xd7" => "\xa5\xe9", #ラ |
76
|
|
|
|
|
|
|
"\x8e\xd8" => "\xa5\xea", #リ |
77
|
|
|
|
|
|
|
"\x8e\xd9" => "\xa5\xeb", #ル |
78
|
|
|
|
|
|
|
"\x8e\xda" => "\xa5\xec", #レ |
79
|
|
|
|
|
|
|
"\x8e\xdb" => "\xa5\xed", #ロ |
80
|
|
|
|
|
|
|
"\x8e\xdc" => "\xa5\xef", #ワ |
81
|
|
|
|
|
|
|
"\x8e\xdd" => "\xa5\xf3", #ン |
82
|
|
|
|
|
|
|
"\x8e\xde" => "\xa1\xab", #゛ |
83
|
|
|
|
|
|
|
"\x8e\xdf" => "\xa1\xac", #゜ |
84
|
|
|
|
|
|
|
); |
85
|
|
|
|
|
|
|
|
86
|
|
|
|
|
|
|
%_D2Z = ( |
87
|
|
|
|
|
|
|
"\x8e\xb6\x8e\xde" => "\xa5\xac", #ガ |
88
|
|
|
|
|
|
|
"\x8e\xb7\x8e\xde" => "\xa5\xae", #ギ |
89
|
|
|
|
|
|
|
"\x8e\xb8\x8e\xde" => "\xa5\xb0", #グ |
90
|
|
|
|
|
|
|
"\x8e\xb9\x8e\xde" => "\xa5\xb2", #ゲ |
91
|
|
|
|
|
|
|
"\x8e\xba\x8e\xde" => "\xa5\xb4", #ゴ |
92
|
|
|
|
|
|
|
"\x8e\xbb\x8e\xde" => "\xa5\xb6", #ザ |
93
|
|
|
|
|
|
|
"\x8e\xbc\x8e\xde" => "\xa5\xb8", #ジ |
94
|
|
|
|
|
|
|
"\x8e\xbd\x8e\xde" => "\xa5\xba", #ズ |
95
|
|
|
|
|
|
|
"\x8e\xbe\x8e\xde" => "\xa5\xbc", #ゼ |
96
|
|
|
|
|
|
|
"\x8e\xbf\x8e\xde" => "\xa5\xbe", #ゾ |
97
|
|
|
|
|
|
|
"\x8e\xc0\x8e\xde" => "\xa5\xc0", #ダ |
98
|
|
|
|
|
|
|
"\x8e\xc1\x8e\xde" => "\xa5\xc2", #ヂ |
99
|
|
|
|
|
|
|
"\x8e\xc2\x8e\xde" => "\xa5\xc5", #ヅ |
100
|
|
|
|
|
|
|
"\x8e\xc3\x8e\xde" => "\xa5\xc7", #デ |
101
|
|
|
|
|
|
|
"\x8e\xc4\x8e\xde" => "\xa5\xc9", #ド |
102
|
|
|
|
|
|
|
"\x8e\xca\x8e\xde" => "\xa5\xd0", #バ |
103
|
|
|
|
|
|
|
"\x8e\xcb\x8e\xde" => "\xa5\xd3", #ビ |
104
|
|
|
|
|
|
|
"\x8e\xcc\x8e\xde" => "\xa5\xd6", #ブ |
105
|
|
|
|
|
|
|
"\x8e\xcd\x8e\xde" => "\xa5\xd9", #ベ |
106
|
|
|
|
|
|
|
"\x8e\xce\x8e\xde" => "\xa5\xdc", #ボ |
107
|
|
|
|
|
|
|
"\x8e\xca\x8e\xdf" => "\xa5\xd1", #パ |
108
|
|
|
|
|
|
|
"\x8e\xcb\x8e\xdf" => "\xa5\xd4", #ピ |
109
|
|
|
|
|
|
|
"\x8e\xcc\x8e\xdf" => "\xa5\xd7", #プ |
110
|
|
|
|
|
|
|
"\x8e\xcd\x8e\xdf" => "\xa5\xda", #ペ |
111
|
|
|
|
|
|
|
"\x8e\xce\x8e\xdf" => "\xa5\xdd", #ポ |
112
|
|
|
|
|
|
|
"\x8e\xb3\x8e\xde" => "\xa5\xf4", #ヴ |
113
|
|
|
|
|
|
|
); |
114
|
|
|
|
|
|
|
|
115
|
|
|
|
|
|
|
# init only once; |
116
|
|
|
|
|
|
|
|
117
|
|
|
|
|
|
|
#$_PAT_D2Z = join("|", keys %_D2Z); |
118
|
|
|
|
|
|
|
#$_PAT_H2Z = join("|", keys %_H2Z); |
119
|
|
|
|
|
|
|
|
120
|
|
|
|
|
|
|
%_Z2H = reverse %_H2Z; |
121
|
|
|
|
|
|
|
%_Z2D = reverse %_D2Z; |
122
|
|
|
|
|
|
|
|
123
|
|
|
|
|
|
|
#$_PAT_Z2H = join("|", keys %_Z2H); |
124
|
|
|
|
|
|
|
#$_PAT_Z2D = join("|", keys %_Z2D); |
125
|
|
|
|
|
|
|
|
126
|
|
|
|
|
|
|
sub h2z { |
127
|
7
|
|
|
7
|
|
65
|
no warnings qw(uninitialized); |
|
7
|
|
|
|
|
25
|
|
|
7
|
|
|
|
|
2151
|
|
128
|
934
|
|
|
934
|
0
|
2239
|
my $r_str = shift; |
129
|
934
|
|
|
|
|
2345
|
my ($keep_dakuten) = @_; |
130
|
934
|
|
|
|
|
1996
|
my $n = 0; |
131
|
934
|
50
|
|
|
|
2432
|
unless ($keep_dakuten) { |
132
|
934
|
|
|
|
|
3282
|
$n = ( |
133
|
|
|
|
|
|
|
$$r_str =~ s( |
134
|
|
|
|
|
|
|
($RE{EUC_KANA} |
135
|
|
|
|
|
|
|
(?:\x8e[\xde\xdf])?) |
136
|
|
|
|
|
|
|
){ |
137
|
0
|
|
|
|
|
0
|
my $str = $1; |
138
|
|
|
|
|
|
|
$_D2Z{$str} || $_H2Z{$str} || |
139
|
|
|
|
|
|
|
# in case dakuten and handakuten are side-by-side! |
140
|
0
|
0
|
0
|
|
|
0
|
$_H2Z{substr($str,0,2)} . $_H2Z{substr($str,2,2)}; |
141
|
|
|
|
|
|
|
}eogx |
142
|
|
|
|
|
|
|
); |
143
|
|
|
|
|
|
|
} |
144
|
|
|
|
|
|
|
else { |
145
|
0
|
|
|
|
|
0
|
$n = ( |
146
|
|
|
|
|
|
|
$$r_str =~ s( |
147
|
|
|
|
|
|
|
($RE{EUC_KANA}) |
148
|
|
|
|
|
|
|
){ |
149
|
0
|
|
|
|
|
0
|
$_H2Z{$1}; |
150
|
|
|
|
|
|
|
}eogx |
151
|
|
|
|
|
|
|
); |
152
|
|
|
|
|
|
|
} |
153
|
934
|
|
|
|
|
2803
|
$n; |
154
|
|
|
|
|
|
|
} |
155
|
|
|
|
|
|
|
|
156
|
|
|
|
|
|
|
sub z2h { |
157
|
0
|
|
|
0
|
0
|
|
my $r_str = shift; |
158
|
0
|
|
|
|
|
|
my $n = ( |
159
|
|
|
|
|
|
|
$$r_str =~ s( |
160
|
|
|
|
|
|
|
($RE{EUC_C}|$RE{EUC_0212}|$RE{EUC_KANA}) |
161
|
|
|
|
|
|
|
){ |
162
|
0
|
0
|
0
|
|
|
|
$_Z2D{$1} || $_Z2H{$1} || $1; |
163
|
|
|
|
|
|
|
}eogx |
164
|
|
|
|
|
|
|
); |
165
|
0
|
|
|
|
|
|
$n; |
166
|
|
|
|
|
|
|
} |
167
|
|
|
|
|
|
|
|
168
|
|
|
|
|
|
|
1; |
169
|
|
|
|
|
|
|
__END__ |