| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
# ################################################################### Otakar Smrz, 2003/01/23 |
|
2
|
|
|
|
|
|
|
# |
|
3
|
|
|
|
|
|
|
# Encoding of Arabic: ArabTeX Notation by Klaus Lagally ##################################### |
|
4
|
|
|
|
|
|
|
|
|
5
|
|
|
|
|
|
|
# $Id: RE.pm 162 2006-12-16 00:16:10Z smrz $ |
|
6
|
|
|
|
|
|
|
|
|
7
|
|
|
|
|
|
|
package Encode::Arabic::ArabTeX::RE; |
|
8
|
|
|
|
|
|
|
|
|
9
|
2
|
|
|
2
|
|
28670
|
use 5.008; |
|
|
2
|
|
|
|
|
7
|
|
|
|
2
|
|
|
|
|
90
|
|
|
10
|
|
|
|
|
|
|
|
|
11
|
2
|
|
|
2
|
|
10
|
use strict; |
|
|
2
|
|
|
|
|
4
|
|
|
|
2
|
|
|
|
|
64
|
|
|
12
|
2
|
|
|
2
|
|
10
|
use warnings; |
|
|
2
|
|
|
|
|
3
|
|
|
|
2
|
|
|
|
|
71
|
|
|
13
|
|
|
|
|
|
|
|
|
14
|
2
|
|
|
2
|
|
11
|
use Scalar::Util 'blessed'; |
|
|
2
|
|
|
|
|
3
|
|
|
|
2
|
|
|
|
|
288
|
|
|
15
|
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
our $VERSION = do { q $Revision: 162 $ =~ /(\d+)/; sprintf "%4.2f", $1 / 100 }; |
|
17
|
|
|
|
|
|
|
|
|
18
|
|
|
|
|
|
|
|
|
19
|
2
|
|
|
2
|
|
1025
|
use Encode::Encoding; |
|
|
2
|
|
|
|
|
14535
|
|
|
|
2
|
|
|
|
|
71
|
|
|
20
|
2
|
|
|
2
|
|
14
|
use base 'Encode::Encoding'; |
|
|
2
|
|
|
|
|
4
|
|
|
|
2
|
|
|
|
|
2987
|
|
|
21
|
|
|
|
|
|
|
|
|
22
|
|
|
|
|
|
|
__PACKAGE__->Define('ArabTeX-RE'); |
|
23
|
|
|
|
|
|
|
|
|
24
|
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
our (%encode_used, %decode_used, @shams, @qamar); |
|
26
|
|
|
|
|
|
|
|
|
27
|
|
|
|
|
|
|
our $enmode; |
|
28
|
|
|
|
|
|
|
our $demode; |
|
29
|
|
|
|
|
|
|
|
|
30
|
|
|
|
|
|
|
our %modemap = ( |
|
31
|
|
|
|
|
|
|
|
|
32
|
|
|
|
|
|
|
'default' => 3, |
|
33
|
|
|
|
|
|
|
'undef' => 0, |
|
34
|
|
|
|
|
|
|
|
|
35
|
|
|
|
|
|
|
'fullvocalize' => 4, |
|
36
|
|
|
|
|
|
|
'full' => 4, |
|
37
|
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
'vocalize' => 3, |
|
39
|
|
|
|
|
|
|
'nosukuun' => 3, |
|
40
|
|
|
|
|
|
|
|
|
41
|
|
|
|
|
|
|
'novocalize' => 2, |
|
42
|
|
|
|
|
|
|
'novowels' => 2, |
|
43
|
|
|
|
|
|
|
'none' => 2, |
|
44
|
|
|
|
|
|
|
|
|
45
|
|
|
|
|
|
|
'noshadda' => 1, |
|
46
|
|
|
|
|
|
|
'noneplus' => 1, |
|
47
|
|
|
|
|
|
|
); |
|
48
|
|
|
|
|
|
|
|
|
49
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
sub import { # perform import as if Encode were used one level before this module |
|
51
|
2
|
|
|
2
|
|
23
|
require Encode; |
|
52
|
2
|
|
|
|
|
64
|
Encode->export_to_level(1, @_); |
|
53
|
|
|
|
|
|
|
} |
|
54
|
|
|
|
|
|
|
|
|
55
|
|
|
|
|
|
|
|
|
56
|
|
|
|
|
|
|
sub encode ($$;$) { |
|
57
|
0
|
|
|
0
|
1
|
|
my ($cls, $text, $check) = @_; |
|
58
|
|
|
|
|
|
|
|
|
59
|
0
|
0
|
|
|
|
|
$_[1] = '' if $check; # this is what in-place edit needs |
|
60
|
|
|
|
|
|
|
|
|
61
|
0
|
0
|
|
|
|
|
$cls->initialize_encode() unless %encode_used; |
|
62
|
|
|
|
|
|
|
|
|
63
|
0
|
0
|
|
|
|
|
$text = join '', map { exists $encode_used{$_} ? $encode_used{$_} : $_ } split '', $text; |
|
|
0
|
|
|
|
|
|
|
|
64
|
|
|
|
|
|
|
|
|
65
|
0
|
|
|
|
|
|
$text =~ s/([\_\.\^]?\w)\\shadda{}/$1$1/g; |
|
66
|
0
|
|
|
|
|
|
$text =~ s/(\\ham{.})\\shadda{}/$1$1/g; |
|
67
|
|
|
|
|
|
|
|
|
68
|
0
|
|
|
|
|
|
$text =~ s/([\=\s\-\%])\\alif{}\\vow{a}l/$1"al-/g; |
|
69
|
0
|
|
|
|
|
|
$text =~ s/([\=\s\-\%])\\alif{}l/$1al-/g; |
|
70
|
0
|
|
|
|
|
|
$text =~ s/(b\\vow{i})\\alif{}l/$1-al-/g; |
|
71
|
0
|
|
|
|
|
|
$text =~ s/([\=\s\-\%])\\alif{}\\vow{([ui])}/$1"$2/g; |
|
72
|
0
|
|
|
|
|
|
$text =~ s/([\=\s\-\%])\\alif{}/$1i/g; |
|
73
|
0
|
|
|
|
|
|
$text =~ s/(\\vow{aN})\\alif{}/$1/g; |
|
74
|
0
|
|
|
|
|
|
$text =~ s/\\alif{}(\\vow{aN})/$1/g; |
|
75
|
0
|
|
|
|
|
|
$text =~ s/\\vow{a}\\alif{}/\\vow{A}/g; |
|
76
|
0
|
|
|
|
|
|
$text =~ s/\\alif{}/\\aux{A}/g; |
|
77
|
|
|
|
|
|
|
|
|
78
|
0
|
|
|
|
|
|
$text =~ s/\\madda{}/'A/g; |
|
79
|
|
|
|
|
|
|
|
|
80
|
0
|
|
|
|
|
|
$text =~ s/\\vow{a}\\maq{}/\\vow{Y}/g; |
|
81
|
0
|
|
|
|
|
|
$text =~ s/\\maq{}(\\vow{aN})/\\vow{aNY}/g; |
|
82
|
0
|
|
|
|
|
|
$text =~ s/\\vow{aN}\\maq{}/\\vow{aNY}/g; |
|
83
|
0
|
|
|
|
|
|
$text =~ s/\\maq{}/\\aux{Y}/g; |
|
84
|
|
|
|
|
|
|
|
|
85
|
0
|
|
|
|
|
|
$text =~ s/i(}?)y([^aiuAIUY])/I$1$2/g; # produces \ham{I}, too |
|
86
|
0
|
|
|
|
|
|
$text =~ s/u(}?)w([^aiuAIUY])/U$1$2/g; |
|
87
|
|
|
|
|
|
|
|
|
88
|
0
|
|
|
|
|
|
$text =~ s/([iIuU]})(\\ham{a})/$1-$2/g; |
|
89
|
0
|
|
|
|
|
|
$text =~ s/([\-\s])\\ham{a}([^\\])/$1'\\aux{a}$2/g; |
|
90
|
0
|
|
|
|
|
|
$text =~ s/([^\}\s])\\ham{a}/$1\\aux{a}'/g; |
|
91
|
|
|
|
|
|
|
|
|
92
|
0
|
|
|
|
|
|
$text =~ s/([^\-\s])(\\ham{i})/$1-$2/g; |
|
93
|
0
|
|
|
|
|
|
$text =~ s/\\ham{i}([^\\])/'\\aux{i}$1/g; |
|
94
|
|
|
|
|
|
|
|
|
95
|
0
|
|
|
|
|
|
$text =~ s/([^\}])(\\ham{w})/$1\\aux{u}$2/g; |
|
96
|
0
|
|
|
|
|
|
$text =~ s/(\\ham{w})([^\\])/$1\\aux{u}$2/g; |
|
97
|
|
|
|
|
|
|
|
|
98
|
0
|
|
|
|
|
|
$text =~ s/([^\}])(\\ham{y})/$1\\aux{i}$2/g; |
|
99
|
0
|
|
|
|
|
|
$text =~ s/(\\ham{y})([^\\])/$1\\aux{i}$2/g; |
|
100
|
|
|
|
|
|
|
|
|
101
|
0
|
|
|
|
|
|
$text =~ s/\\ham{[aiwy]}/'/g; |
|
102
|
0
|
|
|
|
|
|
$text =~ s/\\ham{I}/'I/g; |
|
103
|
|
|
|
|
|
|
|
|
104
|
0
|
|
|
|
|
|
$text =~ s/(?
|
|
105
|
|
|
|
|
|
|
|
|
106
|
|
|
|
|
|
|
|
|
107
|
2
|
|
|
2
|
|
15
|
no strict 'refs'; |
|
|
2
|
|
|
|
|
11
|
|
|
|
2
|
|
|
|
|
4526
|
|
|
108
|
|
|
|
|
|
|
|
|
109
|
0
|
0
|
0
|
|
|
|
if (defined ${ $cls . '::enmode' } and ${ $cls . '::enmode' } == 3) { |
|
|
0
|
0
|
0
|
|
|
|
|
|
|
0
|
0
|
0
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
|
110
|
|
|
|
|
|
|
|
|
111
|
0
|
|
|
|
|
|
$text =~ s/\\vow{(.+?)}/$1/g; |
|
112
|
0
|
|
|
|
|
|
$text =~ s/\\aux{(.+?)}/"$1/g; |
|
113
|
0
|
|
|
|
|
|
$text =~ s/\\sukun{}/"/g; |
|
114
|
|
|
|
|
|
|
} |
|
115
|
0
|
|
|
|
|
|
elsif (defined ${ $cls . '::enmode' } and ${ $cls . '::enmode' } == 2) { |
|
|
0
|
|
|
|
|
|
|
|
116
|
|
|
|
|
|
|
|
|
117
|
0
|
|
|
|
|
|
$text =~ s/\\vow{(.+?)}/"$1/g; |
|
118
|
0
|
|
|
|
|
|
$text =~ s/\\aux{(.+?)}/$1/g; |
|
119
|
0
|
|
|
|
|
|
$text =~ s/\\sukun{}/"/g; |
|
120
|
|
|
|
|
|
|
} |
|
121
|
0
|
|
|
|
|
|
elsif (defined ${ $cls . '::enmode' } and ${ $cls . '::enmode' } == 4) { |
|
122
|
|
|
|
|
|
|
|
|
123
|
0
|
|
|
|
|
|
$text =~ s/\\vow{(.+?)}/$1/g; |
|
124
|
0
|
|
|
|
|
|
$text =~ s/\\aux{(.+?)}/$1/g; |
|
125
|
0
|
|
|
|
|
|
$text =~ s/\\sukun{}//g; |
|
126
|
|
|
|
|
|
|
} |
|
127
|
|
|
|
|
|
|
|
|
128
|
0
|
|
|
|
|
|
return $text; |
|
129
|
|
|
|
|
|
|
} |
|
130
|
|
|
|
|
|
|
|
|
131
|
|
|
|
|
|
|
|
|
132
|
|
|
|
|
|
|
sub decode ($$;$) { |
|
133
|
0
|
|
|
0
|
1
|
|
my ($cls, $text, $check) = @_; |
|
134
|
0
|
|
|
|
|
|
my $one; |
|
135
|
|
|
|
|
|
|
|
|
136
|
0
|
0
|
|
|
|
|
$_[1] = '' if $check; # this is what in-place edit needs |
|
137
|
|
|
|
|
|
|
|
|
138
|
0
|
0
|
|
|
|
|
$cls->initialize_decode() unless %decode_used; |
|
139
|
|
|
|
|
|
|
|
|
140
|
0
|
|
|
|
|
|
$text = "\n" . $text . "\n"; |
|
141
|
|
|
|
|
|
|
|
|
142
|
0
|
|
|
|
|
|
$text =~ s/_a/a/g; # is there any special character for the defective fatha? |
|
143
|
0
|
|
|
|
|
|
$text =~ s/_U/U/g; # _U only affects the pronunciation, not the spelling |
|
144
|
|
|
|
|
|
|
|
|
145
|
0
|
|
|
|
|
|
foreach $one (@shams, '\\\'', @qamar) { |
|
146
|
|
|
|
|
|
|
|
|
147
|
0
|
|
|
|
|
|
$text =~ s/(?
|
|
148
|
0
|
|
|
|
|
|
$text =~ s/(?
|
|
149
|
|
|
|
|
|
|
# alas! using $one in the replacing expression produces extra \\ |
|
150
|
|
|
|
|
|
|
} |
|
151
|
|
|
|
|
|
|
|
|
152
|
0
|
|
|
|
|
|
$text =~ s/([\s\-])([aiu])/$1\\L{}$2/gs; |
|
153
|
|
|
|
|
|
|
|
|
154
|
0
|
|
|
|
|
|
$text =~ s/([\s\-])'([auUY])/$1\\H{a}$2/gs; |
|
155
|
0
|
|
|
|
|
|
$text =~ s/([\s\-])'([iI])/$1\\H{i}$2/gs; |
|
156
|
0
|
|
|
|
|
|
$text =~ s/([\s\-])'A/$1\\M{}/gs; |
|
157
|
|
|
|
|
|
|
|
|
158
|
0
|
|
|
|
|
|
$text =~ s/(I|y\\O{})'(aN[AY]?[\s\-])/$1\\H{y}$2/gs; |
|
159
|
0
|
|
|
|
|
|
$text =~ s/a'(|\\D{})(|[au]N?)([\s\-])/a\\H{a}$1$2$3/gs; |
|
160
|
0
|
|
|
|
|
|
$text =~ s/a'(|\\D{})(iN?)([\s\-])/a\\H{i}$1$2$3/gs; |
|
161
|
0
|
|
|
|
|
|
$text =~ s/i'(|\\D{})(|[aiu]N?)([\s\-])/i\\H{y}$1$2$3/gs; |
|
162
|
0
|
|
|
|
|
|
$text =~ s/u'(|\\D{})(|[aiu]N?)([\s\-])/u\\H{w}$1$2$3/gs; |
|
163
|
0
|
|
|
|
|
|
$text =~ s/'(|\\D{})(|[aiu]N?)([\s\-])/\\H{}$1$2$3/gs; |
|
164
|
|
|
|
|
|
|
|
|
165
|
0
|
|
|
|
|
|
$text =~ s/([iI]|y\\O{})'(|\\D{})/$1\\H{y}$2/g; |
|
166
|
0
|
|
|
|
|
|
$text =~ s/'(|\\D{})([iI])/\\H{y}$1$2/g; |
|
167
|
0
|
|
|
|
|
|
$text =~ s/([uU])'(|\\D{})/$1\\H{w}$2/g; |
|
168
|
0
|
|
|
|
|
|
$text =~ s/'(|\\D{})([uU])/\\H{w}$1$2/g; |
|
169
|
0
|
|
|
|
|
|
$text =~ s/A'(|\\D{})/A\\H{}$1/g; # how do you write ? |
|
170
|
0
|
|
|
|
|
|
$text =~ s/a'(\\D{})/a\\H{a}$1/g; # how do you write ? |
|
171
|
0
|
|
|
|
|
|
$text =~ s/'A/\\M{}/g; |
|
172
|
0
|
|
|
|
|
|
$text =~ s/'a/\\H{a}a/g; |
|
173
|
0
|
|
|
|
|
|
$text =~ s/'Y/\\H{a}Y/g; |
|
174
|
|
|
|
|
|
|
|
|
175
|
0
|
|
|
|
|
|
$text =~ s/'/\\H{a}a/g; # final resort |
|
176
|
|
|
|
|
|
|
|
|
177
|
0
|
|
|
|
|
|
foreach $one (@shams) { $text =~ s/($one)\-$one/l$1\\D{}/g; } |
|
|
0
|
|
|
|
|
|
|
|
178
|
0
|
|
|
|
|
|
foreach $one ('\\\\', @qamar) { $text =~ s/l\-($one)/l\\O{}$1/g; } |
|
|
0
|
|
|
|
|
|
|
|
179
|
|
|
|
|
|
|
# alas! using $one in the replacing expression produces extra \\ |
|
180
|
|
|
|
|
|
|
|
|
181
|
0
|
|
|
|
|
|
$text =~ s/aNY/\\V{aN}\\Q{}/g; |
|
182
|
0
|
|
|
|
|
|
$text =~ s/(?<=A\\H{}|\\H{a})aN/\\V{aN}/g; |
|
183
|
0
|
|
|
|
|
|
$text =~ s/(?<=T)aN/\\V{aN}/g; |
|
184
|
|
|
|
|
|
|
|
|
185
|
0
|
|
|
|
|
|
$text =~ s/(?
|
|
186
|
0
|
|
|
|
|
|
$text =~ s/(?
|
|
187
|
0
|
|
|
|
|
|
$text =~ s/(?
|
|
188
|
|
|
|
|
|
|
|
|
189
|
0
|
|
|
|
|
|
$text =~ s/UA/\\V{u}w\\L{}/g; |
|
190
|
0
|
|
|
|
|
|
$text =~ s/aWA?/\\V{a}w\\O{}\\L{}/g; |
|
191
|
|
|
|
|
|
|
|
|
192
|
0
|
|
|
|
|
|
$text =~ s/([^{])a/$1\\V{a}/g; |
|
193
|
0
|
|
|
|
|
|
$text =~ s/([^{])i/$1\\V{i}/g; |
|
194
|
0
|
|
|
|
|
|
$text =~ s/([^{])u/$1\\V{u}/g; |
|
195
|
|
|
|
|
|
|
|
|
196
|
0
|
|
|
|
|
|
$text =~ s/A/\\V{a}\\L{}/g; |
|
197
|
0
|
|
|
|
|
|
$text =~ s/Iy/\\V{i}y\\D{}/g; |
|
198
|
0
|
|
|
|
|
|
$text =~ s/I/\\V{i}y/g; |
|
199
|
0
|
|
|
|
|
|
$text =~ s/Uw/\\V{u}w\\D{}/g; |
|
200
|
0
|
|
|
|
|
|
$text =~ s/U/\\V{u}w/g; |
|
201
|
0
|
|
|
|
|
|
$text =~ s/Y/\\V{a}\\Q{}/g; |
|
202
|
|
|
|
|
|
|
|
|
203
|
0
|
|
|
|
|
|
$text =~ s/\-//g; |
|
204
|
|
|
|
|
|
|
|
|
205
|
0
|
|
|
|
|
|
$text =~ s/l((\\V\{[aiu]\}|\\D\{\}|\\O\{\})+)(\\L\{\}|\\H\{[ai]\}|\\M\{\})/l$3$1/g; |
|
206
|
|
|
|
|
|
|
|
|
207
|
0
|
|
|
|
|
|
foreach $one (keys %decode_used) { # risky .. the order matters and negative lookahead \{ is just right |
|
208
|
|
|
|
|
|
|
|
|
209
|
0
|
|
|
|
|
|
while ($text =~ s/(?
|
|
210
|
|
|
|
|
|
|
} |
|
211
|
|
|
|
|
|
|
|
|
212
|
0
|
|
|
|
|
|
$text = substr $text, 1, -1; # remove additional "\n"s |
|
213
|
|
|
|
|
|
|
|
|
214
|
0
|
|
|
|
|
|
return $text; |
|
215
|
|
|
|
|
|
|
} |
|
216
|
|
|
|
|
|
|
|
|
217
|
|
|
|
|
|
|
|
|
218
|
|
|
|
|
|
|
sub initialize_encode ($) { |
|
219
|
0
|
|
|
0
|
0
|
|
my $cls = shift @_; |
|
220
|
|
|
|
|
|
|
|
|
221
|
0
|
|
|
|
|
|
%encode_used = ( |
|
222
|
|
|
|
|
|
|
# "p", # 81 #"\201", |
|
223
|
|
|
|
|
|
|
# "^c", # 8D #"\215", |
|
224
|
|
|
|
|
|
|
# "^z", # 8E #"\216", |
|
225
|
|
|
|
|
|
|
# "\217", # 8F #"\217", |
|
226
|
|
|
|
|
|
|
# "g", # 90 #"\220", |
|
227
|
|
|
|
|
|
|
"\x{060C}", ",", # A1 "\241", '\\,', # 161 "\xA1", # "\xD8\x8C" right-to-left-comma |
|
228
|
|
|
|
|
|
|
# "\\lq ", # AB #"\253", |
|
229
|
|
|
|
|
|
|
"\x{061B}", ";", # BA "\272", '\\;', # 186 "\xBA", # "\xD8\x9B" right-to-left-semicolon |
|
230
|
|
|
|
|
|
|
# "\\rq", # BB #"\273", |
|
231
|
|
|
|
|
|
|
"\x{061F}", "?", # BF "\277", '\\?', # 191 "\xBF", # "\xD8\x9F" right-to-left-question-mark |
|
232
|
|
|
|
|
|
|
"\x{0621}", "'", # C1 "\301", '\\\\H{}', # 193 "\xC1", # "\xD8\xA1" hamza-on-the-line |
|
233
|
|
|
|
|
|
|
"\x{0622}", "\\madda{}", # C2 "\302", '\\\\M{}', # 194 "\xC2", # "\xD8\xA2" madda-over-'alif |
|
234
|
|
|
|
|
|
|
"\x{0623}", "\\ham{a}", # C3 "\303", '\\\\H{a}', # 195 "\xC3", # "\xD8\xA3" hamza-over-'alif |
|
235
|
|
|
|
|
|
|
"\x{0624}", "\\ham{w}", # C4 "\304", '\\\\H{w}', # 196 "\xC4", # "\xD8\xA4" hamza-over-waaw |
|
236
|
|
|
|
|
|
|
"\x{0625}", "\\ham{i}", # C5 "\305", '\\\\H{i}', # 197 "\xC5", # "\xD8\xA5" hamza-under-'alif |
|
237
|
|
|
|
|
|
|
"\x{0626}", "\\ham{y}", # C6 "\306", '\\\\H{y}', # 198 "\xC6", # "\xD8\xA6" hamza-over-yaa' |
|
238
|
|
|
|
|
|
|
"\x{0627}", "\\alif{}", # C7 "\307", '\\\\L{}', # 199 "\xC7", # "\xD8\xA7" bare 'alif |
|
239
|
|
|
|
|
|
|
"\x{0628}", "b", # C8 "\310", 'b', # 200 "\xC8", # "\xD8\xA8" |
|
240
|
|
|
|
|
|
|
"\x{0629}", "T", # C9 "\311", 'T', # 201 "\xC9", # "\xD8\xA9" |
|
241
|
|
|
|
|
|
|
"\x{062A}", "t", # CA "\312", 't', # 202 "\xCA", # "\xD8\xAA" |
|
242
|
|
|
|
|
|
|
"\x{062B}", "_t", # CB "\313", '\\_t', # 203 "\xCB", # "\xD8\xAB" <_t> |
|
243
|
|
|
|
|
|
|
"\x{062C}", "^g", # CC "\314", '\\^g', # 204 "\xCC", # "\xD8\xAC" <^g> |
|
244
|
|
|
|
|
|
|
"\x{062D}", ".h", # CD "\315", '\\.h', # 205 "\xCD", # "\xD8\xAD" <.h> |
|
245
|
|
|
|
|
|
|
"\x{062E}", "_h", # CE "\316", '\\_h', # 206 "\xCE", # "\xD8\xAE" <_h> |
|
246
|
|
|
|
|
|
|
"\x{062F}", "d", # CF "\317", 'd', # 207 "\xCF", # "\xD8\xAF" |
|
247
|
|
|
|
|
|
|
"\x{0630}", "_d", # D0 "\320", '\\_d', # 208 "\xD0", # "\xD8\xB0" <_d> |
|
248
|
|
|
|
|
|
|
"\x{0631}", "r", # D1 "\321", 'r', # 209 "\xD1", # "\xD8\xB1" |
|
249
|
|
|
|
|
|
|
"\x{0632}", "z", # D2 "\322", 'z', # 210 "\xD2", # "\xD8\xB2" |
|
250
|
|
|
|
|
|
|
"\x{0633}", "s", # D3 "\323", 's', # 211 "\xD3", # "\xD8\xB3" |
|
251
|
|
|
|
|
|
|
"\x{0634}", "^s", # D4 "\324", '\\^s', # 212 "\xD4", # "\xD8\xB4" <^s> |
|
252
|
|
|
|
|
|
|
"\x{0635}", ".s", # D5 "\325", '\\.s', # 213 "\xD5", # "\xD8\xB5" <.s> |
|
253
|
|
|
|
|
|
|
"\x{0636}", ".d", # D6 "\326", '\\.d', # 214 "\xD6", # "\xD8\xB6" <.d> |
|
254
|
|
|
|
|
|
|
# "\327", # D7 #"\327", |
|
255
|
|
|
|
|
|
|
"\x{0637}", ".t", # D8 "\330", '\\.t', # 216 "\xD8", # "\xD8\xB7" <.t> |
|
256
|
|
|
|
|
|
|
"\x{0638}", ".z", # D9 "\331", '\\.z', # 217 "\xD9", # "\xD8\xB8" <.z> |
|
257
|
|
|
|
|
|
|
"\x{0639}", "`", # DA "\332", '\\`', # 218 "\xDA", # "\xD8\xB9" <`> |
|
258
|
|
|
|
|
|
|
"\x{063A}", ".g", # DB "\333", '\\.g', # 219 "\xDB", # "\xD8\xBA" <.g> |
|
259
|
|
|
|
|
|
|
"\x{0640}", "-", # DC "\334", '--', # 220 "\xDC", # "\xD9\x80" ta.twiil |
|
260
|
|
|
|
|
|
|
"\x{0641}", "f", # DD "\335", 'f', # 221 "\xDD", # "\xD9\x81" |
|
261
|
|
|
|
|
|
|
"\x{0642}", "q", # DE "\336", 'q', # 222 "\xDE", # "\xD9\x82" |
|
262
|
|
|
|
|
|
|
"\x{0643}", "k", # DF "\337", 'k', # 223 "\xDF", # "\xD9\x83" |
|
263
|
|
|
|
|
|
|
# "\340", # E0 #"\340", |
|
264
|
|
|
|
|
|
|
"\x{0644}", "l", # E1 "\341", 'l', # 225 "\xE1", # "\xD9\x84" |
|
265
|
|
|
|
|
|
|
# "\342", # E2 #"\342", |
|
266
|
|
|
|
|
|
|
"\x{0645}", "m", # E3 "\343", 'm', # 227 "\xE3", # "\xD9\x85" |
|
267
|
|
|
|
|
|
|
"\x{0646}", "n", # E4 "\344", 'n', # 228 "\xE4", # "\xD9\x86" |
|
268
|
|
|
|
|
|
|
"\x{0647}", "h", # E5 "\345", 'h', # 229 "\xE5", # "\xD9\x87" |
|
269
|
|
|
|
|
|
|
"\x{0648}", "w", # E6 "\346", 'w', # 230 "\xE6", # "\xD9\x88" |
|
270
|
|
|
|
|
|
|
"\x{0649}", "\\maq{}", # EC "\354", '\\\\Q{}', # 236 "\xEC", # "\xD9\x89" 'alif maq.suura |
|
271
|
|
|
|
|
|
|
"\x{064A}", "y", # ED "\355", 'y', # 237 "\xED", # "\xD9\x8A" |
|
272
|
|
|
|
|
|
|
"\x{064B}", "\\vow{aN}", # F0 "\360", '\\\\V{aN}', # 240 "\xF0", # "\xD9\x8B" |
|
273
|
|
|
|
|
|
|
"\x{064C}", "\\vow{uN}", # F1 "\361", '\\\\V{uN}', # 241 "\xF1", # "\xD9\x8C" |
|
274
|
|
|
|
|
|
|
"\x{064D}", "\\vow{iN}", # F2 "\362", '\\\\V{iN}', # 242 "\xF2", # "\xD9\x8D" |
|
275
|
|
|
|
|
|
|
"\x{064E}", "\\vow{a}", # F3 "\363", '\\\\V{a}', # 243 "\xF3", # "\xD9\x8E" |
|
276
|
|
|
|
|
|
|
"\x{064F}", "\\vow{u}", # F5 "\365", '\\\\V{u}', # 245 "\xF5", # "\xD9\x8F" |
|
277
|
|
|
|
|
|
|
"\x{0650}", "\\vow{i}", # F6 "\366", '\\\\V{i}', # 246 "\xF6", # "\xD9\x90" |
|
278
|
|
|
|
|
|
|
"\x{0651}", "\\shadda{}", # F8 "\370", '\\\\D{}', # 248 "\xF8", # "\xD9\x91" ^sadda |
|
279
|
|
|
|
|
|
|
"\x{0652}", "\\sukun{}", # FA "\372", '\\\\O{}', # 250 "\xFA", # "\xD9\x92" sukuun |
|
280
|
|
|
|
|
|
|
"\x{0670}", # '\\\\A{}', # 243 "\xF3", # "\xD9\xB0" <_a> -> |
|
281
|
|
|
|
|
|
|
"\x{0671}", # '\\\\W{}', # 199 "\xC7", # "\xD9\xB1" wa.sla-on-'alif -> bare 'alif |
|
282
|
|
|
|
|
|
|
); |
|
283
|
|
|
|
|
|
|
|
|
284
|
|
|
|
|
|
|
|
|
285
|
2
|
|
|
2
|
|
13
|
no strict 'refs'; |
|
|
2
|
|
|
|
|
3
|
|
|
|
2
|
|
|
|
|
1118
|
|
|
286
|
|
|
|
|
|
|
|
|
287
|
0
|
0
|
|
|
|
|
$cls->enmode(defined ${ $cls . '::enmode' } ? ${ $cls . '::enmode' } : 'default'); |
|
|
0
|
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
|
288
|
|
|
|
|
|
|
} |
|
289
|
|
|
|
|
|
|
|
|
290
|
|
|
|
|
|
|
|
|
291
|
|
|
|
|
|
|
sub initialize_decode ($) { |
|
292
|
0
|
|
|
0
|
0
|
|
my $cls = shift @_; |
|
293
|
|
|
|
|
|
|
|
|
294
|
0
|
|
|
|
|
|
@shams = ('t', '\\_t', 'd', '\\_d', 'r', 'z', 's', '\\^s', '\\.s', '\\.d', '\\.t', '\\.z', 'l', 'n'); |
|
295
|
0
|
|
|
|
|
|
@qamar = ('b', '\\^g', '\\.h', '\\_h', '\\`', '\\.g', 'f', 'q', 'k', 'm', 'h', 'w', 'y'); |
|
296
|
|
|
|
|
|
|
|
|
297
|
0
|
|
|
|
|
|
%decode_used = ( |
|
298
|
|
|
|
|
|
|
# 'p', # 129 "\x81", |
|
299
|
|
|
|
|
|
|
# '\\^c', # 141 "\x8D", |
|
300
|
|
|
|
|
|
|
# '\\^z', # 142 "\x8E", |
|
301
|
|
|
|
|
|
|
# 'g', # 144 "\x90", |
|
302
|
|
|
|
|
|
|
'\\,', "\x{060C}", # 161 "\xA1", # "\xD8\x8C" right-to-left-comma |
|
303
|
|
|
|
|
|
|
'\\;', "\x{061B}", # 186 "\xBA", # "\xD8\x9B" right-to-left-semicolon |
|
304
|
|
|
|
|
|
|
'\\?', "\x{061F}", # 191 "\xBF", # "\xD8\x9F" right-to-left-question-mark |
|
305
|
|
|
|
|
|
|
'\\\\H{}', "\x{0621}", # 193 "\xC1", # "\xD8\xA1" hamza-on-the-line |
|
306
|
|
|
|
|
|
|
'\\\\M{}', "\x{0622}", # 194 "\xC2", # "\xD8\xA2" madda-over-'alif |
|
307
|
|
|
|
|
|
|
'\\\\H{a}', "\x{0623}", # 195 "\xC3", # "\xD8\xA3" hamza-over-'alif |
|
308
|
|
|
|
|
|
|
'\\\\H{w}', "\x{0624}", # 196 "\xC4", # "\xD8\xA4" hamza-over-waaw |
|
309
|
|
|
|
|
|
|
'\\\\H{i}', "\x{0625}", # 197 "\xC5", # "\xD8\xA5" hamza-under-'alif |
|
310
|
|
|
|
|
|
|
'\\\\H{y}', "\x{0626}", # 198 "\xC6", # "\xD8\xA6" hamza-over-yaa' |
|
311
|
|
|
|
|
|
|
'\\\\L{}', "\x{0627}", # 199 "\xC7", # "\xD8\xA7" bare 'alif |
|
312
|
|
|
|
|
|
|
'b', "\x{0628}", # 200 "\xC8", # "\xD8\xA8" |
|
313
|
|
|
|
|
|
|
'T', "\x{0629}", # 201 "\xC9", # "\xD8\xA9" |
|
314
|
|
|
|
|
|
|
't', "\x{062A}", # 202 "\xCA", # "\xD8\xAA" |
|
315
|
|
|
|
|
|
|
'\\_t', "\x{062B}", # 203 "\xCB", # "\xD8\xAB" <_t> |
|
316
|
|
|
|
|
|
|
'\\^g', "\x{062C}", # 204 "\xCC", # "\xD8\xAC" <^g> |
|
317
|
|
|
|
|
|
|
'\\.h', "\x{062D}", # 205 "\xCD", # "\xD8\xAD" <.h> |
|
318
|
|
|
|
|
|
|
'\\_h', "\x{062E}", # 206 "\xCE", # "\xD8\xAE" <_h> |
|
319
|
|
|
|
|
|
|
'd', "\x{062F}", # 207 "\xCF", # "\xD8\xAF" |
|
320
|
|
|
|
|
|
|
'\\_d', "\x{0630}", # 208 "\xD0", # "\xD8\xB0" <_d> |
|
321
|
|
|
|
|
|
|
'r', "\x{0631}", # 209 "\xD1", # "\xD8\xB1" |
|
322
|
|
|
|
|
|
|
'z', "\x{0632}", # 210 "\xD2", # "\xD8\xB2" |
|
323
|
|
|
|
|
|
|
's', "\x{0633}", # 211 "\xD3", # "\xD8\xB3" |
|
324
|
|
|
|
|
|
|
'\\^s', "\x{0634}", # 212 "\xD4", # "\xD8\xB4" <^s> |
|
325
|
|
|
|
|
|
|
'\\.s', "\x{0635}", # 213 "\xD5", # "\xD8\xB5" <.s> |
|
326
|
|
|
|
|
|
|
'\\.d', "\x{0636}", # 214 "\xD6", # "\xD8\xB6" <.d> |
|
327
|
|
|
|
|
|
|
'\\.t', "\x{0637}", # 216 "\xD8", # "\xD8\xB7" <.t> |
|
328
|
|
|
|
|
|
|
'\\.z', "\x{0638}", # 217 "\xD9", # "\xD8\xB8" <.z> |
|
329
|
|
|
|
|
|
|
'\\`', "\x{0639}", # 218 "\xDA", # "\xD8\xB9" <`> |
|
330
|
|
|
|
|
|
|
'\\.g', "\x{063A}", # 219 "\xDB", # "\xD8\xBA" <.g> |
|
331
|
|
|
|
|
|
|
'--', "\x{0640}", # 220 "\xDC", # "\xD9\x80" ta.twiil |
|
332
|
|
|
|
|
|
|
'f', "\x{0641}", # 221 "\xDD", # "\xD9\x81" |
|
333
|
|
|
|
|
|
|
'q', "\x{0642}", # 222 "\xDE", # "\xD9\x82" |
|
334
|
|
|
|
|
|
|
'k', "\x{0643}", # 223 "\xDF", # "\xD9\x83" |
|
335
|
|
|
|
|
|
|
'l', "\x{0644}", # 225 "\xE1", # "\xD9\x84" |
|
336
|
|
|
|
|
|
|
'm', "\x{0645}", # 227 "\xE3", # "\xD9\x85" |
|
337
|
|
|
|
|
|
|
'n', "\x{0646}", # 228 "\xE4", # "\xD9\x86" |
|
338
|
|
|
|
|
|
|
'h', "\x{0647}", # 229 "\xE5", # "\xD9\x87" |
|
339
|
|
|
|
|
|
|
'w', "\x{0648}", # 230 "\xE6", # "\xD9\x88" |
|
340
|
|
|
|
|
|
|
'\\\\Q{}', "\x{0649}", # 236 "\xEC", # "\xD9\x89" 'alif maq.suura |
|
341
|
|
|
|
|
|
|
'y', "\x{064A}", # 237 "\xED", # "\xD9\x8A" |
|
342
|
|
|
|
|
|
|
'\\\\V{aN}', "\x{064B}", # 240 "\xF0", # "\xD9\x8B" |
|
343
|
|
|
|
|
|
|
'\\\\V{uN}', "\x{064C}", # 241 "\xF1", # "\xD9\x8C" |
|
344
|
|
|
|
|
|
|
'\\\\V{iN}', "\x{064D}", # 242 "\xF2", # "\xD9\x8D" |
|
345
|
|
|
|
|
|
|
'\\\\V{a}', "\x{064E}", # 243 "\xF3", # "\xD9\x8E" |
|
346
|
|
|
|
|
|
|
'\\\\V{u}', "\x{064F}", # 245 "\xF5", # "\xD9\x8F" |
|
347
|
|
|
|
|
|
|
'\\\\V{i}', "\x{0650}", # 246 "\xF6", # "\xD9\x90" |
|
348
|
|
|
|
|
|
|
'\\\\D{}', "\x{0651}", # 248 "\xF8", # "\xD9\x91" ^sadda |
|
349
|
|
|
|
|
|
|
'\\\\O{}', "\x{0652}", # 250 "\xFA", # "\xD9\x92" sukuun |
|
350
|
|
|
|
|
|
|
'\\\\A{}', "\x{0670}", # 243 "\xF3", # "\xD9\xB0" <_a> -> |
|
351
|
|
|
|
|
|
|
'\\\\W{}', "\x{0671}", # 199 "\xC7", # "\xD9\xB1" wa.sla-on-'alif -> bare 'alif |
|
352
|
|
|
|
|
|
|
); |
|
353
|
|
|
|
|
|
|
|
|
354
|
|
|
|
|
|
|
|
|
355
|
2
|
|
|
2
|
|
13
|
no strict 'refs'; |
|
|
2
|
|
|
|
|
4
|
|
|
|
2
|
|
|
|
|
370
|
|
|
356
|
|
|
|
|
|
|
|
|
357
|
0
|
0
|
|
|
|
|
$cls->demode(defined ${ $cls . '::demode' } ? ${ $cls . '::demode' } : 'default'); |
|
|
0
|
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
|
358
|
|
|
|
|
|
|
} |
|
359
|
|
|
|
|
|
|
|
|
360
|
|
|
|
|
|
|
|
|
361
|
|
|
|
|
|
|
sub enmode ($$) { |
|
362
|
0
|
|
|
0
|
0
|
|
my ($cls, $mode) = @_; |
|
363
|
|
|
|
|
|
|
|
|
364
|
0
|
0
|
|
|
|
|
$cls = blessed $cls if ref $cls; |
|
365
|
|
|
|
|
|
|
|
|
366
|
0
|
0
|
|
|
|
|
$mode = 'undef' unless defined $mode; |
|
367
|
0
|
0
|
|
|
|
|
$mode = $modemap{$mode} if exists $modemap{$mode}; |
|
368
|
|
|
|
|
|
|
|
|
369
|
2
|
|
|
2
|
|
18
|
no strict 'refs'; |
|
|
2
|
|
|
|
|
3
|
|
|
|
2
|
|
|
|
|
225
|
|
|
370
|
|
|
|
|
|
|
|
|
371
|
0
|
|
|
|
|
|
my $return = ${ $cls . '::enmode' }; |
|
|
0
|
|
|
|
|
|
|
|
372
|
|
|
|
|
|
|
|
|
373
|
0
|
|
|
|
|
|
${ $cls . '::enmode' } = $mode; |
|
|
0
|
|
|
|
|
|
|
|
374
|
|
|
|
|
|
|
|
|
375
|
0
|
|
|
|
|
|
return $return; |
|
376
|
|
|
|
|
|
|
} |
|
377
|
|
|
|
|
|
|
|
|
378
|
|
|
|
|
|
|
|
|
379
|
|
|
|
|
|
|
sub demode ($$) { |
|
380
|
0
|
|
|
0
|
0
|
|
my ($cls, $mode) = @_; |
|
381
|
|
|
|
|
|
|
|
|
382
|
0
|
0
|
|
|
|
|
$cls = blessed $cls if ref $cls; |
|
383
|
|
|
|
|
|
|
|
|
384
|
0
|
0
|
|
|
|
|
$mode = 'undef' unless defined $mode; |
|
385
|
0
|
0
|
|
|
|
|
$mode = $modemap{$mode} if exists $modemap{$mode}; |
|
386
|
|
|
|
|
|
|
|
|
387
|
2
|
|
|
2
|
|
14
|
no strict 'refs'; |
|
|
2
|
|
|
|
|
4
|
|
|
|
2
|
|
|
|
|
254
|
|
|
388
|
|
|
|
|
|
|
|
|
389
|
0
|
|
|
|
|
|
my $return = ${ $cls . '::demode' }; |
|
|
0
|
|
|
|
|
|
|
|
390
|
|
|
|
|
|
|
|
|
391
|
0
|
|
|
|
|
|
${ $cls . '::demode' } = $mode; |
|
|
0
|
|
|
|
|
|
|
|
392
|
|
|
|
|
|
|
|
|
393
|
0
|
|
|
|
|
|
return $return; |
|
394
|
|
|
|
|
|
|
} |
|
395
|
|
|
|
|
|
|
|
|
396
|
|
|
|
|
|
|
|
|
397
|
|
|
|
|
|
|
1; |
|
398
|
|
|
|
|
|
|
|
|
399
|
|
|
|
|
|
|
__END__ |