| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
package Lingua::Slavic::Numbers; |
|
2
|
7
|
|
|
7
|
|
106055
|
use strict; |
|
|
7
|
|
|
|
|
21
|
|
|
|
7
|
|
|
|
|
2655
|
|
|
3
|
|
|
|
|
|
|
|
|
4
|
7
|
|
|
7
|
|
53
|
use Carp qw(carp); |
|
|
7
|
|
|
|
|
16
|
|
|
|
7
|
|
|
|
|
480
|
|
|
5
|
7
|
|
|
7
|
|
47
|
use List::Util qw(max); |
|
|
7
|
|
|
|
|
27
|
|
|
|
7
|
|
|
|
|
922
|
|
|
6
|
7
|
|
|
7
|
|
18283
|
use Data::Dumper; |
|
|
7
|
|
|
|
|
153364
|
|
|
|
7
|
|
|
|
|
711
|
|
|
7
|
7
|
|
|
7
|
|
8941
|
use Regexp::Common qw /number/; |
|
|
7
|
|
|
|
|
36839
|
|
|
|
7
|
|
|
|
|
39
|
|
|
8
|
7
|
|
|
7
|
|
41917
|
use Exporter; |
|
|
7
|
|
|
|
|
16
|
|
|
|
7
|
|
|
|
|
405
|
|
|
9
|
7
|
|
|
7
|
|
8498
|
use utf8; |
|
|
7
|
|
|
|
|
72
|
|
|
|
7
|
|
|
|
|
69
|
|
|
10
|
7
|
|
|
7
|
|
310
|
use vars qw( $VERSION $DEBUG @ISA @EXPORT_OK @EXPORT); |
|
|
7
|
|
|
|
|
16
|
|
|
|
7
|
|
|
|
|
1417
|
|
|
11
|
7
|
|
|
|
|
543
|
use vars qw( |
|
12
|
|
|
|
|
|
|
%INFLEXIONS |
|
13
|
|
|
|
|
|
|
%NUMBER_NAMES |
|
14
|
|
|
|
|
|
|
%ORDINALS |
|
15
|
|
|
|
|
|
|
$OUTPUT_DECIMAL_DELIMITER |
|
16
|
|
|
|
|
|
|
$MINUS |
|
17
|
7
|
|
|
7
|
|
42
|
); |
|
|
7
|
|
|
|
|
16
|
|
|
18
|
|
|
|
|
|
|
|
|
19
|
7
|
|
|
7
|
|
154
|
use constant LANG_BG => 'bg'; |
|
|
7
|
|
|
|
|
15
|
|
|
|
7
|
|
|
|
|
511
|
|
|
20
|
|
|
|
|
|
|
|
|
21
|
7
|
|
|
7
|
|
34
|
use constant NO_CONJUNCTIONS => 'noconj'; |
|
|
7
|
|
|
|
|
13
|
|
|
|
7
|
|
|
|
|
444
|
|
|
22
|
7
|
|
|
7
|
|
34
|
use constant FEMININE_GENDER => 'fem'; |
|
|
7
|
|
|
|
|
13
|
|
|
|
7
|
|
|
|
|
296
|
|
|
23
|
7
|
|
|
7
|
|
435
|
use constant MASCULINE_GENDER => 'man'; |
|
|
7
|
|
|
|
|
13
|
|
|
|
7
|
|
|
|
|
408
|
|
|
24
|
7
|
|
|
7
|
|
42
|
use constant NEUTRAL_GENDER => 'neu'; |
|
|
7
|
|
|
|
|
10
|
|
|
|
7
|
|
|
|
|
46545
|
|
|
25
|
|
|
|
|
|
|
|
|
26
|
|
|
|
|
|
|
$VERSION = 0.03; |
|
27
|
|
|
|
|
|
|
$DEBUG = 0; |
|
28
|
|
|
|
|
|
|
@ISA = qw(Exporter); |
|
29
|
|
|
|
|
|
|
@EXPORT_OK = qw( &number_to_slavic &ordinate_to_slavic LANG_BG); |
|
30
|
|
|
|
|
|
|
@EXPORT = @EXPORT_OK; |
|
31
|
|
|
|
|
|
|
|
|
32
|
|
|
|
|
|
|
$MINUS = ('минус'); |
|
33
|
|
|
|
|
|
|
$OUTPUT_DECIMAL_DELIMITER = ('цяло'); |
|
34
|
|
|
|
|
|
|
|
|
35
|
|
|
|
|
|
|
%INFLEXIONS = |
|
36
|
|
|
|
|
|
|
( |
|
37
|
|
|
|
|
|
|
LANG_BG, |
|
38
|
|
|
|
|
|
|
{ |
|
39
|
|
|
|
|
|
|
FEMININE_GENDER, |
|
40
|
|
|
|
|
|
|
{ |
|
41
|
|
|
|
|
|
|
1 => 'една', |
|
42
|
|
|
|
|
|
|
}, |
|
43
|
|
|
|
|
|
|
MASCULINE_GENDER, |
|
44
|
|
|
|
|
|
|
{ |
|
45
|
|
|
|
|
|
|
1 => 'един', |
|
46
|
|
|
|
|
|
|
2 => 'два', |
|
47
|
|
|
|
|
|
|
}, |
|
48
|
|
|
|
|
|
|
} |
|
49
|
|
|
|
|
|
|
); |
|
50
|
|
|
|
|
|
|
|
|
51
|
|
|
|
|
|
|
%NUMBER_NAMES = |
|
52
|
|
|
|
|
|
|
( |
|
53
|
|
|
|
|
|
|
LANG_BG, |
|
54
|
|
|
|
|
|
|
{ |
|
55
|
|
|
|
|
|
|
0 => 'нула', |
|
56
|
|
|
|
|
|
|
1 => 'едно', |
|
57
|
|
|
|
|
|
|
2 => 'две', |
|
58
|
|
|
|
|
|
|
3 => 'три', |
|
59
|
|
|
|
|
|
|
4 => 'четири', |
|
60
|
|
|
|
|
|
|
5 => 'пет', |
|
61
|
|
|
|
|
|
|
6 => 'шест', |
|
62
|
|
|
|
|
|
|
7 => 'седем', |
|
63
|
|
|
|
|
|
|
8 => 'осем', |
|
64
|
|
|
|
|
|
|
9 => 'девет', |
|
65
|
|
|
|
|
|
|
10 => 'десет', |
|
66
|
|
|
|
|
|
|
11 => 'едина{10}', |
|
67
|
|
|
|
|
|
|
12 => 'двана{10}', |
|
68
|
|
|
|
|
|
|
13 => '{3}на{10}', |
|
69
|
|
|
|
|
|
|
14 => '{4}на{10}', |
|
70
|
|
|
|
|
|
|
15 => '{5}на{10}', |
|
71
|
|
|
|
|
|
|
16 => '{6}на{10}', |
|
72
|
|
|
|
|
|
|
17 => '{7}на{10}', |
|
73
|
|
|
|
|
|
|
18 => '{8}на{10}', |
|
74
|
|
|
|
|
|
|
19 => '{9}на{10}', |
|
75
|
|
|
|
|
|
|
20 => 'два{10}', |
|
76
|
|
|
|
|
|
|
30 => '{3}{10}', |
|
77
|
|
|
|
|
|
|
40 => '{4}{10}', |
|
78
|
|
|
|
|
|
|
50 => '{5}{10}', |
|
79
|
|
|
|
|
|
|
60 => '{6}{10}', |
|
80
|
|
|
|
|
|
|
70 => '{7}{10}', |
|
81
|
|
|
|
|
|
|
80 => '{8}{10}', |
|
82
|
|
|
|
|
|
|
90 => '{9}{10}', |
|
83
|
|
|
|
|
|
|
100 => 'сто', |
|
84
|
|
|
|
|
|
|
200 => '{2}ста', |
|
85
|
|
|
|
|
|
|
300 => '{3}ста', |
|
86
|
|
|
|
|
|
|
'1e3' => 'хиляда', |
|
87
|
|
|
|
|
|
|
'1e4' => '{10} хиляди', |
|
88
|
|
|
|
|
|
|
'1e5' => '{100} хиляди', |
|
89
|
|
|
|
|
|
|
'1e6' => 'милион', |
|
90
|
|
|
|
|
|
|
'1e7' => '{10} {1e6}а', |
|
91
|
|
|
|
|
|
|
'1e8' => '{100} {1e6}а', |
|
92
|
|
|
|
|
|
|
'1e9' => 'милиард', # USA English 'billion' |
|
93
|
|
|
|
|
|
|
'1e10' => '{10} {1e9}а', |
|
94
|
|
|
|
|
|
|
'1e11' => '{100} {1e9}а', |
|
95
|
|
|
|
|
|
|
'1e12' => 'трилион', # sometimes 'билион' in older usage |
|
96
|
|
|
|
|
|
|
'1e13' => '{10} {1e12}а', |
|
97
|
|
|
|
|
|
|
'1e14' => '{100} {1e12}а', |
|
98
|
|
|
|
|
|
|
'1e15' => 'квадрилион', |
|
99
|
|
|
|
|
|
|
'1e16' => '{10} {1e15}а', |
|
100
|
|
|
|
|
|
|
'1e17' => '{100} {1e15}а', |
|
101
|
|
|
|
|
|
|
'1e18' => 'квинтилион', |
|
102
|
|
|
|
|
|
|
'1e19' => '{10} {1e18}а', |
|
103
|
|
|
|
|
|
|
'1e20' => '{100} {1e18}а', |
|
104
|
|
|
|
|
|
|
'1e21' => 'секстилион', |
|
105
|
|
|
|
|
|
|
'1e22' => '{10} {1e21}а', |
|
106
|
|
|
|
|
|
|
} |
|
107
|
|
|
|
|
|
|
); |
|
108
|
|
|
|
|
|
|
|
|
109
|
|
|
|
|
|
|
|
|
110
|
|
|
|
|
|
|
$NUMBER_NAMES{LANG_BG()}->{"${_}00"} = "{$_}стотин" foreach qw/4 5 6 7 8 9/; |
|
111
|
|
|
|
|
|
|
$NUMBER_NAMES{LANG_BG()}->{'1' . '0'x(3*$_)} = $NUMBER_NAMES{LANG_BG()}->{'1e'. 3*$_} foreach 1..7; |
|
112
|
|
|
|
|
|
|
|
|
113
|
|
|
|
|
|
|
# use Data::Dumper; |
|
114
|
|
|
|
|
|
|
# print Dumper \%NUMBER_NAMES; |
|
115
|
|
|
|
|
|
|
my $count = 1; |
|
116
|
|
|
|
|
|
|
|
|
117
|
|
|
|
|
|
|
%ORDINALS = |
|
118
|
|
|
|
|
|
|
( |
|
119
|
|
|
|
|
|
|
LANG_BG, |
|
120
|
|
|
|
|
|
|
{ |
|
121
|
|
|
|
|
|
|
# given in male singular formal version only, inflection TODO. Nothing above 99 yet. |
|
122
|
|
|
|
|
|
|
0 => 'нулев', |
|
123
|
|
|
|
|
|
|
1 => 'първи', |
|
124
|
|
|
|
|
|
|
2 => 'втори', |
|
125
|
|
|
|
|
|
|
3 => 'трети', |
|
126
|
|
|
|
|
|
|
4 => 'четвърти', |
|
127
|
|
|
|
|
|
|
5 => '{5}и', |
|
128
|
|
|
|
|
|
|
6 => '{6}и', |
|
129
|
|
|
|
|
|
|
7 => 'седми', |
|
130
|
|
|
|
|
|
|
8 => 'осми', |
|
131
|
|
|
|
|
|
|
9 => '{9}и', |
|
132
|
|
|
|
|
|
|
10 => '{10}и', |
|
133
|
|
|
|
|
|
|
11 => 'едина[10]', |
|
134
|
|
|
|
|
|
|
12 => 'двана[10]', |
|
135
|
|
|
|
|
|
|
13 => '{3}на[10]', |
|
136
|
|
|
|
|
|
|
13 => '{3}на[10]', |
|
137
|
|
|
|
|
|
|
14 => '{4}на[10]', |
|
138
|
|
|
|
|
|
|
15 => '{5}на[10]', |
|
139
|
|
|
|
|
|
|
16 => '{6}на[10]', |
|
140
|
|
|
|
|
|
|
17 => '{7}на[10]', |
|
141
|
|
|
|
|
|
|
18 => '{8}на[10]', |
|
142
|
|
|
|
|
|
|
19 => '{9}на[10]', |
|
143
|
|
|
|
|
|
|
20 => 'два[10]', |
|
144
|
|
|
|
|
|
|
30 => '{3}[10]', |
|
145
|
|
|
|
|
|
|
40 => '{4}[10]', |
|
146
|
|
|
|
|
|
|
50 => '{5}[10]', |
|
147
|
|
|
|
|
|
|
60 => '{6}[10]', |
|
148
|
|
|
|
|
|
|
70 => '{7}[10]', |
|
149
|
|
|
|
|
|
|
80 => '{8}[10]', |
|
150
|
|
|
|
|
|
|
90 => '{9}[10]', |
|
151
|
|
|
|
|
|
|
100 => '{100}тен', |
|
152
|
|
|
|
|
|
|
1000 => 'хиляден', |
|
153
|
|
|
|
|
|
|
10e6 => '{1e6}ен', |
|
154
|
|
|
|
|
|
|
} |
|
155
|
|
|
|
|
|
|
); |
|
156
|
|
|
|
|
|
|
|
|
157
|
|
|
|
|
|
|
foreach my $lang (keys %ORDINALS) |
|
158
|
|
|
|
|
|
|
{ |
|
159
|
|
|
|
|
|
|
foreach my $val (values %{$ORDINALS{$lang}}) |
|
160
|
|
|
|
|
|
|
{ |
|
161
|
|
|
|
|
|
|
$val = interpolate_string($lang, $val); |
|
162
|
|
|
|
|
|
|
} |
|
163
|
|
|
|
|
|
|
} |
|
164
|
|
|
|
|
|
|
|
|
165
|
|
|
|
|
|
|
foreach my $lang (keys %NUMBER_NAMES) |
|
166
|
|
|
|
|
|
|
{ |
|
167
|
|
|
|
|
|
|
foreach my $val (values %{$NUMBER_NAMES{$lang}}) |
|
168
|
|
|
|
|
|
|
{ |
|
169
|
|
|
|
|
|
|
$val = interpolate_string($lang, $val); |
|
170
|
|
|
|
|
|
|
} |
|
171
|
|
|
|
|
|
|
} |
|
172
|
|
|
|
|
|
|
|
|
173
|
1112
|
100
|
|
1112
|
0
|
4337
|
sub deb { print @_ if $DEBUG } |
|
174
|
|
|
|
|
|
|
|
|
175
|
|
|
|
|
|
|
sub ordinate_to_slavic |
|
176
|
|
|
|
|
|
|
{ |
|
177
|
148
|
|
|
148
|
1
|
5632
|
my $lang = shift; |
|
178
|
148
|
|
|
|
|
636
|
my $number = shift; |
|
179
|
148
|
|
50
|
|
|
759
|
my $options = shift @_ || {}; |
|
180
|
|
|
|
|
|
|
|
|
181
|
148
|
50
|
|
|
|
1032
|
unless ( exists $ORDINALS{$lang} ) |
|
182
|
|
|
|
|
|
|
{ |
|
183
|
0
|
|
|
|
|
0
|
carp("Ordinates for language $lang are unknown, sorry"); |
|
184
|
0
|
|
|
|
|
0
|
return undef; |
|
185
|
|
|
|
|
|
|
} |
|
186
|
|
|
|
|
|
|
|
|
187
|
148
|
|
|
|
|
267
|
my $hash = $ORDINALS{$lang}; |
|
188
|
|
|
|
|
|
|
|
|
189
|
148
|
100
|
|
|
|
3090
|
unless ( $number >= 0 ) |
|
190
|
|
|
|
|
|
|
{ |
|
191
|
2
|
|
|
|
|
369
|
carp("Ordinates must not be negative"); |
|
192
|
2
|
|
|
|
|
12
|
return undef; |
|
193
|
|
|
|
|
|
|
} |
|
194
|
|
|
|
|
|
|
|
|
195
|
146
|
50
|
|
|
|
395
|
unless ( int $number == $number ) |
|
196
|
|
|
|
|
|
|
{ |
|
197
|
0
|
|
|
|
|
0
|
carp("Ordinates can only be integers"); |
|
198
|
0
|
|
|
|
|
0
|
return undef; |
|
199
|
|
|
|
|
|
|
} |
|
200
|
|
|
|
|
|
|
|
|
201
|
146
|
100
|
|
|
|
2998
|
return $hash->{$number} if exists $hash->{$number}; |
|
202
|
|
|
|
|
|
|
|
|
203
|
9
|
|
|
|
|
3323
|
my $max = max(keys %$hash); |
|
204
|
9
|
50
|
|
|
|
44
|
if ($number > $max) |
|
205
|
|
|
|
|
|
|
{ |
|
206
|
0
|
|
|
|
|
0
|
carp("Ordinate $number is above maximum $max and not supported, sorry"); |
|
207
|
0
|
|
|
|
|
0
|
return undef; |
|
208
|
|
|
|
|
|
|
} |
|
209
|
|
|
|
|
|
|
|
|
210
|
9
|
50
|
|
|
|
30
|
if ($lang eq LANG_BG) |
|
211
|
|
|
|
|
|
|
{ |
|
212
|
|
|
|
|
|
|
# we may have a partially expressible ordinate number, which in |
|
213
|
|
|
|
|
|
|
# Bulgarian for a number of N digits is done with N-1 numbers (not |
|
214
|
|
|
|
|
|
|
# ordinals) with no conjunctions, and an 'и' conjunction before the |
|
215
|
|
|
|
|
|
|
# last one (N) as an ordinal. Effectively it turns out to be the |
|
216
|
|
|
|
|
|
|
# number without the least significant digit, then 'и', then the |
|
217
|
|
|
|
|
|
|
# ordinal of the least significant digit. The exceptions should be |
|
218
|
|
|
|
|
|
|
# handled by $ORDINALS. |
|
219
|
|
|
|
|
|
|
|
|
220
|
9
|
|
|
|
|
14
|
my $out = ''; |
|
221
|
|
|
|
|
|
|
|
|
222
|
9
|
|
|
|
|
23
|
my $bot = $number % 10; |
|
223
|
9
|
|
|
|
|
15
|
my $top = $number - $bot; |
|
224
|
9
|
|
|
|
|
27
|
return interpolate_string($lang, "{{$top}@{[NO_CONJUNCTIONS()]}} и [$bot]"); |
|
|
9
|
|
|
|
|
57
|
|
|
225
|
|
|
|
|
|
|
} |
|
226
|
|
|
|
|
|
|
|
|
227
|
0
|
|
|
|
|
0
|
carp("The ordinate for $number in language '$lang' couldn't be found, sorry"); |
|
228
|
0
|
|
|
|
|
0
|
return undef; |
|
229
|
|
|
|
|
|
|
} |
|
230
|
|
|
|
|
|
|
|
|
231
|
|
|
|
|
|
|
sub bulgarian_triplets |
|
232
|
|
|
|
|
|
|
{ |
|
233
|
145
|
|
|
145
|
0
|
210
|
my $lang = LANG_BG; |
|
234
|
145
|
|
|
|
|
207
|
my $hash = shift; |
|
235
|
145
|
|
|
|
|
189
|
my $tri = shift; |
|
236
|
145
|
|
50
|
|
|
389
|
my $options = shift @_ || {}; |
|
237
|
|
|
|
|
|
|
|
|
238
|
145
|
|
|
|
|
31836
|
my $pow = 0; |
|
239
|
145
|
|
|
|
|
517
|
foreach my $t (@$tri) # this is a triplet |
|
240
|
|
|
|
|
|
|
{ |
|
241
|
275
|
|
|
|
|
644
|
my $some_left = scalar @$tri > $pow/3; # true if we're not at end of @$tri yet |
|
242
|
|
|
|
|
|
|
# convert to scientific notation |
|
243
|
275
|
|
|
|
|
366
|
my $canon_power = $pow; |
|
244
|
275
|
|
|
|
|
322
|
my $canon_t = $t; |
|
245
|
275
|
50
|
|
|
|
1495
|
if ($t =~ m/$RE{num}{real}{-sep=>'[,.]?'}{-keep}/) |
|
246
|
|
|
|
|
|
|
{ |
|
247
|
275
|
|
50
|
|
|
71253
|
$canon_power = $8 || 0; |
|
248
|
275
|
|
|
|
|
540
|
$canon_t = $3; |
|
249
|
|
|
|
|
|
|
} |
|
250
|
|
|
|
|
|
|
else |
|
251
|
|
|
|
|
|
|
{ |
|
252
|
0
|
|
|
|
|
0
|
while ($canon_t >= 10) |
|
253
|
|
|
|
|
|
|
{ |
|
254
|
0
|
|
|
|
|
0
|
$canon_t /= 10; |
|
255
|
0
|
|
|
|
|
0
|
$canon_power ++; |
|
256
|
|
|
|
|
|
|
} |
|
257
|
|
|
|
|
|
|
} |
|
258
|
|
|
|
|
|
|
|
|
259
|
275
|
|
|
|
|
3255
|
my $canon = "${canon_t}e$canon_power"; |
|
260
|
|
|
|
|
|
|
|
|
261
|
275
|
|
|
|
|
942
|
deb("Working on triplet $t (power $pow, canonical $canon)\n"); |
|
262
|
275
|
50
|
|
|
|
1046
|
if (exists $hash->{$canon}) |
|
|
|
100
|
|
|
|
|
|
|
263
|
|
|
|
|
|
|
{ |
|
264
|
0
|
|
|
|
|
0
|
$t = $hash->{$canon}; |
|
265
|
|
|
|
|
|
|
} |
|
266
|
|
|
|
|
|
|
elsif ($t == 0) # handle 0 and '000' strings |
|
267
|
|
|
|
|
|
|
{ |
|
268
|
88
|
50
|
|
|
|
201
|
if (scalar @$tri == 1) # is the zero the only number? |
|
269
|
|
|
|
|
|
|
{ |
|
270
|
0
|
|
|
|
|
0
|
$t = 0; |
|
271
|
0
|
|
|
|
|
0
|
redo; |
|
272
|
|
|
|
|
|
|
} |
|
273
|
|
|
|
|
|
|
else |
|
274
|
|
|
|
|
|
|
{ |
|
275
|
88
|
|
|
|
|
138
|
$t = ''; # don't do anything with uninteresting zeroes |
|
276
|
|
|
|
|
|
|
} |
|
277
|
|
|
|
|
|
|
} |
|
278
|
|
|
|
|
|
|
else |
|
279
|
|
|
|
|
|
|
{ |
|
280
|
|
|
|
|
|
|
# try decomposing $t |
|
281
|
|
|
|
|
|
|
|
|
282
|
|
|
|
|
|
|
# get rid of scientific notation |
|
283
|
187
|
|
|
|
|
336
|
$t =~ s/(\d+)e(\d+)/$1 . 0 x $2/e; |
|
|
0
|
|
|
|
|
0
|
|
|
284
|
|
|
|
|
|
|
|
|
285
|
|
|
|
|
|
|
# first, set up the qualifier |
|
286
|
187
|
|
|
|
|
469
|
deb("getting qualifier and gender for $t\n"); |
|
287
|
|
|
|
|
|
|
|
|
288
|
187
|
|
|
|
|
313
|
my $qualifier = ''; |
|
289
|
187
|
|
|
|
|
244
|
my $inflexion = ''; |
|
290
|
187
|
|
|
|
|
262
|
my $extra_а = ''; |
|
291
|
|
|
|
|
|
|
|
|
292
|
187
|
100
|
|
|
|
444
|
if ($pow) |
|
293
|
|
|
|
|
|
|
{ |
|
294
|
84
|
|
|
|
|
271
|
$qualifier = number_to_slavic($lang, "1e$pow"); |
|
295
|
84
|
|
|
|
|
210
|
$inflexion = MASCULINE_GENDER; # all but thousands are masculine |
|
296
|
84
|
|
|
|
|
126
|
$extra_а = 'а'; # and all have 'a' when plural (singular cases are caught by the %NUMBER_NAMES hash) |
|
297
|
|
|
|
|
|
|
|
|
298
|
84
|
100
|
|
|
|
221
|
if ($pow eq 3) # thousands are a special case for gender, being feminine |
|
299
|
|
|
|
|
|
|
{ |
|
300
|
62
|
|
|
|
|
141
|
$qualifier = 'хиляди'; |
|
301
|
62
|
|
|
|
|
129
|
$inflexion = FEMININE_GENDER; |
|
302
|
62
|
|
|
|
|
103
|
$extra_а = ''; # no extra 'a' for thousands |
|
303
|
|
|
|
|
|
|
} |
|
304
|
|
|
|
|
|
|
} |
|
305
|
|
|
|
|
|
|
|
|
306
|
187
|
|
|
|
|
316
|
$qualifier .= $extra_а; |
|
307
|
|
|
|
|
|
|
|
|
308
|
187
|
|
|
|
|
692
|
my @n = split //, $t; |
|
309
|
187
|
|
|
|
|
671
|
shift @n while 0 == $n[0]; # remove the leading zeroes |
|
310
|
187
|
|
|
|
|
690
|
deb("decomposing $t, result [@n]\n"); |
|
311
|
187
|
|
|
|
|
297
|
my @inter; |
|
312
|
187
|
|
|
|
|
439
|
while (@n) |
|
313
|
|
|
|
|
|
|
{ |
|
314
|
358
|
|
|
|
|
647
|
my $decompose_num = shift @n; |
|
315
|
358
|
|
|
|
|
647
|
my $decompose_pow = scalar @n; |
|
316
|
|
|
|
|
|
|
|
|
317
|
|
|
|
|
|
|
# grab the next digit for numbers 10 .. 20 |
|
318
|
358
|
100
|
100
|
|
|
2005
|
if (($decompose_num == 1 && scalar @n == 1) || |
|
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
|
|
66
|
|
|
|
|
|
319
|
|
|
|
|
|
|
($decompose_num == 2 && scalar @n == 1 && $n[0] == 0)) |
|
320
|
|
|
|
|
|
|
{ |
|
321
|
32
|
|
|
|
|
102
|
$decompose_num .= shift @n; |
|
322
|
32
|
|
|
|
|
51
|
$decompose_pow = 0; |
|
323
|
|
|
|
|
|
|
} |
|
324
|
|
|
|
|
|
|
|
|
325
|
358
|
100
|
|
|
|
741
|
next unless $decompose_num; # skip zeroes |
|
326
|
|
|
|
|
|
|
|
|
327
|
301
|
|
|
|
|
375
|
my $extra_и = ''; |
|
328
|
|
|
|
|
|
|
# numbers below 21 are one word, so in cases like 1001 (хиляда и едно) a conjunction is needed |
|
329
|
|
|
|
|
|
|
# ditto for 100..900 |
|
330
|
301
|
100
|
66
|
|
|
2278
|
if ( |
|
|
|
|
33
|
|
|
|
|
|
331
|
|
|
|
|
|
|
# $some_left tells us there are more triplets to come |
|
332
|
|
|
|
|
|
|
$some_left && |
|
333
|
|
|
|
|
|
|
( |
|
334
|
|
|
|
|
|
|
($decompose_num <= 20 && scalar @n == 0) || # 1..20 |
|
335
|
|
|
|
|
|
|
(scalar @n == 2 && $n[0] == 0 && $n[1] == 0) # N00 |
|
336
|
|
|
|
|
|
|
) |
|
337
|
|
|
|
|
|
|
) |
|
338
|
|
|
|
|
|
|
{ |
|
339
|
186
|
|
|
|
|
262
|
$extra_и = ' '; |
|
340
|
|
|
|
|
|
|
} |
|
341
|
|
|
|
|
|
|
|
|
342
|
301
|
|
|
|
|
1810
|
push @inter, sprintf("%s{%s%s}", $extra_и, $decompose_num, '0'x$decompose_pow); |
|
343
|
|
|
|
|
|
|
} |
|
344
|
|
|
|
|
|
|
|
|
345
|
187
|
|
|
|
|
2789
|
my @inter_options = (NO_CONJUNCTIONS); |
|
346
|
187
|
100
|
|
|
|
413
|
push @inter_options, $inflexion if $inflexion; |
|
347
|
187
|
|
|
|
|
359
|
my $inter_options = join ':', @inter_options; |
|
348
|
|
|
|
|
|
|
|
|
349
|
187
|
|
|
|
|
1570
|
$inter[-1] =~ s/({.*})/{$1$inter_options}/; |
|
350
|
|
|
|
|
|
|
|
|
351
|
187
|
|
|
|
|
425
|
my $inter = join(' ', @inter); |
|
352
|
187
|
|
|
|
|
528
|
deb("bulgarian_triplets calling interpolate_string with [$inter]\n"); |
|
353
|
187
|
|
|
|
|
437
|
$inter = interpolate_string($lang, $inter); |
|
354
|
|
|
|
|
|
|
|
|
355
|
187
|
50
|
|
|
|
516
|
if (defined $inter) |
|
356
|
|
|
|
|
|
|
{ |
|
357
|
187
|
|
|
|
|
424
|
$t = $inter; |
|
358
|
|
|
|
|
|
|
# add the final conjunction if requested |
|
359
|
187
|
100
|
|
|
|
2397
|
$t =~ s/\s(\w+)$/ и $1/ unless $options->{NO_CONJUNCTIONS()}; |
|
360
|
187
|
100
|
|
|
|
626
|
$t .= " ${qualifier}" if $qualifier; # add the qualifier |
|
361
|
187
|
|
|
|
|
724
|
$t =~ s/^\s+//g; # replace leading/ending spaces |
|
362
|
187
|
|
|
|
|
1205
|
$t =~ s/\s+$//g; # replace leading/ending spaces |
|
363
|
|
|
|
|
|
|
} |
|
364
|
|
|
|
|
|
|
else |
|
365
|
|
|
|
|
|
|
{ |
|
366
|
0
|
|
|
|
|
0
|
carp "Couldn't convert $canon"; |
|
367
|
|
|
|
|
|
|
} |
|
368
|
|
|
|
|
|
|
} |
|
369
|
|
|
|
|
|
|
|
|
370
|
275
|
|
|
|
|
932
|
$pow+=3; |
|
371
|
|
|
|
|
|
|
} |
|
372
|
|
|
|
|
|
|
|
|
373
|
145
|
|
|
|
|
561
|
@$tri = reverse @$tri; |
|
374
|
|
|
|
|
|
|
|
|
375
|
145
|
|
|
|
|
634
|
return "@$tri"; |
|
376
|
|
|
|
|
|
|
} |
|
377
|
|
|
|
|
|
|
|
|
378
|
|
|
|
|
|
|
sub find_known |
|
379
|
|
|
|
|
|
|
{ |
|
380
|
2358
|
|
|
2358
|
0
|
4393
|
my $lang = shift; |
|
381
|
2358
|
|
|
|
|
3828
|
my $hash = shift; |
|
382
|
2358
|
|
|
|
|
3170
|
my $number = shift; |
|
383
|
2358
|
|
50
|
|
|
5697
|
my $options = shift @_ || {}; |
|
384
|
|
|
|
|
|
|
|
|
385
|
2358
|
|
|
|
|
4086
|
foreach my $gender (FEMININE_GENDER(), MASCULINE_GENDER()) |
|
386
|
|
|
|
|
|
|
{ |
|
387
|
4672
|
100
|
100
|
|
|
20048
|
return $INFLEXIONS{$lang}->{$gender}->{$number} |
|
388
|
|
|
|
|
|
|
if (exists $options->{$gender} && |
|
389
|
|
|
|
|
|
|
exists $INFLEXIONS{$lang}->{$gender}->{$number}); |
|
390
|
|
|
|
|
|
|
} |
|
391
|
|
|
|
|
|
|
|
|
392
|
2308
|
100
|
|
|
|
20345
|
return $hash->{$number} if exists $hash->{$number}; |
|
393
|
|
|
|
|
|
|
|
|
394
|
156
|
|
|
|
|
486
|
return undef; |
|
395
|
|
|
|
|
|
|
} |
|
396
|
|
|
|
|
|
|
|
|
397
|
|
|
|
|
|
|
sub number_to_slavic |
|
398
|
|
|
|
|
|
|
{ |
|
399
|
1258
|
|
|
1258
|
1
|
38442
|
my $lang = shift; |
|
400
|
1258
|
|
|
|
|
2586
|
my $number = shift; |
|
401
|
1258
|
|
100
|
|
|
22442
|
my $options = shift @_ || {}; |
|
402
|
|
|
|
|
|
|
|
|
403
|
|
|
|
|
|
|
# carp("Language $lang, number $number"); |
|
404
|
|
|
|
|
|
|
|
|
405
|
1258
|
100
|
66
|
|
|
17658
|
if ($number !~ m/^$RE{num}{int}$/ && $number !~ m/^$RE{num}{real}$/) |
|
406
|
|
|
|
|
|
|
{ |
|
407
|
2
|
|
|
|
|
1086
|
carp("Number $number doesn't appear to be a real number, sorry"); |
|
408
|
2
|
|
|
|
|
14
|
return undef; |
|
409
|
|
|
|
|
|
|
} |
|
410
|
|
|
|
|
|
|
|
|
411
|
1256
|
|
|
|
|
247756
|
$number =~ s/\+//g; |
|
412
|
1256
|
50
|
|
|
|
3864
|
unless ( exists $NUMBER_NAMES{$lang} ) |
|
413
|
|
|
|
|
|
|
{ |
|
414
|
0
|
|
|
|
|
0
|
carp("Numbers for language $lang are unknown, sorry"); |
|
415
|
0
|
|
|
|
|
0
|
return undef; |
|
416
|
|
|
|
|
|
|
} |
|
417
|
|
|
|
|
|
|
|
|
418
|
1256
|
|
|
|
|
2123
|
my $hash = $NUMBER_NAMES{$lang}; |
|
419
|
|
|
|
|
|
|
|
|
420
|
1256
|
|
|
|
|
42205
|
my $max = max(keys %$hash); |
|
421
|
1256
|
100
|
|
|
|
8512
|
if ($number > $max) |
|
422
|
|
|
|
|
|
|
{ |
|
423
|
1
|
|
|
|
|
227
|
carp("Number $number is above maximum $max and not supported, sorry"); |
|
424
|
1
|
|
|
|
|
9
|
return undef; |
|
425
|
|
|
|
|
|
|
} |
|
426
|
|
|
|
|
|
|
|
|
427
|
1255
|
100
|
|
|
|
3119
|
return find_known($lang, $hash, $number, $options) if defined find_known($lang, $hash, $number, $options); |
|
428
|
|
|
|
|
|
|
|
|
429
|
154
|
100
|
|
|
|
550
|
return "$MINUS " . number_to_slavic($lang, $1) if $number =~ m/-\s*(.*)/; |
|
430
|
|
|
|
|
|
|
|
|
431
|
|
|
|
|
|
|
# normalize to scientific notation if exponent is specified, then expand |
|
432
|
145
|
50
|
|
|
|
695
|
if ($number =~ m/$RE{num}{real}{-sep=>'[,.]?'}{-keep}/) |
|
433
|
|
|
|
|
|
|
{ |
|
434
|
145
|
|
|
|
|
37951
|
my $power = $8; |
|
435
|
145
|
|
|
|
|
323
|
my $num = $3; |
|
436
|
145
|
100
|
|
|
|
414
|
if ($power) |
|
437
|
|
|
|
|
|
|
{ |
|
438
|
1
|
|
|
|
|
5
|
while ($num >= 10) |
|
439
|
|
|
|
|
|
|
{ |
|
440
|
1
|
|
|
|
|
3
|
$num /= 10; |
|
441
|
1
|
|
|
|
|
4
|
$power++; |
|
442
|
|
|
|
|
|
|
} |
|
443
|
|
|
|
|
|
|
|
|
444
|
1
|
50
|
|
|
|
3
|
return find_known($lang, $hash, $number, $options) if defined find_known($lang, $hash, $number, $options); |
|
445
|
|
|
|
|
|
|
|
|
446
|
1
|
|
66
|
|
|
9
|
while ($num && int $num != $num) |
|
447
|
|
|
|
|
|
|
{ |
|
448
|
1
|
|
|
|
|
3
|
$num *= 10; |
|
449
|
1
|
|
|
|
|
6
|
$power--; |
|
450
|
|
|
|
|
|
|
} |
|
451
|
|
|
|
|
|
|
|
|
452
|
1
|
|
|
|
|
6
|
$number = $num . '0' x $power; |
|
453
|
|
|
|
|
|
|
|
|
454
|
1
|
50
|
|
|
|
3
|
return find_known($lang, $hash, $number, $options) if defined find_known($lang, $hash, $number, $options); |
|
455
|
|
|
|
|
|
|
|
|
456
|
1
|
|
|
|
|
8
|
deb("finally, got power $power and number $num => $number\n"); |
|
457
|
|
|
|
|
|
|
} |
|
458
|
|
|
|
|
|
|
} |
|
459
|
|
|
|
|
|
|
|
|
460
|
145
|
50
|
|
|
|
14463
|
if (LANG_BG eq $lang) |
|
461
|
|
|
|
|
|
|
{ |
|
462
|
|
|
|
|
|
|
# build the intepretation from the number's digits |
|
463
|
145
|
|
|
|
|
227
|
my @components; |
|
464
|
145
|
|
|
|
|
617
|
my @parts = split /[.,]/, $number, 2; |
|
465
|
145
|
|
50
|
|
|
706
|
$parts[1] ||= ''; # always provide a floating part if it doesn't come with the number |
|
466
|
|
|
|
|
|
|
|
|
467
|
145
|
|
|
|
|
223
|
my $n = $parts[0]; |
|
468
|
145
|
|
|
|
|
175
|
my @n; |
|
469
|
145
|
|
|
|
|
427
|
while ($n) |
|
470
|
|
|
|
|
|
|
{ |
|
471
|
275
|
|
|
|
|
377
|
my $old_n = $n; |
|
472
|
275
|
|
|
|
|
531
|
my $triplet = substr $n, -3, 3, ''; |
|
473
|
275
|
|
|
|
|
859
|
deb("grabbing triplet from $old_n resulting in $n and $triplet\n"); |
|
474
|
275
|
|
|
|
|
893
|
push @n, $triplet; |
|
475
|
|
|
|
|
|
|
} |
|
476
|
|
|
|
|
|
|
|
|
477
|
145
|
|
|
|
|
374
|
my $out = bulgarian_triplets($hash, \@n, $options); |
|
478
|
|
|
|
|
|
|
# clean spaces |
|
479
|
145
|
|
|
|
|
690
|
$out =~ s/^\s*//; |
|
480
|
145
|
|
|
|
|
1102
|
$out =~ s/\s*$//; |
|
481
|
145
|
|
|
|
|
914
|
$out =~ s/\s+/ /g; |
|
482
|
|
|
|
|
|
|
# fix annoying bugs |
|
483
|
|
|
|
|
|
|
|
|
484
|
|
|
|
|
|
|
# remove leading и |
|
485
|
145
|
|
|
|
|
796
|
$out =~ s/^и\s+//g; |
|
486
|
|
|
|
|
|
|
# fix една хиляди |
|
487
|
145
|
|
|
|
|
291
|
$out =~ s/^една хиляди/хиляда/; |
|
488
|
145
|
|
|
|
|
1033
|
return $out; |
|
489
|
|
|
|
|
|
|
} |
|
490
|
|
|
|
|
|
|
|
|
491
|
0
|
|
|
|
|
0
|
carp("The number representation of $number in language '$lang' couldn't be found, sorry"); |
|
492
|
0
|
|
|
|
|
0
|
my $opt_string = join '//', sort keys %$options; |
|
493
|
0
|
0
|
|
|
|
0
|
$opt_string = "//$opt_string" if $opt_string; |
|
494
|
0
|
|
|
|
|
0
|
return "$number$opt_string"; |
|
495
|
|
|
|
|
|
|
} |
|
496
|
|
|
|
|
|
|
|
|
497
|
|
|
|
|
|
|
# |
|
498
|
|
|
|
|
|
|
# OO Methods |
|
499
|
|
|
|
|
|
|
# |
|
500
|
|
|
|
|
|
|
sub new { |
|
501
|
70
|
|
|
70
|
0
|
31958
|
my $class = shift; |
|
502
|
70
|
|
|
|
|
107
|
my $number = shift; |
|
503
|
70
|
|
|
|
|
107
|
my $lang = shift; |
|
504
|
70
|
|
|
|
|
487
|
bless { num => $number, lang => $lang}, $class; |
|
505
|
|
|
|
|
|
|
} |
|
506
|
|
|
|
|
|
|
|
|
507
|
|
|
|
|
|
|
sub parse { |
|
508
|
0
|
|
|
0
|
0
|
0
|
my $self = shift; |
|
509
|
0
|
0
|
|
|
|
0
|
if ( $_[0] ) |
|
510
|
|
|
|
|
|
|
{ |
|
511
|
0
|
|
|
|
|
0
|
$self->{num} = shift; |
|
512
|
|
|
|
|
|
|
} |
|
513
|
0
|
0
|
|
|
|
0
|
if ( $_[1] ) |
|
514
|
|
|
|
|
|
|
{ |
|
515
|
0
|
|
|
|
|
0
|
$self->{lang} = shift; |
|
516
|
|
|
|
|
|
|
} |
|
517
|
0
|
|
|
|
|
0
|
$self; |
|
518
|
|
|
|
|
|
|
} |
|
519
|
|
|
|
|
|
|
|
|
520
|
|
|
|
|
|
|
sub get_string |
|
521
|
|
|
|
|
|
|
{ |
|
522
|
70
|
|
|
70
|
0
|
14797
|
my $self = shift; |
|
523
|
70
|
|
|
|
|
270
|
return number_to_slavic($self->{lang}, $self->{num}); |
|
524
|
|
|
|
|
|
|
} |
|
525
|
|
|
|
|
|
|
|
|
526
|
|
|
|
|
|
|
sub get_ordinate |
|
527
|
|
|
|
|
|
|
{ |
|
528
|
0
|
|
|
0
|
0
|
0
|
my $self = shift; |
|
529
|
0
|
|
|
|
|
0
|
return ordinate_to_slavic($self->{lang}, $self->{num}); |
|
530
|
|
|
|
|
|
|
} |
|
531
|
|
|
|
|
|
|
|
|
532
|
|
|
|
|
|
|
### cperl-mode doesn't like this, so I put it at the end |
|
533
|
|
|
|
|
|
|
sub interpolate_string |
|
534
|
|
|
|
|
|
|
{ |
|
535
|
861
|
|
|
861
|
0
|
1321
|
my $lang = shift; |
|
536
|
861
|
|
|
|
|
1241
|
my $data = shift; |
|
537
|
|
|
|
|
|
|
|
|
538
|
|
|
|
|
|
|
|
|
539
|
861
|
|
100
|
|
|
5445
|
while ($data =~ m/\[$RE{num}{real}{-sep=>'[,.]?'}\]+/ || # [number] |
|
540
|
|
|
|
|
|
|
$data =~ m/{$RE{num}{real}{-sep=>'[,.]?'}}+/) # {number} |
|
541
|
|
|
|
|
|
|
{ |
|
542
|
683
|
|
|
|
|
274392
|
$data =~ s/{ |
|
543
|
|
|
|
|
|
|
{ |
|
544
|
|
|
|
|
|
|
$RE{num}{dec}{-sep=>'[,.]?'}{-keep} |
|
545
|
|
|
|
|
|
|
} |
|
546
|
|
|
|
|
|
|
([:\w]+)? |
|
547
|
|
|
|
|
|
|
} |
|
548
|
|
|
|
|
|
|
/ |
|
549
|
280
|
|
|
|
|
1127
|
number_to_slavic($lang, |
|
550
|
|
|
|
|
|
|
$1, |
|
551
|
196
|
|
|
|
|
43492
|
{ map { $_ => 1 } split(':', $11) } |
|
552
|
|
|
|
|
|
|
) |
|
553
|
|
|
|
|
|
|
/giex; |
|
554
|
|
|
|
|
|
|
|
|
555
|
683
|
|
|
|
|
147494
|
$data =~ s/ |
|
556
|
|
|
|
|
|
|
{ |
|
557
|
755
|
|
|
|
|
179725
|
$RE{num}{dec}{-sep=>'[,.]?'}{-keep} |
|
558
|
|
|
|
|
|
|
} |
|
559
|
|
|
|
|
|
|
/number_to_slavic($lang, $1)/giex; |
|
560
|
|
|
|
|
|
|
|
|
561
|
683
|
|
|
|
|
38235
|
$data =~ s/ |
|
562
|
|
|
|
|
|
|
\[ |
|
563
|
|
|
|
|
|
|
\[ |
|
564
|
|
|
|
|
|
|
$RE{num}{real}{-sep=>'[,.]?'}{-keep} |
|
565
|
|
|
|
|
|
|
\] |
|
566
|
|
|
|
|
|
|
([:\w]+)? |
|
567
|
|
|
|
|
|
|
\] |
|
568
|
|
|
|
|
|
|
/ |
|
569
|
0
|
|
|
|
|
0
|
ordinate_to_slavic( |
|
570
|
|
|
|
|
|
|
$lang, |
|
571
|
|
|
|
|
|
|
$1, |
|
572
|
0
|
|
|
|
|
0
|
{ map { $_ => 1 } split(':', $2) } |
|
573
|
|
|
|
|
|
|
) |
|
574
|
|
|
|
|
|
|
/giex; |
|
575
|
|
|
|
|
|
|
|
|
576
|
683
|
|
|
|
|
191225
|
$data =~ s/ |
|
577
|
|
|
|
|
|
|
\[ |
|
578
|
128
|
|
|
|
|
52930
|
$RE{num}{real}{-sep=>'[,.]?'}{-keep} |
|
579
|
|
|
|
|
|
|
\] |
|
580
|
|
|
|
|
|
|
/ordinate_to_slavic($lang, $1)/giex; |
|
581
|
|
|
|
|
|
|
} |
|
582
|
861
|
|
|
|
|
543851
|
return $data; |
|
583
|
|
|
|
|
|
|
} |
|
584
|
|
|
|
|
|
|
|
|
585
|
|
|
|
|
|
|
|
|
586
|
|
|
|
|
|
|
1; |
|
587
|
|
|
|
|
|
|
|
|
588
|
|
|
|
|
|
|
__END__ |