line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
# Copyright 2010, 2011, 2012 Kevin Ryde |
2
|
|
|
|
|
|
|
|
3
|
|
|
|
|
|
|
# This file is part of Math-Aronson. |
4
|
|
|
|
|
|
|
# |
5
|
|
|
|
|
|
|
# Math-Aronson is free software; you can redistribute it and/or modify |
6
|
|
|
|
|
|
|
# it under the terms of the GNU General Public License as published by the |
7
|
|
|
|
|
|
|
# Free Software Foundation; either version 3, or (at your option) any later |
8
|
|
|
|
|
|
|
# version. |
9
|
|
|
|
|
|
|
# |
10
|
|
|
|
|
|
|
# Math-Aronson is distributed in the hope that it will be useful, but |
11
|
|
|
|
|
|
|
# WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY |
12
|
|
|
|
|
|
|
# or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
13
|
|
|
|
|
|
|
# for more details. |
14
|
|
|
|
|
|
|
# |
15
|
|
|
|
|
|
|
# You should have received a copy of the GNU General Public License along |
16
|
|
|
|
|
|
|
# with Math-Aronson. If not, see <http://www.gnu.org/licenses/>. |
17
|
|
|
|
|
|
|
|
18
|
|
|
|
|
|
|
package Math::Aronson; |
19
|
3
|
|
|
3
|
|
36790
|
use 5.004; |
|
3
|
|
|
|
|
13
|
|
|
3
|
|
|
|
|
124
|
|
20
|
3
|
|
|
3
|
|
18
|
use strict; |
|
3
|
|
|
|
|
6
|
|
|
3
|
|
|
|
|
95
|
|
21
|
3
|
|
|
3
|
|
15
|
use Carp; |
|
3
|
|
|
|
|
9
|
|
|
3
|
|
|
|
|
244
|
|
22
|
|
|
|
|
|
|
|
23
|
|
|
|
|
|
|
# uncomment this to run the ### lines |
24
|
|
|
|
|
|
|
#use Devel::Comments; |
25
|
|
|
|
|
|
|
|
26
|
3
|
|
|
3
|
|
15
|
use vars '$VERSION'; |
|
3
|
|
|
|
|
6
|
|
|
3
|
|
|
|
|
496
|
|
27
|
|
|
|
|
|
|
$VERSION = 9; |
28
|
|
|
|
|
|
|
|
29
|
|
|
|
|
|
|
# maybe a hi=>$limit option to stop the ret or queue building up beyond a |
30
|
|
|
|
|
|
|
# desired point |
31
|
|
|
|
|
|
|
|
32
|
|
|
|
|
|
|
|
33
|
|
|
|
|
|
|
# $unaccent is a code ref called as $unaccent->($str).  It modifies its
# argument in place (through the @_ alias), replacing accented letters by
# their plain equivalents.
#
# When Unicode::Normalize can be loaded the string is decomposed to form D
# and the combining marks are deleted.  Otherwise a fixed latin-1 table is
# applied with tr///.
my $unaccent;
BEGIN {
  my $have_normalize = eval {
    require Unicode::Normalize;
    Unicode::Normalize->import('normalize');
    1;
  };

  if ($have_normalize) {
    $unaccent = sub {
      ### unaccent: $_[0]
      # uncombine the latin-1 etc equivs ...
      $_[0] = normalize('D', $_[0]);
      # ... then strip the zero-width marks
      $_[0] =~ s/\pM+//g;
    };
  } else {
    $unaccent = sub {
      # latin-1, generated by devel/unaccent.pl
      $_[0] =~ tr/\300\301\302\303\304\305\307\310\311\312\313\314\315\316\317\321\322\323\324\325\326\331\332\333\334\335\340\341\342\343\344\345\347\350\351\352\353\354\355\356\357\361\362\363\364\365\366\371\372\373\374\375\377/AAAAAACEEEEIIIINOOOOOUUUUYaaaaaaceeeeiiiinooooouuuuyy/;
    };
  }
}
48
|
|
|
|
|
|
|
|
49
|
|
|
|
|
|
|
# Per-language defaults used by new() when the caller gives no "letter"
# and/or no "initial_string".  Keys are the "lang" option values.
my %default_letter         = (en => 'T',
                              fr => 'E');
my %default_initial_string = (en => 'is the',
                              fr => 'est la');
53
|
|
|
|
|
|
|
# $obj = Math::Aronson->new (key => value, ...)
#
# Create and return a new sequence object.  Options read here:
#
#   lang                  language code, default 'en'; 'en' and 'fr' have
#                         built-in defaults, anything else goes to
#                         Lingua::Any::Numbers unless ordinal_func is given
#   letter                letter to look for; default per language, or the
#                         first character of the munged initial_string
#   initial_string        starting text; default is letter plus the
#                         per-language default string
#   lying                 boolean, invert the letter test
#   without_conjunctions  boolean, strip the conjunction word from strings
#   conjunctions_word     the conjunction word, default 'and' (en) / 'et' (fr)
#   ordinal_func          code ref taking a number and returning its ordinal
#                         as a string
#
# Croaks if no initial_string is given and the language has no default.
#
# The object holds "ret" (positions ready to be returned), "queue"
# (positions returned but not yet expanded to ordinal text) and "upto"
# (the position the next piece of text will start at).
#
sub new {
  my $class = shift;
  ### Aronson new(): @_

  my @ret;
  my $self = bless { ret   => \@ret,
                     queue => [ ],
                     @_
                   }, $class;

  # 1 or '' for use with xor
  $self->{'lying'} = !! $self->{'lying'};

  my $lang = ($self->{'lang'} ||= 'en');  # default
  if ($lang eq 'en') {
    %$self = (conjunctions_word => 'and',
              %$self);
  } elsif ($lang eq 'fr') {
    %$self = (conjunctions_word => 'et',
              %$self);
  }
  # for oeis_anum()
  $self->{'lang'} = ($self->{'ordinal_func'} ? 'func' : lc($lang));

  my $without_conjunctions = delete $self->{'without_conjunctions'};
  my $conjunctions_word = delete $self->{'conjunctions_word'};

  # 'x' when a built-in language is used with a conjunction word other than
  # its standard one, otherwise 1 or 0 for conjunctions kept or stripped.
  # The two language clauses are alternatives, so they are joined with "||";
  # joined with "&&" the test could never be true since $lang cannot be both
  # 'en' and 'fr'.
  my $word_cmp = (defined $conjunctions_word ? $conjunctions_word : '');
  my $nonstandard_word = (($lang eq 'en' && $word_cmp ne 'and')
                          || ($lang eq 'fr' && $word_cmp ne 'et'));
  $self->{'conjunctions'}
    = ($nonstandard_word
       ? 'x'
       : ($without_conjunctions ? 0 : 1));

  # Load a number-to-ordinal module only when the caller gave no function.
  unless ($self->{'ordinal_func'}) {
    if ($lang eq 'en') {
      require Lingua::EN::Numbers;
      Lingua::EN::Numbers->VERSION(1.01); # 1.01 rewrite
      $self->{'ordinal_func'} = \&Lingua::EN::Numbers::num2en_ordinal;
    } elsif ($lang eq 'fr') {
      require Lingua::FR::Numbers;
      $self->{'ordinal_func'} = \&_fr_ordinal;
    } else {
      require Lingua::Any::Numbers;
      $self->{'ordinal_func'} = sub {
        return Lingua::Any::Numbers::to_ordinal($_[0], $lang);
      };
    }
  }

  # Code ref which strips the conjunction word from $_[0] in place, or a
  # no-op when conjunctions are to be kept.
  my $without_conjunctions_func = \&_conjunctions_noop; # no change to strings
  if ($without_conjunctions && defined $conjunctions_word) {
    my $word = lc($conjunctions_word);
    # /g so that every occurrence goes, not just the first; a long ordinal
    # can contain the conjunction more than once
    $without_conjunctions_func = sub { $_[0] =~ s/\b\Q$word\E\b//g };
  }
  $self->{'without_conjunctions_func'} = $without_conjunctions_func;

  my $initial_string = delete $self->{'initial_string'};
  my $letter = $self->{'letter'};

  if (! defined $initial_string) {
    if (! $letter) {
      # default 'T' for en or 'E' for fr
      $letter = $default_letter{$lang};
    }
    $initial_string = $default_initial_string{$lang};
    if (! defined $initial_string) {
      croak "No default initial_string for language '$lang'";
    }
    $initial_string = $letter . $initial_string;
  }

  # munge to plain lower case letters, the same as next() does to ordinals
  $unaccent->($initial_string);
  $initial_string = lc ($initial_string);
  $without_conjunctions_func->($initial_string);
  $initial_string =~ s/(\W|_)+//g;  # strip non alphas
  ### initial: $initial_string

  if (! defined $letter) {
    # initial_string but no letter, take letter as first alphabetical
    $letter = substr($initial_string,0,1);
  }
  unless (length($letter)) {
    # empty letter string no good as will match endlessly, change to a space
    # which will never match
    $letter = ' ';
  }
  $self->{'letter'} = $letter = lc($letter);

  # positions (counting from 1) in the initial string which hold the
  # letter, or which don't hold it when lying
  push @ret,
    grep {(substr($initial_string,$_-1,1) eq $letter) ^ $self->{'lying'}}
      1 .. length($initial_string);
  $self->{'upto'} = 1 + length($initial_string);
  ### initial: $self
  return $self;
}
156
|
|
|
|
|
|
|
|
157
|
110
|
|
|
110
|
|
137
|
# Stand-in for the conjunction stripping function when conjunctions are to
# be kept.  Leaves its argument alone and returns nothing.
sub _conjunctions_noop {
  return;
}
159
|
|
|
|
|
|
|
|
160
|
|
|
|
|
|
|
# $str = _fr_ordinal ($n)
# Return the ordinal of $n from Lingua::FR::Numbers::ordinate_to_fr(),
# except that 'premier' becomes the feminine 'premiere', as in
# "E est la premiere lettre ...".
sub _fr_ordinal {
  my ($n) = @_;
  my $ordinal = Lingua::FR::Numbers::ordinate_to_fr($n);
  return ($ordinal eq 'premier' ? 'premiere' : $ordinal);
}
166
|
|
|
|
|
|
|
|
167
|
|
|
|
|
|
|
|
168
|
|
|
|
|
|
|
# $n = $obj->next()
#
# Return the next position in the sequence, or no value when the sequence
# has ended.
#
# Positions waiting in "ret" are handed out first, each one also being
# appended to "queue".  When "ret" is empty the oldest queued position is
# turned into its ordinal text, the text is munged to plain lower case
# letters, and the positions of the sought letter in that text (or of the
# other letters, when lying) are added to "ret".
#
sub next {
  my $self = shift;
  my $pending = $self->{'ret'};

  while (1) {
    my $n = shift @$pending;
    if ($n) {
      push @{$self->{'queue'}}, $n;
      return $n;
    }

    my $k = shift @{$self->{'queue'}};
    return unless $k;  # end of sequence

    my $text = $self->{'ordinal_func'}->($k);
    ### orig str: $text
    $self->{'without_conjunctions_func'}->($text);
    $unaccent->($text);
    $text = lc ($text);

    # could be s/[[:punct:][:space:]]+//g, but [::] new in 5.005 or something
    $text =~ s/(\W|_)+//g;  # strip non alphas
    ### munged str: $text

    # $base is the sequence position of the first character of $text
    my $base = $self->{'upto'};
    my $want = $self->{'letter'};
    my $len = length($text);
    foreach my $offset (0 .. $len-1) {
      if ((substr($text,$offset,1) eq $want) ^ $self->{'lying'}) {
        push @$pending, $base + $offset;
      }
    }

    $self->{'upto'} = $base + $len;
    ### now upto: $self->{'upto'}
    ### ret: $pending
    ### queue: $self->{'queue'}
  }
}
202
|
|
|
|
|
|
|
|
203
|
|
|
|
|
|
|
1; |
204
|
|
|
|
|
|
|
__END__ |