| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
package HTTP::ClientDetect::Language; |
|
2
|
|
|
|
|
|
|
|
|
3
|
2
|
|
|
2
|
|
3705
|
use 5.006; |
|
|
2
|
|
|
|
|
8
|
|
|
|
2
|
|
|
|
|
88
|
|
|
4
|
2
|
|
|
2
|
|
11
|
use strict; |
|
|
2
|
|
|
|
|
4
|
|
|
|
2
|
|
|
|
|
86
|
|
|
5
|
2
|
|
|
2
|
|
11
|
use warnings FATAL => 'all'; |
|
|
2
|
|
|
|
|
2
|
|
|
|
2
|
|
|
|
|
108
|
|
|
6
|
2
|
|
|
2
|
|
4832
|
use Moo; |
|
|
2
|
|
|
|
|
18130
|
|
|
|
2
|
|
|
|
|
15
|
|
|
7
|
|
|
|
|
|
|
|
|
8
|
2
|
|
|
2
|
|
2976
|
use Locale::Language; |
|
|
2
|
|
|
|
|
424562
|
|
|
|
2
|
|
|
|
|
180
|
|
|
9
|
2
|
|
|
2
|
|
1141
|
use Locale::Country; |
|
|
2
|
|
|
|
|
44369
|
|
|
|
2
|
|
|
|
|
1949
|
|
|
10
|
|
|
|
|
|
|
|
|
11
|
|
|
|
|
|
|
my @languages = all_language_codes(); |
|
12
|
|
|
|
|
|
|
my @countries = all_country_codes(); |
|
13
|
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
my %langs = map { $_ => 1 } @languages; |
|
15
|
|
|
|
|
|
|
my %countrs = map { $_ => 1 } @countries; |
|
16
|
|
|
|
|
|
|
|
|
17
|
|
|
|
|
|
|
=head1 NAME |
|
18
|
|
|
|
|
|
|
|
|
19
|
|
|
|
|
|
|
HTTP::ClientDetect::Language - Lookup the client's preferred language |
|
20
|
|
|
|
|
|
|
|
|
21
|
|
|
|
|
|
|
=head1 VERSION |
|
22
|
|
|
|
|
|
|
|
|
23
|
|
|
|
|
|
|
Version 0.03 |
|
24
|
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
=cut |
|
26
|
|
|
|
|
|
|
|
|
27
|
|
|
|
|
|
|
our $VERSION = '0.03'; |
|
28
|
|
|
|
|
|
|
|
|
29
|
|
|
|
|
|
|
|
|
30
|
|
|
|
|
|
|
=head1 SYNOPSIS |
|
31
|
|
|
|
|
|
|
|
|
32
|
|
|
|
|
|
|
use HTTP::ClientDetect::Language; |
|
33
|
|
|
|
|
|
|
my $lang_detect = HTTP::ClientDetect::Language->new(server_default => "en_US"); |
|
34
|
|
|
|
|
|
|
# inside a Dancer route |
|
35
|
|
|
|
|
|
|
get '/detect' => sub { |
|
36
|
|
|
|
|
|
|
my $req = request; |
|
37
|
|
|
|
|
|
|
my $lang = $lang_detect->language($req); |
|
38
|
|
|
|
|
|
|
} |
|
39
|
|
|
|
|
|
|
|
|
40
|
|
|
|
|
|
|
|
|
41
|
|
|
|
|
|
|
=head1 ACCESSORS |
|
42
|
|
|
|
|
|
|
|
|
43
|
|
|
|
|
|
|
=head2 server_default |
|
44
|
|
|
|
|
|
|
|
|
45
|
|
|
|
|
|
|
The C should be set in the constructor and defaults to |
|
46
|
|
|
|
|
|
|
C. This will be always returned if the lookup fails |
|
47
|
|
|
|
|
|
|
|
|
48
|
|
|
|
|
|
|
=cut |
|
49
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
|
|
51
|
|
|
|
|
|
|
has server_default => (is => 'rw', |
|
52
|
|
|
|
|
|
|
default => sub { return "en_US" }, |
|
53
|
|
|
|
|
|
|
isa => sub { |
|
54
|
|
|
|
|
|
|
die "Bad language $_[0]\n" |
|
55
|
|
|
|
|
|
|
unless __PACKAGE__->check_language_name($_[0]); |
|
56
|
|
|
|
|
|
|
}); |
|
57
|
|
|
|
|
|
|
|
|
58
|
|
|
|
|
|
|
|
|
59
|
|
|
|
|
|
|
=head2 available_languages |
|
60
|
|
|
|
|
|
|
|
|
61
|
|
|
|
|
|
|
Accessor to an arrayref of languages available on the server side. |
|
62
|
|
|
|
|
|
|
Please use the short version (C, not C), otherwise the |
|
63
|
|
|
|
|
|
|
check will be too restrictive. |
|
64
|
|
|
|
|
|
|
|
|
65
|
|
|
|
|
|
|
=cut |
|
66
|
|
|
|
|
|
|
|
|
67
|
|
|
|
|
|
|
has available_languages => (is => 'rw', |
|
68
|
|
|
|
|
|
|
isa => sub { |
|
69
|
|
|
|
|
|
|
my $aref = $_[0]; |
|
70
|
|
|
|
|
|
|
die "Not an arrayref" unless ref($aref) eq 'ARRAY'; |
|
71
|
|
|
|
|
|
|
foreach my $l (@$aref) { |
|
72
|
|
|
|
|
|
|
die "Bad language $l\n" |
|
73
|
|
|
|
|
|
|
unless __PACKAGE__->check_language_name($l); |
|
74
|
|
|
|
|
|
|
} |
|
75
|
|
|
|
|
|
|
}, |
|
76
|
|
|
|
|
|
|
default => sub { [] }, |
|
77
|
|
|
|
|
|
|
); |
|
78
|
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
|
|
80
|
|
|
|
|
|
|
=head1 SUBROUTINES/METHODS |
|
81
|
|
|
|
|
|
|
|
|
82
|
|
|
|
|
|
|
=head2 language($request_obj) |
|
83
|
|
|
|
|
|
|
|
|
84
|
|
|
|
|
|
|
Return the preferred language of the request. The request object |
|
85
|
|
|
|
|
|
|
should an object which has the methods C or C |
|
86
|
|
|
|
|
|
|
|
|
87
|
|
|
|
|
|
|
From L: |
|
88
|
|
|
|
|
|
|
|
|
89
|
|
|
|
|
|
|
The Accept-Language request-header field is similar to Accept, but |
|
90
|
|
|
|
|
|
|
restricts the set of natural languages that are preferred as a |
|
91
|
|
|
|
|
|
|
response to the request. Language tags are defined in section 3.10. |
|
92
|
|
|
|
|
|
|
|
|
93
|
|
|
|
|
|
|
Accept-Language = "Accept-Language" ":" |
|
94
|
|
|
|
|
|
|
1#( language-range [ ";" "q" "=" qvalue ] ) |
|
95
|
|
|
|
|
|
|
language-range = ( ( 1*8ALPHA *( "-" 1*8ALPHA ) ) | "*" ) |
|
96
|
|
|
|
|
|
|
|
|
97
|
|
|
|
|
|
|
Each language-range MAY be given an associated quality value which |
|
98
|
|
|
|
|
|
|
represents an estimate of the user's preference for the languages |
|
99
|
|
|
|
|
|
|
specified by that range. The quality value defaults to "q=1". For |
|
100
|
|
|
|
|
|
|
example, |
|
101
|
|
|
|
|
|
|
|
|
102
|
|
|
|
|
|
|
Accept-Language: da, en-gb;q=0.8, en;q=0.7 |
|
103
|
|
|
|
|
|
|
|
|
104
|
|
|
|
|
|
|
would mean: "I prefer Danish, but will accept British English and |
|
105
|
|
|
|
|
|
|
other types of English." A language-range matches a language-tag if |
|
106
|
|
|
|
|
|
|
it exactly equals the tag, or if it exactly equals a prefix of the |
|
107
|
|
|
|
|
|
|
tag such that the first tag character following the prefix is "-". |
|
108
|
|
|
|
|
|
|
The special range "*", if present in the Accept-Language field, |
|
109
|
|
|
|
|
|
|
matches every tag not matched by any other range present in the |
|
110
|
|
|
|
|
|
|
Accept-Language field. |
|
111
|
|
|
|
|
|
|
|
|
112
|
|
|
|
|
|
|
Note: This use of a prefix matching rule does not imply that |
|
113
|
|
|
|
|
|
|
language tags are assigned to languages in such a way that it is |
|
114
|
|
|
|
|
|
|
always true that if a user understands a language with a certain |
|
115
|
|
|
|
|
|
|
tag, then this user will also understand all languages with tags |
|
116
|
|
|
|
|
|
|
for which this tag is a prefix. The prefix rule simply allows the |
|
117
|
|
|
|
|
|
|
use of prefix tags if this is the case. |
|
118
|
|
|
|
|
|
|
|
|
119
|
|
|
|
|
|
|
The language quality factor assigned to a language-tag by the |
|
120
|
|
|
|
|
|
|
Accept-Language field is the quality value of the longest language- |
|
121
|
|
|
|
|
|
|
range in the field that matches the language-tag. If no language- |
|
122
|
|
|
|
|
|
|
range in the field matches the tag, the language quality factor |
|
123
|
|
|
|
|
|
|
assigned is 0. If no Accept-Language header is present in the |
|
124
|
|
|
|
|
|
|
request, the server |
|
125
|
|
|
|
|
|
|
|
|
126
|
|
|
|
|
|
|
SHOULD assume that all languages are equally acceptable. If an |
|
127
|
|
|
|
|
|
|
Accept-Language header is present, then all languages which are |
|
128
|
|
|
|
|
|
|
assigned a quality factor greater than 0 are acceptable. |
|
129
|
|
|
|
|
|
|
|
|
130
|
|
|
|
|
|
|
It might be contrary to the privacy expectations of the user to send |
|
131
|
|
|
|
|
|
|
an Accept-Language header with the complete linguistic preferences |
|
132
|
|
|
|
|
|
|
of the user in every request |
|
133
|
|
|
|
|
|
|
|
|
134
|
|
|
|
|
|
|
=cut |
|
135
|
|
|
|
|
|
|
|
|
136
|
|
|
|
|
|
|
sub language { |
|
137
|
60
|
|
|
60
|
1
|
203
|
my ($self, $obj) = @_; |
|
138
|
60
|
|
|
|
|
114
|
my @browser_langs = $self->browser_languages($obj); |
|
139
|
60
|
|
|
|
|
847
|
my @avail = @{$self->available_languages}; |
|
|
60
|
|
|
|
|
1385
|
|
|
140
|
60
|
100
|
|
|
|
925
|
if (@avail) { |
|
141
|
36
|
|
|
|
|
55
|
foreach my $ua_lang (@browser_langs) { |
|
142
|
97
|
|
|
|
|
124
|
foreach my $avail_lang (@avail) { |
|
143
|
117
|
100
|
|
|
|
865
|
if ($ua_lang =~ m/^\Q$avail_lang\E(_[A-Z]+)?$/) { |
|
144
|
13
|
|
|
|
|
46
|
return $ua_lang; |
|
145
|
|
|
|
|
|
|
} |
|
146
|
|
|
|
|
|
|
} |
|
147
|
|
|
|
|
|
|
} |
|
148
|
|
|
|
|
|
|
# nothing? then return the server default |
|
149
|
23
|
|
|
|
|
463
|
return $self->server_default; |
|
150
|
|
|
|
|
|
|
} |
|
151
|
|
|
|
|
|
|
else { |
|
152
|
24
|
|
|
|
|
60
|
return $browser_langs[0]; |
|
153
|
|
|
|
|
|
|
} |
|
154
|
|
|
|
|
|
|
} |
|
155
|
|
|
|
|
|
|
|
|
156
|
|
|
|
|
|
|
=head2 browser_languages($request) |
|
157
|
|
|
|
|
|
|
|
|
158
|
|
|
|
|
|
|
This method returns the parsed and sorted list of language preferences |
|
159
|
|
|
|
|
|
|
set in the browser, when the first element has higher priority. |
|
160
|
|
|
|
|
|
|
|
|
161
|
|
|
|
|
|
|
=cut |
|
162
|
|
|
|
|
|
|
|
|
163
|
|
|
|
|
|
|
sub browser_languages { |
|
164
|
60
|
|
|
60
|
1
|
65
|
my ($self, $obj) = @_; |
|
165
|
60
|
50
|
|
|
|
125
|
return $self->server_default unless $obj; |
|
166
|
60
|
|
|
|
|
63
|
my $accept_str; |
|
167
|
60
|
50
|
|
|
|
234
|
if ($obj->can("accept_language")) { |
|
168
|
60
|
|
|
|
|
130
|
$accept_str = $obj->accept_language; |
|
169
|
|
|
|
|
|
|
} |
|
170
|
|
|
|
|
|
|
# nothing? try with header, but don't count too much on this |
|
171
|
60
|
50
|
33
|
|
|
143
|
if (!$accept_str and $obj->can("header")) { |
|
172
|
0
|
|
|
|
|
0
|
$accept_str = $obj->header('Accept-Language'); |
|
173
|
|
|
|
|
|
|
} |
|
174
|
60
|
50
|
|
|
|
92
|
return $self->server_default unless $accept_str; |
|
175
|
|
|
|
|
|
|
|
|
176
|
|
|
|
|
|
|
# split the string at , |
|
177
|
60
|
|
|
|
|
480
|
my @langs = split(/\s*,\s*/, $accept_str); |
|
178
|
60
|
|
|
|
|
62
|
my @to_order; |
|
179
|
60
|
|
|
|
|
87
|
foreach my $lang_str (@langs) { |
|
180
|
235
|
100
|
|
|
|
319
|
next unless $lang_str; |
|
181
|
190
|
|
|
|
|
129
|
my ($q, $code); |
|
182
|
190
|
100
|
|
|
|
803
|
if ($lang_str =~ m/([a-zA-Z]+([-_][a-zA-Z]+)?)\s*(;\s*q\s*=\s*([0-9\.]+))?/) { |
|
183
|
180
|
|
|
|
|
338
|
$code = $self->check_language_name($1); |
|
184
|
180
|
|
100
|
|
|
439
|
$q = $4 || 1; |
|
185
|
|
|
|
|
|
|
} |
|
186
|
190
|
100
|
|
|
|
272
|
next unless $code; |
|
187
|
165
|
|
|
|
|
374
|
push @to_order, [ $code => $q ]; |
|
188
|
|
|
|
|
|
|
# sort by q |
|
189
|
|
|
|
|
|
|
} |
|
190
|
60
|
100
|
|
|
|
333
|
return $self->server_default unless @to_order; |
|
191
|
50
|
|
|
|
|
158
|
my @ordered = sort { $b->[1] <=> $a->[1] } @to_order; |
|
|
170
|
|
|
|
|
373
|
|
|
192
|
50
|
|
|
|
|
66
|
return map { $_->[0] } @ordered; |
|
|
165
|
|
|
|
|
430
|
|
|
193
|
|
|
|
|
|
|
} |
|
194
|
|
|
|
|
|
|
|
|
195
|
|
|
|
|
|
|
=head3 language_short($request_obj) |
|
196
|
|
|
|
|
|
|
|
|
197
|
|
|
|
|
|
|
Return the short language version (i.e.), the language name without |
|
198
|
|
|
|
|
|
|
the country part. |
|
199
|
|
|
|
|
|
|
|
|
200
|
|
|
|
|
|
|
=cut |
|
201
|
|
|
|
|
|
|
|
|
202
|
|
|
|
|
|
|
sub language_short { |
|
203
|
36
|
|
|
36
|
1
|
4448
|
my ($self, $obj) = @_; |
|
204
|
36
|
|
|
|
|
60
|
my $lang = $self->language($obj); |
|
205
|
|
|
|
|
|
|
# strip the second part |
|
206
|
36
|
|
|
|
|
168
|
$lang =~ s/_.*$//; |
|
207
|
36
|
|
|
|
|
133
|
return $lang; |
|
208
|
|
|
|
|
|
|
} |
|
209
|
|
|
|
|
|
|
|
|
210
|
|
|
|
|
|
|
|
|
211
|
|
|
|
|
|
|
=head3 check_language_name |
|
212
|
|
|
|
|
|
|
|
|
213
|
|
|
|
|
|
|
Returns a normalized version of the language name, lower case for the |
|
214
|
|
|
|
|
|
|
language, upper case for the country. Undef it was not possible to |
|
215
|
|
|
|
|
|
|
validate it. |
|
216
|
|
|
|
|
|
|
|
|
217
|
|
|
|
|
|
|
=cut |
|
218
|
|
|
|
|
|
|
|
|
219
|
|
|
|
|
|
|
sub check_language_name { |
|
220
|
188
|
|
|
188
|
1
|
304
|
my ($self, $code) = @_; |
|
221
|
188
|
|
|
|
|
143
|
my ($lang, $country); |
|
222
|
188
|
50
|
|
|
|
277
|
return unless $code; |
|
223
|
188
|
100
|
|
|
|
487
|
if ($code =~ m/([a-zA-Z]{2})([_-]([a-zA-Z]*))?/) { |
|
224
|
183
|
|
|
|
|
333
|
$lang = $1; |
|
225
|
183
|
|
100
|
|
|
556
|
$country = $3 || ""; |
|
226
|
|
|
|
|
|
|
} |
|
227
|
|
|
|
|
|
|
else { |
|
228
|
5
|
|
|
|
|
7
|
$lang = $code; |
|
229
|
5
|
|
|
|
|
8
|
$country = $code; # eg. fr fr |
|
230
|
|
|
|
|
|
|
} |
|
231
|
|
|
|
|
|
|
# lowercase; |
|
232
|
188
|
|
|
|
|
221
|
$lang = lc($lang); |
|
233
|
188
|
|
|
|
|
170
|
$country = lc($country); |
|
234
|
|
|
|
|
|
|
# check the lang; |
|
235
|
188
|
100
|
|
|
|
431
|
return unless $langs{$lang}; |
|
236
|
|
|
|
|
|
|
# if the country doesn't validate, we fix the common scenario (en |
|
237
|
|
|
|
|
|
|
# => US), and append the same |
|
238
|
171
|
100
|
|
|
|
308
|
if ($countrs{$country}) { |
|
239
|
46
|
|
|
|
|
126
|
return $lang . "_" . uc($country); |
|
240
|
|
|
|
|
|
|
} |
|
241
|
|
|
|
|
|
|
# then do some heuristics, if the country didn't match |
|
242
|
125
|
100
|
|
|
|
204
|
if ($lang eq 'en') { |
|
243
|
45
|
|
|
|
|
98
|
return $lang . "_US"; |
|
244
|
|
|
|
|
|
|
} |
|
245
|
|
|
|
|
|
|
# then try the language as a country |
|
246
|
80
|
100
|
|
|
|
136
|
if ($countrs{$lang}) { |
|
247
|
50
|
|
|
|
|
217
|
return $lang . "_" . uc($lang); |
|
248
|
|
|
|
|
|
|
} |
|
249
|
|
|
|
|
|
|
# if we are still here, return the language, there are cases we |
|
250
|
|
|
|
|
|
|
# can't catch, like ja_JP |
|
251
|
30
|
|
|
|
|
48
|
return $lang; |
|
252
|
|
|
|
|
|
|
} |
|
253
|
|
|
|
|
|
|
|
|
254
|
|
|
|
|
|
|
|
|
255
|
|
|
|
|
|
|
=head1 AUTHOR |
|
256
|
|
|
|
|
|
|
|
|
257
|
|
|
|
|
|
|
Marco Pessotto, C<< >> |
|
258
|
|
|
|
|
|
|
|
|
259
|
|
|
|
|
|
|
=head1 BUGS |
|
260
|
|
|
|
|
|
|
|
|
261
|
|
|
|
|
|
|
Please report any bugs or feature requests to C, or through |
|
262
|
|
|
|
|
|
|
the web interface at L. I will be notified, and then you'll |
|
263
|
|
|
|
|
|
|
automatically be notified of progress on your bug as I make changes. |
|
264
|
|
|
|
|
|
|
|
|
265
|
|
|
|
|
|
|
|
|
266
|
|
|
|
|
|
|
|
|
267
|
|
|
|
|
|
|
|
|
268
|
|
|
|
|
|
|
=head1 SUPPORT |
|
269
|
|
|
|
|
|
|
|
|
270
|
|
|
|
|
|
|
You can find documentation for this module with the perldoc command. |
|
271
|
|
|
|
|
|
|
|
|
272
|
|
|
|
|
|
|
perldoc HTTP::ClientDetect::Language |
|
273
|
|
|
|
|
|
|
|
|
274
|
|
|
|
|
|
|
|
|
275
|
|
|
|
|
|
|
You can also look for information at: |
|
276
|
|
|
|
|
|
|
|
|
277
|
|
|
|
|
|
|
=over 4 |
|
278
|
|
|
|
|
|
|
|
|
279
|
|
|
|
|
|
|
=item * RT: CPAN's request tracker (report bugs here) |
|
280
|
|
|
|
|
|
|
|
|
281
|
|
|
|
|
|
|
L |
|
282
|
|
|
|
|
|
|
|
|
283
|
|
|
|
|
|
|
=item * AnnoCPAN: Annotated CPAN documentation |
|
284
|
|
|
|
|
|
|
|
|
285
|
|
|
|
|
|
|
L |
|
286
|
|
|
|
|
|
|
|
|
287
|
|
|
|
|
|
|
=item * CPAN Ratings |
|
288
|
|
|
|
|
|
|
|
|
289
|
|
|
|
|
|
|
L |
|
290
|
|
|
|
|
|
|
|
|
291
|
|
|
|
|
|
|
=item * Search CPAN |
|
292
|
|
|
|
|
|
|
|
|
293
|
|
|
|
|
|
|
L |
|
294
|
|
|
|
|
|
|
|
|
295
|
|
|
|
|
|
|
=back |
|
296
|
|
|
|
|
|
|
|
|
297
|
|
|
|
|
|
|
|
|
298
|
|
|
|
|
|
|
=head1 ACKNOWLEDGEMENTS |
|
299
|
|
|
|
|
|
|
|
|
300
|
|
|
|
|
|
|
|
|
301
|
|
|
|
|
|
|
=head1 LICENSE AND COPYRIGHT |
|
302
|
|
|
|
|
|
|
|
|
303
|
|
|
|
|
|
|
Copyright 2013 Marco Pessotto. |
|
304
|
|
|
|
|
|
|
|
|
305
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify it |
|
306
|
|
|
|
|
|
|
under the terms of either: the GNU General Public License as published |
|
307
|
|
|
|
|
|
|
by the Free Software Foundation; or the Artistic License. |
|
308
|
|
|
|
|
|
|
|
|
309
|
|
|
|
|
|
|
See L for more information. |
|
310
|
|
|
|
|
|
|
|
|
311
|
|
|
|
|
|
|
|
|
312
|
|
|
|
|
|
|
=cut |
|
313
|
|
|
|
|
|
|
|
|
314
|
|
|
|
|
|
|
1; # End of HTTP::ClientDetect::Language |