| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
package Locale::Maketext::Lexicon::Gettext; |
|
2
|
|
|
|
|
|
|
$Locale::Maketext::Lexicon::Gettext::VERSION = '1.00'; |
|
3
|
9
|
|
|
9
|
|
56
|
use strict; |
|
|
9
|
|
|
|
|
18
|
|
|
|
9
|
|
|
|
|
1416
|
|
|
4
|
|
|
|
|
|
|
|
|
5
|
|
|
|
|
|
|
# ABSTRACT: PO and MO file parser for Maketext |
|
6
|
|
|
|
|
|
|
|
|
7
|
|
|
|
|
|
|
|
|
8
|
|
|
|
|
|
|
my ( $InputEncoding, $OutputEncoding, $DoEncoding ); |
|
9
|
|
|
|
|
|
|
|
|
10
|
1
|
|
|
1
|
0
|
68
|
sub input_encoding {$InputEncoding} |
|
11
|
0
|
|
|
0
|
0
|
0
|
sub output_encoding {$OutputEncoding} |
|
12
|
|
|
|
|
|
|
|
|
13
|
|
|
|
|
|
|
sub parse { |
|
14
|
70
|
|
|
70
|
0
|
127
|
my $self = shift; |
|
15
|
70
|
|
|
|
|
99
|
my ( %var, $key, @ret ); |
|
16
|
0
|
|
|
|
|
0
|
my @metadata; |
|
17
|
0
|
|
|
|
|
0
|
my @comments; |
|
18
|
0
|
|
|
|
|
0
|
my @fuzzy; |
|
19
|
|
|
|
|
|
|
|
|
20
|
70
|
|
|
|
|
123
|
$InputEncoding = $OutputEncoding = $DoEncoding = undef; |
|
21
|
|
|
|
|
|
|
|
|
22
|
9
|
|
|
9
|
|
67
|
use Carp; |
|
|
9
|
|
|
|
|
17
|
|
|
|
9
|
|
|
|
|
19385
|
|
|
23
|
70
|
50
|
|
|
|
200
|
Carp::cluck "Undefined source called\n" unless defined $_[0]; |
|
24
|
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
# Check for magic string of MO files |
|
26
|
70
|
100
|
100
|
|
|
852
|
return parse_mo( join( '', @_ ) ) |
|
27
|
|
|
|
|
|
|
if ( $_[0] =~ /^\x95\x04\x12\xde/ or $_[0] =~ /^\xde\x12\x04\x95/ ); |
|
28
|
|
|
|
|
|
|
|
|
29
|
12
|
|
|
|
|
45
|
local $^W; # no 'uninitialized' warnings, please. |
|
30
|
|
|
|
|
|
|
|
|
31
|
12
|
|
|
|
|
98
|
require Locale::Maketext::Lexicon; |
|
32
|
12
|
|
|
|
|
41
|
my $KeepFuzzy = Locale::Maketext::Lexicon::option('keep_fuzzy'); |
|
33
|
12
|
|
100
|
|
|
61
|
my $UseFuzzy = $KeepFuzzy |
|
34
|
|
|
|
|
|
|
|| Locale::Maketext::Lexicon::option('use_fuzzy'); |
|
35
|
12
|
|
|
|
|
33
|
my $AllowEmpty = Locale::Maketext::Lexicon::option('allow_empty'); |
|
36
|
|
|
|
|
|
|
my $process = sub { |
|
37
|
50
|
100
|
100
|
50
|
|
307
|
if ( length( $var{msgstr} ) and ( $UseFuzzy or !$var{fuzzy} ) ) { |
|
|
|
50
|
33
|
|
|
|
|
|
38
|
48
|
|
|
|
|
125
|
push @ret, ( map transform($_), @var{ 'msgid', 'msgstr' } ); |
|
39
|
|
|
|
|
|
|
} |
|
40
|
|
|
|
|
|
|
elsif ($AllowEmpty) { |
|
41
|
0
|
|
|
|
|
0
|
push @ret, ( transform( $var{msgid} ), '' ); |
|
42
|
|
|
|
|
|
|
} |
|
43
|
49
|
100
|
|
|
|
125
|
if ( $var{msgid} eq '' ) { |
|
44
|
10
|
|
|
|
|
34
|
push @metadata, parse_metadata( $var{msgstr} ); |
|
45
|
|
|
|
|
|
|
} |
|
46
|
|
|
|
|
|
|
else { |
|
47
|
39
|
|
|
|
|
82
|
push @comments, $var{msgid}, $var{msgcomment}; |
|
48
|
|
|
|
|
|
|
} |
|
49
|
49
|
100
|
100
|
|
|
170
|
if ( $KeepFuzzy && $var{fuzzy} ) { |
|
50
|
4
|
|
|
|
|
6
|
push @fuzzy, $var{msgid}, 1; |
|
51
|
|
|
|
|
|
|
} |
|
52
|
49
|
|
|
|
|
178
|
%var = (); |
|
53
|
12
|
|
|
|
|
77
|
}; |
|
54
|
|
|
|
|
|
|
|
|
55
|
|
|
|
|
|
|
# Parse PO files |
|
56
|
12
|
|
|
|
|
33
|
foreach (@_) { |
|
57
|
308
|
|
|
|
|
1602
|
s/[\015\012]*\z//; # fix CRLF issues |
|
58
|
|
|
|
|
|
|
|
|
59
|
|
|
|
|
|
|
/^(msgid|msgstr) +"(.*)" *$/ |
|
60
|
|
|
|
|
|
|
? do { # leading strings |
|
61
|
100
|
|
|
|
|
259
|
$var{$1} = $2; |
|
62
|
100
|
|
|
|
|
193
|
$key = $1; |
|
63
|
|
|
|
|
|
|
} |
|
64
|
|
|
|
|
|
|
: |
|
65
|
|
|
|
|
|
|
|
|
66
|
|
|
|
|
|
|
/^"(.*)" *$/ |
|
67
|
|
|
|
|
|
|
? do { # continued strings |
|
68
|
120
|
|
|
|
|
669
|
$var{$key} .= $1; |
|
69
|
|
|
|
|
|
|
} |
|
70
|
|
|
|
|
|
|
: |
|
71
|
|
|
|
|
|
|
|
|
72
|
|
|
|
|
|
|
/^# (.*)$/ |
|
73
|
|
|
|
|
|
|
? do { # user comments |
|
74
|
2
|
|
|
|
|
9
|
$var{msgcomment} .= $1 . "\n"; |
|
75
|
|
|
|
|
|
|
} |
|
76
|
|
|
|
|
|
|
: |
|
77
|
|
|
|
|
|
|
|
|
78
|
|
|
|
|
|
|
/^#, +(.*) *$/ |
|
79
|
|
|
|
|
|
|
? do { # control variables |
|
80
|
9
|
|
|
|
|
78
|
$var{$_} = 1 for split( /,\s+/, $1 ); |
|
81
|
|
|
|
|
|
|
} |
|
82
|
|
|
|
|
|
|
: |
|
83
|
|
|
|
|
|
|
|
|
84
|
|
|
|
|
|
|
/^ *$/ && %var |
|
85
|
308
|
100
|
66
|
|
|
1593
|
? do { # interpolate string escapes |
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
86
|
42
|
|
|
|
|
80
|
$process->($_); |
|
87
|
|
|
|
|
|
|
} |
|
88
|
|
|
|
|
|
|
: (); |
|
89
|
|
|
|
|
|
|
|
|
90
|
|
|
|
|
|
|
} |
|
91
|
|
|
|
|
|
|
|
|
92
|
|
|
|
|
|
|
# do not silently skip last entry |
|
93
|
12
|
100
|
|
|
|
65
|
$process->() if keys %var != 0; |
|
94
|
|
|
|
|
|
|
|
|
95
|
11
|
50
|
|
|
|
35
|
push @ret, map { transform($_) } @var{ 'msgid', 'msgstr' } |
|
|
0
|
|
|
|
|
0
|
|
|
96
|
|
|
|
|
|
|
if length $var{msgstr}; |
|
97
|
11
|
50
|
|
|
|
72
|
push @metadata, parse_metadata( $var{msgstr} ) |
|
98
|
|
|
|
|
|
|
if $var{msgid} eq ''; |
|
99
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
return wantarray |
|
101
|
11
|
100
|
|
|
|
265
|
? ( { @metadata, @ret }, {@comments}, {@fuzzy} ) |
|
102
|
|
|
|
|
|
|
: ( { @metadata, @ret } ); |
|
103
|
|
|
|
|
|
|
|
|
104
|
|
|
|
|
|
|
} |
|
105
|
|
|
|
|
|
|
|
|
106
|
|
|
|
|
|
|
sub parse_metadata { |
|
107
|
|
|
|
|
|
|
return map { |
|
108
|
80
|
|
|
80
|
0
|
186
|
(/^([^\x00-\x1f\x80-\xff :=]+):\s*(.*)$/) |
|
109
|
|
|
|
|
|
|
? ( $1 eq 'Content-Type' ) |
|
110
|
595
|
100
|
|
|
|
5030
|
? do { |
|
|
|
50
|
|
|
|
|
|
|
111
|
69
|
|
|
|
|
147
|
my $enc = $2; |
|
112
|
69
|
50
|
|
|
|
419
|
if ( $enc =~ /\bcharset=\s*([-\w]+)/i ) { |
|
113
|
69
|
|
50
|
|
|
245
|
$InputEncoding = $1 || ''; |
|
114
|
69
|
|
50
|
|
|
251
|
$OutputEncoding |
|
115
|
|
|
|
|
|
|
= Locale::Maketext::Lexicon::encoding() |
|
116
|
|
|
|
|
|
|
|| ''; |
|
117
|
69
|
100
|
|
|
|
378
|
$InputEncoding = 'utf8' |
|
118
|
|
|
|
|
|
|
if $InputEncoding =~ /^utf-?8$/i; |
|
119
|
69
|
50
|
|
|
|
154
|
$OutputEncoding = 'utf8' |
|
120
|
|
|
|
|
|
|
if $OutputEncoding =~ /^utf-?8$/i; |
|
121
|
69
|
50
|
33
|
|
|
190
|
if (Locale::Maketext::Lexicon::option('decode') |
|
|
|
|
66
|
|
|
|
|
|
122
|
|
|
|
|
|
|
and ( !$OutputEncoding |
|
123
|
|
|
|
|
|
|
or $InputEncoding ne $OutputEncoding ) |
|
124
|
|
|
|
|
|
|
) |
|
125
|
|
|
|
|
|
|
{ |
|
126
|
59
|
50
|
|
|
|
168
|
require Encode::compat if $] < 5.007001; |
|
127
|
59
|
|
|
|
|
1512
|
require Encode; |
|
128
|
59
|
|
|
|
|
14860
|
$DoEncoding = 1; |
|
129
|
|
|
|
|
|
|
} |
|
130
|
|
|
|
|
|
|
} |
|
131
|
69
|
|
|
|
|
250
|
( "__Content-Type", $enc ); |
|
132
|
|
|
|
|
|
|
} |
|
133
|
|
|
|
|
|
|
: ( "__$1", $2 ) |
|
134
|
|
|
|
|
|
|
: (); |
|
135
|
|
|
|
|
|
|
} split( /\r*\n+\r*/, transform(pop) ); |
|
136
|
|
|
|
|
|
|
} |
|
137
|
|
|
|
|
|
|
|
|
138
|
|
|
|
|
|
|
sub transform { |
|
139
|
411
|
|
|
411
|
0
|
626
|
my $str = shift; |
|
140
|
|
|
|
|
|
|
|
|
141
|
411
|
100
|
66
|
|
|
1420
|
if ( $DoEncoding and $InputEncoding ) { |
|
142
|
234
|
100
|
|
|
|
865
|
$str |
|
143
|
|
|
|
|
|
|
= ( $InputEncoding eq 'utf8' ) |
|
144
|
|
|
|
|
|
|
? Encode::decode_utf8($str) |
|
145
|
|
|
|
|
|
|
: Encode::decode( $InputEncoding, $str ); |
|
146
|
|
|
|
|
|
|
} |
|
147
|
|
|
|
|
|
|
|
|
148
|
410
|
|
|
|
|
178909
|
$str =~ s/\\([0x]..|c?.)/qq{"\\$1"}/eeg; |
|
|
188
|
|
|
|
|
10167
|
|
|
149
|
|
|
|
|
|
|
|
|
150
|
410
|
50
|
66
|
|
|
1644
|
if ( $DoEncoding and $OutputEncoding ) { |
|
151
|
0
|
0
|
|
|
|
0
|
$str |
|
152
|
|
|
|
|
|
|
= ( $OutputEncoding eq 'utf8' ) |
|
153
|
|
|
|
|
|
|
? Encode::encode_utf8($str) |
|
154
|
|
|
|
|
|
|
: Encode::encode( $OutputEncoding, $str ); |
|
155
|
|
|
|
|
|
|
} |
|
156
|
|
|
|
|
|
|
|
|
157
|
410
|
|
|
|
|
727
|
return _gettext_to_maketext($str); |
|
158
|
|
|
|
|
|
|
} |
|
159
|
|
|
|
|
|
|
|
|
160
|
|
|
|
|
|
|
sub _gettext_to_maketext { |
|
161
|
434
|
|
|
434
|
|
639
|
my $str = shift; |
|
162
|
434
|
|
|
|
|
1417
|
$str =~ s{([\~\[\]])}{~$1}g; |
|
163
|
434
|
|
|
|
|
10903
|
$str =~ s{ |
|
164
|
|
|
|
|
|
|
([%\\]%) # 1 - escaped sequence |
|
165
|
|
|
|
|
|
|
| |
|
166
|
|
|
|
|
|
|
% (?: |
|
167
|
|
|
|
|
|
|
([A-Za-z#*]\w*) # 2 - function call |
|
168
|
|
|
|
|
|
|
\(([^\)]*)\) # 3 - arguments |
|
169
|
|
|
|
|
|
|
| |
|
170
|
|
|
|
|
|
|
([1-9]\d*|\*) # 4 - variable |
|
171
|
|
|
|
|
|
|
) |
|
172
|
|
|
|
|
|
|
}{ |
|
173
|
78
|
100
|
|
|
|
433
|
$1 ? $1 |
|
|
|
50
|
|
|
|
|
|
|
174
|
|
|
|
|
|
|
: $2 ? "\[$2,"._unescape($3)."]" |
|
175
|
|
|
|
|
|
|
: "[_$4]" |
|
176
|
|
|
|
|
|
|
}egx; |
|
177
|
434
|
|
|
|
|
5601
|
$str; |
|
178
|
|
|
|
|
|
|
} |
|
179
|
|
|
|
|
|
|
|
|
180
|
|
|
|
|
|
|
sub _unescape { |
|
181
|
22
|
100
|
|
|
|
121
|
join( ',', |
|
182
|
9
|
|
|
9
|
|
34
|
map { /\A(\s*)%([1-9]\d*|\*)(\s*)\z/ ? "$1_$2$3" : $_ } |
|
183
|
|
|
|
|
|
|
split( /,/, $_[0] ) ); |
|
184
|
|
|
|
|
|
|
} |
|
185
|
|
|
|
|
|
|
|
|
186
|
|
|
|
|
|
|
# This subroutine was derived from Locale::Maketext::Gettext::readmo() |
|
187
|
|
|
|
|
|
|
# under the Perl License; the original author is Yi Ma Mao (IMACAT). |
|
188
|
|
|
|
|
|
|
sub parse_mo { |
|
189
|
59
|
|
|
59
|
0
|
662
|
my $content = shift; |
|
190
|
59
|
100
|
|
|
|
196
|
my $tmpl = ( substr( $content, 0, 4 ) eq "\xde\x12\x04\x95" ) ? 'V' : 'N'; |
|
191
|
|
|
|
|
|
|
|
|
192
|
|
|
|
|
|
|
# Check the MO format revision number |
|
193
|
|
|
|
|
|
|
# There is only one revision now: revision 0. |
|
194
|
59
|
50
|
|
|
|
239
|
return if unpack( $tmpl, substr( $content, 4, 4 ) ) > 0; |
|
195
|
|
|
|
|
|
|
|
|
196
|
59
|
|
|
|
|
82
|
my ( $num, $offo, $offt ); |
|
197
|
|
|
|
|
|
|
|
|
198
|
|
|
|
|
|
|
# Number of strings |
|
199
|
59
|
|
|
|
|
105
|
$num = unpack $tmpl, substr( $content, 8, 4 ); |
|
200
|
|
|
|
|
|
|
|
|
201
|
|
|
|
|
|
|
# Offset to the beginning of the original strings |
|
202
|
59
|
|
|
|
|
103
|
$offo = unpack $tmpl, substr( $content, 12, 4 ); |
|
203
|
|
|
|
|
|
|
|
|
204
|
|
|
|
|
|
|
# Offset to the beginning of the translated strings |
|
205
|
59
|
|
|
|
|
99
|
$offt = unpack $tmpl, substr( $content, 16, 4 ); |
|
206
|
|
|
|
|
|
|
|
|
207
|
59
|
|
|
|
|
78
|
my ( @metadata, @ret ); |
|
208
|
59
|
|
|
|
|
155
|
for ( 0 .. $num - 1 ) { |
|
209
|
118
|
|
|
|
|
133
|
my ( $len, $off, $stro, $strt ); |
|
210
|
|
|
|
|
|
|
|
|
211
|
|
|
|
|
|
|
# The first word is the length of the string |
|
212
|
118
|
|
|
|
|
388
|
$len = unpack $tmpl, substr( $content, $offo + $_ * 8, 4 ); |
|
213
|
|
|
|
|
|
|
|
|
214
|
|
|
|
|
|
|
# The second word is the offset of the string |
|
215
|
118
|
|
|
|
|
238
|
$off = unpack $tmpl, substr( $content, $offo + $_ * 8 + 4, 4 ); |
|
216
|
|
|
|
|
|
|
|
|
217
|
|
|
|
|
|
|
# Original string |
|
218
|
118
|
|
|
|
|
170
|
$stro = substr( $content, $off, $len ); |
|
219
|
|
|
|
|
|
|
|
|
220
|
|
|
|
|
|
|
# The first word is the length of the string |
|
221
|
118
|
|
|
|
|
206
|
$len = unpack $tmpl, substr( $content, $offt + $_ * 8, 4 ); |
|
222
|
|
|
|
|
|
|
|
|
223
|
|
|
|
|
|
|
# The second word is the offset of the string |
|
224
|
118
|
|
|
|
|
215
|
$off = unpack $tmpl, substr( $content, $offt + $_ * 8 + 4, 4 ); |
|
225
|
|
|
|
|
|
|
|
|
226
|
|
|
|
|
|
|
# Translated string |
|
227
|
118
|
|
|
|
|
201
|
$strt = substr( $content, $off, $len ); |
|
228
|
|
|
|
|
|
|
|
|
229
|
|
|
|
|
|
|
# Hash it |
|
230
|
118
|
100
|
|
|
|
347
|
push @metadata, parse_metadata($strt) if $stro eq ''; |
|
231
|
118
|
50
|
|
|
|
602
|
push @ret, ( map transform($_), $stro, $strt ) if length $strt; |
|
232
|
|
|
|
|
|
|
} |
|
233
|
|
|
|
|
|
|
|
|
234
|
59
|
|
|
|
|
1298
|
return { @metadata, @ret }; |
|
235
|
|
|
|
|
|
|
} |
|
236
|
|
|
|
|
|
|
|
|
237
|
|
|
|
|
|
|
1; |
|
238
|
|
|
|
|
|
|
|
|
239
|
|
|
|
|
|
|
__END__ |