| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
#!/pro/bin/perl |
|
2
|
|
|
|
|
|
|
|
|
3
|
|
|
|
|
|
|
package Spreadsheet::Read; |
|
4
|
|
|
|
|
|
|
|
|
5
|
|
|
|
|
|
|
=head1 NAME |
|
6
|
|
|
|
|
|
|
|
|
7
|
|
|
|
|
|
|
Spreadsheet::Read - Read the data from a spreadsheet |
|
8
|
|
|
|
|
|
|
|
|
9
|
|
|
|
|
|
|
=head1 SYNOPSIS |
|
10
|
|
|
|
|
|
|
|
|
11
|
|
|
|
|
|
|
use Spreadsheet::Read; |
|
12
|
|
|
|
|
|
|
my $book = ReadData ("test.csv", sep => ";"); |
|
13
|
|
|
|
|
|
|
my $book = ReadData ("test.sxc"); |
|
14
|
|
|
|
|
|
|
my $book = ReadData ("test.ods"); |
|
15
|
|
|
|
|
|
|
my $book = ReadData ("test.xls"); |
|
16
|
|
|
|
|
|
|
my $book = ReadData ("test.xlsx"); |
|
17
|
|
|
|
|
|
|
my $book = ReadData ($fh, parser => "xls"); |
|
18
|
|
|
|
|
|
|
|
|
19
|
|
|
|
|
|
|
Spreadsheet::Read::add ($book, "sheet.csv"); |
|
20
|
|
|
|
|
|
|
|
|
21
|
|
|
|
|
|
|
my $sheet = $book->[1]; # first datasheet |
|
22
|
|
|
|
|
|
|
my $cell = $book->[1]{A3}; # content of field A3 of sheet 1 |
|
23
|
|
|
|
|
|
|
my $cell = $book->[1]{cell}[1][3]; # same, unformatted |
|
24
|
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
# OO API |
|
26
|
|
|
|
|
|
|
my $book = Spreadsheet::Read->new ("file.csv"); |
|
27
|
|
|
|
|
|
|
my $sheet = $book->sheet (1); |
|
28
|
|
|
|
|
|
|
my $cell = $sheet->cell ("A3"); |
|
29
|
|
|
|
|
|
|
my $cell = $sheet->cell (1, 3); |
|
30
|
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
$book->add ("test.xls"); |
|
32
|
|
|
|
|
|
|
|
|
33
|
|
|
|
|
|
|
=cut |
|
34
|
|
|
|
|
|
|
|
|
35
|
53
|
|
|
53
|
|
5239645
|
use 5.8.1; |
|
|
53
|
|
|
|
|
714
|
|
|
36
|
53
|
|
|
53
|
|
297
|
use strict; |
|
|
53
|
|
|
|
|
109
|
|
|
|
53
|
|
|
|
|
1255
|
|
|
37
|
53
|
|
|
53
|
|
281
|
use warnings; |
|
|
53
|
|
|
|
|
120
|
|
|
|
53
|
|
|
|
|
3448
|
|
|
38
|
|
|
|
|
|
|
|
|
39
|
|
|
|
|
|
|
our $VERSION = "0.81"; |
|
40
|
1
|
|
|
1
|
1
|
131
|
sub Version { $VERSION } |
|
41
|
|
|
|
|
|
|
|
|
42
|
53
|
|
|
53
|
|
400
|
use Carp; |
|
|
53
|
|
|
|
|
152
|
|
|
|
53
|
|
|
|
|
3471
|
|
|
43
|
53
|
|
|
53
|
|
379
|
use Exporter; |
|
|
53
|
|
|
|
|
113
|
|
|
|
53
|
|
|
|
|
4949
|
|
|
44
|
|
|
|
|
|
|
our @ISA = qw( Exporter ); |
|
45
|
|
|
|
|
|
|
our @EXPORT = qw( ReadData cell2cr cr2cell ); |
|
46
|
|
|
|
|
|
|
our @EXPORT_OK = qw( parses rows cellrow row add ); |
|
47
|
|
|
|
|
|
|
|
|
48
|
53
|
|
|
53
|
|
29800
|
use Encode qw( decode ); |
|
|
53
|
|
|
|
|
826256
|
|
|
|
53
|
|
|
|
|
4470
|
|
|
49
|
53
|
|
|
53
|
|
47041
|
use File::Temp qw( ); |
|
|
53
|
|
|
|
|
1145819
|
|
|
|
53
|
|
|
|
|
1811
|
|
|
50
|
53
|
|
|
53
|
|
33881
|
use Data::Dumper; |
|
|
53
|
|
|
|
|
332531
|
|
|
|
53
|
|
|
|
|
56844
|
|
|
51
|
|
|
|
|
|
|
|
|
52
|
|
|
|
|
|
|
my @parsers = ( |
|
53
|
|
|
|
|
|
|
[ csv => "Text::CSV_XS", "0.71" ], |
|
54
|
|
|
|
|
|
|
[ csv => "Text::CSV_PP", "1.17" ], |
|
55
|
|
|
|
|
|
|
[ csv => "Text::CSV", "1.17" ], |
|
56
|
|
|
|
|
|
|
[ ods => "Spreadsheet::ReadSXC", "0.20" ], |
|
57
|
|
|
|
|
|
|
[ sxc => "Spreadsheet::ReadSXC", "0.20" ], |
|
58
|
|
|
|
|
|
|
[ xls => "Spreadsheet::ParseExcel", "0.34" ], |
|
59
|
|
|
|
|
|
|
[ xlsx => "Spreadsheet::ParseXLSX", "0.24" ], |
|
60
|
|
|
|
|
|
|
[ xlsx => "Spreadsheet::XLSX", "0.13" ], |
|
61
|
|
|
|
|
|
|
[ prl => "Spreadsheet::Perl", "" ], |
|
62
|
|
|
|
|
|
|
|
|
63
|
|
|
|
|
|
|
# Helper modules |
|
64
|
|
|
|
|
|
|
[ ios => "IO::Scalar", "" ], |
|
65
|
|
|
|
|
|
|
[ dmp => "Data::Peek", "" ], |
|
66
|
|
|
|
|
|
|
); |
|
67
|
|
|
|
|
|
|
my %can = ( supports => { map { $_->[1] => $_->[2] } @parsers }); |
|
68
|
|
|
|
|
|
|
foreach my $p (@parsers) { |
|
69
|
|
|
|
|
|
|
my $format = $p->[0]; |
|
70
|
|
|
|
|
|
|
$can{$format} and next; |
|
71
|
|
|
|
|
|
|
$can{$format} = ""; |
|
72
|
|
|
|
|
|
|
my $preset = $ENV{"SPREADSHEET_READ_\U$format"} or next; |
|
73
|
|
|
|
|
|
|
my $min_version = $can{supports}{$preset}; |
|
74
|
|
|
|
|
|
|
unless ($min_version) { |
|
75
|
|
|
|
|
|
|
# Catch weirdness like $SPREADSHEET_READ_XLSX = "DBD::Oracle" |
|
76
|
|
|
|
|
|
|
$can{$format} = "!$preset is not supported for the $format format"; |
|
77
|
|
|
|
|
|
|
next; |
|
78
|
|
|
|
|
|
|
} |
|
79
|
|
|
|
|
|
|
if (eval "local \$_; require $preset" and not $@) { |
|
80
|
|
|
|
|
|
|
# forcing a parser should still check the version |
|
81
|
|
|
|
|
|
|
my $ok; |
|
82
|
|
|
|
|
|
|
my $has = $preset->VERSION; |
|
83
|
|
|
|
|
|
|
$has =~ s/_[0-9]+$//; # Remove beta-part |
|
84
|
|
|
|
|
|
|
if ($min_version =~ m/^v([0-9.]+)/) { # clumsy versions |
|
85
|
|
|
|
|
|
|
my @min = split m/\./ => $1; |
|
86
|
|
|
|
|
|
|
$has =~ s/^v//; |
|
87
|
|
|
|
|
|
|
my @has = split m/\./ => $has; |
|
88
|
|
|
|
|
|
|
$ok = (($has[0] * 1000 + $has[1]) * 1000 + $has[2]) >= |
|
89
|
|
|
|
|
|
|
(($min[0] * 1000 + $min[1]) * 1000 + $min[2]); |
|
90
|
|
|
|
|
|
|
} |
|
91
|
|
|
|
|
|
|
else { # normal versions |
|
92
|
|
|
|
|
|
|
$ok = $has >= $min_version; |
|
93
|
|
|
|
|
|
|
} |
|
94
|
|
|
|
|
|
|
$ok or $preset = "!$preset"; |
|
95
|
|
|
|
|
|
|
} |
|
96
|
|
|
|
|
|
|
else { |
|
97
|
|
|
|
|
|
|
$preset = "!$preset"; |
|
98
|
|
|
|
|
|
|
} |
|
99
|
|
|
|
|
|
|
$can{$format} = $preset; |
|
100
|
|
|
|
|
|
|
} |
|
101
|
|
|
|
|
|
|
delete $can{supports}; |
|
102
|
|
|
|
|
|
|
for (@parsers) { |
|
103
|
|
|
|
|
|
|
my ($flag, $mod, $vsn) = @$_; |
|
104
|
|
|
|
|
|
|
$can{$flag} and next; |
|
105
|
|
|
|
|
|
|
eval "require $mod; \$vsn and ${mod}->VERSION (\$vsn); \$can{\$flag} = '$mod'" or |
|
106
|
|
|
|
|
|
|
$_->[0] = "! Cannot use $mod version $vsn: $@"; |
|
107
|
|
|
|
|
|
|
} |
|
108
|
|
|
|
|
|
|
$can{sc} = __PACKAGE__; # SquirelCalc is built-in |
|
109
|
|
|
|
|
|
|
|
|
110
|
|
|
|
|
|
|
defined $Spreadsheet::ParseExcel::VERSION && $Spreadsheet::ParseExcel::VERSION < 0.61 and |
|
111
|
|
|
|
|
|
|
*Spreadsheet::ParseExcel::Workbook::get_active_sheet = sub { undef; }; |
|
112
|
|
|
|
|
|
|
|
|
113
|
|
|
|
|
|
|
my $debug = 0; |
|
114
|
|
|
|
|
|
|
my %def_opts = ( |
|
115
|
|
|
|
|
|
|
rc => 1, |
|
116
|
|
|
|
|
|
|
cells => 1, |
|
117
|
|
|
|
|
|
|
attr => 0, |
|
118
|
|
|
|
|
|
|
clip => undef, # $opt{cells}; |
|
119
|
|
|
|
|
|
|
strip => 0, |
|
120
|
|
|
|
|
|
|
pivot => 0, |
|
121
|
|
|
|
|
|
|
dtfmt => "yyyy-mm-dd", # Format 14 |
|
122
|
|
|
|
|
|
|
debug => 0, |
|
123
|
|
|
|
|
|
|
passwd => undef, |
|
124
|
|
|
|
|
|
|
parser => undef, |
|
125
|
|
|
|
|
|
|
sep => undef, |
|
126
|
|
|
|
|
|
|
quote => undef, |
|
127
|
|
|
|
|
|
|
label => undef, |
|
128
|
|
|
|
|
|
|
); |
|
129
|
|
|
|
|
|
|
my @def_attr = ( |
|
130
|
|
|
|
|
|
|
type => "text", |
|
131
|
|
|
|
|
|
|
fgcolor => undef, |
|
132
|
|
|
|
|
|
|
bgcolor => undef, |
|
133
|
|
|
|
|
|
|
font => undef, |
|
134
|
|
|
|
|
|
|
size => undef, |
|
135
|
|
|
|
|
|
|
format => undef, |
|
136
|
|
|
|
|
|
|
halign => "left", |
|
137
|
|
|
|
|
|
|
valign => "top", |
|
138
|
|
|
|
|
|
|
bold => 0, |
|
139
|
|
|
|
|
|
|
italic => 0, |
|
140
|
|
|
|
|
|
|
uline => 0, |
|
141
|
|
|
|
|
|
|
wrap => 0, |
|
142
|
|
|
|
|
|
|
merged => 0, |
|
143
|
|
|
|
|
|
|
hidden => 0, |
|
144
|
|
|
|
|
|
|
locked => 0, |
|
145
|
|
|
|
|
|
|
enc => "utf-8", # $ENV{LC_ALL} // $ENV{LANG} // ... |
|
146
|
|
|
|
|
|
|
formula => undef, |
|
147
|
|
|
|
|
|
|
); |
|
148
|
|
|
|
|
|
|
|
|
149
|
|
|
|
|
|
|
# Helper functions |
|
150
|
|
|
|
|
|
|
|
|
151
|
|
|
|
|
|
|
sub _dump { |
|
152
|
7
|
|
|
7
|
|
19
|
my ($label, $ref) = @_; |
|
153
|
7
|
50
|
|
|
|
23
|
if ($can{dmp}) { |
|
154
|
7
|
|
|
|
|
48
|
print STDERR Data::Peek::DDumper ({ $label => $ref }); |
|
155
|
|
|
|
|
|
|
} |
|
156
|
|
|
|
|
|
|
else { |
|
157
|
0
|
|
|
|
|
0
|
print STDERR Data::Dumper->Dump ([$ref], [$label]); |
|
158
|
|
|
|
|
|
|
} |
|
159
|
|
|
|
|
|
|
} # _dump |
|
160
|
|
|
|
|
|
|
|
|
161
|
|
|
|
|
|
|
sub _parser { |
|
162
|
342
|
100
|
|
342
|
|
1460
|
my $type = shift or return ""; |
|
163
|
100
|
|
|
|
|
308
|
$type = lc $type; |
|
164
|
|
|
|
|
|
|
# Aliases and fullnames |
|
165
|
100
|
100
|
|
|
|
343
|
$type eq "excel" and return "xls"; |
|
166
|
99
|
50
|
|
|
|
302
|
$type eq "excel2007" and return "xlsx"; |
|
167
|
99
|
100
|
|
|
|
307
|
$type eq "oo" and return "sxc"; |
|
168
|
98
|
100
|
|
|
|
296
|
$type eq "ods" and return "sxc"; |
|
169
|
96
|
100
|
|
|
|
292
|
$type eq "openoffice" and return "sxc"; |
|
170
|
95
|
50
|
|
|
|
291
|
$type eq "libreoffice" and return "sxc"; |
|
171
|
95
|
100
|
|
|
|
265
|
$type eq "perl" and return "prl"; |
|
172
|
94
|
50
|
|
|
|
261
|
$type eq "squirelcalc" and return "sc"; |
|
173
|
94
|
100
|
|
|
|
558
|
return exists $can{$type} ? $type : ""; |
|
174
|
|
|
|
|
|
|
} # _parser |
|
175
|
|
|
|
|
|
|
|
|
176
|
|
|
|
|
|
|
sub new { |
|
177
|
12
|
|
|
12
|
1
|
6892
|
my $class = shift; |
|
178
|
12
|
|
|
|
|
49
|
my $r = ReadData (@_); |
|
179
|
12
|
100
|
|
|
|
76
|
unless ($r) { |
|
180
|
2
|
50
|
|
|
|
17
|
@_ and return; # new with arguments failed to open resource |
|
181
|
0
|
|
|
|
|
0
|
$r = [{ |
|
182
|
|
|
|
|
|
|
parsers => [], |
|
183
|
|
|
|
|
|
|
error => undef, |
|
184
|
|
|
|
|
|
|
sheets => 0, |
|
185
|
|
|
|
|
|
|
sheet => { }, |
|
186
|
|
|
|
|
|
|
}]; |
|
187
|
|
|
|
|
|
|
} |
|
188
|
10
|
|
|
|
|
212
|
bless $r => $class; |
|
189
|
|
|
|
|
|
|
} # new |
|
190
|
|
|
|
|
|
|
|
|
191
|
|
|
|
|
|
|
# Spreadsheet::Read::parses ("csv") or die "Cannot parse CSV" |
|
192
|
|
|
|
|
|
|
sub parses { |
|
193
|
63
|
100
|
|
63
|
1
|
145584
|
ref $_[0] eq __PACKAGE__ and shift; |
|
194
|
63
|
100
|
|
|
|
277
|
my $type = _parser (shift) or return 0; |
|
195
|
61
|
100
|
|
|
|
407
|
if ($can{$type} =~ m/^!\s*(.*)/) { |
|
196
|
8
|
|
|
|
|
32
|
$@ = $1; |
|
197
|
8
|
|
|
|
|
28
|
return 0; |
|
198
|
|
|
|
|
|
|
} |
|
199
|
53
|
|
|
|
|
183
|
return $can{$type}; |
|
200
|
|
|
|
|
|
|
} # parses |
|
201
|
|
|
|
|
|
|
|
|
202
|
|
|
|
|
|
|
sub sheets { |
|
203
|
4
|
|
|
4
|
1
|
14
|
my $ctrl = shift->[0]; |
|
204
|
4
|
|
|
|
|
6
|
my %s = %{$ctrl->{sheet}}; |
|
|
4
|
|
|
|
|
19
|
|
|
205
|
4
|
100
|
|
|
|
35
|
wantarray ? sort { $s{$a} <=> $s{$b} } keys %s : $ctrl->{sheets}; |
|
|
4
|
|
|
|
|
26
|
|
|
206
|
|
|
|
|
|
|
} # sheets |
|
207
|
|
|
|
|
|
|
|
|
208
|
|
|
|
|
|
|
# col2label (4) => "D" |
|
209
|
|
|
|
|
|
|
sub col2label { |
|
210
|
15697
|
100
|
|
15697
|
1
|
32919
|
ref $_[0] eq __PACKAGE__ and shift; |
|
211
|
15697
|
|
|
|
|
20483
|
my $c = shift; |
|
212
|
15697
|
100
|
100
|
|
|
41042
|
defined $c && $c > 0 or return ""; |
|
213
|
15693
|
|
|
|
|
21423
|
my $cell = ""; |
|
214
|
15693
|
|
|
|
|
26123
|
while ($c) { |
|
215
|
53
|
|
|
53
|
|
30000
|
use integer; |
|
|
53
|
|
|
|
|
836
|
|
|
|
53
|
|
|
|
|
301
|
|
|
216
|
|
|
|
|
|
|
|
|
217
|
15710
|
|
|
|
|
29729
|
substr $cell, 0, 0, chr (--$c % 26 + ord "A"); |
|
218
|
15710
|
|
|
|
|
27647
|
$c /= 26; |
|
219
|
|
|
|
|
|
|
} |
|
220
|
15693
|
|
|
|
|
42026
|
$cell; |
|
221
|
|
|
|
|
|
|
} # col2label |
|
222
|
|
|
|
|
|
|
|
|
223
|
|
|
|
|
|
|
# cr2cell (4, 18) => "D18" |
|
224
|
|
|
|
|
|
|
# No prototype to allow 'cr2cell (@rowcol)' |
|
225
|
|
|
|
|
|
|
sub cr2cell { |
|
226
|
15495
|
100
|
|
15495
|
1
|
189546
|
ref $_[0] eq __PACKAGE__ and shift; |
|
227
|
15495
|
|
|
|
|
25206
|
my ($c, $r) = @_; |
|
228
|
15495
|
100
|
100
|
|
|
72297
|
defined $c && defined $r && $c > 0 && $r > 0 or return ""; |
|
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
229
|
15489
|
|
|
|
|
24027
|
col2label ($c) . $r; |
|
230
|
|
|
|
|
|
|
} # cr2cell |
|
231
|
|
|
|
|
|
|
|
|
232
|
|
|
|
|
|
|
# cell2cr ("D18") => (4, 18) |
|
233
|
|
|
|
|
|
|
sub cell2cr { |
|
234
|
604
|
100
|
|
604
|
1
|
610707
|
ref $_[0] eq __PACKAGE__ and shift; |
|
235
|
604
|
100
|
100
|
|
|
5633
|
my ($cc, $r) = (uc ($_[0]||"") =~ m/^([A-Z]+)([0-9]+)$/) or return (0, 0); |
|
236
|
600
|
|
|
|
|
1241
|
my $c = 0; |
|
237
|
600
|
|
|
|
|
2499
|
while ($cc =~ s/^([A-Z])//) { |
|
238
|
608
|
|
|
|
|
2497
|
$c = 26 * $c + 1 + ord ($1) - ord ("A"); |
|
239
|
|
|
|
|
|
|
} |
|
240
|
600
|
|
|
|
|
2112
|
($c, $r); |
|
241
|
|
|
|
|
|
|
} # cell2cr |
|
242
|
|
|
|
|
|
|
|
|
243
|
|
|
|
|
|
|
# my @row = cellrow ($book->[1], 1); |
|
244
|
|
|
|
|
|
|
# my @row = $book->cellrow (1, 1); |
|
245
|
|
|
|
|
|
|
sub cellrow { |
|
246
|
10
|
100
|
|
10
|
1
|
69
|
my $sheet = ref $_[0] eq __PACKAGE__ ? (shift)->[shift] : shift or return; |
|
|
|
100
|
|
|
|
|
|
|
247
|
9
|
100
|
66
|
|
|
65
|
ref $sheet eq "HASH" && exists $sheet->{cell} or return; |
|
248
|
7
|
50
|
33
|
|
|
39
|
exists $sheet->{maxcol} && exists $sheet->{maxrow} or return; |
|
249
|
7
|
100
|
|
|
|
26
|
my $row = shift or return; |
|
250
|
6
|
100
|
100
|
|
|
39
|
$row > 0 && $row <= $sheet->{maxrow} or return; |
|
251
|
4
|
|
|
|
|
12
|
my $s = $sheet->{cell}; |
|
252
|
4
|
|
|
|
|
17
|
map { $s->[$_][$row] } 1..$sheet->{maxcol}; |
|
|
76
|
|
|
|
|
147
|
|
|
253
|
|
|
|
|
|
|
} # cellrow |
|
254
|
|
|
|
|
|
|
|
|
255
|
|
|
|
|
|
|
# my @row = row ($book->[1], 1); |
|
256
|
|
|
|
|
|
|
# my @row = $book->row (1, 1); |
|
257
|
|
|
|
|
|
|
sub row { |
|
258
|
10
|
100
|
|
10
|
1
|
3508
|
my $sheet = ref $_[0] eq __PACKAGE__ ? (shift)->[shift] : shift or return; |
|
|
|
100
|
|
|
|
|
|
|
259
|
9
|
100
|
66
|
|
|
65
|
ref $sheet eq "HASH" && exists $sheet->{cell} or return; |
|
260
|
7
|
50
|
33
|
|
|
39
|
exists $sheet->{maxcol} && exists $sheet->{maxrow} or return; |
|
261
|
7
|
100
|
|
|
|
48
|
my $row = shift or return; |
|
262
|
6
|
100
|
100
|
|
|
40
|
$row > 0 && $row <= $sheet->{maxrow} or return; |
|
263
|
4
|
|
|
|
|
23
|
map { $sheet->{cr2cell ($_, $row)} } 1..$sheet->{maxcol}; |
|
|
76
|
|
|
|
|
134
|
|
|
264
|
|
|
|
|
|
|
} # row |
|
265
|
|
|
|
|
|
|
|
|
266
|
|
|
|
|
|
|
# Convert {cell}'s [column][row] to a [row][column] list |
|
267
|
|
|
|
|
|
|
# my @rows = rows ($book->[1]); |
|
268
|
|
|
|
|
|
|
sub rows { |
|
269
|
33
|
50
|
|
33
|
1
|
19369
|
my $sheet = ref $_[0] eq __PACKAGE__ ? (shift)->[shift] : shift or return; |
|
|
|
100
|
|
|
|
|
|
|
270
|
30
|
100
|
100
|
|
|
169
|
ref $sheet eq "HASH" && exists $sheet->{cell} or return; |
|
271
|
26
|
100
|
100
|
|
|
120
|
exists $sheet->{maxcol} && exists $sheet->{maxrow} or return; |
|
272
|
5
|
|
|
|
|
15
|
my $s = $sheet->{cell}; |
|
273
|
|
|
|
|
|
|
|
|
274
|
|
|
|
|
|
|
map { |
|
275
|
20
|
|
|
|
|
33
|
my $r = $_; |
|
276
|
20
|
|
|
|
|
36
|
[ map { $s->[$_][$r] } 1..$sheet->{maxcol} ]; |
|
|
80
|
|
|
|
|
205
|
|
|
277
|
5
|
|
|
|
|
28
|
} 1..$sheet->{maxrow}; |
|
278
|
|
|
|
|
|
|
} # rows |
|
279
|
|
|
|
|
|
|
|
|
280
|
|
|
|
|
|
|
sub sheet { |
|
281
|
23
|
|
|
23
|
1
|
650
|
my ($book, $sheet) = @_; |
|
282
|
23
|
100
|
100
|
|
|
116
|
$book && $sheet or return; |
|
283
|
21
|
|
|
|
|
43
|
my $class = "Spreadsheet::Read::Sheet"; |
|
284
|
|
|
|
|
|
|
$sheet =~ m/^[0-9]+$/ && $sheet >= 1 && $sheet <= $book->[0]{sheets} and |
|
285
|
21
|
100
|
66
|
|
|
301
|
return bless $book->[$sheet] => $class; |
|
|
|
|
100
|
|
|
|
|
|
286
|
|
|
|
|
|
|
exists $book->[0]{sheet}{$sheet} and |
|
287
|
6
|
100
|
|
|
|
26
|
return bless $book->[$book->[0]{sheet}{$sheet}] => $class; |
|
288
|
5
|
|
|
|
|
17
|
foreach my $idx (1 .. $book->[0]{sheets}) { |
|
289
|
6
|
100
|
|
|
|
24
|
$book->[$idx]{label} eq $sheet and |
|
290
|
|
|
|
|
|
|
return bless $book->[$idx] => $class; |
|
291
|
|
|
|
|
|
|
} |
|
292
|
4
|
|
|
|
|
19
|
return; |
|
293
|
|
|
|
|
|
|
} # sheet |
|
294
|
|
|
|
|
|
|
|
|
295
|
|
|
|
|
|
|
# If option "clip" is set, remove the trailing rows and |
|
296
|
|
|
|
|
|
|
# columns in each sheet that contain no visible data |
|
297
|
|
|
|
|
|
|
sub _clipsheets { |
|
298
|
227
|
|
|
227
|
|
616
|
my ($opt, $ref) = @_; |
|
299
|
|
|
|
|
|
|
|
|
300
|
227
|
50
|
|
|
|
766
|
$ref->[0]{sheets} or return $ref; |
|
301
|
|
|
|
|
|
|
|
|
302
|
227
|
|
|
|
|
610
|
my ($rc, $cl) = ($opt->{rc}, $opt->{cells}); |
|
303
|
227
|
|
|
|
|
646
|
my ($oc, $os, $oa) = ($opt->{clip}, $opt->{strip}, $opt->{attr}); |
|
304
|
|
|
|
|
|
|
|
|
305
|
|
|
|
|
|
|
# Strip leading/trailing spaces |
|
306
|
227
|
100
|
100
|
|
|
1020
|
if ($os || $oc) { |
|
307
|
212
|
|
|
|
|
703
|
foreach my $sheet (1 .. $ref->[0]{sheets}) { |
|
308
|
254
|
|
|
|
|
659
|
$ref->[$sheet]{indx} = $sheet; |
|
309
|
254
|
|
|
|
|
448
|
my $ss = $ref->[$sheet]; |
|
310
|
254
|
100
|
66
|
|
|
1331
|
$ss->{maxrow} && $ss->{maxcol} or next; |
|
311
|
247
|
|
|
|
|
587
|
my ($mc, $mr) = (0, 0); |
|
312
|
247
|
|
|
|
|
656
|
foreach my $row (1 .. $ss->{maxrow}) { |
|
313
|
1954
|
|
|
|
|
3372
|
foreach my $col (1 .. $ss->{maxcol}) { |
|
314
|
16636
|
100
|
|
|
|
26429
|
if ($rc) { |
|
315
|
14738
|
100
|
|
|
|
26967
|
defined $ss->{cell}[$col][$row] or next; |
|
316
|
5881
|
100
|
|
|
|
10285
|
$os & 2 and $ss->{cell}[$col][$row] =~ s/\s+$//; |
|
317
|
5881
|
100
|
|
|
|
9764
|
$os & 1 and $ss->{cell}[$col][$row] =~ s/^\s+//; |
|
318
|
5881
|
100
|
|
|
|
10671
|
if (length $ss->{cell}[$col][$row]) { |
|
319
|
4417
|
100
|
|
|
|
7531
|
$col > $mc and $mc = $col; |
|
320
|
4417
|
100
|
|
|
|
7463
|
$row > $mr and $mr = $row; |
|
321
|
|
|
|
|
|
|
} |
|
322
|
|
|
|
|
|
|
} |
|
323
|
7779
|
100
|
|
|
|
12465
|
if ($cl) { |
|
324
|
7560
|
|
|
|
|
11687
|
my $cell = cr2cell ($col, $row); |
|
325
|
7560
|
100
|
|
|
|
15679
|
defined $ss->{$cell} or next; |
|
326
|
6233
|
100
|
|
|
|
11280
|
$os & 2 and $ss->{$cell} =~ s/\s+$//; |
|
327
|
6233
|
100
|
|
|
|
10084
|
$os & 1 and $ss->{$cell} =~ s/^\s+//; |
|
328
|
6233
|
100
|
|
|
|
11221
|
if (length $ss->{$cell}) { |
|
329
|
4757
|
100
|
|
|
|
7763
|
$col > $mc and $mc = $col; |
|
330
|
4757
|
100
|
|
|
|
9090
|
$row > $mr and $mr = $row; |
|
331
|
|
|
|
|
|
|
} |
|
332
|
|
|
|
|
|
|
} |
|
333
|
|
|
|
|
|
|
} |
|
334
|
|
|
|
|
|
|
} |
|
335
|
|
|
|
|
|
|
|
|
336
|
247
|
100
|
66
|
|
|
1430
|
$oc && ($mc < $ss->{maxcol} || $mr < $ss->{maxrow}) or next; |
|
|
|
|
66
|
|
|
|
|
|
337
|
|
|
|
|
|
|
|
|
338
|
|
|
|
|
|
|
# Remove trailing empty columns |
|
339
|
106
|
|
|
|
|
277
|
foreach my $col (($mc + 1) .. $ss->{maxcol}) { |
|
340
|
243
|
100
|
|
|
|
627
|
$rc and undef $ss->{cell}[$col]; |
|
341
|
243
|
100
|
|
|
|
518
|
$oa and undef $ss->{attr}[$col]; |
|
342
|
243
|
100
|
|
|
|
462
|
$cl or next; |
|
343
|
193
|
|
|
|
|
333
|
my $c = col2label ($col); |
|
344
|
193
|
|
|
|
|
1424
|
delete $ss->{"$c$_"} for 1 .. $ss->{maxrow}; |
|
345
|
|
|
|
|
|
|
} |
|
346
|
|
|
|
|
|
|
|
|
347
|
|
|
|
|
|
|
# Remove trailing empty rows |
|
348
|
106
|
|
|
|
|
285
|
foreach my $row (($mr + 1) .. $ss->{maxrow}) { |
|
349
|
139
|
|
|
|
|
271
|
foreach my $col (1 .. $mc) { |
|
350
|
64
|
50
|
|
|
|
143
|
$cl and delete $ss->{cr2cell ($col, $row)}; |
|
351
|
64
|
50
|
|
|
|
183
|
$rc and undef $ss->{cell} [$col][$row]; |
|
352
|
64
|
50
|
|
|
|
152
|
$oa and undef $ss->{attr} [$col][$row]; |
|
353
|
|
|
|
|
|
|
} |
|
354
|
|
|
|
|
|
|
} |
|
355
|
|
|
|
|
|
|
|
|
356
|
106
|
|
|
|
|
330
|
($ss->{maxrow}, $ss->{maxcol}) = ($mr, $mc); |
|
357
|
|
|
|
|
|
|
} |
|
358
|
|
|
|
|
|
|
} |
|
359
|
|
|
|
|
|
|
|
|
360
|
227
|
100
|
|
|
|
657
|
if ($opt->{pivot}) { |
|
361
|
1
|
|
|
|
|
5
|
foreach my $sheet (1 .. $ref->[0]{sheets}) { |
|
362
|
1
|
|
|
|
|
4
|
my $ss = $ref->[$sheet]; |
|
363
|
1
|
0
|
33
|
|
|
4
|
$ss->{maxrow} || $ss->{maxcol} or next; |
|
364
|
1
|
50
|
|
|
|
6
|
my $mx = $ss->{maxrow} > $ss->{maxcol} ? $ss->{maxrow} : $ss->{maxcol}; |
|
365
|
1
|
|
|
|
|
5
|
foreach my $row (2 .. $mx) { |
|
366
|
18
|
|
|
|
|
40
|
foreach my $col (1 .. ($row - 1)) { |
|
367
|
|
|
|
|
|
|
$opt->{rc} and |
|
368
|
|
|
|
|
|
|
($ss->{cell}[$col][$row], $ss->{cell}[$row][$col]) = |
|
369
|
171
|
50
|
|
|
|
527
|
($ss->{cell}[$row][$col], $ss->{cell}[$col][$row]); |
|
370
|
|
|
|
|
|
|
$opt->{cells} and |
|
371
|
|
|
|
|
|
|
($ss->{cr2cell ($col, $row)}, $ss->{cr2cell ($row, $col)}) = |
|
372
|
171
|
50
|
|
|
|
352
|
($ss->{cr2cell ($row, $col)}, $ss->{cr2cell ($col, $row)}); |
|
373
|
|
|
|
|
|
|
} |
|
374
|
|
|
|
|
|
|
} |
|
375
|
1
|
|
|
|
|
9
|
($ss->{maxcol}, $ss->{maxrow}) = ($ss->{maxrow}, $ss->{maxcol}); |
|
376
|
|
|
|
|
|
|
} |
|
377
|
|
|
|
|
|
|
} |
|
378
|
|
|
|
|
|
|
|
|
379
|
227
|
|
|
|
|
5657
|
$ref; |
|
380
|
|
|
|
|
|
|
} # _clipsheets |
|
381
|
|
|
|
|
|
|
|
|
382
|
|
|
|
|
|
|
# Convert a single color (index) to a color |
|
383
|
|
|
|
|
|
|
sub _xls_color { |
|
384
|
1742
|
|
|
1742
|
|
21196
|
my $clr = shift; |
|
385
|
1742
|
100
|
|
|
|
3558
|
defined $clr or return undef; |
|
386
|
850
|
50
|
|
|
|
1532
|
$clr eq "#000000" and return undef; |
|
387
|
850
|
50
|
|
|
|
1689
|
$clr =~ m/^#[0-9a-fA-F]+$/ and return lc $clr; |
|
388
|
850
|
100
|
66
|
|
|
2901
|
$clr == 0 || $clr == 32767 and return undef; # Default fg color |
|
389
|
468
|
|
|
|
|
1142
|
return "#" . lc Spreadsheet::ParseExcel->ColorIdxToRGB ($clr); |
|
390
|
|
|
|
|
|
|
} # _xls_color |
|
391
|
|
|
|
|
|
|
|
|
392
|
|
|
|
|
|
|
# Convert a fill [ $pattern, $front_color, $back_color ] to a single background |
|
393
|
|
|
|
|
|
|
sub _xls_fill { |
|
394
|
1526
|
|
|
1526
|
|
2743
|
my ($p, $fg, $bg) = @_; |
|
395
|
1526
|
50
|
|
|
|
2702
|
defined $p or return undef; |
|
396
|
1526
|
50
|
|
|
|
2759
|
$p == 32767 and return undef; # Default fg color |
|
397
|
1526
|
100
|
100
|
|
|
17004
|
$p == 0 && !defined $bg and return undef; # No fill bg color |
|
398
|
634
|
100
|
|
|
|
1152
|
$p == 1 and return _xls_color ($fg); |
|
399
|
418
|
50
|
33
|
|
|
6280
|
$bg < 8 || $bg > 63 and return undef; # see Workbook.pm#106 |
|
400
|
0
|
|
|
|
|
0
|
return _xls_color ($bg); |
|
401
|
|
|
|
|
|
|
} # _xls_fill |
|
402
|
|
|
|
|
|
|
|
|
403
|
|
|
|
|
|
|
sub ReadData { |
|
404
|
279
|
100
|
|
279
|
1
|
301347
|
my $txt = shift or return; |
|
405
|
|
|
|
|
|
|
|
|
406
|
276
|
|
|
|
|
637
|
my %opt; |
|
407
|
276
|
100
|
|
|
|
856
|
if (@_) { |
|
408
|
221
|
100
|
|
|
|
1175
|
if (ref $_[0] eq "HASH") { %opt = %{shift @_} } |
|
|
20
|
50
|
|
|
|
35
|
|
|
|
20
|
|
|
|
|
86
|
|
|
409
|
201
|
|
|
|
|
836
|
elsif (@_ % 2 == 0) { %opt = @_ } |
|
410
|
|
|
|
|
|
|
} |
|
411
|
|
|
|
|
|
|
|
|
412
|
276
|
100
|
|
|
|
1205
|
exists $opt{rc} or $opt{rc} = $def_opts{rc}; |
|
413
|
276
|
100
|
|
|
|
968
|
exists $opt{cells} or $opt{cells} = $def_opts{cells}; |
|
414
|
276
|
100
|
|
|
|
899
|
exists $opt{attr} or $opt{attr} = $def_opts{attr}; |
|
415
|
276
|
100
|
|
|
|
796
|
exists $opt{clip} or $opt{clip} = $opt{cells}; |
|
416
|
276
|
100
|
|
|
|
839
|
exists $opt{strip} or $opt{strip} = $def_opts{strip}; |
|
417
|
276
|
100
|
|
|
|
954
|
exists $opt{dtfmt} or $opt{dtfmt} = $def_opts{dtfmt}; |
|
418
|
|
|
|
|
|
|
|
|
419
|
|
|
|
|
|
|
# $debug = $opt{debug} // 0; |
|
420
|
276
|
100
|
|
|
|
808
|
$debug = defined $opt{debug} ? $opt{debug} : $def_opts{debug}; |
|
421
|
276
|
100
|
|
|
|
745
|
$debug > 4 and _dump (Options => \%opt); |
|
422
|
|
|
|
|
|
|
|
|
423
|
31
|
|
|
|
|
105
|
my %parser_opts = map { $_ => $opt{$_} } |
|
424
|
276
|
|
|
|
|
2651
|
grep { !exists $def_opts{$_} } |
|
|
1764
|
|
|
|
|
3624
|
|
|
425
|
|
|
|
|
|
|
keys %opt; |
|
426
|
|
|
|
|
|
|
|
|
427
|
276
|
|
|
|
|
1162
|
my $_parser = _parser ($opt{parser}); |
|
428
|
|
|
|
|
|
|
|
|
429
|
276
|
100
|
|
|
|
1146
|
my $io_ref = ref ($txt) =~ m/GLOB|IO/ ? $txt : undef; |
|
430
|
|
|
|
|
|
|
my $io_fil = $io_ref ? 0 : $txt =~ m/\0/ ? 0 |
|
431
|
53
|
100
|
|
53
|
|
115311
|
: do { no warnings "newline"; -f $txt }; |
|
|
53
|
100
|
|
|
|
175
|
|
|
|
53
|
|
|
|
|
282478
|
|
|
|
276
|
|
|
|
|
1062
|
|
|
|
255
|
|
|
|
|
6142
|
|
|
432
|
276
|
100
|
100
|
|
|
1781
|
my $io_txt = $io_ref || $io_fil ? 0 : 1; |
|
433
|
|
|
|
|
|
|
|
|
434
|
276
|
100
|
100
|
|
|
3276
|
$io_fil && ! -s $txt and do { $@ = "$txt is empty"; return }; |
|
|
11
|
|
|
|
|
60
|
|
|
|
11
|
|
|
|
|
65
|
|
|
435
|
265
|
100
|
100
|
|
|
1540
|
$io_ref && eof $txt and do { $@ = "Empty stream"; return }; |
|
|
5
|
|
|
|
|
20
|
|
|
|
5
|
|
|
|
|
86
|
|
|
436
|
|
|
|
|
|
|
|
|
437
|
260
|
100
|
100
|
|
|
2194
|
if ($opt{parser} ? $_parser eq "csv" : ($io_fil && $txt =~ m/\.(csv)$/i)) { |
|
|
|
100
|
|
|
|
|
|
|
438
|
106
|
50
|
|
|
|
378
|
$can{csv} or croak "CSV parser not installed"; |
|
439
|
|
|
|
|
|
|
|
|
440
|
106
|
100
|
|
|
|
410
|
my $label = defined $opt{label} ? $opt{label} : $io_fil ? $txt : "IO"; |
|
|
|
100
|
|
|
|
|
|
|
441
|
|
|
|
|
|
|
|
|
442
|
106
|
50
|
|
|
|
411
|
$debug and print STDERR "Opening CSV $label using $can{csv}-", $can{csv}->VERSION, "\n"; |
|
443
|
|
|
|
|
|
|
|
|
444
|
|
|
|
|
|
|
my @data = ( |
|
445
|
|
|
|
|
|
|
{ type => "csv", |
|
446
|
|
|
|
|
|
|
parser => $can{csv}, |
|
447
|
|
|
|
|
|
|
version => $can{csv}->VERSION, |
|
448
|
|
|
|
|
|
|
parsers => [ { |
|
449
|
|
|
|
|
|
|
type => "csv", |
|
450
|
|
|
|
|
|
|
parser => $can{csv}, |
|
451
|
|
|
|
|
|
|
version => $can{csv}->VERSION, |
|
452
|
106
|
|
|
|
|
3423
|
}], |
|
453
|
|
|
|
|
|
|
error => undef, |
|
454
|
|
|
|
|
|
|
quote => '"', |
|
455
|
|
|
|
|
|
|
sepchar => ',', |
|
456
|
|
|
|
|
|
|
sheets => 1, |
|
457
|
|
|
|
|
|
|
sheet => { $label => 1 }, |
|
458
|
|
|
|
|
|
|
}, |
|
459
|
|
|
|
|
|
|
{ parser => 0, |
|
460
|
|
|
|
|
|
|
label => $label, |
|
461
|
|
|
|
|
|
|
maxrow => 0, |
|
462
|
|
|
|
|
|
|
maxcol => 0, |
|
463
|
|
|
|
|
|
|
cell => [], |
|
464
|
|
|
|
|
|
|
attr => [], |
|
465
|
|
|
|
|
|
|
merged => [], |
|
466
|
|
|
|
|
|
|
active => 1, |
|
467
|
|
|
|
|
|
|
}, |
|
468
|
|
|
|
|
|
|
); |
|
469
|
|
|
|
|
|
|
|
|
470
|
106
|
|
|
|
|
560
|
my ($sep, $quo, $in) = (",", '"'); |
|
471
|
106
|
100
|
|
|
|
332
|
defined $opt{sep} and $sep = $opt{sep}; |
|
472
|
106
|
100
|
|
|
|
281
|
defined $opt{quote} and $quo = $opt{quote}; |
|
473
|
106
|
50
|
|
|
|
311
|
$debug > 8 and _dump (debug => { |
|
474
|
|
|
|
|
|
|
data => \@data, txt => $txt, io_ref => $io_ref, io_fil => $io_fil }); |
|
475
|
106
|
100
|
|
|
|
322
|
if ($io_fil) { |
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
476
|
94
|
100
|
100
|
|
|
306
|
unless (defined $opt{quote} && defined $opt{sep}) { |
|
477
|
87
|
50
|
|
|
|
3736
|
open $in, "<", $txt or return; |
|
478
|
87
|
|
|
|
|
1831
|
my $l1 = <$in>; |
|
479
|
|
|
|
|
|
|
|
|
480
|
87
|
100
|
|
|
|
439
|
$quo = defined $opt{quote} ? $opt{quote} : '"'; |
|
481
|
|
|
|
|
|
|
$sep = # If explicitly set, use it |
|
482
|
|
|
|
|
|
|
defined $opt{sep} ? $opt{sep} : |
|
483
|
|
|
|
|
|
|
# otherwise start auto-detect with quoted strings |
|
484
|
87
|
50
|
|
|
|
913
|
$l1 =~ m/["0-9];["0-9;]/ ? ";" : |
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
485
|
|
|
|
|
|
|
$l1 =~ m/["0-9],["0-9,]/ ? "," : |
|
486
|
|
|
|
|
|
|
$l1 =~ m/["0-9]\t["0-9,]/ ? "\t" : |
|
487
|
|
|
|
|
|
|
$l1 =~ m/["0-9]\|["0-9,]/ ? "|" : |
|
488
|
|
|
|
|
|
|
# If neither, then for unquoted strings |
|
489
|
|
|
|
|
|
|
$l1 =~ m/\w;[\w;]/ ? ";" : |
|
490
|
|
|
|
|
|
|
$l1 =~ m/\w,[\w,]/ ? "," : |
|
491
|
|
|
|
|
|
|
$l1 =~ m/\w\t[\w,]/ ? "\t" : |
|
492
|
|
|
|
|
|
|
$l1 =~ m/\w\|[\w,]/ ? "|" : |
|
493
|
|
|
|
|
|
|
"," ; |
|
494
|
87
|
|
|
|
|
1348
|
close $in; |
|
495
|
|
|
|
|
|
|
} |
|
496
|
94
|
50
|
|
|
|
2882
|
open $in, "<", $txt or return; |
|
497
|
|
|
|
|
|
|
} |
|
498
|
|
|
|
|
|
|
elsif ($io_ref) { |
|
499
|
10
|
|
|
|
|
23
|
$in = $txt; |
|
500
|
|
|
|
|
|
|
} |
|
501
|
|
|
|
|
|
|
elsif (ref $txt eq "SCALAR") { |
|
502
|
1
|
50
|
|
|
|
13
|
open $in, "<", $txt or croak "Cannot open input: $!"; |
|
503
|
|
|
|
|
|
|
} |
|
504
|
|
|
|
|
|
|
elsif ($txt =~ m/[\r\n,;]/) { |
|
505
|
1
|
50
|
|
2
|
|
54
|
open $in, "<", \$txt or croak "Cannot open input: $!"; |
|
|
2
|
|
|
|
|
23
|
|
|
|
2
|
|
|
|
|
5
|
|
|
|
2
|
|
|
|
|
18
|
|
|
506
|
|
|
|
|
|
|
} |
|
507
|
|
|
|
|
|
|
else { |
|
508
|
0
|
|
|
|
|
0
|
warn "Input type ", ref $txt, |
|
509
|
|
|
|
|
|
|
" might not be supported. Please file a ticket\n"; |
|
510
|
0
|
|
|
|
|
0
|
$in = $txt; # Now pray ... |
|
511
|
|
|
|
|
|
|
} |
|
512
|
106
|
50
|
|
|
|
1409
|
$debug > 1 and print STDERR "CSV sep_char '$sep', quote_char '$quo'\n"; |
|
513
|
|
|
|
|
|
|
my $csv = $can{csv}->new ({ |
|
514
|
|
|
|
|
|
|
%parser_opts, |
|
515
|
|
|
|
|
|
|
|
|
516
|
|
|
|
|
|
|
sep_char => ($data[0]{sepchar} = $sep), |
|
517
|
106
|
50
|
|
|
|
1555
|
quote_char => ($data[0]{quote} = $quo), |
|
518
|
|
|
|
|
|
|
keep_meta_info => 1, |
|
519
|
|
|
|
|
|
|
binary => 1, |
|
520
|
|
|
|
|
|
|
auto_diag => 1, |
|
521
|
|
|
|
|
|
|
}) or croak "Cannot create a csv ('$sep', '$quo') parser!"; |
|
522
|
|
|
|
|
|
|
|
|
523
|
106
|
|
|
|
|
23943
|
while (my $row = $csv->getline ($in)) { |
|
524
|
413
|
50
|
|
|
|
70451
|
my @row = @$row or last; |
|
525
|
|
|
|
|
|
|
|
|
526
|
413
|
|
|
|
|
948
|
my $r = ++$data[1]{maxrow}; |
|
527
|
413
|
100
|
|
|
|
1070
|
@row > $data[1]{maxcol} and $data[1]{maxcol} = @row; |
|
528
|
413
|
|
|
|
|
1121
|
foreach my $c (0 .. $#row) { |
|
529
|
2427
|
|
|
|
|
3465
|
my $val = $row[$c]; |
|
530
|
2427
|
|
|
|
|
4442
|
my $cell = cr2cell ($c + 1, $r); |
|
531
|
2427
|
100
|
|
|
|
6865
|
$opt{rc} and $data[1]{cell}[$c + 1][$r] = $val; |
|
532
|
2427
|
100
|
|
|
|
6275
|
$opt{cells} and $data[1]{$cell} = $val; |
|
533
|
2427
|
50
|
|
|
|
12353
|
$opt{attr} and $data[1]{attr}[$c + 1][$r] = { @def_attr }; |
|
534
|
|
|
|
|
|
|
} |
|
535
|
|
|
|
|
|
|
} |
|
536
|
106
|
50
|
|
|
|
14838
|
$csv->eof () or $data[0]{error} = [ $csv->error_diag ]; |
|
537
|
106
|
|
|
|
|
1659
|
close $in; |
|
538
|
|
|
|
|
|
|
|
|
539
|
106
|
|
|
|
|
367
|
for (@{$data[1]{cell}}) { |
|
|
106
|
|
|
|
|
547
|
|
|
540
|
734
|
100
|
|
|
|
1679
|
defined or $_ = []; |
|
541
|
|
|
|
|
|
|
} |
|
542
|
106
|
|
|
|
|
571
|
return _clipsheets \%opt, [ @data ]; |
|
543
|
|
|
|
|
|
|
} |
|
544
|
|
|
|
|
|
|
|
|
545
|
154
|
100
|
|
|
|
466
|
if ($io_txt) { # && $_parser !~ m/^xlsx?$/) { |
|
546
|
29
|
100
|
66
|
|
|
435
|
if ( # /etc/magic: Microsoft Office Document |
|
|
|
50
|
66
|
|
|
|
|
|
|
|
100
|
66
|
|
|
|
|
|
547
|
|
|
|
|
|
|
$txt =~ m{\A(\376\067\0\043 |
|
548
|
|
|
|
|
|
|
|\320\317\021\340\241\261\032\341 |
|
549
|
|
|
|
|
|
|
|\333\245-\0\0\0)}x |
|
550
|
|
|
|
|
|
|
# /usr/share/misc/magic |
|
551
|
|
|
|
|
|
|
|| $txt =~ m{\A.{2080}Microsoft Excel 5.0 Worksheet} |
|
552
|
|
|
|
|
|
|
|| $txt =~ m{\A\x09\x04\x06\x00\x00\x00\x10\x00} |
|
553
|
|
|
|
|
|
|
) { |
|
554
|
1
|
50
|
|
|
|
7
|
$can{xls} or croak "Spreadsheet::ParseExcel not installed"; |
|
555
|
1
|
|
|
|
|
2
|
my $tmpfile; |
|
556
|
1
|
50
|
|
|
|
4
|
if ($can{ios}) { # Do not use a temp file if IO::Scalar is available |
|
557
|
1
|
|
|
|
|
3
|
$tmpfile = \$txt; |
|
558
|
|
|
|
|
|
|
} |
|
559
|
|
|
|
|
|
|
else { |
|
560
|
0
|
|
|
|
|
0
|
$tmpfile = File::Temp->new (SUFFIX => ".xls", UNLINK => 1); |
|
561
|
0
|
|
|
|
|
0
|
binmode $tmpfile; |
|
562
|
0
|
|
|
|
|
0
|
print $tmpfile $txt; |
|
563
|
0
|
|
|
|
|
0
|
close $tmpfile; |
|
564
|
|
|
|
|
|
|
} |
|
565
|
1
|
50
|
|
|
|
59
|
open $io_ref, "<", $tmpfile or do { $@ = $!; return }; |
|
|
0
|
|
|
|
|
0
|
|
|
|
0
|
|
|
|
|
0
|
|
|
566
|
1
|
|
|
|
|
1005
|
$io_txt = 0; |
|
567
|
1
|
|
|
|
|
6
|
$_parser = _parser ($opt{parser} = "xls"); |
|
568
|
|
|
|
|
|
|
} |
|
569
|
|
|
|
|
|
|
elsif ( # /usr/share/misc/magic |
|
570
|
|
|
|
|
|
|
$txt =~ m{\APK\003\004.{4,30}(?:\[Content_Types\]\.xml|_rels/\.rels)} |
|
571
|
|
|
|
|
|
|
) { |
|
572
|
0
|
0
|
|
|
|
0
|
$can{xlsx} or croak "XLSX parser not installed"; |
|
573
|
0
|
|
|
|
|
0
|
my $tmpfile; |
|
574
|
0
|
0
|
|
|
|
0
|
if ($can{ios}) { # Do not use a temp file if IO::Scalar is available |
|
575
|
0
|
|
|
|
|
0
|
$tmpfile = \$txt; |
|
576
|
|
|
|
|
|
|
} |
|
577
|
|
|
|
|
|
|
else { |
|
578
|
0
|
|
|
|
|
0
|
$tmpfile = File::Temp->new (SUFFIX => ".xlsx", UNLINK => 1); |
|
579
|
0
|
|
|
|
|
0
|
binmode $tmpfile; |
|
580
|
0
|
|
|
|
|
0
|
print $tmpfile $txt; |
|
581
|
0
|
|
|
|
|
0
|
close $tmpfile; |
|
582
|
|
|
|
|
|
|
} |
|
583
|
0
|
0
|
|
|
|
0
|
open $io_ref, "<", $tmpfile or do { $@ = $!; return }; |
|
|
0
|
|
|
|
|
0
|
|
|
|
0
|
|
|
|
|
0
|
|
|
584
|
0
|
|
|
|
|
0
|
$io_txt = 0; |
|
585
|
0
|
|
|
|
|
0
|
$_parser = _parser ($opt{parser} = "xlsx"); |
|
586
|
|
|
|
|
|
|
} |
|
587
|
|
|
|
|
|
|
elsif (!$io_ref && $txt =~ m/\.xlsx?$/i) { |
|
588
|
3
|
|
|
|
|
17
|
$@ = "Cannot open $txt as file"; |
|
589
|
3
|
|
|
|
|
50
|
return; |
|
590
|
|
|
|
|
|
|
} |
|
591
|
|
|
|
|
|
|
} |
|
592
|
151
|
100
|
66
|
|
|
1561
|
if ($opt{parser} ? $_parser =~ m/^xlsx?$/ |
|
|
|
100
|
|
|
|
|
|
|
593
|
|
|
|
|
|
|
: ($io_fil && $txt =~ m/\.(xlsx?)$/i && ($_parser = $1))) { |
|
594
|
75
|
100
|
|
|
|
388
|
my $parse_type = $_parser =~ m/x$/i ? "XLSX" : "XLS"; |
|
595
|
75
|
50
|
|
|
|
350
|
my $parser = $can{lc $parse_type} or |
|
596
|
|
|
|
|
|
|
croak "Parser for $parse_type is not installed"; |
|
597
|
|
|
|
|
|
|
$debug and print STDERR "Opening $parse_type ", $io_ref ? "<REF>" : $txt, |
|
598
|
75
|
50
|
|
|
|
390
|
" using $parser-", $can{lc $parse_type}->VERSION, "\n"; |
|
|
|
100
|
|
|
|
|
|
|
599
|
75
|
50
|
|
|
|
260
|
$opt{passwd} and $parser_opts{Password} = $opt{passwd}; |
|
600
|
75
|
|
|
|
|
265
|
my $oBook = eval { |
|
601
|
|
|
|
|
|
|
$io_ref |
|
602
|
|
|
|
|
|
|
? $parse_type eq "XLSX" |
|
603
|
|
|
|
|
|
|
? $can{xlsx} =~ m/::XLSX$/ |
|
604
|
|
|
|
|
|
|
? $parser->new ($io_ref) |
|
605
|
|
|
|
|
|
|
: $parser->new (%parser_opts)->parse ($io_ref) |
|
606
|
|
|
|
|
|
|
: $parser->new (%parser_opts)->Parse ($io_ref) |
|
607
|
|
|
|
|
|
|
: $parse_type eq "XLSX" |
|
608
|
75
|
0
|
|
|
|
991
|
? $can{xlsx} =~ m/::XLSX$/ |
|
|
|
50
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
609
|
|
|
|
|
|
|
? $parser->new ($txt) |
|
610
|
|
|
|
|
|
|
: $parser->new (%parser_opts)->parse ($txt) |
|
611
|
|
|
|
|
|
|
: $parser->new (%parser_opts)->Parse ($txt); |
|
612
|
|
|
|
|
|
|
}; |
|
613
|
75
|
50
|
|
|
|
2298301
|
unless ($oBook) { |
|
614
|
|
|
|
|
|
|
# cleanup will fail on folders with spaces. |
|
615
|
0
|
|
|
|
|
0
|
(my $msg = $@) =~ s/ at \S+ line \d+.*//s; |
|
616
|
0
|
|
|
|
|
0
|
croak "$parse_type parser cannot parse data: $msg"; |
|
617
|
|
|
|
|
|
|
} |
|
618
|
75
|
50
|
|
|
|
319
|
$debug > 8 and _dump (oBook => $oBook); |
|
619
|
|
|
|
|
|
|
|
|
620
|
|
|
|
|
|
|
# WorkBook keys: |
|
621
|
|
|
|
|
|
|
# aColor _CurSheet Format SheetCount |
|
622
|
|
|
|
|
|
|
# ActiveSheet _CurSheet_ FormatStr _skip_chart |
|
623
|
|
|
|
|
|
|
# Author File NotSetCell _string_contin |
|
624
|
|
|
|
|
|
|
# BIFFVersion Flg1904 Object Version |
|
625
|
|
|
|
|
|
|
# _buffer FmtClass PkgStr Worksheet |
|
626
|
|
|
|
|
|
|
# CellHandler Font _previous_info |
|
627
|
|
|
|
|
|
|
|
|
628
|
|
|
|
|
|
|
my @data = ( { |
|
629
|
|
|
|
|
|
|
type => lc $parse_type, |
|
630
|
|
|
|
|
|
|
parser => $can{lc $parse_type}, |
|
631
|
|
|
|
|
|
|
version => $can{lc $parse_type}->VERSION, |
|
632
|
|
|
|
|
|
|
parsers => [{ |
|
633
|
|
|
|
|
|
|
type => lc $parse_type, |
|
634
|
|
|
|
|
|
|
parser => $can{lc $parse_type}, |
|
635
|
|
|
|
|
|
|
version => $can{lc $parse_type}->VERSION, |
|
636
|
|
|
|
|
|
|
}], |
|
637
|
|
|
|
|
|
|
error => undef, |
|
638
|
75
|
|
50
|
|
|
3035
|
sheets => $oBook->{SheetCount} || 0, |
|
639
|
|
|
|
|
|
|
sheet => {}, |
|
640
|
|
|
|
|
|
|
} ); |
|
641
|
|
|
|
|
|
|
# $debug and $data[0]{_parser} = $oBook; |
|
642
|
|
|
|
|
|
|
# Overrule the default date format strings |
|
643
|
|
|
|
|
|
|
my %def_fmt = ( |
|
644
|
|
|
|
|
|
|
0x0E => lc $opt{dtfmt}, # m-d-yy |
|
645
|
75
|
|
|
|
|
718
|
0x0F => "d-mmm-yyyy", # d-mmm-yy |
|
646
|
|
|
|
|
|
|
0x11 => "mmm-yyyy", # mmm-yy |
|
647
|
|
|
|
|
|
|
0x16 => "yyyy-mm-dd hh:mm", # m-d-yy h:mm |
|
648
|
|
|
|
|
|
|
); |
|
649
|
75
|
|
|
|
|
627
|
$oBook->{FormatStr}{$_} = $def_fmt{$_} for keys %def_fmt; |
|
650
|
|
|
|
|
|
|
my $oFmt = $parse_type eq "XLSX" |
|
651
|
75
|
50
|
|
|
|
823
|
? $can{xlsx} =~ m/::XLSX$/ |
|
|
|
100
|
|
|
|
|
|
|
652
|
|
|
|
|
|
|
? Spreadsheet::XLSX::Fmt2007->new |
|
653
|
|
|
|
|
|
|
: Spreadsheet::ParseExcel::FmtDefault->new |
|
654
|
|
|
|
|
|
|
: Spreadsheet::ParseExcel::FmtDefault->new; |
|
655
|
|
|
|
|
|
|
|
|
656
|
75
|
100
|
|
|
|
904
|
$debug and print STDERR "\t$data[0]{sheets} sheets\n"; |
|
657
|
|
|
|
|
|
|
my $active_sheet = $oBook->get_active_sheet |
|
658
|
|
|
|
|
|
|
|| $oBook->{ActiveSheet} |
|
659
|
75
|
|
33
|
|
|
485
|
|| $oBook->{SelectedSheet}; |
|
660
|
75
|
|
|
|
|
999
|
my $current_sheet = 0; |
|
661
|
75
|
|
|
|
|
169
|
foreach my $oWkS (@{$oBook->{Worksheet}}) { |
|
|
75
|
|
|
|
|
264
|
|
|
662
|
121
|
|
|
|
|
291
|
$current_sheet++; |
|
663
|
121
|
100
|
100
|
|
|
682
|
$opt{clip} and !defined $oWkS->{Cells} and next; # Skip empty sheets |
|
664
|
|
|
|
|
|
|
my %sheet = ( |
|
665
|
|
|
|
|
|
|
parser => 0, |
|
666
|
|
|
|
|
|
|
label => $oWkS->{Name}, |
|
667
|
115
|
|
|
|
|
918
|
maxrow => 0, |
|
668
|
|
|
|
|
|
|
maxcol => 0, |
|
669
|
|
|
|
|
|
|
cell => [], |
|
670
|
|
|
|
|
|
|
attr => [], |
|
671
|
|
|
|
|
|
|
merged => [], |
|
672
|
|
|
|
|
|
|
active => 0, |
|
673
|
|
|
|
|
|
|
); |
|
674
|
|
|
|
|
|
|
# $debug and $sheet{_parser} = $oWkS; |
|
675
|
115
|
50
|
|
|
|
441
|
defined $sheet{label} or $sheet{label} = "-- unlabeled --"; |
|
676
|
115
|
100
|
|
|
|
435
|
exists $oWkS->{MinRow} and $sheet{minrow} = $oWkS->{MinRow} + 1; |
|
677
|
115
|
100
|
|
|
|
388
|
exists $oWkS->{MaxRow} and $sheet{maxrow} = $oWkS->{MaxRow} + 1; |
|
678
|
115
|
100
|
|
|
|
370
|
exists $oWkS->{MinCol} and $sheet{mincol} = $oWkS->{MinCol} + 1; |
|
679
|
115
|
100
|
|
|
|
348
|
exists $oWkS->{MaxCol} and $sheet{maxcol} = $oWkS->{MaxCol} + 1; |
|
680
|
|
|
|
|
|
|
$sheet{merged} = [ |
|
681
|
12
|
|
|
|
|
34
|
map { $_->[0] } |
|
682
|
4
|
|
|
|
|
21
|
sort { $a->[1] cmp $b->[1] } |
|
683
|
12
|
|
|
|
|
94
|
map {[ $_, pack "NNNN", @$_ ]} |
|
684
|
12
|
|
|
|
|
84
|
map {[ map { $_ + 1 } @{$_}[1,0,3,2] ]} |
|
|
48
|
|
|
|
|
109
|
|
|
|
12
|
|
|
|
|
41
|
|
|
685
|
115
|
100
|
|
|
|
261
|
@{$oWkS->get_merged_areas || []}]; |
|
|
115
|
|
|
|
|
516
|
|
|
686
|
115
|
|
|
|
|
1195
|
my $sheet_idx = 1 + @data; |
|
687
|
115
|
100
|
|
|
|
375
|
$debug and print STDERR "\tSheet $sheet_idx '$sheet{label}' $sheet{maxrow} x $sheet{maxcol}\n"; |
|
688
|
115
|
100
|
|
|
|
361
|
if (defined $active_sheet) { |
|
689
|
|
|
|
|
|
|
# _SheetNo is 0-based |
|
690
|
7
|
50
|
|
|
|
21
|
my $sheet_no = defined $oWkS->{_SheetNo} ? $oWkS->{_SheetNo} : $current_sheet - 1; |
|
691
|
7
|
100
|
|
|
|
31
|
$sheet_no eq $active_sheet and $sheet{active} = 1; |
|
692
|
|
|
|
|
|
|
} |
|
693
|
|
|
|
|
|
|
# Sheet keys: |
|
694
|
|
|
|
|
|
|
# _Book FooterMargin MinCol RightMargin |
|
695
|
|
|
|
|
|
|
# BottomMargin FooterMergin MinRow RightMergin |
|
696
|
|
|
|
|
|
|
# BottomMergin HCenter Name RowHeight |
|
697
|
|
|
|
|
|
|
# Cells Header NoColor RowHidden |
|
698
|
|
|
|
|
|
|
# ColFmtNo HeaderMargin NoOrient Scale |
|
699
|
|
|
|
|
|
|
# ColHidden HeaderMergin NoPls SheetHidden |
|
700
|
|
|
|
|
|
|
# ColWidth Kind Notes _SheetNo |
|
701
|
|
|
|
|
|
|
# Copis Landscape PageFit SheetType |
|
702
|
|
|
|
|
|
|
# DefColWidth LeftMargin PageStart SheetVersion |
|
703
|
|
|
|
|
|
|
# DefRowHeight LeftMergin PaperSize TopMargin |
|
704
|
|
|
|
|
|
|
# Draft LeftToRight _Pos TopMergin |
|
705
|
|
|
|
|
|
|
# FitHeight MaxCol PrintGrid UsePage |
|
706
|
|
|
|
|
|
|
# FitWidth MaxRow PrintHeaders VCenter |
|
707
|
|
|
|
|
|
|
# Footer MergedArea Res VRes |
|
708
|
115
|
100
|
|
|
|
341
|
if (exists $oWkS->{MinRow}) { |
|
709
|
110
|
|
50
|
|
|
477
|
my $hiddenRows = $oWkS->{RowHidden} || []; |
|
710
|
110
|
|
50
|
|
|
463
|
my $hiddenCols = $oWkS->{ColHidden} || []; |
|
711
|
110
|
100
|
|
|
|
314
|
if ($opt{clip}) { |
|
712
|
91
|
|
|
|
|
242
|
my ($mr, $mc) = (-1, -1); |
|
713
|
91
|
|
|
|
|
355
|
foreach my $r ($oWkS->{MinRow} .. $sheet{maxrow}) { |
|
714
|
516
|
|
|
|
|
949
|
foreach my $c ($oWkS->{MinCol} .. $sheet{maxcol}) { |
|
715
|
2908
|
100
|
|
|
|
5626
|
my $oWkC = $oWkS->{Cells}[$r][$c] or next; |
|
716
|
1701
|
50
|
|
|
|
3285
|
defined (my $val = $oWkC->{Val}) or next; |
|
717
|
1701
|
100
|
|
|
|
3180
|
$val eq "" and next; |
|
718
|
1679
|
100
|
|
|
|
2734
|
$r > $mr and $mr = $r; |
|
719
|
1679
|
100
|
|
|
|
2999
|
$c > $mc and $mc = $c; |
|
720
|
|
|
|
|
|
|
} |
|
721
|
|
|
|
|
|
|
} |
|
722
|
91
|
|
|
|
|
350
|
($sheet{maxrow}, $sheet{maxcol}) = ($mr + 1, $mc + 1); |
|
723
|
|
|
|
|
|
|
} |
|
724
|
110
|
|
|
|
|
352
|
foreach my $r ($oWkS->{MinRow} .. $sheet{maxrow}) { |
|
725
|
597
|
|
|
|
|
1280
|
foreach my $c ($oWkS->{MinCol} .. $sheet{maxcol}) { |
|
726
|
3132
|
100
|
|
|
|
12249
|
my $oWkC = $oWkS->{Cells}[$r][$c] or next; |
|
727
|
|
|
|
|
|
|
#defined (my $val = $oWkC->{Val}) or next; |
|
728
|
1802
|
|
|
|
|
2951
|
my $val = $oWkC->{Val}; |
|
729
|
1802
|
50
|
33
|
|
|
6154
|
if (defined $val and my $enc = $oWkC->{Code}) { |
|
730
|
0
|
0
|
|
|
|
0
|
$enc eq "ucs2" and $val = decode ("utf-16be", $val); |
|
731
|
|
|
|
|
|
|
} |
|
732
|
1802
|
|
|
|
|
4147
|
my $cell = cr2cell ($c + 1, $r + 1); |
|
733
|
1802
|
100
|
|
|
|
5604
|
$opt{rc} and $sheet{cell}[$c + 1][$r + 1] = $val; # Original |
|
734
|
|
|
|
|
|
|
|
|
735
|
1802
|
|
|
|
|
2466
|
my $fmt; |
|
736
|
1802
|
|
|
|
|
2652
|
my $FmT = $oWkC->{Format}; |
|
737
|
1802
|
100
|
|
|
|
3375
|
if ($FmT) { |
|
738
|
952
|
100
|
|
|
|
1928
|
unless (ref $FmT) { |
|
739
|
130
|
|
|
|
|
171
|
$fmt = $FmT; |
|
740
|
130
|
|
|
|
|
222
|
$FmT = {}; |
|
741
|
|
|
|
|
|
|
} |
|
742
|
|
|
|
|
|
|
} |
|
743
|
|
|
|
|
|
|
else { |
|
744
|
850
|
|
|
|
|
1395
|
$FmT = {}; |
|
745
|
|
|
|
|
|
|
} |
|
746
|
1802
|
|
|
|
|
3572
|
foreach my $attr (qw( AlignH AlignV FmtIdx Hidden Lock |
|
747
|
|
|
|
|
|
|
Wrap )) { |
|
748
|
10812
|
100
|
|
|
|
21191
|
exists $FmT->{$attr} or $FmT->{$attr} = 0; |
|
749
|
|
|
|
|
|
|
} |
|
750
|
1802
|
100
|
|
|
|
3758
|
exists $FmT->{Fill} or $FmT->{Fill} = [ 0 ]; |
|
751
|
1802
|
100
|
|
|
|
4029
|
exists $FmT->{Font} or $FmT->{Font} = undef; |
|
752
|
|
|
|
|
|
|
|
|
753
|
1802
|
100
|
|
|
|
3403
|
unless (defined $fmt) { |
|
754
|
|
|
|
|
|
|
$fmt = $FmT->{FmtIdx} |
|
755
|
|
|
|
|
|
|
? $oBook->{FormatStr}{$FmT->{FmtIdx}} |
|
756
|
1672
|
100
|
|
|
|
3215
|
: undef; |
|
757
|
|
|
|
|
|
|
} |
|
758
|
1802
|
100
|
|
|
|
3465
|
if ($oWkC->{Type} eq "Numeric") { |
|
759
|
|
|
|
|
|
|
# Fixed in 0.33 and up |
|
760
|
|
|
|
|
|
|
# see Spreadsheet/ParseExcel/FmtDefault.pm |
|
761
|
|
|
|
|
|
|
$FmT->{FmtIdx} == 0x0e || |
|
762
|
|
|
|
|
|
|
$FmT->{FmtIdx} == 0x0f || |
|
763
|
|
|
|
|
|
|
$FmT->{FmtIdx} == 0x10 || |
|
764
|
|
|
|
|
|
|
$FmT->{FmtIdx} == 0x11 || |
|
765
|
|
|
|
|
|
|
$FmT->{FmtIdx} == 0x16 || |
|
766
|
|
|
|
|
|
|
(defined $fmt && $fmt =~ m{^[dmy][-\\/dmy]*$}) and |
|
767
|
370
|
100
|
33
|
|
|
3315
|
$oWkC->{Type} = "Date"; |
|
|
|
|
33
|
|
|
|
|
|
|
|
|
33
|
|
|
|
|
|
|
|
|
33
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
|
|
66
|
|
|
|
|
|
768
|
|
|
|
|
|
|
$FmT->{FmtIdx} == 0x09 || |
|
769
|
|
|
|
|
|
|
$FmT->{FmtIdx} == 0x0a || |
|
770
|
|
|
|
|
|
|
(defined $fmt && $fmt =~ m{^0+\.0+%$}) and |
|
771
|
370
|
100
|
100
|
|
|
2129
|
$oWkC->{Type} = "Percentage"; |
|
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
772
|
|
|
|
|
|
|
} |
|
773
|
1802
|
100
|
|
|
|
3451
|
defined $fmt and $fmt =~ s/\\//g; |
|
774
|
|
|
|
|
|
|
$opt{cells} and # Formatted value |
|
775
|
|
|
|
|
|
|
$sheet{$cell} = defined $val ? $FmT && exists $def_fmt{$FmT->{FmtIdx}} |
|
776
|
1802
|
100
|
66
|
|
|
9920
|
? $oFmt->ValFmt ($oWkC, $oBook) |
|
|
|
50
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
777
|
|
|
|
|
|
|
: $oWkC->Value : undef; |
|
778
|
1802
|
100
|
|
|
|
15284
|
if ($opt{attr}) { |
|
779
|
1526
|
|
|
|
|
2303
|
my $FnT = $FmT->{Font}; |
|
780
|
|
|
|
|
|
|
my $fmi = $FmT->{FmtIdx} |
|
781
|
|
|
|
|
|
|
? $oBook->{FormatStr}{$FmT->{FmtIdx}} |
|
782
|
1526
|
100
|
|
|
|
2672
|
: undef; |
|
783
|
1526
|
100
|
|
|
|
2611
|
$fmi and $fmi =~ s/\\//g; |
|
784
|
|
|
|
|
|
|
$sheet{attr}[$c + 1][$r + 1] = { |
|
785
|
|
|
|
|
|
|
@def_attr, |
|
786
|
|
|
|
|
|
|
|
|
787
|
|
|
|
|
|
|
type => lc $oWkC->{Type}, |
|
788
|
|
|
|
|
|
|
enc => $oWkC->{Code}, |
|
789
|
|
|
|
|
|
|
merged => (defined $oWkC->{Merged} ? $oWkC->{Merged} : $oWkC->is_merged) || 0, |
|
790
|
|
|
|
|
|
|
hidden => ($hiddenRows->[$r] || $hiddenCols->[$c] ? 1 : |
|
791
|
|
|
|
|
|
|
defined $oWkC->{Hidden} ? $oWkC->{Hidden} : $FmT->{Hidden}) || 0, |
|
792
|
|
|
|
|
|
|
locked => $FmT->{Lock} || 0, |
|
793
|
|
|
|
|
|
|
format => $fmi, |
|
794
|
|
|
|
|
|
|
halign => [ undef, qw( left center right |
|
795
|
|
|
|
|
|
|
fill justify ), undef, |
|
796
|
|
|
|
|
|
|
"equal_space" ]->[$FmT->{AlignH}], |
|
797
|
|
|
|
|
|
|
valign => [ qw( top center bottom justify |
|
798
|
|
|
|
|
|
|
equal_space )]->[$FmT->{AlignV}], |
|
799
|
|
|
|
|
|
|
wrap => $FmT->{Wrap}, |
|
800
|
|
|
|
|
|
|
font => $FnT->{Name}, |
|
801
|
|
|
|
|
|
|
size => $FnT->{Height}, |
|
802
|
|
|
|
|
|
|
bold => $FnT->{Bold}, |
|
803
|
|
|
|
|
|
|
italic => $FnT->{Italic}, |
|
804
|
|
|
|
|
|
|
uline => $FnT->{Underline}, |
|
805
|
|
|
|
|
|
|
fgcolor => _xls_color ($FnT->{Color}), |
|
806
|
1526
|
|
|
|
|
6194
|
bgcolor => _xls_fill (@{$FmT->{Fill}}), |
|
807
|
|
|
|
|
|
|
formula => $oWkC->{Formula}, |
|
808
|
1526
|
|
100
|
|
|
4888
|
}; |
|
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
809
|
|
|
|
|
|
|
#_dump "cell", $sheet{attr}[$c + 1][$r + 1]; |
|
810
|
|
|
|
|
|
|
} |
|
811
|
|
|
|
|
|
|
} |
|
812
|
|
|
|
|
|
|
} |
|
813
|
|
|
|
|
|
|
} |
|
814
|
115
|
|
|
|
|
206
|
for (@{$sheet{cell}}) { |
|
|
115
|
|
|
|
|
380
|
|
|
815
|
409
|
100
|
|
|
|
1068
|
defined or $_ = []; |
|
816
|
|
|
|
|
|
|
} |
|
817
|
115
|
|
|
|
|
2012
|
push @data, { %sheet }; |
|
818
|
|
|
|
|
|
|
# $data[0]{sheets}++; |
|
819
|
115
|
50
|
|
|
|
614
|
if ($sheet{label} eq "-- unlabeled --") { |
|
820
|
0
|
|
|
|
|
0
|
$sheet{label} = ""; |
|
821
|
|
|
|
|
|
|
} |
|
822
|
|
|
|
|
|
|
else { |
|
823
|
115
|
|
|
|
|
783
|
$data[0]{sheet}{$sheet{label}} = $#data; |
|
824
|
|
|
|
|
|
|
} |
|
825
|
|
|
|
|
|
|
} |
|
826
|
75
|
|
|
|
|
497
|
return _clipsheets \%opt, [ @data ]; |
|
827
|
|
|
|
|
|
|
} |
|
828
|
|
|
|
|
|
|
|
|
829
|
76
|
100
|
|
|
|
430
|
if ($opt{parser} ? _parser ($opt{parser}) eq "sc" |
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
830
|
|
|
|
|
|
|
: $io_fil |
|
831
|
|
|
|
|
|
|
? $txt =~ m/\.sc$/ |
|
832
|
|
|
|
|
|
|
: $txt =~ m/^# .*SquirrelCalc/) { |
|
833
|
46
|
100
|
|
|
|
129
|
if ($io_ref) { |
|
|
|
100
|
|
|
|
|
|
|
834
|
2
|
|
|
|
|
9
|
local $/; |
|
835
|
2
|
|
|
|
|
56
|
my $x = <$txt>; |
|
836
|
2
|
|
|
|
|
12
|
$txt = $x; |
|
837
|
|
|
|
|
|
|
} |
|
838
|
|
|
|
|
|
|
elsif ($io_fil) { |
|
839
|
42
|
|
|
|
|
171
|
local $/; |
|
840
|
42
|
50
|
|
|
|
1606
|
open my $sc, "<", $txt or return; |
|
841
|
42
|
|
|
|
|
1836
|
$txt = <$sc>; |
|
842
|
42
|
|
|
|
|
702
|
close $sc; |
|
843
|
|
|
|
|
|
|
} |
|
844
|
46
|
50
|
|
|
|
302
|
$txt =~ m/\S/ or return; |
|
845
|
46
|
50
|
|
|
|
170
|
my $label = defined $opt{label} ? $opt{label} : "sheet"; |
|
846
|
46
|
|
|
|
|
646
|
my @data = ( |
|
847
|
|
|
|
|
|
|
{ type => "sc", |
|
848
|
|
|
|
|
|
|
parser => "Spreadsheet::Read", |
|
849
|
|
|
|
|
|
|
version => $VERSION, |
|
850
|
|
|
|
|
|
|
parsers => [{ |
|
851
|
|
|
|
|
|
|
type => "sc", |
|
852
|
|
|
|
|
|
|
parser => "Spreadsheet::Read", |
|
853
|
|
|
|
|
|
|
version => $VERSION, |
|
854
|
|
|
|
|
|
|
}], |
|
855
|
|
|
|
|
|
|
error => undef, |
|
856
|
|
|
|
|
|
|
sheets => 1, |
|
857
|
|
|
|
|
|
|
sheet => { $label => 1 }, |
|
858
|
|
|
|
|
|
|
}, |
|
859
|
|
|
|
|
|
|
{ parser => 0, |
|
860
|
|
|
|
|
|
|
label => $label, |
|
861
|
|
|
|
|
|
|
maxrow => 0, |
|
862
|
|
|
|
|
|
|
maxcol => 0, |
|
863
|
|
|
|
|
|
|
cell => [], |
|
864
|
|
|
|
|
|
|
attr => [], |
|
865
|
|
|
|
|
|
|
merged => [], |
|
866
|
|
|
|
|
|
|
active => 1, |
|
867
|
|
|
|
|
|
|
}, |
|
868
|
|
|
|
|
|
|
); |
|
869
|
|
|
|
|
|
|
|
|
870
|
46
|
|
|
|
|
9715
|
for (split m/\s*[\r\n]\s*/, $txt) { |
|
871
|
13478
|
100
|
|
|
|
22369
|
if (m/^dimension.*of ([0-9]+) rows.*of ([0-9]+) columns/i) { |
|
872
|
46
|
|
|
|
|
89
|
@{$data[1]}{qw(maxrow maxcol)} = ($1, $2); |
|
|
46
|
|
|
|
|
274
|
|
|
873
|
46
|
|
|
|
|
99
|
next; |
|
874
|
|
|
|
|
|
|
} |
|
875
|
13432
|
100
|
|
|
|
33232
|
s/^r([0-9]+)c([0-9]+)\s*=\s*// or next; |
|
876
|
3542
|
|
|
|
|
6147
|
my ($c, $r) = map { $_ + 1 } $2, $1; |
|
|
7084
|
|
|
|
|
15254
|
|
|
877
|
3542
|
100
|
66
|
|
|
15837
|
if (m/.* \{(.*)}$/ or m/"(.*)"/) { |
|
878
|
2714
|
|
|
|
|
5250
|
my $cell = cr2cell ($c, $r); |
|
879
|
2714
|
100
|
|
|
|
8551
|
$opt{rc} and $data[1]{cell}[$c][$r] = $1; |
|
880
|
2714
|
50
|
|
|
|
7580
|
$opt{cells} and $data[1]{$cell} = $1; |
|
881
|
2714
|
100
|
|
|
|
6438
|
$opt{attr} and $data[1]{attr}[$c + 1][$r] = { @def_attr }; |
|
882
|
2714
|
|
|
|
|
4661
|
next; |
|
883
|
|
|
|
|
|
|
} |
|
884
|
|
|
|
|
|
|
# Now only formula's remain. Ignore for now |
|
885
|
|
|
|
|
|
|
# r67c7 = [P2L] 2*(1000*r67c5-60) |
|
886
|
|
|
|
|
|
|
} |
|
887
|
46
|
|
|
|
|
795
|
for (@{$data[1]{cell}}) { |
|
|
46
|
|
|
|
|
167
|
|
|
888
|
360
|
100
|
|
|
|
756
|
defined or $_ = []; |
|
889
|
|
|
|
|
|
|
} |
|
890
|
46
|
|
|
|
|
172
|
return _clipsheets \%opt, [ @data ]; |
|
891
|
|
|
|
|
|
|
} |
|
892
|
|
|
|
|
|
|
|
|
893
|
30
|
50
|
66
|
|
|
364
|
if ($opt{parser} ? _parser ($opt{parser}) eq "sxc" |
|
|
|
100
|
|
|
|
|
|
|
894
|
|
|
|
|
|
|
: ($txt =~ m/^<\?xml/ or -f $txt)) { |
|
895
|
7
|
50
|
|
|
|
996
|
$can{sxc} or croak "Spreadsheet::ReadSXC not installed"; |
|
896
|
0
|
0
|
|
|
|
0
|
ref $txt and |
|
897
|
|
|
|
|
|
|
croak ("Sorry, references as input are not (yet) supported by Spreadsheet::ReadSXC"); |
|
898
|
|
|
|
|
|
|
|
|
899
|
0
|
|
|
|
|
0
|
my $using = "using $can{sxc}-" . $can{sxc}->VERSION; |
|
900
|
0
|
|
|
|
|
0
|
my $sxc_options = { %parser_opts, OrderBySheet => 1 }; # New interface 0.20 and up |
|
901
|
0
|
|
|
|
|
0
|
my $sxc; |
|
902
|
0
|
0
|
0
|
|
|
0
|
if ($txt =~ m/\.(sxc|ods)$/i) { |
|
|
|
0
|
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
903
|
0
|
0
|
|
|
|
0
|
$debug and print STDERR "Opening \U$1\E $txt $using\n"; |
|
904
|
0
|
0
|
|
|
|
0
|
$sxc = Spreadsheet::ReadSXC::read_sxc ($txt, $sxc_options) or return; |
|
905
|
|
|
|
|
|
|
} |
|
906
|
|
|
|
|
|
|
elsif ($txt =~ m/\.xml$/i) { |
|
907
|
0
|
0
|
|
|
|
0
|
$debug and print STDERR "Opening XML $txt $using\n"; |
|
908
|
0
|
0
|
|
|
|
0
|
$sxc = Spreadsheet::ReadSXC::read_xml_file ($txt, $sxc_options) or return; |
|
909
|
|
|
|
|
|
|
} |
|
910
|
|
|
|
|
|
|
# need to test on pattern to prevent stat warning |
|
911
|
|
|
|
|
|
|
# on filename with newline |
|
912
|
|
|
|
|
|
|
elsif ($txt !~ m/^<\?xml/i and -f $txt) { |
|
913
|
0
|
0
|
|
|
|
0
|
$debug and print STDERR "Opening XML $txt $using\n"; |
|
914
|
0
|
0
|
|
|
|
0
|
open my $f, "<", $txt or return; |
|
915
|
0
|
|
|
|
|
0
|
local $/; |
|
916
|
0
|
|
|
|
|
0
|
$txt = <$f>; |
|
917
|
0
|
|
|
|
|
0
|
close $f; |
|
918
|
|
|
|
|
|
|
} |
|
919
|
0
|
0
|
0
|
|
|
0
|
!$sxc && $txt =~ m/^<\?xml/i and |
|
920
|
|
|
|
|
|
|
$sxc = Spreadsheet::ReadSXC::read_xml_string ($txt, $sxc_options); |
|
921
|
0
|
0
|
|
|
|
0
|
$debug > 8 and _dump (sxc => $sxc); |
|
922
|
0
|
0
|
|
|
|
0
|
if ($sxc) { |
|
923
|
0
|
|
|
|
|
0
|
my @data = ( { |
|
924
|
|
|
|
|
|
|
type => "sxc", |
|
925
|
|
|
|
|
|
|
parser => "Spreadsheet::ReadSXC", |
|
926
|
|
|
|
|
|
|
version => $Spreadsheet::ReadSXC::VERSION, |
|
927
|
|
|
|
|
|
|
parsers => [{ |
|
928
|
|
|
|
|
|
|
type => "sxc", |
|
929
|
|
|
|
|
|
|
parser => "Spreadsheet::ReadSXC", |
|
930
|
|
|
|
|
|
|
version => $Spreadsheet::ReadSXC::VERSION, |
|
931
|
|
|
|
|
|
|
}], |
|
932
|
|
|
|
|
|
|
error => undef, |
|
933
|
|
|
|
|
|
|
sheets => 0, |
|
934
|
|
|
|
|
|
|
sheet => {}, |
|
935
|
|
|
|
|
|
|
} ); |
|
936
|
|
|
|
|
|
|
my @sheets = ref $sxc eq "HASH" # < 0.20 |
|
937
|
|
|
|
|
|
|
? map { |
|
938
|
|
|
|
|
|
|
{ label => $_, |
|
939
|
0
|
|
|
|
|
0
|
data => $sxc->{$_}, |
|
940
|
|
|
|
|
|
|
} |
|
941
|
|
|
|
|
|
|
} keys %$sxc |
|
942
|
0
|
0
|
|
|
|
0
|
: @{$sxc}; |
|
|
0
|
|
|
|
|
0
|
|
|
943
|
0
|
|
|
|
|
0
|
foreach my $sheet (@sheets) { |
|
944
|
0
|
|
|
|
|
0
|
my @sheet = @{$sheet->{data}}; |
|
|
0
|
|
|
|
|
0
|
|
|
945
|
|
|
|
|
|
|
my %sheet = ( |
|
946
|
|
|
|
|
|
|
parser => 0, |
|
947
|
|
|
|
|
|
|
label => $sheet->{label}, |
|
948
|
0
|
|
|
|
|
0
|
maxrow => scalar @sheet, |
|
949
|
|
|
|
|
|
|
maxcol => 0, |
|
950
|
|
|
|
|
|
|
cell => [], |
|
951
|
|
|
|
|
|
|
attr => [], |
|
952
|
|
|
|
|
|
|
merged => [], |
|
953
|
|
|
|
|
|
|
active => 0, |
|
954
|
|
|
|
|
|
|
); |
|
955
|
0
|
|
|
|
|
0
|
my $sheet_idx = 1 + @data; |
|
956
|
0
|
0
|
|
|
|
0
|
$debug and print STDERR "\tSheet $sheet_idx '$sheet{label}' $sheet{maxrow} rows\n"; |
|
957
|
0
|
|
|
|
|
0
|
foreach my $r (0 .. $#sheet) { |
|
958
|
0
|
0
|
|
|
|
0
|
my @row = @{$sheet[$r]} or next; |
|
|
0
|
|
|
|
|
0
|
|
|
959
|
0
|
|
|
|
|
0
|
foreach my $c (0 .. $#row) { |
|
960
|
0
|
0
|
|
|
|
0
|
defined (my $val = $row[$c]) or next; |
|
961
|
0
|
|
|
|
|
0
|
my $C = $c + 1; |
|
962
|
0
|
0
|
|
|
|
0
|
$C > $sheet{maxcol} and $sheet{maxcol} = $C; |
|
963
|
0
|
|
|
|
|
0
|
my $cell = cr2cell ($C, $r + 1); |
|
964
|
0
|
0
|
|
|
|
0
|
$opt{rc} and $sheet{cell}[$C][$r + 1] = $val; |
|
965
|
0
|
0
|
|
|
|
0
|
$opt{cells} and $sheet{$cell} = $val; |
|
966
|
0
|
0
|
|
|
|
0
|
$opt{attr} and $sheet{attr}[$C][$r + 1] = { @def_attr }; |
|
967
|
|
|
|
|
|
|
} |
|
968
|
|
|
|
|
|
|
} |
|
969
|
0
|
|
|
|
|
0
|
for (@{$sheet{cell}}) { |
|
|
0
|
|
|
|
|
0
|
|
|
970
|
0
|
0
|
|
|
|
0
|
defined or $_ = []; |
|
971
|
|
|
|
|
|
|
} |
|
972
|
0
|
0
|
|
|
|
0
|
$debug and print STDERR "\tSheet $sheet_idx '$sheet{label}' $sheet{maxrow} x $sheet{maxcol}\n"; |
|
973
|
0
|
|
|
|
|
0
|
push @data, { %sheet }; |
|
974
|
0
|
|
|
|
|
0
|
$data[0]{sheets}++; |
|
975
|
0
|
|
|
|
|
0
|
$data[0]{sheet}{$sheet->{label}} = $#data; |
|
976
|
|
|
|
|
|
|
} |
|
977
|
0
|
|
|
|
|
0
|
return _clipsheets \%opt, [ @data ]; |
|
978
|
|
|
|
|
|
|
} |
|
979
|
|
|
|
|
|
|
} |
|
980
|
|
|
|
|
|
|
|
|
981
|
23
|
100
|
100
|
|
|
138
|
if (!ref $txt and $txt =~ m/\.\w+$/) { |
|
982
|
|
|
|
|
|
|
# Return (localized) system message |
|
983
|
5
|
50
|
|
|
|
120
|
open my $fh, "<", $txt and |
|
984
|
|
|
|
|
|
|
croak "I can open file $txt, but I do not know how to parse it\n"; |
|
985
|
|
|
|
|
|
|
|
|
986
|
5
|
|
|
|
|
91
|
$@ = $!; |
|
987
|
|
|
|
|
|
|
} |
|
988
|
|
|
|
|
|
|
|
|
989
|
23
|
|
|
|
|
127
|
return; |
|
990
|
|
|
|
|
|
|
} # ReadData |
|
991
|
|
|
|
|
|
|
|
|
992
|
|
|
|
|
|
|
sub add { |
|
993
|
2
|
|
|
2
|
1
|
7
|
my $book = shift; |
|
994
|
2
|
50
|
|
|
|
9
|
my $r = ReadData (@_) or return; |
|
995
|
|
|
|
|
|
|
$book && (ref $book eq "ARRAY" || |
|
996
|
2
|
50
|
33
|
|
|
37
|
ref $book eq __PACKAGE__) && $book->[0]{sheets} or return $r; |
|
|
|
|
33
|
|
|
|
|
|
|
|
|
33
|
|
|
|
|
|
997
|
|
|
|
|
|
|
|
|
998
|
2
|
|
|
|
|
5
|
my $c1 = $book->[0]; |
|
999
|
2
|
|
|
|
|
5
|
my $c2 = $r->[0]; |
|
1000
|
|
|
|
|
|
|
|
|
1001
|
2
|
50
|
|
|
|
9
|
unless ($c1->{parsers}) { |
|
1002
|
0
|
|
|
|
|
0
|
$c1->{parsers}[0]{$_} = $c1->{$_} for qw( type parser version ); |
|
1003
|
0
|
|
|
|
|
0
|
$book->[$_]{parser} = 0 for 1 .. $c1->{sheets}; |
|
1004
|
|
|
|
|
|
|
} |
|
1005
|
2
|
|
|
|
|
8
|
my ($pidx) = (grep { my $p = $c1->{parsers}[$_]; |
|
1006
|
|
|
|
|
|
|
$p->{type} eq $c2->{type} && |
|
1007
|
|
|
|
|
|
|
$p->{parser} eq $c2->{parser} && |
|
1008
|
2
|
50
|
33
|
|
|
5
|
$p->{version} eq $c2->{version} } 0 .. $#{$c1->{parsers}}); |
|
|
2
|
|
|
|
|
77
|
|
|
|
2
|
|
|
|
|
7
|
|
|
1009
|
2
|
50
|
|
|
|
9
|
unless (defined $pidx) { |
|
1010
|
0
|
|
|
|
|
0
|
$pidx = scalar @{$c1->{parsers}}; |
|
|
0
|
|
|
|
|
0
|
|
|
1011
|
0
|
|
|
|
|
0
|
$c1->{parsers}[$pidx]{$_} = $c2->{$_} for qw( type parser version ); |
|
1012
|
|
|
|
|
|
|
} |
|
1013
|
|
|
|
|
|
|
|
|
1014
|
2
|
|
|
|
|
7
|
foreach my $sn (sort { $c2->{sheet}{$a} <=> $c2->{sheet}{$b} } keys %{$c2->{sheet}}) { |
|
|
0
|
|
|
|
|
0
|
|
|
|
2
|
|
|
|
|
14
|
|
|
1015
|
2
|
|
|
|
|
5
|
my $s = $sn; |
|
1016
|
2
|
|
|
|
|
4
|
my $v = 2; |
|
1017
|
2
|
|
|
|
|
9
|
while (exists $c1->{sheet}{$s}) { |
|
1018
|
1
|
|
|
|
|
7
|
$s = $sn."[".$v++."]"; |
|
1019
|
|
|
|
|
|
|
} |
|
1020
|
2
|
|
|
|
|
18
|
$c1->{sheet}{$s} = $c1->{sheets} + $c2->{sheet}{$sn}; |
|
1021
|
2
|
|
|
|
|
11
|
$r->[$c2->{sheet}{$sn}]{parser} = $pidx; |
|
1022
|
2
|
|
|
|
|
9
|
push @$book, $r->[$c2->{sheet}{$sn}]; |
|
1023
|
|
|
|
|
|
|
} |
|
1024
|
2
|
|
|
|
|
5
|
$c1->{sheets} += $c2->{sheets}; |
|
1025
|
|
|
|
|
|
|
|
|
1026
|
2
|
|
|
|
|
19
|
return $book; |
|
1027
|
|
|
|
|
|
|
} # add |
|
1028
|
|
|
|
|
|
|
|
|
1029
|
|
|
|
|
|
|
package Spreadsheet::Read::Attribute; |
|
1030
|
|
|
|
|
|
|
|
|
1031
|
53
|
|
|
53
|
|
614
|
use Carp; |
|
|
53
|
|
|
|
|
194
|
|
|
|
53
|
|
|
|
|
4624
|
|
|
1032
|
53
|
|
|
53
|
|
472
|
use vars qw( $AUTOLOAD ); |
|
|
53
|
|
|
|
|
128
|
|
|
|
53
|
|
|
|
|
64261
|
|
|
1033
|
|
|
|
|
|
|
|
|
1034
|
|
|
|
|
|
|
sub AUTOLOAD { |
|
1035
|
6
|
|
|
6
|
|
788
|
my $self = shift; |
|
1036
|
6
|
|
|
|
|
42
|
(my $attr = $AUTOLOAD) =~ s/.*:://; |
|
1037
|
6
|
|
|
|
|
249
|
$self->{$attr}; |
|
1038
|
|
|
|
|
|
|
} # AUTOLOAD |
|
1039
|
|
|
|
|
|
|
|
|
1040
|
|
|
|
|
|
|
package Spreadsheet::Read::Sheet; |
|
1041
|
|
|
|
|
|
|
|
|
1042
|
|
|
|
|
|
|
sub cell { |
|
1043
|
55
|
|
|
55
|
|
17964
|
my ($sheet, @id) = @_; |
|
1044
|
|
|
|
|
|
|
@id == 2 && $id[0] =~ m/^[0-9]+$/ && $id[1] =~ m/^[0-9]+$/ and |
|
1045
|
55
|
50
|
66
|
|
|
542
|
return $sheet->{cell}[$id[0]][$id[1]]; |
|
|
|
|
66
|
|
|
|
|
|
1046
|
|
|
|
|
|
|
@id && $id[0] && exists $sheet->{$id[0]} and |
|
1047
|
27
|
50
|
33
|
|
|
296
|
return $sheet->{$id[0]}; |
|
|
|
|
33
|
|
|
|
|
|
1048
|
|
|
|
|
|
|
} # cell |
|
1049
|
|
|
|
|
|
|
|
|
1050
|
|
|
|
|
|
|
sub attr { |
|
1051
|
8
|
|
|
8
|
|
23
|
my ($sheet, @id) = @_; |
|
1052
|
8
|
|
|
|
|
15
|
my $class = "Spreadsheet::Read::Attribute"; |
|
1053
|
|
|
|
|
|
|
@id == 2 && $id[0] =~ m/^[0-9]+$/ && $id[1] =~ m/^[0-9]+$/ and |
|
1054
|
8
|
50
|
66
|
|
|
70
|
return bless $sheet->{attr}[$id[0]][$id[1]] => $class; |
|
|
|
|
66
|
|
|
|
|
|
1055
|
5
|
50
|
33
|
|
|
34
|
if (@id && $id[0] && exists $sheet->{$id[0]}) { |
|
|
|
|
33
|
|
|
|
|
|
1056
|
5
|
|
|
|
|
17
|
my ($c, $r) = $sheet->cell2cr ($id[0]); |
|
1057
|
5
|
|
|
|
|
54
|
return bless $sheet->{attr}[$c][$r] => $class; |
|
1058
|
|
|
|
|
|
|
} |
|
1059
|
0
|
|
|
|
|
0
|
undef; |
|
1060
|
|
|
|
|
|
|
} # attr |
|
1061
|
|
|
|
|
|
|
|
|
1062
|
|
|
|
|
|
|
sub maxrow { |
|
1063
|
2
|
|
|
2
|
|
5
|
my $sheet = shift; |
|
1064
|
2
|
|
|
|
|
9
|
return $sheet->{maxrow}; |
|
1065
|
|
|
|
|
|
|
} # maxrow |
|
1066
|
|
|
|
|
|
|
|
|
1067
|
|
|
|
|
|
|
sub maxcol { |
|
1068
|
2
|
|
|
2
|
|
5
|
my $sheet = shift; |
|
1069
|
2
|
|
|
|
|
8
|
return $sheet->{maxcol}; |
|
1070
|
|
|
|
|
|
|
} # maxrow |
|
1071
|
|
|
|
|
|
|
|
|
1072
|
|
|
|
|
|
|
sub col2label { |
|
1073
|
1
|
50
|
|
1
|
|
9
|
$_[0] =~ m/::/ and shift; # class unused |
|
1074
|
1
|
|
|
|
|
22
|
return Spreadsheet::Read::col2label (@_); |
|
1075
|
|
|
|
|
|
|
} # col2label |
|
1076
|
|
|
|
|
|
|
|
|
1077
|
|
|
|
|
|
|
sub cr2cell { |
|
1078
|
24
|
50
|
|
24
|
|
90
|
$_[0] =~ m/::/ and shift; # class unused |
|
1079
|
24
|
|
|
|
|
89
|
return Spreadsheet::Read::cr2cell (@_); |
|
1080
|
|
|
|
|
|
|
} # cr2cell |
|
1081
|
|
|
|
|
|
|
|
|
1082
|
|
|
|
|
|
|
sub cell2cr { |
|
1083
|
21
|
50
|
|
21
|
|
11124
|
$_[0] =~ m/::/ and shift; # class unused |
|
1084
|
21
|
|
|
|
|
64
|
return Spreadsheet::Read::cell2cr (@_); |
|
1085
|
|
|
|
|
|
|
} # cell2cr |
|
1086
|
|
|
|
|
|
|
|
|
1087
|
|
|
|
|
|
|
sub label { |
|
1088
|
2
|
|
|
2
|
|
6
|
my ($sheet, $label) = @_; |
|
1089
|
2
|
100
|
|
|
|
10
|
defined $label and $sheet->{label} = $label; |
|
1090
|
2
|
|
|
|
|
8
|
return $sheet->{label}; |
|
1091
|
|
|
|
|
|
|
} # label |
|
1092
|
|
|
|
|
|
|
|
|
1093
|
|
|
|
|
|
|
sub active { |
|
1094
|
1
|
|
|
1
|
|
3
|
my $sheet = shift; |
|
1095
|
1
|
|
|
|
|
4
|
return $sheet->{active}; |
|
1096
|
|
|
|
|
|
|
} # label |
|
1097
|
|
|
|
|
|
|
|
|
1098
|
|
|
|
|
|
|
# my @row = $sheet->cellrow (1); |
|
1099
|
|
|
|
|
|
|
sub cellrow { |
|
1100
|
4
|
|
|
4
|
|
11
|
my ($sheet, $row) = @_; |
|
1101
|
4
|
100
|
66
|
|
|
33
|
defined $row && $row > 0 && $row <= $sheet->{maxrow} or return; |
|
|
|
|
100
|
|
|
|
|
|
1102
|
1
|
|
|
|
|
3
|
my $s = $sheet->{cell}; |
|
1103
|
1
|
|
|
|
|
6
|
map { $s->[$_][$row] } 1..$sheet->{maxcol}; |
|
|
19
|
|
|
|
|
42
|
|
|
1104
|
|
|
|
|
|
|
} # cellrow |
|
1105
|
|
|
|
|
|
|
|
|
1106
|
|
|
|
|
|
|
# my @row = $sheet->row (1); |
|
1107
|
|
|
|
|
|
|
sub row { |
|
1108
|
4
|
|
|
4
|
|
9
|
my ($sheet, $row) = @_; |
|
1109
|
4
|
100
|
66
|
|
|
37
|
defined $row && $row > 0 && $row <= $sheet->{maxrow} or return; |
|
|
|
|
100
|
|
|
|
|
|
1110
|
1
|
|
|
|
|
5
|
map { $sheet->{$sheet->cr2cell ($_, $row)} } 1..$sheet->{maxcol}; |
|
|
19
|
|
|
|
|
48
|
|
|
1111
|
|
|
|
|
|
|
} # row |
|
1112
|
|
|
|
|
|
|
|
|
1113
|
|
|
|
|
|
|
# my @col = $sheet->cellcolumn (1); |
|
1114
|
|
|
|
|
|
|
sub cellcolumn { |
|
1115
|
4
|
|
|
4
|
|
10
|
my ($sheet, $col) = @_; |
|
1116
|
4
|
100
|
66
|
|
|
37
|
defined $col && $col > 0 && $col <= $sheet->{maxcol} or return; |
|
|
|
|
100
|
|
|
|
|
|
1117
|
1
|
|
|
|
|
3
|
my $s = $sheet->{cell}; |
|
1118
|
1
|
|
|
|
|
4
|
map { $s->[$col][$_] } 1..$sheet->{maxrow}; |
|
|
5
|
|
|
|
|
20
|
|
|
1119
|
|
|
|
|
|
|
} # cellcolumn |
|
1120
|
|
|
|
|
|
|
|
|
1121
|
|
|
|
|
|
|
# my @col = $sheet->column (1); |
|
1122
|
|
|
|
|
|
|
sub column { |
|
1123
|
4
|
|
|
4
|
|
13
|
my ($sheet, $col) = @_; |
|
1124
|
4
|
100
|
66
|
|
|
32
|
defined $col && $col > 0 && $col <= $sheet->{maxcol} or return; |
|
|
|
|
100
|
|
|
|
|
|
1125
|
1
|
|
|
|
|
4
|
map { $sheet->{$sheet->cr2cell ($col, $_)} } 1..$sheet->{maxrow}; |
|
|
5
|
|
|
|
|
13
|
|
|
1126
|
|
|
|
|
|
|
} # column |
|
1127
|
|
|
|
|
|
|
|
|
1128
|
|
|
|
|
|
|
# Convert {cell}'s [column][row] to a [row][column] list |
|
1129
|
|
|
|
|
|
|
# my @rows = $sheet->rows (); |
|
1130
|
|
|
|
|
|
|
sub rows { |
|
1131
|
1
|
|
|
1
|
|
4
|
my $sheet = shift; |
|
1132
|
1
|
|
|
|
|
2
|
my $s = $sheet->{cell}; |
|
1133
|
|
|
|
|
|
|
|
|
1134
|
|
|
|
|
|
|
map { |
|
1135
|
5
|
|
|
|
|
8
|
my $r = $_; |
|
1136
|
5
|
|
|
|
|
10
|
[ map { $s->[$_][$r] } 1..$sheet->{maxcol} ]; |
|
|
95
|
|
|
|
|
199
|
|
|
1137
|
1
|
|
|
|
|
5
|
} 1..$sheet->{maxrow}; |
|
1138
|
|
|
|
|
|
|
} # rows |
|
1139
|
|
|
|
|
|
|
|
|
1140
|
|
|
|
|
|
|
1; |
|
1141
|
|
|
|
|
|
|
|
|
1142
|
|
|
|
|
|
|
__END__ |
|
1143
|
|
|
|
|
|
|
=head1 DESCRIPTION |
|
1144
|
|
|
|
|
|
|
|
|
1145
|
|
|
|
|
|
|
Spreadsheet::Read tries to transparently read *any* spreadsheet and |
|
1146
|
|
|
|
|
|
|
return its content in a universal manner independent of the parsing |
|
1147
|
|
|
|
|
|
|
module that does the actual spreadsheet scanning. |
|
1148
|
|
|
|
|
|
|
|
|
1149
|
|
|
|
|
|
|
For OpenOffice and/or LibreOffice this module uses |
|
1150
|
|
|
|
|
|
|
L<Spreadsheet::ReadSXC|https://metacpan.org/release/Spreadsheet-ReadSXC> |
|
1151
|
|
|
|
|
|
|
|
|
1152
|
|
|
|
|
|
|
For Microsoft Excel this module uses |
|
1153
|
|
|
|
|
|
|
L<Spreadsheet::ParseExcel|https://metacpan.org/release/Spreadsheet-ParseExcel>, |
|
1154
|
|
|
|
|
|
|
L<Spreadsheet::ParseXLSX|https://metacpan.org/release/Spreadsheet-ParseXLSX>, or |
|
1155
|
|
|
|
|
|
|
L<Spreadsheet::XLSX|https://metacpan.org/release/Spreadsheet-XLSX> (stronly |
|
1156
|
|
|
|
|
|
|
discouraged). |
|
1157
|
|
|
|
|
|
|
|
|
1158
|
|
|
|
|
|
|
For CSV this module uses L<Text::CSV_XS|https://metacpan.org/release/Text-CSV_XS> |
|
1159
|
|
|
|
|
|
|
or L<Text::CSV_PP|https://metacpan.org/release/Text-CSV_PP>. |
|
1160
|
|
|
|
|
|
|
|
|
1161
|
|
|
|
|
|
|
For SquirrelCalc there is a very simplistic built-in parser |
|
1162
|
|
|
|
|
|
|
|
|
1163
|
|
|
|
|
|
|
=head2 Data structure |
|
1164
|
|
|
|
|
|
|
|
|
1165
|
|
|
|
|
|
|
The data is returned as an array reference: |
|
1166
|
|
|
|
|
|
|
|
|
1167
|
|
|
|
|
|
|
$book = [ |
|
1168
|
|
|
|
|
|
|
# Entry 0 is the overall control hash |
|
1169
|
|
|
|
|
|
|
{ sheets => 2, |
|
1170
|
|
|
|
|
|
|
sheet => { |
|
1171
|
|
|
|
|
|
|
"Sheet 1" => 1, |
|
1172
|
|
|
|
|
|
|
"Sheet 2" => 2, |
|
1173
|
|
|
|
|
|
|
}, |
|
1174
|
|
|
|
|
|
|
parsers => [ { |
|
1175
|
|
|
|
|
|
|
type => "xls", |
|
1176
|
|
|
|
|
|
|
parser => "Spreadsheet::ParseExcel", |
|
1177
|
|
|
|
|
|
|
version => 0.59, |
|
1178
|
|
|
|
|
|
|
}], |
|
1179
|
|
|
|
|
|
|
error => undef, |
|
1180
|
|
|
|
|
|
|
}, |
|
1181
|
|
|
|
|
|
|
# Entry 1 is the first sheet |
|
1182
|
|
|
|
|
|
|
{ parser => 0, |
|
1183
|
|
|
|
|
|
|
label => "Sheet 1", |
|
1184
|
|
|
|
|
|
|
maxrow => 2, |
|
1185
|
|
|
|
|
|
|
maxcol => 4, |
|
1186
|
|
|
|
|
|
|
cell => [ undef, |
|
1187
|
|
|
|
|
|
|
[ undef, 1 ], |
|
1188
|
|
|
|
|
|
|
[ undef, undef, undef, undef, undef, "Nugget" ], |
|
1189
|
|
|
|
|
|
|
], |
|
1190
|
|
|
|
|
|
|
attr => [], |
|
1191
|
|
|
|
|
|
|
merged => [], |
|
1192
|
|
|
|
|
|
|
active => 1, |
|
1193
|
|
|
|
|
|
|
A1 => 1, |
|
1194
|
|
|
|
|
|
|
B5 => "Nugget", |
|
1195
|
|
|
|
|
|
|
}, |
|
1196
|
|
|
|
|
|
|
# Entry 2 is the second sheet |
|
1197
|
|
|
|
|
|
|
{ parser => 0, |
|
1198
|
|
|
|
|
|
|
label => "Sheet 2", |
|
1199
|
|
|
|
|
|
|
: |
|
1200
|
|
|
|
|
|
|
: |
|
1201
|
|
|
|
|
|
|
|
|
1202
|
|
|
|
|
|
|
To keep as close contact to spreadsheet users, row and column 1 have |
|
1203
|
|
|
|
|
|
|
index 1 too in the C<cell> element of the sheet hash, so cell "A1" is |
|
1204
|
|
|
|
|
|
|
the same as C<cell> [1, 1] (column first). To switch between the two, |
|
1205
|
|
|
|
|
|
|
there are helper functions available: C<cell2cr ()>, C<cr2cell ()>, |
|
1206
|
|
|
|
|
|
|
and C<col2label ()>. |
|
1207
|
|
|
|
|
|
|
|
|
1208
|
|
|
|
|
|
|
The C<cell> hash entry contains unformatted data, while the hash entries |
|
1209
|
|
|
|
|
|
|
with the traditional labels contain the formatted values (if applicable). |
|
1210
|
|
|
|
|
|
|
|
|
1211
|
|
|
|
|
|
|
The control hash (the first entry in the returned array ref), contains |
|
1212
|
|
|
|
|
|
|
some spreadsheet meta-data. The entry C<sheet> is there to be able to find |
|
1213
|
|
|
|
|
|
|
the sheets when accessing them by name: |
|
1214
|
|
|
|
|
|
|
|
|
1215
|
|
|
|
|
|
|
my %sheet2 = %{$book->[$book->[0]{sheet}{"Sheet 2"}]}; |
|
1216
|
|
|
|
|
|
|
|
|
1217
|
|
|
|
|
|
|
=head2 Formatted vs Unformatted |
|
1218
|
|
|
|
|
|
|
|
|
1219
|
|
|
|
|
|
|
The difference between formatted and unformatted cells is that the (optional) |
|
1220
|
|
|
|
|
|
|
format is applied to the cell or not. This part is B<completely> implemented |
|
1221
|
|
|
|
|
|
|
on the parser side. Spreadsheet::Read just makes both available if these are |
|
1222
|
|
|
|
|
|
|
supported. Options provide means to disable either. If the parser does not |
|
1223
|
|
|
|
|
|
|
provide formatted cells - like CSV - both values are equal. |
|
1224
|
|
|
|
|
|
|
|
|
1225
|
|
|
|
|
|
|
To show what this implies: |
|
1226
|
|
|
|
|
|
|
|
|
1227
|
|
|
|
|
|
|
use Spreadsheet::Read; |
|
1228
|
|
|
|
|
|
|
|
|
1229
|
|
|
|
|
|
|
my $file = "files/example.xlsx"; |
|
1230
|
|
|
|
|
|
|
my $workbook = Spreadsheet::Read->new ($file); |
|
1231
|
|
|
|
|
|
|
|
|
1232
|
|
|
|
|
|
|
my $info = $workbook->[0]; |
|
1233
|
|
|
|
|
|
|
say "Parsed $file with $info->{parser}-$info->{version}"; |
|
1234
|
|
|
|
|
|
|
|
|
1235
|
|
|
|
|
|
|
my $sheet = $workbook->sheet (1); |
|
1236
|
|
|
|
|
|
|
|
|
1237
|
|
|
|
|
|
|
say join "\t" => "Formatted:", $sheet->row (1); |
|
1238
|
|
|
|
|
|
|
say join "\t" => "Unformatted:", $sheet->cellrow (1); |
|
1239
|
|
|
|
|
|
|
|
|
1240
|
|
|
|
|
|
|
Might return very different results depending one the underlying parser (and |
|
1241
|
|
|
|
|
|
|
its version): |
|
1242
|
|
|
|
|
|
|
|
|
1243
|
|
|
|
|
|
|
Parsed files/example.xlsx with Spreadsheet::ParseXLSX-0.27 |
|
1244
|
|
|
|
|
|
|
Formatted: 8-Aug Foo & Barr < Quux |
|
1245
|
|
|
|
|
|
|
Unformatted: 39668 Foo & Barr < Quux |
|
1246
|
|
|
|
|
|
|
|
|
1247
|
|
|
|
|
|
|
Parsed files/example.xlsx with Spreadsheet::XLSX-0.15 |
|
1248
|
|
|
|
|
|
|
Formatted: 39668 Foo & Barr < Quux |
|
1249
|
|
|
|
|
|
|
Unformatted: 39668 Foo & Barr < Quux |
|
1250
|
|
|
|
|
|
|
|
|
1251
|
|
|
|
|
|
|
=head2 Functions and methods |
|
1252
|
|
|
|
|
|
|
|
|
1253
|
|
|
|
|
|
|
=head3 new |
|
1254
|
|
|
|
|
|
|
|
|
1255
|
|
|
|
|
|
|
my $book = Spreadsheet::Read->new (...) or die $@; |
|
1256
|
|
|
|
|
|
|
|
|
1257
|
|
|
|
|
|
|
All options accepted by ReadData are accepted by new. |
|
1258
|
|
|
|
|
|
|
|
|
1259
|
|
|
|
|
|
|
With no arguments at all, $book will be an object where sheets can be added |
|
1260
|
|
|
|
|
|
|
using C<add> |
|
1261
|
|
|
|
|
|
|
|
|
1262
|
|
|
|
|
|
|
my $book = Spreadsheet::Read->new (); |
|
1263
|
|
|
|
|
|
|
$book->add ("file.csv"); |
|
1264
|
|
|
|
|
|
|
$book->add ("file.cslx"); |
|
1265
|
|
|
|
|
|
|
|
|
1266
|
|
|
|
|
|
|
=head3 ReadData |
|
1267
|
|
|
|
|
|
|
|
|
1268
|
|
|
|
|
|
|
my $book = ReadData ($source [, option => value [, ... ]]); |
|
1269
|
|
|
|
|
|
|
|
|
1270
|
|
|
|
|
|
|
my $book = ReadData ("file.csv", sep => ',', quote => '"'); |
|
1271
|
|
|
|
|
|
|
|
|
1272
|
|
|
|
|
|
|
my $book = ReadData ("file.xls", dtfmt => "yyyy-mm-dd"); |
|
1273
|
|
|
|
|
|
|
|
|
1274
|
|
|
|
|
|
|
my $book = ReadData ("file.ods"); |
|
1275
|
|
|
|
|
|
|
|
|
1276
|
|
|
|
|
|
|
my $book = ReadData ("file.sxc"); |
|
1277
|
|
|
|
|
|
|
|
|
1278
|
|
|
|
|
|
|
my $book = ReadData ("content.xml"); |
|
1279
|
|
|
|
|
|
|
|
|
1280
|
|
|
|
|
|
|
my $book = ReadData ($content); |
|
1281
|
|
|
|
|
|
|
|
|
1282
|
|
|
|
|
|
|
my $book = ReadData ($content, parser => "xlsx"); |
|
1283
|
|
|
|
|
|
|
|
|
1284
|
|
|
|
|
|
|
my $book = ReadData ($fh, parser => "xlsx"); |
|
1285
|
|
|
|
|
|
|
|
|
1286
|
|
|
|
|
|
|
my $book = ReadData (\$content, parser => "xlsx"); |
|
1287
|
|
|
|
|
|
|
|
|
1288
|
|
|
|
|
|
|
Tries to convert the given file, string, or stream to the data structure |
|
1289
|
|
|
|
|
|
|
described above. |
|
1290
|
|
|
|
|
|
|
|
|
1291
|
|
|
|
|
|
|
Processing Excel data from a stream or content is supported through a |
|
1292
|
|
|
|
|
|
|
L<File::Temp|https://metacpan.org/release/File-Temp> temporary file or |
|
1293
|
|
|
|
|
|
|
L<IO::Scalar|https://metacpan.org/release/IO-Scalar> when available. |
|
1294
|
|
|
|
|
|
|
|
|
1295
|
|
|
|
|
|
|
L<Spreadsheet::ReadSXC|https://metacpan.org/release/Spreadsheet-ReadSXC> |
|
1296
|
|
|
|
|
|
|
does preserve sheet order as of version 0.20. |
|
1297
|
|
|
|
|
|
|
|
|
1298
|
|
|
|
|
|
|
Choosing between C<$content> and C<\\$content> (with or without passing |
|
1299
|
|
|
|
|
|
|
the desired C<parser> option) may be depending on trial and terror. |
|
1300
|
|
|
|
|
|
|
C<ReadData> does try to determine parser type on content if needed, but |
|
1301
|
|
|
|
|
|
|
not all combinations are checked, and not all signatures are builtin. |
|
1302
|
|
|
|
|
|
|
|
|
1303
|
|
|
|
|
|
|
Currently supported options are: |
|
1304
|
|
|
|
|
|
|
|
|
1305
|
|
|
|
|
|
|
=over 2 |
|
1306
|
|
|
|
|
|
|
|
|
1307
|
|
|
|
|
|
|
=item parser |
|
1308
|
|
|
|
|
|
|
X<parser> |
|
1309
|
|
|
|
|
|
|
|
|
1310
|
|
|
|
|
|
|
Force the data to be parsed by a specific format. Possible values are |
|
1311
|
|
|
|
|
|
|
C<csv>, C<prl> (or C<perl>), C<sc> (or C<squirelcalc>), C<sxc> (or C<oo>, |
|
1312
|
|
|
|
|
|
|
C<ods>, C<openoffice>, C<libreoffice>) C<xls> (or C<excel>), and C<xlsx> |
|
1313
|
|
|
|
|
|
|
(or C<excel2007>). |
|
1314
|
|
|
|
|
|
|
|
|
1315
|
|
|
|
|
|
|
When parsing streams, instead of files, it is highly recommended to pass |
|
1316
|
|
|
|
|
|
|
this option. |
|
1317
|
|
|
|
|
|
|
|
|
1318
|
|
|
|
|
|
|
Spreadsheet::Read supports several underlying parsers per spreadsheet |
|
1319
|
|
|
|
|
|
|
type. It will try those from most favored to least favored. When you |
|
1320
|
|
|
|
|
|
|
have a good reason to prefer a different parser, you can set that in |
|
1321
|
|
|
|
|
|
|
environment variables. The other options then will not be tested for: |
|
1322
|
|
|
|
|
|
|
|
|
1323
|
|
|
|
|
|
|
env SPREADSHEET_READ_CSV=Text::CSV_PP ... |
|
1324
|
|
|
|
|
|
|
|
|
1325
|
|
|
|
|
|
|
=item cells |
|
1326
|
|
|
|
|
|
|
X<cells> |
|
1327
|
|
|
|
|
|
|
|
|
1328
|
|
|
|
|
|
|
Control the generation of named cells ("C<A1>" etc). Default is true. |
|
1329
|
|
|
|
|
|
|
|
|
1330
|
|
|
|
|
|
|
=item rc |
|
1331
|
|
|
|
|
|
|
|
|
1332
|
|
|
|
|
|
|
Control the generation of the {cell}[c][r] entries. Default is true. |
|
1333
|
|
|
|
|
|
|
|
|
1334
|
|
|
|
|
|
|
=item attr |
|
1335
|
|
|
|
|
|
|
|
|
1336
|
|
|
|
|
|
|
Control the generation of the {attr}[c][r] entries. Default is false. |
|
1337
|
|
|
|
|
|
|
See L</Cell Attributes> below. |
|
1338
|
|
|
|
|
|
|
|
|
1339
|
|
|
|
|
|
|
=item clip |
|
1340
|
|
|
|
|
|
|
|
|
1341
|
|
|
|
|
|
|
If set, L<C<ReadData>|/ReadData> will remove all trailing rows and columns |
|
1342
|
|
|
|
|
|
|
per sheet that have no data, where no data means only undefined or empty |
|
1343
|
|
|
|
|
|
|
cells (after optional stripping). If a sheet has no data at all, the sheet |
|
1344
|
|
|
|
|
|
|
will be skipped entirely when this attribute is true. |
|
1345
|
|
|
|
|
|
|
|
|
1346
|
|
|
|
|
|
|
=item strip |
|
1347
|
|
|
|
|
|
|
|
|
1348
|
|
|
|
|
|
|
If set, L<C<ReadData>|/ReadData> will remove trailing- and/or |
|
1349
|
|
|
|
|
|
|
leading-whitespace from every field. |
|
1350
|
|
|
|
|
|
|
|
|
1351
|
|
|
|
|
|
|
strip leading strailing |
|
1352
|
|
|
|
|
|
|
----- ------- --------- |
|
1353
|
|
|
|
|
|
|
0 n/a n/a |
|
1354
|
|
|
|
|
|
|
1 strip n/a |
|
1355
|
|
|
|
|
|
|
2 n/a strip |
|
1356
|
|
|
|
|
|
|
3 strip strip |
|
1357
|
|
|
|
|
|
|
|
|
1358
|
|
|
|
|
|
|
=item pivot |
|
1359
|
|
|
|
|
|
|
|
|
1360
|
|
|
|
|
|
|
Swap all rows and columns. |
|
1361
|
|
|
|
|
|
|
|
|
1362
|
|
|
|
|
|
|
When a sheet contains data like |
|
1363
|
|
|
|
|
|
|
|
|
1364
|
|
|
|
|
|
|
A1 B1 C1 E1 |
|
1365
|
|
|
|
|
|
|
A2 C2 D2 |
|
1366
|
|
|
|
|
|
|
A3 B3 C3 D3 E3 |
|
1367
|
|
|
|
|
|
|
|
|
1368
|
|
|
|
|
|
|
using C<pivot> will return the sheet data as |
|
1369
|
|
|
|
|
|
|
|
|
1370
|
|
|
|
|
|
|
A1 A2 A3 |
|
1371
|
|
|
|
|
|
|
B1 B3 |
|
1372
|
|
|
|
|
|
|
C1 C2 C3 |
|
1373
|
|
|
|
|
|
|
D2 D3 |
|
1374
|
|
|
|
|
|
|
E1 E3 |
|
1375
|
|
|
|
|
|
|
|
|
1376
|
|
|
|
|
|
|
=item sep |
|
1377
|
|
|
|
|
|
|
|
|
1378
|
|
|
|
|
|
|
Set separator for CSV. Default is comma C<,>. |
|
1379
|
|
|
|
|
|
|
|
|
1380
|
|
|
|
|
|
|
=item quote |
|
1381
|
|
|
|
|
|
|
|
|
1382
|
|
|
|
|
|
|
Set quote character for CSV. Default is C<">. |
|
1383
|
|
|
|
|
|
|
|
|
1384
|
|
|
|
|
|
|
=item dtfmt |
|
1385
|
|
|
|
|
|
|
|
|
1386
|
|
|
|
|
|
|
Set the format for MS-Excel date fields that are set to use the default |
|
1387
|
|
|
|
|
|
|
date format. The default format in Excel is "C<m-d-yy>", which is both |
|
1388
|
|
|
|
|
|
|
not year 2000 safe, nor very useful. The default is now "C<yyyy-mm-dd>", |
|
1389
|
|
|
|
|
|
|
which is more ISO-like. |
|
1390
|
|
|
|
|
|
|
|
|
1391
|
|
|
|
|
|
|
Note that date formatting in MS-Excel is not reliable at all, as it will |
|
1392
|
|
|
|
|
|
|
store/replace/change the date field separator in already stored formats |
|
1393
|
|
|
|
|
|
|
if you change your locale settings. So the above mentioned default can |
|
1394
|
|
|
|
|
|
|
be either "C<m-d-yy>" OR "C<m/d/yy>" depending on what that specific |
|
1395
|
|
|
|
|
|
|
character happened to be at the time the user saved the file. |
|
1396
|
|
|
|
|
|
|
|
|
1397
|
|
|
|
|
|
|
=item debug |
|
1398
|
|
|
|
|
|
|
|
|
1399
|
|
|
|
|
|
|
Enable some diagnostic messages to STDERR. |
|
1400
|
|
|
|
|
|
|
|
|
1401
|
|
|
|
|
|
|
The value determines how much diagnostics are dumped (using |
|
1402
|
|
|
|
|
|
|
L<Data::Peek|https://metacpan.org/release/Data-Peek>). A value of C<9> |
|
1403
|
|
|
|
|
|
|
and higher will dump the entire structure from the back-end parser. |
|
1404
|
|
|
|
|
|
|
|
|
1405
|
|
|
|
|
|
|
=item passwd |
|
1406
|
|
|
|
|
|
|
|
|
1407
|
|
|
|
|
|
|
Use this password to decrypt password protected spreadsheet. |
|
1408
|
|
|
|
|
|
|
|
|
1409
|
|
|
|
|
|
|
Currently only supports Excel. |
|
1410
|
|
|
|
|
|
|
|
|
1411
|
|
|
|
|
|
|
=back |
|
1412
|
|
|
|
|
|
|
|
|
1413
|
|
|
|
|
|
|
All other attributes/options will be passed to the underlying parser if |
|
1414
|
|
|
|
|
|
|
that parser supports attributes. |
|
1415
|
|
|
|
|
|
|
|
|
1416
|
|
|
|
|
|
|
=head3 col2label |
|
1417
|
|
|
|
|
|
|
|
|
1418
|
|
|
|
|
|
|
my $col_id = col2label (col); |
|
1419
|
|
|
|
|
|
|
|
|
1420
|
|
|
|
|
|
|
my $col_id = $book->col2label (col); # OO |
|
1421
|
|
|
|
|
|
|
|
|
1422
|
|
|
|
|
|
|
C<col2label ()> converts a C<(column)> (1 based) to the letters used in the |
|
1423
|
|
|
|
|
|
|
traditional cell notation: |
|
1424
|
|
|
|
|
|
|
|
|
1425
|
|
|
|
|
|
|
my $id = col2label ( 4); # $id now "D" |
|
1426
|
|
|
|
|
|
|
my $id = col2label (28); # $id now "AB" |
|
1427
|
|
|
|
|
|
|
|
|
1428
|
|
|
|
|
|
|
=head3 cr2cell |
|
1429
|
|
|
|
|
|
|
|
|
1430
|
|
|
|
|
|
|
my $cell = cr2cell (col, row); |
|
1431
|
|
|
|
|
|
|
|
|
1432
|
|
|
|
|
|
|
my $cell = $book->cr2cell (col, row); # OO |
|
1433
|
|
|
|
|
|
|
|
|
1434
|
|
|
|
|
|
|
C<cr2cell ()> converts a C<(column, row)> pair (1 based) to the |
|
1435
|
|
|
|
|
|
|
traditional cell notation: |
|
1436
|
|
|
|
|
|
|
|
|
1437
|
|
|
|
|
|
|
my $cell = cr2cell ( 4, 14); # $cell now "D14" |
|
1438
|
|
|
|
|
|
|
my $cell = cr2cell (28, 4); # $cell now "AB4" |
|
1439
|
|
|
|
|
|
|
|
|
1440
|
|
|
|
|
|
|
=head3 cell2cr |
|
1441
|
|
|
|
|
|
|
|
|
1442
|
|
|
|
|
|
|
my ($col, $row) = cell2cr ($cell); |
|
1443
|
|
|
|
|
|
|
|
|
1444
|
|
|
|
|
|
|
my ($col, $row) = $book->cell2cr ($cell); # OO |
|
1445
|
|
|
|
|
|
|
|
|
1446
|
|
|
|
|
|
|
C<cell2cr ()> converts traditional cell notation to a C<(column, row)> |
|
1447
|
|
|
|
|
|
|
pair (1 based): |
|
1448
|
|
|
|
|
|
|
|
|
1449
|
|
|
|
|
|
|
my ($col, $row) = cell2cr ("D14"); # returns ( 4, 14) |
|
1450
|
|
|
|
|
|
|
my ($col, $row) = cell2cr ("AB4"); # returns (28, 4) |
|
1451
|
|
|
|
|
|
|
|
|
1452
|
|
|
|
|
|
|
=head3 row |
|
1453
|
|
|
|
|
|
|
|
|
1454
|
|
|
|
|
|
|
my @row = row ($sheet, $row) |
|
1455
|
|
|
|
|
|
|
|
|
1456
|
|
|
|
|
|
|
my @row = Spreadsheet::Read::row ($book->[1], 3); |
|
1457
|
|
|
|
|
|
|
|
|
1458
|
|
|
|
|
|
|
my @row = $book->row ($sheet, $row); # OO |
|
1459
|
|
|
|
|
|
|
|
|
1460
|
|
|
|
|
|
|
Get full row of formatted values (like C<< $sheet->{A3} .. $sheet->{G3} >>) |
|
1461
|
|
|
|
|
|
|
|
|
1462
|
|
|
|
|
|
|
Note that the indexes in the returned list are 0-based. |
|
1463
|
|
|
|
|
|
|
|
|
1464
|
|
|
|
|
|
|
C<row ()> is not imported by default, so either specify it in the |
|
1465
|
|
|
|
|
|
|
use argument list, or call it fully qualified. |
|
1466
|
|
|
|
|
|
|
|
|
1467
|
|
|
|
|
|
|
See also the C<row ()> method on sheets. |
|
1468
|
|
|
|
|
|
|
|
|
1469
|
|
|
|
|
|
|
=head3 cellrow |
|
1470
|
|
|
|
|
|
|
|
|
1471
|
|
|
|
|
|
|
my @row = cellrow ($sheet, $row); |
|
1472
|
|
|
|
|
|
|
|
|
1473
|
|
|
|
|
|
|
my @row = Spreadsheet::Read::cellrow ($book->[1], 3); |
|
1474
|
|
|
|
|
|
|
|
|
1475
|
|
|
|
|
|
|
my @row = $book->cellrow ($sheet, $row); # OO |
|
1476
|
|
|
|
|
|
|
|
|
1477
|
|
|
|
|
|
|
Get full row of unformatted values (like C<< $sheet->{cell}[1][3] .. $sheet->{cell}[7][3] >>) |
|
1478
|
|
|
|
|
|
|
|
|
1479
|
|
|
|
|
|
|
Note that the indexes in the returned list are 0-based. |
|
1480
|
|
|
|
|
|
|
|
|
1481
|
|
|
|
|
|
|
C<cellrow ()> is not imported by default, so either specify it in the |
|
1482
|
|
|
|
|
|
|
use argument list, or call it fully qualified or as method call. |
|
1483
|
|
|
|
|
|
|
|
|
1484
|
|
|
|
|
|
|
See also the C<cellrow ()> method on sheets. |
|
1485
|
|
|
|
|
|
|
|
|
1486
|
|
|
|
|
|
|
=head3 rows |
|
1487
|
|
|
|
|
|
|
|
|
1488
|
|
|
|
|
|
|
my @rows = rows ($sheet); |
|
1489
|
|
|
|
|
|
|
|
|
1490
|
|
|
|
|
|
|
my @rows = Spreadsheet::Read::rows ($book->[1]); |
|
1491
|
|
|
|
|
|
|
|
|
1492
|
|
|
|
|
|
|
my @rows = $book->rows (1); # OO |
|
1493
|
|
|
|
|
|
|
|
|
1494
|
|
|
|
|
|
|
Convert C<{cell}>'s C<[column][row]> to a C<[row][column]> list. |
|
1495
|
|
|
|
|
|
|
|
|
1496
|
|
|
|
|
|
|
Note that the indexes in the returned list are 0-based, where the |
|
1497
|
|
|
|
|
|
|
index in the C<{cell}> entry is 1-based. |
|
1498
|
|
|
|
|
|
|
|
|
1499
|
|
|
|
|
|
|
C<rows ()> is not imported by default, so either specify it in the |
|
1500
|
|
|
|
|
|
|
use argument list, or call it fully qualified. |
|
1501
|
|
|
|
|
|
|
|
|
1502
|
|
|
|
|
|
|
=head3 parses |
|
1503
|
|
|
|
|
|
|
|
|
1504
|
|
|
|
|
|
|
parses ($format); |
|
1505
|
|
|
|
|
|
|
|
|
1506
|
|
|
|
|
|
|
Spreadsheet::Read::parses ("CSV"); |
|
1507
|
|
|
|
|
|
|
|
|
1508
|
|
|
|
|
|
|
$book->parses ("CSV"); # OO |
|
1509
|
|
|
|
|
|
|
|
|
1510
|
|
|
|
|
|
|
C<parses ()> returns Spreadsheet::Read's capability to parse the |
|
1511
|
|
|
|
|
|
|
required format. L<C<ReadData>|/ReadData> will pick its preferred parser |
|
1512
|
|
|
|
|
|
|
for that format unless overruled. See L<C<parser>|/parser>. |
|
1513
|
|
|
|
|
|
|
|
|
1514
|
|
|
|
|
|
|
C<parses ()> is not imported by default, so either specify it in the |
|
1515
|
|
|
|
|
|
|
use argument list, or call it fully qualified. |
|
1516
|
|
|
|
|
|
|
|
|
1517
|
|
|
|
|
|
|
=head3 Version |
|
1518
|
|
|
|
|
|
|
|
|
1519
|
|
|
|
|
|
|
my $v = Version () |
|
1520
|
|
|
|
|
|
|
|
|
1521
|
|
|
|
|
|
|
my $v = Spreadsheet::Read::Version () |
|
1522
|
|
|
|
|
|
|
|
|
1523
|
|
|
|
|
|
|
my $v = Spreadsheet::Read->VERSION; |
|
1524
|
|
|
|
|
|
|
|
|
1525
|
|
|
|
|
|
|
my $v = $book->Version (); # OO |
|
1526
|
|
|
|
|
|
|
|
|
1527
|
|
|
|
|
|
|
Returns the current version of Spreadsheet::Read. |
|
1528
|
|
|
|
|
|
|
|
|
1529
|
|
|
|
|
|
|
C<Version ()> is not imported by default, so either specify it in the |
|
1530
|
|
|
|
|
|
|
use argument list, or call it fully qualified. |
|
1531
|
|
|
|
|
|
|
|
|
1532
|
|
|
|
|
|
|
This function returns exactly the same as C<< Spreadsheet::Read->VERSION >> |
|
1533
|
|
|
|
|
|
|
returns and is only kept for backward compatibility reasons. |
|
1534
|
|
|
|
|
|
|
|
|
1535
|
|
|
|
|
|
|
=head3 sheets |
|
1536
|
|
|
|
|
|
|
|
|
1537
|
|
|
|
|
|
|
my $sheets = $book->sheets; # OO |
|
1538
|
|
|
|
|
|
|
my @sheets = $book->sheets; # OO |
|
1539
|
|
|
|
|
|
|
|
|
1540
|
|
|
|
|
|
|
In scalar context return the number of sheets in the book. |
|
1541
|
|
|
|
|
|
|
In list context return the labels of the sheets in the book. |
|
1542
|
|
|
|
|
|
|
|
|
1543
|
|
|
|
|
|
|
=head3 sheet |
|
1544
|
|
|
|
|
|
|
|
|
1545
|
|
|
|
|
|
|
my $sheet = $book->sheet (1); # OO |
|
1546
|
|
|
|
|
|
|
my $sheet = $book->sheet ("Foo"); # OO |
|
1547
|
|
|
|
|
|
|
|
|
1548
|
|
|
|
|
|
|
Return the numbered or named sheet out of the book. Will return C<undef> if |
|
1549
|
|
|
|
|
|
|
there is no match. Will not work for sheets I<named> with a number between 1 |
|
1550
|
|
|
|
|
|
|
and the number of sheets in the book. |
|
1551
|
|
|
|
|
|
|
|
|
1552
|
|
|
|
|
|
|
With named sheets will first try to use the list of sheet-labels as stored in |
|
1553
|
|
|
|
|
|
|
the control structure. If no match is found, it will scan the actual labels |
|
1554
|
|
|
|
|
|
|
of the sheets. In that case, it will return the first matching sheet. |
|
1555
|
|
|
|
|
|
|
|
|
1556
|
|
|
|
|
|
|
If defined, the returned sheet will be of class C<Spreadsheet::Read::Sheet>. |
|
1557
|
|
|
|
|
|
|
|
|
1558
|
|
|
|
|
|
|
=head3 add |
|
1559
|
|
|
|
|
|
|
|
|
1560
|
|
|
|
|
|
|
my $book = ReadData ("file.csv"); |
|
1561
|
|
|
|
|
|
|
Spreadsheet::Read::add ($book, "file.xlsx"); |
|
1562
|
|
|
|
|
|
|
|
|
1563
|
|
|
|
|
|
|
my $book = Spreadsheet::Read->new ("file.csv"); |
|
1564
|
|
|
|
|
|
|
$book->add ("file.xlsx"); # OO |
|
1565
|
|
|
|
|
|
|
|
|
1566
|
|
|
|
|
|
|
=head2 Methods on sheets |
|
1567
|
|
|
|
|
|
|
|
|
1568
|
|
|
|
|
|
|
=head3 maxcol |
|
1569
|
|
|
|
|
|
|
|
|
1570
|
|
|
|
|
|
|
my $col = $sheet->maxcol; |
|
1571
|
|
|
|
|
|
|
|
|
1572
|
|
|
|
|
|
|
Return the index of the last in-use column in the sheet. This index is 1-based. |
|
1573
|
|
|
|
|
|
|
|
|
1574
|
|
|
|
|
|
|
=head3 maxrow |
|
1575
|
|
|
|
|
|
|
|
|
1576
|
|
|
|
|
|
|
my $row = $sheet->maxrow; |
|
1577
|
|
|
|
|
|
|
|
|
1578
|
|
|
|
|
|
|
Return the index of the last in-use row in the sheet. This index is 1-based. |
|
1579
|
|
|
|
|
|
|
|
|
1580
|
|
|
|
|
|
|
=head3 cell |
|
1581
|
|
|
|
|
|
|
|
|
1582
|
|
|
|
|
|
|
my $cell = $sheet->cell ("A3"); |
|
1583
|
|
|
|
|
|
|
my $cell = $sheet->cell (1, 3); |
|
1584
|
|
|
|
|
|
|
|
|
1585
|
|
|
|
|
|
|
Return the value for a cell. Using tags will return the formatted value, |
|
1586
|
|
|
|
|
|
|
using column and row will return unformatted value. |
|
1587
|
|
|
|
|
|
|
|
|
1588
|
|
|
|
|
|
|
=head3 attr |
|
1589
|
|
|
|
|
|
|
|
|
1590
|
|
|
|
|
|
|
my $cell = $sheet->attr ("A3"); |
|
1591
|
|
|
|
|
|
|
my $cell = $sheet->attr (1, 3); |
|
1592
|
|
|
|
|
|
|
|
|
1593
|
|
|
|
|
|
|
Return the attributes of a cell. Only valid if attributes are enabled through |
|
1594
|
|
|
|
|
|
|
option C<attr>. |
|
1595
|
|
|
|
|
|
|
|
|
1596
|
|
|
|
|
|
|
=head3 col2label |
|
1597
|
|
|
|
|
|
|
|
|
1598
|
|
|
|
|
|
|
my $col_id = $sheet->col2label (col); |
|
1599
|
|
|
|
|
|
|
|
|
1600
|
|
|
|
|
|
|
C<col2label ()> converts a C<(column)> (1 based) to the letters used in the |
|
1601
|
|
|
|
|
|
|
traditional cell notation: |
|
1602
|
|
|
|
|
|
|
|
|
1603
|
|
|
|
|
|
|
my $id = $sheet->col2label ( 4); # $id now "D" |
|
1604
|
|
|
|
|
|
|
my $id = $sheet->col2label (28); # $id now "AB" |
|
1605
|
|
|
|
|
|
|
|
|
1606
|
|
|
|
|
|
|
=head3 cr2cell |
|
1607
|
|
|
|
|
|
|
|
|
1608
|
|
|
|
|
|
|
my $cell = $sheet->cr2cell (col, row); |
|
1609
|
|
|
|
|
|
|
|
|
1610
|
|
|
|
|
|
|
C<cr2cell ()> converts a C<(column, row)> pair (1 based) to the |
|
1611
|
|
|
|
|
|
|
traditional cell notation: |
|
1612
|
|
|
|
|
|
|
|
|
1613
|
|
|
|
|
|
|
my $cell = $sheet->cr2cell ( 4, 14); # $cell now "D14" |
|
1614
|
|
|
|
|
|
|
my $cell = $sheet->cr2cell (28, 4); # $cell now "AB4" |
|
1615
|
|
|
|
|
|
|
|
|
1616
|
|
|
|
|
|
|
=head3 cell2cr |
|
1617
|
|
|
|
|
|
|
|
|
1618
|
|
|
|
|
|
|
my ($col, $row) = $sheet->cell2cr ($cell); |
|
1619
|
|
|
|
|
|
|
|
|
1620
|
|
|
|
|
|
|
C<cell2cr ()> converts traditional cell notation to a C<(column, row)> |
|
1621
|
|
|
|
|
|
|
pair (1 based): |
|
1622
|
|
|
|
|
|
|
|
|
1623
|
|
|
|
|
|
|
my ($col, $row) = $sheet->cell2cr ("D14"); # returns ( 4, 14) |
|
1624
|
|
|
|
|
|
|
my ($col, $row) = $sheet->cell2cr ("AB4"); # returns (28, 4) |
|
1625
|
|
|
|
|
|
|
|
|
1626
|
|
|
|
|
|
|
=head3 col |
|
1627
|
|
|
|
|
|
|
|
|
1628
|
|
|
|
|
|
|
my @col = $sheet->column ($col); |
|
1629
|
|
|
|
|
|
|
|
|
1630
|
|
|
|
|
|
|
Get full column of formatted values (like C<< $sheet->{C1} .. $sheet->{C9} >>) |
|
1631
|
|
|
|
|
|
|
|
|
1632
|
|
|
|
|
|
|
Note that the indexes in the returned list are 0-based. |
|
1633
|
|
|
|
|
|
|
|
|
1634
|
|
|
|
|
|
|
=head3 cellcolumn |
|
1635
|
|
|
|
|
|
|
|
|
1636
|
|
|
|
|
|
|
my @col = $sheet->cellcolumn ($col); |
|
1637
|
|
|
|
|
|
|
|
|
1638
|
|
|
|
|
|
|
Get full column of unformatted values (like C<< $sheet->{cell}[3][1] .. $sheet->{cell}[3][9] >>) |
|
1639
|
|
|
|
|
|
|
|
|
1640
|
|
|
|
|
|
|
Note that the indexes in the returned list are 0-based. |
|
1641
|
|
|
|
|
|
|
|
|
1642
|
|
|
|
|
|
|
=head3 row |
|
1643
|
|
|
|
|
|
|
|
|
1644
|
|
|
|
|
|
|
my @row = $sheet->row ($row); |
|
1645
|
|
|
|
|
|
|
|
|
1646
|
|
|
|
|
|
|
Get full row of formatted values (like C<< $sheet->{A3} .. $sheet->{G3} >>) |
|
1647
|
|
|
|
|
|
|
|
|
1648
|
|
|
|
|
|
|
Note that the indexes in the returned list are 0-based. |
|
1649
|
|
|
|
|
|
|
|
|
1650
|
|
|
|
|
|
|
=head3 cellrow |
|
1651
|
|
|
|
|
|
|
|
|
1652
|
|
|
|
|
|
|
my @row = $sheet->cellrow ($row); |
|
1653
|
|
|
|
|
|
|
|
|
1654
|
|
|
|
|
|
|
Get full row of unformatted values (like C<< $sheet->{cell}[1][3] .. $sheet->{cell}[7][3] >>) |
|
1655
|
|
|
|
|
|
|
|
|
1656
|
|
|
|
|
|
|
Note that the indexes in the returned list are 0-based. |
|
1657
|
|
|
|
|
|
|
|
|
1658
|
|
|
|
|
|
|
=head3 rows |
|
1659
|
|
|
|
|
|
|
|
|
1660
|
|
|
|
|
|
|
my @rows = $sheet->rows (); |
|
1661
|
|
|
|
|
|
|
|
|
1662
|
|
|
|
|
|
|
Convert C<{cell}>'s C<[column][row]> to a C<[row][column]> list. |
|
1663
|
|
|
|
|
|
|
|
|
1664
|
|
|
|
|
|
|
Note that the indexes in the returned list are 0-based, where the |
|
1665
|
|
|
|
|
|
|
index in the C<{cell}> entry is 1-based. |
|
1666
|
|
|
|
|
|
|
|
|
1667
|
|
|
|
|
|
|
=head3 label |
|
1668
|
|
|
|
|
|
|
|
|
1669
|
|
|
|
|
|
|
my $label = $sheet->label; |
|
1670
|
|
|
|
|
|
|
$sheet->label ("New sheet label"); |
|
1671
|
|
|
|
|
|
|
|
|
1672
|
|
|
|
|
|
|
Set a new label to a sheet. Note that the index in the control structure will |
|
1673
|
|
|
|
|
|
|
I<NOT> be updated. |
|
1674
|
|
|
|
|
|
|
|
|
1675
|
|
|
|
|
|
|
=head3 active |
|
1676
|
|
|
|
|
|
|
|
|
1677
|
|
|
|
|
|
|
my $sheet_is_active = $sheet->active; |
|
1678
|
|
|
|
|
|
|
|
|
1679
|
|
|
|
|
|
|
Returns 1 if the selected sheet is active, otherwise returns 0. |
|
1680
|
|
|
|
|
|
|
|
|
1681
|
|
|
|
|
|
|
Currently only works on XLS (as of Spreadsheed::ParseExcel-0.61). |
|
1682
|
|
|
|
|
|
|
CSV is always active. |
|
1683
|
|
|
|
|
|
|
|
|
1684
|
|
|
|
|
|
|
=head2 Using CSV |
|
1685
|
|
|
|
|
|
|
|
|
1686
|
|
|
|
|
|
|
In case of CSV parsing, L<C<ReadData>|/ReadData> will use the first line of |
|
1687
|
|
|
|
|
|
|
the file to auto-detect the separation character if the first argument is a |
|
1688
|
|
|
|
|
|
|
file and both C<sep> and C<quote> are not passed as attributes. |
|
1689
|
|
|
|
|
|
|
L<Text::CSV_XS|https://metacpan.org/release/Text-CSV_XS> (or |
|
1690
|
|
|
|
|
|
|
L<Text::CSV_PP|https://metacpan.org/release/Text-CSV_PP>) is able to |
|
1691
|
|
|
|
|
|
|
automatically detect and use C<\r> line endings. |
|
1692
|
|
|
|
|
|
|
|
|
1693
|
|
|
|
|
|
|
CSV can parse streams too, but be sure to pass C<sep> and/or C<quote> if |
|
1694
|
|
|
|
|
|
|
these do not match the default C<,> and C<">. |
|
1695
|
|
|
|
|
|
|
|
|
1696
|
|
|
|
|
|
|
When an error is found in the CSV, it is automatically reported (to STDERR). |
|
1697
|
|
|
|
|
|
|
The structure will store the error in C<< $ss->[0]{error} >> as anonymous |
|
1698
|
|
|
|
|
|
|
list returned by |
|
1699
|
|
|
|
|
|
|
L<C<< $csv->error_diag >>|https://metacpan.org/pod/Text::CSV_XS#error_diag>. |
|
1700
|
|
|
|
|
|
|
See L<Text::CSV_XS|https://metacpan.org/pod/Text-CSV_XS> for documentation. |
|
1701
|
|
|
|
|
|
|
|
|
1702
|
|
|
|
|
|
|
my $ss = ReadData ("bad.csv"); |
|
1703
|
|
|
|
|
|
|
$ss->[0]{error} and say $ss->[0]{error}[1]; |
|
1704
|
|
|
|
|
|
|
|
|
1705
|
|
|
|
|
|
|
As CSV has no sheet labels, the default label for a CSV sheet is its filename. |
|
1706
|
|
|
|
|
|
|
For CSV, this can be overruled using the I<label> attribute: |
|
1707
|
|
|
|
|
|
|
|
|
1708
|
|
|
|
|
|
|
my $ss = Spreadsheet::Read->new ("/some/place/test.csv", label => "Test"); |
|
1709
|
|
|
|
|
|
|
|
|
1710
|
|
|
|
|
|
|
=head2 Cell Attributes |
|
1711
|
|
|
|
|
|
|
X<attr> |
|
1712
|
|
|
|
|
|
|
|
|
1713
|
|
|
|
|
|
|
If the constructor was called with C<attr> having a true value, |
|
1714
|
|
|
|
|
|
|
|
|
1715
|
|
|
|
|
|
|
my $book = ReadData ("book.xls", attr => 1); |
|
1716
|
|
|
|
|
|
|
my $book = Spreadsheet::Read->new ("book.xlsx", attr => 1); |
|
1717
|
|
|
|
|
|
|
|
|
1718
|
|
|
|
|
|
|
effort is made to analyze and store field attributes like this: |
|
1719
|
|
|
|
|
|
|
|
|
1720
|
|
|
|
|
|
|
{ label => "Sheet 1", |
|
1721
|
|
|
|
|
|
|
maxrow => 5, |
|
1722
|
|
|
|
|
|
|
maxcol => 2, |
|
1723
|
|
|
|
|
|
|
cell => [ undef, |
|
1724
|
|
|
|
|
|
|
[ undef, 1 ], |
|
1725
|
|
|
|
|
|
|
[ undef, undef, undef, undef, undef, "Nugget" ], |
|
1726
|
|
|
|
|
|
|
], |
|
1727
|
|
|
|
|
|
|
attr => [ undef, |
|
1728
|
|
|
|
|
|
|
[ undef, { |
|
1729
|
|
|
|
|
|
|
type => "numeric", |
|
1730
|
|
|
|
|
|
|
fgcolor => "#ff0000", |
|
1731
|
|
|
|
|
|
|
bgcolor => undef, |
|
1732
|
|
|
|
|
|
|
font => "Arial", |
|
1733
|
|
|
|
|
|
|
size => undef, |
|
1734
|
|
|
|
|
|
|
format => "## ##0.00", |
|
1735
|
|
|
|
|
|
|
halign => "right", |
|
1736
|
|
|
|
|
|
|
valign => "top", |
|
1737
|
|
|
|
|
|
|
uline => 0, |
|
1738
|
|
|
|
|
|
|
bold => 0, |
|
1739
|
|
|
|
|
|
|
italic => 0, |
|
1740
|
|
|
|
|
|
|
wrap => 0, |
|
1741
|
|
|
|
|
|
|
merged => 0, |
|
1742
|
|
|
|
|
|
|
hidden => 0, |
|
1743
|
|
|
|
|
|
|
locked => 0, |
|
1744
|
|
|
|
|
|
|
enc => "utf-8", |
|
1745
|
|
|
|
|
|
|
}, ] |
|
1746
|
|
|
|
|
|
|
[ undef, undef, undef, undef, undef, { |
|
1747
|
|
|
|
|
|
|
type => "text", |
|
1748
|
|
|
|
|
|
|
fgcolor => "#e2e2e2", |
|
1749
|
|
|
|
|
|
|
bgcolor => undef, |
|
1750
|
|
|
|
|
|
|
font => "Letter Gothic", |
|
1751
|
|
|
|
|
|
|
size => 15, |
|
1752
|
|
|
|
|
|
|
format => undef, |
|
1753
|
|
|
|
|
|
|
halign => "left", |
|
1754
|
|
|
|
|
|
|
valign => "top", |
|
1755
|
|
|
|
|
|
|
uline => 0, |
|
1756
|
|
|
|
|
|
|
bold => 0, |
|
1757
|
|
|
|
|
|
|
italic => 0, |
|
1758
|
|
|
|
|
|
|
wrap => 0, |
|
1759
|
|
|
|
|
|
|
merged => 0, |
|
1760
|
|
|
|
|
|
|
hidden => 0, |
|
1761
|
|
|
|
|
|
|
locked => 0, |
|
1762
|
|
|
|
|
|
|
enc => "iso8859-1", |
|
1763
|
|
|
|
|
|
|
}, ] |
|
1764
|
|
|
|
|
|
|
merged => [], |
|
1765
|
|
|
|
|
|
|
A1 => 1, |
|
1766
|
|
|
|
|
|
|
B5 => "Nugget", |
|
1767
|
|
|
|
|
|
|
}, |
|
1768
|
|
|
|
|
|
|
|
|
1769
|
|
|
|
|
|
|
The entries C<maxrow> and C<maxcol> are 1-based. |
|
1770
|
|
|
|
|
|
|
|
|
1771
|
|
|
|
|
|
|
This has now been partially implemented, mainly for Excel, as the other |
|
1772
|
|
|
|
|
|
|
parsers do not (yet) support all of that. YMMV. |
|
1773
|
|
|
|
|
|
|
|
|
1774
|
|
|
|
|
|
|
If a cell itself is not hidden, but the parser holds the information that |
|
1775
|
|
|
|
|
|
|
either the row or the column (or both) the field is in is hidden, the flag |
|
1776
|
|
|
|
|
|
|
is inherited into the cell attributes. |
|
1777
|
|
|
|
|
|
|
|
|
1778
|
|
|
|
|
|
|
You can get the attributes of a cell (as a hash-ref) like this: |
|
1779
|
|
|
|
|
|
|
|
|
1780
|
|
|
|
|
|
|
my $attr = $book[1]{attr}[1][3]; # Direct structure |
|
1781
|
|
|
|
|
|
|
my $attr = $book->sheet (1)->attr (1, 3); # Same using OO |
|
1782
|
|
|
|
|
|
|
my $attr = $book->sheet (1)->attr ("A3"); # Same using OO |
|
1783
|
|
|
|
|
|
|
|
|
1784
|
|
|
|
|
|
|
To get to the C<font> attribute, use any of these: |
|
1785
|
|
|
|
|
|
|
|
|
1786
|
|
|
|
|
|
|
my $font = $book[1]{attr}[1][3]{font}; |
|
1787
|
|
|
|
|
|
|
my $font = $book->sheet (1)->attr (1, 3)->{font}; |
|
1788
|
|
|
|
|
|
|
my $font = $book->sheet (1)->attr ("A3")->font; |
|
1789
|
|
|
|
|
|
|
|
|
1790
|
|
|
|
|
|
|
=head3 Merged cells |
|
1791
|
|
|
|
|
|
|
X<merged> |
|
1792
|
|
|
|
|
|
|
|
|
1793
|
|
|
|
|
|
|
Note that only |
|
1794
|
|
|
|
|
|
|
L<Spreadsheet::ReadSXC|https://metacpan.org/release/Spreadsheet-ReadSXC> |
|
1795
|
|
|
|
|
|
|
documents the use of merged cells, and not in a way useful for the spreadsheet |
|
1796
|
|
|
|
|
|
|
consumer. |
|
1797
|
|
|
|
|
|
|
|
|
1798
|
|
|
|
|
|
|
CSV does not support merged cells (though future implementations of CSV |
|
1799
|
|
|
|
|
|
|
for the web might). |
|
1800
|
|
|
|
|
|
|
|
|
1801
|
|
|
|
|
|
|
The documentation of merged areas in |
|
1802
|
|
|
|
|
|
|
L<Spreadsheet::ParseExcel|https://metacpan.org/release/Spreadsheet-ParseExcel> and |
|
1803
|
|
|
|
|
|
|
L<Spreadsheet::ParseXLSX|https://metacpan.org/release/Spreadsheet-ParseXLSX> can |
|
1804
|
|
|
|
|
|
|
be found in |
|
1805
|
|
|
|
|
|
|
L<Spreadsheet::ParseExcel::Worksheet|https://metacpan.org/release/Spreadsheet-ParseExcel-Worksheet> |
|
1806
|
|
|
|
|
|
|
and L<Spreadsheet::ParseExcel::Cell|https://metacpan.org/release/Spreadsheet-ParseExcel-Cell>. |
|
1807
|
|
|
|
|
|
|
|
|
1808
|
|
|
|
|
|
|
None of basic L<Spreadsheet::XLSX|https://metacpan.org/release/Spreadsheet-XLSX>, |
|
1809
|
|
|
|
|
|
|
L<Spreadsheet::ParseExcel|https://metacpan.org/release/Spreadsheet-ParseExcel>, and |
|
1810
|
|
|
|
|
|
|
L<Spreadsheet::ParseXLSX|https://metacpan.org/release/Spreadsheet-ParseXLSX> manual |
|
1811
|
|
|
|
|
|
|
pages mention merged cells at all. |
|
1812
|
|
|
|
|
|
|
|
|
1813
|
|
|
|
|
|
|
This module just tries to return the information in a generic way. |
|
1814
|
|
|
|
|
|
|
|
|
1815
|
|
|
|
|
|
|
Given this spreadsheet as an example |
|
1816
|
|
|
|
|
|
|
|
|
1817
|
|
|
|
|
|
|
merged.xlsx: |
|
1818
|
|
|
|
|
|
|
|
|
1819
|
|
|
|
|
|
|
A B C |
|
1820
|
|
|
|
|
|
|
+-----+-----------+ |
|
1821
|
|
|
|
|
|
|
1| | foo | |
|
1822
|
|
|
|
|
|
|
+-----+ + |
|
1823
|
|
|
|
|
|
|
2| bar | | |
|
1824
|
|
|
|
|
|
|
| +-----+-----+ |
|
1825
|
|
|
|
|
|
|
3| | urg | orc | |
|
1826
|
|
|
|
|
|
|
+-----+-----+-----+ |
|
1827
|
|
|
|
|
|
|
|
|
1828
|
|
|
|
|
|
|
the information extracted from that undocumented information is |
|
1829
|
|
|
|
|
|
|
returned in the C<merged> entry of the sheet's hash as a list of |
|
1830
|
|
|
|
|
|
|
top-left, bottom-right coordinate pars (col, row, col, row). For |
|
1831
|
|
|
|
|
|
|
given example, that would be: |
|
1832
|
|
|
|
|
|
|
|
|
1833
|
|
|
|
|
|
|
$ss->{merged} = [ |
|
1834
|
|
|
|
|
|
|
[ 1, 2, 1, 3 ], # A2-A3 |
|
1835
|
|
|
|
|
|
|
[ 2, 1, 3, 2 ], # B1-C2 |
|
1836
|
|
|
|
|
|
|
]; |
|
1837
|
|
|
|
|
|
|
|
|
1838
|
|
|
|
|
|
|
When the attributes are also enabled, there is some merge information |
|
1839
|
|
|
|
|
|
|
copied directly from the cell information, but again, that stems from |
|
1840
|
|
|
|
|
|
|
code analysis and not from documentation: |
|
1841
|
|
|
|
|
|
|
|
|
1842
|
|
|
|
|
|
|
my $ss = ReadData ("merged.xlsx", attr => 1)->[1]; |
|
1843
|
|
|
|
|
|
|
foreach my $row (1 .. $ss->{maxrow}) { |
|
1844
|
|
|
|
|
|
|
foreach my $col (1 .. $ss->{maxcol}) { |
|
1845
|
|
|
|
|
|
|
my $cell = cr2cell ($col, $row); |
|
1846
|
|
|
|
|
|
|
printf "%s %-3s %d ", $cell, $ss->{$cell}, |
|
1847
|
|
|
|
|
|
|
$ss->{attr}[$col][$row]{merged}; |
|
1848
|
|
|
|
|
|
|
} |
|
1849
|
|
|
|
|
|
|
print "\n"; |
|
1850
|
|
|
|
|
|
|
} |
|
1851
|
|
|
|
|
|
|
|
|
1852
|
|
|
|
|
|
|
A1 0 B1 foo 1 C1 1 |
|
1853
|
|
|
|
|
|
|
A2 bar 1 B2 1 C2 1 |
|
1854
|
|
|
|
|
|
|
A3 1 B3 urg 0 C3 orc 0 |
|
1855
|
|
|
|
|
|
|
|
|
1856
|
|
|
|
|
|
|
In this example, there is no way to see if C<B2> is merged to C<A2> or |
|
1857
|
|
|
|
|
|
|
to C<B1> without analyzing all surrounding cells. This could as well |
|
1858
|
|
|
|
|
|
|
mean C<A2:A3>, C<B1:C1>, C<B2:C2>, as C<A2:A3>, C<B1:B2>, C<C1:C2>, as |
|
1859
|
|
|
|
|
|
|
C<A2:A3>, C<B1:C2>. |
|
1860
|
|
|
|
|
|
|
Use the L<C<merged>|/merged> entry described above to find out what |
|
1861
|
|
|
|
|
|
|
fields are merged to what other fields. |
|
1862
|
|
|
|
|
|
|
|
|
1863
|
|
|
|
|
|
|
=head1 TOOLS |
|
1864
|
|
|
|
|
|
|
|
|
1865
|
|
|
|
|
|
|
This modules comes with a few tools that perform tasks from the FAQ, like |
|
1866
|
|
|
|
|
|
|
"How do I select only column D through F from sheet 2 into a CSV file?" |
|
1867
|
|
|
|
|
|
|
|
|
1868
|
|
|
|
|
|
|
If the module was installed without the tools, you can find them here: |
|
1869
|
|
|
|
|
|
|
https://github.com/Tux/Spreadsheet-Read/tree/master/examples |
|
1870
|
|
|
|
|
|
|
|
|
1871
|
|
|
|
|
|
|
=head2 C<xlscat> |
|
1872
|
|
|
|
|
|
|
|
|
1873
|
|
|
|
|
|
|
Show (parts of) a spreadsheet in plain text, CSV, or HTML |
|
1874
|
|
|
|
|
|
|
|
|
1875
|
|
|
|
|
|
|
usage: xlscat [-s <sep>] [-L] [-n] [-A] [-u] [Selection] file.xls |
|
1876
|
|
|
|
|
|
|
[-c | -m] [-u] [Selection] file.xls |
|
1877
|
|
|
|
|
|
|
-i [-S sheets] file.xls |
|
1878
|
|
|
|
|
|
|
Generic options: |
|
1879
|
|
|
|
|
|
|
-v[#] Set verbose level (xlscat/xlsgrep) |
|
1880
|
|
|
|
|
|
|
-d[#] Set debug level (Spreadsheet::Read) |
|
1881
|
|
|
|
|
|
|
-u Use unformatted values |
|
1882
|
|
|
|
|
|
|
--noclip Do not strip empty sheets and |
|
1883
|
|
|
|
|
|
|
trailing empty rows and columns |
|
1884
|
|
|
|
|
|
|
-e <enc> Set encoding for input and output |
|
1885
|
|
|
|
|
|
|
-b <enc> Set encoding for input |
|
1886
|
|
|
|
|
|
|
-a <enc> Set encoding for output |
|
1887
|
|
|
|
|
|
|
Input CSV: |
|
1888
|
|
|
|
|
|
|
--in-sep=c Set input sep_char for CSV |
|
1889
|
|
|
|
|
|
|
Input XLS: |
|
1890
|
|
|
|
|
|
|
--dtfmt=fmt Specify the default date format to replace 'm-d-yy' |
|
1891
|
|
|
|
|
|
|
the default replacement is 'yyyy-mm-dd' |
|
1892
|
|
|
|
|
|
|
Output Text (default): |
|
1893
|
|
|
|
|
|
|
-s <sep> Use separator <sep>. Default '|', \n allowed |
|
1894
|
|
|
|
|
|
|
-L Line up the columns |
|
1895
|
|
|
|
|
|
|
-n [skip] Number lines (prefix with column number) |
|
1896
|
|
|
|
|
|
|
optionally skip <skip> (header) lines |
|
1897
|
|
|
|
|
|
|
-A Show field attributes in ANSI escapes |
|
1898
|
|
|
|
|
|
|
-h[#] Show # header lines |
|
1899
|
|
|
|
|
|
|
Output Index only: |
|
1900
|
|
|
|
|
|
|
-i Show sheet names and size only |
|
1901
|
|
|
|
|
|
|
Output CSV: |
|
1902
|
|
|
|
|
|
|
-c Output CSV, separator = ',' |
|
1903
|
|
|
|
|
|
|
-m Output CSV, separator = ';' |
|
1904
|
|
|
|
|
|
|
Output HTML: |
|
1905
|
|
|
|
|
|
|
-H Output HTML |
|
1906
|
|
|
|
|
|
|
Selection: |
|
1907
|
|
|
|
|
|
|
-S <sheets> Only print sheets <sheets>. 'all' is a valid set |
|
1908
|
|
|
|
|
|
|
Default only prints the first sheet |
|
1909
|
|
|
|
|
|
|
-R <rows> Only print rows <rows>. Default is 'all' |
|
1910
|
|
|
|
|
|
|
-C <cols> Only print columns <cols>. Default is 'all' |
|
1911
|
|
|
|
|
|
|
-F <flds> Only fields <flds> e.g. -FA3,B16 |
|
1912
|
|
|
|
|
|
|
Ordering (column numbers in result set *after* selection): |
|
1913
|
|
|
|
|
|
|
--sort=spec Sort output (e.g. --sort=3,2r,5n,1rn+2) |
|
1914
|
|
|
|
|
|
|
+# - first # lines do not sort (header) |
|
1915
|
|
|
|
|
|
|
# - order on column # lexical ascending |
|
1916
|
|
|
|
|
|
|
#n - order on column # numeric ascending |
|
1917
|
|
|
|
|
|
|
#r - order on column # lexical descending |
|
1918
|
|
|
|
|
|
|
#rn - order on column # numeric descending |
|
1919
|
|
|
|
|
|
|
|
|
1920
|
|
|
|
|
|
|
=head2 C<xlsgrep> |
|
1921
|
|
|
|
|
|
|
|
|
1922
|
|
|
|
|
|
|
Show (parts of) a spreadsheet that match a pattern in plain text, CSV, or HTML |
|
1923
|
|
|
|
|
|
|
|
|
1924
|
|
|
|
|
|
|
usage: xlsgrep [-s <sep>] [-L] [-n] [-A] [-u] [Selection] pattern file.xls |
|
1925
|
|
|
|
|
|
|
[-c | -m] [-u] [Selection] pattern file.xls |
|
1926
|
|
|
|
|
|
|
-i [-S sheets] pattern file.xls |
|
1927
|
|
|
|
|
|
|
Generic options: |
|
1928
|
|
|
|
|
|
|
-v[#] Set verbose level (xlscat/xlsgrep) |
|
1929
|
|
|
|
|
|
|
-d[#] Set debug level (Spreadsheet::Read) |
|
1930
|
|
|
|
|
|
|
-u Use unformatted values |
|
1931
|
|
|
|
|
|
|
--noclip Do not strip empty sheets and |
|
1932
|
|
|
|
|
|
|
trailing empty rows and columns |
|
1933
|
|
|
|
|
|
|
-e <enc> Set encoding for input and output |
|
1934
|
|
|
|
|
|
|
-b <enc> Set encoding for input |
|
1935
|
|
|
|
|
|
|
-a <enc> Set encoding for output |
|
1936
|
|
|
|
|
|
|
Input CSV: |
|
1937
|
|
|
|
|
|
|
--in-sep=c Set input sep_char for CSV |
|
1938
|
|
|
|
|
|
|
Input XLS: |
|
1939
|
|
|
|
|
|
|
--dtfmt=fmt Specify the default date format to replace 'm-d-yy' |
|
1940
|
|
|
|
|
|
|
the default replacement is 'yyyy-mm-dd' |
|
1941
|
|
|
|
|
|
|
Output Text (default): |
|
1942
|
|
|
|
|
|
|
-s <sep> Use separator <sep>. Default '|', \n allowed |
|
1943
|
|
|
|
|
|
|
-L Line up the columns |
|
1944
|
|
|
|
|
|
|
-n [skip] Number lines (prefix with column number) |
|
1945
|
|
|
|
|
|
|
optionally skip <skip> (header) lines |
|
1946
|
|
|
|
|
|
|
-A Show field attributes in ANSI escapes |
|
1947
|
|
|
|
|
|
|
-h[#] Show # header lines |
|
1948
|
|
|
|
|
|
|
Grep options: |
|
1949
|
|
|
|
|
|
|
-i Ignore case |
|
1950
|
|
|
|
|
|
|
-w Match whole words only |
|
1951
|
|
|
|
|
|
|
Output CSV: |
|
1952
|
|
|
|
|
|
|
-c Output CSV, separator = ',' |
|
1953
|
|
|
|
|
|
|
-m Output CSV, separator = ';' |
|
1954
|
|
|
|
|
|
|
Output HTML: |
|
1955
|
|
|
|
|
|
|
-H Output HTML |
|
1956
|
|
|
|
|
|
|
Selection: |
|
1957
|
|
|
|
|
|
|
-S <sheets> Only print sheets <sheets>. 'all' is a valid set |
|
1958
|
|
|
|
|
|
|
Default only prints the first sheet |
|
1959
|
|
|
|
|
|
|
-R <rows> Only print rows <rows>. Default is 'all' |
|
1960
|
|
|
|
|
|
|
-C <cols> Only print columns <cols>. Default is 'all' |
|
1961
|
|
|
|
|
|
|
-F <flds> Only fields <flds> e.g. -FA3,B16 |
|
1962
|
|
|
|
|
|
|
Ordering (column numbers in result set *after* selection): |
|
1963
|
|
|
|
|
|
|
--sort=spec Sort output (e.g. --sort=3,2r,5n,1rn+2) |
|
1964
|
|
|
|
|
|
|
+# - first # lines do not sort (header) |
|
1965
|
|
|
|
|
|
|
# - order on column # lexical ascending |
|
1966
|
|
|
|
|
|
|
#n - order on column # numeric ascending |
|
1967
|
|
|
|
|
|
|
#r - order on column # lexical descending |
|
1968
|
|
|
|
|
|
|
#rn - order on column # numeric descending |
|
1969
|
|
|
|
|
|
|
|
|
1970
|
|
|
|
|
|
|
=head2 C<xls2csv> |
|
1971
|
|
|
|
|
|
|
|
|
1972
|
|
|
|
|
|
|
Convert a spreadsheet to CSV. This is just a small wrapper over C<xlscat>. |
|
1973
|
|
|
|
|
|
|
|
|
1974
|
|
|
|
|
|
|
usage: xls2csv [ -o file.csv ] file.xls |
|
1975
|
|
|
|
|
|
|
|
|
1976
|
|
|
|
|
|
|
=head2 C<ss2tk> |
|
1977
|
|
|
|
|
|
|
|
|
1978
|
|
|
|
|
|
|
Show a spreadsheet in a perl/Tk spreadsheet widget |
|
1979
|
|
|
|
|
|
|
|
|
1980
|
|
|
|
|
|
|
usage: ss2tk [-w <width>] [X11 options] file.xls [<pattern>] |
|
1981
|
|
|
|
|
|
|
-w <width> use <width> as default column width (4) |
|
1982
|
|
|
|
|
|
|
|
|
1983
|
|
|
|
|
|
|
=head2 C<ssdiff> |
|
1984
|
|
|
|
|
|
|
|
|
1985
|
|
|
|
|
|
|
Show the differences between two spreadsheets. |
|
1986
|
|
|
|
|
|
|
|
|
1987
|
|
|
|
|
|
|
usage: examples/ssdiff [--verbose[=1]] file.xls file.xlsx |
|
1988
|
|
|
|
|
|
|
|
|
1989
|
|
|
|
|
|
|
=head1 TODO |
|
1990
|
|
|
|
|
|
|
|
|
1991
|
|
|
|
|
|
|
=over 4 |
|
1992
|
|
|
|
|
|
|
|
|
1993
|
|
|
|
|
|
|
=item Options |
|
1994
|
|
|
|
|
|
|
|
|
1995
|
|
|
|
|
|
|
=over 2 |
|
1996
|
|
|
|
|
|
|
|
|
1997
|
|
|
|
|
|
|
=item Module Options |
|
1998
|
|
|
|
|
|
|
|
|
1999
|
|
|
|
|
|
|
New Spreadsheet::Read options are bound to happen. I'm thinking of an |
|
2000
|
|
|
|
|
|
|
option that disables the reading of the data entirely to speed up an |
|
2001
|
|
|
|
|
|
|
index request (how many sheets/fields/columns). See C<xlscat -i>. |
|
2002
|
|
|
|
|
|
|
|
|
2003
|
|
|
|
|
|
|
=item Parser options |
|
2004
|
|
|
|
|
|
|
|
|
2005
|
|
|
|
|
|
|
Try to transparently support as many options as the encapsulated modules |
|
2006
|
|
|
|
|
|
|
support regarding (un)formatted values, (date) formats, hidden columns |
|
2007
|
|
|
|
|
|
|
rows or fields etc. These could be implemented like C<attr> above but |
|
2008
|
|
|
|
|
|
|
names C<meta>, or just be new values in the C<attr> hashes. |
|
2009
|
|
|
|
|
|
|
|
|
2010
|
|
|
|
|
|
|
=back |
|
2011
|
|
|
|
|
|
|
|
|
2012
|
|
|
|
|
|
|
=item Other parsers |
|
2013
|
|
|
|
|
|
|
|
|
2014
|
|
|
|
|
|
|
Add support for new(er) parsers for already supported formats, like |
|
2015
|
|
|
|
|
|
|
|
|
2016
|
|
|
|
|
|
|
=over 2 |
|
2017
|
|
|
|
|
|
|
|
|
2018
|
|
|
|
|
|
|
=item Data::XLSX::Parser |
|
2019
|
|
|
|
|
|
|
|
|
2020
|
|
|
|
|
|
|
Data::XLSX::Parser provides faster way to parse Microsoft Excel's .xlsx |
|
2021
|
|
|
|
|
|
|
files. The implementation of this module is highly inspired from Python's |
|
2022
|
|
|
|
|
|
|
FastXLSX library. |
|
2023
|
|
|
|
|
|
|
|
|
2024
|
|
|
|
|
|
|
This is SAX based parser, so you can parse very large XLSX file with |
|
2025
|
|
|
|
|
|
|
lower memory usage. |
|
2026
|
|
|
|
|
|
|
|
|
2027
|
|
|
|
|
|
|
=back |
|
2028
|
|
|
|
|
|
|
|
|
2029
|
|
|
|
|
|
|
=item Other spreadsheet formats |
|
2030
|
|
|
|
|
|
|
|
|
2031
|
|
|
|
|
|
|
I consider adding any spreadsheet interface that offers a usable API. |
|
2032
|
|
|
|
|
|
|
|
|
2033
|
|
|
|
|
|
|
Under investigation: |
|
2034
|
|
|
|
|
|
|
|
|
2035
|
|
|
|
|
|
|
=over 2 |
|
2036
|
|
|
|
|
|
|
|
|
2037
|
|
|
|
|
|
|
=item Gnumeric (.gnumeric) |
|
2038
|
|
|
|
|
|
|
|
|
2039
|
|
|
|
|
|
|
I have seen no existing CPAN module yet. |
|
2040
|
|
|
|
|
|
|
|
|
2041
|
|
|
|
|
|
|
It is gzip'ed XML |
|
2042
|
|
|
|
|
|
|
|
|
2043
|
|
|
|
|
|
|
=item Kspread (.ksp) |
|
2044
|
|
|
|
|
|
|
|
|
2045
|
|
|
|
|
|
|
Now knows as Calligra Sheets. |
|
2046
|
|
|
|
|
|
|
|
|
2047
|
|
|
|
|
|
|
I have seen no existing CPAN module yet. |
|
2048
|
|
|
|
|
|
|
|
|
2049
|
|
|
|
|
|
|
It is XML in ZIP |
|
2050
|
|
|
|
|
|
|
|
|
2051
|
|
|
|
|
|
|
=back |
|
2052
|
|
|
|
|
|
|
|
|
2053
|
|
|
|
|
|
|
=item Alternative parsers for existing formats |
|
2054
|
|
|
|
|
|
|
|
|
2055
|
|
|
|
|
|
|
As long as the alternative has a good reason for its existence, and the |
|
2056
|
|
|
|
|
|
|
API of that parser reasonable fits in my approach, I will consider to |
|
2057
|
|
|
|
|
|
|
implement the glue layer, or apply patches to do so as long as these |
|
2058
|
|
|
|
|
|
|
match what F<CONTRIBUTING.md> describes. |
|
2059
|
|
|
|
|
|
|
|
|
2060
|
|
|
|
|
|
|
=back |
|
2061
|
|
|
|
|
|
|
|
|
2062
|
|
|
|
|
|
|
=head1 SEE ALSO |
|
2063
|
|
|
|
|
|
|
|
|
2064
|
|
|
|
|
|
|
=over 2 |
|
2065
|
|
|
|
|
|
|
|
|
2066
|
|
|
|
|
|
|
=item Text::CSV_XS, Text::CSV_PP |
|
2067
|
|
|
|
|
|
|
|
|
2068
|
|
|
|
|
|
|
See L<Text::CSV_XS|https://metacpan.org/release/Text-CSV_XS> , |
|
2069
|
|
|
|
|
|
|
L<Text::CSV_PP|https://metacpan.org/release/Text-CSV_PP> , and |
|
2070
|
|
|
|
|
|
|
L<Text::CSV|https://metacpan.org/release/Text-CSV> documentation. |
|
2071
|
|
|
|
|
|
|
|
|
2072
|
|
|
|
|
|
|
L<Text::CSV|https://metacpan.org/release/Text-CSV> is a wrapper over Text::CSV_XS (the fast XS version) and/or |
|
2073
|
|
|
|
|
|
|
L<Text::CSV_PP|https://metacpan.org/release/Text-CSV_PP> (the pure perl version). |
|
2074
|
|
|
|
|
|
|
|
|
2075
|
|
|
|
|
|
|
=item Spreadsheet::ParseExcel |
|
2076
|
|
|
|
|
|
|
|
|
2077
|
|
|
|
|
|
|
L<Spreadsheet::ParseExcel|https://metacpan.org/release/Spreadsheet-ParseExcel> is |
|
2078
|
|
|
|
|
|
|
the best parser for old-style Microsoft Excel (.xls) files. |
|
2079
|
|
|
|
|
|
|
|
|
2080
|
|
|
|
|
|
|
=item Spreadsheet::ParseXLSX |
|
2081
|
|
|
|
|
|
|
|
|
2082
|
|
|
|
|
|
|
L<Spreadsheet::ParseXLSX|https://metacpan.org/release/Spreadsheet-ParseXLSX> is |
|
2083
|
|
|
|
|
|
|
like L<Spreadsheet::ParseExcel|https://metacpan.org/release/Spreadsheet-ParseExcel>, |
|
2084
|
|
|
|
|
|
|
but for new Microsoft Excel 2007+ files (.xlsx). They have the same API. |
|
2085
|
|
|
|
|
|
|
|
|
2086
|
|
|
|
|
|
|
This module uses L<XML::Twig|https://metacpan.org/release/XML-Twig> to parse the |
|
2087
|
|
|
|
|
|
|
internal XML. |
|
2088
|
|
|
|
|
|
|
|
|
2089
|
|
|
|
|
|
|
=item Spreadsheet::XLSX |
|
2090
|
|
|
|
|
|
|
|
|
2091
|
|
|
|
|
|
|
See L<Spreadsheet::XLSX|https://metacpan.org/release/Spreadsheet-XLSX> |
|
2092
|
|
|
|
|
|
|
documentation. |
|
2093
|
|
|
|
|
|
|
|
|
2094
|
|
|
|
|
|
|
This module is dead and deprecated. It is B<buggy and unmaintained>. I<Please> |
|
2095
|
|
|
|
|
|
|
use L<Spreadsheet::ParseXLSX|https://metacpan.org/release/Spreadsheet-ParseXLSX> |
|
2096
|
|
|
|
|
|
|
instead. |
|
2097
|
|
|
|
|
|
|
|
|
2098
|
|
|
|
|
|
|
=item Spreadsheet::ReadSXC |
|
2099
|
|
|
|
|
|
|
|
|
2100
|
|
|
|
|
|
|
L<Spreadsheet::ReadSXC|https://metacpan.org/release/Spreadsheet-ReadSXC> is a |
|
2101
|
|
|
|
|
|
|
parser for OpenOffice/LibreOffice (.sxc and .ods) spreadsheet files. |
|
2102
|
|
|
|
|
|
|
|
|
2103
|
|
|
|
|
|
|
=item Spreadsheet::BasicRead |
|
2104
|
|
|
|
|
|
|
|
|
2105
|
|
|
|
|
|
|
See L<Spreadsheet::BasicRead|https://metacpan.org/release/Spreadsheet-BasicRead> |
|
2106
|
|
|
|
|
|
|
for xlscat-like functionality (Excel only) |
|
2107
|
|
|
|
|
|
|
|
|
2108
|
|
|
|
|
|
|
=item Spreadsheet::ConvertAA |
|
2109
|
|
|
|
|
|
|
|
|
2110
|
|
|
|
|
|
|
See L<Spreadsheet::ConvertAA|https://metacpan.org/release/Spreadsheet-ConvertAA> |
|
2111
|
|
|
|
|
|
|
for an alternative set of L</cell2cr>/L</cr2cell> pair. |
|
2112
|
|
|
|
|
|
|
|
|
2113
|
|
|
|
|
|
|
=item Spreadsheet::Perl |
|
2114
|
|
|
|
|
|
|
|
|
2115
|
|
|
|
|
|
|
L<Spreadsheet::Perl|https://metacpan.org/release/Spreadsheet-Perl> offers a Pure |
|
2116
|
|
|
|
|
|
|
Perl implementation of a spreadsheet engine. Users that want this format to be |
|
2117
|
|
|
|
|
|
|
supported in Spreadsheet::Read are hereby motivated to offer patches. It is |
|
2118
|
|
|
|
|
|
|
not high on my TODO-list. |
|
2119
|
|
|
|
|
|
|
|
|
2120
|
|
|
|
|
|
|
=item Spreadsheet::CSV |
|
2121
|
|
|
|
|
|
|
|
|
2122
|
|
|
|
|
|
|
L<Spreadsheet::CSV|https://metacpan.org/release/Spreadsheet-CSV> offers the |
|
2123
|
|
|
|
|
|
|
interesting approach of seeing all supported spreadsheet formats as if it were |
|
2124
|
|
|
|
|
|
|
CSV, mimicking the L<Text::CSV_XS|https://metacpan.org/release/Text-CSV_XS> |
|
2125
|
|
|
|
|
|
|
interface. |
|
2126
|
|
|
|
|
|
|
|
|
2127
|
|
|
|
|
|
|
=item xls2csv |
|
2128
|
|
|
|
|
|
|
|
|
2129
|
|
|
|
|
|
|
L<xls2csv|https://metacpan.org/release/xls2csv> offers an alternative for my |
|
2130
|
|
|
|
|
|
|
C<xlscat -c>, in the xls2csv tool, but this tool focuses on character encoding |
|
2131
|
|
|
|
|
|
|
transparency, and requires some other modules. |
|
2132
|
|
|
|
|
|
|
|
|
2133
|
|
|
|
|
|
|
=back |
|
2134
|
|
|
|
|
|
|
|
|
2135
|
|
|
|
|
|
|
=head1 AUTHOR |
|
2136
|
|
|
|
|
|
|
|
|
2137
|
|
|
|
|
|
|
H.Merijn Brand, <h.m.brand@xs4all.nl> |
|
2138
|
|
|
|
|
|
|
|
|
2139
|
|
|
|
|
|
|
=head1 COPYRIGHT AND LICENSE |
|
2140
|
|
|
|
|
|
|
|
|
2141
|
|
|
|
|
|
|
Copyright (C) 2005-2019 H.Merijn Brand |
|
2142
|
|
|
|
|
|
|
|
|
2143
|
|
|
|
|
|
|
This library is free software; you can redistribute it and/or modify |
|
2144
|
|
|
|
|
|
|
it under the same terms as Perl itself. |
|
2145
|
|
|
|
|
|
|
|
|
2146
|
|
|
|
|
|
|
=cut |