line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
|
2
|
|
|
|
|
|
|
=head1 NAME |
3
|
|
|
|
|
|
|
|
4
|
|
|
|
|
|
|
NetSDS::Util::FileImport - import table structure from file |
5
|
|
|
|
|
|
|
|
6
|
|
|
|
|
|
|
=head1 SYNOPSIS |
7
|
|
|
|
|
|
|
|
8
|
|
|
|
|
|
|
use NetSDS::Util::FileImport |
9
|
|
|
|
|
|
|
|
10
|
|
|
|
|
|
|
=head1 DESCRIPTION |
11
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
=cut |
13
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
package NetSDS::Util::FileImport; |
15
|
|
|
|
|
|
|
|
16
|
2
|
|
|
2
|
|
3679
|
use 5.8.0; |
|
2
|
|
|
|
|
5
|
|
|
2
|
|
|
|
|
92
|
|
17
|
2
|
|
|
2
|
|
7
|
use strict; |
|
2
|
|
|
|
|
2
|
|
|
2
|
|
|
|
|
52
|
|
18
|
2
|
|
|
2
|
|
45
|
use warnings; |
|
2
|
|
|
|
|
3
|
|
|
2
|
|
|
|
|
51
|
|
19
|
|
|
|
|
|
|
|
20
|
2
|
|
|
2
|
|
1312
|
use File::MMagic; # Determine MIME type of file |
|
2
|
|
|
|
|
14709
|
|
|
2
|
|
|
|
|
115
|
|
21
|
2
|
|
|
2
|
|
1359
|
use Spreadsheet::Read; # Parse spreadsheet files |
|
2
|
|
|
|
|
27907
|
|
|
2
|
|
|
|
|
158
|
|
22
|
|
|
|
|
|
|
|
23
|
2
|
|
|
2
|
|
15
|
use base 'Exporter'; |
|
2
|
|
|
|
|
13
|
|
|
2
|
|
|
|
|
170
|
|
24
|
|
|
|
|
|
|
|
25
|
2
|
|
|
2
|
|
10
|
use version; our $VERSION = "1.044"; |
|
2
|
|
|
|
|
3
|
|
|
2
|
|
|
|
|
21
|
|
26
|
|
|
|
|
|
|
|
27
|
|
|
|
|
|
|
our @EXPORT = qw( |
28
|
|
|
|
|
|
|
import_table |
29
|
|
|
|
|
|
|
); |
30
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
# TODO |
32
|
2
|
|
|
2
|
|
170
|
use constant PREVIEW_LIMIT => 5; # Number of records to process for previews |
|
2
|
|
|
|
|
4
|
|
|
2
|
|
|
|
|
2115
|
|
33
|
|
|
|
|
|
|
|
34
|
|
|
|
|
|
|
=head1 CLASS API |
35
|
|
|
|
|
|
|
|
36
|
|
|
|
|
|
|
=over |
37
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
=item B - import table data from file |
39
|
|
|
|
|
|
|
|
40
|
|
|
|
|
|
|
takes $content of a file, $pre_parse (true or false it means: return all table or only 5 first rows |
41
|
|
|
|
|
|
|
|
42
|
|
|
|
|
|
|
params it could be |
43
|
|
|
|
|
|
|
patterns => { qr#name#i => { qr#last#i => 'last_name', qr#first#i => 'first_name' } } |
44
|
|
|
|
|
|
|
separator => could be ,;\t: |
45
|
|
|
|
|
|
|
fields => [ email last_name ] |
46
|
|
|
|
|
|
|
substitute => { E-mail => email, Last Name => last_name, .. } |
47
|
|
|
|
|
|
|
|
48
|
|
|
|
|
|
|
Depends of a params parse would be different |
49
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
Returns a structure like this |
51
|
|
|
|
|
|
|
[ { last_name => undef, first_name => yana, ... }, { last_name => kornienko, first_name => test, ... } .. ] |
52
|
|
|
|
|
|
|
|
53
|
|
|
|
|
|
|
=back |
54
|
|
|
|
|
|
|
|
55
|
|
|
|
|
|
|
=cut |
56
|
|
|
|
|
|
|
|
57
|
|
|
|
|
|
|
sub import_table($;$$) { |
58
|
0
|
|
|
0
|
1
|
|
my ( $file_name, $params, $pre_parse ) = @_; |
59
|
0
|
|
|
|
|
|
my ( $separator, $data, $rows ) = ( $params->{'separator'}, [], [] ); |
60
|
0
|
0
|
|
|
|
|
return "Can't find file [$file_name]." unless -e $file_name; |
61
|
|
|
|
|
|
|
# [ { 'last_name' => 'my name', 'First Name' => 'my first name' ... }, {'last_name' => undef, 'First Name' => 'test_name' ... } ... ] |
62
|
|
|
|
|
|
|
|
63
|
0
|
|
|
|
|
|
my @title = (); |
64
|
0
|
0
|
|
|
|
|
if ( File::MMagic->new->checktype_filename($file_name) eq 'text/plain' ) { |
65
|
|
|
|
|
|
|
|
66
|
0
|
0
|
|
|
|
|
open my $FILE, '<', $file_name or return $!; |
67
|
0
|
|
|
|
|
|
my @lines = <$FILE>; |
68
|
0
|
|
|
|
|
|
chomp for @lines; |
69
|
0
|
|
|
|
|
|
close $FILE; |
70
|
|
|
|
|
|
|
|
71
|
0
|
|
|
|
|
|
$lines[0] =~ s/^["']|["']$//; |
72
|
0
|
|
0
|
|
|
|
$separator ||= ( $lines[0] =~ m![\w\s"]+?([,;:\t])! )[0]; |
73
|
0
|
0
|
|
|
|
|
return "Parse error while parsing csv file" unless $separator; |
74
|
|
|
|
|
|
|
|
75
|
0
|
|
|
|
|
|
$lines[0] =~ s/["']$//; |
76
|
0
|
|
|
|
|
|
@title = split /["']{0,1}$separator["']{0,1}/, $lines[0]; |
77
|
|
|
|
|
|
|
|
78
|
0
|
0
|
0
|
|
|
|
my @rows = ( ( $pre_parse and @lines > PREVIEW_LIMIT ) ? @lines[ 1 .. PREVIEW_LIMIT + 1 ] : @lines ); |
79
|
0
|
0
|
0
|
|
|
|
$rows = [ map { [ split /["']*$separator["']*/, $_ ] } grep { ( $_ and $_ =~ s/^['"]// ) or $_ } @rows ]; |
|
0
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
80
|
|
|
|
|
|
|
|
81
|
|
|
|
|
|
|
} else { |
82
|
|
|
|
|
|
|
|
83
|
0
|
|
|
|
|
|
my $struct = ReadData($file_name); |
84
|
0
|
0
|
|
|
|
|
return "Parse error while parsing data xls file" unless $struct; |
85
|
|
|
|
|
|
|
|
86
|
0
|
|
|
|
|
|
my @content = @{ $struct->[1]{'cell'} }; |
|
0
|
|
|
|
|
|
|
87
|
0
|
|
|
|
|
|
@title = map { $content[$_]->[1] } 1 .. $#content; |
|
0
|
|
|
|
|
|
|
88
|
0
|
0
|
0
|
|
|
|
my $count = ( ( $pre_parse and @{ $content[1] } > ( PREVIEW_LIMIT + 2 ) ) ? PREVIEW_LIMIT : scalar @{ $content[1] } - 1 ); |
|
0
|
|
|
|
|
|
|
89
|
|
|
|
|
|
|
|
90
|
0
|
|
|
|
|
|
for my $i ( 2 .. $count ) { |
91
|
0
|
|
|
|
|
|
push @$rows, [ map { $content[$_]->[$i] } 1 .. @title ]; |
|
0
|
|
|
|
|
|
|
92
|
|
|
|
|
|
|
} |
93
|
|
|
|
|
|
|
} |
94
|
|
|
|
|
|
|
|
95
|
0
|
|
|
|
|
|
my @original_fields = @title; |
96
|
0
|
0
|
|
|
|
|
if ( $params->{'patterns'} ) { |
|
|
0
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
97
|
0
|
|
|
|
|
|
_order_data_by_patterns( \@title, $params->{'patterns'} ); |
98
|
|
|
|
|
|
|
} elsif ( $params->{'fields'} ) { #return only specific fields that has the same name |
99
|
0
|
|
|
|
|
|
_order_data_by_fields( $data, \@title, $params->{'fields'}, $rows ); |
100
|
0
|
|
|
|
|
|
return $data; |
101
|
|
|
|
|
|
|
} elsif ( $params->{'substitute'} ) { #return only specific fields the names of which has been changed |
102
|
0
|
|
|
|
|
|
_order_data_with_substitute( $data, \@title, $params->{'substitute'}, $rows ); |
103
|
0
|
|
|
|
|
|
return $data; |
104
|
|
|
|
|
|
|
} |
105
|
|
|
|
|
|
|
|
106
|
0
|
|
|
|
|
|
for my $row (@$rows) { |
107
|
0
|
|
|
|
|
|
push @$data, { map { ( $title[$_] => $row->[$_] ) } 0 .. $#title }; |
|
0
|
|
|
|
|
|
|
108
|
|
|
|
|
|
|
} |
109
|
|
|
|
|
|
|
|
110
|
0
|
0
|
|
|
|
|
return wantarray ? ( $data, \@original_fields ) : $data; |
111
|
|
|
|
|
|
|
} ## end sub import_table($;$$) |
112
|
|
|
|
|
|
|
|
113
|
|
|
|
|
|
|
sub _order_data_by_patterns($$) { |
114
|
0
|
|
|
0
|
|
|
my ( $title, $patterns ) = @_; |
115
|
|
|
|
|
|
|
|
116
|
0
|
|
|
|
|
|
for ( my $i = 0 ; $title->[$i] ; $i++ ) { #TODO multi |
117
|
0
|
|
|
|
|
|
for my $pattern ( keys %$patterns ) { |
118
|
0
|
0
|
|
|
|
|
if ( $title->[$i] =~ $pattern ) { |
119
|
0
|
0
|
|
|
|
|
if ( ref $patterns->{$pattern} ) { |
120
|
0
|
|
|
|
|
|
for my $subpattern ( keys %{ $patterns->{$pattern} } ) { |
|
0
|
|
|
|
|
|
|
121
|
0
|
0
|
|
|
|
|
if ( $title->[$i] =~ $subpattern ) { |
122
|
0
|
|
|
|
|
|
$title->[$i] = $patterns->{$pattern}{$subpattern}; |
123
|
0
|
|
|
|
|
|
last; |
124
|
|
|
|
|
|
|
} |
125
|
|
|
|
|
|
|
} |
126
|
|
|
|
|
|
|
} else { |
127
|
0
|
|
|
|
|
|
$title->[$i] = $patterns->{$pattern}; |
128
|
|
|
|
|
|
|
} |
129
|
|
|
|
|
|
|
} |
130
|
|
|
|
|
|
|
} |
131
|
|
|
|
|
|
|
} |
132
|
|
|
|
|
|
|
} ## end sub _order_data_by_patterns($$) |
133
|
|
|
|
|
|
|
|
134
|
|
|
|
|
|
|
sub _order_data_by_fields($$$$) { |
135
|
0
|
|
|
0
|
|
|
my ( $data, $title, $fields, $rows ) = @_; |
136
|
0
|
|
|
|
|
|
my @res = (); |
137
|
|
|
|
|
|
|
|
138
|
0
|
|
|
|
|
|
for my $field (@$fields) { |
139
|
0
|
|
|
|
|
|
for ( my $i = 0 ; $title->[$i] ; $i++ ) { |
140
|
0
|
0
|
|
|
|
|
if ( $title->[$i] eq $field ) { |
141
|
0
|
|
|
|
|
|
push @res, $i; |
142
|
0
|
|
|
|
|
|
last; |
143
|
|
|
|
|
|
|
} |
144
|
|
|
|
|
|
|
} |
145
|
|
|
|
|
|
|
} |
146
|
|
|
|
|
|
|
|
147
|
0
|
|
|
|
|
|
for my $row (@$rows) { |
148
|
0
|
|
|
|
|
|
push @$data, { map { ( $title->[$_] => $row->[$_] ) } @res }; |
|
0
|
|
|
|
|
|
|
149
|
|
|
|
|
|
|
} |
150
|
|
|
|
|
|
|
} |
151
|
|
|
|
|
|
|
|
152
|
|
|
|
|
|
|
sub _order_data_with_substitute($$$$) { |
153
|
0
|
|
|
0
|
|
|
my ( $data, $title, $substitute, $rows ) = @_; |
154
|
0
|
|
|
|
|
|
my $pattern = join '|', map { quotemeta $_ } keys %$substitute; |
|
0
|
|
|
|
|
|
|
155
|
|
|
|
|
|
|
|
156
|
0
|
|
|
|
|
|
$_ =~ s/^($pattern)$/$substitute->{$1}/ for @$title; |
157
|
|
|
|
|
|
|
|
158
|
0
|
|
|
|
|
|
_order_data_by_fields( $data, $title, [ values %$substitute ], $rows ); |
159
|
|
|
|
|
|
|
} |
160
|
|
|
|
|
|
|
|
161
|
|
|
|
|
|
|
1; |