line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package Text::vFile::asData; |
2
|
4
|
|
|
4
|
|
60545
|
use strict; |
|
4
|
|
|
|
|
10
|
|
|
4
|
|
|
|
|
172
|
|
3
|
4
|
|
|
4
|
|
23
|
use warnings; |
|
4
|
|
|
|
|
10
|
|
|
4
|
|
|
|
|
156
|
|
4
|
4
|
|
|
4
|
|
40
|
no warnings 'uninitialized'; |
|
4
|
|
|
|
|
10
|
|
|
4
|
|
|
|
|
177
|
|
5
|
4
|
|
|
4
|
|
22
|
use base qw( Class::Accessor::Chained::Fast ); |
|
4
|
|
|
|
|
6
|
|
|
4
|
|
|
|
|
4234
|
|
6
|
|
|
|
|
|
|
__PACKAGE__->mk_accessors(qw( preserve_params )); |
7
|
|
|
|
|
|
|
our $VERSION = '0.08'; |
8
|
|
|
|
|
|
|
|
9
|
|
|
|
|
|
|
=head1 NAME |
10
|
|
|
|
|
|
|
|
11
|
|
|
|
|
|
|
Text::vFile::asData - parse vFile formatted files into data structures |
12
|
|
|
|
|
|
|
|
13
|
|
|
|
|
|
|
=head1 SYNOPSIS |
14
|
|
|
|
|
|
|
|
15
|
|
|
|
|
|
|
use Text::vFile::asData; |
16
|
|
|
|
|
|
|
open my $fh, "foo.ics" |
17
|
|
|
|
|
|
|
or die "couldn't open ics: $!"; |
18
|
|
|
|
|
|
|
my $data = Text::vFile::asData->new->parse( $fh ); |
19
|
|
|
|
|
|
|
|
20
|
|
|
|
|
|
|
=head1 DESCRIPTION |
21
|
|
|
|
|
|
|
|
22
|
|
|
|
|
|
|
Text::vFile::asData reads vFile format files, such as vCard (RFC 2426) and |
23
|
|
|
|
|
|
|
vCalendar (RFC 2445). |
24
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
=cut |
26
|
|
|
|
|
|
|
|
27
|
|
|
|
|
|
|
sub _unwrap_lines { |
28
|
116
|
|
|
116
|
|
1035
|
my $self = shift; |
29
|
116
|
|
|
|
|
147
|
my @lines; |
30
|
116
|
|
|
|
|
264
|
for (@_) { |
31
|
2017
|
|
|
|
|
2528
|
my $line = $_; # $_ may be readonly |
32
|
2017
|
|
|
|
|
5416
|
$line =~ s{[\r\n]+$}{}; # lines SHOULD end CRLF |
33
|
2017
|
100
|
|
|
|
5348
|
if ($line =~ /^[ \t](.*)/) { # Continuation line (RFC Sect. 4.1) |
34
|
717
|
50
|
|
|
|
1339
|
die "Continuation line, but no preceding line" unless @lines; |
35
|
717
|
|
|
|
|
1606
|
$lines[-1] .= $1; |
36
|
717
|
|
|
|
|
1174
|
next; |
37
|
|
|
|
|
|
|
} |
38
|
1300
|
|
|
|
|
2465
|
push @lines, $line; |
39
|
|
|
|
|
|
|
} |
40
|
116
|
|
|
|
|
734
|
return @lines; |
41
|
|
|
|
|
|
|
} |
42
|
|
|
|
|
|
|
|
43
|
|
|
|
|
|
|
sub parse { |
44
|
50
|
|
|
50
|
0
|
9565
|
my $self = shift; |
45
|
50
|
|
|
|
|
103
|
my $fh = shift; |
46
|
50
|
|
|
|
|
3473
|
return $self->parse_lines( <$fh> ); |
47
|
|
|
|
|
|
|
} |
48
|
|
|
|
|
|
|
|
49
|
|
|
|
|
|
|
# like Text::ParseWords' parse_line, only C-style so the regex engine doesn't |
50
|
|
|
|
|
|
|
# blow its stack, and it's also got a $limit like split |
51
|
|
|
|
|
|
|
|
52
|
|
|
|
|
|
|
# this only took a trainride, so I'm pretty sure there are lurking |
53
|
|
|
|
|
|
|
# corner cases - when I get a tuit I'll take the Text::ParseWords |
54
|
|
|
|
|
|
|
# tests and run them through it |
55
|
|
|
|
|
|
|
|
56
|
|
|
|
|
|
|
sub parse_line { |
57
|
1938
|
|
|
1938
|
0
|
11307
|
my ($delim, $keep, $text, $limit) = @_; |
58
|
|
|
|
|
|
|
|
59
|
1938
|
|
|
|
|
1905
|
my ($current, @parts); |
60
|
0
|
|
|
|
|
0
|
my ($quote, $escaped); |
61
|
1938
|
|
|
|
|
4085
|
while (length $text) { |
62
|
21417
|
50
|
|
|
|
45329
|
if ($text =~ s{^(\\)}{}) { |
63
|
0
|
0
|
0
|
|
|
0
|
$current .= $1 if $escaped || $keep; |
64
|
0
|
|
|
|
|
0
|
$escaped = !$escaped; |
65
|
0
|
|
|
|
|
0
|
next; |
66
|
|
|
|
|
|
|
} |
67
|
21417
|
100
|
66
|
|
|
153943
|
if (!$quote && !$escaped && $text =~ s{^$delim}{}) { |
|
|
|
100
|
|
|
|
|
68
|
1360
|
|
|
|
|
2526
|
push @parts, $current; |
69
|
1360
|
|
|
|
|
1460
|
$current = undef; |
70
|
1360
|
100
|
66
|
|
|
5299
|
if (defined $limit && @parts == $limit -1) { |
71
|
963
|
|
|
|
|
3607
|
return @parts, $text; |
72
|
|
|
|
|
|
|
} |
73
|
|
|
|
|
|
|
} |
74
|
|
|
|
|
|
|
else { |
75
|
|
|
|
|
|
|
# pull the character off to take a looksee |
76
|
20057
|
|
|
|
|
57710
|
$text =~ s{(.)}{}; |
77
|
20057
|
|
|
|
|
33516
|
my $char = $1; |
78
|
20057
|
100
|
66
|
|
|
47046
|
if ($char eq '"' && !$escaped) { |
79
|
|
|
|
|
|
|
# either it's defined and matches, in which case we |
80
|
|
|
|
|
|
|
# clear the quote variable, or it's undefined which |
81
|
|
|
|
|
|
|
# makes this quote an opening quote |
82
|
28
|
|
|
|
|
39
|
$quote = !$quote; |
83
|
28
|
100
|
|
|
|
61
|
$current .= $char if $keep; |
84
|
|
|
|
|
|
|
} |
85
|
|
|
|
|
|
|
else { |
86
|
20029
|
|
|
|
|
30851
|
$current .= $char; |
87
|
|
|
|
|
|
|
} |
88
|
|
|
|
|
|
|
} |
89
|
20454
|
|
|
|
|
49764
|
$escaped = 0; |
90
|
|
|
|
|
|
|
} |
91
|
|
|
|
|
|
|
|
92
|
975
|
|
|
|
|
3331
|
return @parts, $current; |
93
|
|
|
|
|
|
|
} |
94
|
|
|
|
|
|
|
|
95
|
|
|
|
|
|
|
sub parse_lines { |
96
|
115
|
|
|
115
|
0
|
24047
|
my $self = shift; |
97
|
|
|
|
|
|
|
|
98
|
115
|
|
|
|
|
165
|
my @path; |
99
|
|
|
|
|
|
|
my $current; |
100
|
115
|
|
|
|
|
381
|
for ($self->_unwrap_lines( @_ )) { |
101
|
|
|
|
|
|
|
# Ignore leading or trailing blank lines at the top/bottom of the |
102
|
|
|
|
|
|
|
# input. Not sure about completely blank lines within the input |
103
|
1299
|
100
|
100
|
|
|
3806
|
next if scalar @path == 0 and $_ =~ /^\s*$/; |
104
|
|
|
|
|
|
|
|
105
|
1294
|
100
|
|
|
|
3917
|
if (/^BEGIN:(.*)/i) { |
106
|
165
|
|
|
|
|
251
|
push @path, $current; |
107
|
165
|
|
|
|
|
1305
|
$current = { type => $1 }; |
108
|
165
|
|
|
|
|
209
|
push @{ $path[-1]{objects} }, $current; |
|
165
|
|
|
|
|
524
|
|
109
|
165
|
|
|
|
|
354
|
next; |
110
|
|
|
|
|
|
|
} |
111
|
1129
|
100
|
|
|
|
2724
|
if (/^END:(.*)/i) { |
112
|
164
|
100
|
|
|
|
741
|
die "END $1 in $current->{type}" |
113
|
|
|
|
|
|
|
unless lc $current->{type} eq lc $1; |
114
|
163
|
|
|
|
|
322
|
$current = pop @path; |
115
|
163
|
|
|
|
|
398
|
next; |
116
|
|
|
|
|
|
|
} |
117
|
|
|
|
|
|
|
|
118
|
|
|
|
|
|
|
# we'd use Text::ParseWords here, but it likes to segfault. |
119
|
965
|
|
|
|
|
1941
|
my ($name, $value) = parse_line( ':', 1, $_, 2); |
120
|
965
|
100
|
|
|
|
2365
|
$value = '' unless defined $value; |
121
|
965
|
|
|
|
|
1906
|
my @params = parse_line( ';', 0, $name ); |
122
|
965
|
|
|
|
|
2148
|
$name = shift @params; |
123
|
|
|
|
|
|
|
|
124
|
965
|
|
|
|
|
4029
|
$value = { value => $value }; |
125
|
|
|
|
|
|
|
|
126
|
965
|
|
|
|
|
1818
|
foreach my $param (@params) { |
127
|
389
|
|
|
|
|
1110
|
my ($p_name, $p_value) = split /=/, $param; |
128
|
389
|
100
|
|
|
|
1334
|
push @{ $value->{params} }, { $p_name => $p_value } |
|
197
|
|
|
|
|
1748
|
|
129
|
|
|
|
|
|
|
if $self->preserve_params; |
130
|
389
|
|
|
|
|
2848
|
$value->{param}{ $p_name } = $p_value; |
131
|
|
|
|
|
|
|
} |
132
|
965
|
|
|
|
|
1202
|
push @{ $current->{properties}{ $name } }, $value; |
|
965
|
|
|
|
|
4149
|
|
133
|
|
|
|
|
|
|
} |
134
|
|
|
|
|
|
|
|
135
|
|
|
|
|
|
|
# something did a BEGIN but no END - TODO, unwind this nicely as |
136
|
|
|
|
|
|
|
# it may be more than one level |
137
|
114
|
100
|
|
|
|
459
|
die "BEGIN $current->{type} without matching END" |
138
|
|
|
|
|
|
|
if @path; |
139
|
|
|
|
|
|
|
|
140
|
113
|
|
|
|
|
723
|
return $current; |
141
|
|
|
|
|
|
|
} |
142
|
|
|
|
|
|
|
|
143
|
|
|
|
|
|
|
# this might not strictly comply |
144
|
|
|
|
|
|
|
sub generate_lines { |
145
|
126
|
|
|
126
|
0
|
32778
|
my $self = shift; |
146
|
126
|
|
|
|
|
172
|
my $this = shift; |
147
|
|
|
|
|
|
|
|
148
|
126
|
|
|
|
|
165
|
my @lines; |
149
|
|
|
|
|
|
|
# XXX all the existence checks are to prevent auto-vivification |
150
|
|
|
|
|
|
|
# breaking if_diff tests - do we mind, or should the fields have been |
151
|
|
|
|
|
|
|
# there anyway? |
152
|
|
|
|
|
|
|
|
153
|
126
|
100
|
|
|
|
433
|
push @lines, "BEGIN:$this->{type}" if exists $this->{type}; |
154
|
126
|
100
|
|
|
|
304
|
if (exists $this->{properties}) { |
155
|
78
|
|
|
|
|
142
|
while (my ($name, $v) = each %{ $this->{properties} } ) { |
|
484
|
|
|
|
|
1705
|
|
156
|
406
|
|
|
|
|
635
|
for my $value (@$v) { |
157
|
|
|
|
|
|
|
# XXX so we're taking params in preference to param, |
158
|
|
|
|
|
|
|
# let's be sure to document that when we document this |
159
|
|
|
|
|
|
|
# method |
160
|
498
|
|
|
|
|
583
|
my $param = join ';', '', map { |
161
|
468
|
100
|
|
|
|
2105
|
my $hash = $_; |
162
|
178
|
100
|
|
|
|
863
|
map { |
163
|
498
|
|
|
|
|
1378
|
"$_" . (defined $hash->{$_} ? "=" . $hash->{$_} : "") |
164
|
|
|
|
|
|
|
} keys %$hash |
165
|
468
|
|
|
|
|
480
|
} @{ $value->{params} || [ $value->{param} ] }; |
166
|
468
|
|
|
|
|
1292
|
my $line = "$name$param:$value->{value}"; |
167
|
|
|
|
|
|
|
# wrapping, but done ugly |
168
|
468
|
|
|
|
|
1858
|
my @chunks = $line =~ m/(.{1,72})/g; |
169
|
468
|
|
|
|
|
749
|
push @lines, shift @chunks; |
170
|
468
|
|
|
|
|
1374
|
push @lines, map { " $_" } @chunks; |
|
60
|
|
|
|
|
240
|
|
171
|
|
|
|
|
|
|
} |
172
|
|
|
|
|
|
|
} |
173
|
|
|
|
|
|
|
} |
174
|
|
|
|
|
|
|
|
175
|
126
|
100
|
|
|
|
322
|
if (exists $this->{objects}) { |
176
|
58
|
|
|
|
|
83
|
push @lines, $self->generate_lines( $_ ) for @{ $this->{objects} } |
|
58
|
|
|
|
|
255
|
|
177
|
|
|
|
|
|
|
} |
178
|
126
|
100
|
|
|
|
385
|
push @lines, "END:$this->{type}" if exists $this->{type}; |
179
|
126
|
|
|
|
|
823
|
return @lines; |
180
|
|
|
|
|
|
|
} |
181
|
|
|
|
|
|
|
|
182
|
|
|
|
|
|
|
|
183
|
|
|
|
|
|
|
1; |
184
|
|
|
|
|
|
|
__END__ |