line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package Catmandu::Fix::pica_map; |
2
|
|
|
|
|
|
|
|
3
|
|
|
|
|
|
|
our $VERSION = '0.16'; |
4
|
|
|
|
|
|
|
|
5
|
1
|
|
|
1
|
|
846
|
use Catmandu::Sane; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
8
|
|
6
|
1
|
|
|
1
|
|
190
|
use Moo; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
7
|
|
7
|
|
|
|
|
|
|
|
8
|
1
|
|
|
1
|
|
934
|
use Catmandu::Fix::Has; |
|
1
|
|
|
|
|
1733
|
|
|
1
|
|
|
|
|
5
|
|
9
|
1
|
|
|
1
|
|
1277
|
use PICA::Path; |
|
1
|
|
|
|
|
1210
|
|
|
1
|
|
|
|
|
1504
|
|
10
|
|
|
|
|
|
|
|
11
|
|
|
|
|
|
|
has pica_path => ( fix_arg => 1 ); |
12
|
|
|
|
|
|
|
has path => ( fix_arg => 1 ); |
13
|
|
|
|
|
|
|
has record => ( fix_opt => 1 ); |
14
|
|
|
|
|
|
|
has split => ( fix_opt => 1 ); |
15
|
|
|
|
|
|
|
has join => ( fix_opt => 1 ); |
16
|
|
|
|
|
|
|
has value => ( fix_opt => 1 ); |
17
|
|
|
|
|
|
|
has pluck => ( fix_opt => 1 ); |
18
|
|
|
|
|
|
|
|
19
|
|
|
|
|
|
|
sub emit { |
20
|
0
|
|
|
0
|
0
|
|
my ( $self, $fixer ) = @_; |
21
|
0
|
|
|
|
|
|
my $path = $fixer->split_path( $self->path ); |
22
|
0
|
|
0
|
|
|
|
my $record_key = $fixer->emit_string( $self->record // 'record' ); |
23
|
0
|
|
0
|
|
|
|
my $join_char = $fixer->emit_string( $self->join // '' ); |
24
|
0
|
|
|
|
|
|
my $pica_path = PICA::Path->new($self->pica_path); |
25
|
|
|
|
|
|
|
|
26
|
0
|
|
|
|
|
|
my ($field_regex, $occurrence_regex, $subfield_regex, $from, $length) = @$pica_path; |
27
|
|
|
|
|
|
|
|
28
|
0
|
|
|
|
|
|
my $var = $fixer->var; |
29
|
0
|
|
|
|
|
|
my $vals = $fixer->generate_var; |
30
|
0
|
|
|
|
|
|
my $perl = $fixer->emit_declare_vars( $vals, '[]' ); |
31
|
|
|
|
|
|
|
|
32
|
0
|
|
|
|
|
|
my $field_regex_var = $fixer->generate_var; |
33
|
0
|
|
|
|
|
|
$perl .= $fixer->emit_declare_vars( $field_regex_var, "qr{$field_regex}" ); |
34
|
|
|
|
|
|
|
|
35
|
0
|
|
|
|
|
|
my $subfield_regex_var = $fixer->generate_var; |
36
|
0
|
|
|
|
|
|
$perl .= $fixer->emit_declare_vars( $subfield_regex_var, "qr{$subfield_regex}" ); |
37
|
|
|
|
|
|
|
|
38
|
0
|
|
|
|
|
|
my $occurrence_regex_var; |
39
|
0
|
0
|
|
|
|
|
if (defined $occurrence_regex) { |
40
|
0
|
|
|
|
|
|
$occurrence_regex_var = $fixer->generate_var; |
41
|
0
|
|
|
|
|
|
$perl .= $fixer->emit_declare_vars( $occurrence_regex_var, "qr{$occurrence_regex}" ); |
42
|
|
|
|
|
|
|
} |
43
|
|
|
|
|
|
|
|
44
|
|
|
|
|
|
|
$perl .= $fixer->emit_foreach( |
45
|
|
|
|
|
|
|
"${var}->{${record_key}}", |
46
|
|
|
|
|
|
|
sub { |
47
|
0
|
|
|
0
|
|
|
my $var = shift; |
48
|
0
|
|
|
|
|
|
my $v = $fixer->generate_var; |
49
|
0
|
|
|
|
|
|
my $perl = ""; |
50
|
|
|
|
|
|
|
|
51
|
0
|
|
|
|
|
|
$perl .= "next if ${var}->[0] !~ ${field_regex_var};"; |
52
|
|
|
|
|
|
|
|
53
|
0
|
0
|
|
|
|
|
if (defined $occurrence_regex) { |
54
|
0
|
|
|
|
|
|
$perl .= "next if (!defined ${var}->[1] || ${var}->[1] !~ ${occurrence_regex_var});"; |
55
|
|
|
|
|
|
|
} |
56
|
|
|
|
|
|
|
|
57
|
0
|
0
|
|
|
|
|
if ( $self->value ) { |
58
|
0
|
|
|
|
|
|
$perl .= $fixer->emit_declare_vars( $v, |
59
|
|
|
|
|
|
|
$fixer->emit_string( $self->value ) ); |
60
|
|
|
|
|
|
|
} |
61
|
|
|
|
|
|
|
else { |
62
|
0
|
|
|
|
|
|
my $i = $fixer->generate_var; |
63
|
|
|
|
|
|
|
my $add_subfields = sub { |
64
|
0
|
|
|
|
|
|
my $start = shift; |
65
|
0
|
0
|
|
|
|
|
if ($self->pluck) { |
66
|
|
|
|
|
|
|
# Treat the subfield_regex as a hash index |
67
|
0
|
|
|
|
|
|
my $pluck = $fixer->generate_var; |
68
|
|
|
|
|
|
|
return |
69
|
0
|
|
|
|
|
|
"my ${pluck} = {};" . |
70
|
|
|
|
|
|
|
"for (my ${i} = ${start}; ${i} < \@{${var}}; ${i} += 2) {". |
71
|
|
|
|
|
|
|
"push(\@{ ${pluck}->{ ${var}->[${i}] } }, ${var}->[${i} + 1]);" . |
72
|
|
|
|
|
|
|
"}" . |
73
|
|
|
|
|
|
|
"for my ${i} (split('','${subfield_regex}')) { " . |
74
|
|
|
|
|
|
|
"push(\@{${v}}, \@{ ${pluck}->{${i}} }) if exists ${pluck}->{${i}};" . |
75
|
|
|
|
|
|
|
"}"; |
76
|
|
|
|
|
|
|
} |
77
|
|
|
|
|
|
|
else { |
78
|
|
|
|
|
|
|
# Treat the subfield_regex as regex that needs to match the subfields |
79
|
|
|
|
|
|
|
return |
80
|
0
|
|
|
|
|
|
"for (my ${i} = ${start}; ${i} < \@{${var}}; ${i} += 2) {". |
81
|
|
|
|
|
|
|
"if (${var}->[${i}] =~ /${subfield_regex}/) {". |
82
|
|
|
|
|
|
|
"push(\@{${v}}, ${var}->[${i} + 1]);". |
83
|
|
|
|
|
|
|
"}". |
84
|
|
|
|
|
|
|
"}"; |
85
|
|
|
|
|
|
|
} |
86
|
0
|
|
|
|
|
|
}; |
87
|
0
|
|
|
|
|
|
$perl .= $fixer->emit_declare_vars( $v, "[]" ); |
88
|
0
|
|
|
|
|
|
$perl .= $add_subfields->(2); |
89
|
0
|
|
|
|
|
|
$perl .= "if (\@{${v}}) {"; |
90
|
0
|
0
|
|
|
|
|
if ( !$self->split ) { |
91
|
0
|
|
|
|
|
|
$perl .= "${v} = join(${join_char}, \@{${v}});"; |
92
|
0
|
0
|
|
|
|
|
if ( defined( my $off = $from ) ) { |
93
|
0
|
|
|
|
|
|
$perl .= "if (eval { ${v} = substr(${v}, ${off}, ${length}); 1 }) {"; |
94
|
|
|
|
|
|
|
} |
95
|
|
|
|
|
|
|
} |
96
|
|
|
|
|
|
|
$perl .= $fixer->emit_create_path( |
97
|
|
|
|
|
|
|
$fixer->var, |
98
|
|
|
|
|
|
|
$path, |
99
|
|
|
|
|
|
|
sub { |
100
|
0
|
|
|
|
|
|
my $var = shift; |
101
|
0
|
0
|
|
|
|
|
if ( $self->split ) { |
102
|
0
|
|
|
|
|
|
"if (is_array_ref(${var})) {" |
103
|
|
|
|
|
|
|
. "push \@{${var}}, ${v};" |
104
|
|
|
|
|
|
|
. "} else {" |
105
|
|
|
|
|
|
|
. "${var} = [${v}];" . "}"; |
106
|
|
|
|
|
|
|
} |
107
|
|
|
|
|
|
|
else { |
108
|
0
|
|
|
|
|
|
"if (is_string(${var})) {" |
109
|
|
|
|
|
|
|
. "${var} = join(${join_char}, ${var}, ${v});" |
110
|
|
|
|
|
|
|
. "} else {" |
111
|
|
|
|
|
|
|
. "${var} = ${v};" . "}"; |
112
|
|
|
|
|
|
|
} |
113
|
|
|
|
|
|
|
} |
114
|
0
|
|
|
|
|
|
); |
115
|
0
|
0
|
|
|
|
|
if ( defined($from) ) { |
116
|
0
|
|
|
|
|
|
$perl .= "}"; |
117
|
|
|
|
|
|
|
} |
118
|
0
|
|
|
|
|
|
$perl .= "}"; |
119
|
|
|
|
|
|
|
} |
120
|
0
|
|
|
|
|
|
$perl; |
121
|
|
|
|
|
|
|
} |
122
|
0
|
|
|
|
|
|
); |
123
|
|
|
|
|
|
|
|
124
|
0
|
|
|
|
|
|
$perl; |
125
|
|
|
|
|
|
|
} |
126
|
|
|
|
|
|
|
|
127
|
|
|
|
|
|
|
1; |
128
|
|
|
|
|
|
|
__END__ |