line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package Data::CompactReadonly::V0::Dictionary; |
2
|
|
|
|
|
|
|
our $VERSION = '0.0.5'; |
3
|
|
|
|
|
|
|
|
4
|
5
|
|
|
5
|
|
42
|
use warnings; |
|
5
|
|
|
|
|
13
|
|
|
5
|
|
|
|
|
166
|
|
5
|
5
|
|
|
5
|
|
25
|
use strict; |
|
5
|
|
|
|
|
11
|
|
|
5
|
|
|
|
|
133
|
|
6
|
5
|
|
|
5
|
|
23
|
use base qw(Data::CompactReadonly::V0::Collection Data::CompactReadonly::Dictionary); |
|
5
|
|
|
|
|
13
|
|
|
5
|
|
|
|
|
3089
|
|
7
|
|
|
|
|
|
|
|
8
|
5
|
|
|
5
|
|
2745
|
use Data::CompactReadonly::V0::TiedDictionary; |
|
5
|
|
|
|
|
16
|
|
|
5
|
|
|
|
|
188
|
|
9
|
5
|
|
|
5
|
|
34
|
use Scalar::Util qw(blessed); |
|
5
|
|
|
|
|
9
|
|
|
5
|
|
|
|
|
319
|
|
10
|
5
|
|
|
5
|
|
31
|
use Devel::StackTrace; |
|
5
|
|
|
|
|
9
|
|
|
5
|
|
|
|
|
6795
|
|
11
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
sub _init { |
13
|
53
|
|
|
53
|
|
209
|
my($class, %args) = @_; |
14
|
53
|
|
|
|
|
145
|
my($root, $offset) = @args{qw(root offset)}; |
15
|
|
|
|
|
|
|
|
16
|
53
|
100
|
|
|
|
167
|
my $object = bless({ |
17
|
|
|
|
|
|
|
root => $root, |
18
|
|
|
|
|
|
|
offset => $offset, |
19
|
|
|
|
|
|
|
cache => ($root->_fast_collections() ? {} : undef), |
20
|
|
|
|
|
|
|
}, $class); |
21
|
|
|
|
|
|
|
|
22
|
53
|
100
|
|
|
|
170
|
if($root->_tied()) { |
23
|
27
|
|
|
|
|
119
|
tie my %dict, 'Data::CompactReadonly::V0::TiedDictionary', $object; |
24
|
27
|
|
|
|
|
161
|
return \%dict; |
25
|
|
|
|
|
|
|
} else { |
26
|
26
|
|
|
|
|
199
|
return $object; |
27
|
|
|
|
|
|
|
} |
28
|
|
|
|
|
|
|
} |
29
|
|
|
|
|
|
|
|
30
|
|
|
|
|
|
|
# write a Dictionary to the file at the current offset |
31
|
|
|
|
|
|
|
sub _create { |
32
|
19
|
|
|
19
|
|
89
|
my($class, %args) = @_; |
33
|
19
|
|
|
|
|
56
|
my $fh = $args{fh}; |
34
|
19
|
|
|
|
|
123
|
$class->_stash_already_seen(%args); |
35
|
19
|
|
|
|
|
1406088
|
(my $scalar_type = $class) =~ s/Dictionary/Scalar/; |
36
|
|
|
|
|
|
|
|
37
|
|
|
|
|
|
|
# node header |
38
|
|
|
|
|
|
|
print $fh $class->_type_byte_from_class(). |
39
|
19
|
|
|
|
|
159
|
$scalar_type->_get_bytes_from_word(scalar(keys %{$args{data}})); |
|
19
|
|
|
|
|
180
|
|
40
|
|
|
|
|
|
|
|
41
|
|
|
|
|
|
|
# empty pointer table |
42
|
19
|
|
|
|
|
192
|
my $table_start_ptr = tell($fh); |
43
|
19
|
|
|
|
|
109
|
print $fh "\x00" x $args{ptr_size} x 2 x scalar(keys %{$args{data}}); |
|
19
|
|
|
|
|
1251
|
|
44
|
19
|
|
|
|
|
178
|
$class->_set_next_free_ptr(%args); |
45
|
|
|
|
|
|
|
|
46
|
19
|
|
|
|
|
64
|
my @sorted_keys = sort keys %{$args{data}}; |
|
19
|
|
|
|
|
342409
|
|
47
|
19
|
|
|
|
|
22263
|
foreach my $index (0 .. $#sorted_keys) { |
48
|
65617
|
|
|
|
|
243359
|
my $this_key = $sorted_keys[$index]; |
49
|
65617
|
|
|
|
|
158854
|
my $this_value = $args{data}->{$this_key}; |
50
|
|
|
|
|
|
|
|
51
|
|
|
|
|
|
|
# write the pointer to the key, and the key if needed. Then write the |
52
|
|
|
|
|
|
|
# pointer to the value, and the value if needed. The value can be any |
53
|
|
|
|
|
|
|
# type. Keys are coerced Text to avoid floating point problems. |
54
|
65617
|
|
|
|
|
278648
|
foreach my $item ( |
55
|
|
|
|
|
|
|
{ data => $this_key, ptr_offset => 0, coerce_to_text => 1 }, |
56
|
|
|
|
|
|
|
{ data => $this_value, ptr_offset => $args{ptr_size} } |
57
|
|
|
|
|
|
|
) { |
58
|
131231
|
|
|
|
|
813639
|
$class->_seek(%args, pointer => $item->{ptr_offset} + $table_start_ptr + 2 * $index * $args{ptr_size}); |
59
|
131231
|
100
|
|
|
|
683320
|
if(my $ptr = $class->_get_already_seen(%args, data => $item->{data})) { |
60
|
65568
|
|
|
|
|
730455
|
print $fh $class->_encode_ptr(%args, pointer => $ptr); |
61
|
|
|
|
|
|
|
} else { |
62
|
65663
|
|
|
|
|
266416
|
print $fh $class->_encode_ptr(%args, pointer => $class->_get_next_free_ptr(%args)); |
63
|
65663
|
|
|
|
|
499336
|
$class->_seek(%args, pointer => $class->_get_next_free_ptr(%args)); |
64
|
|
|
|
|
|
|
|
65
|
65660
|
|
|
|
|
224460
|
my $node_class = 'Data::CompactReadonly::V0::Node'; |
66
|
65660
|
100
|
|
|
|
164282
|
if($item->{coerce_to_text}) { |
67
|
65610
|
|
|
|
|
219303
|
$node_class = 'Data::CompactReadonly::V0::'.$class->_text_type_for_data($item->{data}); |
68
|
65610
|
100
|
|
|
|
499290
|
unless($node_class->VERSION()) { |
69
|
2
|
|
|
2
|
|
1017
|
eval "use $node_class"; |
|
2
|
|
|
|
|
6
|
|
|
2
|
|
|
|
|
39
|
|
|
2
|
|
|
|
|
122
|
|
70
|
2
|
50
|
|
|
|
11
|
die($@) if($@); |
71
|
|
|
|
|
|
|
} |
72
|
|
|
|
|
|
|
} |
73
|
65660
|
|
|
|
|
318952
|
$node_class->_create(%args, data => $item->{data}); |
74
|
|
|
|
|
|
|
} |
75
|
|
|
|
|
|
|
} |
76
|
|
|
|
|
|
|
} |
77
|
|
|
|
|
|
|
} |
78
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
# Efficient binary search. Relies on elements' being ASCIIbetically sorted by key. |
80
|
|
|
|
|
|
|
# 1 <= iterations to find key (or find that there is no key) <= ceil(log2(N)) |
81
|
|
|
|
|
|
|
# so no more than 4 iterations for a ten element list, no more than 20 for |
82
|
|
|
|
|
|
|
# a million element list. Each iteration takes two seeks and two reads there |
83
|
|
|
|
|
|
|
# are then two more seeks and reads to get the value |
84
|
|
|
|
|
|
|
sub element { |
85
|
108
|
|
|
108
|
0
|
10491
|
my($self, $element) = @_; |
86
|
|
|
|
|
|
|
|
87
|
108
|
100
|
100
|
|
|
546
|
die( |
|
|
100
|
|
|
|
|
|
88
|
|
|
|
|
|
|
"$self: Invalid element: ". |
89
|
|
|
|
|
|
|
(!defined($element) ? '[undef]' : $element). |
90
|
|
|
|
|
|
|
" isn't Text or numeric\n" |
91
|
|
|
|
|
|
|
) unless(defined($element) && !ref($element)); |
92
|
|
|
|
|
|
|
|
93
|
|
|
|
|
|
|
# first we need to find that key |
94
|
105
|
|
|
|
|
333
|
my $max_candidate = $self->count() - 1; |
95
|
105
|
|
|
|
|
196
|
my $min_candidate = 0; |
96
|
105
|
|
|
|
|
287
|
my $cur_candidate = int($max_candidate / 2); |
97
|
105
|
|
|
|
|
169
|
my $prev_candidate = -1; |
98
|
|
|
|
|
|
|
|
99
|
105
|
|
|
|
|
209
|
while(1) { |
100
|
457
|
|
|
|
|
1107
|
my $key = $self->_nth_key($cur_candidate); |
101
|
457
|
|
|
|
|
741
|
$prev_candidate = $cur_candidate; |
102
|
457
|
100
|
|
|
|
1400
|
if($key eq $element) { |
|
|
100
|
|
|
|
|
|
103
|
100
|
|
|
|
|
276
|
return $self->_nth_value($cur_candidate); |
104
|
|
|
|
|
|
|
} elsif($key lt $element) { # our target is futher down the list |
105
|
215
|
|
|
|
|
721
|
($min_candidate, $cur_candidate, $max_candidate) = ( |
106
|
|
|
|
|
|
|
$cur_candidate + 1, |
107
|
|
|
|
|
|
|
int(($cur_candidate + $max_candidate + 1) / 2), |
108
|
|
|
|
|
|
|
$max_candidate |
109
|
|
|
|
|
|
|
); |
110
|
|
|
|
|
|
|
} else { # our target is further up the list |
111
|
142
|
|
|
|
|
500
|
($min_candidate, $cur_candidate, $max_candidate) = ( |
112
|
|
|
|
|
|
|
$min_candidate, |
113
|
|
|
|
|
|
|
int(($min_candidate + $cur_candidate) / 2), |
114
|
|
|
|
|
|
|
$cur_candidate - 1 |
115
|
|
|
|
|
|
|
); |
116
|
|
|
|
|
|
|
} |
117
|
357
|
100
|
|
|
|
825
|
last if($prev_candidate == $cur_candidate); |
118
|
|
|
|
|
|
|
} |
119
|
5
|
|
|
|
|
52
|
die("$self: Invalid element: $element: doesn't exist\n"); |
120
|
|
|
|
|
|
|
} |
121
|
|
|
|
|
|
|
|
122
|
|
|
|
|
|
|
sub exists { |
123
|
16
|
|
|
16
|
0
|
476
|
my($self, $element) = @_; |
124
|
16
|
100
|
|
|
|
49
|
return 0 if($self->count() == 0); |
125
|
15
|
|
|
|
|
41
|
eval { $self->element($element) }; |
|
15
|
|
|
|
|
43
|
|
126
|
15
|
100
|
|
|
|
81
|
if($@ =~ /doesn't exist/) { |
|
|
100
|
|
|
|
|
|
127
|
2
|
|
|
|
|
12
|
return 0; |
128
|
|
|
|
|
|
|
} elsif($@) { |
129
|
1
|
|
|
|
|
7
|
die($@); |
130
|
|
|
|
|
|
|
} else { |
131
|
12
|
|
|
|
|
48
|
return 1; |
132
|
|
|
|
|
|
|
} |
133
|
|
|
|
|
|
|
} |
134
|
|
|
|
|
|
|
|
135
|
|
|
|
|
|
|
sub _nth_key { |
136
|
489
|
|
|
489
|
|
919
|
my($self, $n) = @_; |
137
|
489
|
100
|
100
|
|
|
1167
|
if($self->{cache} && exists($self->{cache}->{keys}->{$n})) { |
138
|
19
|
|
|
|
|
49
|
return $self->{cache}->{keys}->{$n} |
139
|
|
|
|
|
|
|
} |
140
|
|
|
|
|
|
|
|
141
|
470
|
|
|
|
|
1087
|
$self->_seek($self->_nth_key_ptr_location($n)); |
142
|
470
|
|
|
|
|
2029
|
$self->_seek($self->_ptr_at_current_offset()); |
143
|
|
|
|
|
|
|
|
144
|
|
|
|
|
|
|
# for performance, cache the filehandle in this object |
145
|
470
|
|
33
|
|
|
1879
|
$self->{_fh} ||= $self->_fh(); |
146
|
470
|
|
|
|
|
972
|
my $offset = tell($self->{_fh}); |
147
|
470
|
|
|
|
|
1415
|
my $key = $self->_node_at_current_offset(); |
148
|
469
|
100
|
100
|
|
|
1956
|
if(!defined($key) || ref($key)) { |
149
|
2
|
100
|
|
|
|
25
|
die("$self: Invalid type: ". |
150
|
|
|
|
|
|
|
(!defined($key) ? 'Null' : $key). |
151
|
|
|
|
|
|
|
": Dictionary keys must be Text at ". |
152
|
|
|
|
|
|
|
sprintf("0x%08x", $offset). |
153
|
|
|
|
|
|
|
"\n". |
154
|
|
|
|
|
|
|
Devel::StackTrace->new()->as_string() |
155
|
|
|
|
|
|
|
); |
156
|
|
|
|
|
|
|
} |
157
|
467
|
100
|
|
|
|
1098
|
if($self->{cache}) { |
158
|
16
|
|
|
|
|
59
|
return $self->{cache}->{keys}->{$n} = $key; |
159
|
|
|
|
|
|
|
} |
160
|
451
|
|
|
|
|
1066
|
return $key; |
161
|
|
|
|
|
|
|
} |
162
|
|
|
|
|
|
|
|
163
|
|
|
|
|
|
|
sub _nth_value { |
164
|
100
|
|
|
100
|
|
219
|
my($self, $n) = @_; |
165
|
100
|
100
|
100
|
|
|
274
|
if($self->{cache} && exists($self->{cache}->{values}->{$n})) { |
166
|
1
|
|
|
|
|
5
|
return $self->{cache}->{values}->{$n} |
167
|
|
|
|
|
|
|
} |
168
|
|
|
|
|
|
|
|
169
|
99
|
|
|
|
|
253
|
$self->_seek($self->_nth_key_ptr_location($n) + $self->_ptr_size()); |
170
|
99
|
|
|
|
|
366
|
$self->_seek($self->_ptr_at_current_offset()); |
171
|
|
|
|
|
|
|
|
172
|
99
|
|
|
|
|
380
|
my $val = $self->_node_at_current_offset(); |
173
|
|
|
|
|
|
|
|
174
|
99
|
100
|
|
|
|
293
|
if($self->{cache}) { |
175
|
15
|
|
|
|
|
113
|
return $self->{cache}->{values}->{$n} = $val; |
176
|
|
|
|
|
|
|
} |
177
|
84
|
|
|
|
|
580
|
return $val; |
178
|
|
|
|
|
|
|
} |
179
|
|
|
|
|
|
|
|
180
|
|
|
|
|
|
|
sub _nth_key_ptr_location { |
181
|
569
|
|
|
569
|
|
1087
|
my($self, $n) = @_; |
182
|
569
|
|
|
|
|
1407
|
return $self->_offset() + $self->_scalar_type_bytes() + |
183
|
|
|
|
|
|
|
2 * $n * $self->_ptr_size(); |
184
|
|
|
|
|
|
|
} |
185
|
|
|
|
|
|
|
|
186
|
|
|
|
|
|
|
sub _ptr_at_current_offset { |
187
|
569
|
|
|
569
|
|
982
|
my $self = shift; |
188
|
569
|
|
|
|
|
1392
|
return $self->_decode_ptr( |
189
|
|
|
|
|
|
|
$self->_bytes_at_current_offset($self->_ptr_size()) |
190
|
|
|
|
|
|
|
); |
191
|
|
|
|
|
|
|
} |
192
|
|
|
|
|
|
|
|
193
|
|
|
|
|
|
|
sub indices { |
194
|
7
|
|
|
7
|
0
|
148
|
my $self = shift; |
195
|
7
|
100
|
|
|
|
20
|
return [] if($self->count() == 0); |
196
|
6
|
|
|
|
|
19
|
return [ map { $self->_nth_key($_) } (0 .. $self->count() - 1) ]; |
|
17
|
|
|
|
|
57
|
|
197
|
|
|
|
|
|
|
} |
198
|
|
|
|
|
|
|
|
199
|
|
|
|
|
|
|
1; |