line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package Algorithm::SixDegrees; |
2
|
|
|
|
|
|
|
|
3
|
|
|
|
|
|
|
require 5.006; |
4
|
6
|
|
|
6
|
|
286650
|
use warnings; |
|
6
|
|
|
|
|
45
|
|
|
6
|
|
|
|
|
172
|
|
5
|
6
|
|
|
6
|
|
28
|
use strict; |
|
6
|
|
|
|
|
9
|
|
|
6
|
|
|
|
|
115
|
|
6
|
6
|
|
|
6
|
|
23
|
use Scalar::Util qw(reftype); |
|
6
|
|
|
|
|
9
|
|
|
6
|
|
|
|
|
9823
|
|
7
|
|
|
|
|
|
|
|
8
|
|
|
|
|
|
|
=head1 NAME |
9
|
|
|
|
|
|
|
|
10
|
|
|
|
|
|
|
Algorithm::SixDegrees - Find a path through linked elements in a set |
11
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
=head1 VERSION |
13
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
Version 1.00 |
15
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
=cut |
17
|
|
|
|
|
|
|
|
18
|
|
|
|
|
|
|
our $VERSION = '1.00'; |
19
|
|
|
|
|
|
|
our $ERROR = ''; |
20
|
|
|
|
|
|
|
|
21
|
|
|
|
|
|
|
=head1 SYNOPSIS |
22
|
|
|
|
|
|
|
|
23
|
|
|
|
|
|
|
use Algorithm::SixDegrees; |
24
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
my $sd1 = Algorithm::SixDegrees->new(); |
26
|
|
|
|
|
|
|
$sd1->data_source( actors => \&starred_in ); |
27
|
|
|
|
|
|
|
$sd1->data_source( movies => \&stars_of ); |
28
|
|
|
|
|
|
|
@elems = $sd1->make_link('actors', 'Tom Cruise', 'Kevin Bacon'); |
29
|
|
|
|
|
|
|
|
30
|
|
|
|
|
|
|
my $sd2 = Algorithm::SixDegrees->new(); |
31
|
|
|
|
|
|
|
$sd2->forward_data_source( friends => \&friends, @args ); |
32
|
|
|
|
|
|
|
$sd2->reverse_data_source( friends => \&friend_of, @args ); |
33
|
|
|
|
|
|
|
@elems = $sd2->make_link('friends', 'Bob', 'Mark'); |
34
|
|
|
|
|
|
|
|
35
|
|
|
|
|
|
|
=head1 DESCRIPTION |
36
|
|
|
|
|
|
|
|
37
|
|
|
|
|
|
|
C is a Perl implementation of a breadth-first |
38
|
|
|
|
|
|
|
search through a set of linked elements in order to find the shortest |
39
|
|
|
|
|
|
|
possible chain linking two specific elements together. |
40
|
|
|
|
|
|
|
|
41
|
|
|
|
|
|
|
In simpler terms, this module will take a bunch of related items and |
42
|
|
|
|
|
|
|
attempt to find a relationship between two of them. It looks for the |
43
|
|
|
|
|
|
|
shortest (and generally, simplest) relationship it can find. |
44
|
|
|
|
|
|
|
|
45
|
|
|
|
|
|
|
=head1 CONSTRUCTOR |
46
|
|
|
|
|
|
|
|
47
|
|
|
|
|
|
|
=head2 new() |
48
|
|
|
|
|
|
|
|
49
|
|
|
|
|
|
|
C requires use as an object; it can't (yet) be used |
50
|
|
|
|
|
|
|
as a stand-alone module. C takes no arguments, however. |
51
|
|
|
|
|
|
|
|
52
|
|
|
|
|
|
|
=cut |
53
|
|
|
|
|
|
|
|
54
|
|
|
|
|
|
|
sub new { |
55
|
10
|
|
|
10
|
1
|
315
|
my $class = shift; |
56
|
10
|
|
|
|
|
41
|
my $self = { |
57
|
|
|
|
|
|
|
_source_left => {}, |
58
|
|
|
|
|
|
|
_source_right => {}, |
59
|
|
|
|
|
|
|
_sources => [], |
60
|
|
|
|
|
|
|
_investigated => {}, |
61
|
|
|
|
|
|
|
}; |
62
|
10
|
|
|
|
|
39
|
return bless $self,$class; |
63
|
|
|
|
|
|
|
} |
64
|
|
|
|
|
|
|
|
65
|
|
|
|
|
|
|
=head1 FUNCTIONS |
66
|
|
|
|
|
|
|
|
67
|
|
|
|
|
|
|
=head2 forward_data_source( name => \&sub, @args ); |
68
|
|
|
|
|
|
|
|
69
|
|
|
|
|
|
|
Tells C that all items in the data set relating to |
70
|
|
|
|
|
|
|
C can be retrieved by calling C. See L. |
71
|
|
|
|
|
|
|
|
72
|
|
|
|
|
|
|
In our friends example above, if Bob considers Mark a friend, but Mark |
73
|
|
|
|
|
|
|
doesn't consider Bob a friend, calling the sub with "Bob" as an argument |
74
|
|
|
|
|
|
|
should return "Mark", but calling the sub with "Mark" as an argument |
75
|
|
|
|
|
|
|
should not return "Bob". |
76
|
|
|
|
|
|
|
|
77
|
|
|
|
|
|
|
=cut |
78
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
sub forward_data_source { |
80
|
23
|
|
|
23
|
1
|
2943
|
my ($self, $name, $sub, @args) = @_; |
81
|
23
|
100
|
|
|
|
83
|
die "Data sources must be named\n" unless defined($name); |
82
|
19
|
100
|
|
|
|
45
|
die "Data sources must have code supplied\n" unless defined($sub); |
83
|
17
|
100
|
100
|
|
|
114
|
die "Data sources must have a coderef argument\n" unless ref($sub) && reftype($sub) eq 'CODE'; |
84
|
13
|
|
|
|
|
42
|
$self->{'_source_left'}{$name}{'sub'} = $sub; |
85
|
13
|
|
|
|
|
23
|
$self->{'_source_left'}{$name}{'args'} = \@args; |
86
|
13
|
|
|
|
|
19
|
foreach my $source (@{$self->{'_sources'}}) { |
|
13
|
|
|
|
|
26
|
|
87
|
6
|
100
|
|
|
|
15
|
return if $source eq $name; |
88
|
|
|
|
|
|
|
} |
89
|
12
|
|
|
|
|
18
|
push(@{$self->{'_sources'}},$name); |
|
12
|
|
|
|
|
29
|
|
90
|
12
|
|
|
|
|
19
|
return; |
91
|
|
|
|
|
|
|
} |
92
|
|
|
|
|
|
|
|
93
|
|
|
|
|
|
|
=head2 reverse_data_source( name => \&sub, @args ); |
94
|
|
|
|
|
|
|
|
95
|
|
|
|
|
|
|
Tells C that all items in the data set related to |
96
|
|
|
|
|
|
|
by C can be retrieved by calling C. See L. |
97
|
|
|
|
|
|
|
|
98
|
|
|
|
|
|
|
In the same friends example, calling the sub with "Bob" as an argument |
99
|
|
|
|
|
|
|
should not return "Mark", but calling the sub with "Mark" as an argument |
100
|
|
|
|
|
|
|
should return "Bob". |
101
|
|
|
|
|
|
|
|
102
|
|
|
|
|
|
|
=cut |
103
|
|
|
|
|
|
|
|
104
|
|
|
|
|
|
|
sub reverse_data_source { |
105
|
18
|
|
|
18
|
1
|
2752
|
my ($self, $name, $sub, @args) = @_; |
106
|
18
|
100
|
|
|
|
86
|
die "Data sources must be named\n" unless defined($name); |
107
|
16
|
100
|
|
|
|
48
|
die "Data sources must have code supplied\n" unless defined($sub); |
108
|
15
|
100
|
100
|
|
|
88
|
die "Data sources must have a coderef argument\n" unless ref($sub) && reftype($sub) eq 'CODE'; |
109
|
13
|
|
|
|
|
31
|
$self->{'_source_right'}{$name}{'sub'} = $sub; |
110
|
13
|
|
|
|
|
23
|
$self->{'_source_right'}{$name}{'args'} = \@args; |
111
|
13
|
|
|
|
|
20
|
foreach my $source (@{$self->{'_sources'}}) { |
|
13
|
|
|
|
|
76
|
|
112
|
17
|
100
|
|
|
|
44
|
return if $source eq $name; |
113
|
|
|
|
|
|
|
} |
114
|
1
|
|
|
|
|
2
|
push(@{$self->{'_sources'}},$name); |
|
1
|
|
|
|
|
3
|
|
115
|
1
|
|
|
|
|
2
|
return; |
116
|
|
|
|
|
|
|
} |
117
|
|
|
|
|
|
|
|
118
|
|
|
|
|
|
|
=head2 data_source( name => \&sub, @args ); |
119
|
|
|
|
|
|
|
|
120
|
|
|
|
|
|
|
Sets up a data source as both forward and reverse. This is useful if |
121
|
|
|
|
|
|
|
the data source is mutually relational; that is, in our actors/movies |
122
|
|
|
|
|
|
|
example, Kevin Bacon is always in Mystic River, and Mystic River always |
123
|
|
|
|
|
|
|
has Kevin Bacon in it. |
124
|
|
|
|
|
|
|
|
125
|
|
|
|
|
|
|
=cut |
126
|
|
|
|
|
|
|
|
127
|
|
|
|
|
|
|
sub data_source { |
128
|
15
|
|
|
15
|
1
|
3854
|
my ($self, $name, $sub, @args) = @_; |
129
|
15
|
|
|
|
|
44
|
$self->forward_data_source($name,$sub,@args); |
130
|
10
|
|
|
|
|
26
|
$self->reverse_data_source($name,$sub,@args); |
131
|
10
|
|
|
|
|
19
|
return; |
132
|
|
|
|
|
|
|
} |
133
|
|
|
|
|
|
|
|
134
|
|
|
|
|
|
|
=head2 make_link |
135
|
|
|
|
|
|
|
|
136
|
|
|
|
|
|
|
Does the work of making the link. Returns a list or arrayref, based |
137
|
|
|
|
|
|
|
on calling context. |
138
|
|
|
|
|
|
|
|
139
|
|
|
|
|
|
|
=cut |
140
|
|
|
|
|
|
|
|
141
|
|
|
|
|
|
|
sub make_link { |
142
|
35
|
|
|
35
|
1
|
525
|
my ($self, $mainsource, $start, $end) = @_; |
143
|
35
|
|
|
|
|
47
|
$ERROR = undef; |
144
|
|
|
|
|
|
|
|
145
|
35
|
100
|
66
|
|
|
174
|
unless (ref($self) && $self->isa(__PACKAGE__)) { |
146
|
2
|
|
|
|
|
4
|
$ERROR = 'Invalid object reference used to call make_link'; |
147
|
2
|
|
|
|
|
8
|
return; |
148
|
|
|
|
|
|
|
} |
149
|
33
|
100
|
|
|
|
71
|
unless (defined($mainsource)) { |
150
|
1
|
|
|
|
|
6
|
$ERROR = 'Data set name is not defined'; |
151
|
1
|
|
|
|
|
3
|
return; |
152
|
|
|
|
|
|
|
} |
153
|
32
|
100
|
|
|
|
53
|
unless (defined($start)) { |
154
|
1
|
|
|
|
|
2
|
$ERROR = 'Starting identifier is not defined'; |
155
|
1
|
|
|
|
|
4
|
return; |
156
|
|
|
|
|
|
|
} |
157
|
31
|
100
|
|
|
|
54
|
unless (defined($end)) { |
158
|
1
|
|
|
|
|
2
|
$ERROR = 'Ending identifier is not defined'; |
159
|
1
|
|
|
|
|
4
|
return; |
160
|
|
|
|
|
|
|
} |
161
|
|
|
|
|
|
|
|
162
|
|
|
|
|
|
|
# Assume working from "left to right"; therefore, links leading |
163
|
|
|
|
|
|
|
# from the starting identifier are on the "left side", and links |
164
|
|
|
|
|
|
|
# leading to the ending identifier are on the "right side". |
165
|
30
|
|
|
|
|
37
|
my %leftside = (); |
166
|
30
|
|
|
|
|
36
|
my %rightside = (); |
167
|
|
|
|
|
|
|
|
168
|
|
|
|
|
|
|
# If $altsource gets defined, that means there are two sources used. |
169
|
30
|
|
|
|
|
37
|
my $altsource; |
170
|
|
|
|
|
|
|
|
171
|
30
|
100
|
100
|
|
|
138
|
unless (exists($self->{'_sources'}) && reftype($self->{'_sources'}) eq 'ARRAY') { |
172
|
2
|
|
|
|
|
3
|
$ERROR = 'No data sources defined'; |
173
|
2
|
|
|
|
|
8
|
return; |
174
|
|
|
|
|
|
|
} |
175
|
28
|
|
|
|
|
45
|
my @sources = @{$self->{'_sources'}}; |
|
28
|
|
|
|
|
59
|
|
176
|
28
|
|
|
|
|
48
|
my $source_exists = 0; |
177
|
28
|
|
|
|
|
40
|
foreach my $source (@sources) { |
178
|
39
|
100
|
|
|
|
80
|
if ($mainsource eq $source) { |
179
|
26
|
|
|
|
|
35
|
$source_exists = 1; |
180
|
26
|
|
|
|
|
55
|
$leftside{$source} = {$start, undef}; |
181
|
26
|
|
|
|
|
54
|
$rightside{$source} = {$end, undef}; |
182
|
|
|
|
|
|
|
} else { |
183
|
13
|
|
|
|
|
19
|
$altsource = $source; |
184
|
13
|
|
|
|
|
22
|
$leftside{$source} = {}; |
185
|
13
|
|
|
|
|
23
|
$rightside{$source} = {}; |
186
|
|
|
|
|
|
|
} |
187
|
39
|
100
|
100
|
|
|
194
|
unless (ref($self->{'_source_left'}) && |
|
|
|
66
|
|
|
|
|
188
|
|
|
|
|
|
|
ref($self->{'_source_left'}{$source}) && |
189
|
|
|
|
|
|
|
reftype($self->{'_source_left'}{$source}{'sub'}) eq 'CODE') { |
190
|
2
|
|
|
|
|
5
|
$ERROR = "Source '$source' does not have a valid forward subroutine"; |
191
|
2
|
|
|
|
|
11
|
return; |
192
|
|
|
|
|
|
|
} |
193
|
37
|
100
|
100
|
|
|
180
|
unless (ref($self->{'_source_right'}) && |
|
|
|
66
|
|
|
|
|
194
|
|
|
|
|
|
|
ref($self->{'_source_right'}{$source}) && |
195
|
|
|
|
|
|
|
reftype($self->{'_source_right'}{$source}{'sub'}) eq 'CODE') { |
196
|
2
|
|
|
|
|
5
|
$ERROR = "Source '$source' does not have a valid reverse subroutine"; |
197
|
2
|
|
|
|
|
10
|
return; |
198
|
|
|
|
|
|
|
} |
199
|
35
|
|
|
|
|
76
|
$self->{'_investigated'}{$source} = {}; |
200
|
|
|
|
|
|
|
} |
201
|
24
|
100
|
|
|
|
49
|
unless ($source_exists) { |
202
|
2
|
|
|
|
|
5
|
$ERROR = "Source '$mainsource' was not defined"; |
203
|
2
|
|
|
|
|
9
|
return; |
204
|
|
|
|
|
|
|
} |
205
|
22
|
100
|
|
|
|
55
|
if (scalar(keys(%leftside)) > 2) { |
206
|
1
|
|
|
|
|
2
|
$ERROR = 'Too many defined data sources; maximum is 2'; |
207
|
1
|
|
|
|
|
6
|
return; |
208
|
|
|
|
|
|
|
} |
209
|
|
|
|
|
|
|
|
210
|
|
|
|
|
|
|
|
211
|
21
|
100
|
|
|
|
38
|
if ($start eq $end) { |
212
|
|
|
|
|
|
|
# Only one element if the start and end are the same. |
213
|
5
|
100
|
|
|
|
35
|
return wantarray ? ($start) : [$start]; |
214
|
|
|
|
|
|
|
} |
215
|
|
|
|
|
|
|
|
216
|
16
|
|
|
|
|
20
|
my $leftcount = 1; |
217
|
16
|
|
|
|
|
20
|
my $rightcount = 1; |
218
|
|
|
|
|
|
|
|
219
|
|
|
|
|
|
|
# If altsource exists, pull the left side main, then pull the right side main, |
220
|
|
|
|
|
|
|
# and check for middle matches. This reduces database hits as opposed to |
221
|
|
|
|
|
|
|
# where it's pulled left main - left alt; left alt >= 1 at that point, whereas |
222
|
|
|
|
|
|
|
# right main on the first loop == 1. Following that, pull the left alt and |
223
|
|
|
|
|
|
|
# then the right alt, which gets the CHAINLOOP back in synch. |
224
|
|
|
|
|
|
|
|
225
|
16
|
100
|
|
|
|
31
|
if (defined($altsource)) { |
226
|
8
|
|
|
|
|
22
|
my ($count,$id,$err) = $self->_match('left',$mainsource,$altsource,\%leftside,\%rightside); |
227
|
8
|
50
|
|
|
|
17
|
if (defined($err)) { $ERROR = $err; return; }; |
|
0
|
|
|
|
|
0
|
|
|
0
|
|
|
|
|
0
|
|
228
|
8
|
50
|
|
|
|
15
|
if (defined($id)) { $ERROR = 'Internal error, id cannot match here'; return; }; |
|
0
|
|
|
|
|
0
|
|
|
0
|
|
|
|
|
0
|
|
229
|
8
|
50
|
33
|
|
|
31
|
return if !defined($count) || $count == 0; |
230
|
|
|
|
|
|
|
|
231
|
8
|
|
|
|
|
25
|
($count,$id,$err) = $self->_match('right',$mainsource,$altsource,\%rightside,\%leftside); |
232
|
8
|
50
|
|
|
|
15
|
if (defined($err)) { $ERROR = $err; return; }; |
|
0
|
|
|
|
|
0
|
|
|
0
|
|
|
|
|
0
|
|
233
|
8
|
100
|
|
|
|
17
|
if (defined($id)) { |
234
|
2
|
|
|
|
|
6
|
my @abc = ($leftside{$altsource}{$id},$id,$rightside{$altsource}{$id}); |
235
|
2
|
50
|
|
|
|
19
|
return wantarray ? @abc : \@abc; |
236
|
|
|
|
|
|
|
}; |
237
|
6
|
100
|
66
|
|
|
34
|
return if !defined($count) || $count == 0; |
238
|
|
|
|
|
|
|
|
239
|
4
|
|
|
|
|
10
|
($leftcount,$id,$err) = $self->_match('left',$altsource,$mainsource,\%leftside,\%rightside); |
240
|
4
|
50
|
|
|
|
9
|
if (defined($err)) { $ERROR = $err; return; }; |
|
0
|
|
|
|
|
0
|
|
|
0
|
|
|
|
|
0
|
|
241
|
4
|
50
|
|
|
|
7
|
if (defined($id)) { $ERROR = 'Internal error, id cannot match here'; return; }; |
|
0
|
|
|
|
|
0
|
|
|
0
|
|
|
|
|
0
|
|
242
|
4
|
50
|
33
|
|
|
14
|
return if !defined($leftcount) || $leftcount == 0; |
243
|
|
|
|
|
|
|
|
244
|
4
|
|
|
|
|
9
|
($rightcount,$id,$err) = $self->_match('right',$altsource,$mainsource,\%rightside,\%leftside); |
245
|
4
|
50
|
|
|
|
9
|
if (defined($err)) { $ERROR = $err; return; }; |
|
0
|
|
|
|
|
0
|
|
|
0
|
|
|
|
|
0
|
|
246
|
4
|
100
|
|
|
|
19
|
if (defined($id)) { |
247
|
2
|
|
|
|
|
4
|
my $la = $leftside{$mainsource}{$id}; |
248
|
2
|
|
|
|
|
5
|
my $lm = $leftside{$altsource}{$la}; |
249
|
2
|
|
|
|
|
4
|
my $ra = $rightside{$mainsource}{$id}; |
250
|
2
|
|
|
|
|
14
|
my $rm = $rightside{$altsource}{$ra}; |
251
|
2
|
50
|
33
|
|
|
26
|
unless (defined($la) && defined($lm) && defined($ra) && defined($rm)) { |
|
|
|
33
|
|
|
|
|
|
|
|
33
|
|
|
|
|
252
|
0
|
|
|
|
|
0
|
$ERROR = 'Internal error, identifier not defined'; |
253
|
0
|
|
|
|
|
0
|
return; |
254
|
|
|
|
|
|
|
} |
255
|
2
|
50
|
|
|
|
25
|
return wantarray ? ($lm,$la,$id,$ra,$rm) : [$lm,$la,$id,$ra,$rm]; |
256
|
|
|
|
|
|
|
}; |
257
|
2
|
50
|
33
|
|
|
10
|
return if !defined($rightcount) || $rightcount == 0; |
258
|
|
|
|
|
|
|
|
259
|
|
|
|
|
|
|
} |
260
|
|
|
|
|
|
|
|
261
|
|
|
|
|
|
|
# There is bias here, but the tie needs to be broken, so in the |
262
|
|
|
|
|
|
|
# event of a tie, move left to right in the chain. |
263
|
|
|
|
|
|
|
|
264
|
|
|
|
|
|
|
CHAINLOOP: { |
265
|
10
|
|
|
|
|
20
|
my $id; |
|
45
|
|
|
|
|
58
|
|
266
|
|
|
|
|
|
|
my $err; |
267
|
45
|
100
|
|
|
|
77
|
if ($leftcount <= $rightcount) { |
268
|
42
|
100
|
|
|
|
58
|
if (defined($altsource)) { |
269
|
4
|
|
|
|
|
9
|
($leftcount,$id,$err) = $self->_match_two('left',$mainsource,$altsource,\%leftside,\%rightside); |
270
|
|
|
|
|
|
|
} else { |
271
|
38
|
|
|
|
|
70
|
($leftcount,$id,$err) = $self->_match_one('left',$mainsource,\%leftside,\%rightside); |
272
|
|
|
|
|
|
|
} |
273
|
|
|
|
|
|
|
} else { |
274
|
3
|
100
|
|
|
|
35
|
if (defined($altsource)) { |
275
|
2
|
|
|
|
|
9
|
($rightcount,$id,$err) = $self->_match_two('right',$mainsource,$altsource,\%rightside,\%leftside); |
276
|
|
|
|
|
|
|
} else { |
277
|
1
|
|
|
|
|
7
|
($rightcount,$id,$err) = $self->_match_one('right',$mainsource,\%rightside,\%leftside); |
278
|
|
|
|
|
|
|
} |
279
|
|
|
|
|
|
|
} |
280
|
45
|
50
|
|
|
|
91
|
if(defined($err)) { |
281
|
0
|
|
|
|
|
0
|
$ERROR = $err; |
282
|
0
|
|
|
|
|
0
|
return; |
283
|
|
|
|
|
|
|
} |
284
|
45
|
100
|
|
|
|
68
|
if(defined($id)) { |
285
|
|
|
|
|
|
|
# If _match returns an id, that means a match was found. |
286
|
|
|
|
|
|
|
# To get it, we simply have to trace out from the "middle" |
287
|
|
|
|
|
|
|
# to get the full link. |
288
|
7
|
|
|
|
|
12
|
my @match = ($id); |
289
|
|
|
|
|
|
|
# middle, building to left. |
290
|
7
|
|
|
|
|
17
|
while($match[0] ne $start) { |
291
|
33
|
|
|
|
|
74
|
unshift(@match,$leftside{$mainsource}{$match[0]}); |
292
|
33
|
100
|
|
|
|
56
|
unshift(@match,$leftside{$altsource}{$match[0]}) if defined($altsource); |
293
|
33
|
50
|
|
|
|
60
|
if (!defined($match[0])) { |
294
|
0
|
|
|
|
|
0
|
$ERROR = 'Internal error, left identifier was not defined'; |
295
|
0
|
|
|
|
|
0
|
return; |
296
|
|
|
|
|
|
|
} |
297
|
|
|
|
|
|
|
} |
298
|
|
|
|
|
|
|
# middle building to right |
299
|
7
|
|
|
|
|
15
|
while($match[-1] ne $end) { |
300
|
4
|
|
|
|
|
8
|
push(@match,$rightside{$mainsource}{$match[-1]}); |
301
|
4
|
50
|
|
|
|
9
|
push(@match,$rightside{$altsource}{$match[-1]}) if defined($altsource); |
302
|
4
|
50
|
|
|
|
12
|
if (!defined($match[-1])) { |
303
|
0
|
|
|
|
|
0
|
$ERROR = 'Internal error, right identifier was not defined'; |
304
|
0
|
|
|
|
|
0
|
return; |
305
|
|
|
|
|
|
|
} |
306
|
|
|
|
|
|
|
} |
307
|
7
|
100
|
|
|
|
70
|
return wantarray ? @match : \@match; |
308
|
|
|
|
|
|
|
} |
309
|
38
|
100
|
100
|
|
|
105
|
if ($leftcount == 0 || $rightcount == 0) { |
310
|
3
|
|
|
|
|
6
|
last CHAINLOOP; |
311
|
|
|
|
|
|
|
} |
312
|
35
|
|
|
|
|
54
|
redo CHAINLOOP; |
313
|
|
|
|
|
|
|
} |
314
|
|
|
|
|
|
|
|
315
|
3
|
50
|
|
|
|
306
|
return wantarray ? () : []; |
316
|
|
|
|
|
|
|
} |
317
|
|
|
|
|
|
|
|
318
|
|
|
|
|
|
|
=head2 error |
319
|
|
|
|
|
|
|
|
320
|
|
|
|
|
|
|
Returns the current value of C<$Algorithm::SixDegrees::ERROR>. See |
321
|
|
|
|
|
|
|
L. |
322
|
|
|
|
|
|
|
|
323
|
|
|
|
|
|
|
=cut |
324
|
|
|
|
|
|
|
|
325
|
|
|
|
|
|
|
sub error { |
326
|
20
|
|
|
20
|
1
|
97
|
return $ERROR; |
327
|
|
|
|
|
|
|
} |
328
|
|
|
|
|
|
|
|
329
|
|
|
|
|
|
|
sub _match_two { |
330
|
6
|
|
|
6
|
|
12
|
my ($self,$side,$mainsource,$altsource,$thisside,$thatside) = @_; |
331
|
|
|
|
|
|
|
# Assume $self is OK since this is an internal function |
332
|
6
|
|
|
|
|
12
|
my ($count,$id,$err) = $self->_match($side,$mainsource,$altsource,$thisside,$thatside); |
333
|
6
|
50
|
|
|
|
29
|
return (undef,undef,$err) if defined($err); |
334
|
6
|
50
|
|
|
|
13
|
return ($count,$id,$err) if defined($id); |
335
|
6
|
50
|
33
|
|
|
31
|
return (0,undef,undef) if !defined($count) || $count == 0; |
336
|
|
|
|
|
|
|
# mental note: this should never return an id |
337
|
|
|
|
|
|
|
# after all, you can't have two mains together in a true |
338
|
|
|
|
|
|
|
# alternating chain |
339
|
6
|
|
|
|
|
41
|
return $self->_match($side,$altsource,$mainsource,$thisside,$thatside); |
340
|
|
|
|
|
|
|
} |
341
|
|
|
|
|
|
|
|
342
|
|
|
|
|
|
|
sub _match_one { |
343
|
39
|
|
|
39
|
|
61
|
my ($self,$side,$source,$thisside,$thatside) = @_; |
344
|
|
|
|
|
|
|
# Assume $self is OK since this is an internal function |
345
|
39
|
|
|
|
|
83
|
return $self->_match($side,$source,$source,$thisside,$thatside); |
346
|
|
|
|
|
|
|
} |
347
|
|
|
|
|
|
|
|
348
|
|
|
|
|
|
|
sub _match { |
349
|
75
|
|
|
75
|
|
122
|
my ($self,$side,$fromsource,$tosource,$thisside,$thatside) = @_; |
350
|
|
|
|
|
|
|
# Assume $self is OK since this is an internal function |
351
|
75
|
50
|
|
|
|
247
|
return (undef,undef,'Internal error: missing code') unless reftype($self->{"_source_$side"}{$fromsource}{'sub'}) eq 'CODE'; |
352
|
75
|
50
|
|
|
|
145
|
return (undef,undef,'Internal error: missing side (1)') unless reftype($thisside) eq 'HASH'; |
353
|
75
|
50
|
|
|
|
122
|
return (undef,undef,'Internal error: missing side (2)') unless exists($thisside->{$fromsource}); |
354
|
75
|
50
|
|
|
|
133
|
return (undef,undef,'Internal error: missing side (3)') unless reftype($thatside) eq 'HASH'; |
355
|
75
|
50
|
|
|
|
120
|
return (undef,undef,'Internal error: missing side (4)') unless exists($thatside->{$tosource}); |
356
|
|
|
|
|
|
|
|
357
|
75
|
|
|
|
|
86
|
my $newsidecount = 0; |
358
|
75
|
|
|
|
|
86
|
foreach my $id (keys %{$thisside->{$fromsource}}) { |
|
75
|
|
|
|
|
178
|
|
359
|
200
|
100
|
|
|
|
328
|
next if exists($self->{"_investigated"}{$fromsource}{$id}); |
360
|
80
|
|
|
|
|
129
|
$self->{"_investigated"}{$fromsource}{$id} = 1; |
361
|
|
|
|
|
|
|
|
362
|
80
|
50
|
|
|
|
201
|
my $use_args = reftype($self->{"_source_$side"}{$fromsource}{'args'}) eq 'ARRAY' ? 1 : 0; |
363
|
|
|
|
|
|
|
|
364
|
80
|
50
|
|
|
|
116
|
my @ids = &{$self->{"_source_$side"}{$fromsource}{'sub'}}($id,($use_args?@{$self->{"_source_$side"}{$fromsource}{'args'}}:())); |
|
80
|
|
|
|
|
157
|
|
|
80
|
|
|
|
|
145
|
|
365
|
80
|
50
|
66
|
|
|
1257
|
return (undef,undef,$ERROR) if scalar(@ids) == 1 && !defined($ids[0]); |
366
|
80
|
|
|
|
|
107
|
foreach my $thisid (@ids) { |
367
|
140
|
100
|
|
|
|
224
|
unless (exists($thisside->{$tosource}{$thisid})) { |
368
|
87
|
|
|
|
|
155
|
$thisside->{$tosource}{$thisid} = $id; |
369
|
87
|
|
|
|
|
102
|
$newsidecount++; |
370
|
|
|
|
|
|
|
} |
371
|
140
|
100
|
|
|
|
270
|
return (0,$thisid,undef) if exists($thatside->{$tosource}{$thisid}); |
372
|
|
|
|
|
|
|
} |
373
|
|
|
|
|
|
|
} |
374
|
|
|
|
|
|
|
|
375
|
64
|
|
|
|
|
131
|
return $newsidecount; |
376
|
|
|
|
|
|
|
} |
377
|
|
|
|
|
|
|
|
378
|
|
|
|
|
|
|
=head1 SUBROUTINE RULES |
379
|
|
|
|
|
|
|
|
380
|
|
|
|
|
|
|
Passed-in subroutines should take at least one argument, which |
381
|
|
|
|
|
|
|
should be some form of unique identifier, and return a list of |
382
|
|
|
|
|
|
|
unique identifiers that have a relation to the argument. |
383
|
|
|
|
|
|
|
|
384
|
|
|
|
|
|
|
The unique identifiers must be able to be compared with C. |
385
|
|
|
|
|
|
|
|
386
|
|
|
|
|
|
|
The identifiers should be unique in datatype; that is, in an |
387
|
|
|
|
|
|
|
actor/movie relationship, "Kevin Bacon" can be both the name of an |
388
|
|
|
|
|
|
|
actor and a movie. |
389
|
|
|
|
|
|
|
|
390
|
|
|
|
|
|
|
A linked data type must return identifiers that relate across the |
391
|
|
|
|
|
|
|
link; that is, for an actor/movie relationship, an actor subroutine |
392
|
|
|
|
|
|
|
should return movies, and a movie subroutine should return actors. |
393
|
|
|
|
|
|
|
|
394
|
|
|
|
|
|
|
Additional arguments can be provided; these will be stored in the |
395
|
|
|
|
|
|
|
object and passed through as the second and further arguments to |
396
|
|
|
|
|
|
|
the subroutine. This may be useful, for example, if you're using |
397
|
|
|
|
|
|
|
some form of results caching and need to pass a Cd handle |
398
|
|
|
|
|
|
|
around. |
399
|
|
|
|
|
|
|
|
400
|
|
|
|
|
|
|
If you return explicit undef, please set C<$Algorithm::SixDegrees::ERROR> |
401
|
|
|
|
|
|
|
with an error code. Explicit undef means that an error occurred |
402
|
|
|
|
|
|
|
that should terminate the search; it should be returned as a |
403
|
|
|
|
|
|
|
one-element list. |
404
|
|
|
|
|
|
|
|
405
|
|
|
|
|
|
|
=head1 AUTHOR |
406
|
|
|
|
|
|
|
|
407
|
|
|
|
|
|
|
Pete Krawczyk, C<< >> |
408
|
|
|
|
|
|
|
|
409
|
|
|
|
|
|
|
=head1 BUGS |
410
|
|
|
|
|
|
|
|
411
|
|
|
|
|
|
|
Please report any bugs or feature requests to |
412
|
|
|
|
|
|
|
C, or through the web interface at |
413
|
|
|
|
|
|
|
L. I will be notified, and then you'll automatically |
414
|
|
|
|
|
|
|
be notified of progress on your bug as I make changes. |
415
|
|
|
|
|
|
|
|
416
|
|
|
|
|
|
|
=head1 ACKNOWLEDGEMENTS |
417
|
|
|
|
|
|
|
|
418
|
|
|
|
|
|
|
Andy Lester and Ricardo Signes wrote Module::Starter, which helped |
419
|
|
|
|
|
|
|
get the framework up and running fairly quickly. |
420
|
|
|
|
|
|
|
|
421
|
|
|
|
|
|
|
Brad Fitzpatrick of L for giving me access |
422
|
|
|
|
|
|
|
to a LiveJournal interface to determine linking information on that |
423
|
|
|
|
|
|
|
site, which enabled me to write the algorithm that has been reduced |
424
|
|
|
|
|
|
|
into this module. |
425
|
|
|
|
|
|
|
|
426
|
|
|
|
|
|
|
=head1 COPYRIGHT & LICENSE |
427
|
|
|
|
|
|
|
|
428
|
|
|
|
|
|
|
Copyright 2005 Pete Krawczyk, All Rights Reserved. |
429
|
|
|
|
|
|
|
|
430
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify it |
431
|
|
|
|
|
|
|
under the same terms as Perl itself. |
432
|
|
|
|
|
|
|
|
433
|
|
|
|
|
|
|
=cut |
434
|
|
|
|
|
|
|
|
435
|
|
|
|
|
|
|
1; # End of Algorithm::SixDegrees |