line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package Net::CascadeCopy; |
2
|
34
|
|
|
34
|
|
929403
|
use strict; |
|
34
|
|
|
|
|
78
|
|
|
34
|
|
|
|
|
1154
|
|
3
|
34
|
|
|
34
|
|
198
|
use warnings; |
|
34
|
|
|
|
|
45
|
|
|
34
|
|
|
|
|
1540
|
|
4
|
|
|
|
|
|
|
|
5
|
|
|
|
|
|
|
our $VERSION = '0.2.6'; # VERSION |
6
|
|
|
|
|
|
|
|
7
|
34
|
|
|
34
|
|
32726
|
use Mouse; |
|
34
|
|
|
|
|
1404456
|
|
|
34
|
|
|
|
|
238
|
|
8
|
|
|
|
|
|
|
|
9
|
34
|
|
|
34
|
|
82867
|
use Benchmark; |
|
34
|
|
|
|
|
332813
|
|
|
34
|
|
|
|
|
290
|
|
10
|
34
|
|
|
34
|
|
54485
|
use Log::Log4perl qw(:easy); |
|
34
|
|
|
|
|
2335723
|
|
|
34
|
|
|
|
|
253
|
|
11
|
34
|
|
|
34
|
|
53643
|
use POSIX ":sys_wait_h"; # imports WNOHANG |
|
34
|
|
|
|
|
329619
|
|
|
34
|
|
|
|
|
269
|
|
12
|
34
|
|
|
34
|
|
101649
|
use Proc::Queue size => 32, debug => 0, trace => 0, delay => 1; |
|
34
|
|
|
|
|
563965
|
|
|
34
|
|
|
|
|
4911
|
|
13
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
my $logger = get_logger( 'default' ); |
15
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
has data => ( is => 'ro', isa => 'HashRef', default => sub { return {} } ); |
17
|
|
|
|
|
|
|
|
18
|
|
|
|
|
|
|
has total_time => ( is => 'rw', isa => 'Num', default => 0 ); |
19
|
|
|
|
|
|
|
|
20
|
|
|
|
|
|
|
has ssh => ( is => 'ro', isa => 'Str', default => "ssh" ); |
21
|
|
|
|
|
|
|
has ssh_args => ( is => 'ro', isa => 'Str', default => "-x -A" ); |
22
|
|
|
|
|
|
|
|
23
|
|
|
|
|
|
|
has command => ( is => 'ro', isa => 'Str', required => 1 ); |
24
|
|
|
|
|
|
|
has command_args => ( is => 'ro', isa => 'Str', default => "" ); |
25
|
|
|
|
|
|
|
|
26
|
|
|
|
|
|
|
has source_path => ( is => 'ro', isa => 'Str', required => 1 ); |
27
|
|
|
|
|
|
|
has target_path => ( is => 'ro', isa => 'Str', required => 1 ); |
28
|
|
|
|
|
|
|
|
29
|
|
|
|
|
|
|
has output => ( is => 'ro', isa => 'Str', default => "" ); |
30
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
# maximum number of failures per server |
32
|
|
|
|
|
|
|
has max_failures => ( is => 'ro', isa => 'Num', default => 3 ); |
33
|
|
|
|
|
|
|
|
34
|
|
|
|
|
|
|
# maximum processes per remote server |
35
|
|
|
|
|
|
|
has max_forks => ( is => 'ro', isa => 'Num', default => 2 ); |
36
|
|
|
|
|
|
|
|
37
|
|
|
|
|
|
|
# keep track of child processes |
38
|
|
|
|
|
|
|
has children => ( is => 'ro', isa => 'HashRef', default => sub { return {} } ); |
39
|
|
|
|
|
|
|
|
40
|
|
|
|
|
|
|
# for testing purposes |
41
|
|
|
|
|
|
|
has transfer_map => ( is => 'ro', isa => 'HashRef', default => sub { return {} } ); |
42
|
|
|
|
|
|
|
|
43
|
|
|
|
|
|
|
# sort order |
44
|
|
|
|
|
|
|
has sort_order => ( is => 'ro', isa => 'HashRef', default => sub { return {} } ); |
45
|
|
|
|
|
|
|
|
46
|
|
|
|
|
|
|
sub add_group { |
47
|
47
|
|
|
47
|
1
|
517
|
my ( $self, $group, $servers_a ) = @_; |
48
|
|
|
|
|
|
|
|
49
|
47
|
|
|
|
|
474
|
$logger->info( "Adding group: $group: ", |
50
|
|
|
|
|
|
|
join( ", ", @$servers_a ), |
51
|
|
|
|
|
|
|
); |
52
|
|
|
|
|
|
|
|
53
|
|
|
|
|
|
|
# initialize data structures |
54
|
47
|
|
|
|
|
706
|
for my $server ( @{ $servers_a } ) { |
|
47
|
|
|
|
|
133
|
|
55
|
253
|
|
|
|
|
1012
|
$self->data->{remaining}->{ $group }->{$server} = 1; |
56
|
|
|
|
|
|
|
|
57
|
253
|
100
|
|
|
|
870
|
unless ( defined $self->sort_order->{ $group }->{ $server } ) { |
58
|
252
|
|
|
|
|
272
|
$self->sort_order->{ $group }->{ $server } = scalar keys %{ $self->sort_order->{ $group } }; |
|
252
|
|
|
|
|
1417
|
|
59
|
|
|
|
|
|
|
} |
60
|
|
|
|
|
|
|
} |
61
|
|
|
|
|
|
|
|
62
|
|
|
|
|
|
|
# first server to transfer from is the current server |
63
|
47
|
|
|
|
|
745
|
$self->data->{available}->{ $group }->{localhost} = 1; |
64
|
|
|
|
|
|
|
|
65
|
|
|
|
|
|
|
# initialize data structures |
66
|
47
|
|
|
|
|
1234
|
$self->data->{completed}->{ $group } = []; |
67
|
|
|
|
|
|
|
|
68
|
|
|
|
|
|
|
} |
69
|
|
|
|
|
|
|
|
70
|
|
|
|
|
|
|
sub get_groups { |
71
|
6
|
|
|
6
|
1
|
20
|
my ( $self ) = @_; |
72
|
|
|
|
|
|
|
|
73
|
6
|
|
|
|
|
17
|
my @groups; |
74
|
|
|
|
|
|
|
|
75
|
6
|
|
|
|
|
43
|
for my $group ( keys %{ $self->sort_order } ) { |
|
6
|
|
|
|
|
63
|
|
76
|
7
|
|
|
|
|
43
|
push @groups, $group; |
77
|
|
|
|
|
|
|
} |
78
|
|
|
|
|
|
|
|
79
|
6
|
|
|
|
|
29
|
return @groups; |
80
|
|
|
|
|
|
|
} |
81
|
|
|
|
|
|
|
|
82
|
|
|
|
|
|
|
sub transfer { |
83
|
11
|
|
|
11
|
1
|
33
|
my ( $self ) = @_; |
84
|
|
|
|
|
|
|
|
85
|
11
|
|
|
|
|
99
|
my $transfer_start = new Benchmark; |
86
|
|
|
|
|
|
|
|
87
|
|
|
|
|
|
|
LOOP: |
88
|
11
|
|
|
|
|
352
|
while ( 1 ) { |
89
|
109
|
100
|
|
|
|
1234
|
last LOOP unless $self->_transfer_loop( $transfer_start ); |
90
|
98
|
|
|
|
|
98162482
|
sleep 1; |
91
|
|
|
|
|
|
|
} |
92
|
|
|
|
|
|
|
} |
93
|
|
|
|
|
|
|
|
94
|
|
|
|
|
|
|
sub _transfer_loop { |
95
|
153
|
|
|
153
|
|
16422
|
my ( $self, $transfer_start ) = @_; |
96
|
|
|
|
|
|
|
|
97
|
153
|
|
|
|
|
1122
|
$self->_check_for_completed_processes(); |
98
|
|
|
|
|
|
|
|
99
|
|
|
|
|
|
|
# keep track if there are any remaining servers in any groups |
100
|
153
|
|
|
|
|
317
|
my ( $remaining_flag, $available_flag ); |
101
|
|
|
|
|
|
|
|
102
|
|
|
|
|
|
|
# handle completed processes |
103
|
153
|
100
|
66
|
|
|
375
|
if ( ! scalar keys %{ $self->data->{remaining} } && ! $self->data->{running} ) { |
|
153
|
|
|
|
|
1190
|
|
104
|
6
|
|
|
|
|
96
|
my $transfer_end = new Benchmark; |
105
|
6
|
|
|
|
|
112
|
my $transfer_diff = timediff( $transfer_end, $transfer_start ); |
106
|
6
|
|
|
|
|
228
|
my $transfer_time = $self->_human_friendly_time( $transfer_diff->[0] ); |
107
|
6
|
|
|
|
|
90
|
$logger->warn( "Job completed in $transfer_time" ); |
108
|
|
|
|
|
|
|
|
109
|
6
|
|
|
|
|
80
|
my $total_time = $self->_human_friendly_time( $self->total_time ); |
110
|
6
|
|
|
|
|
45
|
$logger->info ( "Cumulative tansfer time of all jobs: $total_time" ); |
111
|
|
|
|
|
|
|
|
112
|
6
|
|
|
|
|
64
|
my $savings = $self->total_time - $transfer_diff->[0]; |
113
|
6
|
100
|
|
|
|
50
|
if ( $savings ) { |
114
|
2
|
|
|
|
|
6
|
$savings = $self->_human_friendly_time( $savings ); |
115
|
2
|
|
|
|
|
12
|
$logger->info( "Approximate Time Saved: $savings" ); |
116
|
|
|
|
|
|
|
} |
117
|
|
|
|
|
|
|
|
118
|
6
|
|
|
|
|
27
|
my $failure_count; |
119
|
6
|
|
|
|
|
39
|
for my $group ( $self->get_groups() ) { |
120
|
7
|
|
|
|
|
33
|
my ( $errors, $failures ) = $self->_get_failed_count( $group ); |
121
|
7
|
|
|
|
|
27
|
$failure_count += $failures; |
122
|
|
|
|
|
|
|
} |
123
|
|
|
|
|
|
|
|
124
|
6
|
100
|
|
|
|
41
|
if ( $failure_count ) { |
125
|
1
|
|
|
|
|
6
|
$logger->fatal( "$failure_count Fatal Errors" ); |
126
|
|
|
|
|
|
|
} |
127
|
|
|
|
|
|
|
else { |
128
|
5
|
|
|
|
|
23
|
$logger->warn( "Completed successfully" ); |
129
|
|
|
|
|
|
|
} |
130
|
6
|
|
|
|
|
102
|
return; |
131
|
|
|
|
|
|
|
} |
132
|
|
|
|
|
|
|
|
133
|
|
|
|
|
|
|
# start new transfers to remaining servers |
134
|
147
|
|
|
|
|
496
|
for ( 0, 1 ) { |
135
|
|
|
|
|
|
|
# code_smell: start 2 transfers each round to keep the |
136
|
|
|
|
|
|
|
# test cases from breaking. need to refactor test cases! |
137
|
276
|
|
|
|
|
3159
|
for my $group ( $self->_get_remaining_groups() ) { |
138
|
|
|
|
|
|
|
# group contains servers that still need to be tranferred |
139
|
|
|
|
|
|
|
|
140
|
300
|
100
|
|
|
|
2902
|
if ( $self->_get_available_servers( $group ) ) { |
141
|
|
|
|
|
|
|
# reserve a server to start a new transfer from |
142
|
144
|
|
|
|
|
1047
|
my $source = $self->_reserve_available_server( $group ); |
143
|
144
|
|
|
|
|
1417
|
my $target = $self->_reserve_remaining_server( $group ); |
144
|
144
|
|
|
|
|
951
|
$self->_start_process( $group, $source, $target ); |
145
|
|
|
|
|
|
|
} |
146
|
|
|
|
|
|
|
} |
147
|
|
|
|
|
|
|
} |
148
|
|
|
|
|
|
|
|
149
|
121
|
|
|
|
|
3803
|
return 1; |
150
|
|
|
|
|
|
|
} |
151
|
|
|
|
|
|
|
|
152
|
|
|
|
|
|
|
sub _human_friendly_time { |
153
|
95
|
|
|
95
|
|
259
|
my ( $self, $seconds ) = @_; |
154
|
|
|
|
|
|
|
|
155
|
95
|
50
|
|
|
|
457
|
return "0 secs" unless $seconds; |
156
|
|
|
|
|
|
|
|
157
|
95
|
|
|
|
|
188
|
my @time_string; |
158
|
|
|
|
|
|
|
|
159
|
95
|
50
|
|
|
|
506
|
if ( $seconds > 3600 ) { |
160
|
0
|
|
|
|
|
0
|
my $hours = int( $seconds / 3600 ); |
161
|
0
|
|
|
|
|
0
|
$seconds = $seconds % 3600; |
162
|
0
|
|
|
|
|
0
|
push @time_string, "$hours hrs"; |
163
|
|
|
|
|
|
|
} |
164
|
95
|
50
|
|
|
|
507
|
if ( $seconds > 60 ) { |
165
|
0
|
|
|
|
|
0
|
my $minutes = int( $seconds / 60 ); |
166
|
0
|
|
|
|
|
0
|
$seconds = $seconds % 60; |
167
|
0
|
|
|
|
|
0
|
push @time_string, "$minutes mins"; |
168
|
|
|
|
|
|
|
} |
169
|
95
|
50
|
|
|
|
392
|
if ( $seconds ) { |
170
|
95
|
|
|
|
|
328
|
push @time_string, "$seconds secs"; |
171
|
|
|
|
|
|
|
} |
172
|
|
|
|
|
|
|
|
173
|
95
|
|
|
|
|
953
|
return join " ", @time_string; |
174
|
|
|
|
|
|
|
} |
175
|
|
|
|
|
|
|
|
176
|
|
|
|
|
|
|
sub _print_status { |
177
|
82
|
|
|
82
|
|
239
|
my ( $self, $group ) = @_; |
178
|
|
|
|
|
|
|
|
179
|
|
|
|
|
|
|
# completed procs |
180
|
82
|
|
|
|
|
199
|
my $completed = 0; |
181
|
82
|
50
|
|
|
|
461
|
if ( $self->data->{completed}->{ $group } ) { |
182
|
82
|
|
|
|
|
139
|
$completed = scalar @{ $self->data->{completed}->{ $group } }; |
|
82
|
|
|
|
|
764
|
|
183
|
|
|
|
|
|
|
} |
184
|
|
|
|
|
|
|
|
185
|
|
|
|
|
|
|
# running procs |
186
|
82
|
|
|
|
|
176
|
my $running = 0; |
187
|
82
|
50
|
|
|
|
646
|
if ( $self->data->{running} ) { |
188
|
82
|
|
|
|
|
174
|
for my $pid ( keys %{ $self->data->{running} } ) { |
|
82
|
|
|
|
|
463
|
|
189
|
90
|
100
|
|
|
|
831
|
if ( $self->data->{running}->{ $pid }->{group} eq $group ) { |
190
|
57
|
|
|
|
|
253
|
$running++; |
191
|
|
|
|
|
|
|
} |
192
|
|
|
|
|
|
|
} |
193
|
|
|
|
|
|
|
} |
194
|
|
|
|
|
|
|
|
195
|
|
|
|
|
|
|
# unstarted |
196
|
82
|
|
|
|
|
230
|
my $unstarted = 0; |
197
|
82
|
100
|
|
|
|
2166
|
if ( $self->data->{remaining}->{ $group } ) { |
198
|
68
|
|
|
|
|
140
|
$unstarted = scalar keys %{ $self->data->{remaining}->{ $group } }; |
|
68
|
|
|
|
|
300
|
|
199
|
|
|
|
|
|
|
} |
200
|
|
|
|
|
|
|
|
201
|
|
|
|
|
|
|
# failed |
202
|
82
|
|
|
|
|
356
|
my ( $errors, $failures ) = $self->_get_failed_count( $group ); |
203
|
|
|
|
|
|
|
|
204
|
82
|
|
|
|
|
1452
|
$logger->info( "\U$group: ", |
205
|
|
|
|
|
|
|
"completed:$completed ", |
206
|
|
|
|
|
|
|
"running:$running ", |
207
|
|
|
|
|
|
|
"left:$unstarted ", |
208
|
|
|
|
|
|
|
"errors:$errors ", |
209
|
|
|
|
|
|
|
"failures:$failures ", |
210
|
|
|
|
|
|
|
); |
211
|
|
|
|
|
|
|
} |
212
|
|
|
|
|
|
|
|
213
|
|
|
|
|
|
|
sub _start_process { |
214
|
144
|
|
|
144
|
|
389
|
my ( $self, $group, $source, $target ) = @_; |
215
|
|
|
|
|
|
|
|
216
|
144
|
|
|
|
|
819
|
$self->transfer_map->{$source}->{$target} += 1; |
217
|
|
|
|
|
|
|
|
218
|
144
|
|
|
|
|
712
|
my $f=fork; |
219
|
144
|
100
|
66
|
|
|
64285438
|
if (defined ($f) and $f==0) { |
220
|
|
|
|
|
|
|
|
221
|
26
|
|
|
|
|
10334
|
my $target_path = $self->target_path; |
222
|
|
|
|
|
|
|
|
223
|
26
|
|
|
|
|
442
|
my $command; |
224
|
26
|
100
|
|
|
|
1188
|
if ( $source eq "localhost" ) { |
225
|
7
|
|
|
|
|
373
|
$command = join( " ", |
226
|
|
|
|
|
|
|
$self->command, |
227
|
|
|
|
|
|
|
$self->command_args, |
228
|
|
|
|
|
|
|
$self->source_path, |
229
|
|
|
|
|
|
|
"$target:$target_path" |
230
|
|
|
|
|
|
|
); |
231
|
|
|
|
|
|
|
} else { |
232
|
19
|
|
|
|
|
3560
|
$command = join( " ", |
233
|
|
|
|
|
|
|
$self->ssh, |
234
|
|
|
|
|
|
|
$self->ssh_args, |
235
|
|
|
|
|
|
|
$source, |
236
|
|
|
|
|
|
|
$self->command, |
237
|
|
|
|
|
|
|
$self->command_args, |
238
|
|
|
|
|
|
|
$self->target_path, |
239
|
|
|
|
|
|
|
"$target:$target_path" |
240
|
|
|
|
|
|
|
); |
241
|
|
|
|
|
|
|
} |
242
|
|
|
|
|
|
|
|
243
|
26
|
|
|
|
|
10230
|
print "COMMAND: $command\n"; |
244
|
|
|
|
|
|
|
|
245
|
26
|
|
50
|
|
|
1473
|
my $output = $self->output || ""; |
246
|
26
|
50
|
|
|
|
487
|
if ( $output eq "stdout" ) { |
|
|
50
|
|
|
|
|
|
247
|
|
|
|
|
|
|
# don't modify command |
248
|
|
|
|
|
|
|
} elsif ( $output eq "log" ) { |
249
|
|
|
|
|
|
|
# redirect all child output to log |
250
|
0
|
|
|
|
|
0
|
$command = "$command >> ccp.$source.$target.log 2>&1" |
251
|
|
|
|
|
|
|
} else { |
252
|
|
|
|
|
|
|
# default is to redirectout stdout to /dev/null |
253
|
26
|
|
|
|
|
255
|
$command = "$command >/dev/null" |
254
|
|
|
|
|
|
|
} |
255
|
|
|
|
|
|
|
|
256
|
26
|
|
|
|
|
2256
|
$logger->info( "Starting: ($group) $source => $target" ); |
257
|
26
|
|
|
|
|
1654
|
$logger->debug( "Starting new child: $command" ); |
258
|
|
|
|
|
|
|
|
259
|
26
|
|
|
|
|
48281265
|
system( $command ); |
260
|
|
|
|
|
|
|
|
261
|
26
|
50
|
|
|
|
24584
|
if ($? == -1) { |
|
|
50
|
|
|
|
|
|
262
|
0
|
|
|
|
|
0
|
$logger->logconfess( "failed to execute: $!" ); |
263
|
|
|
|
|
|
|
} elsif ($? & 127) { |
264
|
0
|
0
|
|
|
|
0
|
$logger->logconfess( sprintf "child died with signal %d, %s coredump", |
265
|
|
|
|
|
|
|
($? & 127), ($? & 128) ? 'with' : 'without' |
266
|
|
|
|
|
|
|
); |
267
|
|
|
|
|
|
|
} else { |
268
|
26
|
|
|
|
|
379
|
my $exit_status = $? >> 8; |
269
|
26
|
100
|
|
|
|
456
|
if ( $exit_status ) { |
270
|
1
|
|
|
|
|
250
|
$logger->error( "child exit status: $exit_status" ); |
271
|
|
|
|
|
|
|
} |
272
|
26
|
|
|
|
|
13015
|
exit $exit_status; |
273
|
|
|
|
|
|
|
} |
274
|
|
|
|
|
|
|
} else { |
275
|
118
|
|
|
|
|
19273
|
my $start = new Benchmark; |
276
|
118
|
|
|
|
|
50018
|
$self->data->{running}->{ $f } = { group => $group, |
277
|
|
|
|
|
|
|
source => $source, |
278
|
|
|
|
|
|
|
target => $target, |
279
|
|
|
|
|
|
|
start => $start, |
280
|
|
|
|
|
|
|
}; |
281
|
|
|
|
|
|
|
} |
282
|
|
|
|
|
|
|
} |
283
|
|
|
|
|
|
|
|
284
|
|
|
|
|
|
|
sub _check_for_completed_processes { |
285
|
176
|
|
|
176
|
|
492
|
my ( $self ) = @_; |
286
|
|
|
|
|
|
|
|
287
|
176
|
100
|
|
|
|
3098
|
return unless $self->data->{running}; |
288
|
|
|
|
|
|
|
|
289
|
|
|
|
|
|
|
# find any processes that ended and reschedule the source and |
290
|
|
|
|
|
|
|
# target servers in the available pool |
291
|
121
|
|
|
|
|
392
|
for my $pid ( keys %{ $self->data->{running} } ) { |
|
121
|
|
|
|
|
1771
|
|
292
|
237
|
100
|
|
|
|
9041
|
if ( waitpid( $pid, WNOHANG) ) { |
293
|
|
|
|
|
|
|
|
294
|
|
|
|
|
|
|
# check the exit status of the command. |
295
|
82
|
100
|
|
|
|
8894
|
if ( $? ) { |
296
|
1
|
|
|
|
|
10
|
$self->_failed_process( $pid ); |
297
|
|
|
|
|
|
|
} else { |
298
|
81
|
|
|
|
|
676
|
$self->_succeeded_process( $pid ); |
299
|
|
|
|
|
|
|
} |
300
|
|
|
|
|
|
|
} |
301
|
|
|
|
|
|
|
} |
302
|
|
|
|
|
|
|
|
303
|
121
|
100
|
|
|
|
4927
|
unless ( keys %{ $self->data->{running} } ) { |
|
121
|
|
|
|
|
827
|
|
304
|
34
|
|
|
|
|
275
|
delete $self->data->{running}; |
305
|
|
|
|
|
|
|
} |
306
|
|
|
|
|
|
|
} |
307
|
|
|
|
|
|
|
|
308
|
|
|
|
|
|
|
sub _succeeded_process { |
309
|
81
|
|
|
81
|
|
433
|
my ( $self, $pid ) = @_; |
310
|
|
|
|
|
|
|
|
311
|
81
|
|
|
|
|
602
|
my $group = $self->data->{running}->{ $pid }->{group}; |
312
|
81
|
|
|
|
|
441
|
my $source = $self->data->{running}->{ $pid }->{source}; |
313
|
81
|
|
|
|
|
596
|
my $target = $self->data->{running}->{ $pid }->{target}; |
314
|
81
|
|
|
|
|
455
|
my $start = $self->data->{running}->{ $pid }->{start}; |
315
|
|
|
|
|
|
|
|
316
|
|
|
|
|
|
|
# calculate time for this transfer |
317
|
81
|
|
|
|
|
988
|
my $end = new Benchmark; |
318
|
81
|
|
|
|
|
2469
|
my $diff = timediff( $end, $start ); |
319
|
|
|
|
|
|
|
|
320
|
|
|
|
|
|
|
# keep track of transfer time totals |
321
|
81
|
|
|
|
|
5085
|
$self->total_time( $self->total_time + $diff->[0] ); |
322
|
|
|
|
|
|
|
|
323
|
81
|
|
|
|
|
722
|
my $time = $self->_human_friendly_time( $diff->[0] ); |
324
|
81
|
|
|
|
|
6048
|
$logger->warn( "Succeeded: ($group) $source => $target ($time)" ); |
325
|
|
|
|
|
|
|
|
326
|
81
|
|
|
|
|
1815
|
$self->_mark_available( $group, $source ); |
327
|
81
|
|
|
|
|
527
|
$self->_mark_completed( $group, $target ); |
328
|
81
|
|
|
|
|
241
|
$self->_mark_available( $group, $target ); |
329
|
|
|
|
|
|
|
|
330
|
81
|
|
|
|
|
460
|
delete $self->data->{running}->{ $pid }; |
331
|
|
|
|
|
|
|
|
332
|
81
|
|
|
|
|
347
|
$self->_print_status( $group ); |
333
|
|
|
|
|
|
|
} |
334
|
|
|
|
|
|
|
|
335
|
|
|
|
|
|
|
sub _failed_process { |
336
|
1
|
|
|
1
|
|
7
|
my ( $self, $pid ) = @_; |
337
|
|
|
|
|
|
|
|
338
|
1
|
|
|
|
|
8
|
my $group = $self->data->{running}->{ $pid }->{group}; |
339
|
1
|
|
|
|
|
20
|
my $source = $self->data->{running}->{ $pid }->{source}; |
340
|
1
|
|
|
|
|
10
|
my $target = $self->data->{running}->{ $pid }->{target}; |
341
|
1
|
|
|
|
|
8
|
my $start = $self->data->{running}->{ $pid }->{start}; |
342
|
|
|
|
|
|
|
|
343
|
|
|
|
|
|
|
# calculate time for this transfer |
344
|
1
|
|
|
|
|
9
|
my $end = new Benchmark; |
345
|
1
|
|
|
|
|
34
|
my $diff = timediff( $end, $start ); |
346
|
|
|
|
|
|
|
# keep track of transfer time totals |
347
|
1
|
|
|
|
|
61
|
$self->total_time( $self->total_time + $diff->[0] ); |
348
|
|
|
|
|
|
|
|
349
|
1
|
|
|
|
|
24
|
$logger->warn( "Failed: ($group) $source => $target ($diff->[0] seconds)" ); |
350
|
|
|
|
|
|
|
|
351
|
|
|
|
|
|
|
# there was an error during the transfer, reschedule |
352
|
|
|
|
|
|
|
# it at the end of the list |
353
|
1
|
|
|
|
|
23
|
$self->_mark_available( $group, $source ); |
354
|
1
|
|
|
|
|
8
|
my $fail_count = $self->_mark_failed( $group, $target ); |
355
|
1
|
50
|
|
|
|
6
|
if ( ! $self->_get_available_servers( $group ) ) { |
|
|
0
|
|
|
|
|
|
356
|
1
|
|
|
|
|
10
|
$logger->fatal( "Error: no available servers in '$group' to handle $target" ); |
357
|
1
|
|
|
|
|
15
|
$self->_mark_failed( $group, $target, 1 ); |
358
|
|
|
|
|
|
|
} |
359
|
|
|
|
|
|
|
elsif ( $fail_count >= $self->max_failures ) { |
360
|
0
|
|
|
|
|
0
|
$logger->fatal( "Error: giving up on ($group) $target" ); |
361
|
|
|
|
|
|
|
} else { |
362
|
0
|
|
|
|
|
0
|
$self->_mark_remaining( $group, $target ); |
363
|
|
|
|
|
|
|
} |
364
|
|
|
|
|
|
|
|
365
|
1
|
|
|
|
|
6
|
delete $self->data->{running}->{ $pid }; |
366
|
|
|
|
|
|
|
|
367
|
1
|
|
|
|
|
7
|
$self->_print_status( $group ); |
368
|
|
|
|
|
|
|
} |
369
|
|
|
|
|
|
|
|
370
|
|
|
|
|
|
|
sub _get_available_servers { |
371
|
513
|
|
|
513
|
|
1495
|
my ( $self, $group ) = @_; |
372
|
513
|
50
|
|
|
|
4106
|
return unless $self->data->{available}; |
373
|
513
|
50
|
|
|
|
2374
|
return unless $self->data->{available}->{ $group }; |
374
|
|
|
|
|
|
|
|
375
|
513
|
|
|
|
|
880
|
my @available; |
376
|
513
|
|
|
|
|
831
|
for my $host ( $self->_sort_servers( $group, keys %{ $self->data->{available}->{ $group } } ) ) { |
|
513
|
|
|
|
|
5602
|
|
377
|
619
|
100
|
|
|
|
2524
|
if ( $self->children->{$host} ) { |
378
|
258
|
100
|
|
|
|
2866
|
next if $self->children->{$host} >= $self->max_forks; |
379
|
|
|
|
|
|
|
} |
380
|
495
|
|
|
|
|
1985
|
push @available, $host; |
381
|
|
|
|
|
|
|
} |
382
|
|
|
|
|
|
|
|
383
|
513
|
|
|
|
|
3385
|
return @available; |
384
|
|
|
|
|
|
|
} |
385
|
|
|
|
|
|
|
|
386
|
|
|
|
|
|
|
sub _reserve_available_server { |
387
|
144
|
|
|
144
|
|
733
|
my ( $self, $group ) = @_; |
388
|
|
|
|
|
|
|
|
389
|
144
|
|
|
|
|
436
|
my ( $server ) = $self->_get_available_servers( $group ); |
390
|
144
|
|
|
|
|
4318
|
$logger->debug( "Reserving ($group) $server" ); |
391
|
|
|
|
|
|
|
|
392
|
|
|
|
|
|
|
# only one transfer from localhost to each dc |
393
|
144
|
100
|
|
|
|
3336
|
if ( $server eq "localhost" ) { |
394
|
42
|
|
|
|
|
216
|
delete $self->data->{available}->{$group}->{localhost}; |
395
|
|
|
|
|
|
|
} |
396
|
|
|
|
|
|
|
|
397
|
144
|
|
|
|
|
770
|
$self->children->{ $server }++; |
398
|
144
|
|
|
|
|
461
|
return $server; |
399
|
|
|
|
|
|
|
} |
400
|
|
|
|
|
|
|
|
401
|
|
|
|
|
|
|
sub _get_remaining_servers { |
402
|
216
|
|
|
216
|
|
844
|
my ( $self, $group ) = @_; |
403
|
|
|
|
|
|
|
|
404
|
216
|
50
|
|
|
|
4610
|
return unless $self->data->{remaining}; |
405
|
|
|
|
|
|
|
|
406
|
216
|
100
|
|
|
|
1141
|
return unless $self->data->{remaining}->{ $group }; |
407
|
|
|
|
|
|
|
|
408
|
210
|
|
|
|
|
312
|
my @hosts = $self->_sort_servers( $group, keys %{ $self->data->{remaining}->{ $group } } ); |
|
210
|
|
|
|
|
4748
|
|
409
|
210
|
|
|
|
|
2561
|
return @hosts; |
410
|
|
|
|
|
|
|
} |
411
|
|
|
|
|
|
|
|
412
|
|
|
|
|
|
|
sub _sort_servers { |
413
|
867
|
|
|
867
|
|
2946
|
my ( $self, $group, @servers ) = @_; |
414
|
|
|
|
|
|
|
|
415
|
|
|
|
|
|
|
# sort servers based on original insertion order |
416
|
867
|
|
|
|
|
6385
|
@servers = sort { $self->sort_order->{$group}->{$a} <=> $self->sort_order->{$group}->{$b} } @servers; |
|
2751
|
|
|
|
|
11957
|
|
417
|
|
|
|
|
|
|
|
418
|
867
|
|
|
|
|
6621
|
return @servers; |
419
|
|
|
|
|
|
|
} |
420
|
|
|
|
|
|
|
|
421
|
|
|
|
|
|
|
sub _reserve_remaining_server { |
422
|
144
|
|
|
144
|
|
1101
|
my ( $self, $group ) = @_; |
423
|
|
|
|
|
|
|
|
424
|
144
|
50
|
|
|
|
448
|
if ( $self->_get_remaining_servers( $group ) ) { |
425
|
144
|
|
|
|
|
346
|
my $server = ( $self->_sort_servers( $group, keys %{ $self->data->{remaining}->{ $group } } ) )[0]; |
|
144
|
|
|
|
|
891
|
|
426
|
144
|
|
|
|
|
1213
|
delete $self->data->{remaining}->{ $group }->{$server}; |
427
|
144
|
|
|
|
|
1044
|
$logger->debug( "Reserving ($group) $server" ); |
428
|
|
|
|
|
|
|
|
429
|
|
|
|
|
|
|
# delete remaining data structure as groups are completed |
430
|
144
|
100
|
|
|
|
3594
|
unless ( scalar keys %{ $self->data->{remaining}->{ $group } } ) { |
|
144
|
|
|
|
|
1591
|
|
431
|
15
|
|
|
|
|
499
|
$logger->debug( "Group empty: $group" ); |
432
|
15
|
|
|
|
|
258
|
delete $self->data->{remaining}->{ $group }; |
433
|
15
|
100
|
|
|
|
315
|
unless ( scalar ( keys %{ $self->data->{remaining} } ) ) { |
|
15
|
|
|
|
|
163
|
|
434
|
12
|
|
|
|
|
172
|
$logger->debug( "No servers remaining" ); |
435
|
12
|
|
|
|
|
220
|
delete $self->data->{remaining}; |
436
|
|
|
|
|
|
|
} |
437
|
|
|
|
|
|
|
} |
438
|
144
|
|
|
|
|
514
|
return $server; |
439
|
|
|
|
|
|
|
} |
440
|
|
|
|
|
|
|
} |
441
|
|
|
|
|
|
|
|
442
|
|
|
|
|
|
|
sub _get_remaining_groups { |
443
|
276
|
|
|
276
|
|
843
|
my ( $self ) = @_; |
444
|
276
|
100
|
|
|
|
1516
|
return unless $self->data->{remaining}; |
445
|
271
|
|
|
|
|
420
|
my @keys = sort keys %{ $self->data->{remaining} }; |
|
271
|
|
|
|
|
2613
|
|
446
|
271
|
100
|
|
|
|
997
|
return unless scalar @keys; |
447
|
261
|
|
|
|
|
1932
|
return @keys; |
448
|
|
|
|
|
|
|
} |
449
|
|
|
|
|
|
|
|
450
|
|
|
|
|
|
|
sub _mark_available { |
451
|
163
|
|
|
163
|
|
364
|
my ( $self, $group, $server ) = @_; |
452
|
|
|
|
|
|
|
|
453
|
|
|
|
|
|
|
# only the initial transfer to each dc comes from localhost. iff |
454
|
|
|
|
|
|
|
# first transfer (from localhost) succeeded, then don't reschedule |
455
|
|
|
|
|
|
|
# for future syncs |
456
|
163
|
100
|
|
|
|
728
|
if ( $server eq "localhost" ) { |
457
|
|
|
|
|
|
|
|
458
|
34
|
50
|
|
|
|
769
|
if ( $self->data->{completed}->{ $group } ) { |
459
|
|
|
|
|
|
|
|
460
|
34
|
|
|
|
|
203
|
delete $self->data->{available}->{ $group }->{$server}; |
461
|
34
|
|
|
|
|
100
|
return; |
462
|
|
|
|
|
|
|
} |
463
|
|
|
|
|
|
|
} |
464
|
|
|
|
|
|
|
|
465
|
129
|
|
|
|
|
1230
|
$logger->debug( "Server available: ($group) $server" ); |
466
|
129
|
|
|
|
|
1907
|
$self->data->{available}->{ $group }->{$server} = 1; |
467
|
|
|
|
|
|
|
|
468
|
|
|
|
|
|
|
# reduce count of number of active processes on this server |
469
|
129
|
100
|
|
|
|
881
|
if ( $self->children->{$server} ) { |
470
|
48
|
|
|
|
|
759
|
$self->children->{$server}--; |
471
|
|
|
|
|
|
|
} |
472
|
|
|
|
|
|
|
} |
473
|
|
|
|
|
|
|
|
474
|
|
|
|
|
|
|
sub _mark_remaining { |
475
|
0
|
|
|
0
|
|
0
|
my ( $self, $group, $server ) = @_; |
476
|
|
|
|
|
|
|
|
477
|
0
|
|
|
|
|
0
|
$logger->debug( "Server remaining: ($group) $server" ); |
478
|
0
|
|
|
|
|
0
|
$self->data->{remaining}->{ $group }->{$server} = 1; |
479
|
|
|
|
|
|
|
} |
480
|
|
|
|
|
|
|
|
481
|
|
|
|
|
|
|
sub _mark_completed { |
482
|
81
|
|
|
81
|
|
237
|
my ( $self, $group, $server ) = @_; |
483
|
|
|
|
|
|
|
|
484
|
81
|
|
|
|
|
1340
|
$logger->debug( "Server completed: ($group) $server" ); |
485
|
81
|
|
|
|
|
694
|
push @{ $self->data->{completed}->{ $group } }, $server; |
|
81
|
|
|
|
|
544
|
|
486
|
|
|
|
|
|
|
} |
487
|
|
|
|
|
|
|
|
488
|
|
|
|
|
|
|
sub _mark_failed { |
489
|
2
|
|
|
2
|
|
5
|
my ( $self, $group, $server, $fatal ) = @_; |
490
|
|
|
|
|
|
|
|
491
|
2
|
|
|
|
|
12
|
$logger->debug( "Server failed: ($group) $server" ); |
492
|
|
|
|
|
|
|
|
493
|
2
|
100
|
|
|
|
20
|
if ( $fatal ) { |
494
|
1
|
|
|
|
|
23
|
$self->data->{failed}->{ $group }->{ $server } = $self->max_failures; |
495
|
|
|
|
|
|
|
} |
496
|
|
|
|
|
|
|
else { |
497
|
1
|
|
|
|
|
10
|
$self->data->{failed}->{ $group }->{ $server }++; |
498
|
|
|
|
|
|
|
} |
499
|
|
|
|
|
|
|
|
500
|
2
|
|
|
|
|
7
|
my $failures = $self->data->{failed}->{ $group }->{ $server }; |
501
|
2
|
|
|
|
|
10
|
$logger->debug( "$failures failures for ($group) $server" ); |
502
|
2
|
|
|
|
|
23
|
return $failures; |
503
|
|
|
|
|
|
|
} |
504
|
|
|
|
|
|
|
|
505
|
|
|
|
|
|
|
sub _get_failed_count { |
506
|
89
|
|
|
89
|
|
191
|
my ( $self, $group ) = @_; |
507
|
|
|
|
|
|
|
|
508
|
89
|
|
|
|
|
663
|
my $errors = 0; |
509
|
89
|
|
|
|
|
181
|
my $failures = 0; |
510
|
|
|
|
|
|
|
|
511
|
89
|
100
|
66
|
|
|
746
|
if ( $self->data->{failed} && $self->data->{failed}->{ $group } ) { |
512
|
2
|
|
|
|
|
5
|
for my $server ( keys %{ $self->data->{failed}->{ $group }} ) { |
|
2
|
|
|
|
|
17
|
|
513
|
2
|
|
|
|
|
7
|
$errors += $self->data->{failed}->{ $group }->{ $server }; |
514
|
2
|
50
|
|
|
|
12
|
if ( $self->data->{failed}->{ $group }->{ $server } >= $self->max_failures ) { |
515
|
2
|
|
|
|
|
5
|
$failures++; |
516
|
|
|
|
|
|
|
} |
517
|
|
|
|
|
|
|
} |
518
|
|
|
|
|
|
|
} |
519
|
|
|
|
|
|
|
|
520
|
89
|
|
|
|
|
280
|
return ( $errors, $failures ); |
521
|
|
|
|
|
|
|
} |
522
|
|
|
|
|
|
|
|
523
|
|
|
|
|
|
|
# tracing all the attempted transfers |
524
|
|
|
|
|
|
|
sub get_transfer_map { |
525
|
16
|
|
|
16
|
1
|
518
|
my ( $self ) = @_; |
526
|
|
|
|
|
|
|
|
527
|
16
|
|
|
|
|
1381
|
return $self->transfer_map; |
528
|
|
|
|
|
|
|
} |
529
|
|
|
|
|
|
|
|
530
|
|
|
|
|
|
|
|
531
|
|
|
|
|
|
|
1; |
532
|
|
|
|
|
|
|
|
533
|
|
|
|
|
|
|
__END__ |