line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package MogileFS::Worker;
use strict;

# Per-object fields, declared through the 'fields' pragma.
use fields (
    'psock',             # socket for parent/child communications
    'last_bcast_state',  # "{device|host}-$devid" => [$time, {alive|dead}]
    'readbuf',           # unparsed data from parent
    'monitor_has_run',   # true once we've heard of the monitor job being alive
    'last_ping',         # time we last said we're alive
    'woken_up',          # bool: if we've been woken up
    'last_wake',         # hashref: { $class -> time() } when we last woke up a certain job class
    'queue_depth',       # depth of a queue we queried
    'queue_todo',        # aref of hrefs of work sent from parent
);

use MogileFS::Util qw(error eurl decode_url_args apply_state_events);
use MogileFS::Server;

# Package globals.
use vars (
    '$got_live_vs_die',  # local'ized scalarref flag for whether we've
                         # gotten a live-vs-die instruction from parent
);
|
21
|
|
|
|
|
28
|
|
21
|
|
|
|
|
|
|
|
22
|
|
|
|
|
|
|
# Constructor.
#
# May be invoked on the class name (a fresh fields-based object is
# allocated) or on an already-allocated object, which is then initialised
# in place.  $psock is the socket used to talk to the parent process; it is
# switched to non-blocking mode before the object is returned.
sub new {
    my ($proto, $psock) = @_;
    my $self = ref $proto ? $proto : fields::new($proto);

    # channel to the parent and the buffer for not-yet-parsed input
    $self->{psock}   = $psock;
    $self->{readbuf} = '';

    # bookkeeping state
    $self->{last_bcast_state} = {};
    $self->{monitor_has_run}  = MogileFS::ProcManager->is_monitor_good;
    $self->{last_ping}        = 0;
    $self->{last_wake}        = {};
    $self->{queue_depth}      = {};
    $self->{queue_todo}       = {};

    IO::Handle::blocking($psock, 0);
    return $self;
}
38
|
|
|
|
|
|
|
|
39
|
|
|
|
|
|
|
# Returns the file descriptor number of the socket to the parent.
sub psock_fd {
    my ($self) = @_;
    my $sock = $self->{psock};
    return fileno($sock);
}
43
|
|
|
|
|
|
|
|
44
|
|
|
|
|
|
|
# Accessor: returns the socket to the parent process.
sub psock {
    my ($self) = @_;
    return $self->{psock};
}
48
|
|
|
|
|
|
|
|
49
|
|
|
|
|
|
|
# Thin delegate: ignores its invocant and arguments and returns whatever
# Mgd::validate_dbh() returns (calling context is passed straight through).
sub validate_dbh {
    return Mgd::validate_dbh();
}
52
|
|
|
|
|
|
|
|
53
|
|
|
|
|
|
|
# Returns 1 if the monitor_has_run flag is set on this worker, else 0.
sub monitor_has_run {
    my ($self) = @_;
    return 1 if $self->{monitor_has_run};
    return 0;
}
57
|
|
|
|
|
|
|
|
58
|
|
|
|
|
|
|
# Clears the monitor_has_run flag (sets it to 0); returns the new value.
sub forget_that_monitor_has_run {
    my ($self) = @_;
    return $self->{monitor_has_run} = 0;
}
62
|
|
|
|
|
|
|
|
63
|
|
|
|
|
|
|
# Loops until monitor_has_run() reports true.  Each iteration reads from
# the parent with a timeout argument of 1 and then calls still_alive().
sub wait_for_monitor {
    my ($self) = @_;
    until ($self->monitor_has_run) {
        $self->read_from_parent(1);
        $self->still_alive;
    }
}
70
|
|
|
|
|
|
|
|
71
|
|
|
|
|
|
|
# Heartbeat helper: workers call this just to write something to the
# parent so they don't get killed (during idle/slow operation, say).
# A ":still_alive" message is sent only when more than a quarter of
# watchdog_timeout has elapsed since the last one.
# Returns the current time, so the caller can avoid a time() call of its
# own in its loop.
sub still_alive {
    my ($self) = @_;
    my $now = time();

    my $next_ping_due = $self->{last_ping} + ($self->watchdog_timeout / 4);
    return $now unless $now > $next_ping_due;

    $self->send_to_parent(":still_alive");  # a no-op, just for the watchdog
    $self->{last_ping} = $now;
    return $now;
}
83
|
|
|
|
|
|
|
|
84
|
|
|
|
|
|
|
# Writes one message line (the first argument, with "\r\n" appended) to the
# parent socket, retrying on short writes / EAGAIN until all of it is out.
#
# Can be called as an object method, or as a package method
# (MogileFS::Worker->send_to_parent(...)); in the latter case the object is
# taken from MogileFS::ProcManager->is_child, and the call returns
# immediately (bare return) if that yields a false value.
#
# Returns 1 once the whole message has been written.
# Dies if syswrite fails with anything other than EAGAIN, or if the socket
# does not become writable within 30 seconds.
sub send_to_parent {
    my $self = shift;

    # can be called as package method:  MogileFS::Worker->send_to_parent...
    unless (ref $self) {
        $self = MogileFS::ProcManager->is_child
            or return;
    }

    my $write    = "$_[0]\r\n";
    my $totallen = length $write;
    my $psock    = $self->{psock};

    my $rv = syswrite($psock, $write);
    return 1 if defined $rv && $rv == $totallen;

    # $! is only meaningful when syswrite itself failed (returned undef).
    # After a short but successful write it may still hold a stale value
    # from some earlier call, which must not be treated as an error.
    die "Error writing to parent process: $!"
        if !defined $rv && !$!{EAGAIN};

    my $offset = $rv || 0;   # could've been undef, if EAGAIN immediately.
    my $remain = $totallen - $offset;

    while ($remain > 0) {
        MogileFS::Util::wait_for_writeability(fileno($psock), 30)
            or die "Parent not writable in 30 seconds";

        $rv = syswrite($psock, $write, $remain, $offset);
        unless (defined $rv) {
            die "Error writing to parent process (in loop): $!"
                unless $!{EAGAIN};
            next;   # would block: wait for writeability again
        }

        $remain -= $rv;
        $offset += $rv;
    }

    die "remain is negative: $remain" if $remain < 0;
    return 1;
}
116
|
|
|
|
|
|
|
|
117
|
|
|
|
|
|
|
# Watchdog timeout used by still_alive() to decide how often to ping the
# parent.  This base implementation always returns 10.
# override in children
sub watchdog_timeout {
    my $default_timeout = 10;
    return $default_timeout;
}
121
|
|
|
|
|
|
|
|
122
|
|
|
|
|
|
|
# should be overridden by workers to process worker-specific directives
# from the parent process.  return 1 if you recognize the command, 0 otherwise.
#
# Called as $self->process_line($lineref).  This base implementation
# recognises nothing: both arguments are ignored and 0 is returned.
sub process_line {
    return 0;
}
128
|
|
|
|
|
|
|
|
129
|
|
|
|
|
|
|
# Drains whatever the parent has sent on the socket and dispatches it
# line by line.
#
# $timeout (optional, default 0) is passed to wait_for_readability for the
# first read only; subsequent reads use a timeout of 0.
#
# Each complete line (terminated by \n, optional \r stripped) is offered
# first to process_generic_command and then to process_line; if neither
# accepts it, an "Unrecognized command" error is reported via error().
# Incomplete trailing data stays in the readbuf field for the next call.
#
# Dies on EOF from the parent or on a read error.
sub read_from_parent {
    my ($self, $timeout) = @_;
    $timeout ||= 0;
    my $psock = $self->{psock};

    # while things are immediately available,
    # (or optionally sleep a bit)
    while (MogileFS::Util::wait_for_readability(fileno($psock), $timeout)) {
        $timeout = 0; # only wait on the timeout for the first read.

        my $buf;
        my $nread = sysread($psock, $buf, Mgd::UNIX_RCVBUF_SIZE());
        die "Error reading pipe from parent: $!\n"
            unless defined $nread;
        die "While reading pipe from parent, got EOF. Parent's gone. Quitting.\n"
            unless $nread;

        if ($Mgd::POST_SLEEP_DEBUG) {
            (my $out = $buf) =~ s/\s+$//;
            warn "proc ${self}[$$] read: [$out]\n";
        }
        $self->{readbuf} .= $buf;

        # peel complete lines off the front of the buffer
        while ($self->{readbuf} =~ s/^(.+?)\r?\n//) {
            my $line = $1;

            next if $self->process_generic_command(\$line);
            next if $self->process_line(\$line);
            error("Unrecognized command from parent: $line");
        }
    }
}
166
|
|
|
|
|
|
|
|
167
|
|
|
|
|
|
|
# Sends ":ping" to the parent and waits for a live-vs-die answer.
#
# While waiting, the package global $got_live_vs_die is local'ized to a
# reference to a private flag; process_generic_command sets that flag when
# it sees ":stay_alive" (or ":shutdown", which then exits the process).
#
# Returns (bare return) as soon as the flag is set.  Between polls it
# sleeps 0.2 seconds; after more than 5 unanswered polls it warns on every
# poll, and after more than 20 it dies.  Also dies if called while another
# parent_ping is already in progress.
sub parent_ping {
    my $self = shift;
    $self->send_to_parent(':ping');

    my $got_reply = 0;
    die "recursive parent_ping!" if $got_live_vs_die;
    local $got_live_vs_die = \$got_reply;

    my $loops = 0;

    while (!$got_reply) {
        $self->read_from_parent;
        return if $got_reply;

        $loops++;
        select undef, undef, undef, 0.20;
        if ($loops > 5) {
            warn "No simple reply from parent to child $self [$$] in $loops 0.2second loops.\n";
            die "No answer in 4 seconds from parent to child $self [$$], dying" if $loops > 20;
        }
    }
}
190
|
|
|
|
|
|
|
|
191
|
|
|
|
|
|
|
# tries to parse generic (not job-specific) commands sent from parent
# to child.  returns 1 on success, or 0 if command given isn't generic,
# and child should parse.
# lineref doesn't have \r\n at end.
#
# Commands handled here (each matched as a prefix of the line):
#   :shutdown                          flag a pending parent_ping as answered, then exit(0)
#   :stay_alive                        flag a pending parent_ping as answered
#   :monitor_events ...                hand the line to apply_state_events()
#   :monitor_has_run                   set the monitor_has_run field
#   :wake_up                           set the woken_up field
#   :set_config_from_parent KEY VALUE  store config without re-broadcasting
#   :queue_depth NAME DEPTH            record the depth via queue_depth()
#   :queue_todo NAME ENCODED_ITEM      decode the item and append it via queue_todo()
# Any other line (including unknown colon-commands) yields 0.
sub process_generic_command {
    my ($self, $lineref) = @_;
    return 0 unless $$lineref =~ /^:/;  # all generic commands start with colon

    if ($$lineref =~ /^:shutdown/) {
        $$got_live_vs_die = 1 if $got_live_vs_die;
        exit 0;
    }

    if ($$lineref =~ /^:stay_alive/) {
        $$got_live_vs_die = 1 if $got_live_vs_die;
        return 1;
    }

    if ($$lineref =~ /^:monitor_events/) {
        apply_state_events($lineref);
        return 1;
    }

    if ($$lineref =~ /^:monitor_has_run/) {
        $self->{monitor_has_run} = 1;
        return 1;
    }

    if ($$lineref =~ /^:wake_up/) {
        $self->{woken_up} = 1;
        return 1;
    }

    # In the handlers below the captures are copied into lexicals before
    # any call is made: $1/$2 passed directly would be aliased in the
    # callee's @_ and could change under it if the callee runs a regex.

    if ($$lineref =~ /^:set_config_from_parent (\S+) (.+)/) {
        my ($key, $value) = ($1, $2);
        # the 'no_broadcast' API keeps us from looping forever.
        MogileFS::Config->set_config_no_broadcast($key, $value);
        return 1;
    }

    # queue_name depth
    if ($$lineref =~ /^:queue_depth (\w+) (\d+)/) {
        my ($queue, $depth) = ($1, $2);
        $self->queue_depth($queue, $depth);
        return 1;
    }

    # queue_name encoded_item
    if ($$lineref =~ /^:queue_todo (\w+) (.+)/) {
        my ($queue, $encoded) = ($1, $2);
        $self->queue_todo($queue, decode_url_args(\$encoded));
        return 1;
    }

    # TODO: warn on unknown commands?

    return 0;
}
247
|
|
|
|
|
|
|
|
248
|
|
|
|
|
|
|
# Combined getter/setter for the recorded depth of queue $type.
#   $self->queue_depth($type)          returns the stored depth (0 if none yet)
#   $self->queue_depth($type, $depth)  stores $depth and returns it
sub queue_depth {
    my MogileFS::Worker $self = shift;
    my ($type, @new_depth) = @_;

    my $depths = $self->{queue_depth} ||= {};
    $depths->{$type} ||= 0;
    $depths->{$type} = $new_depth[0] if @new_depth;
    return $depths->{$type};
}
255
|
|
|
|
|
|
|
|
256
|
|
|
|
|
|
|
# Accessor for the list of pending work items of queue $type.
# Any further arguments are appended to that list first.
# Returns the array reference itself (created empty on first use), so
# callers can manipulate the queue in place.
sub queue_todo {
    my MogileFS::Worker $self = shift;
    my ($type, @items) = @_;

    my $todo = $self->{queue_todo}->{$type} ||= [];
    push @$todo, @items if @items;
    return $todo;
}
263
|
|
|
|
|
|
|
|
264
|
|
|
|
|
|
|
# Returns the current value of the woken_up flag.
sub was_woken_up {
    my MogileFS::Worker $self = $_[0];
    return $self->{woken_up};
}
268
|
|
|
|
|
|
|
|
269
|
|
|
|
|
|
|
# Resets the woken_up flag to 0; returns the new value.
sub forget_woken_up {
    my MogileFS::Worker $self = $_[0];
    return $self->{woken_up} = 0;
}
273
|
|
|
|
|
|
|
|
274
|
|
|
|
|
|
|
# Asks the parent (via ":wake_a $class") to wake a worker of job class
# $class.
# don't wake processes more than once a second... not necessary:
# if a wake-up for this class was already sent during the current
# time() second, nothing is sent and the call returns empty.
sub wake_a {
    my ($self, $class) = @_;
    my $now = time();

    my $last_sent = $self->{last_wake}{$class} || 0;
    return if $last_sent == $now;

    $self->{last_wake}{$class} = $now;
    return $self->send_to_parent(":wake_a $class");
}
282
|
|
|
|
|
|
|
|
283
|
|
|
|
|
|
|
1; |
284
|
|
|
|
|
|
|
|
285
|
|
|
|
|
|
|
# Local Variables: |
286
|
|
|
|
|
|
|
# mode: perl |
287
|
|
|
|
|
|
|
# c-basic-indent: 4 |
288
|
|
|
|
|
|
|
# indent-tabs-mode: nil |
289
|
|
|
|
|
|
|
# End: |
290
|
|
|
|
|
|
|
|