| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
2
|
|
|
2
|
|
10
|
use strict; |
|
|
2
|
|
|
|
|
2
|
|
|
|
2
|
|
|
|
|
73
|
|
|
2
|
2
|
|
|
2
|
|
6
|
use warnings; |
|
|
2
|
|
|
|
|
3
|
|
|
|
2
|
|
|
|
|
60
|
|
|
3
|
2
|
|
|
2
|
|
6
|
no warnings "void"; |
|
|
2
|
|
|
|
|
3
|
|
|
|
2
|
|
|
|
|
88
|
|
|
4
|
|
|
|
|
|
|
|
|
5
|
|
|
|
|
|
|
=head1 NAME |
|
6
|
|
|
|
|
|
|
|
|
7
|
|
|
|
|
|
|
LWP::UserAgent::Paranoid - A modern LWPx::ParanoidAgent for safer requests |
|
8
|
|
|
|
|
|
|
|
|
9
|
|
|
|
|
|
|
=cut |
|
10
|
|
|
|
|
|
|
|
|
11
|
|
|
|
|
|
|
package LWP::UserAgent::Paranoid; |
|
12
|
2
|
|
|
2
|
|
6
|
use base 'LWP::UserAgent'; |
|
|
2
|
|
|
|
|
3
|
|
|
|
2
|
|
|
|
|
1257
|
|
|
13
|
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
our $VERSION = "0.97"; |
|
15
|
|
|
|
|
|
|
|
|
16
|
2
|
|
|
2
|
|
47569
|
use Scalar::Util qw/ refaddr /; |
|
|
2
|
|
|
|
|
7
|
|
|
|
2
|
|
|
|
|
162
|
|
|
17
|
2
|
|
|
2
|
|
11
|
use Time::HiRes qw/ alarm /; |
|
|
2
|
|
|
|
|
3
|
|
|
|
2
|
|
|
|
|
19
|
|
|
18
|
2
|
|
|
2
|
|
3214
|
use LWPx::ParanoidHandler qw//; |
|
|
0
|
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
|
19
|
|
|
|
|
|
|
use Net::DNS::Paranoid qw//; |
|
20
|
|
|
|
|
|
|
use Carp qw//; |
|
21
|
|
|
|
|
|
|
|
|
22
|
|
|
|
|
|
|
=head1 SYNOPSIS |
|
23
|
|
|
|
|
|
|
|
|
24
|
|
|
|
|
|
|
use LWP::UserAgent::Paranoid; |
|
25
|
|
|
|
|
|
|
my $ua = LWP::UserAgent::Paranoid->new( |
|
26
|
|
|
|
|
|
|
request_timeout => 5 # seconds; may be fractional |
|
27
|
|
|
|
|
|
|
); |
|
28
|
|
|
|
|
|
|
|
|
29
|
|
|
|
|
|
|
# use $ua as a normal LWP::UserAgent... |
|
30
|
|
|
|
|
|
|
my $response = $ua->get("http://example.com"); |
|
31
|
|
|
|
|
|
|
|
|
32
|
|
|
|
|
|
|
# allow requests to localhost and 127.0.0.1 |
|
33
|
|
|
|
|
|
|
$ua->whitelisted_hosts('localhost', '127.0.0.1'); |
|
34
|
|
|
|
|
|
|
|
|
35
|
|
|
|
|
|
|
=head1 DESCRIPTION |
|
36
|
|
|
|
|
|
|
|
|
37
|
|
|
|
|
|
|
This module is a more modern L with cleaner internals and |
|
38
|
|
|
|
|
|
|
a very similar feature set. It is a not a drop-in replacement, however, since |
|
39
|
|
|
|
|
|
|
the API differs. |
|
40
|
|
|
|
|
|
|
|
|
41
|
|
|
|
|
|
|
The primary features provided by this module: |
|
42
|
|
|
|
|
|
|
|
|
43
|
|
|
|
|
|
|
=head2 Overall request timeout |
|
44
|
|
|
|
|
|
|
|
|
45
|
|
|
|
|
|
|
A configurable timeout from start to finish of a "logical" request made by |
|
46
|
|
|
|
|
|
|
calling one of L's request methods. It encompasses all |
|
47
|
|
|
|
|
|
|
followed redirects to ensure that you can't be tarpitted by a series of |
|
48
|
|
|
|
|
|
|
stalling redirects. The default is 5 seconds. |
|
49
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
=head2 Blocked private hosts and IP address ranges |
|
51
|
|
|
|
|
|
|
|
|
52
|
|
|
|
|
|
|
All new agents are automatically made paranoid of private hostnames and IP |
|
53
|
|
|
|
|
|
|
address ranges using L. You may access the |
|
54
|
|
|
|
|
|
|
L resolver via the L method in order to |
|
55
|
|
|
|
|
|
|
customize its behaviour. |
|
56
|
|
|
|
|
|
|
|
|
57
|
|
|
|
|
|
|
For simple whitelisting and blacklisting, you may call L or |
|
58
|
|
|
|
|
|
|
L. These methods are proxied to the corresponding methods |
|
59
|
|
|
|
|
|
|
of L. The only difference is that you may pass a list to |
|
60
|
|
|
|
|
|
|
this class' methods. |
|
61
|
|
|
|
|
|
|
|
|
62
|
|
|
|
|
|
|
=head1 EVEN MORE PARANOIA |
|
63
|
|
|
|
|
|
|
|
|
64
|
|
|
|
|
|
|
You may also wish to tune standard L parameters for greater |
|
65
|
|
|
|
|
|
|
paranoria depending on your requirements: |
|
66
|
|
|
|
|
|
|
|
|
67
|
|
|
|
|
|
|
=head2 Maximum number of redirects |
|
68
|
|
|
|
|
|
|
|
|
69
|
|
|
|
|
|
|
Although generally unnecessary given the request timeout, you can tune |
|
70
|
|
|
|
|
|
|
L down from the default of 7. |
|
71
|
|
|
|
|
|
|
|
|
72
|
|
|
|
|
|
|
=head2 Protocols/URI schemes allowed |
|
73
|
|
|
|
|
|
|
|
|
74
|
|
|
|
|
|
|
If you don't want to allow requests for schemes other than http and https, you |
|
75
|
|
|
|
|
|
|
may use L either as a method or as an option |
|
76
|
|
|
|
|
|
|
to I. |
|
77
|
|
|
|
|
|
|
|
|
78
|
|
|
|
|
|
|
$ua->protocols_allowed(["http", "https"]); |
|
79
|
|
|
|
|
|
|
|
|
80
|
|
|
|
|
|
|
=head1 WHY NOT LWPx::ParanoidAgent? |
|
81
|
|
|
|
|
|
|
|
|
82
|
|
|
|
|
|
|
L's implemention involves a 2009-era fork of LWP's http |
|
83
|
|
|
|
|
|
|
and https protocol handlers, and it is no longer maintained. A more |
|
84
|
|
|
|
|
|
|
maintainable approach is taken by this module and L. |
|
85
|
|
|
|
|
|
|
|
|
86
|
|
|
|
|
|
|
=head1 METHODS |
|
87
|
|
|
|
|
|
|
|
|
88
|
|
|
|
|
|
|
All methods from L are available via inheritence. In addition, |
|
89
|
|
|
|
|
|
|
the following methods are available: |
|
90
|
|
|
|
|
|
|
|
|
91
|
|
|
|
|
|
|
=head2 request_timeout |
|
92
|
|
|
|
|
|
|
|
|
93
|
|
|
|
|
|
|
Gets/sets the timeout which encapsulates each logical request, including any |
|
94
|
|
|
|
|
|
|
redirects which are followed. The default is 5 seconds. Fractional seconds |
|
95
|
|
|
|
|
|
|
are OK. |
|
96
|
|
|
|
|
|
|
|
|
97
|
|
|
|
|
|
|
=head2 resolver |
|
98
|
|
|
|
|
|
|
|
|
99
|
|
|
|
|
|
|
Gets the DNS resolver which is used to block private hosts. There is little |
|
100
|
|
|
|
|
|
|
need to set your own but if you do it should be an L |
|
101
|
|
|
|
|
|
|
object. This attribute is read-only, so if you want to replace the resolver |
|
102
|
|
|
|
|
|
|
you need to call L again to create a new L. |
|
103
|
|
|
|
|
|
|
|
|
104
|
|
|
|
|
|
|
Use the blocking and whitelisting methods on the resolver, or this class' |
|
105
|
|
|
|
|
|
|
L and L, to customize the behaviour. |
|
106
|
|
|
|
|
|
|
|
|
107
|
|
|
|
|
|
|
=head2 whitelisted_hosts / blocked_hosts |
|
108
|
|
|
|
|
|
|
|
|
109
|
|
|
|
|
|
|
Accepts a single arrayref and proxies to the method of the same name on the |
|
110
|
|
|
|
|
|
|
L. For convenience, you may pass a list which will be passed as an |
|
111
|
|
|
|
|
|
|
arrayref to the resolver's method. |
|
112
|
|
|
|
|
|
|
|
|
113
|
|
|
|
|
|
|
=cut |
|
114
|
|
|
|
|
|
|
|
|
115
|
|
|
|
|
|
|
sub new { |
|
116
|
|
|
|
|
|
|
my ($class, %opts) = @_; |
|
117
|
|
|
|
|
|
|
|
|
118
|
|
|
|
|
|
|
my $timeout = delete $opts{request_timeout}; |
|
119
|
|
|
|
|
|
|
$timeout = 5 unless $timeout; |
|
120
|
|
|
|
|
|
|
|
|
121
|
|
|
|
|
|
|
my $resolver = delete $opts{resolver}; |
|
122
|
|
|
|
|
|
|
$resolver = Net::DNS::Paranoid->new unless $resolver; |
|
123
|
|
|
|
|
|
|
|
|
124
|
|
|
|
|
|
|
for my $acl (qw(blocked_hosts whitelisted_hosts)) { |
|
125
|
|
|
|
|
|
|
next unless $opts{$acl}; |
|
126
|
|
|
|
|
|
|
$resolver->$acl( delete $opts{$acl} ); |
|
127
|
|
|
|
|
|
|
} |
|
128
|
|
|
|
|
|
|
|
|
129
|
|
|
|
|
|
|
my $self = $class->SUPER::new(%opts); |
|
130
|
|
|
|
|
|
|
$self->request_timeout($timeout); |
|
131
|
|
|
|
|
|
|
$self->_elem("resolver", $resolver); |
|
132
|
|
|
|
|
|
|
|
|
133
|
|
|
|
|
|
|
LWPx::ParanoidHandler::make_paranoid($self, $self->_resolver); |
|
134
|
|
|
|
|
|
|
|
|
135
|
|
|
|
|
|
|
return $self; |
|
136
|
|
|
|
|
|
|
} |
|
137
|
|
|
|
|
|
|
|
|
138
|
|
|
|
|
|
|
sub request_timeout { shift->_elem("request_timeout", @_) } |
|
139
|
|
|
|
|
|
|
sub resolver { |
|
140
|
|
|
|
|
|
|
my $self = shift; |
|
141
|
|
|
|
|
|
|
Carp::croak("resolver is read-only; to use a new resolver, create a new user agent") |
|
142
|
|
|
|
|
|
|
if @_; |
|
143
|
|
|
|
|
|
|
return $self->_resolver; |
|
144
|
|
|
|
|
|
|
} |
|
145
|
|
|
|
|
|
|
sub _resolver { |
|
146
|
|
|
|
|
|
|
shift->_elem("resolver"); |
|
147
|
|
|
|
|
|
|
} |
|
148
|
|
|
|
|
|
|
|
|
149
|
|
|
|
|
|
|
sub blocked_hosts { shift->_resolver->blocked_hosts(ref $_[0] ? $_[0] : \@_) } |
|
150
|
|
|
|
|
|
|
sub whitelisted_hosts { shift->_resolver->whitelisted_hosts(ref $_[0] ? $_[0] : \@_) } |
|
151
|
|
|
|
|
|
|
|
|
152
|
|
|
|
|
|
|
sub __timed_out { Carp::croak("Client timed out request") } |
|
153
|
|
|
|
|
|
|
sub __with_timeout { |
|
154
|
|
|
|
|
|
|
my $method = shift; |
|
155
|
|
|
|
|
|
|
my $self = shift; |
|
156
|
|
|
|
|
|
|
my $SUPER = $self->can("SUPER::$method") |
|
157
|
|
|
|
|
|
|
or Carp::croak("No such method '$method'"); |
|
158
|
|
|
|
|
|
|
|
|
159
|
|
|
|
|
|
|
my $our_alarm = ( |
|
160
|
|
|
|
|
|
|
ref($SIG{ALRM}) eq "CODE" |
|
161
|
|
|
|
|
|
|
and refaddr($SIG{ALRM}) eq refaddr(\&__timed_out) |
|
162
|
|
|
|
|
|
|
); |
|
163
|
|
|
|
|
|
|
|
|
164
|
|
|
|
|
|
|
if (not $our_alarm) { |
|
165
|
|
|
|
|
|
|
local $SIG{ALRM} = \&__timed_out; |
|
166
|
|
|
|
|
|
|
alarm $self->request_timeout; |
|
167
|
|
|
|
|
|
|
my $ret = $self->$SUPER(@_); |
|
168
|
|
|
|
|
|
|
alarm 0; |
|
169
|
|
|
|
|
|
|
return $ret; |
|
170
|
|
|
|
|
|
|
} else { |
|
171
|
|
|
|
|
|
|
return $self->$SUPER(@_); |
|
172
|
|
|
|
|
|
|
} |
|
173
|
|
|
|
|
|
|
}; |
|
174
|
|
|
|
|
|
|
|
|
175
|
|
|
|
|
|
|
sub request { __with_timeout("request", @_) } |
|
176
|
|
|
|
|
|
|
sub simple_request { __with_timeout("simple_request", @_) } |
|
177
|
|
|
|
|
|
|
|
|
178
|
|
|
|
|
|
|
"The truth is out there."; |
|
179
|
|
|
|
|
|
|
|
|
180
|
|
|
|
|
|
|
=head1 CAVEATS |
|
181
|
|
|
|
|
|
|
|
|
182
|
|
|
|
|
|
|
The overall request timeout is implemented using SIGALRM. Any C<$SIG{ALRM}> |
|
183
|
|
|
|
|
|
|
handler from an outer scope is replaced in the scope of |
|
184
|
|
|
|
|
|
|
L requests. |
|
185
|
|
|
|
|
|
|
|
|
186
|
|
|
|
|
|
|
=head1 BUGS |
|
187
|
|
|
|
|
|
|
|
|
188
|
|
|
|
|
|
|
All bugs should be reported via |
|
189
|
|
|
|
|
|
|
L |
|
190
|
|
|
|
|
|
|
or L. |
|
191
|
|
|
|
|
|
|
|
|
192
|
|
|
|
|
|
|
=head1 AUTHOR |
|
193
|
|
|
|
|
|
|
|
|
194
|
|
|
|
|
|
|
Thomas Sibley |
|
195
|
|
|
|
|
|
|
|
|
196
|
|
|
|
|
|
|
=head1 LICENSE AND COPYRIGHT |
|
197
|
|
|
|
|
|
|
|
|
198
|
|
|
|
|
|
|
This software is primarily Copyright (c) 2013 by Best Practical Solutions, |
|
199
|
|
|
|
|
|
|
with parts of it Copyright (c) 2014-2015 by Thomas Sibley. |
|
200
|
|
|
|
|
|
|
|
|
201
|
|
|
|
|
|
|
This is free software, licensed under: |
|
202
|
|
|
|
|
|
|
|
|
203
|
|
|
|
|
|
|
The GNU General Public License, Version 2, June 1991 |
|
204
|
|
|
|
|
|
|
|
|
205
|
|
|
|
|
|
|
=cut |