| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
package WWW::Crawl4AI::Strategy::Browser; |
|
2
|
|
|
|
|
|
|
# ABSTRACT: Crawl4AI strategy with full JS rendering (wait for networkidle) |
|
3
|
2
|
|
|
2
|
|
10
|
use Moo; |
|
|
2
|
|
|
|
|
2
|
|
|
|
2
|
|
|
|
|
9
|
|
|
4
|
2
|
|
|
2
|
|
583
|
use WWW::Crawl4AI::Request (); |
|
|
2
|
|
|
|
|
3
|
|
|
|
2
|
|
|
|
|
238
|
|
|
5
|
|
|
|
|
|
|
with 'WWW::Crawl4AI::Strategy'; |
|
6
|
|
|
|
|
|
|
|
|
7
|
|
|
|
|
|
|
our $VERSION = '0.001'; |
|
8
|
|
|
|
|
|
|
|
|
9
|
|
|
|
|
|
|
|
|
10
|
22
|
|
|
22
|
1
|
70
|
sub name { 'crawl4ai_browser' } |
|
11
|
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
|
|
13
|
5
|
|
|
5
|
1
|
22
|
sub cost_class { 'browser' } |
|
14
|
|
|
|
|
|
|
|
|
15
|
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
sub build_request { |
|
17
|
5
|
|
|
5
|
0
|
10
|
my ( $self, $crawler, $url ) = @_; |
|
18
|
5
|
|
|
|
|
13
|
return $self->_request( |
|
19
|
|
|
|
|
|
|
$url, |
|
20
|
|
|
|
|
|
|
browser => { headless => WWW::Crawl4AI::Request::JSON_true() }, |
|
21
|
|
|
|
|
|
|
crawler => { wait_until => 'networkidle' }, |
|
22
|
|
|
|
|
|
|
); |
|
23
|
|
|
|
|
|
|
} |
|
24
|
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
1; |
|
26
|
|
|
|
|
|
|
|
|
27
|
|
|
|
|
|
|
__END__ |