line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package POE::Component::SmokeBox::Uploads::RSS; |
2
|
|
|
|
|
|
|
|
3
|
1
|
|
|
1
|
|
32198
|
use strict; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
35
|
|
4
|
1
|
|
|
1
|
|
5
|
use warnings; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
26
|
|
5
|
1
|
|
|
1
|
|
5
|
use Carp; |
|
1
|
|
|
|
|
5
|
|
|
1
|
|
|
|
|
87
|
|
6
|
1
|
|
|
1
|
|
896
|
use POE qw(Component::RSSAggregator Component::Client::HTTP); |
|
1
|
|
|
|
|
68525
|
|
|
1
|
|
|
|
|
6
|
|
7
|
|
|
|
|
|
|
use HTTP::Request; |
8
|
|
|
|
|
|
|
use HTML::LinkExtor; |
9
|
|
|
|
|
|
|
use vars qw($VERSION); |
10
|
|
|
|
|
|
|
|
11
|
|
|
|
|
|
|
$VERSION = '1.00'; |
12
|
|
|
|
|
|
|
|
13
|
|
|
|
|
|
|
sub spawn { |
14
|
|
|
|
|
|
|
my $package = shift; |
15
|
|
|
|
|
|
|
my %opts = @_; |
16
|
|
|
|
|
|
|
$opts{lc $_} = delete $opts{$_} for keys %opts; |
17
|
|
|
|
|
|
|
croak "$package requires an 'event' argument\n" unless $opts{event}; |
18
|
|
|
|
|
|
|
$opts{feed} = 'http://search.cpan.org/uploads.rdf' unless $opts{feed}; |
19
|
|
|
|
|
|
|
$opts{name} = 'search-cpan-recent' unless $opts{name}; |
20
|
|
|
|
|
|
|
$opts{delay} = 1800 unless $opts{delay}; |
21
|
|
|
|
|
|
|
my $options = delete $opts{options}; |
22
|
|
|
|
|
|
|
my $self = bless \%opts, $package; |
23
|
|
|
|
|
|
|
$self->{session_id} = POE::Session->create( |
24
|
|
|
|
|
|
|
object_states => [ |
25
|
|
|
|
|
|
|
$self => { shutdown => '_shutdown', }, |
26
|
|
|
|
|
|
|
$self => [ qw(_start _dispatch _feed_url _handle_feed _real_shutdown) ], |
27
|
|
|
|
|
|
|
], |
28
|
|
|
|
|
|
|
heap => $self, |
29
|
|
|
|
|
|
|
( ref($options) eq 'HASH' ? ( options => $options ) : () ), |
30
|
|
|
|
|
|
|
)->ID(); |
31
|
|
|
|
|
|
|
return $self; |
32
|
|
|
|
|
|
|
} |
33
|
|
|
|
|
|
|
|
34
|
|
|
|
|
|
|
sub session_id { |
35
|
|
|
|
|
|
|
return $_[0]->{session_id}; |
36
|
|
|
|
|
|
|
} |
37
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
sub shutdown { |
39
|
|
|
|
|
|
|
my $self = shift; |
40
|
|
|
|
|
|
|
$poe_kernel->post( $self->{session_id}, 'shutdown' ); |
41
|
|
|
|
|
|
|
return; |
42
|
|
|
|
|
|
|
} |
43
|
|
|
|
|
|
|
|
44
|
|
|
|
|
|
|
sub _shutdown { |
45
|
|
|
|
|
|
|
my ($kernel,$self) = @_[KERNEL,OBJECT]; |
46
|
|
|
|
|
|
|
$self->{_shutdown} = 1; |
47
|
|
|
|
|
|
|
return if $self->{_http_requests}; |
48
|
|
|
|
|
|
|
$kernel->yield( '_real_shutdown' ); |
49
|
|
|
|
|
|
|
return; |
50
|
|
|
|
|
|
|
} |
51
|
|
|
|
|
|
|
|
52
|
|
|
|
|
|
|
sub _real_shutdown { |
53
|
|
|
|
|
|
|
my ($kernel,$self) = @_[KERNEL,OBJECT]; |
54
|
|
|
|
|
|
|
$kernel->alias_remove( $_ ) for $kernel->alias_list(); |
55
|
|
|
|
|
|
|
$kernel->refcount_decrement( $self->{session_id}, __PACKAGE__ ) unless $self->{alias}; |
56
|
|
|
|
|
|
|
$kernel->refcount_decrement( $self->{sender_id}, __PACKAGE__ ); |
57
|
|
|
|
|
|
|
$kernel->post( $self->{http_id}, 'shutdown' ) unless $self->{http_alias}; |
58
|
|
|
|
|
|
|
$kernel->post( $self->{rssagg}, 'shutdown' ); |
59
|
|
|
|
|
|
|
return; |
60
|
|
|
|
|
|
|
} |
61
|
|
|
|
|
|
|
|
62
|
|
|
|
|
|
|
sub _start { |
63
|
|
|
|
|
|
|
my ($kernel,$session,$sender,$self) = @_[KERNEL,SESSION,SENDER,OBJECT]; |
64
|
|
|
|
|
|
|
$self->{session_id} = $session->ID(); |
65
|
|
|
|
|
|
|
if ( $kernel == $sender and !$self->{session} ) { |
66
|
|
|
|
|
|
|
croak "Not called from another POE session and 'session' wasn't set\n"; |
67
|
|
|
|
|
|
|
} |
68
|
|
|
|
|
|
|
my $sender_id; |
69
|
|
|
|
|
|
|
if ( $self->{session} ) { |
70
|
|
|
|
|
|
|
if ( my $ref = $kernel->alias_resolve( $self->{session} ) ) { |
71
|
|
|
|
|
|
|
$sender_id = $ref->ID(); |
72
|
|
|
|
|
|
|
} |
73
|
|
|
|
|
|
|
else { |
74
|
|
|
|
|
|
|
croak "Could not resolve 'session' to a valid POE session\n"; |
75
|
|
|
|
|
|
|
} |
76
|
|
|
|
|
|
|
} |
77
|
|
|
|
|
|
|
else { |
78
|
|
|
|
|
|
|
$sender_id = $sender->ID(); |
79
|
|
|
|
|
|
|
} |
80
|
|
|
|
|
|
|
$kernel->refcount_increment( $sender_id, __PACKAGE__ ); |
81
|
|
|
|
|
|
|
$self->{sender_id} = $sender_id; |
82
|
|
|
|
|
|
|
if ( $self->{http_alias} ) { |
83
|
|
|
|
|
|
|
my $http_ref = $kernel->alias_resolve( $self->{http_alias} ); |
84
|
|
|
|
|
|
|
$self->{http_id} = $http_ref->ID() if $http_ref; |
85
|
|
|
|
|
|
|
} |
86
|
|
|
|
|
|
|
unless ( $self->{http_id} ) { |
87
|
|
|
|
|
|
|
$self->{http_id} = 'smokeboxrss' . $$ . $self->{session_id}; |
88
|
|
|
|
|
|
|
POE::Component::Client::HTTP->spawn( |
89
|
|
|
|
|
|
|
Alias => $self->{http_id}, |
90
|
|
|
|
|
|
|
FollowRedirects => 2, |
91
|
|
|
|
|
|
|
Timeout => 60, |
92
|
|
|
|
|
|
|
Agent => 'Mozilla/5.0 (X11; U; Linux i686; en-US; ' |
93
|
|
|
|
|
|
|
. 'rv:1.1) Gecko/20020913 Debian/1.1-1', |
94
|
|
|
|
|
|
|
); |
95
|
|
|
|
|
|
|
} |
96
|
|
|
|
|
|
|
$self->{rssagg} = 'rssagg' . $self->{session_id}; |
97
|
|
|
|
|
|
|
POE::Component::RSSAggregator->new( |
98
|
|
|
|
|
|
|
alias => $self->{rssagg}, |
99
|
|
|
|
|
|
|
callback => $session->postback('_handle_feed'), |
100
|
|
|
|
|
|
|
http_alias => $self->{http_id}, |
101
|
|
|
|
|
|
|
tmpdir => $self->{tmpdir} || '.', # optional caching |
102
|
|
|
|
|
|
|
); |
103
|
|
|
|
|
|
|
my $feed = { |
104
|
|
|
|
|
|
|
url => $self->{feed}, |
105
|
|
|
|
|
|
|
name => $self->{name}, |
106
|
|
|
|
|
|
|
delay => $self->{delay}, |
107
|
|
|
|
|
|
|
}; |
108
|
|
|
|
|
|
|
$kernel->post( $self->{rssagg}, 'add_feed', $feed ); |
109
|
|
|
|
|
|
|
return; |
110
|
|
|
|
|
|
|
} |
111
|
|
|
|
|
|
|
|
112
|
|
|
|
|
|
|
sub _handle_feed { |
113
|
|
|
|
|
|
|
my ($kernel,$self,$feed) = (@_[KERNEL,OBJECT], $_[ARG1]->[0]); |
114
|
|
|
|
|
|
|
for my $headline ( reverse $feed->late_breaking_news ) { |
115
|
|
|
|
|
|
|
$kernel->post( |
116
|
|
|
|
|
|
|
$self->{http_id}, |
117
|
|
|
|
|
|
|
'request', |
118
|
|
|
|
|
|
|
'_feed_url', |
119
|
|
|
|
|
|
|
HTTP::Request->new( GET => $headline->url ), |
120
|
|
|
|
|
|
|
$headline->headline, |
121
|
|
|
|
|
|
|
); |
122
|
|
|
|
|
|
|
$self->{_http_requests}++; |
123
|
|
|
|
|
|
|
} |
124
|
|
|
|
|
|
|
return; |
125
|
|
|
|
|
|
|
} |
126
|
|
|
|
|
|
|
|
127
|
|
|
|
|
|
|
sub _feed_url { |
128
|
|
|
|
|
|
|
my ($kernel,$self,$request_packet,$response_packet) = @_[KERNEL,OBJECT,ARG0,ARG1]; |
129
|
|
|
|
|
|
|
my $http_resp = $response_packet->[0]; |
130
|
|
|
|
|
|
|
$self->{_http_requests}--; |
131
|
|
|
|
|
|
|
return unless $http_resp and $http_resp->code() == 200; |
132
|
|
|
|
|
|
|
my $tag = $request_packet->[1]; |
133
|
|
|
|
|
|
|
my $p = HTML::LinkExtor->new(); |
134
|
|
|
|
|
|
|
$p->parse( $http_resp->content() ); |
135
|
|
|
|
|
|
|
foreach my $link ( $p->links() ) { |
136
|
|
|
|
|
|
|
if ( $link->[0] eq 'a' and $link->[2] =~ /\Q$tag\E/ ) { |
137
|
|
|
|
|
|
|
( my $module = $link->[2] ) =~ s#/CPAN/authors/id/##; |
138
|
|
|
|
|
|
|
$kernel->call( $self->{session_id}, '_dispatch', $module ); |
139
|
|
|
|
|
|
|
last; |
140
|
|
|
|
|
|
|
} |
141
|
|
|
|
|
|
|
} |
142
|
|
|
|
|
|
|
$kernel->yield( '_real_shutdown' ) if $self->{_shutdown} and $self->{_http_requests} == 0; |
143
|
|
|
|
|
|
|
return; |
144
|
|
|
|
|
|
|
} |
145
|
|
|
|
|
|
|
|
146
|
|
|
|
|
|
|
sub _dispatch { |
147
|
|
|
|
|
|
|
my ($kernel,$self,$module) = @_[KERNEL,OBJECT,ARG0]; |
148
|
|
|
|
|
|
|
$kernel->post( $self->{sender_id}, $self->{event}, $module ); |
149
|
|
|
|
|
|
|
return; |
150
|
|
|
|
|
|
|
} |
151
|
|
|
|
|
|
|
|
152
|
|
|
|
|
|
|
"This town ain't big enough for the both of us"; |
153
|
|
|
|
|
|
|
|
154
|
|
|
|
|
|
|
__END__ |