| line | stmt | bran | cond | sub | pod | time | code | 
| 1 |  |  |  |  |  |  | package POE::Component::SmokeBox::Uploads::RSS; | 
| 2 |  |  |  |  |  |  |  | 
| 3 | 1 |  |  | 1 |  | 32198 | use strict; | 
|  | 1 |  |  |  |  | 2 |  | 
|  | 1 |  |  |  |  | 35 |  | 
| 4 | 1 |  |  | 1 |  | 5 | use warnings; | 
|  | 1 |  |  |  |  | 2 |  | 
|  | 1 |  |  |  |  | 26 |  | 
| 5 | 1 |  |  | 1 |  | 5 | use Carp; | 
|  | 1 |  |  |  |  | 5 |  | 
|  | 1 |  |  |  |  | 87 |  | 
| 6 | 1 |  |  | 1 |  | 896 | use POE qw(Component::RSSAggregator Component::Client::HTTP); | 
|  | 1 |  |  |  |  | 68525 |  | 
|  | 1 |  |  |  |  | 6 |  | 
| 7 |  |  |  |  |  |  | use HTTP::Request; | 
| 8 |  |  |  |  |  |  | use HTML::LinkExtor; | 
| 9 |  |  |  |  |  |  | use vars qw($VERSION); | 
| 10 |  |  |  |  |  |  |  | 
| 11 |  |  |  |  |  |  | $VERSION = '1.00'; | 
| 12 |  |  |  |  |  |  |  | 
| 13 |  |  |  |  |  |  | sub spawn { | 
| 14 |  |  |  |  |  |  | my $package = shift; | 
| 15 |  |  |  |  |  |  | my %opts = @_; | 
| 16 |  |  |  |  |  |  | $opts{lc $_} = delete $opts{$_} for keys %opts; | 
| 17 |  |  |  |  |  |  | croak "$package requires an 'event' argument\n" unless $opts{event}; | 
| 18 |  |  |  |  |  |  | $opts{feed} = 'http://search.cpan.org/uploads.rdf' unless $opts{feed}; | 
| 19 |  |  |  |  |  |  | $opts{name} = 'search-cpan-recent' unless $opts{name}; | 
| 20 |  |  |  |  |  |  | $opts{delay} = 1800 unless $opts{delay}; | 
| 21 |  |  |  |  |  |  | my $options = delete $opts{options}; | 
| 22 |  |  |  |  |  |  | my $self = bless \%opts, $package; | 
| 23 |  |  |  |  |  |  | $self->{session_id} = POE::Session->create( | 
| 24 |  |  |  |  |  |  | object_states => [ | 
| 25 |  |  |  |  |  |  | $self => { shutdown => '_shutdown', }, | 
| 26 |  |  |  |  |  |  | $self => [ qw(_start _dispatch _feed_url _handle_feed _real_shutdown) ], | 
| 27 |  |  |  |  |  |  | ], | 
| 28 |  |  |  |  |  |  | heap => $self, | 
| 29 |  |  |  |  |  |  | ( ref($options) eq 'HASH' ? ( options => $options ) : () ), | 
| 30 |  |  |  |  |  |  | )->ID(); | 
| 31 |  |  |  |  |  |  | return $self; | 
| 32 |  |  |  |  |  |  | } | 
| 33 |  |  |  |  |  |  |  | 
| 34 |  |  |  |  |  |  | sub session_id { | 
| 35 |  |  |  |  |  |  | return $_[0]->{session_id}; | 
| 36 |  |  |  |  |  |  | } | 
| 37 |  |  |  |  |  |  |  | 
| 38 |  |  |  |  |  |  | sub shutdown { | 
| 39 |  |  |  |  |  |  | my $self = shift; | 
| 40 |  |  |  |  |  |  | $poe_kernel->post( $self->{session_id}, 'shutdown' ); | 
| 41 |  |  |  |  |  |  | return; | 
| 42 |  |  |  |  |  |  | } | 
| 43 |  |  |  |  |  |  |  | 
| 44 |  |  |  |  |  |  | sub _shutdown { | 
| 45 |  |  |  |  |  |  | my ($kernel,$self) = @_[KERNEL,OBJECT]; | 
| 46 |  |  |  |  |  |  | $self->{_shutdown} = 1; | 
| 47 |  |  |  |  |  |  | return if $self->{_http_requests}; | 
| 48 |  |  |  |  |  |  | $kernel->yield( '_real_shutdown' ); | 
| 49 |  |  |  |  |  |  | return; | 
| 50 |  |  |  |  |  |  | } | 
| 51 |  |  |  |  |  |  |  | 
| 52 |  |  |  |  |  |  | sub _real_shutdown { | 
| 53 |  |  |  |  |  |  | my ($kernel,$self) = @_[KERNEL,OBJECT]; | 
| 54 |  |  |  |  |  |  | $kernel->alias_remove( $_ ) for $kernel->alias_list(); | 
| 55 |  |  |  |  |  |  | $kernel->refcount_decrement( $self->{session_id}, __PACKAGE__ ) unless $self->{alias}; | 
| 56 |  |  |  |  |  |  | $kernel->refcount_decrement( $self->{sender_id}, __PACKAGE__ ); | 
| 57 |  |  |  |  |  |  | $kernel->post( $self->{http_id}, 'shutdown' ) unless $self->{http_alias}; | 
| 58 |  |  |  |  |  |  | $kernel->post( $self->{rssagg}, 'shutdown' ); | 
| 59 |  |  |  |  |  |  | return; | 
| 60 |  |  |  |  |  |  | } | 
| 61 |  |  |  |  |  |  |  | 
| 62 |  |  |  |  |  |  | sub _start { | 
| 63 |  |  |  |  |  |  | my ($kernel,$session,$sender,$self) = @_[KERNEL,SESSION,SENDER,OBJECT]; | 
| 64 |  |  |  |  |  |  | $self->{session_id} = $session->ID(); | 
| 65 |  |  |  |  |  |  | if ( $kernel == $sender and !$self->{session} ) { | 
| 66 |  |  |  |  |  |  | croak "Not called from another POE session and 'session' wasn't set\n"; | 
| 67 |  |  |  |  |  |  | } | 
| 68 |  |  |  |  |  |  | my $sender_id; | 
| 69 |  |  |  |  |  |  | if ( $self->{session} ) { | 
| 70 |  |  |  |  |  |  | if ( my $ref = $kernel->alias_resolve( $self->{session} ) ) { | 
| 71 |  |  |  |  |  |  | $sender_id = $ref->ID(); | 
| 72 |  |  |  |  |  |  | } | 
| 73 |  |  |  |  |  |  | else { | 
| 74 |  |  |  |  |  |  | croak "Could not resolve 'session' to a valid POE session\n"; | 
| 75 |  |  |  |  |  |  | } | 
| 76 |  |  |  |  |  |  | } | 
| 77 |  |  |  |  |  |  | else { | 
| 78 |  |  |  |  |  |  | $sender_id = $sender->ID(); | 
| 79 |  |  |  |  |  |  | } | 
| 80 |  |  |  |  |  |  | $kernel->refcount_increment( $sender_id, __PACKAGE__ ); | 
| 81 |  |  |  |  |  |  | $self->{sender_id} = $sender_id; | 
| 82 |  |  |  |  |  |  | if ( $self->{http_alias} ) { | 
| 83 |  |  |  |  |  |  | my $http_ref = $kernel->alias_resolve( $self->{http_alias} ); | 
| 84 |  |  |  |  |  |  | $self->{http_id} = $http_ref->ID() if $http_ref; | 
| 85 |  |  |  |  |  |  | } | 
| 86 |  |  |  |  |  |  | unless ( $self->{http_id} ) { | 
| 87 |  |  |  |  |  |  | $self->{http_id} = 'smokeboxrss' . $$ . $self->{session_id}; | 
| 88 |  |  |  |  |  |  | POE::Component::Client::HTTP->spawn( | 
| 89 |  |  |  |  |  |  | Alias           => $self->{http_id}, | 
| 90 |  |  |  |  |  |  | FollowRedirects => 2, | 
| 91 |  |  |  |  |  |  | Timeout         => 60, | 
| 92 |  |  |  |  |  |  | Agent           => 'Mozilla/5.0 (X11; U; Linux i686; en-US; ' | 
| 93 |  |  |  |  |  |  | . 'rv:1.1) Gecko/20020913 Debian/1.1-1', | 
| 94 |  |  |  |  |  |  | ); | 
| 95 |  |  |  |  |  |  | } | 
| 96 |  |  |  |  |  |  | $self->{rssagg} = 'rssagg' . $self->{session_id}; | 
| 97 |  |  |  |  |  |  | POE::Component::RSSAggregator->new( | 
| 98 |  |  |  |  |  |  | alias    => $self->{rssagg}, | 
| 99 |  |  |  |  |  |  | callback => $session->postback('_handle_feed'), | 
| 100 |  |  |  |  |  |  | http_alias => $self->{http_id}, | 
| 101 |  |  |  |  |  |  | tmpdir   => $self->{tmpdir} || '.',        # optional caching | 
| 102 |  |  |  |  |  |  | ); | 
| 103 |  |  |  |  |  |  | my $feed = { | 
| 104 |  |  |  |  |  |  | url   => $self->{feed}, | 
| 105 |  |  |  |  |  |  | name  => $self->{name}, | 
| 106 |  |  |  |  |  |  | delay => $self->{delay}, | 
| 107 |  |  |  |  |  |  | }; | 
| 108 |  |  |  |  |  |  | $kernel->post( $self->{rssagg}, 'add_feed', $feed ); | 
| 109 |  |  |  |  |  |  | return; | 
| 110 |  |  |  |  |  |  | } | 
| 111 |  |  |  |  |  |  |  | 
| 112 |  |  |  |  |  |  | sub _handle_feed { | 
| 113 |  |  |  |  |  |  | my ($kernel,$self,$feed) = (@_[KERNEL,OBJECT], $_[ARG1]->[0]); | 
| 114 |  |  |  |  |  |  | for my $headline ( reverse $feed->late_breaking_news ) { | 
| 115 |  |  |  |  |  |  | $kernel->post( | 
| 116 |  |  |  |  |  |  | $self->{http_id}, | 
| 117 |  |  |  |  |  |  | 'request', | 
| 118 |  |  |  |  |  |  | '_feed_url', | 
| 119 |  |  |  |  |  |  | HTTP::Request->new( GET => $headline->url ), | 
| 120 |  |  |  |  |  |  | $headline->headline, | 
| 121 |  |  |  |  |  |  | ); | 
| 122 |  |  |  |  |  |  | $self->{_http_requests}++; | 
| 123 |  |  |  |  |  |  | } | 
| 124 |  |  |  |  |  |  | return; | 
| 125 |  |  |  |  |  |  | } | 
| 126 |  |  |  |  |  |  |  | 
| 127 |  |  |  |  |  |  | sub _feed_url { | 
| 128 |  |  |  |  |  |  | my ($kernel,$self,$request_packet,$response_packet) = @_[KERNEL,OBJECT,ARG0,ARG1]; | 
| 129 |  |  |  |  |  |  | my $http_resp = $response_packet->[0]; | 
| 130 |  |  |  |  |  |  | $self->{_http_requests}--; | 
| 131 |  |  |  |  |  |  | return unless $http_resp and $http_resp->code() == 200; | 
| 132 |  |  |  |  |  |  | my $tag    = $request_packet->[1]; | 
| 133 |  |  |  |  |  |  | my $p = HTML::LinkExtor->new(); | 
| 134 |  |  |  |  |  |  | $p->parse( $http_resp->content() ); | 
| 135 |  |  |  |  |  |  | foreach my $link ( $p->links() ) { | 
| 136 |  |  |  |  |  |  | if ( $link->[0] eq 'a' and $link->[2] =~ /\Q$tag\E/ ) { | 
| 137 |  |  |  |  |  |  | ( my $module = $link->[2] ) =~ s#/CPAN/authors/id/##; | 
| 138 |  |  |  |  |  |  | $kernel->call( $self->{session_id}, '_dispatch', $module ); | 
| 139 |  |  |  |  |  |  | last; | 
| 140 |  |  |  |  |  |  | } | 
| 141 |  |  |  |  |  |  | } | 
| 142 |  |  |  |  |  |  | $kernel->yield( '_real_shutdown' ) if $self->{_shutdown} and $self->{_http_requests} == 0; | 
| 143 |  |  |  |  |  |  | return; | 
| 144 |  |  |  |  |  |  | } | 
| 145 |  |  |  |  |  |  |  | 
| 146 |  |  |  |  |  |  | sub _dispatch { | 
| 147 |  |  |  |  |  |  | my ($kernel,$self,$module) = @_[KERNEL,OBJECT,ARG0]; | 
| 148 |  |  |  |  |  |  | $kernel->post( $self->{sender_id}, $self->{event}, $module ); | 
| 149 |  |  |  |  |  |  | return; | 
| 150 |  |  |  |  |  |  | } | 
| 151 |  |  |  |  |  |  |  | 
| 152 |  |  |  |  |  |  | "This town ain't big enough for the both of us"; | 
| 153 |  |  |  |  |  |  |  | 
| 154 |  |  |  |  |  |  | __END__ |