blib/lib/LyricFinder/Genius.pm | |||
---|---|---|---|
Criterion | Covered | Total | % |
statement | 20 | 77 | 25.9 |
branch | 0 | 22 | 0.0 |
condition | 0 | 24 | 0.0 |
subroutine | 7 | 10 | 70.0 |
pod | 2 | 2 | 100.0 |
total | 29 | 135 | 21.4 |
line | stmt | bran | cond | sub | pod | time | code |
---|---|---|---|---|---|---|---|
1 | package LyricFinder::Genius; | ||||||
2 | |||||||
3 | 1 | 1 | 8 | use strict; | |||
1 | 2 | ||||||
1 | 35 | ||||||
4 | 1 | 1 | 5 | use warnings; | |||
1 | 3 | ||||||
1 | 27 | ||||||
5 | 1 | 1 | 4 | use Carp; | |||
1 | 3 | ||||||
1 | 71 | ||||||
6 | 1 | 1 | 7 | use HTML::Strip; | |||
1 | 3 | ||||||
1 | 25 | ||||||
7 | 1 | 1 | 13 | use parent 'LyricFinder::_Class'; | |||
1 | 4 | ||||||
1 | 6 | ||||||
8 | |||||||
9 | our $haveLyricsCache; | ||||||
10 | BEGIN { | ||||||
11 | 1 | 1 | 98 | $haveLyricsCache = 0; | |||
12 | 1 | 1 | 73 | eval "use LyricFinder::Cache; \$haveLyricsCache = 1; 1"; | |||
1 | 7 | ||||||
1 | 2 | ||||||
1 | 22 | ||||||
13 | } | ||||||
14 | |||||||
15 | my $Source = 'Genius'; | ||||||
16 | my $Site = 'https://genius.com'; | ||||||
17 | my $DEBUG = 0; | ||||||
18 | |||||||
19 | sub new | ||||||
20 | { | ||||||
21 | 0 | 0 | 1 | my $class = shift; | |||
22 | |||||||
23 | 0 | my $self = $class->SUPER::new($Source, @_); | |||||
24 | 0 | @{$self->{'_fetchers'}} = ($Source); | |||||
0 | |||||||
25 | 0 | unshift(@{$self->{'_fetchers'}}, 'Cache') if ($haveLyricsCache | |||||
26 | 0 | 0 | 0 | && $self->{'-cache'} && $self->{'-cache'} !~ /^\>/); | |||
0 | |||||||
27 | |||||||
28 | 0 | bless $self, $class; #BLESS IT! | |||||
29 | |||||||
30 | 0 | return $self; | |||||
31 | } | ||||||
32 | |||||||
33 | sub fetch { | ||||||
34 | 0 | 0 | 1 | my ($self, $artist_in, $song_in) = @_; | |||
35 | |||||||
36 | 0 | $self->_debug("Genius::fetch($artist_in, $song_in)!"); | |||||
37 | |||||||
38 | 0 | 0 | return '' unless ($self->_check_inputs($artist_in, $song_in)); | ||||
39 | 0 | 0 | return '' if ($self->{'Error'} ne 'Ok'); | ||||
40 | |||||||
41 | # first, see if we've got it cached: | ||||||
42 | 0 | $self->_debug("i:haveCache=$haveLyricsCache= -cachedir=".$self->{'-cache'}."="); | |||||
43 | 0 | 0 | 0 | if ($haveLyricsCache && $self->{'-cache'} && $self->{'-cache'} !~ /^\>/) { | |||
0 | |||||||
44 | 0 | my $cache = new LyricFinder::Cache(%{$self}); | |||||
0 | |||||||
45 | 0 | 0 | if ($cache) { | ||||
46 | 0 | my $lyrics = $cache->fetch($artist_in, $song_in); | |||||
47 | 0 | 0 | 0 | if (defined($lyrics) && $lyrics =~ /\w/) { | |||
48 | 0 | $self->_debug("..Got lyrics from cache."); | |||||
49 | 0 | $self->{'Source'} = 'Cache'; | |||||
50 | 0 | $self->{'Site'} = $cache->site(); | |||||
51 | 0 | $self->{'Url'} = $cache->url(); | |||||
52 | |||||||
53 | 0 | return $lyrics; | |||||
54 | } | ||||||
55 | } | ||||||
56 | } | ||||||
57 | |||||||
58 | 0 | $self->{'Site'} = $Site; | |||||
59 | |||||||
60 | 0 | $artist_in = $self->_remove_accents($artist_in); | |||||
61 | 0 | $song_in = $self->_remove_accents($song_in); | |||||
62 | |||||||
63 | # Their URLs look like e.g.: | ||||||
64 | # https://genius.com/ |
||||||
65 | 0 | ($self->{'Url'} = $artist_in) =~ s#\s*\/\s*# and #; #ONLY USE 1ST ARTIST, IF MORE THAN ONE! | |||||
66 | 0 | my $artist = $artist_in; | |||||
67 | 0 | (my $song = $song_in) =~ s#\s*\/\s*#\-#g; #FIX SONGS WITH "/" IN THEM! | |||||
68 | 0 | $self->{'Url'} .= " ${song}-lyrics"; | |||||
69 | 0 | $self->{'Url'} =~ s/\&/and/g; | |||||
70 | 0 | $self->{'Url'} =~ s/ +/\-/g; | |||||
71 | 0 | $self->{'Url'} =~ s/[^a-zA-Z0-9\-]+//g; | |||||
72 | 0 | $self->{'Url'} = $Site . '/' . $self->{'Url'}; | |||||
73 | |||||||
74 | 0 | my $lyrics = $self->_web_fetch($artist_in, $song_in); | |||||
75 | 0 | 0 | 0 | if ($lyrics && $haveLyricsCache && $self->{'-cache'} && $self->{'-cache'} !~ /^\) { | |||
0 | |||||||
0 | |||||||
76 | 0 | $self->_debug("=== WILL CACHE LYRICS! ==="); | |||||
77 | # cache the fetched lyrics, if we can: | ||||||
78 | 0 | my $cache = new LyricFinder::Cache(%{$self}); | |||||
0 | |||||||
79 | 0 | 0 | $cache->save($artist_in, $song_in, $lyrics) if ($cache); | ||||
80 | } | ||||||
81 | 0 | return $lyrics; | |||||
82 | } | ||||||
83 | |||||||
84 | sub _parse { | ||||||
85 | 0 | 0 | my $self = shift; | ||||
86 | 0 | my $html = shift; | |||||
87 | |||||||
88 | 0 | $self->_debug("Genius::_parse()!"); | |||||
89 | 0 | 0 | if (my ($goodbit) = $html =~ | ||||
90 | # m{\ (.+)\<\!\-\-\/sse\-\-\>}msi) |
||||||
91 | m{\ ]*\>(.+?)\ | ||||||
92 | { | ||||||
93 | 0 | my $hs = HTML::Strip->new(); | |||||
94 | 0 | $goodbit =~ s#\<\/?p\>#\r\n#gsi; | |||||
95 | 0 | $goodbit =~ s#\ #\r\n#gsi; |
|||||
96 | 0 | my $text = $hs->parse($goodbit); | |||||
97 | |||||||
98 | #WHILE WE'RE AT IT, SEE IF WE HAVE A COVER IMAGE?!: | ||||||
99 | 0 | 0 | if ($html =~ m#\ | ||||
100 | 0 | my $imgurl = $1; | |||||
101 | 0 | 0 | $imgurl = 'https:' . $imgurl if ($imgurl =~ m#^//#); | ||||
102 | 0 | $self->{'image_url'} = $imgurl; | |||||
103 | } | ||||||
104 | |||||||
105 | 0 | return $self->_normalize_lyric_text($self->_html2text($text)); | |||||
106 | } else { | ||||||
107 | 0 | carp($self->{'Error'} = "e:$Source - Failed to identify lyrics on result page."); | |||||
108 | 0 | return ''; | |||||
109 | } | ||||||
110 | } | ||||||
111 | |||||||
112 | 1 | ||||||
113 | |||||||
114 | __END__ |