line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package LinkEmbedder::Link; |
2
|
30
|
|
|
30
|
|
218
|
use Mojo::Base -base; |
|
30
|
|
|
|
|
80
|
|
|
30
|
|
|
|
|
202
|
|
3
|
|
|
|
|
|
|
|
4
|
30
|
|
|
30
|
|
22509
|
use Mojo::Template; |
|
30
|
|
|
|
|
1241590
|
|
|
30
|
|
|
|
|
348
|
|
5
|
30
|
|
|
30
|
|
1523
|
use Mojo::Util 'trim'; |
|
30
|
|
|
|
|
72
|
|
|
30
|
|
|
|
|
2089
|
|
6
|
|
|
|
|
|
|
|
7
|
30
|
|
50
|
30
|
|
201
|
use constant DEBUG => $ENV{LINK_EMBEDDER_DEBUG} || 0; |
|
30
|
|
|
|
|
66
|
|
|
30
|
|
|
|
|
72335
|
|
8
|
|
|
|
|
|
|
|
9
|
|
|
|
|
|
|
my %DOM_SEL = ( |
10
|
|
|
|
|
|
|
':desc' => ['meta[property="og:description"]', 'meta[name="twitter:description"]', 'meta[name="description"]'], |
11
|
|
|
|
|
|
|
':image' => ['meta[property="og:image"]', 'meta[property="og:image:url"]', 'meta[name="twitter:image"]'], |
12
|
|
|
|
|
|
|
':site_name' => ['meta[property="og:site_name"]', 'meta[property="twitter:site"]'], |
13
|
|
|
|
|
|
|
':title' => ['meta[property="og:title"]', 'meta[name="twitter:title"]', 'title'], |
14
|
|
|
|
|
|
|
); |
15
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
my @JSON_ATTRS = ( |
17
|
|
|
|
|
|
|
'author_name', 'author_url', 'cache_age', 'height', 'provider_name', 'provider_url', |
18
|
|
|
|
|
|
|
'thumbnail_height', 'thumbnail_url', 'thumbnail_width', 'title', 'type', 'url', |
19
|
|
|
|
|
|
|
'version', 'width' |
20
|
|
|
|
|
|
|
); |
21
|
|
|
|
|
|
|
|
22
|
|
|
|
|
|
|
has author_name => undef; |
23
|
|
|
|
|
|
|
has author_url => undef; |
24
|
|
|
|
|
|
|
has cache_age => 0; |
25
|
|
|
|
|
|
|
has description => ''; |
26
|
|
|
|
|
|
|
has error => undef; # {message => "", code => ""} |
27
|
|
|
|
|
|
|
has force_secure => 0; |
28
|
|
|
|
|
|
|
has height => sub { $_[0]->type =~ /^(?:photo|video)$/ ? 0 : undef };    # 0 only when type is exactly "photo" or "video", else undef |
29
|
|
|
|
|
|
|
has placeholder_url => ''; |
30
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
has provider_name => sub { |
32
|
|
|
|
|
|
|
return undef unless my $name = shift->url->host; |
33
|
|
|
|
|
|
|
return $name =~ /([^\.]+)\.(\w+)$/ ? ucfirst $1 : $name; |
34
|
|
|
|
|
|
|
}; |
35
|
|
|
|
|
|
|
|
36
|
|
|
|
|
|
|
has provider_url => sub { $_[0]->url->host ? $_[0]->url->clone->path('/') : undef }; |
37
|
|
|
|
|
|
|
has template => sub { [__PACKAGE__, sprintf '%s.html.ep', $_[0]->type] }; |
38
|
|
|
|
|
|
|
has thumbnail_height => undef; |
39
|
|
|
|
|
|
|
has thumbnail_url => undef; |
40
|
|
|
|
|
|
|
has thumbnail_width => undef; |
41
|
|
|
|
|
|
|
has title => undef; |
42
|
|
|
|
|
|
|
has type => 'link'; |
43
|
|
|
|
|
|
|
has ua => undef; # Mojo::UserAgent object |
44
|
|
|
|
|
|
|
has url => sub { Mojo::URL->new }; # Mojo::URL |
45
|
|
|
|
|
|
|
has version => '1.0'; |
46
|
|
|
|
|
|
|
has width => sub { $_[0]->type =~ /^(?:photo|video)$/ ? 0 : undef };    # 0 only when type is exactly "photo" or "video", else undef |
47
|
|
|
|
|
|
|
|
48
|
|
|
|
|
|
|
sub html { |
49
|
7
|
|
|
7
|
1
|
3069
|
my $self = shift; |
50
|
7
|
50
|
|
|
|
16
|
my $template = Mojo::Loader::data_section(@{$self->template}) or return ''; |
|
7
|
|
|
|
|
27
|
|
51
|
7
|
|
|
|
|
1583
|
my $output = Mojo::Template->new({auto_escape => 1, prepend => 'my $l=shift'})->render($template, $self); |
52
|
7
|
50
|
|
|
|
31041
|
die $output if ref $output; |
53
|
7
|
|
|
|
|
59
|
return $output; |
54
|
|
|
|
|
|
|
} |
55
|
|
|
|
|
|
|
|
56
|
|
|
|
|
|
|
sub learn_p { |
57
|
5
|
|
|
5
|
1
|
13
|
my $self = shift; |
58
|
5
|
|
|
5
|
|
23
|
return $self->_get_p($self->url)->then(sub { $self->_learn(shift) }); |
|
5
|
|
|
|
|
737
|
|
59
|
|
|
|
|
|
|
} |
60
|
|
|
|
|
|
|
|
61
|
|
|
|
|
|
|
sub TO_JSON { |
62
|
5
|
|
|
5
|
0
|
15
|
my $self = shift; |
63
|
5
|
|
|
|
|
12
|
my %json; |
64
|
|
|
|
|
|
|
|
65
|
5
|
|
|
|
|
17
|
for my $attr (grep { defined $self->$_ } @JSON_ATTRS) { |
|
70
|
|
|
|
|
1135
|
|
66
|
32
|
|
|
|
|
2468
|
$json{$attr} = $self->$attr; |
67
|
32
|
100
|
|
|
|
268
|
$json{$attr} = "$json{$attr}" if $attr =~ /url$/; |
68
|
|
|
|
|
|
|
} |
69
|
|
|
|
|
|
|
|
70
|
5
|
100
|
|
|
|
16
|
$json{html} = $self->html unless $self->type eq 'link'; |
71
|
|
|
|
|
|
|
|
72
|
5
|
|
|
|
|
38
|
return \%json; |
73
|
|
|
|
|
|
|
} |
74
|
|
|
|
|
|
|
|
75
|
0
|
|
|
0
|
|
0
|
sub _dump { Mojo::Util::dumper($_[0]->TO_JSON); } |
76
|
|
|
|
|
|
|
|
77
|
|
|
|
|
|
|
sub _el { |
78
|
28
|
|
|
28
|
|
71
|
my ($self, $dom, @sel) = @_; |
79
|
28
|
100
|
|
|
|
144
|
@sel = @{$DOM_SEL{$sel[0]}} if $DOM_SEL{$sel[0]}; |
|
12
|
|
|
|
|
59
|
|
80
|
|
|
|
|
|
|
|
81
|
28
|
|
|
|
|
55
|
for my $sel (@sel) { |
82
|
52
|
100
|
|
|
|
7523
|
my $e = $dom->at($sel) or next; |
83
|
4
|
|
100
|
|
|
1203
|
my ($val) = grep {$_} map { trim($_ // '') } $e->{content}, $e->{value}, $e->{href}, $e->text, $e->all_text; |
|
20
|
|
|
|
|
67
|
|
|
20
|
|
|
|
|
770
|
|
84
|
4
|
50
|
|
|
|
75
|
return $val if defined $val; |
85
|
|
|
|
|
|
|
} |
86
|
|
|
|
|
|
|
|
87
|
24
|
|
|
|
|
8701
|
return ''; |
88
|
|
|
|
|
|
|
} |
89
|
|
|
|
|
|
|
|
90
|
|
|
|
|
|
|
sub _get_p { |
91
|
5
|
|
|
5
|
|
45
|
my ($self, $url) = @_; |
92
|
5
|
50
|
|
|
|
23
|
$url = $url->clone->scheme('https') if $self->force_secure; |
93
|
5
|
|
|
|
|
34
|
warn sprintf "[%s] GET %s\n", ref($self), $url if DEBUG; |
94
|
|
|
|
|
|
|
return $self->ua->get_p($url)->then(sub { |
95
|
5
|
|
|
5
|
|
44214
|
my $tx = shift; |
96
|
5
|
50
|
33
|
|
|
37
|
$self->url->scheme('https') if $self->force_secure and $tx->res->is_success; |
97
|
5
|
|
|
|
|
52
|
return $tx; |
98
|
5
|
|
|
|
|
22
|
}); |
99
|
|
|
|
|
|
|
} |
100
|
|
|
|
|
|
|
|
101
|
|
|
|
|
|
|
sub _learn { |
102
|
5
|
|
|
5
|
|
18
|
my ($self, $tx) = @_; |
103
|
5
|
|
|
|
|
19
|
my $h = $tx->res->headers; |
104
|
|
|
|
|
|
|
|
105
|
5
|
|
|
|
|
114
|
my $name = $h->header('X-Provider-Name'); |
106
|
5
|
100
|
|
|
|
68
|
$self->provider_name($name) if $name; |
107
|
|
|
|
|
|
|
|
108
|
5
|
|
50
|
|
|
23
|
my $ct = $h->content_type || ''; |
109
|
5
|
50
|
|
|
|
71
|
$self->type('photo')->_learn_from_url if $ct =~ m!^image/!; |
110
|
5
|
50
|
|
|
|
17
|
$self->type('video')->_learn_from_url if $ct =~ m!^video/!; |
111
|
5
|
100
|
|
|
|
29
|
$self->type('rich')->_learn_from_text($tx) if $ct =~ m!^text/plain!; |
112
|
5
|
100
|
|
|
|
48
|
$self->type('rich')->_learn_from_dom($tx->res->dom) if $ct =~ m!^text/html!; |
113
|
5
|
|
|
|
|
31
|
my $p = $self->_maybe_rebless_p($tx); |
114
|
|
|
|
|
|
|
|
115
|
5
|
|
33
|
|
|
57
|
return $p || $self; |
116
|
|
|
|
|
|
|
} |
117
|
|
|
|
|
|
|
|
118
|
|
|
|
|
|
|
sub _learn_from_dom { |
119
|
4
|
|
|
4
|
|
13
|
my ($self, $dom) = @_; |
120
|
4
|
|
|
|
|
10
|
my $v; |
121
|
|
|
|
|
|
|
|
122
|
4
|
50
|
|
|
|
23
|
$self->author_name($v) if $v = $self->_el($dom, '[itemprop="author"] [itemprop="name"]'); |
123
|
4
|
50
|
|
|
|
19
|
$self->author_url($v) if $v = $self->_el($dom, '[itemprop="author"] [itemprop="email"]'); |
124
|
4
|
50
|
|
|
|
52
|
$self->description($v) if $v = $self->_el($dom, ':desc'); |
125
|
4
|
50
|
|
|
|
16
|
$self->thumbnail_height($v) if $v = $self->_el($dom, 'meta[property="og:image:height"]'); |
126
|
4
|
50
|
|
|
|
15
|
$self->thumbnail_url($v) if $v = $self->_el($dom, ':image'); |
127
|
4
|
50
|
|
|
|
15
|
$self->thumbnail_width($v) if $v = $self->_el($dom, 'meta[property="og:image:width"]'); |
128
|
4
|
50
|
|
|
|
16
|
$self->title($v) if $v = $self->_el($dom, ':title'); |
129
|
|
|
|
|
|
|
|
130
|
4
|
|
|
|
|
42
|
return $self; |
131
|
|
|
|
|
|
|
} |
132
|
|
|
|
|
|
|
|
133
|
|
|
|
|
|
|
sub _learn_from_json { |
134
|
0
|
|
|
0
|
|
0
|
my ($self, $tx) = @_; |
135
|
0
|
|
|
|
|
0
|
my $json = $tx->res->json; |
136
|
|
|
|
|
|
|
|
137
|
0
|
|
|
|
|
0
|
warn "[LinkEmbedder] " . $tx->res->text . "\n" if DEBUG; |
138
|
0
|
|
0
|
|
|
0
|
$self->{$_} ||= $json->{$_} for keys %$json; |
139
|
0
|
0
|
0
|
|
|
0
|
$self->{error} = {message => $self->{error}} if defined $self->{error} and !ref $self->{error}; |
140
|
0
|
0
|
0
|
|
|
0
|
$self->{error}{code} = $self->{status} if $self->{status} and $self->{status} =~ /^\d+$/; |
141
|
|
|
|
|
|
|
|
142
|
0
|
|
|
|
|
0
|
return $self; |
143
|
|
|
|
|
|
|
} |
144
|
|
|
|
|
|
|
|
145
|
|
|
|
|
|
|
sub _learn_from_text { |
146
|
1
|
|
|
1
|
|
17
|
my ($self, $tx) = @_; |
147
|
1
|
|
|
|
|
8
|
$self->_learn_from_url; |
148
|
|
|
|
|
|
|
|
149
|
1
|
|
|
|
|
90
|
$self->{paste} = $tx->res->text; |
150
|
1
|
|
|
|
|
80
|
$self->template->[1] = 'paste.html.ep'; |
151
|
|
|
|
|
|
|
|
152
|
1
|
|
|
|
|
14
|
my $title = substr $self->{paste}, 0, 20; |
153
|
1
|
|
|
|
|
5
|
$title =~ s![\r\n]+! !g; |
154
|
1
|
|
|
|
|
4
|
$self->title($title); |
155
|
|
|
|
|
|
|
} |
156
|
|
|
|
|
|
|
|
157
|
|
|
|
|
|
|
sub _learn_from_url { |
158
|
1
|
|
|
1
|
|
3
|
my $self = shift; |
159
|
1
|
|
|
|
|
5
|
my $path = $self->url->path; |
160
|
|
|
|
|
|
|
|
161
|
1
|
50
|
|
|
|
19
|
return $self->title(@$path ? $path->[-1] : 'Image'); |
162
|
|
|
|
|
|
|
} |
163
|
|
|
|
|
|
|
|
164
|
|
|
|
|
|
|
# TODO: Not sure if this is the best solution |
165
|
|
|
|
|
|
|
sub _maybe_rebless_p { |
166
|
5
|
|
|
5
|
|
18
|
my ($self, $tx) = @_; |
167
|
5
|
50
|
|
|
|
22
|
return unless ref $self eq 'LinkEmbedder::Link::Basic'; |
168
|
5
|
50
|
|
|
|
23
|
return unless $self->type eq 'rich'; |
169
|
|
|
|
|
|
|
|
170
|
5
|
50
|
33
|
|
|
48
|
if (($self->title // '') eq 'Jitsi Meet' or $tx->res->body =~ m!\bJitsiMeetJS\b!) {    # title defaults to undef; avoid "uninitialized" warning |
171
|
0
|
|
|
|
|
0
|
require LinkEmbedder::Link::Jitsi; |
172
|
0
|
|
|
|
|
0
|
bless $self, 'LinkEmbedder::Link::Jitsi'; |
173
|
0
|
|
|
|
|
0
|
return $self->learn_p; |
174
|
|
|
|
|
|
|
} |
175
|
|
|
|
|
|
|
|
176
|
5
|
|
|
|
|
364
|
return; |
177
|
|
|
|
|
|
|
} |
178
|
|
|
|
|
|
|
|
179
|
|
|
|
|
|
|
1; |
180
|
|
|
|
|
|
|
|
181
|
|
|
|
|
|
|
=encoding utf8 |
182
|
|
|
|
|
|
|
|
183
|
|
|
|
|
|
|
=head1 NAME |
184
|
|
|
|
|
|
|
|
185
|
|
|
|
|
|
|
LinkEmbedder::Link - Meta information for an URL |
186
|
|
|
|
|
|
|
|
187
|
|
|
|
|
|
|
=head1 SYNOPSIS |
188
|
|
|
|
|
|
|
|
189
|
|
|
|
|
|
|
See L<LinkEmbedder>. |
190
|
|
|
|
|
|
|
|
191
|
|
|
|
|
|
|
=head1 DESCRIPTION |
192
|
|
|
|
|
|
|
|
193
|
|
|
|
|
|
|
L<LinkEmbedder::Link> is a class representing an expanded URL. |
194
|
|
|
|
|
|
|
|
195
|
|
|
|
|
|
|
=head1 ATTRIBUTES |
196
|
|
|
|
|
|
|
|
197
|
|
|
|
|
|
|
=head2 author_name |
198
|
|
|
|
|
|
|
|
199
|
|
|
|
|
|
|
$str = $self->author_name; |
200
|
|
|
|
|
|
|
|
201
|
|
|
|
|
|
|
Might hold the name of the author of L</url>. |
202
|
|
|
|
|
|
|
|
203
|
|
|
|
|
|
|
=head2 author_url |
204
|
|
|
|
|
|
|
|
205
|
|
|
|
|
|
|
$str = $self->author_url; |
206
|
|
|
|
|
|
|
|
207
|
|
|
|
|
|
|
Might hold an URL to the author. |
208
|
|
|
|
|
|
|
|
209
|
|
|
|
|
|
|
=head2 cache_age |
210
|
|
|
|
|
|
|
|
211
|
|
|
|
|
|
|
$int = $self->cache_age; |
212
|
|
|
|
|
|
|
|
213
|
|
|
|
|
|
|
The suggested cache lifetime for this resource, in seconds. |
214
|
|
|
|
|
|
|
|
215
|
|
|
|
|
|
|
=head2 description |
216
|
|
|
|
|
|
|
|
217
|
|
|
|
|
|
|
$str = $self->description; |
218
|
|
|
|
|
|
|
|
219
|
|
|
|
|
|
|
Description of the L</url>. Might be C<''> (empty string). |
220
|
|
|
|
|
|
|
|
221
|
|
|
|
|
|
|
=head2 error |
222
|
|
|
|
|
|
|
|
223
|
|
|
|
|
|
|
$hash_ref = $self->error; |
224
|
|
|
|
|
|
|
|
225
|
|
|
|
|
|
|
C<undef> on success, hash-ref on error. Example: |
226
|
|
|
|
|
|
|
|
227
|
|
|
|
|
|
|
{message => "Oops!", code => 500}; |
228
|
|
|
|
|
|
|
|
229
|
|
|
|
|
|
|
=head2 force_secure |
230
|
|
|
|
|
|
|
|
231
|
|
|
|
|
|
|
$bool = $self->force_secure; |
232
|
|
|
|
|
|
|
$self = $self->force_secure(1); |
233
|
|
|
|
|
|
|
|
234
|
|
|
|
|
|
|
This attribute will translate any unknown http link to https. |
235
|
|
|
|
|
|
|
|
236
|
|
|
|
|
|
|
This attribute is EXPERIMENTAL. Feedback appreciated. |
237
|
|
|
|
|
|
|
|
238
|
|
|
|
|
|
|
=head2 height |
239
|
|
|
|
|
|
|
|
240
|
|
|
|
|
|
|
$int = $self->height; |
241
|
|
|
|
|
|
|
|
242
|
|
|
|
|
|
|
The height of L |