| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
package Net::RFC::Search; |
|
2
|
|
|
|
|
|
|
=head1 NAME |
|
3
|
|
|
|
|
|
|
|
|
4
|
|
|
|
|
|
|
Net::RFC::Search - search for RFC's and dump RFC's content either to a variable or to a file. |
|
5
|
|
|
|
|
|
|
|
|
6
|
|
|
|
|
|
|
=head1 SYNOPSIS |
|
7
|
|
|
|
|
|
|
|
|
8
|
|
|
|
|
|
|
Net::RFC::Search provides 2 methods: |
|
9
|
|
|
|
|
|
|
|
|
10
|
|
|
|
|
|
|
B is for searching for a RFC index number by given 'keyword' (through RFC index text file). |
|
11
|
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
B is for dumping RFC's content either to a variable or to a file. |
|
13
|
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
use Net::RFC::Search; |
|
15
|
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
my $rfc = Net::RFC::Search->new; |
|
17
|
|
|
|
|
|
|
|
|
18
|
|
|
|
|
|
|
# This will return array of RFC indices with "websocket" keyword in their headers. |
|
19
|
|
|
|
|
|
|
my @found = $rfc->search_by_header('WebSocket'); |
|
20
|
|
|
|
|
|
|
|
|
21
|
|
|
|
|
|
|
# This will dump content of RFC 6455 into $rfc_text variable. |
|
22
|
|
|
|
|
|
|
my $rfc_text = $rfc->get_by_index(6455); |
|
23
|
|
|
|
|
|
|
|
|
24
|
|
|
|
|
|
|
# Dumps RFC 6455 into /tmp/6455.txt file |
|
25
|
|
|
|
|
|
|
$rfc->get_by_index(6455, '/tmp/6455.txt'); |
|
26
|
|
|
|
|
|
|
|
|
27
|
|
|
|
|
|
|
=head1 VERSION |
|
28
|
|
|
|
|
|
|
|
|
29
|
|
|
|
|
|
|
Version 0.02 |
|
30
|
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
=head1 DESCRIPTION |
|
32
|
|
|
|
|
|
|
|
|
33
|
|
|
|
|
|
|
Net::RFC::Search is a module aimed to be a simple tool to search and dump RFC's. |
|
34
|
|
|
|
|
|
|
|
|
35
|
|
|
|
|
|
|
=head1 CONSTRUCTOR |
|
36
|
|
|
|
|
|
|
|
|
37
|
|
|
|
|
|
|
=over 4 |
|
38
|
|
|
|
|
|
|
|
|
39
|
|
|
|
|
|
|
=item new(%options) |
|
40
|
|
|
|
|
|
|
|
|
41
|
|
|
|
|
|
|
Create instance of C. |
|
42
|
|
|
|
|
|
|
|
|
43
|
|
|
|
|
|
|
B<%options> are optional parameters: |
|
44
|
|
|
|
|
|
|
|
|
45
|
|
|
|
|
|
|
C - a file name to store RFC index file into. Defaults to ~/.rfcindex |
|
46
|
|
|
|
|
|
|
|
|
47
|
|
|
|
|
|
|
C - URL of the RFC site/mirror where index file and RFC's are going to be downloaded from. |
|
48
|
|
|
|
|
|
|
|
|
49
|
|
|
|
|
|
|
=back |
|
50
|
|
|
|
|
|
|
|
|
51
|
|
|
|
|
|
|
=head1 METHODS |
|
52
|
|
|
|
|
|
|
|
|
53
|
|
|
|
|
|
|
=over 4 |
|
54
|
|
|
|
|
|
|
|
|
55
|
|
|
|
|
|
|
=item search_by_header("keyword") |
|
56
|
|
|
|
|
|
|
|
|
57
|
|
|
|
|
|
|
Returns array of RFC index numbers "keyword" has been found in. |
|
58
|
|
|
|
|
|
|
|
|
59
|
|
|
|
|
|
|
Search occurs in RFC header names (i.e. through RFC index file). |
|
60
|
|
|
|
|
|
|
|
|
61
|
|
|
|
|
|
|
=item get_by_index($index [, $filename ]); |
|
62
|
|
|
|
|
|
|
|
|
63
|
|
|
|
|
|
|
Downloads RFC of index number C<$index> and returns downloaded content. |
|
64
|
|
|
|
|
|
|
|
|
65
|
|
|
|
|
|
|
By providing optional C<$filename> content will be dumped into C<$filename>. |
|
66
|
|
|
|
|
|
|
|
|
67
|
|
|
|
|
|
|
=back |
|
68
|
|
|
|
|
|
|
|
|
69
|
|
|
|
|
|
|
=head1 TODO |
|
70
|
|
|
|
|
|
|
|
|
71
|
|
|
|
|
|
|
=over 4 |
|
72
|
|
|
|
|
|
|
|
|
73
|
|
|
|
|
|
|
=item add caching facilities |
|
74
|
|
|
|
|
|
|
|
|
75
|
|
|
|
|
|
|
=item do not rely on LWP::UserAgent only, add lynx/curl as optional methods to retrieve RFC's |
|
76
|
|
|
|
|
|
|
|
|
77
|
|
|
|
|
|
|
=back |
|
78
|
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
=head1 ACKNOWLEDGEMENTS |
|
80
|
|
|
|
|
|
|
|
|
81
|
|
|
|
|
|
|
This module is heavily based on rfc.pl script written by **Derrick Daugherty** (http://www.dewn.com/rfc/) |
|
82
|
|
|
|
|
|
|
|
|
83
|
|
|
|
|
|
|
=head1 AUTHOR |
|
84
|
|
|
|
|
|
|
|
|
85
|
|
|
|
|
|
|
Nikolay Aviltsev, C<< navi@cpan.org >> |
|
86
|
|
|
|
|
|
|
|
|
87
|
|
|
|
|
|
|
=head1 LICENSE AND COPYRIGHT |
|
88
|
|
|
|
|
|
|
|
|
89
|
|
|
|
|
|
|
Copyright 2013 Nikolay Aviltsev. |
|
90
|
|
|
|
|
|
|
|
|
91
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify it |
|
92
|
|
|
|
|
|
|
under the terms of either: the GNU General Public License as published |
|
93
|
|
|
|
|
|
|
by the Free Software Foundation; or the Artistic License. |
|
94
|
|
|
|
|
|
|
|
|
95
|
|
|
|
|
|
|
See L for more information. |
|
96
|
|
|
|
|
|
|
|
|
97
|
|
|
|
|
|
|
=cut |
|
98
|
|
|
|
|
|
|
|
|
99
|
2
|
|
|
2
|
|
108841
|
use 5.006; |
|
|
2
|
|
|
|
|
9
|
|
|
|
2
|
|
|
|
|
122
|
|
|
100
|
2
|
|
|
2
|
|
11
|
use strict; |
|
|
2
|
|
|
|
|
5
|
|
|
|
2
|
|
|
|
|
104
|
|
|
101
|
|
|
|
|
|
|
|
|
102
|
2
|
|
|
2
|
|
3007
|
use LWP::UserAgent; |
|
|
2
|
|
|
|
|
117085
|
|
|
|
2
|
|
|
|
|
73
|
|
|
103
|
2
|
|
|
2
|
|
1999
|
use IO::File; |
|
|
2
|
|
|
|
|
12964
|
|
|
|
2
|
|
|
|
|
330
|
|
|
104
|
2
|
|
|
2
|
|
15
|
use Carp; |
|
|
2
|
|
|
|
|
4
|
|
|
|
2
|
|
|
|
|
111
|
|
|
105
|
2
|
|
|
2
|
|
4741
|
use File::HomeDir; |
|
|
2
|
|
|
|
|
14401
|
|
|
|
2
|
|
|
|
|
1594
|
|
|
106
|
|
|
|
|
|
|
|
|
107
|
|
|
|
|
|
|
our $VERSION = '0.02'; |
|
108
|
|
|
|
|
|
|
my $ua; |
|
109
|
|
|
|
|
|
|
|
|
110
|
|
|
|
|
|
|
sub new { |
|
111
|
4
|
|
|
4
|
1
|
3318
|
my ($class, %params) = @_; |
|
112
|
|
|
|
|
|
|
|
|
113
|
4
|
|
|
|
|
13
|
my $self = {}; |
|
114
|
4
|
|
66
|
|
|
50
|
$self->{indexpath} = $params{indexpath} || File::HomeDir->my_home . "/.rfcindex"; |
|
115
|
|
|
|
|
|
|
|
|
116
|
4
|
|
100
|
|
|
204
|
$self->{rfcbaseurl} = $params{rfcbaseurl} || 'http://www.ietf.org/rfc/'; |
|
117
|
4
|
|
|
|
|
19
|
$self->{rfcbaseurl} =~ s/\s//g; |
|
118
|
4
|
100
|
|
|
|
26
|
$self->{rfcbaseurl} .= '/' unless substr($self->{rfcbaseurl}, -1) eq '/'; |
|
119
|
|
|
|
|
|
|
|
|
120
|
4
|
|
|
|
|
12
|
bless $self, $class; |
|
121
|
4
|
|
|
|
|
19
|
return $self; |
|
122
|
|
|
|
|
|
|
} |
|
123
|
|
|
|
|
|
|
|
|
124
|
|
|
|
|
|
|
sub _ua { |
|
125
|
5
|
|
|
5
|
|
467
|
my $self = shift; |
|
126
|
5
|
100
|
|
|
|
39
|
return $ua if $ua; |
|
127
|
|
|
|
|
|
|
|
|
128
|
2
|
|
|
|
|
30
|
$ua = LWP::UserAgent->new(timeout => 10); |
|
129
|
|
|
|
|
|
|
} |
|
130
|
|
|
|
|
|
|
|
|
131
|
|
|
|
|
|
|
sub _make_index { |
|
132
|
1
|
|
|
1
|
|
19
|
my $self = shift; |
|
133
|
1
|
|
|
|
|
4
|
my $indexpath = $self->{indexpath}; |
|
134
|
|
|
|
|
|
|
|
|
135
|
|
|
|
|
|
|
# system ("lynx -dump www.ietf.org/download/rfc-index.txt > $indexpath"); |
|
136
|
1
|
|
|
|
|
7
|
my $response = $self->_ua->get('http://www.ietf.org/download/rfc-index.txt'); |
|
137
|
1
|
50
|
|
|
|
1206544
|
if ($response->is_success) { |
|
138
|
1
|
|
|
|
|
25
|
my $fh = IO::File->new($indexpath, 'w'); |
|
139
|
1
|
|
|
|
|
247
|
print $fh $response->decoded_content; |
|
140
|
1
|
|
|
|
|
44747
|
undef $fh; |
|
141
|
|
|
|
|
|
|
} |
|
142
|
|
|
|
|
|
|
else { |
|
143
|
0
|
|
|
|
|
0
|
confess "Could not get rfc-index.txt, please try again later"; |
|
144
|
|
|
|
|
|
|
} |
|
145
|
|
|
|
|
|
|
} |
|
146
|
|
|
|
|
|
|
|
|
147
|
|
|
|
|
|
|
sub search_by_header { |
|
148
|
3
|
|
|
3
|
1
|
10687
|
my ($self, $string) = @_; |
|
149
|
3
|
100
|
|
|
|
81
|
$self->_make_index unless -e $self->{indexpath}; |
|
150
|
|
|
|
|
|
|
|
|
151
|
3
|
|
|
|
|
127
|
my $fh = IO::File->new($self->{indexpath}, "r"); |
|
152
|
|
|
|
|
|
|
|
|
153
|
3
|
|
|
|
|
414
|
my ($thing, @found_indices); |
|
154
|
3
|
|
|
|
|
6
|
my $found = 0; |
|
155
|
|
|
|
|
|
|
|
|
156
|
3
|
|
|
|
|
53376
|
for my $line(<$fh>) { |
|
157
|
85578
|
100
|
|
|
|
226473
|
if ($line !~ /^\s*$/) { |
|
158
|
63750
|
|
|
|
|
105548
|
$thing .= $line; |
|
159
|
63750
|
100
|
|
|
|
200876
|
$found = 1 if ($line =~ /$string/i); |
|
160
|
|
|
|
|
|
|
} |
|
161
|
|
|
|
|
|
|
else { |
|
162
|
21828
|
100
|
|
|
|
60136
|
$thing =~ /^(\d+)/ if $thing; |
|
163
|
21828
|
100
|
100
|
|
|
96171
|
push @found_indices, $1 if ($1 && $found); |
|
164
|
|
|
|
|
|
|
|
|
165
|
21828
|
|
|
|
|
24533
|
$found = 0; |
|
166
|
21828
|
|
|
|
|
33633
|
$thing = ''; |
|
167
|
|
|
|
|
|
|
} |
|
168
|
|
|
|
|
|
|
} |
|
169
|
|
|
|
|
|
|
|
|
170
|
3
|
|
|
|
|
7213
|
undef $fh; |
|
171
|
3
|
|
|
|
|
1520
|
return @found_indices; |
|
172
|
|
|
|
|
|
|
} |
|
173
|
|
|
|
|
|
|
|
|
174
|
|
|
|
|
|
|
sub get_by_index { |
|
175
|
3
|
|
|
3
|
1
|
7013
|
my ($self, $index, $dump_to) = @_; |
|
176
|
3
|
50
|
|
|
|
127
|
$self->_make_index unless -e $self->{indexpath}; |
|
177
|
|
|
|
|
|
|
|
|
178
|
3
|
|
|
|
|
7
|
my $rfc; |
|
179
|
3
|
50
|
|
|
|
12
|
if ($index) { |
|
180
|
3
|
|
|
|
|
15
|
my $response = $self->_download_rfc_by_index($index); |
|
181
|
3
|
100
|
|
|
|
23923
|
$rfc = $response->{error} ? $response->{error_message} : $response->{content}; |
|
182
|
|
|
|
|
|
|
} |
|
183
|
|
|
|
|
|
|
|
|
184
|
3
|
100
|
|
|
|
22
|
if ($dump_to) { |
|
185
|
1
|
|
|
|
|
15
|
my $fh = IO::File->new($dump_to, "w"); |
|
186
|
1
|
|
|
|
|
1330
|
print $fh $rfc; |
|
187
|
|
|
|
|
|
|
} |
|
188
|
|
|
|
|
|
|
|
|
189
|
3
|
|
|
|
|
33
|
return $rfc; |
|
190
|
|
|
|
|
|
|
} |
|
191
|
|
|
|
|
|
|
|
|
192
|
|
|
|
|
|
|
sub _download_rfc_by_index { |
|
193
|
3
|
|
|
3
|
|
10
|
my ($self, $index) = @_; |
|
194
|
3
|
50
|
|
|
|
16
|
if (length $index < 4) { |
|
195
|
0
|
|
|
|
|
0
|
$index = '0' . $index; |
|
196
|
|
|
|
|
|
|
} |
|
197
|
|
|
|
|
|
|
|
|
198
|
3
|
|
|
|
|
52
|
my $rfcbaseurl = $self->{rfcbaseurl}; |
|
199
|
3
|
|
|
|
|
12
|
my $url = $self->{rfcbaseurl} . "rfc" . $index . ".txt"; |
|
200
|
|
|
|
|
|
|
|
|
201
|
|
|
|
|
|
|
# `lynx -dump ${rfcbaseurl}rfc$index.txt`; |
|
202
|
3
|
|
|
|
|
16
|
my $response = $self->_ua->get($url); |
|
203
|
|
|
|
|
|
|
|
|
204
|
3
|
100
|
|
|
|
1116945
|
return $response->is_success ? |
|
205
|
|
|
|
|
|
|
{ error => 0, content => $response->decoded_content } : |
|
206
|
|
|
|
|
|
|
{ error => 1, error_code => $response->code, error_message => $response->status_line }; |
|
207
|
|
|
|
|
|
|
} |
|
208
|
|
|
|
|
|
|
|
|
209
|
|
|
|
|
|
|
1; |