line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package WWW::Spinn3r; |
2
|
2
|
|
|
2
|
|
78013
|
use base Class::Accessor; |
|
2
|
|
|
|
|
6
|
|
|
2
|
|
|
|
|
8298
|
|
3
|
2
|
|
|
2
|
|
5263
|
use base WWW::Spinn3r::Common; |
|
2
|
|
|
|
|
5
|
|
|
2
|
|
|
|
|
993
|
|
4
|
2
|
|
|
2
|
|
3913
|
use LWP::UserAgent; |
|
2
|
|
|
|
|
122121
|
|
|
2
|
|
|
|
|
75
|
|
5
|
2
|
|
|
2
|
|
1327
|
use Data::Dumper; |
|
2
|
|
|
|
|
19887
|
|
|
2
|
|
|
|
|
183
|
|
6
|
2
|
|
|
2
|
|
15
|
use Carp; |
|
2
|
|
|
|
|
5
|
|
|
2
|
|
|
|
|
121
|
|
7
|
2
|
|
|
2
|
|
1138
|
use WWW::Spinn3r::next_request_url; |
|
0
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
8
|
|
|
|
|
|
|
use WWW::Spinn3r::item; |
9
|
|
|
|
|
|
|
use WWW::Spinn3r::link; |
10
|
|
|
|
|
|
|
use File::Spec; |
11
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
__PACKAGE__->mk_accessors(qw( api api_url from_file future_sleep next_url retries retry_sleep last_url path this_cursor this_feed version want)); |
13
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
$WWW::Spinn3r::VERSION = '3.00700001'; |
15
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
our $DEFAULTS = { |
17
|
|
|
|
|
|
|
api_url => 'http://api.spinn3r.com/rss', |
18
|
|
|
|
|
|
|
debug => 0, |
19
|
|
|
|
|
|
|
retries => 60 * 60 * 24 * 10, |
20
|
|
|
|
|
|
|
retry_sleep => 3, |
21
|
|
|
|
|
|
|
future_sleep => 5, |
22
|
|
|
|
|
|
|
version => '3.0.7', |
23
|
|
|
|
|
|
|
want => 'item', |
24
|
|
|
|
|
|
|
}; |
25
|
|
|
|
|
|
|
|
26
|
|
|
|
|
|
|
|
27
|
|
|
|
|
|
|
sub new { |
28
|
|
|
|
|
|
|
|
29
|
|
|
|
|
|
|
my ($class, %args) = @_; |
30
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
my $self = bless { %$DEFAULTS, %args }, $class; |
32
|
|
|
|
|
|
|
|
33
|
|
|
|
|
|
|
if ($args{from_file}) { |
34
|
|
|
|
|
|
|
# check for file's existance |
35
|
|
|
|
|
|
|
return $self; |
36
|
|
|
|
|
|
|
} |
37
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
croak "Need vendor key" unless $args{params}->{vendor}; |
39
|
|
|
|
|
|
|
croak "Need api name" unless $args{api}; |
40
|
|
|
|
|
|
|
$self->{ua} = new LWP::UserAgent (timeout => 30); |
41
|
|
|
|
|
|
|
unless ($args{mirror}) { |
42
|
|
|
|
|
|
|
$self->{ua}->default_header('Accept-Encoding' => 'gzip'); |
43
|
|
|
|
|
|
|
} |
44
|
|
|
|
|
|
|
|
45
|
|
|
|
|
|
|
return $self; |
46
|
|
|
|
|
|
|
|
47
|
|
|
|
|
|
|
} |
48
|
|
|
|
|
|
|
|
49
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
sub mirror { |
51
|
|
|
|
|
|
|
|
52
|
|
|
|
|
|
|
my ($class, %args) = @_; |
53
|
|
|
|
|
|
|
croak "no mirror path provided" unless $args{path}; |
54
|
|
|
|
|
|
|
return $class->new(%args, mirror => 1); |
55
|
|
|
|
|
|
|
|
56
|
|
|
|
|
|
|
} |
57
|
|
|
|
|
|
|
|
58
|
|
|
|
|
|
|
|
59
|
|
|
|
|
|
|
sub first_url { |
60
|
|
|
|
|
|
|
|
61
|
|
|
|
|
|
|
my ($self) = @_; |
62
|
|
|
|
|
|
|
|
63
|
|
|
|
|
|
|
# use default version if one is not provided. |
64
|
|
|
|
|
|
|
if (defined $self->{params}->{version}) { |
65
|
|
|
|
|
|
|
$self->version($self->{params}->{version}); |
66
|
|
|
|
|
|
|
delete $self->{params}->{version}; |
67
|
|
|
|
|
|
|
} |
68
|
|
|
|
|
|
|
|
69
|
|
|
|
|
|
|
my $url = $self->api_url . '/' . $self->api . '?version=' . $self->version; |
70
|
|
|
|
|
|
|
for my $param (keys %{ $self->{params} }) { |
71
|
|
|
|
|
|
|
$url .= '&' . $param . '=' . $self->{params}->{$param}; |
72
|
|
|
|
|
|
|
} |
73
|
|
|
|
|
|
|
|
74
|
|
|
|
|
|
|
return $url; |
75
|
|
|
|
|
|
|
|
76
|
|
|
|
|
|
|
} |
77
|
|
|
|
|
|
|
|
78
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
sub _next_feed_from_http { |
80
|
|
|
|
|
|
|
|
81
|
|
|
|
|
|
|
my ($self, $url, %args) = @_; |
82
|
|
|
|
|
|
|
|
83
|
|
|
|
|
|
|
my $tries = 0; |
84
|
|
|
|
|
|
|
my $content = ''; |
85
|
|
|
|
|
|
|
|
86
|
|
|
|
|
|
|
while ($tries < $self->retries and not $content) { |
87
|
|
|
|
|
|
|
|
88
|
|
|
|
|
|
|
$tries++; |
89
|
|
|
|
|
|
|
|
90
|
|
|
|
|
|
|
my ($response, $content_file, $length); |
91
|
|
|
|
|
|
|
|
92
|
|
|
|
|
|
|
my $start = $self->start_timer(); |
93
|
|
|
|
|
|
|
if ($$self{mirror}) { |
94
|
|
|
|
|
|
|
$content_file = $self->local_file($$self{path}, $url); |
95
|
|
|
|
|
|
|
$self->debug("fetching (to file $content_file) $url"); |
96
|
|
|
|
|
|
|
$response = $self->{ua}->get($url, ':content_file' => $content_file); |
97
|
|
|
|
|
|
|
} else { |
98
|
|
|
|
|
|
|
$self->debug("fetching (to memory) $url"); |
99
|
|
|
|
|
|
|
$response = $self->{ua}->get($url); |
100
|
|
|
|
|
|
|
} |
101
|
|
|
|
|
|
|
|
102
|
|
|
|
|
|
|
my $howlong = $self->howlong($start); |
103
|
|
|
|
|
|
|
|
104
|
|
|
|
|
|
|
unless ($response->is_success) { |
105
|
|
|
|
|
|
|
$self->debug($response->status_line); |
106
|
|
|
|
|
|
|
if ($response->status_line =~ /^4\d\d/) { |
107
|
|
|
|
|
|
|
last; |
108
|
|
|
|
|
|
|
} |
109
|
|
|
|
|
|
|
$self->debug("sleeping for " . $self->retry_sleep . " seconds..."); |
110
|
|
|
|
|
|
|
sleep($self->retry_sleep); |
111
|
|
|
|
|
|
|
} else { |
112
|
|
|
|
|
|
|
$length = $$self{mirror} ? -s $content_file : length($response->content); |
113
|
|
|
|
|
|
|
$self->debug("success! $length bytes, in $howlong seconds"); |
114
|
|
|
|
|
|
|
if ($$self{mirror}) { |
115
|
|
|
|
|
|
|
$content = $content_file; |
116
|
|
|
|
|
|
|
} else { |
117
|
|
|
|
|
|
|
$content = $response->decoded_content; |
118
|
|
|
|
|
|
|
} |
119
|
|
|
|
|
|
|
} |
120
|
|
|
|
|
|
|
|
121
|
|
|
|
|
|
|
} |
122
|
|
|
|
|
|
|
|
123
|
|
|
|
|
|
|
unless ($content) { |
124
|
|
|
|
|
|
|
croak "Unable to fetch from spinn3r: $url"; |
125
|
|
|
|
|
|
|
} |
126
|
|
|
|
|
|
|
|
127
|
|
|
|
|
|
|
if ($$self{mirror}) { |
128
|
|
|
|
|
|
|
return $content; |
129
|
|
|
|
|
|
|
} else { |
130
|
|
|
|
|
|
|
return \$content; |
131
|
|
|
|
|
|
|
} |
132
|
|
|
|
|
|
|
|
133
|
|
|
|
|
|
|
} |
134
|
|
|
|
|
|
|
|
135
|
|
|
|
|
|
|
|
136
|
|
|
|
|
|
|
sub local_file { |
137
|
|
|
|
|
|
|
|
138
|
|
|
|
|
|
|
my ($self, $path, $url) = @_; |
139
|
|
|
|
|
|
|
|
140
|
|
|
|
|
|
|
my $urlpath = URI->new($url)->path; |
141
|
|
|
|
|
|
|
$urlpath =~ s|^/rss/||; |
142
|
|
|
|
|
|
|
|
143
|
|
|
|
|
|
|
my $filename .= ' ' . URI->new($url)->query; |
144
|
|
|
|
|
|
|
$filename =~ s"\W"-"sg; |
145
|
|
|
|
|
|
|
$filename = $urlpath . '-' . $filename . '.xml'; |
146
|
|
|
|
|
|
|
|
147
|
|
|
|
|
|
|
my $fullpath = File::Spec->catfile($path, $filename); |
148
|
|
|
|
|
|
|
$self->debug("mirror filename: $fullpath"); |
149
|
|
|
|
|
|
|
return $fullpath; |
150
|
|
|
|
|
|
|
|
151
|
|
|
|
|
|
|
} |
152
|
|
|
|
|
|
|
|
153
|
|
|
|
|
|
|
|
154
|
|
|
|
|
|
|
sub next_feed { |
155
|
|
|
|
|
|
|
|
156
|
|
|
|
|
|
|
my ($self) = @_; |
157
|
|
|
|
|
|
|
|
158
|
|
|
|
|
|
|
if ($self->{ua}) { |
159
|
|
|
|
|
|
|
|
160
|
|
|
|
|
|
|
my $url = $self->next_url || $self->first_url; |
161
|
|
|
|
|
|
|
|
162
|
|
|
|
|
|
|
if ($url =~ /before=$/) { # work around bug in permalink.history |
163
|
|
|
|
|
|
|
return; |
164
|
|
|
|
|
|
|
} |
165
|
|
|
|
|
|
|
|
166
|
|
|
|
|
|
|
if ($url eq $self->last_url or $url =~ /after=$/) { |
167
|
|
|
|
|
|
|
$self->debug("it's the future! will wait for present to catch up. sleeping " . $self->future_sleep . " seconds"); |
168
|
|
|
|
|
|
|
sleep($self->future_sleep); |
169
|
|
|
|
|
|
|
$self->last_url(undef); |
170
|
|
|
|
|
|
|
return $self->next_feed(); |
171
|
|
|
|
|
|
|
} |
172
|
|
|
|
|
|
|
|
173
|
|
|
|
|
|
|
my $xml = $self->_next_feed_from_http($url, %args); |
174
|
|
|
|
|
|
|
|
175
|
|
|
|
|
|
|
$self->last_url($url); |
176
|
|
|
|
|
|
|
if ($self->want eq 'item') { |
177
|
|
|
|
|
|
|
my $items = WWW::Spinn3r::item->new(stringref => $xml, debug => $self->{debug}); |
178
|
|
|
|
|
|
|
return unless $items; |
179
|
|
|
|
|
|
|
$self->this_feed($items); |
180
|
|
|
|
|
|
|
} elsif ($self->want eq 'link') { |
181
|
|
|
|
|
|
|
$self->this_feed(WWW::Spinn3r::link->new(stringref => $xml, debug => $self->{debug})); |
182
|
|
|
|
|
|
|
} |
183
|
|
|
|
|
|
|
|
184
|
|
|
|
|
|
|
} elsif ($self->{from_file}) { |
185
|
|
|
|
|
|
|
my $content_file = File::Spec->catfile($self->from_file); |
186
|
|
|
|
|
|
|
if ($self->want eq 'item') { |
187
|
|
|
|
|
|
|
$self->this_feed(WWW::Spinn3r::item->new(path => $content_file, debug => $self->{debug})); |
188
|
|
|
|
|
|
|
} elsif ($self->want eq 'link') { |
189
|
|
|
|
|
|
|
$self->this_feed(WWW::Spinn3r::link->new(path => $content_file, debug => $self->{debug})); |
190
|
|
|
|
|
|
|
} |
191
|
|
|
|
|
|
|
} |
192
|
|
|
|
|
|
|
|
193
|
|
|
|
|
|
|
} |
194
|
|
|
|
|
|
|
|
195
|
|
|
|
|
|
|
|
196
|
|
|
|
|
|
|
sub next { |
197
|
|
|
|
|
|
|
|
198
|
|
|
|
|
|
|
my ($self) = @_; |
199
|
|
|
|
|
|
|
|
200
|
|
|
|
|
|
|
unless ($self->this_feed) { |
201
|
|
|
|
|
|
|
|
202
|
|
|
|
|
|
|
$self->next_feed(); |
203
|
|
|
|
|
|
|
return undef unless $self->this_feed; # fetch failed |
204
|
|
|
|
|
|
|
$self->this_cursor(0); |
205
|
|
|
|
|
|
|
return unless $self->this_feed; |
206
|
|
|
|
|
|
|
return unless $self->this_feed->{'api:next_request_url'}; |
207
|
|
|
|
|
|
|
$self->next_url($self->this_feed->{'api:next_request_url'}); |
208
|
|
|
|
|
|
|
return $self->next(); |
209
|
|
|
|
|
|
|
|
210
|
|
|
|
|
|
|
} |
211
|
|
|
|
|
|
|
|
212
|
|
|
|
|
|
|
my $item = $self->this_feed->{$self->want}->[$self->this_cursor]; |
213
|
|
|
|
|
|
|
|
214
|
|
|
|
|
|
|
unless ($item) { |
215
|
|
|
|
|
|
|
$self->this_feed(undef); |
216
|
|
|
|
|
|
|
return undef if $self->from_file; |
217
|
|
|
|
|
|
|
return $self->next(); |
218
|
|
|
|
|
|
|
} |
219
|
|
|
|
|
|
|
|
220
|
|
|
|
|
|
|
$self->this_cursor($self->this_cursor+1); |
221
|
|
|
|
|
|
|
return $item; |
222
|
|
|
|
|
|
|
|
223
|
|
|
|
|
|
|
} |
224
|
|
|
|
|
|
|
|
225
|
|
|
|
|
|
|
|
226
|
|
|
|
|
|
|
sub next_mirror { |
227
|
|
|
|
|
|
|
|
228
|
|
|
|
|
|
|
my ($self, %args) = @_; |
229
|
|
|
|
|
|
|
|
230
|
|
|
|
|
|
|
unless ($self->{mirror}) { |
231
|
|
|
|
|
|
|
warn ("next_mirror called in non-mirror mode"); |
232
|
|
|
|
|
|
|
return; |
233
|
|
|
|
|
|
|
} |
234
|
|
|
|
|
|
|
my $url = $self->next_url || $self->first_url; |
235
|
|
|
|
|
|
|
|
236
|
|
|
|
|
|
|
if ($url eq $self->last_url or $url =~ /after=$/) { |
237
|
|
|
|
|
|
|
$self->debug("it's the future! will wait for present to catch up. sleeping " . $self->future_sleep . " seconds"); |
238
|
|
|
|
|
|
|
sleep($self->future_sleep); |
239
|
|
|
|
|
|
|
$self->last_url(undef); |
240
|
|
|
|
|
|
|
return $self->next_mirror(); |
241
|
|
|
|
|
|
|
} |
242
|
|
|
|
|
|
|
|
243
|
|
|
|
|
|
|
my $filename = $self->_next_feed_from_http($url); |
244
|
|
|
|
|
|
|
$self->last_url($url); |
245
|
|
|
|
|
|
|
my $next_url = new WWW::Spinn3r::next_request_url(path => $filename, debug => $self->{debug}); |
246
|
|
|
|
|
|
|
$self->next_url($next_url->{'api:next_request_url'}); |
247
|
|
|
|
|
|
|
|
248
|
|
|
|
|
|
|
} |
249
|
|
|
|
|
|
|
|
250
|
|
|
|
|
|
|
|
251
|
|
|
|
|
|
|
1; |
252
|
|
|
|
|
|
|
|
253
|
|
|
|
|
|
|
|
254
|
|
|
|
|
|
|
=head1 NAME |
255
|
|
|
|
|
|
|
|
256
|
|
|
|
|
|
|
WWW::Spinn3r - An interface to the Spinn3r API (http://www.spinn3r.com) |
257
|
|
|
|
|
|
|
|
258
|
|
|
|
|
|
|
=head1 SYNOPSIS |
259
|
|
|
|
|
|
|
|
260
|
|
|
|
|
|
|
use WWW::Spinn3r; |
261
|
|
|
|
|
|
|
use DateTime; |
262
|
|
|
|
|
|
|
|
263
|
|
|
|
|
|
|
my $API = { |
264
|
|
|
|
|
|
|
vendor => 'acme', # required |
265
|
|
|
|
|
|
|
limit => 5, |
266
|
|
|
|
|
|
|
lang => 'en', |
267
|
|
|
|
|
|
|
tier => '0:5', |
268
|
|
|
|
|
|
|
after => DateTime->now()->subtract(hours => 48), |
269
|
|
|
|
|
|
|
}; |
270
|
|
|
|
|
|
|
|
271
|
|
|
|
|
|
|
my $spnr = new WWW::Spinn3r ( |
272
|
|
|
|
|
|
|
api => 'permalink3.getDelta', params => $API, debug => 1); |
273
|
|
|
|
|
|
|
); |
274
|
|
|
|
|
|
|
|
275
|
|
|
|
|
|
|
while(1) { |
276
|
|
|
|
|
|
|
my $item = $spnr->next; |
277
|
|
|
|
|
|
|
print $item->{title}; |
278
|
|
|
|
|
|
|
print $item->{link}; |
279
|
|
|
|
|
|
|
print $item->{dc}->{source}; |
280
|
|
|
|
|
|
|
print $item->{description}; |
281
|
|
|
|
|
|
|
} |
282
|
|
|
|
|
|
|
|
283
|
|
|
|
|
|
|
=head1 DESCRIPTION |
284
|
|
|
|
|
|
|
|
285
|
|
|
|
|
|
|
WWW::Spinn3r is an iterative interface to the Spinn3r API. The Spinn3r API |
286
|
|
|
|
|
|
|
is implemented over REST and XML and documented at |
287
|
|
|
|
|
|
|
C. |
288
|
|
|
|
|
|
|
|
289
|
|
|
|
|
|
|
=head1 OBTAINING A VENDOR KEY |
290
|
|
|
|
|
|
|
|
291
|
|
|
|
|
|
|
Spinn3r service is available through a B key, which you can |
292
|
|
|
|
|
|
|
get from the good folks at Tailrank, C. |
293
|
|
|
|
|
|
|
|
294
|
|
|
|
|
|
|
=head1 HOW TO USE |
295
|
|
|
|
|
|
|
|
296
|
|
|
|
|
|
|
Most commonly, you'll need just two functions from this module: C |
297
|
|
|
|
|
|
|
and C. C creates a new instance of the API and C |
298
|
|
|
|
|
|
|
returns the next item from the Spinn3r feed, as hashref. Details |
299
|
|
|
|
|
|
|
are below. |
300
|
|
|
|
|
|
|
|
301
|
|
|
|
|
|
|
=head1 B |
302
|
|
|
|
|
|
|
|
303
|
|
|
|
|
|
|
The contructor. This function takes a hash with the following keys: |
304
|
|
|
|
|
|
|
|
305
|
|
|
|
|
|
|
=over 4 |
306
|
|
|
|
|
|
|
|
307
|
|
|
|
|
|
|
=item B |
308
|
|
|
|
|
|
|
|
309
|
|
|
|
|
|
|
C or C, one of the two APIs |
310
|
|
|
|
|
|
|
provided by Spinn3r. |
311
|
|
|
|
|
|
|
|
312
|
|
|
|
|
|
|
=item B |
313
|
|
|
|
|
|
|
|
314
|
|
|
|
|
|
|
These are parameters that are passed to the API call. See |
315
|
|
|
|
|
|
|
C for a list of available parameters |
316
|
|
|
|
|
|
|
and their values. |
317
|
|
|
|
|
|
|
|
318
|
|
|
|
|
|
|
The B parameter to the API is a function of version of this |
319
|
|
|
|
|
|
|
module. and the B accessor method returns the version |
320
|
|
|
|
|
|
|
of the API. By default, the version will be set to the version |
321
|
|
|
|
|
|
|
that corresponds to this module. |
322
|
|
|
|
|
|
|
|
323
|
|
|
|
|
|
|
If the version of the spinn3r API has changed, you can specify it |
324
|
|
|
|
|
|
|
as a parameter. While the module is not guranteed to work with higher |
325
|
|
|
|
|
|
|
versions of the Spinn3r API than it is designed for, it might if the |
326
|
|
|
|
|
|
|
underlying formats and encodings have not changed. |
327
|
|
|
|
|
|
|
|
328
|
|
|
|
|
|
|
=item B |
329
|
|
|
|
|
|
|
|
330
|
|
|
|
|
|
|
This parameter defines the type of item returned by the next() call. |
331
|
|
|
|
|
|
|
WWW::Spinn3r uses XML::Twig to parse the XML returned by Spinn3r and |
332
|
|
|
|
|
|
|
comes with three Twig parsers, C, |
333
|
|
|
|
|
|
|
C and C. The default |
334
|
|
|
|
|
|
|
value for C is C- , which corresponds to the
|
335
|
|
|
|
|
|
|
C module and returns all fields for an item included |
336
|
|
|
|
|
|
|
in the Spinn3r feed. |
337
|
|
|
|
|
|
|
|
338
|
|
|
|
|
|
|
The motivation for having multiple parsers is speed. If you only want |
339
|
|
|
|
|
|
|
certain fields from the feed, for example the link and title, it is |
340
|
|
|
|
|
|
|
significantly faster to write a parser that just extracts those two |
341
|
|
|
|
|
|
|
fields from the feed with XML::Twig. |
342
|
|
|
|
|
|
|
|
343
|
|
|
|
|
|
|
=item B |
344
|
|
|
|
|
|
|
|
345
|
|
|
|
|
|
|
Emits debug noise on STDOUT if set to 1. |
346
|
|
|
|
|
|
|
|
347
|
|
|
|
|
|
|
=item B |
348
|
|
|
|
|
|
|
|
349
|
|
|
|
|
|
|
The number of HTTP retries in case of a 5xx failure from the API. |
350
|
|
|
|
|
|
|
The default is 5. |
351
|
|
|
|
|
|
|
|
352
|
|
|
|
|
|
|
=back |
353
|
|
|
|
|
|
|
|
354
|
|
|
|
|
|
|
=head1 B |
355
|
|
|
|
|
|
|
|
356
|
|
|
|
|
|
|
This method returns the next item from the Spinn3r feed. The item is a |
357
|
|
|
|
|
|
|
reference to a hash, which contains the various fields of an item |
358
|
|
|
|
|
|
|
as parsed by the parser specified in the C field of the |
359
|
|
|
|
|
|
|
consutructor (C- by default).
|
360
|
|
|
|
|
|
|
|
361
|
|
|
|
|
|
|
The module transparently fetches a new set of results from Spinn3r, |
362
|
|
|
|
|
|
|
using the C returned by Spinn3r with every |
363
|
|
|
|
|
|
|
request, and caches the result to implement C. |
364
|
|
|
|
|
|
|
|
365
|
|
|
|
|
|
|
You can control the number of results that are fetched with every call |
366
|
|
|
|
|
|
|
by changing the C parameter at C. |
367
|
|
|
|
|
|
|
|
368
|
|
|
|
|
|
|
=head1 B |
369
|
|
|
|
|
|
|
|
370
|
|
|
|
|
|
|
The last API URL that was fetched. |
371
|
|
|
|
|
|
|
|
372
|
|
|
|
|
|
|
=head1 B |
373
|
|
|
|
|
|
|
|
374
|
|
|
|
|
|
|
WWW::Spinn3r supports mirroring of the Spinn3r feed to local files |
375
|
|
|
|
|
|
|
and then recreating WWW:Spinn3r objects from these files. This |
376
|
|
|
|
|
|
|
is useful if you want to distribute processing of the feeds |
377
|
|
|
|
|
|
|
over multiple processes or computers. |
378
|
|
|
|
|
|
|
|
379
|
|
|
|
|
|
|
To mirror feeds to disk, use the alternative constructor B, |
380
|
|
|
|
|
|
|
which takes all the same arguments as B plus the |
381
|
|
|
|
|
|
|
C argument, which specifies where the files should saved. |
382
|
|
|
|
|
|
|
|
383
|
|
|
|
|
|
|
my $m = mirror WWW::Spinn3r ( path => $mirror_dir, ... ) |
384
|
|
|
|
|
|
|
$m->next_mirror(); |
385
|
|
|
|
|
|
|
|
386
|
|
|
|
|
|
|
The iteration is done with B method, which stores the |
387
|
|
|
|
|
|
|
next feed to a new file, whose filename is derived from the API url. |
388
|
|
|
|
|
|
|
|
389
|
|
|
|
|
|
|
WWW::Spinn3r objects can be created from these disk files when |
390
|
|
|
|
|
|
|
new() is called with the C key: |
391
|
|
|
|
|
|
|
|
392
|
|
|
|
|
|
|
my $m = new WWW::Spinn3r ( from_file => ... ); |
393
|
|
|
|
|
|
|
|
394
|
|
|
|
|
|
|
=head1 DATE STRING FORMAT |
395
|
|
|
|
|
|
|
|
396
|
|
|
|
|
|
|
Spinn3r supports ISO 8601 timestamps in the C parameter. To |
397
|
|
|
|
|
|
|
create ISO 8601 timestamps, use the DateTime module that returns ISO |
398
|
|
|
|
|
|
|
8601 date strings by default. eg: |
399
|
|
|
|
|
|
|
|
400
|
|
|
|
|
|
|
after => DateTime->now()->subtract(hours => 48), |
401
|
|
|
|
|
|
|
after => DateTime->now()->subtract(days => 31), |
402
|
|
|
|
|
|
|
|
403
|
|
|
|
|
|
|
=head1 REPORTING BUGS |
404
|
|
|
|
|
|
|
|
405
|
|
|
|
|
|
|
Bugs should be reported at C |
406
|
|
|
|
|
|
|
|
407
|
|
|
|
|
|
|
=head1 SEE ALSO |
408
|
|
|
|
|
|
|
|
409
|
|
|
|
|
|
|
WWW::Spinn3r::Synced |
410
|
|
|
|
|
|
|
|
411
|
|
|
|
|
|
|
=head1 AUTHOR |
412
|
|
|
|
|
|
|
|
413
|
|
|
|
|
|
|
Vipul Ved Prakash |
414
|
|
|
|
|
|
|
|
415
|
|
|
|
|
|
|
=head1 LICENSE |
416
|
|
|
|
|
|
|
|
417
|
|
|
|
|
|
|
This software is distributed under the same terms as perl itself. |
418
|
|
|
|
|
|
|
|
419
|
|
|
|
|
|
|
=cut |