File Coverage

blib/lib/Mojo/Message.pm
Criterion Covered Total %
statement 171 171 100.0
branch 81 88 92.0
condition 45 56 80.3
subroutine 44 44 100.0
pod 30 30 100.0
total 371 389 95.3


line stmt bran cond sub pod time code
1             package Mojo::Message;
2 59     59   430 use Mojo::Base 'Mojo::EventEmitter';
  59         134  
  59         621  
3              
4 59     59   408 use Carp qw(croak);
  59         222  
  59         2837  
5 59     59   24899 use Mojo::Asset::Memory;
  59         194  
  59         487  
6 59     59   26659 use Mojo::Content::Single;
  59         174  
  59         558  
7 59     59   30385 use Mojo::DOM;
  59         198  
  59         2196  
8 59     59   2784 use Mojo::JSON qw(j);
  59         151  
  59         3527  
9 59     59   16490 use Mojo::JSON::Pointer;
  59         186  
  59         692  
10 59     59   8596 use Mojo::Parameters;
  59         167  
  59         590  
11 59     59   25596 use Mojo::Upload;
  59         177  
  59         458  
12 59     59   439 use Mojo::Util qw(decode);
  59         157  
  59         177426  
13              
14             has content => sub { Mojo::Content::Single->new };
15             has default_charset => 'UTF-8';
16             has max_line_size => sub { $ENV{MOJO_MAX_LINE_SIZE} || 8192 };
17             has max_message_size => sub { $ENV{MOJO_MAX_MESSAGE_SIZE} // 16777216 };
18             has version => '1.1';
19              
20             sub body {
21 1803     1803 1 11812 my $self = shift;
22              
23             # Get
24 1803         4452 my $content = $self->content;
25 1803 100       6225 return $content->is_multipart ? '' : $content->asset->slurp unless @_;
    100          
26              
27             # Set (multipart content needs to be downgraded)
28 838 100       2890 $content = $self->content(Mojo::Content::Single->new)->content if $content->is_multipart;
29 838         3709 $content->asset(Mojo::Asset::Memory->new->add_chunk(@_));
30              
31 838         1783 return $self;
32             }
33              
34             sub body_params {
35 322     322 1 642 my $self = shift;
36              
37 322 100       963 return $self->{body_params} if $self->{body_params};
38 314         1252 my $params = $self->{body_params} = Mojo::Parameters->new;
39 314   66     972 $params->charset($self->content->charset || $self->default_charset);
40              
41             # "application/x-www-form-urlencoded"
42 314   100     978 my $type = $self->headers->content_type // '';
43 314 100       1432 if ($type =~ m!application/x-www-form-urlencoded!i) {
    100          
44 42         164 $params->parse($self->content->asset->slurp);
45             }
46              
47             # "multipart/form-data"
48             elsif ($type =~ m!multipart/form-data!i) {
49 30         55 $params->append(@$_[0, 1]) for @{$self->_parse_formdata};
  30         252  
50             }
51              
52 314         1075 return $params;
53             }
54              
55 1870     1870 1 4068 sub body_size { shift->content->body_size }
56              
57 45     45 1 123 sub build_body { shift->_build('get_body_chunk') }
58 43     43 1 102 sub build_headers { shift->_build('get_header_chunk') }
59 43     43 1 112 sub build_start_line { shift->_build('get_start_line_chunk') }
60              
61 122     122 1 380 sub cookie { shift->_cache('cookies', 0, @_) }
62              
63 1     1 1 2566 sub cookies { croak 'Method "cookies" not implemented by subclass' }
64              
65             sub dom {
66 131     131 1 1486 my $self = shift;
67 131 50       343 return undef if $self->content->is_multipart;
68 131   66     650 my $dom = $self->{dom} ||= Mojo::DOM->new($self->text);
69 131 100       698 return @_ ? $dom->find(@_) : $dom;
70             }
71              
72             sub error {
73 8377     8377 1 12935 my $self = shift;
74 8377 100       40175 return $self->{error} unless @_;
75 166         535 $self->{error} = shift;
76 166         438 return $self->finish;
77             }
78              
79 241     241 1 698 sub every_cookie { shift->_cache('cookies', 1, @_) }
80 313     313 1 991 sub every_upload { shift->_cache('uploads', 1, @_) }
81              
82 1     1 1 760 sub extract_start_line { croak 'Method "extract_start_line" not implemented by subclass' }
83              
84             sub finish {
85 5035     5035 1 7913 my $self = shift;
86 5035         9490 $self->{state} = 'finished';
87 5035 100       17998 return $self->{finished}++ ? $self : $self->emit('finish');
88             }
89              
90             sub fix_headers {
91 1931     1931 1 3142 my $self = shift;
92 1931 50       6693 return $self if $self->{fix}++;
93              
94             # Content-Length or Connection (unless chunked transfer encoding is used)
95 1931         4848 my $content = $self->content;
96 1931         5320 my $headers = $content->headers;
97 1931 100 100     5559 if ($content->is_multipart) { $headers->remove('Content-Length') }
  22 100       113  
98 45         152 elsif ($content->is_chunked || $headers->content_length) { return $self }
99 1886 100       5628 if ($content->is_dynamic) { $headers->connection('close') }
  19         62  
100 1867         5032 else { $headers->content_length($self->body_size) }
101              
102 1886         4526 return $self;
103             }
104              
105             sub get_body_chunk {
106 2983     2983 1 5200 my ($self, $offset) = @_;
107              
108 2983         8528 $self->emit('progress', 'body', $offset);
109 2983         6765 my $chunk = $self->content->get_body_chunk($offset);
110 2982 100 100     13379 return $chunk if !defined $chunk || length $chunk;
111 1843         5519 $self->finish;
112              
113 1843         4540 return $chunk;
114             }
115              
116             sub get_header_chunk {
117 1972     1972 1 3557 my ($self, $offset) = @_;
118 1972         6566 $self->emit('progress', 'headers', $offset);
119 1972         5058 return $self->fix_headers->content->get_header_chunk($offset);
120             }
121              
122 1     1 1 734 sub get_start_line_chunk { croak 'Method "get_start_line_chunk" not implemented by subclass' }
123              
124 1868     1868 1 5506 sub header_size { shift->fix_headers->content->header_size }
125              
126 21574     21574 1 48408 sub headers { shift->content->headers }
127              
128 3766   100 3766 1 20858 sub is_finished { (shift->{state} // '') eq 'finished' }
129              
130 22     22 1 133 sub is_limit_exceeded { !!shift->{limit} }
131              
132             sub json {
133 74     74 1 216 my ($self, $pointer) = @_;
134 74 50       217 return undef if $self->content->is_multipart;
135 74   100     334 my $data = $self->{json} //= j($self->body);
136 74 100       443 return $pointer ? Mojo::JSON::Pointer->new($data)->get($pointer) : $data;
137             }
138              
139             sub parse {
140 2698     2698 1 6281 my ($self, $chunk) = @_;
141              
142 2698 100       6243 return $self if $self->{error};
143 2696         6121 $self->{raw_size} += length $chunk;
144 2696         10795 $self->{buffer} .= $chunk;
145              
146             # Start-line
147 2696 100       6499 unless ($self->{state}) {
148              
149             # Check start-line size
150 2050         5043 my $len = index $self->{buffer}, "\x0a";
151 2050 100       4567 $len = length $self->{buffer} if $len < 0;
152 2050 100       5631 return $self->_limit('Maximum start-line size exceeded') if $len > $self->max_line_size;
153              
154 2047 100       7719 $self->{state} = 'content' if $self->extract_start_line(\$self->{buffer});
155             }
156              
157             # Content
158 2693   100     7625 my $state = $self->{state} // '';
159 2693 100 100     10767 $self->content($self->content->parse(delete $self->{buffer})) if $state eq 'content' || $state eq 'finished';
160              
161             # Check message size
162 2693         8169 my $max = $self->max_message_size;
163 2693 100 100     9838 return $self->_limit('Maximum message size exceeded') if $max && $max < $self->{raw_size};
164              
165             # Check header size
166 2687 100       5991 return $self->_limit('Maximum header size exceeded') if $self->headers->is_limit_exceeded;
167              
168             # Check buffer size
169 2682 100       6382 return $self->_limit('Maximum buffer size exceeded') if $self->content->is_limit_exceeded;
170              
171 2679 100       7663 return $self->emit('progress')->content->is_finished ? $self->finish : $self;
172             }
173              
174             sub save_to {
175 2     2 1 23 my ($self, $path) = @_;
176 2         9 my $content = $self->content;
177 2 100       13 croak 'Multipart content cannot be saved to files' if $content->is_multipart;
178 1         4 $content->asset->move_to($path);
179 1         5 return $self;
180             }
181              
182 1     1 1 774 sub start_line_size { croak 'Method "start_line_size" not implemented by subclass' }
183              
184             sub text {
185 670     670 1 1716 my $self = shift;
186 670         1798 my $body = $self->body;
187 670   66     2215 my $charset = $self->content->charset || $self->default_charset;
188 670 50 66     2870 return $charset ? decode($charset, $body) // $body : $body;
189             }
190              
191             sub to_string {
192 41     41 1 76 my $self = shift;
193 41         107 return $self->build_start_line . $self->build_headers . $self->build_body;
194             }
195              
196 32     32 1 129 sub upload { shift->_cache('uploads', 0, @_) }
197              
198             sub uploads {
199 260     260 1 471 my $self = shift;
200              
201 260         417 my @uploads;
202 260         417 for my $data (@{$self->_parse_formdata(1)}) {
  260         731  
203 34         141 my $upload = Mojo::Upload->new(
204             name => $data->[0],
205             filename => $data->[2],
206             asset => $data->[1]->asset,
207             headers => $data->[1]->headers
208             );
209 34         112 push @uploads, $upload;
210             }
211              
212 260         1020 return \@uploads;
213             }
214              
215             sub _build {
216 131     131   225 my ($self, $method) = @_;
217              
218 131         227 my ($buffer, $offset) = ('', 0);
219 131         173 while (1) {
220              
221             # No chunk yet, try again
222 278 100       721 next unless defined(my $chunk = $self->$method($offset));
223              
224             # End of part
225 277 100       619 last unless my $len = length $chunk;
226              
227 146         207 $offset += $len;
228 146         305 $buffer .= $chunk;
229             }
230              
231 131         595 return $buffer;
232             }
233              
234             sub _cache {
235 708     708   1593 my ($self, $method, $all, $name) = @_;
236              
237             # Cache objects by name
238 708 100       1828 unless ($self->{$method}) {
239 337         897 $self->{$method} = {};
240 337         587 push @{$self->{$method}{$_->name}}, $_ for @{$self->$method};
  337         1332  
  183         572  
241             }
242              
243 708   100     2671 my $objects = $self->{$method}{$name} // [];
244 708 100       2992 return $all ? $objects : $objects->[-1];
245             }
246              
247 17 50   17   110 sub _limit { ++$_[0]{limit} and return $_[0]->error({message => $_[1]}) }
248              
249             sub _parse_formdata {
250 290     290   621 my ($self, $upload) = @_;
251              
252 290         431 my @formdata;
253 290         788 my $content = $self->content;
254 290 100       1197 return \@formdata unless $content->is_multipart;
255 61   66     217 my $charset = $content->charset || $self->default_charset;
256              
257             # Check all parts recursively
258 61         157 my @parts = ($content);
259 61         194 while (my $part = shift @parts) {
260              
261 212 100       535 if ($part->is_multipart) {
262 61         105 unshift @parts, @{$part->parts};
  61         155  
263 61         187 next;
264             }
265              
266 151 50       322 next unless my $disposition = $part->headers->content_disposition;
267 151         662 my ($filename) = $disposition =~ /[; ]filename="((?:\\"|[^"])*)"/;
268 151 100 100     850 next if $upload && !defined $filename || !$upload && defined $filename;
      100        
      100        
269 89         496 my ($name) = $disposition =~ /[; ]name="((?:\\"|[^;"])*)"/;
270 89 100       219 next if !defined $name;
271 88 100       293 $part = $part->asset->slurp unless $upload;
272              
273 88 50       201 if ($charset) {
274 88 100 33     342 $name = decode($charset, $name) // $name if $name;
275 88 100 33     254 $filename = decode($charset, $filename) // $filename if $filename;
276 88 100 33     242 $part = decode($charset, $part) // $part unless $upload;
277             }
278              
279 88         390 push @formdata, [$name, $part, $filename];
280             }
281              
282 61         341 return \@formdata;
283             }
284              
285             1;
286              
287             =encoding utf8
288              
289             =head1 NAME
290              
291             Mojo::Message - HTTP message base class
292              
293             =head1 SYNOPSIS
294              
295             package Mojo::Message::MyMessage;
296             use Mojo::Base 'Mojo::Message';
297              
298             sub cookies {...}
299             sub extract_start_line {...}
300             sub get_start_line_chunk {...}
301             sub start_line_size {...}
302              
303             =head1 DESCRIPTION
304              
305             L is an abstract base class for HTTP message containers, based on L
306             7230|https://tools.ietf.org/html/rfc7230>, L and L
307             2388|https://tools.ietf.org/html/rfc2388>, like L and L.
308              
309             =head1 EVENTS
310              
311             L inherits all events from L and can emit the following new ones.
312              
313             =head2 finish
314              
315             $msg->on(finish => sub ($msg) {...});
316              
317             Emitted after message building or parsing is finished.
318              
319             my $before = time;
320             $msg->on(finish => sub ($msg) { $msg->headers->header('X-Parser-Time' => time - $before) });
321              
322             =head2 progress
323              
324             $msg->on(progress => sub ($msg) {...});
325              
326             Emitted when message building or parsing makes progress.
327              
328             # Building
329             $msg->on(progress => sub ($msg, $state, $offset) { say qq{Building "$state" at offset $offset} });
330              
331             # Parsing
332             $msg->on(progress => sub ($msg) {
333             return unless my $len = $msg->headers->content_length;
334             my $size = $msg->content->progress;
335             say 'Progress: ', $size == $len ? 100 : int($size / ($len / 100)), '%';
336             });
337              
338             =head1 ATTRIBUTES
339              
340             L implements the following attributes.
341              
342             =head2 content
343              
344             my $msg = $msg->content;
345             $msg = $msg->content(Mojo::Content::Single->new);
346              
347             Message content, defaults to a L object.
348              
349             =head2 default_charset
350              
351             my $charset = $msg->default_charset;
352             $msg = $msg->default_charset('UTF-8');
353              
354             Default charset used by L and to extract data from C or
355             C message body, defaults to C.
356              
357             =head2 max_line_size
358              
359             my $size = $msg->max_line_size;
360             $msg = $msg->max_line_size(1024);
361              
362             Maximum start-line size in bytes, defaults to the value of the C environment variable or C<8192>
363             (8KiB).
364              
365             =head2 max_message_size
366              
367             my $size = $msg->max_message_size;
368             $msg = $msg->max_message_size(1024);
369              
370             Maximum message size in bytes, defaults to the value of the C environment variable or
371             C<16777216> (16MiB). Setting the value to C<0> will allow messages of indefinite size.
372              
373             =head2 version
374              
375             my $version = $msg->version;
376             $msg = $msg->version('1.1');
377              
378             HTTP version of message, defaults to C<1.1>.
379              
380             =head1 METHODS
381              
382             L inherits all methods from L and implements the following new ones.
383              
384             =head2 body
385              
386             my $bytes = $msg->body;
387             $msg = $msg->body('Hello!');
388              
389             Slurp or replace L.
390              
391             =head2 body_params
392              
393             my $params = $msg->body_params;
394              
395             C parameters extracted from C or C message body, usually
396             a L object. Note that this method caches all data, so it should not be called before the entire
397             message body has been received. Parts of the message body need to be loaded into memory to parse C parameters, so
398             you have to make sure it is not excessively large. There's a 16MiB limit for requests and a 2GiB limit for responses by
399             default.
400              
401             # Get POST parameter names and values
402             my $hash = $msg->body_params->to_hash;
403              
404             =head2 body_size
405              
406             my $size = $msg->body_size;
407              
408             Content size in bytes.
409              
410             =head2 build_body
411              
412             my $bytes = $msg->build_body;
413              
414             Render whole body with L.
415              
416             =head2 build_headers
417              
418             my $bytes = $msg->build_headers;
419              
420             Render all headers with L.
421              
422             =head2 build_start_line
423              
424             my $bytes = $msg->build_start_line;
425              
426             Render start-line with L.
427              
428             =head2 cookie
429              
430             my $cookie = $msg->cookie('foo');
431              
432             Access message cookies, usually L or L objects. If there are multiple
433             cookies sharing the same name, and you want to access more than just the last one, you can use L. Note
434             that this method caches all data, so it should not be called before all headers have been received.
435              
436             # Get cookie value
437             say $msg->cookie('foo')->value;
438              
439             =head2 cookies
440              
441             my $cookies = $msg->cookies;
442              
443             Access message cookies. Meant to be overloaded in a subclass.
444              
445             =head2 dom
446              
447             my $dom = $msg->dom;
448             my $collection = $msg->dom('a[href]');
449              
450             Retrieve message body from L and turn it into a L object, an optional selector can be used to call
451             the method L on it right away, which then returns a L object. Note that this method
452             caches all data, so it should not be called before the entire message body has been received. The whole message body
453             needs to be loaded into memory to parse it, so you have to make sure it is not excessively large. There's a 16MiB limit
454             for requests and a 2GiB limit for responses by default.
455              
456             # Perform "find" right away
457             say $msg->dom('h1, h2, h3')->map('text')->join("\n");
458              
459             # Use everything else Mojo::DOM has to offer
460             say $msg->dom->at('title')->text;
461             say $msg->dom->at('body')->children->map('tag')->uniq->join("\n");
462              
463             =head2 error
464              
465             my $err = $msg->error;
466             $msg = $msg->error({message => 'Parser error'});
467              
468             Get or set message error, an C return value indicates that there is no error.
469              
470             # Connection or parser error
471             $msg->error({message => 'Connection refused'});
472              
473             # 4xx/5xx response
474             $msg->error({message => 'Internal Server Error', code => 500});
475              
476             =head2 every_cookie
477              
478             my $cookies = $msg->every_cookie('foo');
479              
480             Similar to L, but returns all message cookies sharing the same name as an array reference.
481              
482             # Get first cookie value
483             say $msg->every_cookie('foo')->[0]->value;
484              
485             =head2 every_upload
486              
487             my $uploads = $msg->every_upload('foo');
488              
489             Similar to L, but returns all file uploads sharing the same name as an array reference.
490              
491             # Get content of first uploaded file
492             say $msg->every_upload('foo')->[0]->asset->slurp;
493              
494             =head2 extract_start_line
495              
496             my $bool = $msg->extract_start_line(\$str);
497              
498             Extract start-line from string. Meant to be overloaded in a subclass.
499              
500             =head2 finish
501              
502             $msg = $msg->finish;
503              
504             Finish message parser/generator.
505              
506             =head2 fix_headers
507              
508             $msg = $msg->fix_headers;
509              
510             Make sure message has all required headers.
511              
512             =head2 get_body_chunk
513              
514             my $bytes = $msg->get_body_chunk($offset);
515              
516             Get a chunk of body data starting from a specific position. Note that it might not be possible to get the same chunk
517             twice if content was generated dynamically.
518              
519             =head2 get_header_chunk
520              
521             my $bytes = $msg->get_header_chunk($offset);
522              
523             Get a chunk of header data, starting from a specific position. Note that this method finalizes the message.
524              
525             =head2 get_start_line_chunk
526              
527             my $bytes = $msg->get_start_line_chunk($offset);
528              
529             Get a chunk of start-line data starting from a specific position. Meant to be overloaded in a subclass.
530              
531             =head2 header_size
532              
533             my $size = $msg->header_size;
534              
535             Size of headers in bytes. Note that this method finalizes the message.
536              
537             =head2 headers
538              
539             my $headers = $msg->headers;
540              
541             Message headers, usually a L object.
542              
543             # Longer version
544             my $headers = $msg->content->headers;
545              
546             =head2 is_finished
547              
548             my $bool = $msg->is_finished;
549              
550             Check if message parser/generator is finished.
551              
552             =head2 is_limit_exceeded
553              
554             my $bool = $msg->is_limit_exceeded;
555              
556             Check if message has exceeded L, L, L or
557             L.
558              
559             =head2 json
560              
561             my $value = $msg->json;
562             my $value = $msg->json('/foo/bar');
563              
564             Decode JSON message body directly using L if possible, an C return value indicates a bare C or
565             that decoding failed. An optional JSON Pointer can be used to extract a specific value with L.
566             Note that this method caches all data, so it should not be called before the entire message body has been received. The
567             whole message body needs to be loaded into memory to parse it, so you have to make sure it is not excessively large.
568             There's a 16MiB limit for requests and a 2GiB limit for responses by default.
569              
570             # Extract JSON values
571             say $msg->json->{foo}{bar}[23];
572             say $msg->json('/foo/bar/23');
573              
574             =head2 parse
575              
576             $msg = $msg->parse('HTTP/1.1 200 OK...');
577              
578             Parse message chunk.
579              
580             =head2 save_to
581              
582             $msg = $msg->save_to('/some/path/index.html');
583              
584             Save message body to a file.
585              
586             =head2 start_line_size
587              
588             my $size = $msg->start_line_size;
589              
590             Size of the start-line in bytes. Meant to be overloaded in a subclass.
591              
592             =head2 text
593              
594             my $str = $msg->text;
595              
596             Retrieve L and try to decode it with L or L.
597              
598             =head2 to_string
599              
600             my $str = $msg->to_string;
601              
602             Render whole message. Note that this method finalizes the message, and that it might not be possible to render the same
603             message twice if content was generated dynamically.
604              
605             =head2 upload
606              
607             my $upload = $msg->upload('foo');
608              
609             Access C file uploads, usually L objects. If there are multiple uploads sharing the
610             same name, and you want to access more than just the last one, you can use L. Note that this method
611             caches all data, so it should not be called before the entire message body has been received.
612              
613             # Get content of uploaded file
614             say $msg->upload('foo')->asset->slurp;
615              
616             =head2 uploads
617              
618             my $uploads = $msg->uploads;
619              
620             All C file uploads, usually L objects.
621              
622             # Names of all uploads
623             say $_->name for @{$msg->uploads};
624              
625             =head1 SEE ALSO
626              
627             L, L, L.
628              
629             =cut