File Coverage

blib/lib/Mojo/Message.pm
Criterion Covered Total %
statement 171 171 100.0
branch 81 88 92.0
condition 45 56 80.3
subroutine 44 44 100.0
pod 30 30 100.0
total 371 389 95.3


line stmt bran cond sub pod time code
1             package Mojo::Message;
2 59     59   441 use Mojo::Base 'Mojo::EventEmitter';
  59         118  
  59         691  
3              
4 59     59   426 use Carp qw(croak);
  59         291  
  59         3030  
5 59     59   25913 use Mojo::Asset::Memory;
  59         194  
  59         510  
6 59     59   26815 use Mojo::Content::Single;
  59         240  
  59         626  
7 59     59   31611 use Mojo::DOM;
  59         266  
  59         2326  
8 59     59   2790 use Mojo::JSON qw(j);
  59         163  
  59         3620  
9 59     59   17366 use Mojo::JSON::Pointer;
  59         199  
  59         740  
10 59     59   8696 use Mojo::Parameters;
  59         154  
  59         669  
11 59     59   26183 use Mojo::Upload;
  59         198  
  59         498  
12 59     59   455 use Mojo::Util qw(decode);
  59         158  
  59         183825  
13              
14             has content => sub { Mojo::Content::Single->new };
15             has default_charset => 'UTF-8';
16             has max_line_size => sub { $ENV{MOJO_MAX_LINE_SIZE} || 8192 };
17             has max_message_size => sub { $ENV{MOJO_MAX_MESSAGE_SIZE} // 16777216 };
18             has version => '1.1';
19              
20             sub body {
21 1803     1803 1 10972 my $self = shift;
22              
23             # Get
24 1803         4701 my $content = $self->content;
25 1803 100       6430 return $content->is_multipart ? '' : $content->asset->slurp unless @_;
    100          
26              
27             # Set (multipart content needs to be downgraded)
28 838 100       3167 $content = $self->content(Mojo::Content::Single->new)->content if $content->is_multipart;
29 838         3910 $content->asset(Mojo::Asset::Memory->new->add_chunk(@_));
30              
31 838         1888 return $self;
32             }
33              
34             sub body_params {
35 322     322 1 612 my $self = shift;
36              
37 322 100       941 return $self->{body_params} if $self->{body_params};
38 314         1241 my $params = $self->{body_params} = Mojo::Parameters->new;
39 314   66     1009 $params->charset($self->content->charset || $self->default_charset);
40              
41             # "application/x-www-form-urlencoded"
42 314   100     1055 my $type = $self->headers->content_type // '';
43 314 100       1542 if ($type =~ m!application/x-www-form-urlencoded!i) {
    100          
44 42         146 $params->parse($self->content->asset->slurp);
45             }
46              
47             # "multipart/form-data"
48             elsif ($type =~ m!multipart/form-data!i) {
49 30         62 $params->append(@$_[0, 1]) for @{$self->_parse_formdata};
  30         352  
50             }
51              
52 314         1058 return $params;
53             }
54              
55 1870     1870 1 4122 sub body_size { shift->content->body_size }
56              
57 45     45 1 106 sub build_body { shift->_build('get_body_chunk') }
58 43     43 1 96 sub build_headers { shift->_build('get_header_chunk') }
59 43     43 1 116 sub build_start_line { shift->_build('get_start_line_chunk') }
60              
61 122     122 1 384 sub cookie { shift->_cache('cookies', 0, @_) }
62              
63 1     1 1 2586 sub cookies { croak 'Method "cookies" not implemented by subclass' }
64              
65             sub dom {
66 131     131 1 1230 my $self = shift;
67 131 50       389 return undef if $self->content->is_multipart;
68 131   66     573 my $dom = $self->{dom} ||= Mojo::DOM->new($self->text);
69 131 100       705 return @_ ? $dom->find(@_) : $dom;
70             }
71              
72             sub error {
73 8348     8348 1 12884 my $self = shift;
74 8348 100       40541 return $self->{error} unless @_;
75 166         512 $self->{error} = shift;
76 166         564 return $self->finish;
77             }
78              
79 241     241 1 762 sub every_cookie { shift->_cache('cookies', 1, @_) }
80 313     313 1 1062 sub every_upload { shift->_cache('uploads', 1, @_) }
81              
82 1     1 1 849 sub extract_start_line { croak 'Method "extract_start_line" not implemented by subclass' }
83              
84             sub finish {
85 5035     5035 1 7942 my $self = shift;
86 5035         9510 $self->{state} = 'finished';
87 5035 100       18332 return $self->{finished}++ ? $self : $self->emit('finish');
88             }
89              
90             sub fix_headers {
91 1931     1931 1 3166 my $self = shift;
92 1931 50       6787 return $self if $self->{fix}++;
93              
94             # Content-Length or Connection (unless chunked transfer encoding is used)
95 1931         5211 my $content = $self->content;
96 1931         5760 my $headers = $content->headers;
97 1931 100 100     6049 if ($content->is_multipart) { $headers->remove('Content-Length') }
  22 100       108  
98 45         156 elsif ($content->is_chunked || $headers->content_length) { return $self }
99 1886 100       5950 if ($content->is_dynamic) { $headers->connection('close') }
  19         82  
100 1867         5473 else { $headers->content_length($self->body_size) }
101              
102 1886         4753 return $self;
103             }
104              
105             sub get_body_chunk {
106 2983     2983 1 5656 my ($self, $offset) = @_;
107              
108 2983         8788 $self->emit('progress', 'body', $offset);
109 2983         6938 my $chunk = $self->content->get_body_chunk($offset);
110 2982 100 100     13849 return $chunk if !defined $chunk || length $chunk;
111 1843         5972 $self->finish;
112              
113 1843         4643 return $chunk;
114             }
115              
116             sub get_header_chunk {
117 1972     1972 1 3745 my ($self, $offset) = @_;
118 1972         7021 $self->emit('progress', 'headers', $offset);
119 1972         5625 return $self->fix_headers->content->get_header_chunk($offset);
120             }
121              
122 1     1 1 838 sub get_start_line_chunk { croak 'Method "get_start_line_chunk" not implemented by subclass' }
123              
124 1868     1868 1 5952 sub header_size { shift->fix_headers->content->header_size }
125              
126 21541     21541 1 48832 sub headers { shift->content->headers }
127              
128 3704   100 3704 1 21161 sub is_finished { (shift->{state} // '') eq 'finished' }
129              
130 22     22 1 125 sub is_limit_exceeded { !!shift->{limit} }
131              
132             sub json {
133 74     74 1 204 my ($self, $pointer) = @_;
134 74 50       233 return undef if $self->content->is_multipart;
135 74   100     307 my $data = $self->{json} //= j($self->body);
136 74 100       455 return $pointer ? Mojo::JSON::Pointer->new($data)->get($pointer) : $data;
137             }
138              
139             sub parse {
140 2665     2665 1 6185 my ($self, $chunk) = @_;
141              
142 2665 100       6161 return $self if $self->{error};
143 2663         6215 $self->{raw_size} += length $chunk;
144 2663         10385 $self->{buffer} .= $chunk;
145              
146             # Start-line
147 2663 100       6064 unless ($self->{state}) {
148              
149             # Check start-line size
150 2050         5189 my $len = index $self->{buffer}, "\x0a";
151 2050 100       4499 $len = length $self->{buffer} if $len < 0;
152 2050 100       5739 return $self->_limit('Maximum start-line size exceeded') if $len > $self->max_line_size;
153              
154 2047 100       8244 $self->{state} = 'content' if $self->extract_start_line(\$self->{buffer});
155             }
156              
157             # Content
158 2660   100     7565 my $state = $self->{state} // '';
159 2660 100 100     10566 $self->content($self->content->parse(delete $self->{buffer})) if $state eq 'content' || $state eq 'finished';
160              
161             # Check message size
162 2660         8478 my $max = $self->max_message_size;
163 2660 100 100     10012 return $self->_limit('Maximum message size exceeded') if $max && $max < $self->{raw_size};
164              
165             # Check header size
166 2654 100       5905 return $self->_limit('Maximum header size exceeded') if $self->headers->is_limit_exceeded;
167              
168             # Check buffer size
169 2649 100       6702 return $self->_limit('Maximum buffer size exceeded') if $self->content->is_limit_exceeded;
170              
171 2646 100       7590 return $self->emit('progress')->content->is_finished ? $self->finish : $self;
172             }
173              
174             sub save_to {
175 2     2 1 21 my ($self, $path) = @_;
176 2         8 my $content = $self->content;
177 2 100       9 croak 'Multipart content cannot be saved to files' if $content->is_multipart;
178 1         4 $content->asset->move_to($path);
179 1         5 return $self;
180             }
181              
182 1     1 1 819 sub start_line_size { croak 'Method "start_line_size" not implemented by subclass' }
183              
184             sub text {
185 670     670 1 1756 my $self = shift;
186 670         1961 my $body = $self->body;
187 670   66     2540 my $charset = $self->content->charset || $self->default_charset;
188 670 50 66     3113 return $charset ? decode($charset, $body) // $body : $body;
189             }
190              
191             sub to_string {
192 41     41 1 81 my $self = shift;
193 41         109 return $self->build_start_line . $self->build_headers . $self->build_body;
194             }
195              
196 32     32 1 140 sub upload { shift->_cache('uploads', 0, @_) }
197              
198             sub uploads {
199 260     260 1 488 my $self = shift;
200              
201 260         449 my @uploads;
202 260         465 for my $data (@{$self->_parse_formdata(1)}) {
  260         754  
203 34         159 my $upload = Mojo::Upload->new(
204             name => $data->[0],
205             filename => $data->[2],
206             asset => $data->[1]->asset,
207             headers => $data->[1]->headers
208             );
209 34         110 push @uploads, $upload;
210             }
211              
212 260         1129 return \@uploads;
213             }
214              
215             sub _build {
216 131     131   221 my ($self, $method) = @_;
217              
218 131         258 my ($buffer, $offset) = ('', 0);
219 131         170 while (1) {
220              
221             # No chunk yet, try again
222 278 100       689 next unless defined(my $chunk = $self->$method($offset));
223              
224             # End of part
225 277 100       685 last unless my $len = length $chunk;
226              
227 146         210 $offset += $len;
228 146         312 $buffer .= $chunk;
229             }
230              
231 131         555 return $buffer;
232             }
233              
234             sub _cache {
235 708     708   1659 my ($self, $method, $all, $name) = @_;
236              
237             # Cache objects by name
238 708 100       2045 unless ($self->{$method}) {
239 337         986 $self->{$method} = {};
240 337         608 push @{$self->{$method}{$_->name}}, $_ for @{$self->$method};
  337         1436  
  183         565  
241             }
242              
243 708   100     2769 my $objects = $self->{$method}{$name} // [];
244 708 100       3250 return $all ? $objects : $objects->[-1];
245             }
246              
247 17 50   17   114 sub _limit { ++$_[0]{limit} and return $_[0]->error({message => $_[1]}) }
248              
249             sub _parse_formdata {
250 290     290   623 my ($self, $upload) = @_;
251              
252 290         479 my @formdata;
253 290         831 my $content = $self->content;
254 290 100       1282 return \@formdata unless $content->is_multipart;
255 61   66     215 my $charset = $content->charset || $self->default_charset;
256              
257             # Check all parts recursively
258 61         169 my @parts = ($content);
259 61         208 while (my $part = shift @parts) {
260              
261 212 100       538 if ($part->is_multipart) {
262 61         107 unshift @parts, @{$part->parts};
  61         157  
263 61         206 next;
264             }
265              
266 151 50       358 next unless my $disposition = $part->headers->content_disposition;
267 151         716 my ($filename) = $disposition =~ /[; ]filename="((?:\\"|[^"])*)"/;
268 151 100 100     861 next if $upload && !defined $filename || !$upload && defined $filename;
      100        
      100        
269 89         535 my ($name) = $disposition =~ /[; ]name="((?:\\"|[^;"])*)"/;
270 89 100       275 next if !defined $name;
271 88 100       281 $part = $part->asset->slurp unless $upload;
272              
273 88 50       203 if ($charset) {
274 88 100 33     327 $name = decode($charset, $name) // $name if $name;
275 88 100 33     245 $filename = decode($charset, $filename) // $filename if $filename;
276 88 100 33     245 $part = decode($charset, $part) // $part unless $upload;
277             }
278              
279 88         393 push @formdata, [$name, $part, $filename];
280             }
281              
282 61         304 return \@formdata;
283             }
284              
285             1;
286              
287             =encoding utf8
288              
289             =head1 NAME
290              
291             Mojo::Message - HTTP message base class
292              
293             =head1 SYNOPSIS
294              
295             package Mojo::Message::MyMessage;
296             use Mojo::Base 'Mojo::Message';
297              
298             sub cookies {...}
299             sub extract_start_line {...}
300             sub get_start_line_chunk {...}
301             sub start_line_size {...}
302              
303             =head1 DESCRIPTION
304              
305             L is an abstract base class for HTTP message containers, based on L
306             7230|https://tools.ietf.org/html/rfc7230>, L and L
307             2388|https://tools.ietf.org/html/rfc2388>, like L and L.
308              
309             =head1 EVENTS
310              
311             L inherits all events from L and can emit the following new ones.
312              
313             =head2 finish
314              
315             $msg->on(finish => sub ($msg) {...});
316              
317             Emitted after message building or parsing is finished.
318              
319             my $before = time;
320             $msg->on(finish => sub ($msg) { $msg->headers->header('X-Parser-Time' => time - $before) });
321              
322             =head2 progress
323              
324             $msg->on(progress => sub ($msg) {...});
325              
326             Emitted when message building or parsing makes progress.
327              
328             # Building
329             $msg->on(progress => sub ($msg, $state, $offset) { say qq{Building "$state" at offset $offset} });
330              
331             # Parsing
332             $msg->on(progress => sub ($msg) {
333             return unless my $len = $msg->headers->content_length;
334             my $size = $msg->content->progress;
335             say 'Progress: ', $size == $len ? 100 : int($size / ($len / 100)), '%';
336             });
337              
338             =head1 ATTRIBUTES
339              
340             L implements the following attributes.
341              
342             =head2 content
343              
344             my $msg = $msg->content;
345             $msg = $msg->content(Mojo::Content::Single->new);
346              
347             Message content, defaults to a L object.
348              
349             =head2 default_charset
350              
351             my $charset = $msg->default_charset;
352             $msg = $msg->default_charset('UTF-8');
353              
354             Default charset used by L and to extract data from C or
355             C message body, defaults to C.
356              
357             =head2 max_line_size
358              
359             my $size = $msg->max_line_size;
360             $msg = $msg->max_line_size(1024);
361              
362             Maximum start-line size in bytes, defaults to the value of the C environment variable or C<8192>
363             (8KiB).
364              
365             =head2 max_message_size
366              
367             my $size = $msg->max_message_size;
368             $msg = $msg->max_message_size(1024);
369              
370             Maximum message size in bytes, defaults to the value of the C environment variable or
371             C<16777216> (16MiB). Setting the value to C<0> will allow messages of indefinite size.
372              
373             =head2 version
374              
375             my $version = $msg->version;
376             $msg = $msg->version('1.1');
377              
378             HTTP version of message, defaults to C<1.1>.
379              
380             =head1 METHODS
381              
382             L inherits all methods from L and implements the following new ones.
383              
384             =head2 body
385              
386             my $bytes = $msg->body;
387             $msg = $msg->body('Hello!');
388              
389             Slurp or replace L.
390              
391             =head2 body_params
392              
393             my $params = $msg->body_params;
394              
395             C parameters extracted from C or C message body, usually
396             a L object. Note that this method caches all data, so it should not be called before the entire
397             message body has been received. Parts of the message body need to be loaded into memory to parse C parameters, so
398             you have to make sure it is not excessively large. There's a 16MiB limit for requests and a 2GiB limit for responses by
399             default.
400              
401             # Get POST parameter names and values
402             my $hash = $msg->body_params->to_hash;
403              
404             =head2 body_size
405              
406             my $size = $msg->body_size;
407              
408             Content size in bytes.
409              
410             =head2 build_body
411              
412             my $bytes = $msg->build_body;
413              
414             Render whole body with L.
415              
416             =head2 build_headers
417              
418             my $bytes = $msg->build_headers;
419              
420             Render all headers with L.
421              
422             =head2 build_start_line
423              
424             my $bytes = $msg->build_start_line;
425              
426             Render start-line with L.
427              
428             =head2 cookie
429              
430             my $cookie = $msg->cookie('foo');
431              
432             Access message cookies, usually L or L objects. If there are multiple
433             cookies sharing the same name, and you want to access more than just the last one, you can use L. Note
434             that this method caches all data, so it should not be called before all headers have been received.
435              
436             # Get cookie value
437             say $msg->cookie('foo')->value;
438              
439             =head2 cookies
440              
441             my $cookies = $msg->cookies;
442              
443             Access message cookies. Meant to be overloaded in a subclass.
444              
445             =head2 dom
446              
447             my $dom = $msg->dom;
448             my $collection = $msg->dom('a[href]');
449              
450             Retrieve message body from L and turn it into a L object, an optional selector can be used to call
451             the method L on it right away, which then returns a L object. Note that this method
452             caches all data, so it should not be called before the entire message body has been received. The whole message body
453             needs to be loaded into memory to parse it, so you have to make sure it is not excessively large. There's a 16MiB limit
454             for requests and a 2GiB limit for responses by default.
455              
456             # Perform "find" right away
457             say $msg->dom('h1, h2, h3')->map('text')->join("\n");
458              
459             # Use everything else Mojo::DOM has to offer
460             say $msg->dom->at('title')->text;
461             say $msg->dom->at('body')->children->map('tag')->uniq->join("\n");
462              
463             =head2 error
464              
465             my $err = $msg->error;
466             $msg = $msg->error({message => 'Parser error'});
467              
468             Get or set message error, an C return value indicates that there is no error.
469              
470             # Connection or parser error
471             $msg->error({message => 'Connection refused'});
472              
473             # 4xx/5xx response
474             $msg->error({message => 'Internal Server Error', code => 500});
475              
476             =head2 every_cookie
477              
478             my $cookies = $msg->every_cookie('foo');
479              
480             Similar to L, but returns all message cookies sharing the same name as an array reference.
481              
482             # Get first cookie value
483             say $msg->every_cookie('foo')->[0]->value;
484              
485             =head2 every_upload
486              
487             my $uploads = $msg->every_upload('foo');
488              
489             Similar to L, but returns all file uploads sharing the same name as an array reference.
490              
491             # Get content of first uploaded file
492             say $msg->every_upload('foo')->[0]->asset->slurp;
493              
494             =head2 extract_start_line
495              
496             my $bool = $msg->extract_start_line(\$str);
497              
498             Extract start-line from string. Meant to be overloaded in a subclass.
499              
500             =head2 finish
501              
502             $msg = $msg->finish;
503              
504             Finish message parser/generator.
505              
506             =head2 fix_headers
507              
508             $msg = $msg->fix_headers;
509              
510             Make sure message has all required headers.
511              
512             =head2 get_body_chunk
513              
514             my $bytes = $msg->get_body_chunk($offset);
515              
516             Get a chunk of body data starting from a specific position. Note that it might not be possible to get the same chunk
517             twice if content was generated dynamically.
518              
519             =head2 get_header_chunk
520              
521             my $bytes = $msg->get_header_chunk($offset);
522              
523             Get a chunk of header data, starting from a specific position. Note that this method finalizes the message.
524              
525             =head2 get_start_line_chunk
526              
527             my $bytes = $msg->get_start_line_chunk($offset);
528              
529             Get a chunk of start-line data starting from a specific position. Meant to be overloaded in a subclass.
530              
531             =head2 header_size
532              
533             my $size = $msg->header_size;
534              
535             Size of headers in bytes. Note that this method finalizes the message.
536              
537             =head2 headers
538              
539             my $headers = $msg->headers;
540              
541             Message headers, usually a L object.
542              
543             # Longer version
544             my $headers = $msg->content->headers;
545              
546             =head2 is_finished
547              
548             my $bool = $msg->is_finished;
549              
550             Check if message parser/generator is finished.
551              
552             =head2 is_limit_exceeded
553              
554             my $bool = $msg->is_limit_exceeded;
555              
556             Check if message has exceeded L, L, L or
557             L.
558              
559             =head2 json
560              
561             my $value = $msg->json;
562             my $value = $msg->json('/foo/bar');
563              
564             Decode JSON message body directly using L if possible, an C return value indicates a bare C or
565             that decoding failed. An optional JSON Pointer can be used to extract a specific value with L.
566             Note that this method caches all data, so it should not be called before the entire message body has been received. The
567             whole message body needs to be loaded into memory to parse it, so you have to make sure it is not excessively large.
568             There's a 16MiB limit for requests and a 2GiB limit for responses by default.
569              
570             # Extract JSON values
571             say $msg->json->{foo}{bar}[23];
572             say $msg->json('/foo/bar/23');
573              
574             =head2 parse
575              
576             $msg = $msg->parse('HTTP/1.1 200 OK...');
577              
578             Parse message chunk.
579              
580             =head2 save_to
581              
582             $msg = $msg->save_to('/some/path/index.html');
583              
584             Save message body to a file.
585              
586             =head2 start_line_size
587              
588             my $size = $msg->start_line_size;
589              
590             Size of the start-line in bytes. Meant to be overloaded in a subclass.
591              
592             =head2 text
593              
594             my $str = $msg->text;
595              
596             Retrieve L and try to decode it with L or L.
597              
598             =head2 to_string
599              
600             my $str = $msg->to_string;
601              
602             Render whole message. Note that this method finalizes the message, and that it might not be possible to render the same
603             message twice if content was generated dynamically.
604              
605             =head2 upload
606              
607             my $upload = $msg->upload('foo');
608              
609             Access C file uploads, usually L objects. If there are multiple uploads sharing the
610             same name, and you want to access more than just the last one, you can use L. Note that this method
611             caches all data, so it should not be called before the entire message body has been received.
612              
613             # Get content of uploaded file
614             say $msg->upload('foo')->asset->slurp;
615              
616             =head2 uploads
617              
618             my $uploads = $msg->uploads;
619              
620             All C file uploads, usually L objects.
621              
622             # Names of all uploads
623             say $_->name for @{$msg->uploads};
624              
625             =head1 SEE ALSO
626              
627             L, L, L.
628              
629             =cut