File Coverage

blib/lib/Mojo/Message.pm
Criterion Covered Total %
statement 171 171 100.0
branch 81 88 92.0
condition 45 56 80.3
subroutine 44 44 100.0
pod 30 30 100.0
total 371 389 95.3


line stmt bran cond sub pod time code
1             package Mojo::Message;
2 60     60   462 use Mojo::Base 'Mojo::EventEmitter';
  60         214  
  60         730  
3              
4 60     60   452 use Carp qw(croak);
  60         224  
  60         3243  
5 60     60   26942 use Mojo::Asset::Memory;
  60         771  
  60         571  
6 60     60   27481 use Mojo::Content::Single;
  60         218  
  60         679  
7 60     60   34469 use Mojo::DOM;
  60         215  
  60         2392  
8 60     60   3059 use Mojo::JSON qw(j);
  60         201  
  60         3653  
9 60     60   17545 use Mojo::JSON::Pointer;
  60         257  
  60         616  
10 60     60   9210 use Mojo::Parameters;
  60         179  
  60         1107  
11 60     60   26366 use Mojo::Upload;
  60         172  
  60         496  
12 60     60   444 use Mojo::Util qw(decode);
  60         187  
  60         197243  
13              
14             has content => sub { Mojo::Content::Single->new };
15             has default_charset => 'UTF-8';
16             has max_line_size => sub { $ENV{MOJO_MAX_LINE_SIZE} || 8192 };
17             has max_message_size => sub { $ENV{MOJO_MAX_MESSAGE_SIZE} // 16777216 };
18             has version => '1.1';
19              
20             sub body {
21 1819     1819 1 11217 my $self = shift;
22              
23             # Get
24 1819         4664 my $content = $self->content;
25 1819 100       6563 return $content->is_multipart ? '' : $content->asset->slurp unless @_;
    100          
26              
27             # Set (multipart content needs to be downgraded)
28 845 100       2974 $content = $self->content(Mojo::Content::Single->new)->content if $content->is_multipart;
29 845         4051 $content->asset(Mojo::Asset::Memory->new->add_chunk(@_));
30              
31 845         1870 return $self;
32             }
33              
34             sub body_params {
35 326     326 1 634 my $self = shift;
36              
37 326 100       964 return $self->{body_params} if $self->{body_params};
38 318         1245 my $params = $self->{body_params} = Mojo::Parameters->new;
39 318   66     1074 $params->charset($self->content->charset || $self->default_charset);
40              
41             # "application/x-www-form-urlencoded"
42 318   100     1247 my $type = $self->headers->content_type // '';
43 318 100       1607 if ($type =~ m!application/x-www-form-urlencoded!i) {
    100          
44 42         177 $params->parse($self->content->asset->slurp);
45             }
46              
47             # "multipart/form-data"
48             elsif ($type =~ m!multipart/form-data!i) {
49 30         78 $params->append(@$_[0, 1]) for @{$self->_parse_formdata};
  30         107  
50             }
51              
52 318         1154 return $params;
53             }
54              
55 1893     1893 1 4134 sub body_size { shift->content->body_size }
56              
57 45     45 1 117 sub build_body { shift->_build('get_body_chunk') }
58 43     43 1 106 sub build_headers { shift->_build('get_header_chunk') }
59 43     43 1 123 sub build_start_line { shift->_build('get_start_line_chunk') }
60              
61 122     122 1 408 sub cookie { shift->_cache('cookies', 0, @_) }
62              
63 1     1 1 2749 sub cookies { croak 'Method "cookies" not implemented by subclass' }
64              
65             sub dom {
66 133     133 1 1539 my $self = shift;
67 133 50       341 return undef if $self->content->is_multipart;
68 133   66     600 my $dom = $self->{dom} ||= Mojo::DOM->new($self->text);
69 133 100       758 return @_ ? $dom->find(@_) : $dom;
70             }
71              
72             sub error {
73 8461     8461 1 13301 my $self = shift;
74 8461 100       40483 return $self->{error} unless @_;
75 170         639 $self->{error} = shift;
76 170         474 return $self->finish;
77             }
78              
79 249     249 1 797 sub every_cookie { shift->_cache('cookies', 1, @_) }
80 317     317 1 1076 sub every_upload { shift->_cache('uploads', 1, @_) }
81              
82 1     1 1 786 sub extract_start_line { croak 'Method "extract_start_line" not implemented by subclass' }
83              
84             sub finish {
85 5099     5099 1 7827 my $self = shift;
86 5099         9590 $self->{state} = 'finished';
87 5099 100       18714 return $self->{finished}++ ? $self : $self->emit('finish');
88             }
89              
90             sub fix_headers {
91 1955     1955 1 3083 my $self = shift;
92 1955 50       7057 return $self if $self->{fix}++;
93              
94             # Content-Length or Connection (unless chunked transfer encoding is used)
95 1955         5028 my $content = $self->content;
96 1955         5613 my $headers = $content->headers;
97 1955 100 100     5999 if ($content->is_multipart) { $headers->remove('Content-Length') }
  22 100       121  
98 46         144 elsif ($content->is_chunked || $headers->content_length) { return $self }
99 1909 100       5730 if ($content->is_dynamic) { $headers->connection('close') }
  19         63  
100 1890         5288 else { $headers->content_length($self->body_size) }
101              
102 1909         4767 return $self;
103             }
104              
105             sub get_body_chunk {
106 3019     3019 1 5459 my ($self, $offset) = @_;
107              
108 3019         8912 $self->emit('progress', 'body', $offset);
109 3019         6997 my $chunk = $self->content->get_body_chunk($offset);
110 3018 100 100     13499 return $chunk if !defined $chunk || length $chunk;
111 1867         6158 $self->finish;
112              
113 1867         4689 return $chunk;
114             }
115              
116             sub get_header_chunk {
117 1996     1996 1 3488 my ($self, $offset) = @_;
118 1996         7290 $self->emit('progress', 'headers', $offset);
119 1996         5324 return $self->fix_headers->content->get_header_chunk($offset);
120             }
121              
122 1     1 1 849 sub get_start_line_chunk { croak 'Method "get_start_line_chunk" not implemented by subclass' }
123              
124 1892     1892 1 5682 sub header_size { shift->fix_headers->content->header_size }
125              
126 21832     21832 1 50157 sub headers { shift->content->headers }
127              
128 3744   100 3744 1 22051 sub is_finished { (shift->{state} // '') eq 'finished' }
129              
130 22     22 1 147 sub is_limit_exceeded { !!shift->{limit} }
131              
132             sub json {
133 74     74 1 199 my ($self, $pointer) = @_;
134 74 50       206 return undef if $self->content->is_multipart;
135 74   100     321 my $data = $self->{json} //= j($self->body);
136 74 100       426 return $pointer ? Mojo::JSON::Pointer->new($data)->get($pointer) : $data;
137             }
138              
139             sub parse {
140 2692     2692 1 6217 my ($self, $chunk) = @_;
141              
142 2692 100       6348 return $self if $self->{error};
143 2690         6439 $self->{raw_size} += length $chunk;
144 2690         11052 $self->{buffer} .= $chunk;
145              
146             # Start-line
147 2690 100       6303 unless ($self->{state}) {
148              
149             # Check start-line size
150 2074         5582 my $len = index $self->{buffer}, "\x0a";
151 2074 100       4482 $len = length $self->{buffer} if $len < 0;
152 2074 100       5839 return $self->_limit('Maximum start-line size exceeded') if $len > $self->max_line_size;
153              
154 2071 100       8132 $self->{state} = 'content' if $self->extract_start_line(\$self->{buffer});
155             }
156              
157             # Content
158 2687   100     7842 my $state = $self->{state} // '';
159 2687 100 100     10907 $self->content($self->content->parse(delete $self->{buffer})) if $state eq 'content' || $state eq 'finished';
160              
161             # Check message size
162 2687         8439 my $max = $self->max_message_size;
163 2687 100 100     10176 return $self->_limit('Maximum message size exceeded') if $max && $max < $self->{raw_size};
164              
165             # Check header size
166 2681 100       6063 return $self->_limit('Maximum header size exceeded') if $self->headers->is_limit_exceeded;
167              
168             # Check buffer size
169 2676 100       6423 return $self->_limit('Maximum buffer size exceeded') if $self->content->is_limit_exceeded;
170              
171 2673 100       7848 return $self->emit('progress')->content->is_finished ? $self->finish : $self;
172             }
173              
174             sub save_to {
175 2     2 1 23 my ($self, $path) = @_;
176 2         7 my $content = $self->content;
177 2 100       20 croak 'Multipart content cannot be saved to files' if $content->is_multipart;
178 1         5 $content->asset->move_to($path);
179 1         8 return $self;
180             }
181              
182 1     1 1 822 sub start_line_size { croak 'Method "start_line_size" not implemented by subclass' }
183              
184             sub text {
185 679     679 1 1384 my $self = shift;
186 679         1916 my $body = $self->body;
187 679   66     1843 my $charset = $self->content->charset || $self->default_charset;
188 679 50 66     3614 return $charset ? decode($charset, $body) // $body : $body;
189             }
190              
191             sub to_string {
192 41     41 1 93 my $self = shift;
193 41         121 return $self->build_start_line . $self->build_headers . $self->build_body;
194             }
195              
196 32     32 1 148 sub upload { shift->_cache('uploads', 0, @_) }
197              
198             sub uploads {
199 268     268 1 497 my $self = shift;
200              
201 268         485 my @uploads;
202 268         436 for my $data (@{$self->_parse_formdata(1)}) {
  268         819  
203 34         157 my $upload = Mojo::Upload->new(
204             name => $data->[0],
205             filename => $data->[2],
206             asset => $data->[1]->asset,
207             headers => $data->[1]->headers
208             );
209 34         120 push @uploads, $upload;
210             }
211              
212 268         1070 return \@uploads;
213             }
214              
215             sub _build {
216 131     131   248 my ($self, $method) = @_;
217              
218 131         228 my ($buffer, $offset) = ('', 0);
219 131         183 while (1) {
220              
221             # No chunk yet, try again
222 278 100       755 next unless defined(my $chunk = $self->$method($offset));
223              
224             # End of part
225 277 100       679 last unless my $len = length $chunk;
226              
227 146         242 $offset += $len;
228 146         309 $buffer .= $chunk;
229             }
230              
231 131         707 return $buffer;
232             }
233              
234             sub _cache {
235 720     720   1787 my ($self, $method, $all, $name) = @_;
236              
237             # Cache objects by name
238 720 100       1989 unless ($self->{$method}) {
239 345         1044 $self->{$method} = {};
240 345         669 push @{$self->{$method}{$_->name}}, $_ for @{$self->$method};
  345         1464  
  183         590  
241             }
242              
243 720   100     3393 my $objects = $self->{$method}{$name} // [];
244 720 100       3455 return $all ? $objects : $objects->[-1];
245             }
246              
247 17 50   17   138 sub _limit { ++$_[0]{limit} and return $_[0]->error({message => $_[1]}) }
248              
249             sub _parse_formdata {
250 298     298   678 my ($self, $upload) = @_;
251              
252 298         430 my @formdata;
253 298         801 my $content = $self->content;
254 298 100       1055 return \@formdata unless $content->is_multipart;
255 61   66     225 my $charset = $content->charset || $self->default_charset;
256              
257             # Check all parts recursively
258 61         190 my @parts = ($content);
259 61         185 while (my $part = shift @parts) {
260              
261 212 100       544 if ($part->is_multipart) {
262 61         100 unshift @parts, @{$part->parts};
  61         385  
263 61         183 next;
264             }
265              
266 151 50       369 next unless my $disposition = $part->headers->content_disposition;
267 151         731 my ($filename) = $disposition =~ /[; ]filename="((?:\\"|[^"])*)"/;
268 151 100 100     906 next if $upload && !defined $filename || !$upload && defined $filename;
      100        
      100        
269 89         531 my ($name) = $disposition =~ /[; ]name="((?:\\"|[^;"])*)"/;
270 89 100       233 next if !defined $name;
271 88 100       251 $part = $part->asset->slurp unless $upload;
272              
273 88 50       229 if ($charset) {
274 88 100 33     354 $name = decode($charset, $name) // $name if $name;
275 88 100 33     268 $filename = decode($charset, $filename) // $filename if $filename;
276 88 100 33     279 $part = decode($charset, $part) // $part unless $upload;
277             }
278              
279 88         443 push @formdata, [$name, $part, $filename];
280             }
281              
282 61         384 return \@formdata;
283             }
284              
285             1;
286              
287             =encoding utf8
288              
289             =head1 NAME
290              
291             Mojo::Message - HTTP message base class
292              
293             =head1 SYNOPSIS
294              
295             package Mojo::Message::MyMessage;
296             use Mojo::Base 'Mojo::Message';
297              
298             sub cookies {...}
299             sub extract_start_line {...}
300             sub get_start_line_chunk {...}
301             sub start_line_size {...}
302              
303             =head1 DESCRIPTION
304              
305             L is an abstract base class for HTTP message containers, based on L
306             7230|https://tools.ietf.org/html/rfc7230>, L and L
307             2388|https://tools.ietf.org/html/rfc2388>, like L and L.
308              
309             =head1 EVENTS
310              
311             L inherits all events from L and can emit the following new ones.
312              
313             =head2 finish
314              
315             $msg->on(finish => sub ($msg) {...});
316              
317             Emitted after message building or parsing is finished.
318              
319             my $before = time;
320             $msg->on(finish => sub ($msg) { $msg->headers->header('X-Parser-Time' => time - $before) });
321              
322             =head2 progress
323              
324             $msg->on(progress => sub ($msg) {...});
325              
326             Emitted when message building or parsing makes progress.
327              
328             # Building
329             $msg->on(progress => sub ($msg, $state, $offset) { say qq{Building "$state" at offset $offset} });
330              
331             # Parsing
332             $msg->on(progress => sub ($msg) {
333             return unless my $len = $msg->headers->content_length;
334             my $size = $msg->content->progress;
335             say 'Progress: ', $size == $len ? 100 : int($size / ($len / 100)), '%';
336             });
337              
338             =head1 ATTRIBUTES
339              
340             L implements the following attributes.
341              
342             =head2 content
343              
344             my $msg = $msg->content;
345             $msg = $msg->content(Mojo::Content::Single->new);
346              
347             Message content, defaults to a L object.
348              
349             =head2 default_charset
350              
351             my $charset = $msg->default_charset;
352             $msg = $msg->default_charset('UTF-8');
353              
354             Default charset used by L and to extract data from C or
355             C message body, defaults to C.
356              
357             =head2 max_line_size
358              
359             my $size = $msg->max_line_size;
360             $msg = $msg->max_line_size(1024);
361              
362             Maximum start-line size in bytes, defaults to the value of the C environment variable or C<8192>
363             (8KiB).
364              
365             =head2 max_message_size
366              
367             my $size = $msg->max_message_size;
368             $msg = $msg->max_message_size(1024);
369              
370             Maximum message size in bytes, defaults to the value of the C environment variable or
371             C<16777216> (16MiB). Setting the value to C<0> will allow messages of indefinite size.
372              
373             =head2 version
374              
375             my $version = $msg->version;
376             $msg = $msg->version('1.1');
377              
378             HTTP version of message, defaults to C<1.1>.
379              
380             =head1 METHODS
381              
382             L inherits all methods from L and implements the following new ones.
383              
384             =head2 body
385              
386             my $bytes = $msg->body;
387             $msg = $msg->body('Hello!');
388              
389             Slurp or replace L.
390              
391             =head2 body_params
392              
393             my $params = $msg->body_params;
394              
395             C parameters extracted from C or C message body, usually
396             a L object. Note that this method caches all data, so it should not be called before the entire
397             message body has been received. Parts of the message body need to be loaded into memory to parse C parameters, so
398             you have to make sure it is not excessively large. There's a 16MiB limit for requests and a 2GiB limit for responses by
399             default.
400              
401             # Get POST parameter names and values
402             my $hash = $msg->body_params->to_hash;
403              
404             =head2 body_size
405              
406             my $size = $msg->body_size;
407              
408             Content size in bytes.
409              
410             =head2 build_body
411              
412             my $bytes = $msg->build_body;
413              
414             Render whole body with L.
415              
416             =head2 build_headers
417              
418             my $bytes = $msg->build_headers;
419              
420             Render all headers with L.
421              
422             =head2 build_start_line
423              
424             my $bytes = $msg->build_start_line;
425              
426             Render start-line with L.
427              
428             =head2 cookie
429              
430             my $cookie = $msg->cookie('foo');
431              
432             Access message cookies, usually L or L objects. If there are multiple
433             cookies sharing the same name, and you want to access more than just the last one, you can use L. Note
434             that this method caches all data, so it should not be called before all headers have been received.
435              
436             # Get cookie value
437             say $msg->cookie('foo')->value;
438              
439             =head2 cookies
440              
441             my $cookies = $msg->cookies;
442              
443             Access message cookies. Meant to be overloaded in a subclass.
444              
445             =head2 dom
446              
447             my $dom = $msg->dom;
448             my $collection = $msg->dom('a[href]');
449              
450             Retrieve message body from L and turn it into a L object, an optional selector can be used to call
451             the method L on it right away, which then returns a L object. Note that this method
452             caches all data, so it should not be called before the entire message body has been received. The whole message body
453             needs to be loaded into memory to parse it, so you have to make sure it is not excessively large. There's a 16MiB limit
454             for requests and a 2GiB limit for responses by default.
455              
456             # Perform "find" right away
457             say $msg->dom('h1, h2, h3')->map('text')->join("\n");
458              
459             # Use everything else Mojo::DOM has to offer
460             say $msg->dom->at('title')->text;
461             say $msg->dom->at('body')->children->map('tag')->uniq->join("\n");
462              
463             =head2 error
464              
465             my $err = $msg->error;
466             $msg = $msg->error({message => 'Parser error'});
467              
468             Get or set message error, an C return value indicates that there is no error.
469              
470             # Connection or parser error
471             $msg->error({message => 'Connection refused'});
472              
473             # 4xx/5xx response
474             $msg->error({message => 'Internal Server Error', code => 500});
475              
476             =head2 every_cookie
477              
478             my $cookies = $msg->every_cookie('foo');
479              
480             Similar to L, but returns all message cookies sharing the same name as an array reference.
481              
482             # Get first cookie value
483             say $msg->every_cookie('foo')->[0]->value;
484              
485             =head2 every_upload
486              
487             my $uploads = $msg->every_upload('foo');
488              
489             Similar to L, but returns all file uploads sharing the same name as an array reference.
490              
491             # Get content of first uploaded file
492             say $msg->every_upload('foo')->[0]->asset->slurp;
493              
494             =head2 extract_start_line
495              
496             my $bool = $msg->extract_start_line(\$str);
497              
498             Extract start-line from string. Meant to be overloaded in a subclass.
499              
500             =head2 finish
501              
502             $msg = $msg->finish;
503              
504             Finish message parser/generator.
505              
506             =head2 fix_headers
507              
508             $msg = $msg->fix_headers;
509              
510             Make sure message has all required headers.
511              
512             =head2 get_body_chunk
513              
514             my $bytes = $msg->get_body_chunk($offset);
515              
516             Get a chunk of body data starting from a specific position. Note that it might not be possible to get the same chunk
517             twice if content was generated dynamically.
518              
519             =head2 get_header_chunk
520              
521             my $bytes = $msg->get_header_chunk($offset);
522              
523             Get a chunk of header data, starting from a specific position. Note that this method finalizes the message.
524              
525             =head2 get_start_line_chunk
526              
527             my $bytes = $msg->get_start_line_chunk($offset);
528              
529             Get a chunk of start-line data starting from a specific position. Meant to be overloaded in a subclass.
530              
531             =head2 header_size
532              
533             my $size = $msg->header_size;
534              
535             Size of headers in bytes. Note that this method finalizes the message.
536              
537             =head2 headers
538              
539             my $headers = $msg->headers;
540              
541             Message headers, usually a L object.
542              
543             # Longer version
544             my $headers = $msg->content->headers;
545              
546             =head2 is_finished
547              
548             my $bool = $msg->is_finished;
549              
550             Check if message parser/generator is finished.
551              
552             =head2 is_limit_exceeded
553              
554             my $bool = $msg->is_limit_exceeded;
555              
556             Check if message has exceeded L, L, L or
557             L.
558              
559             =head2 json
560              
561             my $value = $msg->json;
562             my $value = $msg->json('/foo/bar');
563              
564             Decode JSON message body directly using L if possible, an C return value indicates a bare C or
565             that decoding failed. An optional JSON Pointer can be used to extract a specific value with L.
566             Note that this method caches all data, so it should not be called before the entire message body has been received. The
567             whole message body needs to be loaded into memory to parse it, so you have to make sure it is not excessively large.
568             There's a 16MiB limit for requests and a 2GiB limit for responses by default.
569              
570             # Extract JSON values
571             say $msg->json->{foo}{bar}[23];
572             say $msg->json('/foo/bar/23');
573              
574             =head2 parse
575              
576             $msg = $msg->parse('HTTP/1.1 200 OK...');
577              
578             Parse message chunk.
579              
580             =head2 save_to
581              
582             $msg = $msg->save_to('/some/path/index.html');
583              
584             Save message body to a file.
585              
586             =head2 start_line_size
587              
588             my $size = $msg->start_line_size;
589              
590             Size of the start-line in bytes. Meant to be overloaded in a subclass.
591              
592             =head2 text
593              
594             my $str = $msg->text;
595              
596             Retrieve L and try to decode it with L or L.
597              
598             =head2 to_string
599              
600             my $str = $msg->to_string;
601              
602             Render whole message. Note that this method finalizes the message, and that it might not be possible to render the same
603             message twice if content was generated dynamically.
604              
605             =head2 upload
606              
607             my $upload = $msg->upload('foo');
608              
609             Access C file uploads, usually L objects. If there are multiple uploads sharing the
610             same name, and you want to access more than just the last one, you can use L. Note that this method
611             caches all data, so it should not be called before the entire message body has been received.
612              
613             # Get content of uploaded file
614             say $msg->upload('foo')->asset->slurp;
615              
616             =head2 uploads
617              
618             my $uploads = $msg->uploads;
619              
620             All C file uploads, usually L objects.
621              
622             # Names of all uploads
623             say $_->name for @{$msg->uploads};
624              
625             =head1 SEE ALSO
626              
627             L, L, L.
628              
629             =cut