File Coverage

blib/lib/Template/Pure/ParseUtils.pm
Criterion Covered Total %
statement 98 98 100.0
branch 28 32 87.5
condition 13 21 61.9
subroutine 10 10 100.0
pod 5 5 100.0
total 154 166 92.7


line stmt bran cond sub pod time code
1             package Template::Pure::ParseUtils;
2            
3 28     28   185899 use strict;
  28         33  
  28         684  
4 28     28   86 use warnings;
  28         33  
  28         588  
5 28     28   83 use Scalar::Util ();
  28         31  
  28         7497  
6              
7             sub parse_processing_instruction {
8 6     6 1 15 my ($pi) = @_;
9 6         27 my ($target, $body) = ($pi =~m/^\s*([^\s]+)(.+)$/s);
10             my %attrs = map {
11 14         32 my ($key, $val) = split '=', $_;
12 14         26 $key=~s/^\s+//g;
13 14 100       24 if($val=~s/^\\//) {
14 3         38 $val=~s/^['"]|['"]$//g;
15 3         4 my $val2 = \$val;
16 3         6 $key, $val2;
17             } else {
18 11         31 $val=~s/^['"]|['"]$//g;
19 11         22 $key, $val;
20             }
21 6         26 } grep { $_ }
  14         18  
22             split(/['"]\s+/, $body);
23 6         41 return $target => %attrs;
24             }
25              
26             sub parse_itr_spec {
27 11     11 1 21 my ($spec) = @_;
28 11         37 my ($key, $data_spec) = split('<-', $spec);
29 11         27 return $key => +{ parse_data_spec($data_spec) };
30             }
31              
32             {
33             package Template::Pure::Literal;
34             use overload
35 28     28   118 '""' => sub { my $self = shift; return ${$self} };
  28     51   35  
  28         226  
  51         3196  
  51         32  
  51         259  
36             }
37              
38             sub parse_data_template {
39 10     10 1 13 my ($spec) = @_;
40 10         34 $spec=~s/\r|\n//gs; # cleanup newlines.
41              
42 10         25 my $opentag = qr/=\{/;
43 10         19 my $closetag = qr/}/;
44 10         132 my $placeholder = qr{(
45             (?:
46             $opentag (
47             (?:
48             (?> [^={}]+ )
49             |
50             (?2)
51             )*
52             ) $closetag
53             )
54             )}x;
55              
56 10         10 my @parts;
57              
58             # TODO Regexp hack info. Ok so maybe my regexp Foo is not as good as it
59             # could be... The problem I have is that ( [^={]+ ) capture = and { not both
60             # grouped together. I can't seem to get it working right with things like
61             # (?!\=\{)+ that just never seems to pass tests. Since '=' is very common in
62             # HTML tags (like for setting attributes) matching on = is probably not my best
63             # idea. For now there's a hack here to change m/=./ into !\1! and then I revert
64             # it. That obviously sucks and wastes performance as well. I'm leaving it like
65             # this for now but someone with awesome regexp foo I hope can help me out :)
66              
67 10         33 $spec=~s/\=([^{])/\!$1\!/g; #TODO Hack step1
68              
69 10         184 while($spec =~/( [^={]+ ) | $placeholder /gx) {
70 34   66     97 my $part = $1||$2;
71              
72 34         33 $part=~s/\!(.)+\!/\=$1/g; #TODO Hack step2
73              
74 34 100       148 if(my ($is_data_spec) = ($part=~/^$opentag(.+?)$closetag$/)) {
75 17         25 push @parts, +{ parse_data_spec($is_data_spec) };
76             } else {
77 17         99 push @parts, bless \$part, 'Template::Pure::Literal';
78             }
79             }
80 10         80 return @parts;
81             }
82              
83             sub parse_data_spec {
84 156     156 1 163 my $spec = shift;
85              
86             # Is this a literal?
87 156 100       421 if(my ($value) = ($spec =~m/^[\'\"](.+)[\'\"]$/)) {
88             return (
89 4         30 literal => $value,
90             absolute => '',
91             path => [],
92             filters => [],
93             );
94             }
95              
96 152         337 $spec=~s/\r|\n//gs; # cleanup newlines.
97 152         174 my $absolute = ($spec=~s[^\/][]);
98              
99 152         125 my @parts;
100 152         1451 push @parts, $1 while $spec =~ /
101             ((?:
102             [^()\|]+ |
103             ( \(
104             (?: [^()]+ | (?2) )*
105             \) )
106             )*)
107             (?: \|\s* | $)
108             /xg;
109              
110             my ($path_proto, @filters_proto) =
111 328         488 grep { length($_) > 0 }
112 152         195 map { $_=~s/^\s+|\s+$//g; $_ } @parts;
  328         524  
  328         403  
113              
114             #Special case: If you have a part that is " |filter" we need to
115             #munge a bit.
116 152 100       296 if($parts[0] eq '') {
117 1         2 push @filters_proto, $path_proto;
118 1         1 $path_proto = '';
119             }
120              
121 152         451 my @path_proto = split(/\.|\//, $path_proto);
122              
123             my @path = map {
124             # Not ideal regexp here but safe enough I think since ':' is never in a method...
125             # Just would croak on a hash key that is meant to mean this. I'll doc that as
126             # 'don't do that...
127 152         166 my $maybe = ($_=~s/(maybe:)//);
  228         226  
128 228         197 my $optional = ($_=~s/(optional:)//);
129 228         628 +{ key => $_, maybe => $maybe, optional => $optional };
130             } @path_proto;
131              
132             my @filters = map {
133 152         183 my ($filter, $arg_proto) = ($_=~m/^(.*?)(?:\(\s*(.+?)?\s*\))?$/); # Borrowed from Catalyst::Controller
  24         116  
134 24         25 my @arg_parts;
135              
136 24 100       44 if($arg_proto) {
137 12         118 push @arg_parts, $1 while $arg_proto =~ /
138             ((?:
139             [^(),]+ |
140             ( \(
141             (?: [^()]+ | (?2) )*
142             \) )
143             )*)
144             (?: ,\s* | $)
145             /xg;
146             }
147              
148             my @args = map {
149 19         32 my ($data_spec) = ($_=~/^\=\{(.+?)\}$/);
150 19 100       527 $data_spec ? +{ parse_data_spec($data_spec) } : eval $_;
151             } grep {
152 24         44 length($_) > 0;
  31         36  
153             } @arg_parts;
154              
155 24         62 +[ $filter, @args ];
156             } @filters_proto;
157              
158             return (
159 152         1190 absolute => $absolute,
160             path => \@path,
161             filters => \@filters,
162             );
163             }
164              
165             sub parse_match_spec {
166 195     195 1 259 my $spec = shift;
167              
168             # Look for all the possibilities, try to leave $spec in a useful state
169 195         324 my $maybe_target_node = ($spec=~s/^\^//);
170 195         202 my $maybe_filter = ($spec=~s/\|$//);
171 195         230 my $maybe_prepend = ($spec=~s/^(\+)//);
172 195         235 my $maybe_append = ($spec=~s/(\+)$//);
173 195         172 my $maybe_absolute = ($spec=~s[^\/][]);
174              
175 195         375 my ($css, $maybe_attr) = split('@', $spec);
176 195 100 100     431 $css = '.' if $maybe_attr && !$css; # $css unlikely to be 0
177              
178             # All the error conditions I can think of.
179 195 50       292 die "You need a CSS style match: '$spec'"
180             unless $css;
181              
182 195 50 33     286 die "Can't add a filter when appending or prepending: '$spec'"
      66        
183             if $maybe_filter && ($maybe_append || $maybe_prepend);
184              
185 195 50 33     265 die "Can't set a target when filtering: '$spec'"
      66        
186             if $maybe_filter && ($maybe_target_node || $maybe_attr);
187              
188 195 50 66     373 die "Can't set a target attribute and target node: '$spec'"
189             if $maybe_target_node && $maybe_attr;
190              
191 195         184 my $target = 'content';
192 195 100       377 if($maybe_target_node) {
    100          
193 34         36 $target = 'node';
194             } elsif($maybe_attr) {
195 21         26 $target = \$maybe_attr;
196             }
197              
198 195         148 my $mode = 'replace';
199 195 100       419 if($maybe_append) {
    100          
    100          
200 26         31 $mode = 'append';
201             } elsif($maybe_prepend) {
202 11         9 $mode = 'prepend';
203             } elsif($maybe_filter) {
204 2         2 $mode = 'filter';
205 2         2 $target = '';
206             }
207              
208             return (
209 195         1598 absolute => $maybe_absolute,
210             css => $css,
211             target => $target,
212             mode => $mode,
213             );
214             }
215              
216             1;
217              
218             =head1 NAME
219              
220             Template::Pure::ParseUtils - Utility Functions
221              
222             =head1 SYNOPSIS
223              
224             For internal use
225              
226             =head1 DESCRIPTION
227              
228             Contains utility functions for L<Template::Pure>
229              
230             =head1 FUNCTIONS
231              
232             This package contains the following functions:
233              
234             =head2 parse_processing_instruction ($pi)
235              
236             Given a processing instruction, parse it into a $target and %attrs such that:
237              
238             <?pure-include id='ddd'
239             pure:mode='append|prepend|replace'
240             pure:target='node|content'
241             pure:src='include' ?>
242              
243             Is parsed into:
244              
245             "pure-include" => {
246             id => "ddd",
247             "pure:mode" => "append|prepend|replace",
248             "pure:src" => "include",
249             "pure:target" => "node|content"
250             }
251              
252             and returned.
253              
254             =head2 parse_itr_spec ($spec)
255              
256             Used to parse a string when we are specifying an iterator. For example
257              
258             "user<-users"
259              
260             or:
261              
262             "friend<-user.friends"
263              
264             Returns a hashref when the key is the new data label and the value is a reference to the
265             indicated path from the current data context.
266              
267             {
268             user => {
269             absolute => '';
270             filters => [],
271             path => [
272             key => 'users',
273             maybe => '',
274             optional => ''
275             ],
276             },
277             }
278              
279             B<NOTE> you cannot use a filter on an iterator specification.
280              
281             B<NOTE> Indicated data context path must be something that can be coerced into an iterator
282             (an arrayref, a hashref, or an Object that provides the iterator interface).
283              
284             =head2 parse_data_template ($spec)
285              
286             Used to parse a string that is the target action of a match, when the string contains
287             template placeholders, for example:
288              
289             "Hello ={meta.first_name} ={meta.last_name}!"
290              
291             Which is intended to be parsed as containing a string with two placeholders, each pointing
292             to a different path on the current data context.
293              
294             When parsed returns an array, where each element is either a string (for a literal string
295             value) or a hash reference (indicates a patch to a value on the current data context).
296              
297             For example the shown string would parse in this way:
298              
299             (
300             'Hello ',
301             {
302             absolute => '',
303             filters => [],
304             path => [
305             { key => 'meta', optional => undef, maybe => undef },
306             { key => 'first_name', optional => undef, maybe => undef },
307             },
308             ' ',
309             {
310             absolute => '',
311             filters => [],
312             path => [
313             { key => 'meta', optional => undef, maybe => undef },
314             { key => 'first_name', optional => undef, maybe => undef },
315             },
316             '!',
317             );
318              
319             Information inside the placeholder may contain filters and prefixes and other markers:
320              
321             "Year of Birth: ={/maybe:meta.optional:dob | strftime(%Y)}"
322              
323             Would parse as:
324              
325             (
326             'Year of Birth: ',
327             {
328             absolute => '1',
329             filters => [
330             ['strftime', '%Y'],
331             ],
332             path => [
333             { key => 'meta', optional => undef, maybe => 1 },
334             { key => 'dob', optional => 1, maybe => undef },
335             },
336             );
337              
338              
339             =head2 parse_data_spec ($spec)
340              
341             When the action target is a string we need to inspect it to figure out what do do with it.
342             Returns a hash with keys as follows:
343              
344             =over 4
345              
346             =item absolute
347              
348             Boolean. Defaults to False. When true this means the described path should be absolute
349             from the top of the data context. Otherwise the described path is relative to the current
350             point selected in the data context.
351              
352              
353             =item path
354              
355             Example:
356              
357             path => [
358             {
359             key => 'meta',
360             optional => 0,
361             maybe => 0
362             },
363             {
364             key => 'title',
365             optional => 0,
366             maybe => 0
367             }
368             ];
369              
370             An array hashrefs that indicate path parts from the current data context to the value we
371             wish to use. Each hashref contains three keys:
372              
373             =over 4
374              
375             =item key
376              
377             The name that is a 'key' point on the path. Likely to be a key in a hash or a method on an
378             object.
379              
380             =item optional
381              
382             Boolean. Defaults to false. Generally if the key does not match a real path on the current
383             data context, this should return an error. If this value is false, that means instead of
384             throwing an error we return an 'undef'.
385              
386             Value is derived from the prefix 'optional:'. Presence of this prefix sets this to true.
387              
388             B<NOTE> since 'optional:' has special meaning here, this means that if your data context is
389             a hash, you should not have any keys that match 'optional:' for your own purposes... If you
390             really run into this you'll have to write an anonymous subroutine type action.
391              
392             =item maybe
393              
394             Boolean. Defaults to false. Generally if you have several path parts and a midpoint part
395             returns undefined, that mean we throw an exception on later parts (can't find a next path on
396             an undefined value). In some cases (like when you are chaining resultset methods in L<DBIx::Class>)
397             we might not prefer tothrow an error but just return 'undef'. When a path is 'maybe' we
398             wrap in in an object such that the next path is always found (but returns undef).
399              
400             Value is derived from the prefix 'maybe:'. Presence of this prefix sets this to true.
401              
402             B<NOTE> since 'maybe:' has special meaning here, this means that if your data context is
403             a hash, you should not have any keys that match 'maybe:' for your own purposes... If you
404             really run into this you'll have to write an anonymous subroutine type action.
405              
406             =back
407              
408             =item filters
409              
410             An Arrayref of Arrayrefs which are any filters added to the value and their arguments.
411              
412             Example:
413              
414             filters => [
415             [ 'repeat', '3'],
416             [ 'escape_html' ],
417             ];
418              
419             In some cases the arguments for a filter might itself point to a resolved data spec (which itself
420             could include filters... In this case the argument value will be a hashref that is itself the
421             result of a call to L</parse_data_spec>, example:
422              
423             (
424             path => [
425             {
426             key => 'meta', maybe => 0, optional => 0,
427             },
428             {
429             key => 'title', maybe => 0, optional => 0,
430             },
431             ],
432             filters => [
433             ['title_case'],
434             ['truncate',
435             {
436             path => [
437             { key => 'settings', maybe => 0, optional => 0 },
438             { key => 'title_length', maybe => 0, optional => 0 },
439             ],
440             filters => [],
441             },
442             '...',
443             ],
444             ],
445             );
446              
447             You'd have a string to parse like "meta.title | title_case | truncate(={settings.title_length},'...')"
448             which has a filter 'truncate' that has two args, the first being 'whatever the value is at
449             'settings.title_length'' and the second is a literal '...'.
450              
451             You could go wild here with nested values and filters but I recommend if you have such complex
452             needs it would be better to do it in Perl with an anonymous subroutine rather than over cleverness
453             in the string based DSL, which will never be as good as Perl itself. Use it for straight and simple
454             things and for when you want to let non Perl programmers work with the directives.
455              
456             B<NOTE> we run C<eval> on each argument to convert it to a Perl data value, so you could in
457             theory do fancy stuff here like "filter(1+2+3)" and get an arg of '3'. I highly recommend constraint
458             in this. Since its C<eval>'d you should be certain these values are properly cleaned and untainted.
459             For example beware of something like "filter($a)", where $a comes from uncontrolled source such as the
460             input of a HTML Form post, or from external sources like a database or file. This could be considered
461             a possible injection attack location. Because of this we might someday switch this to a non eval
462             parser such as L<Data::Pond> or similar, and if you did crazy expression stuff that don't work with
463             a more restrictive and safe expression parser, its possible your code will break. Buyer beware.
464              
465             B<NOTE> The values for the boolean keys 'maybe' and 'optional' are only specificed to return a
466             Perl value to be evaluated as a boolean. We don't specify the exact value. For example, under Perl
467             both 0 and undef are considered false in boolean context.
468              
469             =back
470              
471             =head2 parse_match_spec ($spec)
472              
473             Given a directive match specification (such as '#head', 'title', 'p.links@href', ...) parse
474             it into a hash that defines how the match is to be performed. Returns a hash with keys are
475             follows.
476              
477             =over 4
478              
479             =item css
480              
481             This is the actual CSS match component ('p', '#id', '.class') or the special match indicator of
482             '.' for the current node.
483              
484             =item target
485              
486             This is the indicator of the replacement target for the match. Can be: 'node', 'content', \'$attribute':
487              
488             =over 4
489              
490             =item content
491              
492             Example Match Specifiction: 'p.headline', 'title', '#id'
493              
494             This is the default value for target. Indicates we will update the matched nodes' content. For example the
495             content of node '<p>content</p>' is 'content'. No special symbols are needed to indicate this target type.
496              
497             =item \$attribute
498              
499             Example Match Specifiction: 'a#homepage@href', 'ul.links@class'
500              
501             When the value of 'target' is a scalar reference, this indicates the update type to be an attribute on the current
502             matched node. The dereferenced scalar is the name of the attribute. If the attribute does not exist in the current
503             node this does not raise an exception, but rather we automatically add it.
504              
505             It is an error to indicate both node and attribute targets.
506              
507             B<NOTE> Should a match specification consist only of an attribute, we presume a 'css' value of '.'
508              
509             =item node
510              
511             Example Match Specifiction: '^p.headline', '^#id'
512              
513             Indicated a target of 'node', which means we will replace the entire matched node. Indicated by a '^' appearing
514             as the first character of the match specification.
515              
516             It is an error to indicate both node and attribute targets.
517              
518             =back
519              
520             =item mode
521              
522             Defines the relationship, if any, between a new value from the data context and any existing information
523             in the template and the match location. One of 'append', 'prepend', or 'replace', with 'replace' being the default.
524              
525             =over 4
526              
527             =item replace
528              
529             Example Match Specifiction: 'title', '#id', 'p.content@class'
530              
531             The default behavior. Needs no special indicators in the match specification. Means the new value
532             completely replaces the match target.
533              
534             =item append
535              
536             Example Match Specifiction: 'title+', '#id+', 'p.content@class+'
537              
538             Match specifications that end with '+' will append to the indicated match (that is we place the
539             new value after the old value, preserving th old value.
540              
541             It is an error to try to set both append and prepend mode on the same target. It is also an error
542             to use append and prepend along with a filter indicator (see below).
543              
544             When appending to a target of attribute where the attribute is 'class', we automatically add a ' ' (space)
545             between the appending value and any existing value. This is a special case since generally a space
546             is required between classes in order for them to work as expected.
547              
548             =item prepend
549              
550             Example Match Specifiction: '+body', '+p.content@class'
551              
552             Match specifications that begin with a '+' (or '^+') indicate we expect to add the data context to the
553             front of the existing value, preserving the existing value.
554              
555             It is an error to try to set both append and prepend mode on the same target. It is also an error
556             to use append and prepend along with a filter indicator (see below).
557              
558             When prepending to a target of attribute where the attribute is 'class', we automatically add a ' ' (space)
559             between the appending value and any existing value. This is a special case since generally a space
560             is required between classes in order for them to work as expected.
561              
562             =item filter
563              
564             Example Match Specification: 'html|', 'body|'
565              
566             Means that we expect to run a filter callback on the matched node. Useful when you want to make global
567             changes across the entire template. Indicated by a '|' or pipe symbol. Cannot be used with append,
568             prepend or any special target indicators (attributes or node).
569              
570             We expect the action the be an anonymous subroutine.
571              
572             =back
573              
574             =back
575              
576             =head1 SEE ALSO
577            
578             L<Template::Pure>.
579              
580             =head1 AUTHOR
581            
582             John Napiorkowski L<email:jjnapiork@cpan.org>
583              
584             But lots of this code was copied from L<Template::Filters> and other prior art on CPAN. Thanks!
585            
586             =head1 COPYRIGHT & LICENSE
587            
588             Please see L<Template::Pure> for copyright and license information.
589              
590             =cut