File Coverage

blib/lib/PPIx/Regexp/Tokenizer.pm

Criterion	Covered	Total	%
statement	494	522	94.6
branch	177	238	74.3
condition	44	64	68.7
subroutine	85	89	95.5
pod	29	29	100.0
total	829	942	88.0

line	stmt	bran	cond	sub	pod	time	code
1							package PPIx::Regexp::Tokenizer;
2
3	9			9		63	use strict;
	9					25
	9					305
4	9			9		44	use warnings;
	9					17
	9					238
5
6	9			9		46	use base qw{ PPIx::Regexp::Support };
	9					14
	9					737
7
8	9			9		56	use Carp qw{ carp croak confess };
	9					20
	9					704
9	9					1291	use PPIx::Regexp::Constant qw{
10							ARRAY_REF
11							CODE_REF
12							HASH_REF
13							LOCATION_LINE
14							LOCATION_CHARACTER
15							LOCATION_COLUMN
16							LOCATION_LOGICAL_LINE
17							MINIMUM_PERL
18							REGEXP_REF
19							TOKEN_LITERAL
20							TOKEN_UNKNOWN
21							@CARP_NOT
22	9			9		66	};
	9					16
23	9			9		4235	use PPIx::Regexp::Token::Assertion ();
	9					25
	9					209
24	9			9		4455	use PPIx::Regexp::Token::Backreference ();
	9					31
	9					291
25	9			9		4152	use PPIx::Regexp::Token::Backtrack ();
	9					24
	9					206
26	9			9		4326	use PPIx::Regexp::Token::CharClass::POSIX ();
	9					23
	9					203
27	9			9		4280	use PPIx::Regexp::Token::CharClass::POSIX::Unknown ();
	9					30
	9					188
28	9			9		4261	use PPIx::Regexp::Token::CharClass::Simple ();
	9					43
	9					220
29	9			9		4353	use PPIx::Regexp::Token::Code ();
	9					45
	9					277
30	9			9		4521	use PPIx::Regexp::Token::Comment ();
	9					22
	9					187
31	9			9		4233	use PPIx::Regexp::Token::Condition ();
	9					38
	9					255
32	9			9		4164	use PPIx::Regexp::Token::Control ();
	9					24
	9					234
33	9			9		4198	use PPIx::Regexp::Token::Delimiter ();
	9					32
	9					269
34	9			9		4075	use PPIx::Regexp::Token::Greediness ();
	9					27
	9					199
35	9			9		3906	use PPIx::Regexp::Token::GroupType::Assertion ();
	9					24
	9					210
36	9			9		4033	use PPIx::Regexp::Token::GroupType::Atomic_Script_Run ();
	9					36
	9					216
37	9			9		3838	use PPIx::Regexp::Token::GroupType::BranchReset ();
	9					25
	9					197
38	9			9		3779	use PPIx::Regexp::Token::GroupType::Code ();
	9					28
	9					205
39	9			9		3779	use PPIx::Regexp::Token::GroupType::Modifier ();
	9					27
	9					232
40	9			9		3988	use PPIx::Regexp::Token::GroupType::NamedCapture ();
	9					23
	9					185
41	9			9		3747	use PPIx::Regexp::Token::GroupType::Script_Run ();
	9					24
	9					198
42	9			9		3905	use PPIx::Regexp::Token::GroupType::Subexpression ();
	9					33
	9					219
43	9			9		3773	use PPIx::Regexp::Token::GroupType::Switch ();
	9					30
	9					192
44	9			9		4094	use PPIx::Regexp::Token::Interpolation ();
	9					24
	9					209
45	9			9		4429	use PPIx::Regexp::Token::Literal ();
	9					35
	9					251
46	9			9		64	use PPIx::Regexp::Token::Modifier ();
	9					27
	9					125
47	9			9		4484	use PPIx::Regexp::Token::Operator ();
	9					26
	9					201
48	9			9		4318	use PPIx::Regexp::Token::Quantifier ();
	9					27
	9					199
49	9			9		64	use PPIx::Regexp::Token::Recursion ();
	9					17
	9					126
50	9			9		44	use PPIx::Regexp::Token::Structure ();
	9					30
	9					132
51	9			9		4124	use PPIx::Regexp::Token::Unknown ();
	9					35
	9					212
52	9			9		4132	use PPIx::Regexp::Token::Whitespace ();
	9					27
	9					239
53	9					496	use PPIx::Regexp::Util qw{
54							is_ppi_regexp_element
55							__instance
56	9			9		60	};
	9					18
57
58	9			9		67	use Scalar::Util qw{ looks_like_number };
	9					21
	9					60895
59
60							our $VERSION = '0.087';
61
62							our $DEFAULT_POSTDEREF;
63							defined $DEFAULT_POSTDEREF
64							or $DEFAULT_POSTDEREF = 1;
65
66							{
67							# Names of classes containing tokenization machinery. There are few
68							# known ordering requirements, since each class recognizes its own,
69							# and I have tried to prevent overlap. Absent such constraints, the
70							# order is in perceived frequency of acceptance, to keep the search
71							# as short as possible. If I were conscientious I would gather
72							# statistics on this.
73							my @classes = ( # TODO make readonly when acceptable way appears
74							'PPIx::Regexp::Token::Literal',
75							'PPIx::Regexp::Token::Interpolation',
76							'PPIx::Regexp::Token::Control', # Note 1
77							'PPIx::Regexp::Token::CharClass::Simple', # Note 2
78							'PPIx::Regexp::Token::Quantifier',
79							'PPIx::Regexp::Token::Greediness',
80							'PPIx::Regexp::Token::CharClass::POSIX', # Note 3
81							'PPIx::Regexp::Token::Structure',
82							'PPIx::Regexp::Token::Assertion',
83							'PPIx::Regexp::Token::Backreference',
84							'PPIx::Regexp::Token::Operator', # Note 4
85							);
86
87							# Note 1: If we are in quote mode ( \Q ... \E ), Control makes a
88							# literal out of anything it sees other than \E. So it
89							# needs to come before almost all other tokenizers. Not
90							# Literal, which already makes literals, and not
91							# Interpolation, which is legal in quote mode, but
92							# everything else.
93
94							# Note 2: CharClass::Simple must come after Literal, because it
95							# relies on Literal to recognize a Unicode named character
96							# ( \N{something} ), so any \N that comes through to it
97							# must be the \N simple character class (which represents
98							# anything but a newline, and was introduced in Perl
99							# 5.11.0.
100
101							# Note 3: CharClass::POSIX has to come before Structure, since both
102							# look for square brackets, and CharClass::POSIX is the
103							# more particular.
104
105							# Note 4: Operator relies on Literal making the characters literal
106							# if they appear in a context where they can not be
107							# operators, and Control making them literals if quoting,
108							# so it must come after both.
109
110							# Return the declared tokenizer classes.
111							sub __tokenizer_classes {
112	538			538		3118	return @classes;
113							}
114
115							}
116
117							{
118							my $errstr;
119
120							sub new {
121	739			739	1	94929	my ( $class, $re, %args ) = @_;
122	739	50				2910	ref $class and $class = ref $class;
123
124	739					1537	$errstr = undef;
125
126							exists $args{default_modifiers}
127							and ARRAY_REF ne ref $args{default_modifiers}
128	739	50	66			2920	and do {
129	0					0	$errstr = 'default_modifiers must be an array reference';
130	0					0	return;
131							};
132
133							my $self = {
134							index_locations => $args{index_locations}, # Index locations
135							capture => undef, # Captures from find_regexp.
136							content => undef, # The string we are tokenizing.
137							cookie => {}, # Cookies
138							cursor_curr => 0, # The current position in the string.
139							cursor_limit => undef, # The end of the portion of the
140							# string being tokenized.
141							cursor_orig => undef, # Position of cursor when tokenizer
142							# called. Used by get_token to prevent
143							# recursion.
144							cursor_modifiers => undef, # Position of modifiers.
145							default_modifiers => $args{default_modifiers} \|\| [],
146							delimiter_finish => undef, # Finishing delimiter of regexp.
147							delimiter_start => undef, # Starting delimiter of regexp.
148							encoding => $args{encoding}, # Character encoding.
149							expect => undef, # Extra classes to expect.
150							expect_next => undef, # Extra classes as of next parse cycle
151							failures => 0, # Number of parse failures.
152							find => undef, # String for find_regexp
153							known => {}, # Known tokenizers, by mode.
154							location => $args{location},
155							match => undef, # Match from find_regexp.
156							mode => 'init', # Initialize
157							modifiers => [{}], # Modifier hash.
158							pending => [], # Tokens made but not returned.
159							prior => TOKEN_UNKNOWN, # Prior significant token.
160							source => $re, # The object we were initialized with.
161							strict => $args{strict}, # like "use re 'strict';".
162							trace => __PACKAGE__->__defined_or(
163	739		100			10562	$args{trace}, $ENV{PPIX_REGEXP_TOKENIZER_TRACE}, 0 ),
164							};
165
166	739	100				3569	if ( __instance( $re, 'PPI::Element' ) ) {
		100
167	11	50				83	is_ppi_regexp_element( $re )
168							or return __set_errstr( ref $re, 'not supported by', $class );
169							# TODO conditionalizstion on PPI class does not really
170							# belong here, but at the moment I have no other idea of
171							# where to put it.
172	11	50				100	$self->{content} = $re->isa( 'PPI::Token::HereDoc' ) ?
173							join( '', $re->content(), "\n", $re->heredoc(),
174							$re->terminator(), "\n" ) :
175							$re->content();
176							} elsif ( ref $re ) {
177	2					9	return __set_errstr( ref $re, 'not supported' );
178							} else {
179	726					2073	$self->{content} = $re;
180							}
181
182	737					1939	bless $self, $class;
183
184	737					3156	$self->{content} = $self->decode( $self->{content} );
185
186	737					2242	$self->{cursor_limit} = length $self->{content};
187
188							$self->{trace}
189	737	50				2213	and warn "\ntokenizing '$self->{content}'\n";
190
191	737					2814	return $self;
192							}
193
194							sub __set_errstr {
195	2			2		8	$errstr = join ' ', @_;
196	2					13	return;
197							}
198
199							sub errstr {
200	2			2	1	5	return $errstr;
201							}
202
203							}
204
205							sub capture {
206	712			712	1	1782	my ( $self ) = @_;
207	712	100				2302	$self->{capture} or return;
208	691	50				1778	defined wantarray or return;
209	691	50				1659	return wantarray ? @{ $self->{capture} } : $self->{capture};
	691					3530
210							}
211
212							sub content {
213	1			1	1	3	my ( $self ) = @_;
214	1					9	return $self->{content};
215							}
216
217							sub cookie {
218	10177			10177	1	18623	my ( $self, $name, @args ) = @_;
219	10177	50				19297	defined $name
220							or confess "Programming error - undefined cookie name";
221	10177	50				19154	if ( $self->{trace} ) {
222	0					0	local $" = ', ';
223	0					0	warn "cookie( '$name', @args )\n";
224							}
225	10177	100				38806	@args or return $self->{cookie}{$name};
226	721					1560	my $cookie = shift @args;
227	721	100				2943	if ( CODE_REF eq ref $cookie ) {
		50
228	593					2967	return ( $self->{cookie}{$name} = $cookie );
229							} elsif ( defined $cookie ) {
230	0					0	confess "Programming error - cookie must be CODE ref or undef";
231							} else {
232	128					570	return delete $self->{cookie}{$name};
233							}
234							}
235
236							# NOTE: Currently this is called only against
237							# COOKIE_LOOKAROUND_ASSERTION, once in PPIx::Token::GroupType::Assertion
238							# to prevent the cookie from being remade if it already exists, and once
239							# in PPIx::Regexp::Token::Assertion to determine if \K is inside a
240							# lookaround assertion. If it gets used other places, or if there is
241							# call for it, I should consider removing the underscores and
242							# documenting it as public.
243							sub __cookie_exists {
244	57			57		187	my ( $self, $name ) = @_;
245	57	50				177	defined $name
246							or confess "Programming error - undefined cookie name";
247	57					246	return $self->{cookie}{$name};
248							}
249
250							sub default_modifiers {
251	0			0	1	0	my ( $self ) = @_;
252	0					0	return [ @{ $self->{default_modifiers} } ];
	0					0
253							}
254
255							sub __effective_modifiers {
256	332			332		934	my ( $self ) = @_;
257							HASH_REF eq ref $self->{effective_modifiers}
258	332	100				1316	or return {};
259	324					639	return { %{ $self->{effective_modifiers} } };
	324					1358
260							}
261
262							sub encoding {
263	0			0	1	0	my ( $self ) = @_;
264	0					0	return $self->{encoding};
265							}
266
267							sub expect {
268	330			330	1	1393	my ( $self, @args ) = @_;
269
270							@args
271	330	50				917	or return;
272
273							$self->{expect_next} = [
274	330	50				765	map { m/ \A PPIx::Regexp:: /smx ? $_ : 'PPIx::Regexp::' . $_ }
	2602					7883
275							@args
276							];
277	330					1029	$self->{expect} = undef;
278	330					914	return;
279							}
280
281							sub failures {
282	8			8	1	19	my ( $self ) = @_;
283	8					22	return $self->{failures};
284							}
285
286							sub find_matching_delimiter {
287	583			583	1	1372	my ( $self ) = @_;
288	583		100			2653	$self->{cursor_curr} \|\|= 0;
289							my $start = substr
290							$self->{content},
291							$self->{cursor_curr},
292	583					1461	1;
293
294	583					1098	my $inx = $self->{cursor_curr};
295	583		66			2302	my $finish = (
296							my $bracketed = $self->close_bracket( $start ) ) \|\| $start;
297
298							=begin comment
299
300							$self->{trace}
301							and warn "Find matching delimiter: Start with '$start' at $self->{cursor_curr}, end with '$finish' at or before $self->{cursor_limit}\n";
302
303							=end comment
304
305							=cut
306
307	583					1238	my $nest = 0;
308
309	583					1878	while ( ++$inx < $self->{cursor_limit} ) {
310	6122					9301	my $char = substr $self->{content}, $inx, 1;
311
312							=begin comment
313
314							$self->{trace}
315							and warn " looking at '$char' at $inx, nest level $nest\n";
316
317							=end comment
318
319							=cut
320
321	6122	100	100			22286	if ( $char eq '\\' && $finish ne '\\' ) {
		100	100
		100
322	317					773	++$inx;
323							} elsif ( $bracketed && $char eq $start ) {
324	1					10	++$nest;
325							} elsif ( $char eq $finish ) {
326							--$nest < 0
327	582	100				3940	and return $inx - $self->{cursor_curr};
328							}
329							}
330
331	2					8	return;
332							}
333
334							sub find_regexp {
335	16830			16830	1	30860	my ( $self, $regexp ) = @_;
336
337	16830	50	0			36780	REGEXP_REF eq ref $regexp
338							or confess
339							'Argument is a ', ( ref $regexp \|\| 'scalar' ), ' not a Regexp';
340
341	16830	100				37729	defined $self->{find} or $self->_remainder();
342
343	16830	100				100451	$self->{find} =~ $regexp
344							or return;
345
346	1840					3474	my @capture;
347	1840					6754	foreach my $inx ( 0 .. $#+ ) {
348	4247	100	66			18977	if ( defined $-[$inx] && defined $+[$inx] ) {
349							push @capture, $self->{capture} = substr
350							$self->{find},
351	3758					19736	$-[$inx],
352							$+[$inx] - $-[$inx];
353							} else {
354	489					1352	push @capture, undef;
355							}
356							}
357	1840					4640	$self->{match} = shift @capture;
358	1840					3935	$self->{capture} = \@capture;
359
360							# The following circumlocution seems to be needed under Perl 5.13.0
361							# for reasons I do not fathom -- at least in the case where
362							# wantarray is false. RT 56864 details the symptoms, which I was
363							# never able to reproduce outside Perl::Critic. But returning $+[0]
364							# directly, the value could transmogrify between here and the
365							# calling module.
366							## my @data = ( $-[0], $+[0] );
367							## return wantarray ? @data : $data[1];
368	1840	50				9691	return wantarray ? ( $-[0] + 0, $+[0] + 0 ) : $+[0] + 0;
369							}
370
371							sub get_mode {
372	46			46	1	127	my ( $self ) = @_;
373	46					230	return $self->{mode};
374							}
375
376							sub get_start_delimiter {
377	1794			1794	1	2942	my ( $self ) = @_;
378	1794					8080	return $self->{delimiter_start};
379							}
380
381							sub get_token {
382	4114			4114	1	7004	my ( $self ) = @_;
383
384							caller eq __PACKAGE__ or $self->{cursor_curr} > $self->{cursor_orig}
385	4114	50	66			13112	or confess 'Programming error - get_token() called without ',
386							'first calling make_token()';
387
388	4114					10181	my $handler = '__PPIX_TOKENIZER__' . $self->{mode};
389
390							my $code = $self->can( $handler )
391							or confess 'Programming error - ',
392							"Getting token in mode '$self->{mode}'. ",
393							"cursor_curr = $self->{cursor_curr}; ",
394							"cursor_limit = $self->{cursor_limit}; ",
395							"length( content ) = ", length $self->{content},
396	4114	50				16923	"; content = '$self->{content}'";
397
398							my $character = substr(
399							$self->{content},
400							$self->{cursor_curr},
401	4114					9752	1
402							);
403
404							$self->{trace}
405	4114	50				8552	and warn "get_token() got '$character' from $self->{cursor_curr}\n";
406
407	4114					9836	return ( $code->( $self, $character ) );
408							}
409
410							sub interpolates {
411	141			141	1	290	my ( $self ) = @_;
412	141					703	return $self->{delimiter_start} ne q{'};
413							}
414
415							sub make_token {
416	5216			5216	1	13002	my ( $self, $length, $class, $arg ) = @_;
417	5216	100				11054	defined $class or $class = caller;
418
419	5216	50				12572	if ( $length + $self->{cursor_curr} > $self->{cursor_limit} ) {
420							$length = $self->{cursor_limit} - $self->{cursor_curr}
421	0	0				0	or return;
422							}
423
424	5216	50				18404	$class =~ m/ \A PPIx::Regexp:: /smx
425							or $class = 'PPIx::Regexp::' . $class;
426							my $content = substr
427							$self->{content},
428							$self->{cursor_curr},
429	5216					11750	$length;
430
431							$self->{trace}
432	5216	50				10384	and warn "make_token( $length, '$class' ) => '$content'\n";
433	5216	50				11656	$self->{trace} > 1
434							and warn " make_token: cursor_curr = $self->{cursor_curr}; ",
435							"cursor_limit = $self->{cursor_limit}\n";
436							my $token = $class->__new( $content,
437							tokenizer => $self,
438	5216	100				9092	%{ $arg \|\| {} } )
	5216	50				36872
439							or return;
440
441							$self->{index_locations}
442	5216	100				15037	and $self->_update_location( $token );
443
444							$token->significant()
445	5216	100				15918	and $self->{expect} = undef;
446
447	5216	100				25050	$token->isa( TOKEN_UNKNOWN ) and $self->{failures}++;
448
449	5216					9055	$self->{cursor_curr} += $length;
450	5216					8354	$self->{find} = undef;
451	5216					8698	$self->{match} = undef;
452	5216					8067	$self->{capture} = undef;
453
454	5216					8367	foreach my $name ( keys %{ $self->{cookie} } ) {
	5216					13504
455	3615					6722	my $cookie = $self->{cookie}{$name};
456							$cookie->( $self, $token )
457	3615	100				9600	or delete $self->{cookie}{$name};
458							}
459
460							# Record this token as the prior token if it is significant. We must
461							# do this after processing cookies, so that the cookies have access
462							# to the old token if they want.
463							$token->significant()
464	5216	100				12692	and $self->{prior_significant_token} = $token;
465
466	5216					21661	return $token;
467							}
468
469							sub match {
470	86			86	1	228	my ( $self ) = @_;
471	86					253	return $self->{match};
472							}
473
474							sub modifier {
475	5036			5036	1	9686	my ( $self, $modifier ) = @_;
476							return PPIx::Regexp::Token::Modifier::__asserts(
477	5036					12769	$self->{modifiers}[-1], $modifier );
478							}
479
480							sub modifier_duplicate {
481	292			292	1	692	my ( $self ) = @_;
482	292					607	push @{ $self->{modifiers} },
483	292					457	{ %{ $self->{modifiers}[-1] } };
	292					1295
484	292					718	return;
485							}
486
487							sub modifier_modify {
488	592			592	1	1783	my ( $self, %args ) = @_;
489
490							# Modifier code is centralized in PPIx::Regexp::Token::Modifier
491							$self->{modifiers}[-1] =
492							PPIx::Regexp::Token::Modifier::__PPIX_TOKENIZER__modifier_modify(
493	592					2796	$self->{modifiers}[-1], \%args );
494
495	592					1548	return;
496
497							}
498
499							sub modifier_pop {
500	288			288	1	736	my ( $self ) = @_;
501	288					1087	@{ $self->{modifiers} } > 1
502	288	100				471	and pop @{ $self->{modifiers} };
	282					779
503	288					846	return;
504							}
505
506							sub modifier_seen {
507	8			8	1	30	my ( $self, $modifier ) = @_;
508	8					17	foreach my $mod ( reverse @{ $self->{modifiers} } ) {
	8					26
509	10	100				47	exists $mod->{$modifier}
510							and return 1;
511							}
512	5					23	return;
513							}
514
515							sub next_token {
516	5750			5750	1	10108	my ( $self ) = @_;
517
518							{
519
520	5750	100				8774	if ( @{ $self->{pending} } ) {
	9847					14513
	9847					20473
521	5214					6947	return shift @{ $self->{pending} };
	5214					17860
522							}
523
524	4633	100				11236	if ( $self->{cursor_curr} >= $self->{cursor_limit} ) {
525							$self->{cursor_limit} >= length $self->{content}
526	1091	100				5228	and return;
527	555	50				2023	$self->{mode} eq 'finish' and return;
528	555					1829	$self->_set_mode( 'finish' );
529	555					1520	$self->{cursor_limit} += length $self->{delimiter_finish};
530							}
531
532	4097	50				10302	if ( my @tokens = $self->get_token() ) {
533	4097					6232	push @{ $self->{pending} }, @tokens;
	4097					8922
534	4097					7469	redo;
535
536							}
537
538							}
539
540	0					0	return;
541
542							}
543
544							sub peek {
545	379			379	1	768	my ( $self, $offset ) = @_;
546	379	100				982	defined $offset or $offset = 0;
547	379	50				979	$offset < 0 and return;
548	379					739	$offset += $self->{cursor_curr};
549	379	50				1015	$offset >= $self->{cursor_limit} and return;
550	379					1967	return substr $self->{content}, $offset, 1;
551							}
552
553							sub ppi_document {
554	83			83	1	230	my ( $self ) = @_;
555
556	83	50				244	defined $self->{find} or $self->_remainder();
557
558	83					596	return PPI::Document->new( \"$self->{find}" );
559							}
560
561							sub prior_significant_token {
562	2413			2413	1	4345	my ( $self, $method, @args ) = @_;
563	2413	100				5043	defined $method or return $self->{prior_significant_token};
564							$self->{prior_significant_token}->can( $method )
565							or confess 'Programming error - ',
566							( ref $self->{prior_significant_token} \|\|
567	2394	50	0			9587	$self->{prior_significant_token} ),
568							' does not support method ', $method;
569	2394					9166	return $self->{prior_significant_token}->$method( @args );
570							}
571
572							# my $length = $token->__recognize_postderef( $tokenizer, $iterator ).
573							#
574							# This method is private to the PPIx-Regexp package, and may be changed
575							# or retracted without warning. What it does is to recognize postfix
576							# dereferences. It returns the length in characters of the first postfix
577							# dereference found, or a false value if none is found.
578							#
579							# The optional $iterator argument can be one of the following:
580							# - A code reference, which will be called to provide PPI::Element
581							# objects to be checked to see if they represent a postfix
582							# dereference.
583							# - A PPI::Element, which is checked to see if it is a postfix
584							# dereference.
585							# - Undef, or omitted, in which case ppi() is called on the invocant,
586							# and everything that follows the '->' operator is checked to see if
587							# it is a postfix dereference.
588							# - Anything else results in an exception and stack trace.
589
590							{
591							sub __recognize_postderef {
592	148			148		356	my ( $self, $token, $iterator ) = @_;
593
594							# Note that if ppi() gets called I have to hold a reference to
595							# the returned object until I am done with all its children.
596	148					300	my $ppi;
597	148	100				383	if ( ! defined $iterator ) {
		50
		0
598
599							# This MUST be done before ppi() is called.
600							$self->{index_locations}
601	144	100				457	and $self->_update_location( $token );
602
603	144					531	$ppi = $token->ppi();
604	29					8264	my @ops = grep { '->' eq $_->content() } @{
605	144	100				328	$ppi->find( 'PPI::Token::Operator' ) \|\| [] };
	144					656
606							$iterator = sub {
607	150	100		150		725	my $op = shift @ops
608							or return;
609	15					93	return $op->snext_sibling();
610	144					40822	};
611							} elsif ( $iterator->isa( 'PPI::Element' ) ) {
612	4					10	my @eles = ( $iterator );
613							$iterator = sub {
614	4			4		15	return shift @eles;
615	4					15	};
616							} elsif ( CODE_REF ne ref $iterator ) {
617	0					0	confess 'Programming error - Iterator not understood';
618							}
619
620	148					796	my $accept = $token->__postderef_accept_cast();
621
622	148					405	while ( my $elem = $iterator->() ) {
623
624	19					464	my $content = $elem->content();
625
626							# As of PPI 1.238, all postfix dereferences are parsed as
627							# casts. So if we find a cast of the correct content we have
628							# a postfix deref.
629	19	100				174	$elem->isa( 'PPI::Token::Cast' )
630							or next;
631
632	15	100				115	if ( $content =~ m/ ( .* ) \* \z /smx ) {
		50
633							# If we're an acceptable cast ending in a glob, accept
634							# it.
635	10	100				129	$accept->{$1}
636							and return length $content;
637							} elsif ( $accept->{$content} ) {
638							# If we're an acceptable cast followed by a subscript,
639							# we're a slice -- accept both cast and subscript.
640	5	50				24	my $next = $elem->snext_sibling()
641							or next;
642	5	50				136	$next->isa( 'PPI::Structure::Subscript' )
643							or next;
644	5					28	return length( $content ) + length( $next->content() );
645							}
646
647							# Otherwise, we're not a postfix dereference; try the next
648							# iteration.
649							}
650
651							# No postfix dereference found.
652	135					782	return;
653							}
654							}
655
656							sub significant {
657	0			0	1	0	return 1;
658							}
659
660							sub strict {
661	4			4	1	13	my ( $self ) = @_;
662	4					59	return $self->{strict};
663							}
664
665							sub _known_tokenizers {
666	3025			3025		5398	my ( $self ) = @_;
667
668	3025					4851	my $mode = $self->{mode};
669
670	3025					4608	my @expect;
671	3025	100				6639	if ( $self->{expect_next} ) {
672	328					1119	$self->{expect} = $self->{expect_next};
673	328					768	$self->{expect_next} = undef;
674							}
675	3025	100				6100	if ( $self->{expect} ) {
676							@expect = $self->_known_tokenizer_check(
677	334					713	@{ $self->{expect} } );
	334					1061
678							}
679
680							exists $self->{known}{$mode} and return (
681	3025	100				7663	@expect, @{ $self->{known}{$mode} } );
	2487					9954
682
683	538					2487	my @found = $self->_known_tokenizer_check(
684							$self->__tokenizer_classes() );
685
686	538					2743	$self->{known}{$mode} = \@found;
687	538					2159	return (@expect, @found);
688							}
689
690							sub _known_tokenizer_check {
691	872			872		3100	my ( $self, @args ) = @_;
692
693	872					2102	my $handler = '__PPIX_TOKENIZER__' . $self->{mode};
694	872					1373	my @found;
695
696	872					1806	foreach my $class ( @args ) {
697
698	8556	100				47463	$class->can( $handler ) or next;
699	8367					15159	push @found, $class;
700
701							}
702
703	872					4140	return @found;
704							}
705
706							sub tokens {
707	204			204	1	671	my ( $self ) = @_;
708
709	204					404	my @rslt;
710	204					766	while ( my $token = $self->next_token() ) {
711	1924					4534	push @rslt, $token;
712							}
713
714	204					1409	return @rslt;
715							}
716
717							# $self->_deprecation_notice( $type, $name );
718							#
719							# This method centralizes deprecation. Type is 'attribute' or
720							# 'method'. Deprecation is driven of the %deprecate hash. Values
721							# are:
722							# false - no warning
723							# 1 - warn on first use
724							# 2 - warn on each use
725							# 3 - die on each use.
726							#
727							# $self->_deprecation_in_progress( $type, $name )
728							#
729							# This method returns true if the deprecation is in progress. In
730							# fact it returns the deprecation level.
731
732							=begin comment
733
734							{
735
736							my %deprecate = (
737							attribute => {
738							postderef => 3,
739							},
740							);
741
742							sub _deprecation_notice {
743							my ( undef, $type, $name, $repl ) = @_; # Invocant unused
744							$deprecate{$type} or return;
745							$deprecate{$type}{$name} or return;
746							my $msg = sprintf 'The %s %s is %s', $name, $type,
747							$deprecate{$type}{$name} > 2 ? 'removed' : 'deprecated';
748							defined $repl
749							and $msg .= "; use $repl instead";
750							$deprecate{$type}{$name} >= 3
751							and croak $msg;
752							warnings::enabled( 'deprecated' )
753							and carp $msg;
754							$deprecate{$type}{$name} == 1
755							and $deprecate{$type}{$name} = 0;
756							return;
757							}
758
759							sub _deprecation_in_progress {
760							my ( $self, $type, $name ) = @_;
761							$deprecate{$type} or return;
762							return $deprecate{$type}{$name};
763							}
764
765							}
766
767							=end comment
768
769							=cut
770
771							sub _remainder {
772	3620			3620		6413	my ( $self ) = @_;
773
774							$self->{cursor_curr} > $self->{cursor_limit}
775	3620	50				9493	and confess "Programming error - Trying to find past end of string";
776							$self->{find} = substr(
777							$self->{content},
778							$self->{cursor_curr},
779							$self->{cursor_limit} - $self->{cursor_curr}
780	3620					9680	);
781
782	3620					6293	return;
783							}
784
785							sub _make_final_token {
786	10			10		35	my ( $self, $len, $class, $arg ) = @_;
787	10					36	my $token = $self->make_token( $len, $class, $arg );
788	10					39	$self->_set_mode( 'kaput' );
789	10					110	return $token;
790							}
791
792							sub _set_mode {
793	1644			1644		3791	my ( $self, $mode ) = @_;
794							$self->{trace}
795	1644	50				3741	and warn "Tokenizer going from mode $self->{mode} to $mode\n";
796	1644					3193	$self->{mode} = $mode;
797	1644	100				3937	if ( 'kaput' eq $mode ) {
798							$self->{cursor_curr} = $self->{cursor_limit} =
799	534					1515	length $self->{content};
800							}
801	1644					2967	return;
802							}
803
804							sub __init_error {
805	10			10		30	my ( $self , $err ) = @_;
806	10	100				30	defined $err
807							or $err = 'Tokenizer found illegal first characters';
808							return $self->_make_final_token(
809	10					56	length $self->{content}, TOKEN_UNKNOWN, {
810							error => $err,
811							},
812							);
813							}
814
815							sub _update_location {
816	107			107		216	my ( $self, $token ) = @_;
817							$token->{location} # Idempotent
818	107	100				236	and return;
819	105		66			262	my $loc = $self->{_location} \|\|= do {
820							my %loc = (
821							location => $self->{location},
822	12					46	);
823	12	100				48	if ( __instance( $self->{source}, 'PPI::Element' ) ) {
824	11		33			136	$loc{location} \|\|= $self->{source}->location();
825	11	50				1976	if ( my $doc = $self->{source}->document() ) {
826	11					323	$loc{tab_width} = $doc->tab_width();
827							}
828							}
829	12		100			110	$loc{tab_width} \|\|= 1;
830	12					50	\%loc;
831							};
832							$loc->{location}
833	105	50				258	or return;
834	105					154	$token->{location} = [ @{ $loc->{location} } ];
	105					297
835	105	50				339	if ( defined( my $content = $token->content() ) ) {
836
837	105					150	my $lines;
838	105					311	pos( $content ) = 0;
839	105					373	$lines++ while $content =~ m/ \n /smxgc;
840	105	100				240	if ( pos $content ) {
841	2					4	$loc->{location}[LOCATION_LINE] += $lines;
842	2					5	$loc->{location}[LOCATION_LOGICAL_LINE] += $lines;
843							$loc->{location}[LOCATION_CHARACTER] =
844	2					5	$loc->{location}[LOCATION_COLUMN] = 1;
845							}
846
847	105	100				249	if ( my $chars = length( $content ) - pos( $content ) ) {
848	102					180	$loc->{location}[LOCATION_CHARACTER] += $chars;
849	102	100	100			294	if ( $loc->{tab_width} > 1 && $content =~ m/ \t /smx ) {
850	5					14	my $pos = $loc->{location}[LOCATION_COLUMN];
851	5					8	my $tab_width = $loc->{tab_width};
852							# Stolen shamelessly from PPI::Document::_visual_length
853	5					12	my ( $vis_inc );
854	5					23	foreach my $part ( split /(\t)/, $content ) {
855	10	100				22	if ($part eq "\t") {
856	5					12	$vis_inc = $tab_width - ($pos-1) % $tab_width;
857							} else {
858	5					8	$vis_inc = length $part;
859							}
860	10					16	$pos += $vis_inc;
861							}
862	5					14	$loc->{location}[LOCATION_COLUMN] = $pos;
863							} else {
864	97					195	$loc->{location}[LOCATION_COLUMN] += $chars;
865							}
866							}
867
868							}
869	105					226	return;
870							}
871
872							sub __PPIX_TOKENIZER__init {
873	534			534		1386	my ( $self ) = @_;
874
875	534	50				3591	$self->find_regexp(
876							qr{ \A ( \s* ) ( qr \| m \| s )? ( \s* ) ( . ) }smx )
877							or return $self->__init_error();
878
879	534					2813	my ( $leading_white, $type, $next_white, $delim_start ) = $self->capture();
880
881	534	100				1949	defined $type
882							or $type = '';
883
884	534	100	100			3249	$type
885							or $delim_start =~ m< \A [/?] \z >smx
886							or return $self->__init_error();
887	528	100	100			3087	$type
			100
888							and not $next_white
889							and $delim_start =~ m< \A \w \z >smx
890							and return $self->__init_error();
891
892	526					1645	$self->{type} = $type;
893
894	526					1142	my @tokens;
895
896	526	100				2000	'' ne $leading_white
897							and push @tokens, $self->make_token( length $leading_white,
898							'PPIx::Regexp::Token::Whitespace' );
899	526					2418	push @tokens, $self->make_token( length $type,
900							'PPIx::Regexp::Token::Structure' );
901	526	100				2089	'' ne $next_white
902							and push @tokens, $self->make_token( length $next_white,
903							'PPIx::Regexp::Token::Whitespace' );
904
905	526					1472	$self->{delimiter_start} = $delim_start;
906
907							$self->{trace}
908	526	50				2075	and warn "Tokenizer found regexp start delimiter '$delim_start' at $self->{cursor_curr}\n";
909
910	526	50				1940	if ( my $offset = $self->find_matching_delimiter() ) {
911	526					1362	my $cursor_limit = $self->{cursor_curr} + $offset;
912							$self->{trace}
913	526	50				1363	and warn "Tokenizer found regexp end delimiter at $cursor_limit\n";
914	526	100				1847	if ( $self->__number_of_extra_parts() ) {
915							### my $found_embedded_comments;
916	43	100				205	if ( $self->close_bracket(
917							$self->{delimiter_start} ) ) {
918							pos $self->{content} = $self->{cursor_curr} +
919	7					88	$offset + 1;
920							# If we're bracketed, there may be Perl comments between
921							# the regex and the replacement. PPI gets the parse
922							# wrong as of 1.220, but if we get the handling of the
923							# underlying string right, we will Just Work when PPI
924							# gets it right.
925	7					74	while ( $self->{content} =~
926							m/ \G \s* \n \s* \# [^\n]* /smxgc ) {
927							## $found_embedded_comments = 1;
928							}
929	7					42	$self->{content} =~ m/ \s* /smxgc;
930							} else {
931							pos $self->{content} = $self->{cursor_curr} +
932	36					251	$offset;
933							}
934							# Localizing cursor_curr and delimiter_start would be
935							# cleaner, but I don't want the old values restored if a
936							# parse error occurs.
937	43					163	my $cursor_curr = $self->{cursor_curr};
938	43					139	my $delimiter_start = $self->{delimiter_start};
939	43					212	$self->{cursor_curr} = pos $self->{content};
940							$self->{delimiter_start} = substr
941							$self->{content},
942							$self->{cursor_curr},
943	43					165	1;
944							$self->{trace}
945	43	50				132	and warn "Tokenizer found replacement start delimiter '$self->{delimiter_start}' at $self->{cursor_curr}\n";
946	43	100				150	if ( my $s_off = $self->find_matching_delimiter() ) {
947							$self->{cursor_modifiers} =
948	41					210	$self->{cursor_curr} + $s_off + 1;
949							$self->{trace}
950	41	50				159	and warn "Tokenizer found replacement end delimiter at @{[
951	0					0	$self->{cursor_curr} + $s_off ]}\n";
952	41					96	$self->{cursor_curr} = $cursor_curr;
953	41					114	$self->{delimiter_start} = $delimiter_start;
954							} else {
955							$self->{trace}
956	2	50				10	and warn 'Tokenizer failed to find replacement',
957							"end delimiter starting at $self->{cursor_curr}\n";
958	2					6	$self->{cursor_curr} = 0;
959							# TODO If I were smart enough here I could check for
960							# PPI mis-parses like s{foo}
961							# #{bar}
962							# {baz}
963							# here, doing so if $found_embedded_comments (commented
964							# out above) is true. The problem is that there seem to
965							# as many mis-parses as there are possible delimiters.
966	2					11	return $self->__init_error(
967							'Tokenizer found mismatched replacement delimiters',
968							);
969							}
970							} else {
971	483					1397	$self->{cursor_modifiers} = $cursor_limit + 1;
972							}
973	524					1209	$self->{cursor_limit} = $cursor_limit;
974							} else {
975	0					0	$self->{cursor_curr} = 0;
976							return $self->_make_final_token(
977	0					0	length( $self->{content} ), TOKEN_UNKNOWN, {
978							error => 'Tokenizer found mismatched regexp delimiters',
979							},
980							);
981							}
982
983							{
984							# We have to instantiate the trailing tokens now so we can
985							# figure out what modifiers are in effect. But we can't
986							# index their locations (if desired) because they are being
987							# instantiated out of order
988
989	524					796	local $self->{index_locations} = 0;
	524					1640
990
991	524					909	my @mods = @{ $self->{default_modifiers} };
	524					1450
992	524					2078	pos $self->{content} = $self->{cursor_modifiers};
993	524					1701	local $self->{cursor_curr} = $self->{cursor_modifiers};
994	524					1546	local $self->{cursor_limit} = length $self->{content};
995	524					960	my @trailing;
996							{
997	524					941	my $len = $self->find_regexp( qr{ \A [[:lower:]]* }smx );
	524					2564
998	524					2609	push @trailing, $self->make_token( $len,
999							'PPIx::Regexp::Token::Modifier' );
1000							}
1001	524	100				2736	if ( my $len = $self->find_regexp( qr{ \A \s+ }smx ) ) {
1002	1					6	push @trailing, $self->make_token( $len,
1003							'PPIx::Regexp::Token::Whitespace' );
1004							}
1005	524	100				2901	if ( my $len = $self->find_regexp( qr{ \A .+ }smx ) ) {
1006	1					11	push @trailing, $self->make_token( $len, TOKEN_UNKNOWN, {
1007							error => 'Trailing characters after expression',
1008							} );
1009							}
1010	524					1874	$self->{trailing_tokens} = \@trailing;
1011	524					1945	push @mods, $trailing[0]->content();
1012							$self->{effective_modifiers} =
1013	524					1606	PPIx::Regexp::Token::Modifier::__aggregate_modifiers (
1014							@mods );
1015							$self->{modifiers} = [
1016	524					1274	{ %{ $self->{effective_modifiers} } },
	524					3315
1017							];
1018							}
1019
1020							$self->{delimiter_finish} = substr
1021							$self->{content},
1022							$self->{cursor_limit},
1023	524					2143	1;
1024
1025	524					1576	push @tokens, $self->make_token( 1,
1026							'PPIx::Regexp::Token::Delimiter' );
1027
1028	524					2877	$self->_set_mode( 'regexp' );
1029
1030	524					1467	$self->{find} = undef;
1031
1032	524					2650	return @tokens;
1033							}
1034
1035							# Match the initial part of the regexp including any leading white
1036							# space. The initial delimiter is the first thing not consumed, though
1037							# we check it for sanity.
1038							sub __initial_match {
1039	0			0		0	my ( $self ) = @_;
1040
1041	0	0				0	$self->find_regexp(
1042							qr{ \A ( \s* ) ( qr \| m \| s )? ( \s* ) (?: [^\w\s] ) }smx )
1043							or return;
1044
1045	0					0	my ( $leading_white, $type, $next_white ) = $self->capture();
1046
1047	0	0				0	defined $type
1048							or $type = '';
1049
1050	0					0	$self->{type} = $type;
1051
1052	0					0	my @tokens;
1053
1054	0	0				0	'' ne $leading_white
1055							and push @tokens, $self->make_token( length $leading_white,
1056							'PPIx::Regexp::Token::Whitespace' );
1057	0					0	push @tokens, $self->make_token( length $type,
1058							'PPIx::Regexp::Token::Structure' );
1059	0	0				0	'' ne $next_white
1060							and push @tokens, $self->make_token( length $next_white,
1061							'PPIx::Regexp::Token::Whitespace' );
1062
1063	0					0	return @tokens;
1064							}
1065
1066							{
1067							my %extra_parts = (
1068							s => 1,
1069							);
1070
1071							# Return the number of extra delimited parts. This will be 0 except
1072							# for s///, which will be 1.
1073							sub __number_of_extra_parts {
1074	850			850		2058	my ( $self ) = @_;
1075	850		100			4213	return $extra_parts{$self->{type}} \|\| 0;
1076							}
1077							}
1078
1079							{
1080							my @part_class = qw{
1081							PPIx::Regexp::Structure::Regexp
1082							PPIx::Regexp::Structure::Replacement
1083							};
1084
1085							# Return the classes for the parts of the expression.
1086							sub __part_classes {
1087	324			324		922	my ( $self ) = @_;
1088	324					980	my $max = $self->__number_of_extra_parts();
1089	324					2215	return @part_class[ 0 .. $max ];
1090							}
1091							}
1092
1093							sub __PPIX_TOKENIZER__regexp {
1094	3025			3025		6295	my ( $self, $character ) = @_;
1095
1096	3025					5312	my $mode = $self->{mode};
1097	3025					5956	my $handler = '__PPIX_TOKENIZER__' . $mode;
1098
1099	3025					5543	$self->{cursor_orig} = $self->{cursor_curr};
1100	3025					7079	foreach my $class ( $self->_known_tokenizers() ) {
1101	13467					53774	my @tokens = grep { $_ } $class->$handler( $self, $character );
	3856					9877
1102							$self->{trace}
1103	13467	50				27857	and warn $class, "->$handler( \$self, '$character' )",
1104							" => (@tokens)\n";
1105							@tokens
1106							and return ( map {
1107	13467	100				28310	ref $_ ? $_ : $self->make_token( $_,
	3022	100				11985
1108							$class ) } @tokens );
1109							}
1110
1111							# Find a fallback processor for the character.
1112	27		33			289	my $fallback = __PACKAGE__->can( '__PPIX_TOKEN_FALLBACK__' . $mode )
1113							\|\| __PACKAGE__->can( '__PPIX_TOKEN_FALLBACK__regexp' )
1114							\|\| confess "Programming error - unable to find fallback for $mode";
1115	27					105	return $fallback->( $self, $character );
1116							}
1117
1118							*__PPIX_TOKENIZER__repl = \&__PPIX_TOKENIZER__regexp;
1119
1120							sub __PPIX_TOKEN_FALLBACK__regexp {
1121	18			18		46	my ( $self, $character ) = @_;
1122
1123							# As a fallback in regexp mode, any escaped character is a literal.
1124	18	100	66			90	if ( $character eq '\\'
1125							&& $self->{cursor_limit} - $self->{cursor_curr} > 1
1126							) {
1127	2					9	return $self->make_token( 2, TOKEN_LITERAL );
1128							}
1129
1130							# Any normal character is unknown.
1131	16					89	return $self->make_token( 1, TOKEN_UNKNOWN, {
1132							error => 'Tokenizer found unexpected literal',
1133							},
1134							);
1135							}
1136
1137							sub __PPIX_TOKEN_FALLBACK__repl {
1138	9			9		24	my ( $self, $character ) = @_;
1139
1140							# As a fallback in replacement mode, any escaped character is a literal.
1141	9	100	66			43	if ( $character eq '\\'
1142							&& defined ( my $next = $self->peek( 1 ) ) ) {
1143
1144	5	0	33			24	if ( $self->interpolates() \|\| $next eq q<'> \|\| $next eq '\\' ) {
			33
1145	5					23	return $self->make_token( 2, TOKEN_LITERAL );
1146							}
1147	0					0	return $self->make_token( 1, TOKEN_LITERAL );
1148							}
1149
1150							# So is any normal character.
1151	4					14	return $self->make_token( 1, TOKEN_LITERAL );
1152							}
1153
1154							sub __PPIX_TOKENIZER__finish {
1155	555			555		1852	my ( $self ) = @_; # $character unused
1156
1157							$self->{cursor_limit} > length $self->{content}
1158	555	50				2492	and confess "Programming error - ran off string";
1159
1160							my @tokens = $self->make_token( length $self->{delimiter_finish},
1161	555					1960	'PPIx::Regexp::Token::Delimiter' );
1162
1163	555	100				2666	if ( $self->{cursor_curr} == $self->{cursor_modifiers} ) {
1164
1165							# We are out of string. Add the trailing tokens (created when we
1166							# did the initial bracket scan) and close up shop.
1167
1168	514					1974	push @tokens, $self->_get_trailing_tokens();
1169
1170	514					1410	$self->_set_mode( 'kaput' );
1171
1172							} else {
1173
1174							# Clear the cookies, because we are going around again.
1175	41					242	$self->{cookie} = {};
1176
1177							# Move the cursor limit to just before the modifiers.
1178	41					154	$self->{cursor_limit} = $self->{cursor_modifiers} - 1;
1179
1180							# If the preceding regular expression was bracketed, we need to
1181							# consume possible whitespace and find another delimiter.
1182
1183	41	100				210	if ( $self->close_bracket( $self->{delimiter_start} ) ) {
1184	7					20	my $accept;
1185							# If we are bracketed, there can be honest-to-God Perl
1186							# comments between the regexp and the replacement, not just
1187							# regexp comments. As of version 1.220, PPI does not get
1188							# this parse right, but if we can handle this is a string,
1189							# then we will Just Work when PPI gets itself straight.
1190	7					67	while ( $self->find_regexp(
1191							qr{ \A ( \s* \n \s* ) ( \# [^\n]* \n ) }smx ) ) {
1192	2					12	my ( $white_space, $comment ) = $self->capture();
1193	2					9	push @tokens, $self->make_token(
1194							length $white_space,
1195							'PPIx::Regexp::Token::Whitespace',
1196							), $self->make_token(
1197							length $comment,
1198							'PPIx::Regexp::Token::Comment',
1199							);
1200							}
1201	7	100				78	$accept = $self->find_regexp( qr{ \A \s+ }smx )
1202							and push @tokens, $self->make_token(
1203							$accept, 'PPIx::Regexp::Token::Whitespace' );
1204	7					63	my $character = $self->peek();
1205	7					29	$self->{delimiter_start} = $character;
1206	7					33	push @tokens, $self->make_token(
1207							1, 'PPIx::Regexp::Token::Delimiter' );
1208							$self->{delimiter_finish} = substr
1209							$self->{content},
1210	7					75	$self->{cursor_limit} - 1,
1211							1;
1212							}
1213
1214	41	100				198	if ( $self->modifier( 'e*' ) ) {
1215							# With /e or /ee, the replacement portion is code. We make
1216							# it all into one big PPIx::Regexp::Token::Code, slap on the
1217							# trailing delimiter and modifiers, and return it all.
1218							push @tokens, $self->make_token(
1219							$self->{cursor_limit} - $self->{cursor_curr},
1220	10					109	'PPIx::Regexp::Token::Code',
1221							{ perl_version_introduced => MINIMUM_PERL },
1222							);
1223	10					56	$self->{cursor_limit} = length $self->{content};
1224	10					41	push @tokens, $self->make_token( 1,
1225							'PPIx::Regexp::Token::Delimiter' ),
1226							$self->_get_trailing_tokens();
1227	10					33	$self->_set_mode( 'kaput' );
1228							} else {
1229							# Put our mode to replacement.
1230	31					224	$self->_set_mode( 'repl' );
1231							}
1232
1233							}
1234
1235	555					2074	return @tokens;
1236
1237							}
1238
1239							# To common processing on trailing tokens.
1240							sub _get_trailing_tokens {
1241	524			524		1260	my ( $self ) = @_;
1242	524	100				1594	if ( $self->{index_locations} ) {
1243							# We turned off index_locations when these were created, because
1244							# they were done out of order. Fix that now.
1245	11					25	foreach my $token ( @{ $self->{trailing_tokens} } ) {
	11					32
1246	11					23	$self->_update_location( $token );
1247							}
1248							}
1249	524					897	return @{ delete $self->{trailing_tokens} };
	524					1792
1250							}
1251
1252							1;
1253
1254							__END__