| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
package Data::Search; |
|
2
|
1
|
|
|
1
|
|
21744
|
use 5.005; |
|
|
1
|
|
|
|
|
3
|
|
|
|
1
|
|
|
|
|
36
|
|
|
3
|
1
|
|
|
1
|
|
5
|
use strict; |
|
|
1
|
|
|
|
|
2
|
|
|
|
1
|
|
|
|
|
29
|
|
|
4
|
1
|
|
|
1
|
|
4
|
use warnings; |
|
|
1
|
|
|
|
|
5
|
|
|
|
1
|
|
|
|
|
1164
|
|
|
5
|
|
|
|
|
|
|
require Exporter; |
|
6
|
|
|
|
|
|
|
our $VERSION = '0.03'; |
|
7
|
|
|
|
|
|
|
our @ISA = qw(Exporter); |
|
8
|
|
|
|
|
|
|
our @EXPORT= qw(datasearch); |
|
9
|
|
|
|
|
|
|
|
|
10
|
|
|
|
|
|
|
=head1 NAME |
|
11
|
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
Data::Search - Data structure search |
|
13
|
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
=head1 SYNOPSIS |
|
15
|
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
use Data::Search; |
|
17
|
|
|
|
|
|
|
|
|
18
|
|
|
|
|
|
|
$data = { ... }; |
|
19
|
|
|
|
|
|
|
@results = datasearch( data => $data, search => 'values', |
|
20
|
|
|
|
|
|
|
find => qr/string/, return => 'hashcontainer' ); |
|
21
|
|
|
|
|
|
|
|
|
22
|
|
|
|
|
|
|
=head1 DESCRIPTION |
|
23
|
|
|
|
|
|
|
|
|
24
|
|
|
|
|
|
|
=head2 datasearch - Search data structures |
|
25
|
|
|
|
|
|
|
|
|
26
|
|
|
|
|
|
|
This function allows you to search arbitrarily large/complex |
|
27
|
|
|
|
|
|
|
data structures for particular elements. |
|
28
|
|
|
|
|
|
|
You can search hash keys, or hash/array values, for a number/string |
|
29
|
|
|
|
|
|
|
or regular expression. |
|
30
|
|
|
|
|
|
|
The datasearch function can return either the found hash keys, the found |
|
31
|
|
|
|
|
|
|
values (which could be data structures themselves) or the container |
|
32
|
|
|
|
|
|
|
of the key or value (which is always going to be a data structure). |
|
33
|
|
|
|
|
|
|
|
|
34
|
|
|
|
|
|
|
By default, hash keys are searched, and the corresponding values are returned. |
|
35
|
|
|
|
|
|
|
To search hash or array values, specify SEARCH => 'values'. |
|
36
|
|
|
|
|
|
|
To search both values and keys, specify SEARCH => 'all'. |
|
37
|
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
To find an exact match of a string, set FIND => 'string'. To use a regular |
|
39
|
|
|
|
|
|
|
expression use the qr operator: FIND => qr/^name.*/i |
|
40
|
|
|
|
|
|
|
FIND may also be a 2 element array, to search for a key-value pair. |
|
41
|
|
|
|
|
|
|
|
|
42
|
|
|
|
|
|
|
To return the hash keys found (or the hash keys corresponding to |
|
43
|
|
|
|
|
|
|
searched values), specify RETURN => 'keys'. |
|
44
|
|
|
|
|
|
|
To return both keys and values specify RETURN => 'all'. |
|
45
|
|
|
|
|
|
|
|
|
46
|
|
|
|
|
|
|
You can also return the data structure containing the found key/value. |
|
47
|
|
|
|
|
|
|
|
|
48
|
|
|
|
|
|
|
To do that, specify RETURN => 'container'. This will return the immediate |
|
49
|
|
|
|
|
|
|
container, either a hash or an array reference. You can also choose to |
|
50
|
|
|
|
|
|
|
get the closest hash container (even if the value was inside an array) |
|
51
|
|
|
|
|
|
|
by specifying RETURN => 'hashcontainer'. |
|
52
|
|
|
|
|
|
|
|
|
53
|
|
|
|
|
|
|
Similarly, you can return the closest array container (even though the |
|
54
|
|
|
|
|
|
|
value found was a hash value or hash key) by specifying |
|
55
|
|
|
|
|
|
|
RETURN => 'arraycontainer' |
|
56
|
|
|
|
|
|
|
|
|
57
|
|
|
|
|
|
|
Also, you can get an outer container by doing RETURN => 'container:xyz' |
|
58
|
|
|
|
|
|
|
in which case the container returned would be a structure pointed to |
|
59
|
|
|
|
|
|
|
by key xyz (if found to contain the search element somewhere inside it). |
|
60
|
|
|
|
|
|
|
Please see the examples at the end of this document. |
|
61
|
|
|
|
|
|
|
|
|
62
|
|
|
|
|
|
|
ARGUMENTS |
|
63
|
|
|
|
|
|
|
The following arguments are accepted (case-insensitively). |
|
64
|
|
|
|
|
|
|
The only mandatory arguments are DATA and FIND. |
|
65
|
|
|
|
|
|
|
|
|
66
|
|
|
|
|
|
|
data => Reference of structure to search |
|
67
|
|
|
|
|
|
|
search => What elements to search: keys|values|all (default: keys) |
|
68
|
|
|
|
|
|
|
find => Look for: string | qr/regex/ | [ key => value ] |
|
69
|
|
|
|
|
|
|
return => What to return: keys|values|all| |
|
70
|
|
|
|
|
|
|
container|hashcontainer|arraycontainer|container:key_name |
|
71
|
|
|
|
|
|
|
|
|
72
|
|
|
|
|
|
|
RETURN VALUES |
|
73
|
|
|
|
|
|
|
|
|
74
|
|
|
|
|
|
|
Returns a list of matching elements (could be strings or references |
|
75
|
|
|
|
|
|
|
to internal parts (hashes/arrays) of the data structure). |
|
76
|
|
|
|
|
|
|
|
|
77
|
|
|
|
|
|
|
EXAMPLES |
|
78
|
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
my @results = datasearch( data => $ref, find => 'name' ); |
|
80
|
|
|
|
|
|
|
That will return all values pointed to by hash keys called 'name' |
|
81
|
|
|
|
|
|
|
|
|
82
|
|
|
|
|
|
|
my @results = datasearch( data => $ref, search => 'values', |
|
83
|
|
|
|
|
|
|
find => qr/alex/i, return => 'keys' ); |
|
84
|
|
|
|
|
|
|
That will return all keys that point to strings that match "alex" |
|
85
|
|
|
|
|
|
|
case insensitively. |
|
86
|
|
|
|
|
|
|
|
|
87
|
|
|
|
|
|
|
my @results = datasearch( data => $ref, search => 'keys', |
|
88
|
|
|
|
|
|
|
find => qr/_id$/, return => 'all' ); |
|
89
|
|
|
|
|
|
|
That will return all keys that end with "_id", and all values |
|
90
|
|
|
|
|
|
|
pointed to by those keys. |
|
91
|
|
|
|
|
|
|
|
|
92
|
|
|
|
|
|
|
my @results = datasearch( data => $ref, return => 'container:myrecord', |
|
93
|
|
|
|
|
|
|
find => [ suffix => 'Jr' ] ) |
|
94
|
|
|
|
|
|
|
That always searches hash keys (a key/value FIND forces key searching), looks for a key 'suffix' |
|
95
|
|
|
|
|
|
|
that has value 'Jr', and returns any matching hashes pointed to by a key |
|
96
|
|
|
|
|
|
|
named myrecord (even if suffix is deep inside those hashes) |
|
97
|
|
|
|
|
|
|
|
|
98
|
|
|
|
|
|
|
=cut |
|
99
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
# datasearch( data => $ref, find => $what, [ search => ..., return => ... ] )
#
# Public entry point. Parses the named arguments (case-insensitively, via
# get_args), derives the search/return flags, runs the recursive
# _datasearch over DATA and returns the list of matches with duplicate
# references removed.
#
# Dies if FIND or DATA is missing, or if an unknown argument name is given.
sub datasearch {
    my $args = get_args( [qw(FIND SEARCH RETURN DATA)], @_ );

    die "FIND argument is required" unless defined $args->{FIND};
    die "DATA argument is required" unless defined $args->{DATA};

    my $search = $args->{SEARCH};
    my $return = $args->{RETURN};

    # NOTE: these flags are plain expressions on purpose. The previous
    # "my $x = 1 if COND;" form has undefined behaviour in Perl.

    # Search keys by default, when asked to, or when FIND is a
    # [ key => value ] pair (which always needs the key comparison).
    my $sk = ( !$search
            || $search =~ /key|all/
            || ref( $args->{FIND} ) eq 'ARRAY' ) ? 1 : 0;

    # Search values only when explicitly requested.
    my $sv = ( $search && $search =~ /value|all/ ) ? 1 : 0;

    # Return values by default; return keys only when requested.
    my $rv = ( !$return || $return =~ /value|all/ ) ? 1 : 0;
    my $rk = ( $return && $return =~ /key|all/ ) ? 1 : 0;

    # Any RETURN mentioning "container" is passed through verbatim so the
    # worker can inspect the exact flavour (hash/array/container:NAME).
    my $rc = ( $return && $return =~ /container/ ) ? $return : 0;

    my @refs;    # references already visited, shared by all recursion levels
    my @results = _datasearch(
        $args->{DATA}, $args->{FIND}, $sk, $sv, $rv, $rk,
        $rc, \@refs, undef, undef, undef, 0
    );

    # Weed out duplicate references; plain (non-reference) results are
    # always kept, even when repeated.
    my @unique;
    foreach my $p (@results) {
        push @unique, $p
            unless ref($p) and grep { ref($_) && $_ == $p } @unique;
    }
    return @unique;
} ## end sub datasearch
|
125
|
|
|
|
|
|
|
|
|
126
|
|
|
|
|
|
|
# Internal recursive function called by datasearch.
#
# Positional arguments:
#   $p         - current node: hash ref, array ref, or plain scalar
#   $f         - what to find: string, qr// object, or [ key, value ] pair
#   $sk, $sv   - true to match against hash keys / scalar values
#   $rv, $rk   - true to return values / keys for a match
#   $rc        - the RETURN string when a container was requested, else false
#   $refs      - array ref of references already visited (shared by all calls)
#   $container - nearest enclosing container of the accepted kind
#   $key       - hash key under which $p was reached (undef at the top)
#   $rr        - value stored under the nearest enclosing 'container:NAME' key
#   $depth     - recursion depth (debugging aid only)
#
# Returns the list of matches found in $p and everything below it.
sub _datasearch {
    my ( $p, $f, $sk, $sv, $rv, $rk, $rc, $refs, $container, $key, $rr, $depth )
        = @_;

    # NAME part of a 'container:NAME' request; undef for other requests.
    my ($root) = $rc =~ /:(.+)/;

    # Visit every reference at most once; this also stops cyclic
    # structures from recursing forever.
    if ( ref($p) ) {
        if ( grep { $p == $_ } @$refs ) {
            warn "Skipping duplicate reference to $p";
            return;
        }
        push @$refs, $p;
    }

    # Classify by underlying type rather than by pattern-matching the
    # stringified reference, so a blessed array whose class name happens
    # to contain "HASH" is not treated as a hash.
    my $is_hash  = ref($p) && UNIVERSAL::isa( $p, 'HASH' );
    my $is_array = ref($p) && !$is_hash && UNIVERSAL::isa( $p, 'ARRAY' );

    my @results;
    if ($is_hash) {
        $container = $p unless $rc =~ /array/;

        # A [ key, value ] FIND splits into two patterns; otherwise only
        # $f1 is set.
        my ( $f1, $f2 ) = ref($f) eq 'ARRAY' ? ( $f->[0], $f->[1] ) : $f;

        foreach my $k ( keys %$p ) {
            my $v = $p->{$k};

            # The 'container:NAME' root applies to this key and its
            # subtree only. Keeping it in a per-key variable stops it
            # leaking to sibling keys visited later in the loop.
            my $rr_here = ( $root && $root eq $k ) ? $v : $rr;

            my $key_hit = $sk
                && ( ( ref($f1) eq 'Regexp' && $k =~ /$f1/ ) || $k eq $f1 );

            if ($key_hit) {
                # With a key/value pair the value must match too; an
                # undefined value never matches.
                my $value_ok = !defined $f2
                    || ( defined $v
                    && ( ( ref($f2) eq 'Regexp' && $v =~ /$f2/ ) || $v eq $f2 ) );

                if ($value_ok) {
                    if ($rc) {
                        if ($root) {
                            push @results, $rr_here if $rr_here;
                        }
                        else {
                            push @results, $container;
                        }
                    }
                    else {
                        push @results, $k if $rk;
                        push @results, $v if $rv;
                    }
                }
            }

            push @results,
                _datasearch( $v, $f, $sk, $sv, $rv, $rk,
                    $rc, $refs, $container, $k, $rr_here, $depth + 1 );
        }
    }
    elsif ($is_array) {
        $container = $p unless $rc =~ /hash/;

        # Array elements inherit the key and root of the array itself.
        foreach my $elem (@$p) {
            push @results,
                _datasearch( $elem, $f, $sk, $sv, $rv, $rk,
                    $rc, $refs, $container, $key, $rr, $depth + 1 );
        }
    }
    elsif ( !ref($p)
        && defined $p
        && $sv
        && ( ( ref($f) eq 'Regexp' && $p =~ /$f/ ) || $p eq $f ) )
    {
        # Plain scalar value that matches.
        if ($rc) {
            if ($root) {
                push @results, $rr if $rr;
            }
            else {
                push @results, $container;
            }
        }
        else {
            push @results, $p if $rv;
            push @results, $key if $rk && defined $key;
        }
    }

    return @results;
} ## end sub _datasearch
|
191
|
|
|
|
|
|
|
|
|
192
|
|
|
|
|
|
|
# Return a hash reference of named parameters (keys converted to upper case).
#
# Called as get_args(@_) or as get_args( [ 'ARG1', 'ARG2', ... ], @_ ).
# When the leading array reference is supplied, every argument name (after
# upper-casing) must appear in it.
#
# Always returns a hash reference, which is empty when no named arguments
# were passed.
#
# Dies on an odd number of name/value items or on an argument name that is
# not in the supplied list.
sub get_args {
    my $valid_arg_list = ( ref( $_[0] ) eq 'ARRAY' ? shift : '' );

    die "get_args got odd number of arguments"
        if @_ % 2;

    # Start from an empty hash so callers never receive undef.
    my $args = {};
    for ( my $n = 0; $n < @_; $n += 2 ) {
        $args->{ uc $_[$n] } = $_[ $n + 1 ];
    }

    # Do argument checking, if list of valid arguments was given
    if ($valid_arg_list) {
        foreach my $arg ( keys %$args ) {
            die "get_args: Argument \"$arg\" is invalid"
                unless grep { $_ eq $arg } @$valid_arg_list;
        }
    }
    return $args;
}
|
214
|
|
|
|
|
|
|
|
|
215
|
|
|
|
|
|
|
1; |
|
216
|
|
|
|
|
|
|
|