| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
# $Id: Opish.pm,v 1.2 2003/09/28 08:50:37 gene Exp $ |
|
2
|
|
|
|
|
|
|
|
|
3
|
|
|
|
|
|
|
package Acme::Opish; |
|
4
|
|
|
|
|
|
|
|
|
5
|
1
|
|
|
1
|
|
29918
|
use vars qw($VERSION); |
|
|
1
|
|
|
|
|
3
|
|
|
|
1
|
|
|
|
|
58
|
|
|
6
|
|
|
|
|
|
|
$VERSION = '0.0601'; |
|
7
|
|
|
|
|
|
|
|
|
8
|
1
|
|
|
1
|
|
6
|
use strict; |
|
|
1
|
|
|
|
|
1
|
|
|
|
1
|
|
|
|
|
37
|
|
|
9
|
1
|
|
|
1
|
|
5
|
use Carp; |
|
|
1
|
|
|
|
|
6
|
|
|
|
1
|
|
|
|
|
101
|
|
|
10
|
1
|
|
|
1
|
|
4
|
use base qw(Exporter); |
|
|
1
|
|
|
|
|
2
|
|
|
|
1
|
|
|
|
|
114
|
|
|
11
|
1
|
|
|
1
|
|
5
|
use vars qw(@EXPORT @EXPORT_OK); |
|
|
1
|
|
|
|
|
1
|
|
|
|
1
|
|
|
|
|
55
|
|
|
12
|
|
|
|
|
|
|
@EXPORT = @EXPORT_OK = qw( |
|
13
|
|
|
|
|
|
|
enop |
|
14
|
|
|
|
|
|
|
has_silent_e |
|
15
|
|
|
|
|
|
|
no_silent_e |
|
16
|
|
|
|
|
|
|
); |
|
17
|
1
|
|
|
1
|
|
4
|
use File::Basename; |
|
|
1
|
|
|
|
|
1
|
|
|
|
1
|
|
|
|
|
1071
|
|
|
18
|
|
|
|
|
|
|
|
|
19
|
|
|
|
|
|
|
# no_silent_e list {{{ |
|
20
|
|
|
|
|
|
|
my %OK; @OK{qw( |
|
21
|
|
|
|
|
|
|
adobe |
|
22
|
|
|
|
|
|
|
acme |
|
23
|
|
|
|
|
|
|
acne |
|
24
|
|
|
|
|
|
|
anime |
|
25
|
|
|
|
|
|
|
antistrophe |
|
26
|
|
|
|
|
|
|
apostrophe |
|
27
|
|
|
|
|
|
|
be |
|
28
|
|
|
|
|
|
|
breve |
|
29
|
|
|
|
|
|
|
Brule |
|
30
|
|
|
|
|
|
|
cabriole |
|
31
|
|
|
|
|
|
|
cache |
|
32
|
|
|
|
|
|
|
Calliope |
|
33
|
|
|
|
|
|
|
capote |
|
34
|
|
|
|
|
|
|
Catananche |
|
35
|
|
|
|
|
|
|
catastrophe |
|
36
|
|
|
|
|
|
|
clave |
|
37
|
|
|
|
|
|
|
cliche |
|
38
|
|
|
|
|
|
|
consomme |
|
39
|
|
|
|
|
|
|
coyote |
|
40
|
|
|
|
|
|
|
diastrophe |
|
41
|
|
|
|
|
|
|
epanastrophe |
|
42
|
|
|
|
|
|
|
epitome |
|
43
|
|
|
|
|
|
|
forte |
|
44
|
|
|
|
|
|
|
Giuseppe |
|
45
|
|
|
|
|
|
|
kamikaze |
|
46
|
|
|
|
|
|
|
karate |
|
47
|
|
|
|
|
|
|
me |
|
48
|
|
|
|
|
|
|
misogyne |
|
49
|
|
|
|
|
|
|
Pele |
|
50
|
|
|
|
|
|
|
phlebotome |
|
51
|
|
|
|
|
|
|
progne |
|
52
|
|
|
|
|
|
|
Psyche |
|
53
|
|
|
|
|
|
|
psyche |
|
54
|
|
|
|
|
|
|
Quixote |
|
55
|
|
|
|
|
|
|
recipie |
|
56
|
|
|
|
|
|
|
Sade |
|
57
|
|
|
|
|
|
|
Salome |
|
58
|
|
|
|
|
|
|
saute |
|
59
|
|
|
|
|
|
|
stanze |
|
60
|
|
|
|
|
|
|
supercatastrophe |
|
61
|
|
|
|
|
|
|
Tempe |
|
62
|
|
|
|
|
|
|
tousche |
|
63
|
|
|
|
|
|
|
tsetse |
|
64
|
|
|
|
|
|
|
tonsillectome |
|
65
|
|
|
|
|
|
|
tonsillotome |
|
66
|
|
|
|
|
|
|
tracheotome |
|
67
|
|
|
|
|
|
|
ukulele |
|
68
|
|
|
|
|
|
|
we |
|
69
|
|
|
|
|
|
|
zimbabwe |
|
70
|
|
|
|
|
|
|
)} = undef; |
|
71
|
|
|
|
|
|
|
# }}} |
|
72
|
|
|
|
|
|
|
|
|
73
|
|
|
|
|
|
|
# Add 'no_silent_e' entries if present and then return the list. |
|
74
|
|
|
|
|
|
|
sub no_silent_e { |
|
75
|
2
|
|
|
2
|
1
|
191
|
$OK{$_} = undef for @_; |
|
76
|
2
|
|
|
|
|
9
|
return keys %OK; |
|
77
|
|
|
|
|
|
|
} |
|
78
|
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
# Remove'no_silent_e' entries if present and then return the list. |
|
80
|
|
|
|
|
|
|
sub has_silent_e { |
|
81
|
1
|
|
|
1
|
1
|
5
|
delete $OK{$_} for @_; |
|
82
|
1
|
|
|
|
|
4
|
return keys %OK; |
|
83
|
|
|
|
|
|
|
} |
|
84
|
|
|
|
|
|
|
|
|
85
|
|
|
|
|
|
|
# Prefix vowels not declared in the 'no_silent_e' list. |
|
86
|
|
|
|
|
|
|
sub enop { |
|
87
|
11
|
|
|
11
|
1
|
2157
|
my $prefix = 'op'; |
|
88
|
|
|
|
|
|
|
# If present, the prefix is given as a named parameter. |
|
89
|
11
|
100
|
|
|
|
31
|
if ($_[0] eq '-opish_prefix') { |
|
90
|
1
|
|
|
|
|
2
|
shift; |
|
91
|
1
|
|
|
|
|
2
|
$prefix = shift; |
|
92
|
|
|
|
|
|
|
} |
|
93
|
|
|
|
|
|
|
|
|
94
|
|
|
|
|
|
|
# Process the given text stream. |
|
95
|
11
|
|
|
|
|
20
|
my @strings = @_; |
|
96
|
|
|
|
|
|
|
# Given as a known system filename. |
|
97
|
11
|
|
|
|
|
22
|
for (@strings) { # {{{ |
|
98
|
14
|
100
|
|
|
|
122
|
if (-f) { |
|
99
|
|
|
|
|
|
|
# Open the file for reading. |
|
100
|
1
|
50
|
|
|
|
43
|
open IN, $_ or carp "Can't read $_: $!\n"; |
|
101
|
|
|
|
|
|
|
|
|
102
|
|
|
|
|
|
|
# Construct a new filename. |
|
103
|
1
|
|
|
|
|
66
|
my ($name, $path) = fileparse($_, ''); |
|
104
|
1
|
|
|
|
|
4
|
$_ = $path . 'opish-' . $name; |
|
105
|
|
|
|
|
|
|
|
|
106
|
|
|
|
|
|
|
# Open the new file for writing. |
|
107
|
1
|
50
|
|
|
|
127
|
open OUT, ">$_" or carp "Can't write $_: $!\n"; |
|
108
|
|
|
|
|
|
|
|
|
109
|
|
|
|
|
|
|
# Write opish to the file. |
|
110
|
1
|
|
|
|
|
25
|
while (my $line = ) { |
|
111
|
4
|
|
|
|
|
11
|
print OUT _to_opish($prefix, $line), "\n"; |
|
112
|
|
|
|
|
|
|
} |
|
113
|
|
|
|
|
|
|
|
|
114
|
|
|
|
|
|
|
# Close the files. |
|
115
|
1
|
|
|
|
|
14
|
close IN; |
|
116
|
1
|
|
|
|
|
64
|
close OUT; |
|
117
|
|
|
|
|
|
|
} # }}} |
|
118
|
|
|
|
|
|
|
# ..or given as strings on the commandline. |
|
119
|
|
|
|
|
|
|
else { |
|
120
|
13
|
|
|
|
|
27
|
$_ = _to_opish($prefix, $_); |
|
121
|
|
|
|
|
|
|
} |
|
122
|
|
|
|
|
|
|
} |
|
123
|
|
|
|
|
|
|
|
|
124
|
11
|
|
|
|
|
62
|
return @strings; |
|
125
|
|
|
|
|
|
|
} |
|
126
|
|
|
|
|
|
|
|
|
127
|
|
|
|
|
|
|
# DrMath++ && DrForr++ && Yay! |
|
128
|
|
|
|
|
|
|
sub _to_opish { |
|
129
|
17
|
|
|
17
|
|
25
|
my ($prefix, $string) = @_; |
|
130
|
|
|
|
|
|
|
|
|
131
|
|
|
|
|
|
|
# XXX Oof. We don't preserve whitespace. : \ |
|
132
|
17
|
|
|
|
|
51
|
my @words = split /\s+/, $string; |
|
133
|
|
|
|
|
|
|
|
|
134
|
|
|
|
|
|
|
# Process each word as a unit. |
|
135
|
17
|
|
|
|
|
28
|
for (@words) { |
|
136
|
|
|
|
|
|
|
# Is this word capitalized? |
|
137
|
35
|
100
|
|
|
|
86
|
my $is_capped = /^[A-Z]/ ? 1 : 0; |
|
138
|
|
|
|
|
|
|
# Lowercase the first letter in case we have to prefix it. |
|
139
|
35
|
|
|
|
|
55
|
$_ = lcfirst; |
|
140
|
|
|
|
|
|
|
|
|
141
|
|
|
|
|
|
|
# Okay. Prefix the sucka. |
|
142
|
|
|
|
|
|
|
# XXX Ack. How can I simplify this ugliness? |
|
143
|
35
|
100
|
|
|
|
131
|
if (exists $OK{ lc $_ }) { # {{{ |
|
|
|
100
|
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
144
|
2
|
|
|
|
|
11
|
s/ |
|
145
|
|
|
|
|
|
|
( # Capture... |
|
146
|
|
|
|
|
|
|
[aeiouy]+ # consecutive vowels |
|
147
|
|
|
|
|
|
|
\B # that do not terminate at a word boundry |
|
148
|
|
|
|
|
|
|
(?![aeiouy]) # that are not followed by another vowel |
|
149
|
|
|
|
|
|
|
| # or |
|
150
|
|
|
|
|
|
|
[aeiouy]* # any consecutive vowels |
|
151
|
|
|
|
|
|
|
[aeiouy] # with any vowel following |
|
152
|
|
|
|
|
|
|
\b # that terminates at a word boundry. |
|
153
|
|
|
|
|
|
|
) # ...end capture. |
|
154
|
|
|
|
|
|
|
/$prefix$1/gisx; # Add 'op' to what we captured. |
|
155
|
|
|
|
|
|
|
} # }}} |
|
156
|
|
|
|
|
|
|
# Special case 'ye'. |
|
157
|
|
|
|
|
|
|
elsif (lc ($_) eq 'ye') { |
|
158
|
1
|
|
|
|
|
5
|
$_ = 'y' . $prefix . substr ($_, -1); |
|
159
|
|
|
|
|
|
|
} |
|
160
|
|
|
|
|
|
|
# We don't want to prefix a non-vowel y. |
|
161
|
|
|
|
|
|
|
elsif (/^y[aeiouy]/i) { # {{{ |
|
162
|
1
|
|
|
|
|
13
|
s/ |
|
163
|
|
|
|
|
|
|
(?:^y)? # Our string starts with y, but we don't |
|
164
|
|
|
|
|
|
|
# want to consider it for every match. |
|
165
|
|
|
|
|
|
|
( # Capture... |
|
166
|
|
|
|
|
|
|
[aeiouy]+ # consecutive vowels |
|
167
|
|
|
|
|
|
|
\B # that do not terminate at a word boundry |
|
168
|
|
|
|
|
|
|
(?![aeiouy]) # that are not followed by another vowel |
|
169
|
|
|
|
|
|
|
| # or |
|
170
|
|
|
|
|
|
|
[aeiouy]* # any consecutive vowels |
|
171
|
|
|
|
|
|
|
[aiouy] # with any non-e vowel following |
|
172
|
|
|
|
|
|
|
\b # that terminates at a word boundry. |
|
173
|
|
|
|
|
|
|
| # or |
|
174
|
|
|
|
|
|
|
[aeiouy]+ # consecutive vowels |
|
175
|
|
|
|
|
|
|
[aeiouy] # with any vowel following |
|
176
|
|
|
|
|
|
|
\b # that terminates at a word boundry. |
|
177
|
|
|
|
|
|
|
) # ...end capture. |
|
178
|
|
|
|
|
|
|
/$prefix$1/gisx; # Add 'op' to what we captured. |
|
179
|
|
|
|
|
|
|
|
|
180
|
1
|
|
|
|
|
3
|
$_ = 'y' . $_; |
|
181
|
|
|
|
|
|
|
} # }}} |
|
182
|
|
|
|
|
|
|
# This regexp captures the "non-solitary, trailing e" vowels. |
|
183
|
|
|
|
|
|
|
else { # {{{ |
|
184
|
31
|
|
|
|
|
226
|
s/ |
|
185
|
|
|
|
|
|
|
( # Capture... |
|
186
|
|
|
|
|
|
|
[aeiouy]+ # consecutive vowels |
|
187
|
|
|
|
|
|
|
\B # that do not terminate at a word boundry |
|
188
|
|
|
|
|
|
|
(?![aeiouy]) # that are not followed by another vowel |
|
189
|
|
|
|
|
|
|
| # or |
|
190
|
|
|
|
|
|
|
[aeiouy]* # any consecutive vowels |
|
191
|
|
|
|
|
|
|
[aiouy] # with any non-e vowel following |
|
192
|
|
|
|
|
|
|
\b # that terminates at a word boundry. |
|
193
|
|
|
|
|
|
|
| # or |
|
194
|
|
|
|
|
|
|
[aeiouy]+ # consecutive vowels |
|
195
|
|
|
|
|
|
|
[aeiouy] # with any vowel following |
|
196
|
|
|
|
|
|
|
\b # that terminates at a word boundry. |
|
197
|
|
|
|
|
|
|
) # ...end capture. |
|
198
|
|
|
|
|
|
|
/$prefix$1/gisx; # Add 'op' to what we captured. |
|
199
|
|
|
|
|
|
|
} # }}} |
|
200
|
|
|
|
|
|
|
|
|
201
|
|
|
|
|
|
|
# The original word was capitalized. |
|
202
|
35
|
100
|
|
|
|
113
|
$_ = ucfirst if $is_capped; |
|
203
|
|
|
|
|
|
|
} |
|
204
|
|
|
|
|
|
|
|
|
205
|
|
|
|
|
|
|
# Return the words as a single space separated string. |
|
206
|
|
|
|
|
|
|
# XXX Again, oof. We don't preserve whitespace. : \ |
|
207
|
17
|
|
|
|
|
100
|
return join ' ', @words; |
|
208
|
|
|
|
|
|
|
} |
|
209
|
|
|
|
|
|
|
|
|
210
|
|
|
|
|
|
|
1; |
|
211
|
|
|
|
|
|
|
__END__ |