File Coverage

blib/lib/NewsExtractor/SiteSpecificExtractor/www_mdnkids_com.pm

Criterion	Covered	Total	%
statement	9	27	33.3
branch	0	8	0.0
condition			n/a
subroutine	3	5	60.0
pod	0	2	0.0
total	12	42	28.5

line	stmt	bran	sub	pod	time	code
1						package NewsExtractor::SiteSpecificExtractor::www_mdnkids_com;
2	1		1		9	use utf8;
	1				3
	1				39
3	1		1		40	use Moo;
	1				3
	1				5
4						extends 'NewsExtractor::GenericExtractor';
5
6	1		1		320	use Importer 'NewsExtractor::TextUtil' => qw(reformat_dateline normalize_whitespace);
	1				2
	1				5
7
8						sub dateline {
9	0		0	0		my ($self) = @_;
10	0					my $el = $self->dom->at('h2 ~ div.col span');
11	0	0				if ($el) {
12	0					my ($ymd) = $el->all_text() =~ m<$([0-9]{4}/[0-9]{1,2}/[0-9]{1,2})$\z>;
13	0					return reformat_dateline( $ymd, '+08:00' );
14						}
15	0					return undef;
16						}
17
18						sub journalist {
19	0		0	0		my ($self) = @_;
20	0					my ($x, $el);
21	0	0				if ($el = $self->dom->at('h2 ~ div.col span')) {
22	0					$x = $el->all_text() =~ s<$[0-9]{4}/[0-9]{1,2}/[0-9]{1,2}$\z><>r;
23	0					$x = normalize_whitespace($x);
24						}
25	0	0				unless ($x) {
26	0					my $t = $self->content_text;
27
28	0					my @regexps = (
29						qr{\A(\S+)／\S+報導\n},
30						qr{\A\S*(報導／\S+\s+攝影／\S+)\n},
31						qr{\A\S*(文／\S+\s+圖／\S+)\n},
32						qr{\A\S*(\S{3})\n},
33						);
34
35	0					for my $re (@regexps) {
36	0					($x) = $t =~ /$re/;
37	0	0				last if $x;
38						}
39						}
40
41	0					return $x;
42						}
43
44						1;