File Coverage

blib/lib/NNexus/Index/Dlmf.pm
Criterion Covered Total %
statement 9 54 16.6
branch 0 4 0.0
condition 0 3 0.0
subroutine 3 8 37.5
pod 4 5 80.0
total 16 74 21.6


line stmt bran cond sub pod time code
1             # /=====================================================================\ #
2             # | NNexus Autolinker | #
3             # | Indexing Plug-in, DLMF.nist.gov domain | #
4             # |=====================================================================| #
5             # | Part of the Planetary project: http://trac.mathweb.org/planetary | #
6             # | Research software, produced as part of work done by: | #
7             # | the KWARC group at Jacobs University | #
8             # | Copyright (c) 2012 | #
9             # | Released under the MIT License (MIT) | #
10             # |---------------------------------------------------------------------| #
11             # | Adapted from the original NNexus code by | #
12             # | James Gardner and Aaron Krowne | #
13             # |---------------------------------------------------------------------| #
14             # | Deyan Ginev #_# | #
15             # | http://kwarc.info/people/dginev (o o) | #
16             # \=========================================================ooo==U==ooo=/ #
17             package NNexus::Index::Dlmf;
18 1     1   16749 use warnings;
  1         1  
  1         30  
19 1     1   3 use strict;
  1         1  
  1         29  
20 1     1   4 use base qw(NNexus::Index::Template);
  1         0  
  1         356  
21              
22 0     0 1   sub domain_root { "http://dlmf.nist.gov" }
23 0     0 0   sub domain_base { "http://dlmf.nist.gov/" }
24 0     0 1   sub depth_limit { 100 }
25              
26             sub candidate_links {
27 0     0 1   my ($self) = @_;
28 0           my $url = $self->current_url;
29 0           my $dom = $self->current_dom;
30             # We only care about /idx and /not pages (index and notations)
31 0           my @next_jobs = $dom->find('a')->each;
32 0           @next_jobs = map {s/^(\.\.\/)?\.\///; $self->domain_base . $_; } grep {/\.\/(idx|not)(\/\w?)?$/} map { $_->{href}} @next_jobs;
  0            
  0            
  0            
  0            
33 0           \@next_jobs;
34             }
35              
36             sub index_page {
37 0     0 1   my ($self) = @_;
38 0           my $url = $self->current_url;
39 0           my $dom = $self->current_dom;
40 0           my $name;
41 0           my $category = '33-XX'; # Special functions? always?
42 0           my (@def_links,@def_names);
43 0 0         if ($url =~ /\/idx/) {
    0          
44             # DLMF Index page
45 0           my $def_spans = $dom->find('div > ul > li > span > span[class="ltx_text ltx_font_bold"]');
46 0           @def_links = map {s/^(\.\.\/)?\.\///; $self->domain_base . $_; } map {$_->{href}} $def_spans->pluck('a')->each;
  0            
  0            
  0            
47 0           @def_names = map {
48 0           my $t = $_->children->first->content;
49 0           $t =~ s/\(.+\)//g;
50 0           $t =~ s/\:(.*)$//;
51 0           $t;}
52             $def_spans->pluck('parent')->pluck('parent')->each;
53             } elsif ($url =~ /\/not/) {
54 0           my $def_anchors = $dom->find('a[class="ltx_ref"]');
55 0           @def_links = map {s/^(.+)\.\///; $self->domain_base . $_; } map {$_->{href}} $def_anchors->each;
  0            
  0            
  0            
56 0           @def_names = $def_anchors->pluck('parent')->pluck('content')->each;
57 0           @def_names = map {my ($name) = split(';',$_); $name;} @def_names;
  0            
  0            
58             # DLMF Notation page
59             } else {
60             # Default is empty!
61 0           return [];
62             }
63              
64 0           my $results=[];
65 0   0       while (@def_links && @def_names) {
66 0           my ($name,$link)=(shift @def_names, shift @def_links);
67 0           push @$results, {url=>$link,concept=>$name,categories=>[$category]};
68             }
69 0           return $results;
70             }
71              
72             1;
73             __END__