File: files.t

package info (click to toggle)
libhtml-clean-perl 0.8-11
  • links: PTS, VCS
  • area: main
  • in suites: lenny, squeeze, wheezy
  • size: 276 kB
  • ctags: 40
  • sloc: perl: 433; makefile: 34
file content (55 lines) | stat: -rw-r--r-- 1,336 bytes parent folder | download | duplicates (9)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
#!/usr/local/bin/perl

# Test script for HTML::Clean that prints its TAP output by hand.
#
# The plan line is printed from a BEGIN block so it appears before
# HTML::Clean is compiled.  If loading the module fails, $loaded is never
# set and the END block reports test 1 as failed.

use strict;
use warnings;
# lynx is an optional helper for this test; a failed exec of it is expected
# on machines without lynx and should not produce a warning.
no warnings 'exec';

# Package variables declared so that any code in this script that refers to
# them as plain globals still compiles under strict.
our ($loaded, $test, $page);

# The plan is test 1 (module load) plus one test per page in the page list
# further down; change "1..9" whenever that list grows or shrinks.
BEGIN { $| = 1; print "1..9\n"; }
END { print "not ok 1\n" unless $loaded; }

use HTML::Clean;
$loaded = 1;
$test = 1;
print "ok 1\n";

# Render $file as plain text with "lynx -nolist -dump".
# Returns the rendered text ('' when lynx printed nothing), or undef when the
# lynx pipe could not be opened, so callers can treat lynx as optional.
sub _lynx_dump {
  my ($file) = @_;
  # Three-arg pipe open with a lexical handle; $file is built from the
  # hard-coded page names below, never from external input.
  open(my $lynx, '-|', "lynx -nolist -dump $file") or return;
  my $text = join('', <$lynx>);
  close($lynx);
  return $text;
}

# One test per sample page: load t/testpages/<page>.html, strip it, and write
# the result to t/testpages/t<page>.html.  Exactly one "ok"/"not ok" line is
# printed per page; a page fails when the HTML::Clean object cannot be
# created or the stripped output cannot be written.
foreach my $page ('hairy', 'altavista', 'microsoft', 'ibm', 'yahoo', 'infoseek', 'itu', 'cnn') {
  $test++;
  my $source   = "t/testpages/$page.html";
  my $stripped = "t/testpages/t$page.html";

  my $h = HTML::Clean->new($source);
  if (!defined($h)) {
    # Without an object there is nothing to strip; report and move on
    # instead of calling a method on undef.
    print "not ok $test\n";
    next;
  }
  # compat changes the 'look' of the page for lynx..
  # $h->compat();
  $h->strip();

  # Buffered write errors only surface at close, so both print and close
  # must succeed for the output to count as saved.
  my $saved = 0;
  if (open(my $out, '>', $stripped)) {
    my $printed = print {$out} ${$h->data()};
    my $closed  = close($out);
    $saved = ($printed && $closed) ? 1 : 0;
  }
  if (!$saved) {
    print "not ok $test\n";
    next;
  }

  # Optional sanity check: if lynx can be run on both files, warn (but do
  # not fail) when the rendered text lengths differ by more than 30
  # characters.
  my $origpage = _lynx_dump($source);
  my $cvtpage  = defined($origpage) ? _lynx_dump($stripped) : undef;
  if (defined($origpage) && defined($cvtpage)
      && abs(length($origpage) - length($cvtpage)) > 30) {
    print STDERR "\nWarning, lynx detects different page sizes for $page " .
        length($origpage) . ", " . length($cvtpage) . "\n";
  }

  print "ok $test\n";
}