File: hlc

package info (click to toggle)
libhtml-parser-perl 3.69-2
  • links: PTS, VCS
  • area: main
  • in suites: wheezy
  • size: 672 kB
  • sloc: perl: 2,022; ansic: 1,972; makefile: 6
file content (24 lines) | stat: -rwxr-xr-x 710 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
#!/usr/bin/perl -w

# This script will assume that the first command line argument
# is a file containing HTML, and return a version
# where all the tags are converted to lowercase.

use strict;
use HTML::Parser ();

HTML::Parser->new(start_h   => [ \&start_lc, "tokenpos, text" ],
	          end_h     => [ sub { print lc shift }, "text" ],
                  default_h => [ sub { print shift }, "text" ],
                 )
    ->parse_file(shift) || die "Can't open file: $!\n";

sub start_lc {
    my($tpos, $text) = @_;
    for (my $i = 0; $i < @$tpos; $i += 2) {
	next if $i && ($i/2) % 2 == 0;  # skip attribute values
	$_ = lc $_ for substr($text, $tpos->[$i], $tpos->[$i+1]);
    }
    print $text;
}