You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
56 lines
1.5 KiB
56 lines
1.5 KiB
#!/usr/bin/perl
|
|
|
|
use Getopt::Long;
|
|
|
|
GetOptions( 'map=s' => \%mapping ) || die "Wrong options\n";
|
|
|
|
for $file (@ARGV) {
|
|
|
|
open(FILE, "$file") || die "File not found: $file\n";
|
|
|
|
$indir = 0;
|
|
|
|
while (<FILE>) {
|
|
|
|
if (/\<H1\>\<A NAME=\".*\" HREF=\".*\"\>(.*)\<\/A\>\<\/H1\>/) {
|
|
$index = $mapping{$1};
|
|
# print "Index: $1 => $index\n";
|
|
} elsif (/\<DIR\>/) {
|
|
$indir = 1;
|
|
} elsif (/\<\/DIR>/) {
|
|
$indir = 0;
|
|
} elsif ($indir) {
|
|
if (/\<LI\>\<A HREF=\"([^\"]*)\"\>([^<]*)\<\/A\>/) {
|
|
unless ($lastindex eq $index) {
|
|
if ($lastindex) {
|
|
print "</$lastindex>\n";
|
|
}
|
|
print "<$index>\n";
|
|
$lastindex = $index;
|
|
}
|
|
$name = dehtml($2);
|
|
$url = $1;
|
|
print STDOUT "<entry name=\"$name\" url=\"$url\"/>\n";
|
|
}
|
|
}
|
|
}
|
|
|
|
close(FILE);
|
|
}
|
|
|
|
if ($lastindex) {
|
|
print "</$lastindex>\n";
|
|
}
|
|
|
|
sub dehtml
|
|
{
|
|
my ( $str ) = @_;
|
|
|
|
$str =~ s/\<CODE\>//g;
|
|
$str =~ s/\<\/CODE\>//g;
|
|
$str =~ s/\<TT\>//g;
|
|
$str =~ s/\<\/TT\>//g;
|
|
|
|
return $str;
|
|
}
|