) {
# Strip the trailing newline from the current input line ($_).
chomp;
# State 0: the heading line has not been seen yet.
if($state == 0) {
    # Drop the first height="1%" attribute (with its leading whitespace)
    # from the line before trying to match the heading.
    s/\sheight=\"1\%\"//;
    # Heading line: everything before the last </b> becomes the name, and
    # everything between that </b> and the last </font becomes the author.
    if(/(.*)<\/b>(.*)<\/font/) {
        my ($name,$author) = ($1,$2);
        # The greedy capture can still contain an earlier </b>; cut the name
        # there first and trim afterwards, so no whitespace that preceded
        # the tag is left dangling in front of the " - " separator.
        $name =~ s/<\/b>.*//;
        $name =~ s/\s+$//;
        $author =~ s/\s+$//;
        my $title = $name." - ".$author;
        # Underline made of one dash per title character.
        my $underline = "-" x length($title);
        print OUT " $title\n";
        print OUT " $underline\n\n";
        # Heading written: switch to state 1 so the text-handling branch
        # takes over, starting with this same line.
        $state = 1;
    }
}
# States 1 and 2: extract text from the current line ($_), convert HTML
# entities and italic markup, and write the result to OUT.
if($state == 1 || $state == 2) {
    my $text = undef;
    # Choose the text to emit; each later match overrides the earlier one.
    # A bare </p> yields a single space.
    if(/<\/p>/) { $text = " "; }
    if(/(.+)<\/p>/) {
        $text = $1;
    }
    # NOTE(review): as found, this matches "anything followed by a space";
    # the pattern may originally have named an entity or tag - confirm.
    if(/(.+) /) {
        $text = $1."";
    }
    if($text) {
        # Note - Nokia 3650 uses ISO-8859-1
        # As such, we convert accents into that
        # Named entities are matched by their entity text (e.g. &agrave;),
        # which is what appears in HTML input.
        $text =~ s/\&agrave\;/\xe0/g;
        $text =~ s/\&egrave\;/\xe8/g;
        $text =~ s/\&igrave\;/\xec/g;
        $text =~ s/\&ograve\;/\xf2/g;
        $text =~ s/\&aacute\;/\xe1/g;
        $text =~ s/\&eacute\;/\xe9/g;
        $text =~ s/\&iacute\;/\xed/g;
        $text =~ s/\&oacute\;/\xf3/g;
        $text =~ s/\&ntilde\;/\xf1/g;
        $text =~ s/\&iquest\;/\xbf/g;
        $text =~ s/\&iexcl\;/\xa1/g;
        $text =~ s/\&quot\;/"/g;
        # Numeric references 145/146/150 become plain ASCII characters.
        $text =~ s/\&\#145\;/\`/g;
        $text =~ s/\&\#146\;/'/g;
        $text =~ s/\&\#150\;/-/g;
        # &amp; is decoded last so a freshly produced "&" is not re-read
        # as the start of another entity.
        $text =~ s/\&amp\;/\&/g;
        # Italic handling: closing tags are replaced or turned into
        # _underscore_ emphasis, then empty "_ _" pairs are removed.
        # NOTE(review): as written, the first substitution removes every
        # </i>, so the next two can never match; these patterns look as if
        # they lost an opening <i> - confirm against the original script.
        $text =~ s/<\/i>\s?/ /gi;
        $text =~ s/(.*?)<\/i>/_$1_/gi;
        $text =~ s/^(.*?)<\/i>/_$1_/gi;
        $text =~ s/_ _//g;
        # Drop the last closing </font> tag, keeping the text before it.
        $text =~ s/(.*)<\/font>/$1/;
        # The substitutions may have emptied the text; print only if
        # something is left.
        if($text) {
            print OUT $text."\n\n";
        } else {
            # Debug aid, intentionally disabled:
            #print "** ";
        }
        #$text =~ s/^(.{15}).*/$1/;
        #print "$text\n";
    } else {
        # Debug aid, intentionally disabled:
        #print "*** ".$_."\n";
    }
    # The first line handled in state 1 gets one extra blank line, then
    # processing continues in state 2.
    if($state == 1) {
        print OUT "\n";
        $state = 2;
    }
    # A closing </table> moves to state 3, which this branch no longer
    # handles.
    if(/<\/table\>/) {
        $state = 3;
    }
}
}
# Release both handles. Buffered write errors only surface when the output
# handle is closed, so report a failure instead of silently leaving a
# truncated file behind.
close IN;
close OUT or warn "close of output failed: $!";
|