package Sources::HtmlParser;
use strict;
use warnings;
use base 'HTML::Parser';
# Parse a complete HTML document and collect its text content.
#
# Clears the accumulated text buffer, feeds $text through the inherited
# parse() method, then signals end-of-document so that no text stays
# buffered inside the parser.
#
# Parameters:
#   $text - the HTML source to parse, passed as one string.
#
# Returns whatever the inherited parse() returned.
sub parseText
{
    my ($self, $text) = @_;

    # Start from an empty buffer so repeated calls do not accumulate text.
    $self->{mytext} = "";

    my $result = $self->parse($text);

    # HTML::Parser may hold back trailing text until eof() is signalled.
    # Without this the end of the document can be missing from the buffer,
    # and the parser would still be mid-document on the next call.
    $self->eof;

    return $result;
}
# Text callback: appends one text segment to the buffer kept in
# $self->{mytext}.
#
# Parameters:
#   $origtext - the text segment to append.
#   $is_cdata - accepted as the third argument but not used here.
#
# Always returns 1.
sub text
{
    my $self = shift;
    my ($segment) = @_;

    $self->{mytext} .= $segment;

    return 1;
}
# Accessor for the text collected so far.
#
# Returns the current value of $self->{mytext}. That is undef if nothing
# has stored a value under that key yet.
sub get_text
{
    my $self = shift;

    my $collected = $self->{mytext};
    return $collected;
}
1;
# Replace the markup in $httpbody with the plain text collected by the parser.
# NOTE(review): these statements follow the module's terminating `1;`, and
# $httpbody is not declared anywhere in the visible source -- presumably it is
# supplied by the surrounding script. Under `use strict` it must be declared
# before this point. TODO confirm.
my $hp = Sources::HtmlParser->new();
# Run the HTML through the parser; the text it collects is read back below.
$hp->parseText($httpbody);
# Overwrite $httpbody with the collected text, passed through decode_entities.
# NOTE(review): HTML::Entities is not loaded explicitly in the visible source;
# presumably HTML::Parser pulls it in -- verify.
$httpbody = HTML::Entities::decode_entities($hp->get_text);
# NOTE(review): the search pattern here is empty. Perl treats an empty pattern
# as "reuse the last successfully matched regex", so the effect depends on
# whatever matched earlier. The intended pattern appears to have been lost --
# TODO restore it.
$httpbody =~ s///gms;