#!/usr/bin/perl
# Parses an inline HTML snippet with HTML::TreeBuilder and prints the text
# found below <body>, one output line per text-bearing element or text node.
use strict;
use warnings;
use utf8;

use HTML::TreeBuilder;
use Data::Dumper;

# "use utf8" turns the non-ASCII literals below into character strings, so
# STDOUT needs an explicit encoding layer to emit them as valid UTF-8.
binmode(STDOUT, ':encoding(UTF-8)');

my $html = qq~ Scanner

Überschrift H1

Überschrift H2

Überschrift H3

Überschrift H4

FETT

SCHIEF

UNTERSTRICHEN

Roter Text

Blauer Text

ObenlinksObenrechts
UntenlinksUntenrechts

Dolor dignissimos voluptas debitis neque quas. Debitis corporis libero consectetur odio molestias eum sunt.

~;

my $tree = HTML::TreeBuilder->new();
$tree->parse_content($html);

# Rebless the root as a plain element, as the original script did.
$tree->elementify();

# In scalar context find_by_tag_name() returns the first matching element
# in pre-order, or undef when there is none.
my $body = $tree->find_by_tag_name('body')
    or die "No <body> element found in parsed document\n";

print_text($_) for $body->content_list();

$tree->delete;

# print_text($node)
#
# Prints the text carried by $node, followed by a newline.
#
#   $node - one item from content_list(): either an element object or a
#           plain (unblessed) string representing a text node.
#
# Rules:
#   * A text node is printed as-is, unless it contains only whitespace.
#   * An element without content prints nothing.
#   * An element whose first child is a text node is printed in one piece
#     via as_text(), which also includes the text of nested elements.
#   * Any other element is descended into, applying the same rules to each
#     child, so that nested structures are not silently skipped.
#
# Returns nothing.
sub print_text {
    my ($node) = @_;

    # Text nodes are plain strings; calling element methods on them dies.
    if (!ref $node) {
        print $node, "\n" if $node =~ /\S/;
        return;
    }

    return if $node->is_empty();

    my @children = $node->content_list();

    if (!ref $children[0]) {
        print $node->as_text(), "\n";
        return;
    }

    print_text($_) for @children;

    return;
}