#!/usr/bin/perl
use
5.010;
use
Getopt::Long 0
qw(:config permute bundling no_auto_abbrev)
;
my
%options
;
Getopt::Long::GetOptions(\
%options
,
'markup|m=s'
,
'polyglot=i'
,
'doctype=s'
,
'charset=s'
,
'quote_attributes=s'
,
'voids=s'
,
'start_tags=s'
,
'end_tags=s'
,
'refs=s'
,
'indent_string=s'
,
);
my
$input
=
shift
//
'-'
;
my
$output
=
shift
//
'-'
;
my
$parser
= HTML::HTML5::Parser->new;
my
$dom
= (
$input
eq
'-'
)
?
$parser
->parse_string(
do
{
local
$/ = <STDIN> })
:
$parser
->parse_file(
$input
);
$HTML::HTML5::Sanity::FIX_LANG_ATTRIBUTES
= 2;
my
$fixed_dom
= fix_document(
$dom
);
XML::LibXML::PrettyPrint
->new_for_html(
indent_string
=> (
delete
$options
{indent_string} //
"\t"
))
->pretty_print(
$fixed_dom
);
my
$writer
= HTML::HTML5::Writer
->new(
%options
);
if
(
$output
eq
'-'
)
{
say
$writer
->document(
$fixed_dom
);
}
else
{
open
my
(
$fh
),
'>:encoding(UTF-8)'
,
$output
;
say
$fh
$writer
->document(
$fixed_dom
);
close
$fh
;
}