html2xhtml
parse HTML reliably
# Install the libhtml-html5-parser-perl package with apt.
# update + install + cleanup share one layer, so the package index is always
# fresh at install time and the downloaded lists never persist in the image.
# NOTE(review): recommended packages are still installed, as in the original;
# consider --no-install-recommends once confirmed they are not needed.
RUN apt-get update && \
    apt-get install -y libhtml-html5-parser-perl && \
    rm -rf /var/lib/apt/lists/*
# Install the libhtml-html5-parser-perl package with apt.
# update + install + cleanup share one layer, so the package index is always
# fresh at install time and the downloaded lists never persist in the image.
# NOTE(review): recommended packages are still installed, as in the original;
# consider --no-install-recommends once confirmed they are not needed.
RUN apt-get update && \
    apt-get install -y libhtml-html5-parser-perl && \
    rm -rf /var/lib/apt/lists/*
# Install the perl-HTML-HTML5-Parser package with dnf.
# The dnf caches are cleaned in the same layer as the install; cleaning them
# in a later RUN would not shrink the image.
RUN dnf install -y perl-HTML-HTML5-Parser && \
    dnf clean all
# Install the libhtml-html5-parser-perl package with apt.
# update + install + cleanup share one layer, so the package index is always
# fresh at install time and the downloaded lists never persist in the image.
# NOTE(review): recommended packages are still installed, as in the original;
# consider --no-install-recommends once confirmed they are not needed.
RUN apt-get update && \
    apt-get install -y libhtml-html5-parser-perl && \
    rm -rf /var/lib/apt/lists/*