rem Tidy up the tags in every .html file in the current directory and convert
rem them to XHTML for easier downstream processing.
rem
rem The comment and the command must stay on separate lines: "rem" turns the
rem rest of its line into a comment, so a command placed after it never runs.
rem
rem   -ea      runs the JVM with assertions enabled.
rem   --files  per TagSoup's documentation, writes one output file per input
rem            file instead of sending the result to standard output.
rem
rem NOTE(review): the TagSoup jar path is hard-coded to G:\dl\trial - confirm
rem it matches the machine this script runs on.
java -ea -jar G:\dl\trial\tagsoup-1.2.jar --files *.html