"""Parse HTML from standard input and write it to standard output as XML.

The input is parsed with html5lib into a DOM document, which is then
serialized with ``toxml("utf-8")`` and written to stdout.
"""

import sys

import html5lib

# Obtain the DOM tree builder through html5lib's public factory instead of
# reaching into the ``treebuilders.dom`` submodule, which ``import html5lib``
# is not guaranteed to have loaded.
tree = html5lib.treebuilders.getTreeBuilder("dom")
parser = html5lib.html5parser.HTMLParser(tree=tree)

# Prefer the raw byte stream when the interpreter exposes one (Python 3), so
# the parser receives undecoded input rather than text already decoded with
# the locale's encoding.  Falls back to ``sys.stdin`` itself otherwise.
document = parser.parse(getattr(sys.stdin, "buffer", sys.stdin))

# ``toxml("utf-8")`` produces an encoded byte string; on Python 3 that must go
# to the binary layer of stdout, because the text layer rejects bytes.
output = getattr(sys.stdout, "buffer", sys.stdout)
output.write(document.toxml("utf-8"))