lxml, . html5lib, . html, , -, html.
To build a BeautifulSoup tree, using the Beautiful Soup library:
import html5lib
from html5lib import treebuilders
# Parse "mydocument.html" with an html5lib parser configured to use the
# "beautifulsoup" tree builder.
#
# NOTE(review): despite its name, `minidom_document` receives whatever the
# "beautifulsoup" tree builder produces, not an xml.dom.minidom document. The
# name is kept unchanged so that any later code referring to it keeps working.
parser = html5lib.HTMLParser(tree=treebuilders.getTreeBuilder("beautifulsoup"))

# The context manager closes the file as soon as parsing finishes, even if
# parse() raises; previously the handle was opened and never closed.
# NOTE(review): the file is opened in text mode, as before. Opening it in
# binary mode ("rb") would presumably let html5lib detect the encoding itself
# -- confirm against the html5lib documentation before changing the mode.
with open("mydocument.html") as f:
    minidom_document = parser.parse(f)