# Parse the HTML document at html_path exactly once. The parser is given an
# explicit UTF-8 encoding instead of relying on the parser's default encoding
# handling; a second parse with a default HTMLParser() would only produce a
# tree that is immediately thrown away.
html = etree.parse(html_path, etree.HTMLParser(encoding="utf-8"))