mirror of
https://github.com/moparisthebest/SickRage
synced 2024-11-16 22:35:03 -05:00
18 lines
535 B
Python
18 lines
535 B
Python
"""
HTML parsing library based on the WHATWG "HTML5"
specification. The parser is designed to be compatible with existing
HTML found in the wild and implements well-defined error recovery that
is largely compatible with modern desktop web browsers.

Example usage::

    import html5lib
    with open("my_document.html", "rb") as f:
        tree = html5lib.parse(f)
"""

__version__ = "0.95-dev"

# Re-export the public entry points so callers can write ``html5lib.parse``
# rather than reaching into the submodules.  Explicit relative imports
# (PEP 328) are used so the sibling modules are always the ones picked up,
# even if a same-named top-level module exists on ``sys.path``.
from .html5parser import HTMLParser, parse, parseFragment
from .treebuilders import getTreeBuilder
from .treewalkers import getTreeWalker
from .serializer import serialize