""" HTML parsing library based on the WHATWG "HTML5" specification. The parser is designed to be compatible with existing HTML found in the wild and implements well-defined error recovery that is largely compatible with modern desktop web browsers. Example usage: import html5lib f = open("my_document.html") tree = html5lib.parse(f) """ from __future__ import absolute_import, division, unicode_literals from .html5parser import HTMLParser, parse, parseFragment from .treebuilders import getTreeBuilder from .treewalkers import getTreeWalker from .serializer import serialize __all__ = ["HTMLParser", "parse", "parseFragment", "getTreeBuilder", "getTreeWalker", "serialize"] # this has to be at the top level, see how setup.py parses this __version__ = "1.0b10"
| Name | Type | Size | Permission | Actions |
|---|---|---|---|---|
| `__pycache__` | Folder | | 0755 | |
| `_trie` | Folder | | 0755 | |
| `filters` | Folder | | 0755 | |
| `treeadapters` | Folder | | 0755 | |
| `treebuilders` | Folder | | 0755 | |
| `treewalkers` | Folder | | 0755 | |
| `__init__.py` | File | 780 B | 0644 | |
| `_ihatexml.py` | File | 16.31 KB | 0644 | |
| `_inputstream.py` | File | 31.77 KB | 0644 | |
| `_tokenizer.py` | File | 74.79 KB | 0644 | |
| `_utils.py` | File | 4 KB | 0644 | |
| `constants.py` | File | 81.43 KB | 0644 | |
| `html5parser.py` | File | 114.42 KB | 0644 | |
| `serializer.py` | File | 13.84 KB | 0644 | |