1 <?xml version="1.0" encoding="ascii"?>
2 <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
3 "DTD/xhtml1-transitional.dtd">
4 <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
6 <title>lxml.html.html5parser.HTMLParser</title>
7 <link rel="stylesheet" href="epydoc.css" type="text/css" />
8 <script type="text/javascript" src="epydoc.js"></script>
11 <body bgcolor="white" text="black" link="blue" vlink="#204080"
13 <!-- ==================== NAVIGATION BAR ==================== -->
14 <table class="navbar" border="0" width="100%" cellpadding="0"
15 bgcolor="#a0c0ff" cellspacing="0">
18 <th> <a
19 href="lxml-module.html">Home</a> </th>
22 <th> <a
23 href="module-tree.html">Trees</a> </th>
26 <th> <a
27 href="identifier-index.html">Indices</a> </th>
30 <th> <a
31 href="help.html">Help</a> </th>
33 <!-- Project homepage -->
34 <th class="navbar" align="right" width="100%">
35 <table border="0" cellpadding="0" cellspacing="0">
36 <tr><th class="navbar" align="center"
37 ><a class="navbar" target="_top" href="/">lxml API</a></th>
41 <table width="100%" cellpadding="0" cellspacing="0">
44 <span class="breadcrumbs">
45 <a href="lxml-module.html">Package lxml</a> ::
46 <a href="lxml.html-module.html">Package html</a> ::
47 <a href="lxml.html.html5parser-module.html">Module html5parser</a> ::
52 <table cellpadding="0" cellspacing="0">
53 <!-- hide/show private -->
54 <tr><td align="right"><span class="options">[<a href="javascript:void(0);" class="privatelink"
55 onclick="toggle_private();">hide private</a>]</span></td></tr>
56 <tr><td align="right"><span class="options"
57 >[<a href="frames.html" target="_top">frames</a
58 >] | [<a href="lxml.html.html5parser.HTMLParser-class.html"
59 target="_top">no frames</a>]</span></td></tr>
64 <!-- ==================== CLASS DESCRIPTION ==================== -->
65 <h1 class="epydoc">Class HTMLParser</h1><p class="nomargin-top"><span class="codelink"><a href="lxml.html.html5parser-pysrc.html#HTMLParser">source code</a></span></p>
66 <pre class="base-tree">
69 html5lib.html5parser.HTMLParser --+
71 <strong class="uidshort">HTMLParser</strong>
75 An html5lib HTML parser with lxml as tree.
77 <!-- ==================== INSTANCE METHODS ==================== -->
78 <a name="section-InstanceMethods"></a>
79 <table class="summary" border="1" cellpadding="3"
80 cellspacing="0" width="100%" bgcolor="white">
81 <tr bgcolor="#70b0f0" class="table-header">
82 <td colspan="2" class="table-header">
83 <table border="0" cellpadding="0" cellspacing="0" width="100%">
85 <td align="left"><span class="table-header">Instance Methods</span></td>
86 <td align="right" valign="top"
87 ><span class="options">[<a href="#section-InstanceMethods"
88 class="privatelink" onclick="toggle_private();"
89 >hide private</a>]</span></td>
95 <td width="15%" align="right" valign="top" class="summary">
96 <span class="summary-type"> </span>
97 </td><td class="summary">
98 <table width="100%" cellpadding="0" cellspacing="0" border="0">
100 <td><span class="summary-sig"><a href="lxml.html.html5parser.HTMLParser-class.html#__init__" class="summary-sig-name">__init__</a>(<span class="summary-sig-arg">self</span>,
101 <span class="summary-sig-arg">strict</span>=<span class="summary-sig-default">False</span>,
102 <span class="summary-sig-arg">**kwargs</span>)</span><br />
103 strict - raise an exception when a parse error is encountered</td>
104 <td align="right" valign="top">
105 <span class="codelink"><a href="lxml.html.html5parser-pysrc.html#HTMLParser.__init__">source code</a></span>
114 <td colspan="2" class="summary">
115 <p class="indent-wrapped-lines"><b>Inherited from <code>html5lib.html5parser.HTMLParser</code></b>:
116 <code>adjustForeignAttributes</code>,
117 <code>adjustMathMLAttributes</code>,
118 <code>adjustSVGAttributes</code>,
119 <code>isHTMLIntegrationPoint</code>,
120 <code>isMathMLTextIntegrationPoint</code>,
121 <code>mainLoop</code>,
122 <code>normalizeToken</code>,
123 <code>normalizedTokens</code>,
125 <code>parseError</code>,
126 <code>parseFragment</code>,
127 <code>parseRCDataRawtext</code>,
128 <code>reparseTokenNormal</code>,
130 <code>resetInsertionMode</code>
132 <div class="private"> <p class="indent-wrapped-lines"><b>Inherited from <code>html5lib.html5parser.HTMLParser</code></b> (private):
135 <p class="indent-wrapped-lines"><b>Inherited from <code>object</code></b>:
136 <code>__delattr__</code>,
137 <code>__format__</code>,
138 <code>__getattribute__</code>,
139 <code>__hash__</code>,
140 <code>__new__</code>,
141 <code>__reduce__</code>,
142 <code>__reduce_ex__</code>,
143 <code>__repr__</code>,
144 <code>__setattr__</code>,
145 <code>__sizeof__</code>,
146 <code>__str__</code>,
147 <code>__subclasshook__</code>
152 <!-- ==================== PROPERTIES ==================== -->
153 <a name="section-Properties"></a>
154 <table class="summary" border="1" cellpadding="3"
155 cellspacing="0" width="100%" bgcolor="white">
156 <tr bgcolor="#70b0f0" class="table-header">
157 <td colspan="2" class="table-header">
158 <table border="0" cellpadding="0" cellspacing="0" width="100%">
160 <td align="left"><span class="table-header">Properties</span></td>
161 <td align="right" valign="top"
162 ><span class="options">[<a href="#section-Properties"
163 class="privatelink" onclick="toggle_private();"
164 >hide private</a>]</span></td>
170 <td colspan="2" class="summary">
171 <p class="indent-wrapped-lines"><b>Inherited from <code>html5lib.html5parser.HTMLParser</code></b>:
172 <code>documentEncoding</code>
174 <p class="indent-wrapped-lines"><b>Inherited from <code>object</code></b>:
175 <code>__class__</code>
180 <!-- ==================== METHOD DETAILS ==================== -->
181 <a name="section-MethodDetails"></a>
182 <table class="details" border="1" cellpadding="3"
183 cellspacing="0" width="100%" bgcolor="white">
184 <tr bgcolor="#70b0f0" class="table-header">
185 <td colspan="2" class="table-header">
186 <table border="0" cellpadding="0" cellspacing="0" width="100%">
188 <td align="left"><span class="table-header">Method Details</span></td>
189 <td align="right" valign="top"
190 ><span class="options">[<a href="#section-MethodDetails"
191 class="privatelink" onclick="toggle_private();"
192 >hide private</a>]</span></td>
198 <a name="__init__"></a>
200 <table class="details" border="1" cellpadding="3"
201 cellspacing="0" width="100%" bgcolor="white">
203 <table width="100%" cellpadding="0" cellspacing="0" border="0">
204 <tr valign="top"><td>
205 <h3 class="epydoc"><span class="sig"><span class="sig-name">__init__</span>(<span class="sig-arg">self</span>,
206 <span class="sig-arg">strict</span>=<span class="sig-default">False</span>,
207 <span class="sig-arg">**kwargs</span>)</span>
208 <br /><em class="fname">(Constructor)</em>
210 </td><td align="right" valign="top"
211 ><span class="codelink"><a href="lxml.html.html5parser-pysrc.html#HTMLParser.__init__">source code</a></span>
215 <p>strict - raise an exception when a parse error is encountered</p>
216 <p>tree - a treebuilder class controlling the type of tree that will be
217 returned. Built-in treebuilders can be accessed through
218 html5lib.treebuilders.getTreeBuilder(treeType)</p>
222 <dd><em class="note">(inherited documentation)</em></dd>
228 <!-- ==================== NAVIGATION BAR ==================== -->
229 <table class="navbar" border="0" width="100%" cellpadding="0"
230 bgcolor="#a0c0ff" cellspacing="0">
233 <th> <a
234 href="lxml-module.html">Home</a> </th>
237 <th> <a
238 href="module-tree.html">Trees</a> </th>
241 <th> <a
242 href="identifier-index.html">Indices</a> </th>
245 <th> <a
246 href="help.html">Help</a> </th>
248 <!-- Project homepage -->
249 <th class="navbar" align="right" width="100%">
250 <table border="0" cellpadding="0" cellspacing="0">
251 <tr><th class="navbar" align="center"
252 ><a class="navbar" target="_top" href="/">lxml API</a></th>
256 <table border="0" cellpadding="0" cellspacing="0" width="100%">
258 <td align="left" class="footer">
259 Generated by Epydoc 3.0.1
260 on Wed Jan 29 12:26:21 2020
262 <td align="right" class="footer">
263 <a target="mainFrame" href="http://epydoc.sourceforge.net"
264 >http://epydoc.sourceforge.net</a>
269 <script type="text/javascript">
271 // Private objects are initially displayed (because if
272 // javascript is turned off then we want them to be
273 // visible); but by default, we want to hide them. So hide
274 // them unless we have a cookie that says to show them.