a502abe15cfce7562befffadcd227ba55ca396d1
[platform/upstream/python-lxml.git] / doc / html / api / lxml.html.soupparser-pysrc.html
1 <?xml version="1.0" encoding="ascii"?>
2 <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
3           "DTD/xhtml1-transitional.dtd">
4 <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
5 <head>
6   <title>lxml.html.soupparser</title>
7   <link rel="stylesheet" href="epydoc.css" type="text/css" />
8   <script type="text/javascript" src="epydoc.js"></script>
9 </head>
10
11 <body bgcolor="white" text="black" link="blue" vlink="#204080"
12       alink="#204080">
13 <!-- ==================== NAVIGATION BAR ==================== -->
14 <table class="navbar" border="0" width="100%" cellpadding="0"
15        bgcolor="#a0c0ff" cellspacing="0">
16   <tr valign="middle">
17   <!-- Home link -->
18       <th>&nbsp;&nbsp;&nbsp;<a
19         href="lxml-module.html">Home</a>&nbsp;&nbsp;&nbsp;</th>
20
21   <!-- Tree link -->
22       <th>&nbsp;&nbsp;&nbsp;<a
23         href="module-tree.html">Trees</a>&nbsp;&nbsp;&nbsp;</th>
24
25   <!-- Index link -->
26       <th>&nbsp;&nbsp;&nbsp;<a
27         href="identifier-index.html">Indices</a>&nbsp;&nbsp;&nbsp;</th>
28
29   <!-- Help link -->
30       <th>&nbsp;&nbsp;&nbsp;<a
31         href="help.html">Help</a>&nbsp;&nbsp;&nbsp;</th>
32
33   <!-- Project homepage -->
34       <th class="navbar" align="right" width="100%">
35         <table border="0" cellpadding="0" cellspacing="0">
36           <tr><th class="navbar" align="center"
37             ><a class="navbar" target="_top" href="/">lxml API</a></th>
38           </tr></table></th>
39   </tr>
40 </table>
41 <table width="100%" cellpadding="0" cellspacing="0">
42   <tr valign="top">
43     <td width="100%">
44       <span class="breadcrumbs">
45         <a href="lxml-module.html">Package&nbsp;lxml</a> ::
46         <a href="lxml.html-module.html">Package&nbsp;html</a> ::
47         Module&nbsp;soupparser
48       </span>
49     </td>
50     <td>
51       <table cellpadding="0" cellspacing="0">
52         <!-- hide/show private -->
53         <tr><td align="right"><span class="options">[<a href="javascript:void(0);" class="privatelink"
54     onclick="toggle_private();">hide&nbsp;private</a>]</span></td></tr>
55         <tr><td align="right"><span class="options"
56             >[<a href="frames.html" target="_top">frames</a
57             >]&nbsp;|&nbsp;<a href="lxml.html.soupparser-pysrc.html"
58             target="_top">no&nbsp;frames</a>]</span></td></tr>
59       </table>
60     </td>
61   </tr>
62 </table>
63 <h1 class="epydoc">Source Code for <a href="lxml.html.soupparser-module.html">Module lxml.html.soupparser</a></h1>
64 <pre class="py-src">
65 <a name="L1"></a><tt class="py-lineno">  1</tt>  <tt class="py-line"><tt id="link-0" class="py-name" targets="Variable lxml.html.ElementSoup.__doc__=lxml.html.ElementSoup-module.html#__doc__,Variable lxml.html.soupparser.__doc__=lxml.html.soupparser-module.html#__doc__"><a title="lxml.html.ElementSoup.__doc__
66 lxml.html.soupparser.__doc__" class="py-name" href="#" onclick="return doclink('link-0', '__doc__', 'link-0');">__doc__</a></tt> <tt class="py-op">=</tt> <tt class="py-docstring">"""External interface to the BeautifulSoup HTML parser.</tt> </tt>
67 <a name="L2"></a><tt class="py-lineno">  2</tt>  <tt class="py-line"><tt class="py-docstring">"""</tt> </tt>
68 <a name="L3"></a><tt class="py-lineno">  3</tt>  <tt class="py-line"> </tt>
69 <a name="L4"></a><tt class="py-lineno">  4</tt>  <tt class="py-line"><tt class="py-name">__all__</tt> <tt class="py-op">=</tt> <tt class="py-op">[</tt><tt class="py-string">"fromstring"</tt><tt class="py-op">,</tt> <tt class="py-string">"parse"</tt><tt class="py-op">,</tt> <tt class="py-string">"convert_tree"</tt><tt class="py-op">]</tt> </tt>
70 <a name="L5"></a><tt class="py-lineno">  5</tt>  <tt class="py-line"> </tt>
71 <a name="L6"></a><tt class="py-lineno">  6</tt>  <tt class="py-line"><tt class="py-keyword">from</tt> <tt id="link-1" class="py-name" targets="Package lxml=lxml-module.html"><a title="lxml" class="py-name" href="#" onclick="return doclink('link-1', 'lxml', 'link-1');">lxml</a></tt> <tt class="py-keyword">import</tt> <tt id="link-2" class="py-name" targets="Module lxml.etree=lxml.etree-module.html,Variable lxml.sax.ElementTreeContentHandler.etree=lxml.sax.ElementTreeContentHandler-class.html#etree,Variable lxml.tests.test_elementtree.CElementTreeTestCase.etree=lxml.tests.test_elementtree.CElementTreeTestCase-class.html#etree,Variable lxml.tests.test_elementtree.ETreeTestCaseBase.etree=lxml.tests.test_elementtree.ETreeTestCaseBase-class.html#etree,Variable lxml.tests.test_io.IOTestCaseBase.etree=lxml.tests.test_io.IOTestCaseBase-class.html#etree"><a title="lxml.etree
72 lxml.sax.ElementTreeContentHandler.etree
73 lxml.tests.test_elementtree.CElementTreeTestCase.etree
74 lxml.tests.test_elementtree.ETreeTestCaseBase.etree
75 lxml.tests.test_io.IOTestCaseBase.etree" class="py-name" href="#" onclick="return doclink('link-2', 'etree', 'link-2');">etree</a></tt><tt class="py-op">,</tt> <tt id="link-3" class="py-name" targets="Package lxml.html=lxml.html-module.html,Method lxml.html.diff.href_token.html()=lxml.html.diff.href_token-class.html#html,Method lxml.html.diff.tag_token.html()=lxml.html.diff.tag_token-class.html#html,Method lxml.html.diff.token.html()=lxml.html.diff.token-class.html#html"><a title="lxml.html
76 lxml.html.diff.href_token.html
77 lxml.html.diff.tag_token.html
78 lxml.html.diff.token.html" class="py-name" href="#" onclick="return doclink('link-3', 'html', 'link-3');">html</a></tt> </tt>
79 <a name="L7"></a><tt class="py-lineno">  7</tt>  <tt class="py-line"><tt class="py-keyword">from</tt> <tt class="py-name">BeautifulSoup</tt> <tt class="py-keyword">import</tt> \ </tt>
80 <a name="L8"></a><tt class="py-lineno">  8</tt>  <tt class="py-line">     <tt class="py-name">BeautifulSoup</tt><tt class="py-op">,</tt> <tt class="py-name">Tag</tt><tt class="py-op">,</tt> <tt id="link-4" class="py-name" targets="Function lxml.etree.Comment()=lxml.etree-module.html#Comment"><a title="lxml.etree.Comment" class="py-name" href="#" onclick="return doclink('link-4', 'Comment', 'link-4');">Comment</a></tt><tt class="py-op">,</tt> <tt class="py-name">ProcessingInstruction</tt><tt class="py-op">,</tt> <tt class="py-name">NavigableString</tt> </tt>
81 <a name="L9"></a><tt class="py-lineno">  9</tt>  <tt class="py-line"> </tt>
82 <a name="L10"></a><tt class="py-lineno"> 10</tt>  <tt class="py-line"> </tt>
83 <a name="fromstring"></a><div id="fromstring-def"><a name="L11"></a><tt class="py-lineno"> 11</tt> <a class="py-toggle" href="#" id="fromstring-toggle" onclick="return toggle('fromstring');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="lxml.html.soupparser-module.html#fromstring">fromstring</a><tt class="py-op">(</tt><tt class="py-param">data</tt><tt class="py-op">,</tt> <tt class="py-param">beautifulsoup</tt><tt class="py-op">=</tt><tt class="py-name">None</tt><tt class="py-op">,</tt> <tt class="py-param">makeelement</tt><tt class="py-op">=</tt><tt class="py-name">None</tt><tt class="py-op">,</tt> <tt class="py-op">**</tt><tt class="py-param">bsargs</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
84 </div><div id="fromstring-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="fromstring-expanded"><a name="L12"></a><tt class="py-lineno"> 12</tt>  <tt class="py-line">    <tt class="py-docstring">"""Parse a string of HTML data into an Element tree using the</tt> </tt>
85 <a name="L13"></a><tt class="py-lineno"> 13</tt>  <tt class="py-line"><tt class="py-docstring">    BeautifulSoup parser.</tt> </tt>
86 <a name="L14"></a><tt class="py-lineno"> 14</tt>  <tt class="py-line"><tt class="py-docstring"></tt> </tt>
87 <a name="L15"></a><tt class="py-lineno"> 15</tt>  <tt class="py-line"><tt class="py-docstring">    Returns the root ``&lt;html&gt;`` Element of the tree.</tt> </tt>
88 <a name="L16"></a><tt class="py-lineno"> 16</tt>  <tt class="py-line"><tt class="py-docstring"></tt> </tt>
89 <a name="L17"></a><tt class="py-lineno"> 17</tt>  <tt class="py-line"><tt class="py-docstring">    You can pass a different BeautifulSoup parser through the</tt> </tt>
90 <a name="L18"></a><tt class="py-lineno"> 18</tt>  <tt class="py-line"><tt class="py-docstring">    `beautifulsoup` keyword, and a different Element factory function</tt> </tt>
91 <a name="L19"></a><tt class="py-lineno"> 19</tt>  <tt class="py-line"><tt class="py-docstring">    through the `makeelement` keyword.  By default, the standard</tt> </tt>
92 <a name="L20"></a><tt class="py-lineno"> 20</tt>  <tt class="py-line"><tt class="py-docstring">    ``BeautifulSoup`` class and the default factory of `lxml.html` are</tt> </tt>
93 <a name="L21"></a><tt class="py-lineno"> 21</tt>  <tt class="py-line"><tt class="py-docstring">    used.</tt> </tt>
94 <a name="L22"></a><tt class="py-lineno"> 22</tt>  <tt class="py-line"><tt class="py-docstring">    """</tt> </tt>
95 <a name="L23"></a><tt class="py-lineno"> 23</tt>  <tt class="py-line">    <tt class="py-keyword">return</tt> <tt id="link-5" class="py-name" targets="Function lxml.html.soupparser._parse()=lxml.html.soupparser-module.html#_parse"><a title="lxml.html.soupparser._parse" class="py-name" href="#" onclick="return doclink('link-5', '_parse', 'link-5');">_parse</a></tt><tt class="py-op">(</tt><tt id="link-6" class="py-name" targets="Method lxml.etree.TreeBuilder.data()=lxml.etree.TreeBuilder-class.html#data"><a title="lxml.etree.TreeBuilder.data" class="py-name" href="#" onclick="return doclink('link-6', 'data', 'link-6');">data</a></tt><tt class="py-op">,</tt> <tt class="py-name">beautifulsoup</tt><tt class="py-op">,</tt> <tt id="link-7" class="py-name" targets="Method lxml.etree._BaseParser.makeelement()=lxml.etree._BaseParser-class.html#makeelement,Method lxml.etree._Element.makeelement()=lxml.etree._Element-class.html#makeelement"><a title="lxml.etree._BaseParser.makeelement
96 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-7', 'makeelement', 'link-7');">makeelement</a></tt><tt class="py-op">,</tt> <tt class="py-op">**</tt><tt class="py-name">bsargs</tt><tt class="py-op">)</tt> </tt>
97 </div><a name="L24"></a><tt class="py-lineno"> 24</tt>  <tt class="py-line"> </tt>
98 <a name="parse"></a><div id="parse-def"><a name="L25"></a><tt class="py-lineno"> 25</tt> <a class="py-toggle" href="#" id="parse-toggle" onclick="return toggle('parse');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="lxml.html.soupparser-module.html#parse">parse</a><tt class="py-op">(</tt><tt class="py-param">file</tt><tt class="py-op">,</tt> <tt class="py-param">beautifulsoup</tt><tt class="py-op">=</tt><tt class="py-name">None</tt><tt class="py-op">,</tt> <tt class="py-param">makeelement</tt><tt class="py-op">=</tt><tt class="py-name">None</tt><tt class="py-op">,</tt> <tt class="py-op">**</tt><tt class="py-param">bsargs</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
99 </div><div id="parse-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="parse-expanded"><a name="L26"></a><tt class="py-lineno"> 26</tt>  <tt class="py-line">    <tt class="py-docstring">"""Parse a file into an ElementTree using the BeautifulSoup parser.</tt> </tt>
100 <a name="L27"></a><tt class="py-lineno"> 27</tt>  <tt class="py-line"><tt class="py-docstring"></tt> </tt>
101 <a name="L28"></a><tt class="py-lineno"> 28</tt>  <tt class="py-line"><tt class="py-docstring">    You can pass a different BeautifulSoup parser through the</tt> </tt>
102 <a name="L29"></a><tt class="py-lineno"> 29</tt>  <tt class="py-line"><tt class="py-docstring">    `beautifulsoup` keyword, and a different Element factory function</tt> </tt>
103 <a name="L30"></a><tt class="py-lineno"> 30</tt>  <tt class="py-line"><tt class="py-docstring">    through the `makeelement` keyword.  By default, the standard</tt> </tt>
104 <a name="L31"></a><tt class="py-lineno"> 31</tt>  <tt class="py-line"><tt class="py-docstring">    ``BeautifulSoup`` class and the default factory of `lxml.html` are</tt> </tt>
105 <a name="L32"></a><tt class="py-lineno"> 32</tt>  <tt class="py-line"><tt class="py-docstring">    used.</tt> </tt>
106 <a name="L33"></a><tt class="py-lineno"> 33</tt>  <tt class="py-line"><tt class="py-docstring">    """</tt> </tt>
107 <a name="L34"></a><tt class="py-lineno"> 34</tt>  <tt class="py-line">    <tt class="py-keyword">if</tt> <tt class="py-keyword">not</tt> <tt id="link-8" class="py-name" targets="Method lxml.objectify.ObjectPath.hasattr()=lxml.objectify.ObjectPath-class.html#hasattr"><a title="lxml.objectify.ObjectPath.hasattr" class="py-name" href="#" onclick="return doclink('link-8', 'hasattr', 'link-8');">hasattr</a></tt><tt class="py-op">(</tt><tt class="py-name">file</tt><tt class="py-op">,</tt> <tt class="py-string">'read'</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
108 <a name="L35"></a><tt class="py-lineno"> 35</tt>  <tt class="py-line">        <tt class="py-name">file</tt> <tt class="py-op">=</tt> <tt class="py-name">open</tt><tt class="py-op">(</tt><tt class="py-name">file</tt><tt class="py-op">)</tt> </tt>
109 <a name="L36"></a><tt class="py-lineno"> 36</tt>  <tt class="py-line">    <tt id="link-9" class="py-name" targets="Variable lxml.etree.iterparse.root=lxml.etree.iterparse-class.html#root"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-9', 'root', 'link-9');">root</a></tt> <tt class="py-op">=</tt> <tt id="link-10" class="py-name"><a title="lxml.html.soupparser._parse" class="py-name" href="#" onclick="return doclink('link-10', '_parse', 'link-5');">_parse</a></tt><tt class="py-op">(</tt><tt class="py-name">file</tt><tt class="py-op">,</tt> <tt class="py-name">beautifulsoup</tt><tt class="py-op">,</tt> <tt id="link-11" class="py-name"><a title="lxml.etree._BaseParser.makeelement
110 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-11', 'makeelement', 'link-7');">makeelement</a></tt><tt class="py-op">,</tt> <tt class="py-op">**</tt><tt class="py-name">bsargs</tt><tt class="py-op">)</tt> </tt>
111 <a name="L37"></a><tt class="py-lineno"> 37</tt>  <tt class="py-line">    <tt class="py-keyword">return</tt> <tt id="link-12" class="py-name"><a title="lxml.etree
112 lxml.sax.ElementTreeContentHandler.etree
113 lxml.tests.test_elementtree.CElementTreeTestCase.etree
114 lxml.tests.test_elementtree.ETreeTestCaseBase.etree
115 lxml.tests.test_io.IOTestCaseBase.etree" class="py-name" href="#" onclick="return doclink('link-12', 'etree', 'link-2');">etree</a></tt><tt class="py-op">.</tt><tt id="link-13" class="py-name" targets="Function lxml.etree.ElementTree()=lxml.etree-module.html#ElementTree,Module xml.etree.ElementTree=xml.etree.ElementTree-module.html,Class xml.etree.ElementTree.ElementTree=xml.etree.ElementTree.ElementTree-class.html"><a title="lxml.etree.ElementTree
116 xml.etree.ElementTree
117 xml.etree.ElementTree.ElementTree" class="py-name" href="#" onclick="return doclink('link-13', 'ElementTree', 'link-13');">ElementTree</a></tt><tt class="py-op">(</tt><tt id="link-14" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-14', 'root', 'link-9');">root</a></tt><tt class="py-op">)</tt> </tt>
118 </div><a name="L38"></a><tt class="py-lineno"> 38</tt>  <tt class="py-line"> </tt>
119 <a name="convert_tree"></a><div id="convert_tree-def"><a name="L39"></a><tt class="py-lineno"> 39</tt> <a class="py-toggle" href="#" id="convert_tree-toggle" onclick="return toggle('convert_tree');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="lxml.html.soupparser-module.html#convert_tree">convert_tree</a><tt class="py-op">(</tt><tt class="py-param">beautiful_soup_tree</tt><tt class="py-op">,</tt> <tt class="py-param">makeelement</tt><tt class="py-op">=</tt><tt class="py-name">None</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
120 </div><div id="convert_tree-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="convert_tree-expanded"><a name="L40"></a><tt class="py-lineno"> 40</tt>  <tt class="py-line">    <tt class="py-docstring">"""Convert a BeautifulSoup tree to a list of Element trees.</tt> </tt>
121 <a name="L41"></a><tt class="py-lineno"> 41</tt>  <tt class="py-line"><tt class="py-docstring"></tt> </tt>
122 <a name="L42"></a><tt class="py-lineno"> 42</tt>  <tt class="py-line"><tt class="py-docstring">    Returns a list instead of a single root Element to support</tt> </tt>
123 <a name="L43"></a><tt class="py-lineno"> 43</tt>  <tt class="py-line"><tt class="py-docstring">    HTML-like soup with more than one root element.</tt> </tt>
124 <a name="L44"></a><tt class="py-lineno"> 44</tt>  <tt class="py-line"><tt class="py-docstring"></tt> </tt>
125 <a name="L45"></a><tt class="py-lineno"> 45</tt>  <tt class="py-line"><tt class="py-docstring">    You can pass a different Element factory through the `makeelement`</tt> </tt>
126 <a name="L46"></a><tt class="py-lineno"> 46</tt>  <tt class="py-line"><tt class="py-docstring">    keyword.</tt> </tt>
127 <a name="L47"></a><tt class="py-lineno"> 47</tt>  <tt class="py-line"><tt class="py-docstring">    """</tt> </tt>
128 <a name="L48"></a><tt class="py-lineno"> 48</tt>  <tt class="py-line">    <tt class="py-keyword">if</tt> <tt id="link-15" class="py-name"><a title="lxml.etree._BaseParser.makeelement
129 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-15', 'makeelement', 'link-7');">makeelement</a></tt> <tt class="py-keyword">is</tt> <tt class="py-name">None</tt><tt class="py-op">:</tt> </tt>
130 <a name="L49"></a><tt class="py-lineno"> 49</tt>  <tt class="py-line">        <tt id="link-16" class="py-name"><a title="lxml.etree._BaseParser.makeelement
131 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-16', 'makeelement', 'link-7');">makeelement</a></tt> <tt class="py-op">=</tt> <tt id="link-17" class="py-name"><a title="lxml.html
132 lxml.html.diff.href_token.html
133 lxml.html.diff.tag_token.html
134 lxml.html.diff.token.html" class="py-name" href="#" onclick="return doclink('link-17', 'html', 'link-3');">html</a></tt><tt class="py-op">.</tt><tt id="link-18" class="py-name" targets="Variable lxml.html.html5parser.html_parser=lxml.html.html5parser-module.html#html_parser,Variable lxml.html.html_parser=lxml.html-module.html#html_parser"><a title="lxml.html.html5parser.html_parser
135 lxml.html.html_parser" class="py-name" href="#" onclick="return doclink('link-18', 'html_parser', 'link-18');">html_parser</a></tt><tt class="py-op">.</tt><tt id="link-19" class="py-name"><a title="lxml.etree._BaseParser.makeelement
136 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-19', 'makeelement', 'link-7');">makeelement</a></tt> </tt>
137 <a name="L50"></a><tt class="py-lineno"> 50</tt>  <tt class="py-line">    <tt id="link-20" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-20', 'root', 'link-9');">root</a></tt> <tt class="py-op">=</tt> <tt id="link-21" class="py-name" targets="Function lxml.html.soupparser._convert_tree()=lxml.html.soupparser-module.html#_convert_tree"><a title="lxml.html.soupparser._convert_tree" class="py-name" href="#" onclick="return doclink('link-21', '_convert_tree', 'link-21');">_convert_tree</a></tt><tt class="py-op">(</tt><tt class="py-name">beautiful_soup_tree</tt><tt class="py-op">,</tt> <tt id="link-22" class="py-name"><a title="lxml.etree._BaseParser.makeelement
138 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-22', 'makeelement', 'link-7');">makeelement</a></tt><tt class="py-op">)</tt> </tt>
139 <a name="L51"></a><tt class="py-lineno"> 51</tt>  <tt class="py-line">    <tt class="py-name">children</tt> <tt class="py-op">=</tt> <tt id="link-23" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-23', 'root', 'link-9');">root</a></tt><tt class="py-op">.</tt><tt id="link-24" class="py-name" targets="Method lxml.etree._Element.getchildren()=lxml.etree._Element-class.html#getchildren,Method lxml.etree._ReadOnlyProxy.getchildren()=lxml.etree._ReadOnlyProxy-class.html#getchildren,Method lxml.objectify.ObjectifiedElement.getchildren()=lxml.objectify.ObjectifiedElement-class.html#getchildren"><a title="lxml.etree._Element.getchildren
140 lxml.etree._ReadOnlyProxy.getchildren
141 lxml.objectify.ObjectifiedElement.getchildren" class="py-name" href="#" onclick="return doclink('link-24', 'getchildren', 'link-24');">getchildren</a></tt><tt class="py-op">(</tt><tt class="py-op">)</tt> </tt>
142 <a name="L52"></a><tt class="py-lineno"> 52</tt>  <tt class="py-line">    <tt class="py-keyword">for</tt> <tt class="py-name">child</tt> <tt class="py-keyword">in</tt> <tt class="py-name">children</tt><tt class="py-op">:</tt> </tt>
143 <a name="L53"></a><tt class="py-lineno"> 53</tt>  <tt class="py-line">        <tt id="link-25" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-25', 'root', 'link-9');">root</a></tt><tt class="py-op">.</tt><tt id="link-26" class="py-name" targets="Method lxml.etree._Element.remove()=lxml.etree._Element-class.html#remove,Method lxml.etree._ResolverRegistry.remove()=lxml.etree._ResolverRegistry-class.html#remove,Method lxml.html.CheckboxValues.remove()=lxml.html.CheckboxValues-class.html#remove,Method lxml.html.MultipleSelectOptions.remove()=lxml.html.MultipleSelectOptions-class.html#remove"><a title="lxml.etree._Element.remove
144 lxml.etree._ResolverRegistry.remove
145 lxml.html.CheckboxValues.remove
146 lxml.html.MultipleSelectOptions.remove" class="py-name" href="#" onclick="return doclink('link-26', 'remove', 'link-26');">remove</a></tt><tt class="py-op">(</tt><tt class="py-name">child</tt><tt class="py-op">)</tt> </tt>
147 <a name="L54"></a><tt class="py-lineno"> 54</tt>  <tt class="py-line">    <tt class="py-keyword">return</tt> <tt class="py-name">children</tt> </tt>
148 </div><a name="L55"></a><tt class="py-lineno"> 55</tt>  <tt class="py-line"> </tt>
149 <a name="L56"></a><tt class="py-lineno"> 56</tt>  <tt class="py-line"> </tt>
150 <a name="L57"></a><tt class="py-lineno"> 57</tt>  <tt class="py-line"><tt class="py-comment"># helpers</tt> </tt>
151 <a name="L58"></a><tt class="py-lineno"> 58</tt>  <tt class="py-line"> </tt>
152 <a name="_parse"></a><div id="_parse-def"><a name="L59"></a><tt class="py-lineno"> 59</tt> <a class="py-toggle" href="#" id="_parse-toggle" onclick="return toggle('_parse');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="lxml.html.soupparser-module.html#_parse">_parse</a><tt class="py-op">(</tt><tt class="py-param">source</tt><tt class="py-op">,</tt> <tt class="py-param">beautifulsoup</tt><tt class="py-op">,</tt> <tt class="py-param">makeelement</tt><tt class="py-op">,</tt> <tt class="py-op">**</tt><tt class="py-param">bsargs</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
153 </div><div id="_parse-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="_parse-expanded"><a name="L60"></a><tt class="py-lineno"> 60</tt>  <tt class="py-line">    <tt class="py-keyword">if</tt> <tt class="py-name">beautifulsoup</tt> <tt class="py-keyword">is</tt> <tt class="py-name">None</tt><tt class="py-op">:</tt> </tt>
154 <a name="L61"></a><tt class="py-lineno"> 61</tt>  <tt class="py-line">        <tt class="py-name">beautifulsoup</tt> <tt class="py-op">=</tt> <tt class="py-name">BeautifulSoup</tt> </tt>
155 <a name="L62"></a><tt class="py-lineno"> 62</tt>  <tt class="py-line">    <tt class="py-keyword">if</tt> <tt id="link-27" class="py-name"><a title="lxml.etree._BaseParser.makeelement
156 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-27', 'makeelement', 'link-7');">makeelement</a></tt> <tt class="py-keyword">is</tt> <tt class="py-name">None</tt><tt class="py-op">:</tt> </tt>
157 <a name="L63"></a><tt class="py-lineno"> 63</tt>  <tt class="py-line">        <tt id="link-28" class="py-name"><a title="lxml.etree._BaseParser.makeelement
158 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-28', 'makeelement', 'link-7');">makeelement</a></tt> <tt class="py-op">=</tt> <tt id="link-29" class="py-name"><a title="lxml.html
159 lxml.html.diff.href_token.html
160 lxml.html.diff.tag_token.html
161 lxml.html.diff.token.html" class="py-name" href="#" onclick="return doclink('link-29', 'html', 'link-3');">html</a></tt><tt class="py-op">.</tt><tt id="link-30" class="py-name"><a title="lxml.html.html5parser.html_parser
162 lxml.html.html_parser" class="py-name" href="#" onclick="return doclink('link-30', 'html_parser', 'link-18');">html_parser</a></tt><tt class="py-op">.</tt><tt id="link-31" class="py-name"><a title="lxml.etree._BaseParser.makeelement
163 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-31', 'makeelement', 'link-7');">makeelement</a></tt> </tt>
164 <a name="L64"></a><tt class="py-lineno"> 64</tt>  <tt class="py-line">    <tt class="py-keyword">if</tt> <tt class="py-string">'convertEntities'</tt> <tt class="py-keyword">not</tt> <tt class="py-keyword">in</tt> <tt class="py-name">bsargs</tt><tt class="py-op">:</tt> </tt>
165 <a name="L65"></a><tt class="py-lineno"> 65</tt>  <tt class="py-line">        <tt class="py-name">bsargs</tt><tt class="py-op">[</tt><tt class="py-string">'convertEntities'</tt><tt class="py-op">]</tt> <tt class="py-op">=</tt> <tt class="py-string">'html'</tt> </tt>
166 <a name="L66"></a><tt class="py-lineno"> 66</tt>  <tt class="py-line">    <tt class="py-name">tree</tt> <tt class="py-op">=</tt> <tt class="py-name">beautifulsoup</tt><tt class="py-op">(</tt><tt class="py-name">source</tt><tt class="py-op">,</tt> <tt class="py-op">**</tt><tt class="py-name">bsargs</tt><tt class="py-op">)</tt> </tt>
167 <a name="L67"></a><tt class="py-lineno"> 67</tt>  <tt class="py-line">    <tt id="link-32" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-32', 'root', 'link-9');">root</a></tt> <tt class="py-op">=</tt> <tt id="link-33" class="py-name"><a title="lxml.html.soupparser._convert_tree" class="py-name" href="#" onclick="return doclink('link-33', '_convert_tree', 'link-21');">_convert_tree</a></tt><tt class="py-op">(</tt><tt class="py-name">tree</tt><tt class="py-op">,</tt> <tt id="link-34" class="py-name"><a title="lxml.etree._BaseParser.makeelement
168 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-34', 'makeelement', 'link-7');">makeelement</a></tt><tt class="py-op">)</tt> </tt>
169 <a name="L68"></a><tt class="py-lineno"> 68</tt>  <tt class="py-line">    <tt class="py-comment"># from ET: wrap the document in a html root element, if necessary</tt> </tt>
170 <a name="L69"></a><tt class="py-lineno"> 69</tt>  <tt class="py-line">    <tt class="py-keyword">if</tt> <tt class="py-name">len</tt><tt class="py-op">(</tt><tt id="link-35" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-35', 'root', 'link-9');">root</a></tt><tt class="py-op">)</tt> <tt class="py-op">==</tt> <tt class="py-number">1</tt> <tt class="py-keyword">and</tt> <tt id="link-36" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-36', 'root', 'link-9');">root</a></tt><tt class="py-op">[</tt><tt class="py-number">0</tt><tt class="py-op">]</tt><tt class="py-op">.</tt><tt id="link-37" class="py-name" targets="Variable lxml.etree._Comment.tag=lxml.etree._Comment-class.html#tag,Variable lxml.etree._Element.tag=lxml.etree._Element-class.html#tag,Variable lxml.etree._Entity.tag=lxml.etree._Entity-class.html#tag,Variable lxml.etree._ProcessingInstruction.tag=lxml.etree._ProcessingInstruction-class.html#tag,Variable lxml.etree._ReadOnlyProxy.tag=lxml.etree._ReadOnlyProxy-class.html#tag,Function lxml.tests.test_xpathevaluator.tag()=lxml.tests.test_xpathevaluator-module.html#tag,Variable xml.etree.ElementTree.Element.tag=xml.etree.ElementTree.Element-class.html#tag"><a title="lxml.etree._Comment.tag
171 lxml.etree._Element.tag
172 lxml.etree._Entity.tag
173 lxml.etree._ProcessingInstruction.tag
174 lxml.etree._ReadOnlyProxy.tag
175 lxml.tests.test_xpathevaluator.tag
176 xml.etree.ElementTree.Element.tag" class="py-name" href="#" onclick="return doclink('link-37', 'tag', 'link-37');">tag</a></tt> <tt class="py-op">==</tt> <tt class="py-string">"html"</tt><tt class="py-op">:</tt> </tt>
177 <a name="L70"></a><tt class="py-lineno"> 70</tt>  <tt class="py-line">        <tt class="py-keyword">return</tt> <tt id="link-38" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-38', 'root', 'link-9');">root</a></tt><tt class="py-op">[</tt><tt class="py-number">0</tt><tt class="py-op">]</tt> </tt>
178 <a name="L71"></a><tt class="py-lineno"> 71</tt>  <tt class="py-line">    <tt id="link-39" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-39', 'root', 'link-9');">root</a></tt><tt class="py-op">.</tt><tt id="link-40" class="py-name"><a title="lxml.etree._Comment.tag
179 lxml.etree._Element.tag
180 lxml.etree._Entity.tag
181 lxml.etree._ProcessingInstruction.tag
182 lxml.etree._ReadOnlyProxy.tag
183 lxml.tests.test_xpathevaluator.tag
184 xml.etree.ElementTree.Element.tag" class="py-name" href="#" onclick="return doclink('link-40', 'tag', 'link-37');">tag</a></tt> <tt class="py-op">=</tt> <tt class="py-string">"html"</tt> </tt>
185 <a name="L72"></a><tt class="py-lineno"> 72</tt>  <tt class="py-line">    <tt class="py-keyword">return</tt> <tt id="link-41" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-41', 'root', 'link-9');">root</a></tt> </tt>
186 </div><a name="L73"></a><tt class="py-lineno"> 73</tt>  <tt class="py-line"> </tt>
187 <a name="_convert_tree"></a><div id="_convert_tree-def"><a name="L74"></a><tt class="py-lineno"> 74</tt> <a class="py-toggle" href="#" id="_convert_tree-toggle" onclick="return toggle('_convert_tree');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="lxml.html.soupparser-module.html#_convert_tree">_convert_tree</a><tt class="py-op">(</tt><tt class="py-param">beautiful_soup_tree</tt><tt class="py-op">,</tt> <tt class="py-param">makeelement</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
188 </div><div id="_convert_tree-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="_convert_tree-expanded"><a name="L75"></a><tt class="py-lineno"> 75</tt>  <tt class="py-line">    <tt id="link-42" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-42', 'root', 'link-9');">root</a></tt> <tt class="py-op">=</tt> <tt id="link-43" class="py-name"><a title="lxml.etree._BaseParser.makeelement
189 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-43', 'makeelement', 'link-7');">makeelement</a></tt><tt class="py-op">(</tt><tt class="py-name">beautiful_soup_tree</tt><tt class="py-op">.</tt><tt id="link-44" class="py-name" targets="Variable lxml.etree._Entity.name=lxml.etree._Entity-class.html#name,Variable lxml.etree._ModifyContentOnlyEntityProxy.name=lxml.etree._ModifyContentOnlyEntityProxy-class.html#name,Variable lxml.etree._ReadOnlyEntityProxy.name=lxml.etree._ReadOnlyEntityProxy-class.html#name,Variable lxml.html.InputMixin.name=lxml.html.InputMixin-class.html#name,Variable lxml.objectify.PyType.name=lxml.objectify.PyType-class.html#name"><a title="lxml.etree._Entity.name
190 lxml.etree._ModifyContentOnlyEntityProxy.name
191 lxml.etree._ReadOnlyEntityProxy.name
192 lxml.html.InputMixin.name
193 lxml.objectify.PyType.name" class="py-name" href="#" onclick="return doclink('link-44', 'name', 'link-44');">name</a></tt><tt class="py-op">,</tt> </tt>
194 <a name="L76"></a><tt class="py-lineno"> 76</tt>  <tt class="py-line">                       <tt id="link-45" class="py-name" targets="Variable lxml.etree._Element.attrib=lxml.etree._Element-class.html#attrib,Variable lxml.etree._ProcessingInstruction.attrib=lxml.etree._ProcessingInstruction-class.html#attrib,Variable lxml.etree._ReadOnlyElementProxy.attrib=lxml.etree._ReadOnlyElementProxy-class.html#attrib,Variable lxml.etree.__ContentOnlyElement.attrib=lxml.etree.__ContentOnlyElement-class.html#attrib,Variable xml.etree.ElementTree.Element.attrib=xml.etree.ElementTree.Element-class.html#attrib"><a title="lxml.etree._Element.attrib
195 lxml.etree._ProcessingInstruction.attrib
196 lxml.etree._ReadOnlyElementProxy.attrib
197 lxml.etree.__ContentOnlyElement.attrib
198 xml.etree.ElementTree.Element.attrib" class="py-name" href="#" onclick="return doclink('link-45', 'attrib', 'link-45');">attrib</a></tt><tt class="py-op">=</tt><tt class="py-name">dict</tt><tt class="py-op">(</tt><tt class="py-name">beautiful_soup_tree</tt><tt class="py-op">.</tt><tt class="py-name">attrs</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
199 <a name="L77"></a><tt class="py-lineno"> 77</tt>  <tt class="py-line">    <tt id="link-46" class="py-name" targets="Function lxml.html.soupparser._convert_children()=lxml.html.soupparser-module.html#_convert_children"><a title="lxml.html.soupparser._convert_children" class="py-name" href="#" onclick="return doclink('link-46', '_convert_children', 'link-46');">_convert_children</a></tt><tt class="py-op">(</tt><tt id="link-47" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-47', 'root', 'link-9');">root</a></tt><tt class="py-op">,</tt> <tt class="py-name">beautiful_soup_tree</tt><tt class="py-op">,</tt> <tt id="link-48" class="py-name"><a title="lxml.etree._BaseParser.makeelement
200 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-48', 'makeelement', 'link-7');">makeelement</a></tt><tt class="py-op">)</tt> </tt>
201 <a name="L78"></a><tt class="py-lineno"> 78</tt>  <tt class="py-line">    <tt class="py-keyword">return</tt> <tt id="link-49" class="py-name"><a title="lxml.etree.iterparse.root" class="py-name" href="#" onclick="return doclink('link-49', 'root', 'link-9');">root</a></tt> </tt>
202 </div><a name="L79"></a><tt class="py-lineno"> 79</tt>  <tt class="py-line"> </tt>
203 <a name="_convert_children"></a><div id="_convert_children-def"><a name="L80"></a><tt class="py-lineno"> 80</tt> <a class="py-toggle" href="#" id="_convert_children-toggle" onclick="return toggle('_convert_children');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="lxml.html.soupparser-module.html#_convert_children">_convert_children</a><tt class="py-op">(</tt><tt class="py-param">parent</tt><tt class="py-op">,</tt> <tt class="py-param">beautiful_soup_tree</tt><tt class="py-op">,</tt> <tt class="py-param">makeelement</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
204 </div><div id="_convert_children-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="_convert_children-expanded"><a name="L81"></a><tt class="py-lineno"> 81</tt>  <tt class="py-line">    <tt id="link-50" class="py-name" targets="Function lxml.etree.SubElement()=lxml.etree-module.html#SubElement"><a title="lxml.etree.SubElement" class="py-name" href="#" onclick="return doclink('link-50', 'SubElement', 'link-50');">SubElement</a></tt> <tt class="py-op">=</tt> <tt id="link-51" class="py-name"><a title="lxml.etree
205 lxml.sax.ElementTreeContentHandler.etree
206 lxml.tests.test_elementtree.CElementTreeTestCase.etree
207 lxml.tests.test_elementtree.ETreeTestCaseBase.etree
208 lxml.tests.test_io.IOTestCaseBase.etree" class="py-name" href="#" onclick="return doclink('link-51', 'etree', 'link-2');">etree</a></tt><tt class="py-op">.</tt><tt id="link-52" class="py-name"><a title="lxml.etree.SubElement" class="py-name" href="#" onclick="return doclink('link-52', 'SubElement', 'link-50');">SubElement</a></tt> </tt>
209 <a name="L82"></a><tt class="py-lineno"> 82</tt>  <tt class="py-line">    <tt class="py-name">et_child</tt> <tt class="py-op">=</tt> <tt class="py-name">None</tt> </tt>
210 <a name="L83"></a><tt class="py-lineno"> 83</tt>  <tt class="py-line">    <tt class="py-keyword">for</tt> <tt class="py-name">child</tt> <tt class="py-keyword">in</tt> <tt class="py-name">beautiful_soup_tree</tt><tt class="py-op">:</tt> </tt>
211 <a name="L84"></a><tt class="py-lineno"> 84</tt>  <tt class="py-line">        <tt class="py-keyword">if</tt> <tt class="py-name">isinstance</tt><tt class="py-op">(</tt><tt class="py-name">child</tt><tt class="py-op">,</tt> <tt class="py-name">Tag</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
212 <a name="L85"></a><tt class="py-lineno"> 85</tt>  <tt class="py-line">            <tt class="py-name">et_child</tt> <tt class="py-op">=</tt> <tt id="link-53" class="py-name"><a title="lxml.etree.SubElement" class="py-name" href="#" onclick="return doclink('link-53', 'SubElement', 'link-50');">SubElement</a></tt><tt class="py-op">(</tt><tt class="py-name">parent</tt><tt class="py-op">,</tt> <tt class="py-name">child</tt><tt class="py-op">.</tt><tt id="link-54" class="py-name"><a title="lxml.etree._Entity.name
213 lxml.etree._ModifyContentOnlyEntityProxy.name
214 lxml.etree._ReadOnlyEntityProxy.name
215 lxml.html.InputMixin.name
216 lxml.objectify.PyType.name" class="py-name" href="#" onclick="return doclink('link-54', 'name', 'link-44');">name</a></tt><tt class="py-op">,</tt> <tt id="link-55" class="py-name"><a title="lxml.etree._Element.attrib
217 lxml.etree._ProcessingInstruction.attrib
218 lxml.etree._ReadOnlyElementProxy.attrib
219 lxml.etree.__ContentOnlyElement.attrib
220 xml.etree.ElementTree.Element.attrib" class="py-name" href="#" onclick="return doclink('link-55', 'attrib', 'link-45');">attrib</a></tt><tt class="py-op">=</tt><tt class="py-name">dict</tt><tt class="py-op">(</tt> </tt>
221 <a name="L86"></a><tt class="py-lineno"> 86</tt>  <tt class="py-line">                <tt class="py-op">[</tt><tt class="py-op">(</tt><tt class="py-name">k</tt><tt class="py-op">,</tt> <tt id="link-56" class="py-name" targets="Function lxml.html.soupparser.unescape()=lxml.html.soupparser-module.html#unescape"><a title="lxml.html.soupparser.unescape" class="py-name" href="#" onclick="return doclink('link-56', 'unescape', 'link-56');">unescape</a></tt><tt class="py-op">(</tt><tt id="link-57" class="py-name" targets="Variable lxml.tests.test_objectify.v=lxml.tests.test_objectify-module.html#v"><a title="lxml.tests.test_objectify.v" class="py-name" href="#" onclick="return doclink('link-57', 'v', 'link-57');">v</a></tt><tt class="py-op">)</tt><tt class="py-op">)</tt> <tt class="py-keyword">for</tt> <tt class="py-op">(</tt><tt class="py-name">k</tt><tt class="py-op">,</tt><tt id="link-58" class="py-name"><a title="lxml.tests.test_objectify.v" class="py-name" href="#" onclick="return doclink('link-58', 'v', 'link-57');">v</a></tt><tt class="py-op">)</tt> <tt class="py-keyword">in</tt> <tt class="py-name">child</tt><tt class="py-op">.</tt><tt class="py-name">attrs</tt><tt class="py-op">]</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
222 <a name="L87"></a><tt class="py-lineno"> 87</tt>  <tt class="py-line">            <tt id="link-59" class="py-name"><a title="lxml.html.soupparser._convert_children" class="py-name" href="#" onclick="return doclink('link-59', '_convert_children', 'link-46');">_convert_children</a></tt><tt class="py-op">(</tt><tt class="py-name">et_child</tt><tt class="py-op">,</tt> <tt class="py-name">child</tt><tt class="py-op">,</tt> <tt id="link-60" class="py-name"><a title="lxml.etree._BaseParser.makeelement
223 lxml.etree._Element.makeelement" class="py-name" href="#" onclick="return doclink('link-60', 'makeelement', 'link-7');">makeelement</a></tt><tt class="py-op">)</tt> </tt>
224 <a name="L88"></a><tt class="py-lineno"> 88</tt>  <tt class="py-line">        <tt class="py-keyword">elif</tt> <tt id="link-61" class="py-name" targets="Variable lxml.etree._LogEntry.type=lxml.etree._LogEntry-class.html#type,Variable lxml.html.InputElement.type=lxml.html.InputElement-class.html#type"><a title="lxml.etree._LogEntry.type
225 lxml.html.InputElement.type" class="py-name" href="#" onclick="return doclink('link-61', 'type', 'link-61');">type</a></tt><tt class="py-op">(</tt><tt class="py-name">child</tt><tt class="py-op">)</tt> <tt class="py-keyword">is</tt> <tt class="py-name">NavigableString</tt><tt class="py-op">:</tt> </tt>
226 <a name="L89"></a><tt class="py-lineno"> 89</tt>  <tt class="py-line">            <tt id="link-62" class="py-name" targets="Function lxml.html.soupparser._append_text()=lxml.html.soupparser-module.html#_append_text"><a title="lxml.html.soupparser._append_text" class="py-name" href="#" onclick="return doclink('link-62', '_append_text', 'link-62');">_append_text</a></tt><tt class="py-op">(</tt><tt class="py-name">parent</tt><tt class="py-op">,</tt> <tt class="py-name">et_child</tt><tt class="py-op">,</tt> <tt id="link-63" class="py-name"><a title="lxml.html.soupparser.unescape" class="py-name" href="#" onclick="return doclink('link-63', 'unescape', 'link-56');">unescape</a></tt><tt class="py-op">(</tt><tt class="py-name">child</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
227 <a name="L90"></a><tt class="py-lineno"> 90</tt>  <tt class="py-line">        <tt class="py-keyword">else</tt><tt class="py-op">:</tt> </tt>
228 <a name="L91"></a><tt class="py-lineno"> 91</tt>  <tt class="py-line">            <tt class="py-keyword">if</tt> <tt class="py-name">isinstance</tt><tt class="py-op">(</tt><tt class="py-name">child</tt><tt class="py-op">,</tt> <tt id="link-64" class="py-name"><a title="lxml.etree.Comment" class="py-name" href="#" onclick="return doclink('link-64', 'Comment', 'link-4');">Comment</a></tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
229 <a name="L92"></a><tt class="py-lineno"> 92</tt>  <tt class="py-line">                <tt class="py-name">parent</tt><tt class="py-op">.</tt><tt id="link-65" class="py-name" targets="Method lxml.etree._AppendOnlyElementProxy.append()=lxml.etree._AppendOnlyElementProxy-class.html#append,Method lxml.etree._Element.append()=lxml.etree._Element-class.html#append,Method lxml.etree._OpaqueDocumentWrapper.append()=lxml.etree._OpaqueDocumentWrapper-class.html#append,Method lxml.etree.__ContentOnlyElement.append()=lxml.etree.__ContentOnlyElement-class.html#append"><a title="lxml.etree._AppendOnlyElementProxy.append
230 lxml.etree._Element.append
231 lxml.etree._OpaqueDocumentWrapper.append
232 lxml.etree.__ContentOnlyElement.append" class="py-name" href="#" onclick="return doclink('link-65', 'append', 'link-65');">append</a></tt><tt class="py-op">(</tt><tt id="link-66" class="py-name"><a title="lxml.etree
233 lxml.sax.ElementTreeContentHandler.etree
234 lxml.tests.test_elementtree.CElementTreeTestCase.etree
235 lxml.tests.test_elementtree.ETreeTestCaseBase.etree
236 lxml.tests.test_io.IOTestCaseBase.etree" class="py-name" href="#" onclick="return doclink('link-66', 'etree', 'link-2');">etree</a></tt><tt class="py-op">.</tt><tt id="link-67" class="py-name"><a title="lxml.etree.Comment" class="py-name" href="#" onclick="return doclink('link-67', 'Comment', 'link-4');">Comment</a></tt><tt class="py-op">(</tt><tt class="py-name">child</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
237 <a name="L93"></a><tt class="py-lineno"> 93</tt>  <tt class="py-line">            <tt class="py-keyword">elif</tt> <tt class="py-name">isinstance</tt><tt class="py-op">(</tt><tt class="py-name">child</tt><tt class="py-op">,</tt> <tt class="py-name">ProcessingInstruction</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
238 <a name="L94"></a><tt class="py-lineno"> 94</tt>  <tt class="py-line">                <tt class="py-name">parent</tt><tt class="py-op">.</tt><tt id="link-68" class="py-name"><a title="lxml.etree._AppendOnlyElementProxy.append
239 lxml.etree._Element.append
240 lxml.etree._OpaqueDocumentWrapper.append
241 lxml.etree.__ContentOnlyElement.append" class="py-name" href="#" onclick="return doclink('link-68', 'append', 'link-65');">append</a></tt><tt class="py-op">(</tt><tt id="link-69" class="py-name"><a title="lxml.etree
242 lxml.sax.ElementTreeContentHandler.etree
243 lxml.tests.test_elementtree.CElementTreeTestCase.etree
244 lxml.tests.test_elementtree.ETreeTestCaseBase.etree
245 lxml.tests.test_io.IOTestCaseBase.etree" class="py-name" href="#" onclick="return doclink('link-69', 'etree', 'link-2');">etree</a></tt><tt class="py-op">.</tt><tt class="py-name">ProcessingInstruction</tt><tt class="py-op">(</tt> </tt>
246 <a name="L95"></a><tt class="py-lineno"> 95</tt>  <tt class="py-line">                    <tt class="py-op">*</tt><tt class="py-name">child</tt><tt class="py-op">.</tt><tt class="py-name">split</tt><tt class="py-op">(</tt><tt class="py-string">' '</tt><tt class="py-op">,</tt> <tt class="py-number">1</tt><tt class="py-op">)</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
247 <a name="L96"></a><tt class="py-lineno"> 96</tt>  <tt class="py-line">            <tt class="py-keyword">else</tt><tt class="py-op">:</tt> <tt class="py-comment"># CData</tt> </tt>
248 <a name="L97"></a><tt class="py-lineno"> 97</tt>  <tt class="py-line">                <tt id="link-70" class="py-name"><a title="lxml.html.soupparser._append_text" class="py-name" href="#" onclick="return doclink('link-70', '_append_text', 'link-62');">_append_text</a></tt><tt class="py-op">(</tt><tt class="py-name">parent</tt><tt class="py-op">,</tt> <tt class="py-name">et_child</tt><tt class="py-op">,</tt> <tt id="link-71" class="py-name"><a title="lxml.html.soupparser.unescape" class="py-name" href="#" onclick="return doclink('link-71', 'unescape', 'link-56');">unescape</a></tt><tt class="py-op">(</tt><tt class="py-name">child</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
249 </div><a name="L98"></a><tt class="py-lineno"> 98</tt>  <tt class="py-line"> </tt>
250 <a name="_append_text"></a><div id="_append_text-def"><a name="L99"></a><tt class="py-lineno"> 99</tt> <a class="py-toggle" href="#" id="_append_text-toggle" onclick="return toggle('_append_text');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="lxml.html.soupparser-module.html#_append_text">_append_text</a><tt class="py-op">(</tt><tt class="py-param">parent</tt><tt class="py-op">,</tt> <tt class="py-param">element</tt><tt class="py-op">,</tt> <tt class="py-param">text</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
251 </div><div id="_append_text-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="_append_text-expanded"><a name="L100"></a><tt class="py-lineno">100</tt>  <tt class="py-line">    <tt class="py-keyword">if</tt> <tt class="py-name">element</tt> <tt class="py-keyword">is</tt> <tt class="py-name">None</tt><tt class="py-op">:</tt> </tt>
252 <a name="L101"></a><tt class="py-lineno">101</tt>  <tt class="py-line">        <tt class="py-name">parent</tt><tt class="py-op">.</tt><tt id="link-72" class="py-name" targets="Variable lxml.etree.QName.text=lxml.etree.QName-class.html#text,Variable lxml.etree._AppendOnlyElementProxy.text=lxml.etree._AppendOnlyElementProxy-class.html#text,Variable lxml.etree._Element.text=lxml.etree._Element-class.html#text,Variable lxml.etree._Entity.text=lxml.etree._Entity-class.html#text,Variable lxml.etree._ModifyContentOnlyProxy.text=lxml.etree._ModifyContentOnlyProxy-class.html#text,Variable lxml.etree._ReadOnlyEntityProxy.text=lxml.etree._ReadOnlyEntityProxy-class.html#text,Variable lxml.etree._ReadOnlyProxy.text=lxml.etree._ReadOnlyProxy-class.html#text,Variable lxml.etree.__ContentOnlyElement.text=lxml.etree.__ContentOnlyElement-class.html#text,Variable lxml.objectify.ObjectifiedElement.text=lxml.objectify.ObjectifiedElement-class.html#text,Variable xml.etree.ElementTree.Element.text=xml.etree.ElementTree.Element-class.html#text"><a title="lxml.etree.QName.text
253 lxml.etree._AppendOnlyElementProxy.text
254 lxml.etree._Element.text
255 lxml.etree._Entity.text
256 lxml.etree._ModifyContentOnlyProxy.text
257 lxml.etree._ReadOnlyEntityProxy.text
258 lxml.etree._ReadOnlyProxy.text
259 lxml.etree.__ContentOnlyElement.text
260 lxml.objectify.ObjectifiedElement.text
261 xml.etree.ElementTree.Element.text" class="py-name" href="#" onclick="return doclink('link-72', 'text', 'link-72');">text</a></tt> <tt class="py-op">=</tt> <tt class="py-op">(</tt><tt class="py-name">parent</tt><tt class="py-op">.</tt><tt id="link-73" class="py-name"><a title="lxml.etree.QName.text
262 lxml.etree._AppendOnlyElementProxy.text
263 lxml.etree._Element.text
264 lxml.etree._Entity.text
265 lxml.etree._ModifyContentOnlyProxy.text
266 lxml.etree._ReadOnlyEntityProxy.text
267 lxml.etree._ReadOnlyProxy.text
268 lxml.etree.__ContentOnlyElement.text
269 lxml.objectify.ObjectifiedElement.text
270 xml.etree.ElementTree.Element.text" class="py-name" href="#" onclick="return doclink('link-73', 'text', 'link-72');">text</a></tt> <tt class="py-keyword">or</tt> <tt class="py-string">''</tt><tt class="py-op">)</tt> <tt class="py-op">+</tt> <tt id="link-74" class="py-name"><a title="lxml.etree.QName.text
271 lxml.etree._AppendOnlyElementProxy.text
272 lxml.etree._Element.text
273 lxml.etree._Entity.text
274 lxml.etree._ModifyContentOnlyProxy.text
275 lxml.etree._ReadOnlyEntityProxy.text
276 lxml.etree._ReadOnlyProxy.text
277 lxml.etree.__ContentOnlyElement.text
278 lxml.objectify.ObjectifiedElement.text
279 xml.etree.ElementTree.Element.text" class="py-name" href="#" onclick="return doclink('link-74', 'text', 'link-72');">text</a></tt> </tt>
280 <a name="L102"></a><tt class="py-lineno">102</tt>  <tt class="py-line">    <tt class="py-keyword">else</tt><tt class="py-op">:</tt> </tt>
281 <a name="L103"></a><tt class="py-lineno">103</tt>  <tt class="py-line">        <tt class="py-name">element</tt><tt class="py-op">.</tt><tt id="link-75" class="py-name" targets="Variable lxml.etree._Element.tail=lxml.etree._Element-class.html#tail,Variable lxml.etree._ReadOnlyProxy.tail=lxml.etree._ReadOnlyProxy-class.html#tail,Variable xml.etree.ElementTree.Element.tail=xml.etree.ElementTree.Element-class.html#tail"><a title="lxml.etree._Element.tail
282 lxml.etree._ReadOnlyProxy.tail
283 xml.etree.ElementTree.Element.tail" class="py-name" href="#" onclick="return doclink('link-75', 'tail', 'link-75');">tail</a></tt> <tt class="py-op">=</tt> <tt class="py-op">(</tt><tt class="py-name">element</tt><tt class="py-op">.</tt><tt id="link-76" class="py-name"><a title="lxml.etree._Element.tail
284 lxml.etree._ReadOnlyProxy.tail
285 xml.etree.ElementTree.Element.tail" class="py-name" href="#" onclick="return doclink('link-76', 'tail', 'link-75');">tail</a></tt> <tt class="py-keyword">or</tt> <tt class="py-string">''</tt><tt class="py-op">)</tt> <tt class="py-op">+</tt> <tt id="link-77" class="py-name"><a title="lxml.etree.QName.text
286 lxml.etree._AppendOnlyElementProxy.text
287 lxml.etree._Element.text
288 lxml.etree._Entity.text
289 lxml.etree._ModifyContentOnlyProxy.text
290 lxml.etree._ReadOnlyEntityProxy.text
291 lxml.etree._ReadOnlyProxy.text
292 lxml.etree.__ContentOnlyElement.text
293 lxml.objectify.ObjectifiedElement.text
294 xml.etree.ElementTree.Element.text" class="py-name" href="#" onclick="return doclink('link-77', 'text', 'link-72');">text</a></tt> </tt>
295 </div><a name="L104"></a><tt class="py-lineno">104</tt>  <tt class="py-line"> </tt>
296 <a name="L105"></a><tt class="py-lineno">105</tt>  <tt class="py-line"> </tt>
297 <a name="L106"></a><tt class="py-lineno">106</tt>  <tt class="py-line"><tt class="py-comment"># copied from ET's ElementSoup</tt> </tt>
298 <a name="L107"></a><tt class="py-lineno">107</tt>  <tt class="py-line"> </tt>
299 <a name="L108"></a><tt class="py-lineno">108</tt>  <tt class="py-line"><tt class="py-keyword">try</tt><tt class="py-op">:</tt> </tt>
300 <a name="L109"></a><tt class="py-lineno">109</tt>  <tt class="py-line">    <tt class="py-keyword">from</tt> <tt id="link-78" class="py-name"><a title="lxml.html
301 lxml.html.diff.href_token.html
302 lxml.html.diff.tag_token.html
303 lxml.html.diff.token.html" class="py-name" href="#" onclick="return doclink('link-78', 'html', 'link-3');">html</a></tt><tt class="py-op">.</tt><tt class="py-name">entities</tt> <tt class="py-keyword">import</tt> <tt class="py-name">name2codepoint</tt> <tt class="py-comment"># Python 3</tt> </tt>
304 <a name="L110"></a><tt class="py-lineno">110</tt>  <tt class="py-line"><tt class="py-keyword">except</tt> <tt class="py-name">ImportError</tt><tt class="py-op">:</tt> </tt>
305 <a name="L111"></a><tt class="py-lineno">111</tt>  <tt class="py-line">    <tt class="py-keyword">from</tt> <tt class="py-name">htmlentitydefs</tt> <tt class="py-keyword">import</tt> <tt class="py-name">name2codepoint</tt> </tt>
306 <a name="L112"></a><tt class="py-lineno">112</tt>  <tt class="py-line"><tt class="py-keyword">import</tt> <tt class="py-name">re</tt> </tt>
307 <a name="L113"></a><tt class="py-lineno">113</tt>  <tt class="py-line"> </tt>
308 <a name="L114"></a><tt class="py-lineno">114</tt>  <tt class="py-line"><tt id="link-79" class="py-name" targets="Function lxml.html.soupparser.handle_entities()=lxml.html.soupparser-module.html#handle_entities"><a title="lxml.html.soupparser.handle_entities" class="py-name" href="#" onclick="return doclink('link-79', 'handle_entities', 'link-79');">handle_entities</a></tt> <tt class="py-op">=</tt> <tt class="py-name">re</tt><tt class="py-op">.</tt><tt class="py-name">compile</tt><tt class="py-op">(</tt><tt class="py-string">"&amp;(\w+);"</tt><tt class="py-op">)</tt><tt class="py-op">.</tt><tt class="py-name">sub</tt> </tt>
309 <a name="L115"></a><tt class="py-lineno">115</tt>  <tt class="py-line"> </tt>
310 <a name="unescape"></a><div id="unescape-def"><a name="L116"></a><tt class="py-lineno">116</tt> <a class="py-toggle" href="#" id="unescape-toggle" onclick="return toggle('unescape');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="lxml.html.soupparser-module.html#unescape">unescape</a><tt class="py-op">(</tt><tt class="py-param">string</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
311 </div><div id="unescape-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="unescape-expanded"><a name="L117"></a><tt class="py-lineno">117</tt>  <tt class="py-line">    <tt class="py-keyword">if</tt> <tt class="py-keyword">not</tt> <tt class="py-name">string</tt><tt class="py-op">:</tt> </tt>
312 <a name="L118"></a><tt class="py-lineno">118</tt>  <tt class="py-line">        <tt class="py-keyword">return</tt> <tt class="py-string">''</tt> </tt>
313 <a name="L119"></a><tt class="py-lineno">119</tt>  <tt class="py-line">    <tt class="py-comment"># work around oddities in BeautifulSoup's entity handling</tt> </tt>
314 <a name="L120"></a><tt class="py-lineno">120</tt>  <tt class="py-line">    <tt class="py-keyword">def</tt> <tt class="py-def-name">unescape_entity</tt><tt class="py-op">(</tt><tt class="py-param">m</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
315 <a name="L121"></a><tt class="py-lineno">121</tt>  <tt class="py-line">        <tt class="py-keyword">try</tt><tt class="py-op">:</tt> </tt>
316 <a name="L122"></a><tt class="py-lineno">122</tt>  <tt class="py-line">            <tt class="py-keyword">return</tt> <tt class="py-name">unichr</tt><tt class="py-op">(</tt><tt class="py-name">name2codepoint</tt><tt class="py-op">[</tt><tt class="py-name">m</tt><tt class="py-op">.</tt><tt class="py-name">group</tt><tt class="py-op">(</tt><tt class="py-number">1</tt><tt class="py-op">)</tt><tt class="py-op">]</tt><tt class="py-op">)</tt> </tt>
317 <a name="L123"></a><tt class="py-lineno">123</tt>  <tt class="py-line">        <tt class="py-keyword">except</tt> <tt class="py-name">KeyError</tt><tt class="py-op">:</tt> </tt>
318 <a name="L124"></a><tt class="py-lineno">124</tt>  <tt class="py-line">            <tt class="py-keyword">return</tt> <tt class="py-name">m</tt><tt class="py-op">.</tt><tt class="py-name">group</tt><tt class="py-op">(</tt><tt class="py-number">0</tt><tt class="py-op">)</tt> <tt class="py-comment"># use as is</tt> </tt>
319 </div><a name="L125"></a><tt class="py-lineno">125</tt>  <tt class="py-line">    <tt class="py-keyword">return</tt> <tt id="link-80" class="py-name"><a title="lxml.html.soupparser.handle_entities" class="py-name" href="#" onclick="return doclink('link-80', 'handle_entities', 'link-79');">handle_entities</a></tt><tt class="py-op">(</tt><tt class="py-name">unescape_entity</tt><tt class="py-op">,</tt> <tt class="py-name">string</tt><tt class="py-op">)</tt> </tt>
320 </div><a name="L126"></a><tt class="py-lineno">126</tt>  <tt class="py-line"> </tt><script type="text/javascript">
321 <!--
322 expandto(location.href);
323 // -->
324 </script>
325 </pre>
326 <br />
327 <!-- ==================== NAVIGATION BAR ==================== --> <!-- Bottom-of-page copy of the navigation bar that also appears at the top of the document; keep the two in sync. -->
328 <table class="navbar" border="0" width="100%" cellpadding="0"
329        bgcolor="#a0c0ff" cellspacing="0">
330   <tr valign="middle">
331   <!-- Home link: lxml-module.html -->
332       <th>&nbsp;&nbsp;&nbsp;<a
333         href="lxml-module.html">Home</a>&nbsp;&nbsp;&nbsp;</th>
334
335   <!-- Tree link: module-tree.html -->
336       <th>&nbsp;&nbsp;&nbsp;<a
337         href="module-tree.html">Trees</a>&nbsp;&nbsp;&nbsp;</th>
338
339   <!-- Index link: identifier-index.html -->
340       <th>&nbsp;&nbsp;&nbsp;<a
341         href="identifier-index.html">Indices</a>&nbsp;&nbsp;&nbsp;</th>
342
343   <!-- Help link: help.html -->
344       <th>&nbsp;&nbsp;&nbsp;<a
345         href="help.html">Help</a>&nbsp;&nbsp;&nbsp;</th>
346
347   <!-- Project homepage: "lxml API" label linking to "/" and opened in the top-level frame (target="_top"); this cell takes the remaining row width and is right-aligned -->
348       <th class="navbar" align="right" width="100%">
349         <table border="0" cellpadding="0" cellspacing="0">
350           <tr><th class="navbar" align="center"
351             ><a class="navbar" target="_top" href="/">lxml API</a></th>
352           </tr></table></th>
353   </tr>
354 </table>
355 <!-- Footer: generator credit (left) and Epydoc project link (right). The width attribute must be a valid length, i.e. "100%". --> <table border="0" cellpadding="0" cellspacing="0" width="100%">
356   <tr>
357     <td align="left" class="footer">
358     Generated by Epydoc 3.0.1 on Tue Jul 31 10:14:23 2012
359     </td>
360     <td align="right" class="footer">
361       <a target="mainFrame" href="http://epydoc.sourceforge.net"
362         >http://epydoc.sourceforge.net</a>
363     </td>
364   </tr>
365 </table>
366
367 <script type="text/javascript">
368   <!--
369   // Private objects are initially displayed (because if
370   // JavaScript is turned off then we want them to be
371   // visible); but by default, we want to hide them.  So hide
372   // them unless we have a cookie that says to show them. NOTE(review): checkCookie() is presumably provided by epydoc.js (loaded in the document head) - confirm.
373   checkCookie();
374   // -->
375 </script>
376 </body>
377 </html>