summaryrefslogtreecommitdiff
path: root/bs4/tests/test_lxml.py
diff options
context:
space:
mode:
authorLeonard Richardson <leonard.richardson@canonical.com>2012-02-15 10:25:56 -0500
committerLeonard Richardson <leonard.richardson@canonical.com>2012-02-15 10:25:56 -0500
commit6675b6b04bb3228bdca3fe70d1c632c7e180fc31 (patch)
treeffc6e4a48947f7070eed982591ba79b1e13f6ed3 /bs4/tests/test_lxml.py
parent8d0d071f41c59b16e9f4cf361cf08c3359cce05a (diff)
Tested improvements to html5lib treebuilder.
Diffstat (limited to 'bs4/tests/test_lxml.py')
-rw-r--r--bs4/tests/test_lxml.py26
1 files changed, 26 insertions, 0 deletions
diff --git a/bs4/tests/test_lxml.py b/bs4/tests/test_lxml.py
index 0adef20..e2cb2d2 100644
--- a/bs4/tests/test_lxml.py
+++ b/bs4/tests/test_lxml.py
@@ -332,6 +332,32 @@ class TestLXMLBuilderInvalidMarkup(SoupTest):
'<tr><td>foo</td></tr>'
'</table></td>')
+
+ def test_unclosed_a_tag(self):
+ # <a> tags really ought to be closed at some point.
+ #
+ # We have all the <div> tags because HTML5 says to duplicate
+ # the <a> tag rather than closing it, and that's what html5lib
+ # does.
+ markup = """<div id="1">
+ <a href="foo">
+</div>
+<div id="2">
+ <div id="3">
+ <a href="bar"></a>
+ </div>
+</div>"""
+
+ expect = """<div id="1">
+<a href="foo">
+</a></div>
+<div id="2">
+<div id="3">
+<a href="bar"></a>
+</div>
+</div>"""
+ self.assertSoupEquals(markup, expect)
+
def test_unclosed_block_level_elements(self):
# Unclosed block-level elements should be closed.
self.assertSoupEquals(