diff options
author | Leonard Richardson <leonard.richardson@canonical.com> | 2012-02-15 10:25:56 -0500 |
---|---|---|
committer | Leonard Richardson <leonard.richardson@canonical.com> | 2012-02-15 10:25:56 -0500 |
commit | 6675b6b04bb3228bdca3fe70d1c632c7e180fc31 (patch) | |
tree | ffc6e4a48947f7070eed982591ba79b1e13f6ed3 /bs4/tests/test_lxml.py | |
parent | 8d0d071f41c59b16e9f4cf361cf08c3359cce05a (diff) |
Tested improvements to html5lib treebuilder.
Diffstat (limited to 'bs4/tests/test_lxml.py')
-rw-r--r-- | bs4/tests/test_lxml.py | 26 |
1 files changed, 26 insertions, 0 deletions
diff --git a/bs4/tests/test_lxml.py b/bs4/tests/test_lxml.py index 0adef20..e2cb2d2 100644 --- a/bs4/tests/test_lxml.py +++ b/bs4/tests/test_lxml.py @@ -332,6 +332,32 @@ class TestLXMLBuilderInvalidMarkup(SoupTest): '<tr><td>foo</td></tr>' '</table></td>') + + def test_unclosed_a_tag(self): + # <a> tags really ought to be closed at some point. + # + # We have all the <div> tags because HTML5 says to duplicate + # the <a> tag rather than closing it, and that's what html5lib + # does. + markup = """<div id="1"> + <a href="foo"> +</div> +<div id="2"> + <div id="3"> + <a href="bar"></a> + </div> +</div>""" + + expect = """<div id="1"> +<a href="foo"> +</a></div> +<div id="2"> +<div id="3"> +<a href="bar"></a> +</div> +</div>""" + self.assertSoupEquals(markup, expect) + def test_unclosed_block_level_elements(self): # Unclosed block-level elements should be closed. self.assertSoupEquals( |