From 6675b6b04bb3228bdca3fe70d1c632c7e180fc31 Mon Sep 17 00:00:00 2001 From: Leonard Richardson Date: Wed, 15 Feb 2012 10:25:56 -0500 Subject: Tested improvements to html5lib treebuilder. --- bs4/tests/test_lxml.py | 26 ++++++++++++++++++++++++++ 1 file changed, 26 insertions(+) (limited to 'bs4/tests/test_lxml.py') diff --git a/bs4/tests/test_lxml.py b/bs4/tests/test_lxml.py index 0adef20..e2cb2d2 100644 --- a/bs4/tests/test_lxml.py +++ b/bs4/tests/test_lxml.py @@ -332,6 +332,32 @@ class TestLXMLBuilderInvalidMarkup(SoupTest): 'foo' '') + + def test_unclosed_a_tag(self): + # <a> tags really ought to be closed at some point. + # + # We have all the <div>
tags because HTML5 says to duplicate + # the <a> tag rather than closing it, and that's what html5lib + # does. + markup = """ +""" + + expect = """
+ +
+
+
+ +
+
""" + self.assertSoupEquals(markup, expect) + def test_unclosed_block_level_elements(self): # Unclosed block-level elements should be closed. self.assertSoupEquals( -- cgit v1.2.3 From d8edc821b2bef6dd302ee88782f8c458e06eaf37 Mon Sep 17 00:00:00 2001 From: Leonard Richardson Date: Wed, 15 Feb 2012 11:03:44 -0500 Subject: Tested and cleaned up html5lib insertBefore. --- bs4/tests/test_lxml.py | 3 +++ 1 file changed, 3 insertions(+) (limited to 'bs4/tests/test_lxml.py') diff --git a/bs4/tests/test_lxml.py b/bs4/tests/test_lxml.py index e2cb2d2..359f619 100644 --- a/bs4/tests/test_lxml.py +++ b/bs4/tests/test_lxml.py @@ -381,6 +381,9 @@ class TestLXMLBuilderInvalidMarkup(SoupTest): '
', '
') + def test_floating_text_in_table(self): + self.assertSoupEquals("foo
bar
") + def test_paragraphs_containing_block_display_elements(self): markup = self.soup("

this is the definition:" "

first case
") -- cgit v1.2.3