From 2fcaeb6e916a09fa87b4b2ab57167c39db6cef8c Mon Sep 17 00:00:00 2001 From: Leonard Richardson Date: Sun, 7 Jul 2019 21:46:36 -0400 Subject: &apos; (which is valid in XML and XHTML, but not HTML 4) is now recognized as a named entity and converted to a single quote. [bug=1818721] --- bs4/testing.py | 6 ++++++ 1 file changed, 6 insertions(+) (limited to 'bs4/testing.py') diff --git a/bs4/testing.py b/bs4/testing.py index e144e7e..9f12e8d 100644 --- a/bs4/testing.py +++ b/bs4/testing.py @@ -491,6 +491,12 @@ Hello, world! u"

<p>\u2022 AT&amp;T is in the s&amp;p 500</p>

" ) + def test_apos_entity(self): + self.assertSoupEquals( + u"

<p>Bob&apos;s Bar</p>

", + u"

<p>Bob's Bar</p>

", + ) + def test_entities_in_foreign_document_encoding(self): # &#147; and &#148; are invalid numeric entities referencing # Windows-1252 characters. &#45; references a character common -- cgit v1.2.3