From a00624d7fc2e29b41b286f46844cb75f4d96ff63 Mon Sep 17 00:00:00 2001 From: Leonard Richardson Date: Mon, 31 May 2021 15:49:41 -0400 Subject: The html.parser tree builder can now handle named entities found in the HTML5 spec in much the same way that the html5lib tree builder does. Note that the lxml tree builder still handles named entities differently. [bug=1924908] --- CHANGELOG | 5 + bs4/builder/_htmlparser.py | 2 +- bs4/dammit.py | 2387 +++++++++++++++++++++++++++++++++++++++++- bs4/testing.py | 7 +- bs4/tests/test_html5lib.py | 36 + bs4/tests/test_htmlparser.py | 32 + bs4/tests/test_lxml.py | 2 +- bs4/tests/test_soup.py | 45 + 8 files changed, 2484 insertions(+), 32 deletions(-) diff --git a/CHANGELOG b/CHANGELOG index 9ce7bf3..78297f0 100644 --- a/CHANGELOG +++ b/CHANGELOG @@ -47,6 +47,11 @@ guarantee that this will hold for the next release. the