diff options
author | Leonard Richardson <leonardr@segfault.org> | 2012-07-03 17:59:25 -0400 |
---|---|---|
committer | Leonard Richardson <leonardr@segfault.org> | 2012-07-03 17:59:25 -0400 |
commit | 96eaf6e8f54d84b02e0c3c8c334e7cfd29ef343c (patch) | |
tree | 7896fbad9bee2fac1f8e89df3d9235cfd4945e40 /bs4/tests/test_soup.py | |
parent | f0102682ece130382500f0ee58fbc3340f221d54 (diff) |
Mentioned cchardet in docs.
Diffstat (limited to 'bs4/tests/test_soup.py')
-rw-r--r-- | bs4/tests/test_soup.py | 12 |
1 files changed, 6 insertions, 6 deletions
diff --git a/bs4/tests/test_soup.py b/bs4/tests/test_soup.py index 0d04558..a10a89e 100644 --- a/bs4/tests/test_soup.py +++ b/bs4/tests/test_soup.py @@ -153,7 +153,7 @@ class TestEncodingConversion(SoupTest): unicode_output = soup_from_ascii.decode() self.assertTrue(isinstance(unicode_output, unicode)) self.assertEqual(unicode_output, self.document_for(ascii.decode())) - self.assertEqual(soup_from_ascii.original_encoding, "ascii") + self.assertEqual(soup_from_ascii.original_encoding.lower(), "ascii") def test_unicode_in_unicode_out(self): # Unicode input is left alone. The original_encoding attribute @@ -207,30 +207,30 @@ class TestUnicodeDammit(unittest.TestCase): utf8 = b"\xc3\xa9" dammit = UnicodeDammit(utf8) self.assertEqual(dammit.unicode_markup, u'\xe9') - self.assertEqual(dammit.original_encoding, 'utf-8') + self.assertEqual(dammit.original_encoding.lower(), 'utf-8') def test_convert_hebrew(self): hebrew = b"\xed\xe5\xec\xf9" dammit = UnicodeDammit(hebrew, ["iso-8859-8"]) - self.assertEqual(dammit.original_encoding, 'iso-8859-8') + self.assertEqual(dammit.original_encoding.lower(), 'iso-8859-8') self.assertEqual(dammit.unicode_markup, u'\u05dd\u05d5\u05dc\u05e9') def test_dont_see_smart_quotes_where_there_are_none(self): utf_8 = b"\343\202\261\343\203\274\343\202\277\343\202\244 Watch" dammit = UnicodeDammit(utf_8) - self.assertEqual(dammit.original_encoding, 'utf-8') + self.assertEqual(dammit.original_encoding.lower(), 'utf-8') self.assertEqual(dammit.unicode_markup.encode("utf-8"), utf_8) def test_ignore_inappropriate_codecs(self): utf8_data = u"Räksmörgås".encode("utf-8") dammit = UnicodeDammit(utf8_data, ["iso-8859-8"]) - self.assertEqual(dammit.original_encoding, 'utf-8') + self.assertEqual(dammit.original_encoding.lower(), 'utf-8') def test_ignore_invalid_codecs(self): utf8_data = u"Räksmörgås".encode("utf-8") for bad_encoding in ['.utf8', '...', 'utF---16.!']: dammit = UnicodeDammit(utf8_data, [bad_encoding]) - self.assertEqual(dammit.original_encoding, 'utf-8') + self.assertEqual(dammit.original_encoding.lower(), 'utf-8') def test_detect_html5_style_meta_tag(self): |