Merge.

author: Leonard Richardson <leonard.richardson@canonical.com> 2013-05-15 11:10:12 -0400
committer: Leonard Richardson <leonard.richardson@canonical.com> 2013-05-15 11:10:12 -0400
commit: 87c7f93d7feb8bd982dbbc42d814352b60be344d (patch)
tree: 3905df101f631ca66055ab2af50c36d34227268b /bs4
parent: ada530f6bc24bf4e536c1c859d798b836ec0799c (diff)
parent: c3cc17f0dda7d378890a12fd8b5c29de9f923dab (diff)
3 files changed, 18 insertions, 10 deletions
diff --git a/bs4/diagnose.py b/bs4/diagnose.py
index d4e657c..4b5f6e4 100644
--- a/bs4/diagnose.py
+++ b/bs4/diagnose.py
@@ -14,11 +14,6 @@ def diagnose(data):
     print "Diagnostic running on Beautiful Soup %s" % __version__
     print "Python version %s" % sys.version
 
-    if hasattr(data, 'read'):
-        data = data.read()
-    elif os.path.exists(data):
-        print '"%s" looks like a filename. Reading data from the file.' % data
-        data = open(data).read()
     basic_parsers = ["html.parser", "html5lib", "lxml"]
     for name in basic_parsers:
         for builder in builder_registry.builders:
@@ -38,6 +33,16 @@ def diagnose(data):
     if 'html5lib' in basic_parsers:
         import html5lib
         print "Found html5lib version %s" % html5lib.__version__
+
+    if hasattr(data, 'read'):
+        data = data.read()
+    elif os.path.exists(data):
+        print '"%s" looks like a filename. Reading data from the file.' % data
+        data = open(data).read()
+    elif data.startswith("http:") or data.startswith("https:"):
+        print '"%s" looks like a URL. Beautiful Soup is not an HTTP client.' % data
+        print "You need to use some other library to get the document behind the URL, and feed that document to Beautiful Soup."
+        return
     print
 
     for parser in basic_parsers:
diff --git a/bs4/element.py b/bs4/element.py
index 1f121f4..f6864f2 100644
--- a/bs4/element.py
+++ b/bs4/element.py
@@ -1392,10 +1392,13 @@ class Tag(PageElement):
     def recursiveChildGenerator(self):
         return self.descendants
 
-    # This was kind of misleading because has_key() (attributes) was
-    # different from __in__ (contents). has_key() is gone in Python 3,
-    # anyway.
-    has_key = has_attr
+    def has_key(self, key):
+        """This was kind of misleading because has_key() (attributes)
+        was different from __in__ (contents). has_key() is gone in
+        Python 3, anyway."""
+        warnings.warn('has_key is deprecated. Use has_attr("%s") instead.' % (
+                key))
+        return self.has_attr(key)
 
 # Next, a couple classes to represent queries and their results.
 class SoupStrainer(object):
diff --git a/bs4/tests/test_tree.py b/bs4/tests/test_tree.py
index b07de8c..f60485b 100644
--- a/bs4/tests/test_tree.py
+++ b/bs4/tests/test_tree.py
@@ -1618,7 +1618,7 @@ class TestSoupSelector(TreeTest):
         for el in els:
             self.assertEqual(el.name, 'p')
         self.assertEqual(els[1]['class'], ['onep'])
-        self.assertFalse(els[0].has_key('class'))
+        self.assertFalse(els[0].has_attr('class'))
 
     def test_a_bunch_of_emptys(self):
         for selector in ('div#main del', 'div#main div.oops', 'div div#main'):
author	Leonard Richardson <leonard.richardson@canonical.com>	2013-05-15 11:10:12 -0400
committer	Leonard Richardson <leonard.richardson@canonical.com>	2013-05-15 11:10:12 -0400
commit	87c7f93d7feb8bd982dbbc42d814352b60be344d (patch)
tree	3905df101f631ca66055ab2af50c36d34227268b /bs4
parent	ada530f6bc24bf4e536c1c859d798b836ec0799c (diff)
parent	c3cc17f0dda7d378890a12fd8b5c29de9f923dab (diff)