From 3624be8f5ca563fd4ab3db4d602db2ff76955e65 Mon Sep 17 00:00:00 2001 From: Wayne Huang <maximum.huang@gmail.com> Date: Tue, 9 Jun 2015 15:39:28 +0800 Subject: [PATCH 1/2] replace urllib2 by requests to avoid the "SSL: CERTIFICATE_VERIFY_FAILED" --- opengraph/opengraph.py | 6 +++--- setup.py | 3 ++- 2 files changed, 5 insertions(+), 4 deletions(-) diff --git a/opengraph/opengraph.py b/opengraph/opengraph.py index 9cedb97..4b329a0 100644 --- a/opengraph/opengraph.py +++ b/opengraph/opengraph.py @@ -1,7 +1,7 @@ # encoding: utf-8 import re -import urllib2 +import requests try: from bs4 import BeautifulSoup except ImportError: @@ -48,7 +48,7 @@ def fetch(self, url): """ """ raw = urllib2.urlopen(url) - html = raw.read() + html = raw.text return self.parser(html) def parser(self, html): @@ -123,4 +123,4 @@ def scrape_url(self, doc): def scrape_description(self, doc): tag = doc.html.head.findAll('meta', attrs={"name":"description"}) result = "".join([t['content'] for t in tag]) - return result \ No newline at end of file + return result diff --git a/setup.py b/setup.py index 9d1677e..71c21fa 100644 --- a/setup.py +++ b/setup.py @@ -23,7 +23,8 @@ include_package_data=True, zip_safe=False, install_requires=[ - 'beautifulsoup4' + 'beautifulsoup4', + 'requests' ], entry_points=""" # -*- Entry points: -*- From b3e89597e230a2d5459deeda8c2e944dcb0ffa1d Mon Sep 17 00:00:00 2001 From: Wayne Huang <maximum.huang@gmail.com> Date: Tue, 9 Jun 2015 15:41:10 +0800 Subject: [PATCH 2/2] fix typo --- opengraph/opengraph.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/opengraph/opengraph.py b/opengraph/opengraph.py index 4b329a0..58f98a8 100644 --- a/opengraph/opengraph.py +++ b/opengraph/opengraph.py @@ -47,7 +47,7 @@ def __getattr__(self, name): def fetch(self, url): """ """ - raw = urllib2.urlopen(url) + raw = requests.get(url) html = raw.text return self.parser(html)