Implement function error() for HTMLParser
1. Handle EXCEPTION [getTitleData]: (NotImplementedError) subclasses of ParserBase must override error(). Seen with URL: http://www.mycplus.com/featured-articles/top-ten-c-language-resources/
2. Add a debug log to show when the server's response is gzip-encoded.
This commit is contained in:
parent
7bde1f7ec6
commit
894b16a7ef
5
buku
5
buku
@ -103,6 +103,9 @@ class BMHTMLParser(HTMLParser.HTMLParser):
|
||||
if self.lasttag == "title" and self.inTitle == True:
|
||||
self.data += data
|
||||
|
||||
def error(self, message):
|
||||
pass
|
||||
|
||||
|
||||
|
||||
def getDataPath():
|
||||
@ -240,6 +243,8 @@ def getTitleData(resp):
|
||||
charset = resp.headers.get_content_charset()
|
||||
|
||||
if resp.headers.get('Content-Encoding') == 'gzip':
|
||||
if debug:
|
||||
print("gzip response")
|
||||
data = gzip.GzipFile(fileobj=io.BytesIO(resp.read())).read()
|
||||
else:
|
||||
data = resp.read()
|
||||
|
Loading…
Reference in New Issue
Block a user