crawler: fix accept code
parent
67f5a21019
commit
99f3c519f2
|
@ -45,7 +45,10 @@ def custom_handler(accept=None, strict=False, delay=None, encoding=None, basic=F
|
||||||
handlers.append(AutoRefererHandler())
|
handlers.append(AutoRefererHandler())
|
||||||
|
|
||||||
handlers.append(EncodingFixHandler(encoding))
|
handlers.append(EncodingFixHandler(encoding))
|
||||||
|
|
||||||
|
if accept:
|
||||||
handlers.append(ContentNegociationHandler(MIMETYPE[accept], strict))
|
handlers.append(ContentNegociationHandler(MIMETYPE[accept], strict))
|
||||||
|
|
||||||
handlers.append(SQliteCacheHandler(delay))
|
handlers.append(SQliteCacheHandler(delay))
|
||||||
|
|
||||||
return build_opener(*handlers)
|
return build_opener(*handlers)
|
||||||
|
@ -164,7 +167,7 @@ class ContentNegociationHandler(BaseHandler):
|
||||||
|
|
||||||
def http_response(self, req, resp):
|
def http_response(self, req, resp):
|
||||||
contenttype = resp.info().get('Content-Type', '').split(';')[0]
|
contenttype = resp.info().get('Content-Type', '').split(';')[0]
|
||||||
if 200 <= resp.code < 300 and self.strict and contenttype in MIMETYPE['html'] and contenttype not in self.accept:
|
if 200 <= resp.code < 300 and self.accept is not None and self.strict and contenttype in MIMETYPE['html'] and contenttype not in self.accept:
|
||||||
# opps, not what we were looking for, let's see if the html page suggests an alternative page of the right types
|
# opps, not what we were looking for, let's see if the html page suggests an alternative page of the right types
|
||||||
|
|
||||||
data = resp.read()
|
data = resp.read()
|
||||||
|
|
Loading…
Reference in New Issue