From 44a6b2591d72c9e66be82b61f021948e7fc7d641 Mon Sep 17 00:00:00 2001 From: pictuga Date: Sun, 7 Nov 2021 19:44:36 +0100 Subject: [PATCH] crawler: cleaner http header object import --- morss/crawler.py | 12 +++++------- 1 file changed, 5 insertions(+), 7 deletions(-) diff --git a/morss/crawler.py b/morss/crawler.py index 396d21d..8d90ad8 100644 --- a/morss/crawler.py +++ b/morss/crawler.py @@ -19,7 +19,6 @@ import os import pickle import random import re -import sys import time import zlib from cgi import parse_header @@ -34,14 +33,14 @@ try: # python 2 from urllib import quote - import mimetools + from mimetools import Message as message_from_string from urllib2 import (BaseHandler, HTTPCookieProcessor, HTTPRedirectHandler, Request, addinfourl, build_opener, parse_http_list, parse_keqv_list) from urlparse import urlparse, urlunparse except ImportError: # python 3 - import email + from email import message_from_string from urllib.parse import quote, urlparse, urlunparse from urllib.request import (BaseHandler, HTTPCookieProcessor, HTTPRedirectHandler, Request, addinfourl, @@ -461,10 +460,7 @@ class CacheHandler(BaseHandler): data = None else: - if sys.version_info[0] >= 3: - data['headers'] = email.message_from_string(data['headers'] or unicode()) # headers - else: - data['headers'] = mimetools.Message(StringIO(data['headers'] or unicode())) + data['headers'] = message_from_string(data['headers'] or unicode()) # headers return data @@ -618,6 +614,8 @@ if 'IGNORE_SSL' in os.environ: if __name__ == '__main__': + import sys + req = adv_get(sys.argv[1] if len(sys.argv) > 1 else 'https://morss.it') if sys.flags.interactive: