Widely improve the feedsportal URL decoder

master
pictuga 2015-06-14 20:32:47 +08:00
parent 8418212475
commit 5c2151ffd6
1 changed files with 6 additions and 3 deletions

View File

@ -196,9 +196,12 @@ def Fix(item, feedurl='/'):
match = re.search('/([0-9a-zA-Z]{20,})/story01.htm$', item.link) match = re.search('/([0-9a-zA-Z]{20,})/story01.htm$', item.link)
if match: if match:
url = match.groups()[0].split('0') url = match.groups()[0].split('0')
t = {'A': '0', 'B': '.', 'C': '/', 'D': '?', 'E': '-', 'H': ',', 'I': '_', 'L': 'http://', 'S': 'www.', t = {'A': '0', 'B': '.', 'C': '/', 'D': '?', 'E': '-', 'F': '=',
'N': '.com', 'O': '.co.uk'} 'G': '&', 'H': ',', 'I': '_', 'J': '%', 'K': '+', 'L': 'http://',
item.link = ''.join([(t[s[0]] if s[0] in t else '=') + s[1:] for s in url[1:]]) 'M': 'https://', 'N': '.com', 'O': '.co.uk', 'P': ';', 'Q': '|',
'R': ':', 'S': 'www.', , 'T': '#', 'U': '$', 'V': '~', 'W': '!',
'X': '(', 'Y': ')', 'Z': 'Z'}
item.link = ''.join([(t[s[0]] if s[0] in t else s[0]) + s[1:] for s in url[1:]])
log(item.link) log(item.link)
# reddit # reddit