Use readabilite properly
Not through some weird wrapper anymore
This commit is contained in:
		@@ -15,6 +15,7 @@ import lxml.html
 | 
			
		||||
from . import feeds
 | 
			
		||||
from . import feedify
 | 
			
		||||
from . import crawler
 | 
			
		||||
from . import readabilite
 | 
			
		||||
 | 
			
		||||
import wsgiref.simple_server
 | 
			
		||||
import wsgiref.handlers
 | 
			
		||||
@@ -79,12 +80,6 @@ def log(txt, force=False):
 | 
			
		||||
            print(repr(txt))
 | 
			
		||||
 | 
			
		||||
 | 
			
		||||
from . import readabilite
 | 
			
		||||
def readability(html, url):
 | 
			
		||||
    return readabilite.get_article(html)
 | 
			
		||||
 | 
			
		||||
 | 
			
		||||
 | 
			
		||||
def len_html(txt):
 | 
			
		||||
    if len(txt):
 | 
			
		||||
        return len(lxml.html.fromstring(txt).text_content())
 | 
			
		||||
@@ -287,7 +282,7 @@ def Fill(item, options, feedurl='/', fast=False):
 | 
			
		||||
        log('non-text page')
 | 
			
		||||
        return True
 | 
			
		||||
 | 
			
		||||
    out = readability(data, con.url)
 | 
			
		||||
    out = readabilite.get_article(data)
 | 
			
		||||
 | 
			
		||||
    if options.hungry or count_words(out) > max(count_content, count_desc):
 | 
			
		||||
        item.push_content(out)
 | 
			
		||||
 
 | 
			
		||||
		Reference in New Issue
	
	Block a user