diff --git a/morss/readabilite.py b/morss/readabilite.py index 6498a77..3412a57 100644 --- a/morss/readabilite.py +++ b/morss/readabilite.py @@ -93,6 +93,7 @@ def score_node(node): class_id = node.get('class', '') + node.get('id', '') if (isinstance(node, lxml.html.HtmlComment) + or isinstance(node, lxml.html.HtmlProcessingInstruction) or node.tag in tags_bad or regex_bad.search(class_id)): return 0