From ef51152bcd21a8082e90d979e053e0f9703fbc0b Mon Sep 17 00:00:00 2001 From: Samuel Clay Date: Fri, 29 Sep 2017 10:50:08 -0700 Subject: [PATCH] Updating readability class names to look for. --- apps/rss_feeds/text_importer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/apps/rss_feeds/text_importer.py b/apps/rss_feeds/text_importer.py index 051a3bcd9..4a49c618c 100644 --- a/apps/rss_feeds/text_importer.py +++ b/apps/rss_feeds/text_importer.py @@ -76,7 +76,7 @@ class TextImporter: text = text.replace("\u00a0", " ") # Non-breaking space, is mangled when encoding is not utf-8 original_text_doc = readability.Document(text, url=resp.url, - positive_keywords="postContent, postField") + positive_keywords="post, entry, postProp, article, postContent, postField") try: content = original_text_doc.summary(html_partial=True) except (readability.Unparseable, ParserError), e: