diff options
author | cedricbonhomme <devnull@localhost> | 2011-06-01 09:40:38 +0200 |
---|---|---|
committer | cedricbonhomme <devnull@localhost> | 2011-06-01 09:40:38 +0200 |
commit | 74a77378743564072129a656fb0cbf869937bc81 (patch) | |
tree | 7c373b89b098637ae2f7c3c02f6ffc7d46bfd9c2 | |
parent | Minor improvement: HTML purification of articles description with BeautifulSo... (diff) | |
download | newspipe-74a77378743564072129a656fb0cbf869937bc81.tar.gz newspipe-74a77378743564072129a656fb0cbf869937bc81.tar.bz2 newspipe-74a77378743564072129a656fb0cbf869937bc81.zip |
Removed useless code in utils.py. Improved the CSS tooltip description.
-rwxr-xr-x | pyAggr3g470r.py | 2 | ||||
-rwxr-xr-x | utils.py | 2 |
2 files changed, 3 insertions, 1 deletion
diff --git a/pyAggr3g470r.py b/pyAggr3g470r.py
index 33a5da2c..67beea86 100755
--- a/pyAggr3g470r.py
+++ b/pyAggr3g470r.py
@@ -35,6 +35,7 @@ import calendar
 import threading
 from collections import Counter
+from BeautifulSoup import BeautifulSoup
 import utils
 import feedgetter
@@ -180,6 +181,7 @@ class Root:
         article_content = utils.clear_string(article.article_description)
         if article_content:
             description = " ".join(article_content[:500].split(' ')[:-1])
+            description = str(BeautifulSoup(description))
         else:
             description = "No description."
         # Title of the article
diff --git a/utils.py b/utils.py
--- a/utils.py
+++ b/utils.py
@@ -103,7 +103,7 @@ def clear_string(data):
     """
     p = re.compile(r'<[^<]*?/?>') # HTML tags
     q = re.compile(r'\s') # consecutive white spaces
-    return p.sub('', q.sub(' ', data.replace('', '')))
+    return p.sub('', q.sub(' ', data))
 def unescape(text):
     """