diff options
author | cedricbonhomme <devnull@localhost> | 2010-07-07 11:40:31 +0200 |
---|---|---|
committer | cedricbonhomme <devnull@localhost> | 2010-07-07 11:40:31 +0200 |
commit | ae508ad4d7968a03f1254d82b3da6bdf541fd515 (patch) | |
tree | 2ff5ec88926c5c585d16632797552bd92b741bd7 /feedgetter.py | |
parent | Faster top_words function. (diff) | |
download | newspipe-ae508ad4d7968a03f1254d82b3da6bdf541fd515.tar.gz newspipe-ae508ad4d7968a03f1254d82b3da6bdf541fd515.tar.bz2 newspipe-ae508ad4d7968a03f1254d82b3da6bdf541fd515.zip |
Lot of performance improvements
Diffstat (limited to 'feedgetter.py')
-rwxr-xr-x | feedgetter.py | 9 |
1 files changed, 1 insertions, 8 deletions
```diff
diff --git a/feedgetter.py b/feedgetter.py
index 267246db..d2aca435 100755
--- a/feedgetter.py
+++ b/feedgetter.py
@@ -16,13 +16,6 @@ from datetime import datetime
 
 import utils
 
-url_finders = [ \
-    re.compile("([0-9]{1,3}\\.[0-9]{1,3}\\.[0-9]{1,3}\\.[0-9]{1,3}|(((news|telnet|nttp|file|http|ftp|https)://)|(www|ftp)[-A-Za-z0-9]*\\.)[-A-Za-z0-9\\.]+)(:[0-9]*)?/[-A-Za-z0-9_\\$\\.\\+\\!\\*\\(\\),;:@&=\\?/~\\#\\%]*[^]'\\.}>\\),\\\"]"), \
-    re.compile("([0-9]{1,3}\\.[0-9]{1,3}\\.[0-9]{1,3}\\.[0-9]{1,3}|(((news|telnet|nttp|file|http|ftp|https)://)|(www|ftp)[-A-Za-z0-9]*\\.)[-A-Za-z0-9\\.]+)(:[0-9]*)?"), \
-    re.compile("(~/|/|\\./)([-A-Za-z0-9_\\$\\.\\+\\!\\*\\(\\),;:@&=\\?/~\\#\\%]|\\\\)+"), \
-    re.compile("'\\<((mailto:)|)[-A-Za-z0-9\\.]+@[-A-Za-z0-9\\.]+"), \
-]
-
 feeds_list = []
 list_of_threads = []
 
@@ -47,7 +40,7 @@ class FeedGetter(object):
         with open("./var/feed.lst") as f:
             for a_feed in f:
                 # test if the URL is well formed
-                for url_regexp in url_finders:
+                for url_regexp in utils.url_finders:
                     if url_regexp.match(a_feed):
                         the_good_url = url_regexp.match(a_feed).group(0).replace("\n", "")
                         try:
```