aboutsummaryrefslogtreecommitdiff
path: root/source/sqlite2mongo.py
diff options
context:
space:
mode:
author cedricbonhomme <devnull@localhost> 2012-04-15 18:59:50 +0200
committer cedricbonhomme <devnull@localhost> 2012-04-15 18:59:50 +0200
commit e6472738b5253aa328f8b2a4f4f2a23abc8582c2 (patch)
tree c61704deed1d3cb37f5e3961794896c6dd115ba5 /source/sqlite2mongo.py
parent Better use of datetime. (diff)
download newspipe-e6472738b5253aa328f8b2a4f4f2a23abc8582c2.tar.gz
newspipe-e6472738b5253aa328f8b2a4f4f2a23abc8582c2.tar.bz2
newspipe-e6472738b5253aa328f8b2a4f4f2a23abc8582c2.zip
Reorganization of folders.
Diffstat (limited to 'source/sqlite2mongo.py')
-rw-r--r-- source/sqlite2mongo.py 78
1 files changed, 78 insertions, 0 deletions
diff --git a/source/sqlite2mongo.py b/source/sqlite2mongo.py
new file mode 100644
index 00000000..633fb8f9
--- /dev/null
+++ b/source/sqlite2mongo.py
@@ -0,0 +1,78 @@
+#! /usr/bin/env python
+# -*- coding: utf-8 -*-
+
+import hashlib
+import sqlite3
+import mongodb
+
+import utils
+
+from datetime import datetime
+
+# Path of the SQLite database file opened by sqlite2mongo().
+SQLITE_BASE = "./var/feed.db"
+
+
+def sqlite2mongo():
+    """
+    Copy every feed and its articles from the SQLite base into MongoDB.
+
+    Reads all rows of the ``feeds`` table of SQLITE_BASE. For each feed,
+    one feed document is stored through ``add_collection`` and the rows of
+    the ``articles`` table whose ``feed_link`` matches are stored through
+    ``add_articles`` of a ``mongodb.Articles`` instance. Feed and article
+    identifiers are the SHA-1 hex digest of their link.
+
+    The migration is best effort: if the SQLite base cannot be read,
+    nothing is imported, and a feed whose articles cannot be queried is
+    skipped. Errors raised by the MongoDB layer are not caught.
+    """
+    mongo = mongodb.Articles()
+
+    try:
+        conn = sqlite3.connect(SQLITE_BASE, isolation_level=None)
+    except sqlite3.Error:
+        # No readable SQLite base: nothing to migrate.
+        return
+
+    c = conn.cursor()
+    try:
+        try:
+            list_of_feeds = c.execute("SELECT * FROM feeds").fetchall()
+        except sqlite3.Error:
+            # Missing or unreadable 'feeds' table: nothing to migrate.
+            return
+
+        # Walk through the list of feeds.
+        # Columns used: 0=title, 1=site link, 2=feed link, 3=image, 4=mail.
+        for feed in list_of_feeds:
+            feed_link = feed[2]
+            if feed_link is None:
+                # A feed without a link has no identifier and no articles
+                # to match: skip it.
+                continue
+
+            try:
+                # Bound parameter instead of string concatenation, so links
+                # containing quotes neither break nor alter the query.
+                list_of_articles = c.execute(
+                    "SELECT * FROM articles WHERE feed_link=?",
+                    (feed_link,)).fetchall()
+            except sqlite3.Error:
+                continue
+
+            feed_id = hashlib.sha1(feed_link.encode('utf-8')).hexdigest()
+
+            new_collection = {"feed_id": feed_id.encode('utf-8'),
+                              "type": 0,
+                              "feed_image": feed[3].encode('utf-8'),
+                              "feed_title": feed[0].encode('utf-8'),
+                              "feed_link": feed_link.encode('utf-8'),
+                              "site_link": feed[1].encode('utf-8'),
+                              "mail": feed[4] == "1"}
+
+            mongo.add_collection(new_collection)
+
+            if not list_of_articles:
+                continue
+
+            # Walk through the list of articles for the current feed.
+            # Columns used: 0=date, 1=title, 2=link, 3=content, 4=read flag,
+            # 6=like flag.
+            articles = []
+            for row in list_of_articles:
+                article_id = hashlib.sha1(row[2].encode('utf-8')).hexdigest()
+
+                articles.append({
+                    "article_id": article_id.encode('utf-8'),
+                    "type": 1,
+                    "article_date": utils.string_to_datetime(row[0]),
+                    "article_link": row[2].encode('utf-8'),
+                    "article_title": row[1].encode('utf-8'),
+                    "article_content": row[3].encode('utf-8'),
+                    "article_readed": row[4] == "1",
+                    "article_like": row[6] == "1",
+                })
+
+            mongo.add_articles(articles, feed_id)
+    finally:
+        # Release the SQLite resources even if a MongoDB call raised.
+        c.close()
+        conn.close()
+
+if __name__ == "__main__":
+    # Run the migration when this file is executed as a script.
+    sqlite2mongo()
\ No newline at end of file
bgstack15