diff options
Diffstat (limited to 'source/export.py')
-rw-r--r-- | source/export.py | 190 |
1 files changed, 190 insertions, 0 deletions
diff --git a/source/export.py b/source/export.py new file mode 100644 index 00000000..a14d47c0 --- /dev/null +++ b/source/export.py @@ -0,0 +1,190 @@ +#! /usr/bin/env python +#-*- coding: utf-8 -*- + +# pyAggr3g470r - A Web based news aggregator. +# Copyright (C) 2010 Cédric Bonhomme - http://cedricbonhomme.org/ +# +# For more information : http://bitbucket.org/cedricbonhomme/pyaggr3g470r/ +# +# This program is free software: you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation, either version 3 of the License, or +# (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with this program. If not, see <http://www.gnu.org/licenses/> + +__author__ = "Cedric Bonhomme" +__version__ = "$Revision: 0.1 $" +__date__ = "$Date: 2011/10/24 $" +__copyright__ = "Copyright (c) Cedric Bonhomme" +__license__ = "GPLv3" + +# +# This file contains the export functions of pyAggr3g470r. Indeed +# it is possible to export the database of articles in different formats: +# - simple HTML webzine; +# - text file; +# - ePub file; +# - PDF file. +# + +import os +import hashlib + +import utils + + +htmlheader = '<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">\n' + \ + '<head>' + \ + '\n\t<title>pyAggr3g470r - News aggregator</title>\n' + \ + '\t<link rel="stylesheet" type="text/css" href="/css/style.css" />' + \ + '\n\t<meta http-equiv="Content-Type" content="text/html; charset=UTF-8"/>\n' + \ + '</head>\n' + +htmlfooter = '<p>This software is under GPLv3 license. You are welcome to copy, modify or' + \ + ' redistribute the source code according to the' + \ + ' <a href="http://www.gnu.org/licenses/gpl-3.0.txt">GPLv3</a> license.</p></div>\n' + \ + '</body>\n</html>' + + + +def export_html(feeds): + """ + Export the articles given in parameter in a simple Webzine. + """ + index = htmlheader + index += "<br />\n<ul>" + for feed in feeds.values(): + # creates a folder for each stream + feed_folder = utils.path + "/var/export/webzine/" + \ + utils.normalize_filename(feed.feed_id) + try: + os.makedirs(feed_folder) + except OSError: + # directories already exists (not a problem) + pass + + + index += """<li><a href="%s">%s</a></a></li>\n""" % \ + (feed.feed_id, feed.feed_title) + + posts = htmlheader + for article in feed.articles.values(): + + post_file_name = os.path.normpath(feed_folder + "/" + article.article_id + ".html") + feed_index = os.path.normpath(feed_folder + "/index.html") + + posts += article.article_date + " - " + \ + """<a href="./%s.html">%s</a>""" % \ + (article.article_id, article.article_title[:150]) + "<br />\n" + + + a_post = htmlheader + a_post += '\n<div style="width: 50%; overflow:hidden; text-align: justify; margin:0 auto">\n' + a_post += """<h1><a href="%s">%s</a></h1><br />""" % \ + (article.article_link, article.article_title) + a_post += article.article_description + a_post += "</div>\n<hr />\n" + a_post += """<br />\n<a href="%s">Complete story</a>\n<br />\n""" % (article.article_link,) + a_post += "<hr />\n" + htmlfooter + + + with open(post_file_name, "w") as f: + f.write(a_post) + + posts += htmlfooter + with open(feed_index, "w") as f: + f.write(posts) + + index += "\n</ul>\n<br />" + index += htmlfooter + with open(utils.path + "/var/export/webzine/" + "index.html", "w") as f: + f.write(index) + +def export_txt(feeds): + """ + Export the articles given in parameter in text files. + """ + for feed in feeds.values(): + # creates folder for each stream + folder = utils.path + "/var/export/txt/" + \ + utils.normalize_filename(feed.feed_title.strip().replace(':', '').lower()) + try: + os.makedirs(folder) + except OSError: + # directories already exists (not a problem) + pass + + for article in feed.articles.values(): + name = article.article_date.strip().replace(' ', '_') + name = os.path.normpath(folder + "/" + name + ".txt") + + content = "Title: " + article.article_title + "\n\n\n" + content += utils.clear_string(article.article_description) + + with open(name, "w") as f: + f.write(content) + +def export_epub(feeds): + """ + Export the articles given in parameter in ePub files. + """ + from epub import ez_epub + for feed in feeds.values(): + # creates folder for each stream + folder = utils.path + "/var/export/epub/" + \ + utils.normalize_filename(feed.feed_title.strip().replace(':', '').lower()) + try: + os.makedirs(folder) + except OSError: + # directories already exists (not a problem) + pass + + for article in feed.articles.values(): + name = article.article_date.strip().replace(' ', '_') + name = os.path.normpath(folder + "/" + name + ".epub") + + section = ez_epub.Section() + section.title = article.article_title.decode('utf-8') + section.paragraphs = [utils.clear_string(article.article_description).decode('utf-8')] + ez_epub.makeBook(article.article_title.decode('utf-8'), [feed.feed_title.decode('utf-8')], [section], \ + name, lang='en-US', cover=None) + +def export_pdf(feeds): + """ + Export the articles given in parameter in PDF files. + """ + from xhtml2pdf import pisa + import cStringIO as StringIO + for feed in feeds.values(): + # creates folder for each stream + folder = utils.path + "/var/export/pdf/" + \ + utils.normalize_filename(feed.feed_title.strip().replace(':', '').lower()) + try: + os.makedirs(folder) + except OSError: + # directories already exists (not a problem) + pass + + for article in feed.articles.values(): + name = article.article_date.strip().replace(' ', '_') + name = os.path.normpath(folder + "/" + name + ".pdf") + + content = htmlheader + content += '\n<div style="width: 50%; overflow:hidden; text-align: justify; margin:0 auto">\n' + content += """<h1><a href="%s">%s</a></h1><br />""" % \ + (article.article_link, article.article_title) + content += article.article_description + content += "</div>\n<hr />\n" + content += htmlfooter + + try: + pdf = pisa.CreatePDF(StringIO.StringIO(content), file(name, "wb")) + except: + pass
\ No newline at end of file |