view articles/management/commands/import_old_articles.py @ 131:9c74cd8668eb

For Django 1.6: take advantage of new database connection persistence.
author Brian Neal <bgneal@gmail.com>
date Tue, 24 Dec 2013 16:50:13 -0600
parents b7cdfdde3999
children
line wrap: on
line source
"""
import_old_articles.py - For importing articles from the older version of this
website.

"""
import datetime
import json

from django.conf import settings
from django.core.management.base import LabelCommand
from django.utils.html import linebreaks
import textile

from articles.models import Article


class Command(LabelCommand):
    args = '<filename filename ...>'
    help = 'Imports older articles in JSON format'

    def handle_label(self, filename, **options):
        """
        Process the file of older articles in JSON. Convert to the new model
        scheme.

        """
        with open(filename, 'rb') as f:
            items = json.load(f)

        for item in items:
            if item['model'] == 'band.article':
                self.process_item(item)

    def process_item(self, item):

        fields = item['fields']

        content = fields['text'].strip()
        if fields['markup_enabled']:
            text = textile.textile(content, encoding='utf-8', output='utf-8')
        else:
            text = linebreaks(fields['text'])

        source = linebreaks(fields['source'].strip())

        pdf = fields['pdf'].strip()
        if pdf:
            pdf = u"%s%s" % (settings.MEDIA_URL, pdf.replace('\\', '/'))

        article = Article(
                id=item['pk'],
                title=fields['title'].strip(),
                date=datetime.datetime.strptime(fields['date'], '%Y-%m-%d'),
                text=text,
                source=source,
                url=fields['url'].strip(),
                pdf=pdf)

        article.save()