view articles/management/commands/import_old_articles.py @ 132:e53efcac7a7a

For Django 1.6: CACHE_MIDDLEWARE_ANONYMOUS_ONLY deprecated.
author Brian Neal <bgneal@gmail.com>
date Tue, 24 Dec 2013 17:18:44 -0600
parents b7cdfdde3999
children
line wrap: on
line source
"""
import_old_articles.py - For importing articles from the older version of this
website.

"""
import datetime
import json

from django.conf import settings
from django.core.management.base import LabelCommand
from django.utils.html import linebreaks
import textile

from articles.models import Article


class Command(LabelCommand):
    args = '<filename filename ...>'
    help = 'Imports older articles in JSON format'

    def handle_label(self, filename, **options):
        """
        Process the file of older articles in JSON. Convert to the new model
        scheme.

        """
        with open(filename, 'rb') as f:
            items = json.load(f)

        for item in items:
            if item['model'] == 'band.article':
                self.process_item(item)

    def process_item(self, item):

        fields = item['fields']

        content = fields['text'].strip()
        if fields['markup_enabled']:
            text = textile.textile(content, encoding='utf-8', output='utf-8')
        else:
            text = linebreaks(fields['text'])

        source = linebreaks(fields['source'].strip())

        pdf = fields['pdf'].strip()
        if pdf:
            pdf = u"%s%s" % (settings.MEDIA_URL, pdf.replace('\\', '/'))

        article = Article(
                id=item['pk'],
                title=fields['title'].strip(),
                date=datetime.datetime.strptime(fields['date'], '%Y-%m-%d'),
                text=text,
                source=source,
                url=fields['url'].strip(),
                pdf=pdf)

        article.save()