view articles/management/commands/import_old_articles.py @ 185:cfa730bbca6e

Regroup press articles by year.
author Brian Neal <bgneal@gmail.com>
date Sun, 24 Jan 2016 21:41:28 -0600
parents b7cdfdde3999
children
line wrap: on
line source
"""
import_old_articles.py - For importing articles from the older version of this
website.

"""
import datetime
import json

from django.conf import settings
from django.core.management.base import LabelCommand
from django.utils.html import linebreaks
import textile

from articles.models import Article


class Command(LabelCommand):
    args = '<filename filename ...>'
    help = 'Imports older articles in JSON format'

    def handle_label(self, filename, **options):
        """
        Process the file of older articles in JSON. Convert to the new model
        scheme.

        """
        with open(filename, 'rb') as f:
            items = json.load(f)

        for item in items:
            if item['model'] == 'band.article':
                self.process_item(item)

    def process_item(self, item):

        fields = item['fields']

        content = fields['text'].strip()
        if fields['markup_enabled']:
            text = textile.textile(content, encoding='utf-8', output='utf-8')
        else:
            text = linebreaks(fields['text'])

        source = linebreaks(fields['source'].strip())

        pdf = fields['pdf'].strip()
        if pdf:
            pdf = u"%s%s" % (settings.MEDIA_URL, pdf.replace('\\', '/'))

        article = Article(
                id=item['pk'],
                title=fields['title'].strip(),
                date=datetime.datetime.strptime(fields['date'], '%Y-%m-%d'),
                text=text,
                source=source,
                url=fields['url'].strip(),
                pdf=pdf)

        article.save()