view legacy/management/commands/import_old_potd_comments.py @ 1203:8cd15df9b563

Controlling the xapian install script in tools.
author Brian Neal <bgneal@gmail.com>
date Sat, 04 Jan 2025 14:19:19 -0600
parents ee87ea74d46b
children
line wrap: on
line source
"""
import_old_potd_comments.py - For importing comments on POTDs that were
exported from SG101 1.0 as CSV files.

"""
from __future__ import with_statement
import csv
import optparse
import sys
from datetime import datetime

from django.core.management.base import LabelCommand, CommandError
from django.contrib.auth.models import User
from django.contrib.contenttypes.models import ContentType

from comments.models import Comment
from potd.models import Photo
import legacy.data
from legacy.html2md import MarkdownWriter


# Added to a row's legacy 'pid' value to obtain the id of the Photo that the
# comment is attached to.
PHOTO_ID_OFFSET = 100
# Added to a row's legacy 'cid' value to obtain the primary key given to the
# imported Comment.
# NOTE(review): both offsets presumably keep imported ids clear of rows that
# already exist in the new database -- confirm.
ID_OFFSET = 3000


class Command(LabelCommand):
    """
    Management command that imports legacy POTD comments from CSV files.

    Every label given on the command line is treated as the name of a CSV
    file. Each row is expected to provide the columns 'cid', 'pid',
    'username', 'comment' and 'date', and is turned into a Comment attached
    to a Photo unless the row has to be skipped (see process_row).

    """
    args = '<filename filename ...>'
    help = 'Imports POTD comments from the old database in CSV format'
    option_list = LabelCommand.option_list + (
        optparse.make_option("-p", "--progress", action="store_true",
            help="Output a . after every 20 items to show progress"),
        optparse.make_option("--fix-mode", action="store_true",
            help="Only create comments if they don't exist already"),
    )
    # A single writer is shared by all rows; to_markdown() resets it before
    # every conversion.
    md_writer = MarkdownWriter()

    def handle_label(self, filename, **options):
        """
        Process each line in the CSV file given by filename by
        creating a new POTD comment.

        Raises CommandError if the file cannot be opened or if the csv
        module reports an error while the file is being read.

        """
        self.show_progress = options.get('progress')
        self.fix_mode = options.get('fix_mode')
        # username -> User cache used by _get_user(); rebuilt for every file.
        self.users = {}

        # Guard only the open() call. An IOError raised later, while rows
        # are being processed, is not a failure to open the file and must
        # not be reported as one.
        try:
            f = open(filename, "rb")
        except IOError:
            raise CommandError("Could not open file: %s" % filename)

        with f:
            self.reader = csv.DictReader(f)
            num_rows = 0
            try:
                for row in self.reader:
                    self.process_row(row)
                    num_rows += 1
                    if self.show_progress and num_rows % 20 == 0:
                        sys.stdout.write('.')
                        sys.stdout.flush()
            except csv.Error, e:
                raise CommandError("CSV error: %s %s %s" % (
                    filename, self.reader.line_num, e))

            # Emit a newline, which also ends any line of progress dots.
            print

    def process_row(self, row):
        """
        Process one row from the CSV file: create a Comment object for
        the row and save it in the database.

        The row is skipped, without saving anything, when:
          - fix mode is on and a Comment with the computed id already exists;
          - the comment's user cannot be found (a message is printed);
          - the comment's photo cannot be found (a message is printed).

        """
        comment_id = int(row['cid']) + ID_OFFSET

        if self.fix_mode:
            # Only the existence of the comment matters here, so the
            # fetched object is not kept.
            try:
                Comment.objects.get(pk=comment_id)
            except Comment.DoesNotExist:
                pass
            else:
                return

        # Text columns are byte strings that get decoded as latin-1.
        try:
            user = self._get_user(row['username'].decode('latin-1'))
        except User.DoesNotExist:
            print "Could not find user %s for comment %s; skipping." % (
                    row['username'], row['cid'])
            return

        pid = int(row['pid']) + PHOTO_ID_OFFSET
        try:
            photo = Photo.objects.get(id=pid)
        except Photo.DoesNotExist:
            print "Could not find photo %s for comment %s; skipping." % (
                    pid, row['cid'])
            return

        comment = Comment(
            id=comment_id,
            content_type=ContentType.objects.get_for_model(photo),
            object_id=photo.id,
            user=user,
            comment=self.to_markdown(row['comment'].decode('latin-1')),
            creation_date=datetime.strptime(row['date'], "%Y-%m-%d %H:%M:%S"),
            ip_address='192.0.2.0',     # TEST-NET
            is_public=True,
            is_removed=False,
        )

        comment.save()

    def _get_user(self, username):
        """
        Returns the user object with the given username.
        Throws User.DoesNotExist if not found.

        If no user has exactly that username, the lower-cased name is
        looked up in legacy.data.KNOWN_USERNAME_CHANGES and the user with
        the mapped name is fetched instead. Successful lookups are cached
        in self.users under the name that was asked for.

        """
        try:
            return self.users[username]
        except KeyError:
            pass

        try:
            user = User.objects.get(username=username)
        except User.DoesNotExist:
            old_name = username.lower()
            # A KeyError means there is no known rename for this user; a
            # User.DoesNotExist from this second query propagates as is.
            try:
                user = User.objects.get(
                        username=legacy.data.KNOWN_USERNAME_CHANGES[old_name])
            except KeyError:
                raise User.DoesNotExist

        self.users[username] = user
        return user

    def to_markdown(self, s):
        """
        Converts the legacy comment text s with the shared MarkdownWriter
        and returns the writer's markdown output.

        A '<br />' tag is inserted after every newline before the text is
        fed to the writer.
        NOTE(review): presumably this keeps the original line breaks in the
        converted text -- confirm against MarkdownWriter.

        """
        s = s.replace('\n', '\n<br />')
        self.md_writer.reset()
        self.md_writer.feed(s)
        return self.md_writer.markdown()