Reading a csv file in Django (Python)

Question

I'm trying to figure out how to read from a csv file in a django app. One row of the csv file has data that needs to be parcelled out into different tables/models. But I also need to perform checks on that data to see if it's already in the database.

The app is a continuation of the local library tutorial on the Mozilla website. I'm trying to update the library database by uploading data from a csv file, where each line is a record from a book.

It kinda works, but not without errors. The main struggle is understanding how to iterate through the file correctly. Do I need to be using an input stream, if so am I doing that correctly, or can I just open the file some other way? I've tried that, but had issues with decoding.

The view function I've tried to write (cobbled together from other tutorials, videos and stackexchange posts):

import csv, io

from django.contrib.auth.decorators import permission_required

@permission_required('admin.can_add_log_entry')
def book_upload(request):
    template = "catalog/book_upload.html"

    prompt = {
        'order': 'Order of the CSV should be "authors", "last name", yada yada'
    }

    if request.method == "GET":
        return render(request, template, prompt)

    csv_file = request.FILES['file']
    data_set = csv_file.read().decode('UTF-8')
    io_string = io.StringIO(data_set)

    # skip the header
    next(io_string)

    for row in csv.reader(io_string, delimiter=','):

        # convert the row into a dictionary
        row_dict = row_to_dict(row)

        # check to see if book is in the database
        book = book_is_in_db(row_dict['title'])
        if book:
            add_book_instance(book)
        else:
            # get the author from the db, or create them
            try:
                author = Author.objects.get(first_name=row_dict['first_name'], last_name=row_dict['last_name'])
            except Author.DoesNotExist:
                author = Author.objects.create(first_name=row_dict['first_name'], last_name=row_dict['last_name'])

            # create the book object and save it to the db
            _, created = Book.objects.create(
                title=row_dict['title'],
                author=author,
                summary=row_dict['summary'],
                #genre=genre,
                #language=language,
                isbn=row_dict['isbn'],
                )

            add_book_instance(created)

    context = {}
    return render(request, template, context)


def row_to_dict(row):
    """Returns the given row in a dict format"""
    # Here's how the row list looks like:
    # ['full name', 'first name', 'last name' 'title',
    #  'summary', 'genre', 'language', 'isbn']
    return {'first_name': row[1], 'last_name': row[2], 
        'title': row[3], 'summary': row[4], 'genre': row[5],
        'language': row[6], 'isbn': row[7],
        }

def book_is_in_db(title):
    """Check the book is in db. 
    If yes, return the book, else return None
    """
    try:
        return Book.objects.get(title=title)
    except Book.DoesNotExist:
        return None

def add_book_instance(book):
    """Add a new instance of the book"""
    BookInstance.objects.create(book=book, status='a')

The models:

class Genre(models.Model):
    """Model representing a book genre."""
    name = models.CharField(max_length=200, help_text='Enter a book genre (e.g. Science Fiction)')

    def __str__(self):
        """String for representing the Model object."""
        return self.name


class Book(models.Model):
    """Model representing a book (but not a specific copy of a book)."""
    title = models.CharField(max_length=200)
    author = models.ForeignKey('Author', on_delete=models.SET_NULL, null=True)
    summary = models.TextField(max_length=1000, help_text='Enter a brief description of the book')
    isbn = models.CharField('ISBN', max_length=13, help_text='13 Character ISBN number')
    genre = models.ManyToManyField(Genre, help_text='Select a genre for this book', blank=True)
    language = models.ForeignKey('Language', on_delete=models.SET_NULL, null=True, blank=True)

    def __str__(self):
        """String for representing the Model object."""
        return self.title

    def get_absolute_url(self):
        """Returns the url to access a detail record for this book."""
        return reverse('book-detail', args=[str(self.id)])

    def display_genre(self):
        """Figure this out later"""
        return ', '.join(genre.name for genre in self.genre.all()[:])

    display_genre.short_descriptions = 'Genre'


class BookInstance(models.Model):
    """Model representing a specific copy of a book (i.e. that can be borrowed from the library)."""
    id = models.UUIDField(primary_key=True, default=uuid.uuid4, help_text='Unique ID for this particular book across whole library')
    book = models.ForeignKey('Book', on_delete=models.SET_NULL, null=True) 
    imprint = models.CharField(max_length=200, blank=True)
    due_back = models.DateField(null=True, blank=True)

    LOAN_STATUS = (
        ('m', 'Maintenance'),
        ('o', 'On loan'),
        ('a', 'Available'),
        ('r', 'Reserved'),
    )

    status = models.CharField(
        max_length=1,
        choices=LOAN_STATUS,
        blank=True,
        default='m',
        help_text='Book availability',
    )

    #borrowing/user stuff
    borrower = models.ForeignKey(User, on_delete=models.SET_NULL, null=True, blank=True)

    # a property definition for overdue stuff
    @property
    def is_overdue(self):
        if self.due_back and date.today() > self.due_back:
            return True
        return False

    class Meta:
        ordering = ['due_back']
        permissions = (("can_mark_returned", "Set book as returned"),)

    def __str__(self):
        """String for representing the Model object."""
        return f'{self.id} ({self.book.title})'


class Author(models.Model):
    """Model representing an author."""
    first_name = models.CharField(max_length=100)
    last_name = models.CharField(max_length=100)
    date_of_birth = models.DateField(null=True, blank=True)
    date_of_death = models.DateField('died', null=True, blank=True)

    class Meta:
        ordering = ['last_name', 'first_name']

    def get_absolute_url(self):
        """Returns the url to access a particular author instance."""
        return reverse('author-detail', args=[str(self.id)])

    def __str__(self):
        """String for representing the Model object."""
        return f'{self.last_name}, {self.first_name}'


class Language(models.Model):
    """Model representing a Language."""
    name = models.CharField(max_length=200,
        help_text="Enter the book's natural language (e.g. English, French, Japanese etc.)")

    def __str__(self):
        """String for representing the Model object."""
        return self.name

The csv file:

fullname,first_name,last_name,title,summary,genre,language,isbn
Alex Garland,Alex,Garland,The Beach,A book about the beach,Coming-of-age,English,1234567890123
Simon Singh,Simon,Singh,Fermat's Last Theorem,Maths-y book,Maths,English,3210987654321

Latest error: TypeError at /catalog/upload/ cannot unpack non-iterable Book object, with info:

205. _, created = Book.objects.create(

▼ Local vars
Variable    Value
author  



book    

None

csv_file    



data_set    

('fullname,first_name,last_name,title,summary,genre,language,isbn
'
 'Alex Garland,Alex,Garland,The Beach,A book about the '
 'beach,Coming-of-age,English,1234567890123
'
 "Simon Singh,Simon,Singh,Fermat's Last Theorem,Maths-y "
 'book,Maths,English,3210987654321')

io_string   

<_io.StringIO object at 0x044F2028>

prompt  

{'order': 'Order of the CSV should be "authors", last_name, yada yada'}

request     



row     

['Simon Singh',
 'Simon',
 'Singh',
 "Fermat's Last Theorem",
 'Maths-y book',
 'Maths',
 'English',
 '3210987654321']

row_dict    

{'first_name': 'Simon',
 'genre': 'Maths',
 'isbn': '3210987654321',
 'language': 'English',
 'last_name': 'Singh',
 'summary': 'Maths-y book',
 'title': "Fermat's Last Theorem"}

template    

'catalog/book_upload.html'

Also, I'm not sure what the -, created = part is all about. Is it a tuple and takes care of saving it to the database somehow?

Reading a csv file in Django (Python)

Answers (1)

Related Questions