moviewyrm/bookwyrm/tests/importers/test_librarything_import.py

253 lines
12 KiB
Python
Raw Normal View History

2021-03-08 16:49:10 +00:00
""" testing import """
2021-02-20 16:02:36 +00:00
import csv
import pathlib
from unittest.mock import patch
from django.test import TestCase
import responses
2021-03-30 15:56:25 +00:00
from bookwyrm import models
2021-03-30 16:13:41 +00:00
from bookwyrm.importers import LibrarythingImporter
from bookwyrm.importers.importer import import_data, handle_imported_book
2021-02-20 16:02:36 +00:00
from bookwyrm.settings import DOMAIN
2021-03-08 16:49:10 +00:00
2021-02-20 16:02:36 +00:00
class LibrarythingImport(TestCase):
2021-04-26 16:15:42 +00:00
"""importing from librarything tsv"""
2021-03-08 16:49:10 +00:00
2021-02-20 16:02:36 +00:00
def setUp(self):
2021-04-26 16:15:42 +00:00
"""use a test tsv"""
2021-03-23 16:19:11 +00:00
self.importer = LibrarythingImporter()
2021-03-30 16:13:41 +00:00
datafile = pathlib.Path(__file__).parent.joinpath("../data/librarything.tsv")
2021-02-20 16:02:36 +00:00
# Librarything generates latin encoded exports...
2021-03-08 16:49:10 +00:00
self.csv = open(datafile, "r", encoding=self.importer.encoding)
2021-05-26 21:57:29 +00:00
with patch("bookwyrm.preview_images.generate_user_preview_image_task.delay"):
self.user = models.User.objects.create_user(
"mmai", "mmai@mmai.mmai", "password", local=True
)
2021-02-20 16:02:36 +00:00
models.Connector.objects.create(
identifier=DOMAIN,
2021-03-08 16:49:10 +00:00
name="Local",
2021-02-20 16:02:36 +00:00
local=True,
2021-03-08 16:49:10 +00:00
connector_file="self_connector",
base_url="https://%s" % DOMAIN,
books_url="https://%s/book" % DOMAIN,
covers_url="https://%s/images/covers" % DOMAIN,
search_url="https://%s/search?q=" % DOMAIN,
2021-02-20 16:02:36 +00:00
priority=1,
)
2021-05-26 21:57:29 +00:00
with patch("bookwyrm.preview_images.generate_edition_preview_image_task.delay"):
work = models.Work.objects.create(title="Test Work")
self.book = models.Edition.objects.create(
title="Example Edition",
remote_id="https://example.com/book/1",
parent_work=work,
)
2021-02-20 16:02:36 +00:00
def test_create_job(self):
2021-04-26 16:15:42 +00:00
"""creates the import job entry and checks csv"""
2021-03-08 16:49:10 +00:00
import_job = self.importer.create_job(self.user, self.csv, False, "public")
2021-02-20 16:02:36 +00:00
self.assertEqual(import_job.user, self.user)
self.assertEqual(import_job.include_reviews, False)
2021-03-08 16:49:10 +00:00
self.assertEqual(import_job.privacy, "public")
2021-02-20 16:02:36 +00:00
import_items = models.ImportItem.objects.filter(job=import_job).all()
self.assertEqual(len(import_items), 3)
self.assertEqual(import_items[0].index, 0)
2021-03-08 16:49:10 +00:00
self.assertEqual(import_items[0].data["Book Id"], "5498194")
2021-02-20 16:02:36 +00:00
self.assertEqual(import_items[1].index, 1)
2021-03-08 16:49:10 +00:00
self.assertEqual(import_items[1].data["Book Id"], "5015319")
2021-02-20 16:02:36 +00:00
self.assertEqual(import_items[2].index, 2)
2021-03-08 16:49:10 +00:00
self.assertEqual(import_items[2].data["Book Id"], "5015399")
2021-02-20 16:02:36 +00:00
def test_create_retry_job(self):
2021-04-26 16:15:42 +00:00
"""trying again with items that didn't import"""
2021-03-08 16:49:10 +00:00
import_job = self.importer.create_job(self.user, self.csv, False, "unlisted")
import_items = models.ImportItem.objects.filter(job=import_job).all()[:2]
retry = self.importer.create_retry_job(self.user, import_job, import_items)
2021-02-20 16:02:36 +00:00
self.assertNotEqual(import_job, retry)
self.assertEqual(retry.user, self.user)
self.assertEqual(retry.include_reviews, False)
2021-03-08 16:49:10 +00:00
self.assertEqual(retry.privacy, "unlisted")
2021-02-20 16:02:36 +00:00
retry_items = models.ImportItem.objects.filter(job=retry).all()
self.assertEqual(len(retry_items), 2)
self.assertEqual(retry_items[0].index, 0)
2021-03-08 16:49:10 +00:00
self.assertEqual(import_items[0].data["Book Id"], "5498194")
2021-02-20 16:02:36 +00:00
self.assertEqual(retry_items[1].index, 1)
2021-03-08 16:49:10 +00:00
self.assertEqual(retry_items[1].data["Book Id"], "5015319")
2021-02-20 16:02:36 +00:00
@responses.activate
def test_import_data(self):
2021-04-26 16:15:42 +00:00
"""resolve entry"""
2021-03-08 16:49:10 +00:00
import_job = self.importer.create_job(self.user, self.csv, False, "unlisted")
2021-05-26 21:57:29 +00:00
with patch("bookwyrm.preview_images.generate_edition_preview_image_task.delay"):
book = models.Edition.objects.create(title="Test Book")
2021-02-20 16:02:36 +00:00
with patch(
2021-03-08 16:49:10 +00:00
"bookwyrm.models.import_job.ImportItem.get_book_from_isbn"
) as resolve:
2021-02-20 16:02:36 +00:00
resolve.return_value = book
2021-03-30 16:13:41 +00:00
with patch("bookwyrm.importers.importer.handle_imported_book"):
import_data(self.importer.service, import_job.id)
2021-02-20 16:02:36 +00:00
import_item = models.ImportItem.objects.get(job=import_job, index=0)
self.assertEqual(import_item.book.id, book.id)
def test_handle_imported_book(self):
2021-04-26 16:15:42 +00:00
"""librarything import added a book, this adds related connections"""
2021-03-08 16:49:10 +00:00
shelf = self.user.shelf_set.filter(identifier="read").first()
2021-02-20 16:02:36 +00:00
self.assertIsNone(shelf.books.first())
import_job = models.ImportJob.objects.create(user=self.user)
2021-03-30 16:13:41 +00:00
datafile = pathlib.Path(__file__).parent.joinpath("../data/librarything.tsv")
2021-03-08 16:49:10 +00:00
csv_file = open(datafile, "r", encoding=self.importer.encoding)
for index, entry in enumerate(
list(csv.DictReader(csv_file, delimiter=self.importer.delimiter))
):
2021-02-20 16:02:36 +00:00
entry = self.importer.parse_fields(entry)
import_item = models.ImportItem.objects.create(
2021-03-08 16:49:10 +00:00
job_id=import_job.id, index=index, data=entry, book=self.book
)
2021-02-20 16:02:36 +00:00
break
2021-05-26 21:57:29 +00:00
with patch("bookwyrm.preview_images.generate_edition_preview_image_task.delay"):
with patch("bookwyrm.models.activitypub_mixin.broadcast_task.delay"):
handle_imported_book(
self.importer.service, self.user, import_item, False, "public"
)
2021-02-20 16:02:36 +00:00
shelf.refresh_from_db()
self.assertEqual(shelf.books.first(), self.book)
readthrough = models.ReadThrough.objects.get(user=self.user)
self.assertEqual(readthrough.book, self.book)
# I can't remember how to create dates and I don't want to look it up.
self.assertEqual(readthrough.start_date.year, 2007)
self.assertEqual(readthrough.start_date.month, 4)
self.assertEqual(readthrough.start_date.day, 16)
self.assertEqual(readthrough.finish_date.year, 2007)
self.assertEqual(readthrough.finish_date.month, 5)
self.assertEqual(readthrough.finish_date.day, 8)
def test_handle_imported_book_already_shelved(self):
2021-04-26 16:15:42 +00:00
"""librarything import added a book, this adds related connections"""
2021-03-08 16:49:10 +00:00
with patch("bookwyrm.models.activitypub_mixin.broadcast_task.delay"):
shelf = self.user.shelf_set.filter(identifier="to-read").first()
models.ShelfBook.objects.create(shelf=shelf, user=self.user, book=self.book)
2021-02-20 16:02:36 +00:00
import_job = models.ImportJob.objects.create(user=self.user)
2021-03-30 16:13:41 +00:00
datafile = pathlib.Path(__file__).parent.joinpath("../data/librarything.tsv")
2021-03-08 16:49:10 +00:00
csv_file = open(datafile, "r", encoding=self.importer.encoding)
for index, entry in enumerate(
list(csv.DictReader(csv_file, delimiter=self.importer.delimiter))
):
2021-02-20 16:02:36 +00:00
entry = self.importer.parse_fields(entry)
import_item = models.ImportItem.objects.create(
2021-03-08 16:49:10 +00:00
job_id=import_job.id, index=index, data=entry, book=self.book
)
2021-02-20 16:02:36 +00:00
break
2021-05-26 21:57:29 +00:00
with patch("bookwyrm.preview_images.generate_edition_preview_image_task.delay"):
with patch("bookwyrm.models.activitypub_mixin.broadcast_task.delay"):
handle_imported_book(
self.importer.service, self.user, import_item, False, "public"
)
2021-02-20 16:02:36 +00:00
shelf.refresh_from_db()
self.assertEqual(shelf.books.first(), self.book)
2021-03-08 16:49:10 +00:00
self.assertIsNone(self.user.shelf_set.get(identifier="read").books.first())
2021-02-20 16:02:36 +00:00
readthrough = models.ReadThrough.objects.get(user=self.user)
self.assertEqual(readthrough.book, self.book)
self.assertEqual(readthrough.start_date.year, 2007)
self.assertEqual(readthrough.start_date.month, 4)
self.assertEqual(readthrough.start_date.day, 16)
self.assertEqual(readthrough.finish_date.year, 2007)
self.assertEqual(readthrough.finish_date.month, 5)
self.assertEqual(readthrough.finish_date.day, 8)
def test_handle_import_twice(self):
2021-04-26 16:15:42 +00:00
"""re-importing books"""
2021-03-08 16:49:10 +00:00
shelf = self.user.shelf_set.filter(identifier="read").first()
2021-02-20 16:02:36 +00:00
import_job = models.ImportJob.objects.create(user=self.user)
2021-03-30 16:13:41 +00:00
datafile = pathlib.Path(__file__).parent.joinpath("../data/librarything.tsv")
2021-03-08 16:49:10 +00:00
csv_file = open(datafile, "r", encoding=self.importer.encoding)
for index, entry in enumerate(
list(csv.DictReader(csv_file, delimiter=self.importer.delimiter))
):
2021-02-20 16:02:36 +00:00
entry = self.importer.parse_fields(entry)
import_item = models.ImportItem.objects.create(
2021-03-08 16:49:10 +00:00
job_id=import_job.id, index=index, data=entry, book=self.book
)
2021-02-20 16:02:36 +00:00
break
2021-05-26 21:57:29 +00:00
with patch("bookwyrm.preview_images.generate_edition_preview_image_task.delay"):
with patch("bookwyrm.models.activitypub_mixin.broadcast_task.delay"):
handle_imported_book(
self.importer.service, self.user, import_item, False, "public"
)
handle_imported_book(
self.importer.service, self.user, import_item, False, "public"
)
2021-02-20 16:02:36 +00:00
shelf.refresh_from_db()
self.assertEqual(shelf.books.first(), self.book)
readthrough = models.ReadThrough.objects.get(user=self.user)
self.assertEqual(readthrough.book, self.book)
# I can't remember how to create dates and I don't want to look it up.
self.assertEqual(readthrough.start_date.year, 2007)
self.assertEqual(readthrough.start_date.month, 4)
self.assertEqual(readthrough.start_date.day, 16)
self.assertEqual(readthrough.finish_date.year, 2007)
self.assertEqual(readthrough.finish_date.month, 5)
self.assertEqual(readthrough.finish_date.day, 8)
2021-03-23 16:19:11 +00:00
@patch("bookwyrm.activitystreams.ActivityStream.add_status")
def test_handle_imported_book_review(self, _):
2021-04-26 16:15:42 +00:00
"""librarything review import"""
2021-02-20 16:02:36 +00:00
import_job = models.ImportJob.objects.create(user=self.user)
2021-03-30 16:13:41 +00:00
datafile = pathlib.Path(__file__).parent.joinpath("../data/librarything.tsv")
2021-03-08 16:49:10 +00:00
csv_file = open(datafile, "r", encoding=self.importer.encoding)
2021-02-20 16:02:36 +00:00
entry = list(csv.DictReader(csv_file, delimiter=self.importer.delimiter))[0]
entry = self.importer.parse_fields(entry)
import_item = models.ImportItem.objects.create(
2021-03-08 16:49:10 +00:00
job_id=import_job.id, index=0, data=entry, book=self.book
)
2021-02-20 16:02:36 +00:00
2021-05-26 21:57:29 +00:00
with patch("bookwyrm.preview_images.generate_edition_preview_image_task.delay"):
with patch("bookwyrm.models.activitypub_mixin.broadcast_task.delay"):
handle_imported_book(
self.importer.service, self.user, import_item, True, "unlisted"
)
2021-02-20 16:02:36 +00:00
review = models.Review.objects.get(book=self.book, user=self.user)
2021-03-08 16:49:10 +00:00
self.assertEqual(review.content, "chef d'oeuvre")
2021-02-20 16:02:36 +00:00
self.assertEqual(review.rating, 5)
self.assertEqual(review.published_date.year, 2007)
self.assertEqual(review.published_date.month, 5)
self.assertEqual(review.published_date.day, 8)
2021-03-08 16:49:10 +00:00
self.assertEqual(review.privacy, "unlisted")
2021-02-20 16:02:36 +00:00
def test_handle_imported_book_reviews_disabled(self):
2021-04-26 16:15:42 +00:00
"""librarything review import"""
2021-02-20 16:02:36 +00:00
import_job = models.ImportJob.objects.create(user=self.user)
2021-03-30 16:13:41 +00:00
datafile = pathlib.Path(__file__).parent.joinpath("../data/librarything.tsv")
2021-03-08 16:49:10 +00:00
csv_file = open(datafile, "r", encoding=self.importer.encoding)
2021-02-20 16:02:36 +00:00
entry = list(csv.DictReader(csv_file, delimiter=self.importer.delimiter))[2]
entry = self.importer.parse_fields(entry)
import_item = models.ImportItem.objects.create(
2021-03-08 16:49:10 +00:00
job_id=import_job.id, index=0, data=entry, book=self.book
)
2021-02-20 16:02:36 +00:00
2021-05-26 21:57:29 +00:00
with patch("bookwyrm.preview_images.generate_edition_preview_image_task.delay"):
with patch("bookwyrm.models.activitypub_mixin.broadcast_task.delay"):
handle_imported_book(
self.importer.service, self.user, import_item, False, "unlisted"
)
2021-03-08 16:49:10 +00:00
self.assertFalse(
models.Review.objects.filter(book=self.book, user=self.user).exists()
)