bookwyrm/fedireads/connectors/fedireads_connector.py

130 lines
4 KiB
Python
Raw Normal View History

2020-03-28 19:55:53 +00:00
''' using another fedireads instance as a source of book data '''
from datetime import datetime
from django.core.exceptions import ObjectDoesNotExist
from django.core.files.base import ContentFile
import requests
from fedireads import models
from .abstract_connector import AbstractConnector, update_from_mappings
class Connector(AbstractConnector):
''' instantiate a connector '''
def __init__(self, identifier):
super().__init__(identifier)
def search(self, query):
''' right now you can't search fedireads, but... '''
resp = requests.get(
'%s%s' % (self.search_url, query),
headers={
'Accept': 'application/activity+json; charset=utf-8',
},
)
if not resp.ok:
resp.raise_for_status()
return resp.json()
def get_or_create_book(self, fedireads_key):
''' pull up a book record by whatever means possible '''
try:
book = models.Book.objects.select_subclasses().get(
fedireads_key=fedireads_key
)
return book
except ObjectDoesNotExist:
if self.model.is_self:
# we can't load a book from a remote server, this is it
return None
# no book was found, so we start creating a new one
book = models.Book(fedireads_key=fedireads_key)
2020-03-28 23:30:54 +00:00
def update_book(self, book):
''' add remote data to a local book '''
fedireads_key = book.fedireads_key
2020-03-28 19:55:53 +00:00
response = requests.get(
'%s/%s' % (self.base_url, fedireads_key),
headers={
'Accept': 'application/activity+json; charset=utf-8',
},
)
if not response.ok:
response.raise_for_status()
data = response.json()
# great, we can update our book.
2020-03-28 20:14:06 +00:00
mappings = {
'published_date': ('published_date', get_date),
'first_published_date': ('first_published_date', get_date),
2020-03-28 19:55:53 +00:00
}
2020-03-28 20:14:06 +00:00
book = update_from_mappings(book, data, mappings)
2020-03-28 19:55:53 +00:00
2020-03-28 23:30:54 +00:00
if not book.source_url:
book.source_url = response.url
if not book.connector:
book.connector = self.connector
2020-03-28 19:55:53 +00:00
book.save()
if data.get('parent_work'):
work = self.get_or_create_book(data.get('parent_work'))
book.parent_work = work
for author_blob in data.get('authors', []):
author_blob = author_blob.get('author', author_blob)
author_id = author_blob['key']
author_id = author_id.split('/')[-1]
book.authors.add(self.get_or_create_author(author_id))
2020-03-28 23:30:54 +00:00
if book.sync_cover and data.get('covers') and len(data['covers']):
2020-03-28 19:55:53 +00:00
book.cover.save(*self.get_cover(data['covers'][0]), save=True)
return book
def get_or_create_author(self, fedireads_key):
''' load that author '''
try:
return models.Author.objects.get(fedireads_key=fedireads_key)
except ObjectDoesNotExist:
pass
resp = requests.get('%s/authors/%s.json' % (self.url, fedireads_key))
if not resp.ok:
resp.raise_for_status()
data = resp.json()
# ingest a new author
author = models.Author(fedireads_key=fedireads_key)
mappings = {
'born': ('born', get_date),
'died': ('died', get_date),
}
author = update_from_mappings(author, data, mappings)
author.save()
return author
def get_cover(self, cover_url):
''' ask openlibrary for the cover '''
image_name = cover_url.split('/')[-1]
response = requests.get(cover_url)
if not response.ok:
response.raise_for_status()
image_content = ContentFile(response.content)
return [image_name, image_content]
def get_date(date_string):
''' helper function to try to interpret dates '''
try:
datetime.strptime(date_string, "%Y-%m-%dT%H:%M:%S")
except ValueError:
return False