moviewyrm/fedireads/connectors/fedireads_connector.py

109 lines
3.1 KiB
Python
Raw Normal View History

2020-03-28 19:55:53 +00:00
''' using another fedireads instance as a source of book data '''
2020-05-09 19:53:55 +00:00
from uuid import uuid4
2020-03-28 19:55:53 +00:00
from django.core.exceptions import ObjectDoesNotExist
from django.core.files.base import ContentFile
2020-05-09 19:53:55 +00:00
import requests
2020-03-28 19:55:53 +00:00
from fedireads import models
2020-05-10 23:41:24 +00:00
from .abstract_connector import AbstractConnector, SearchResult, Mapping
2020-05-09 20:36:10 +00:00
from .abstract_connector import update_from_mappings, get_date, get_data
2020-03-28 19:55:53 +00:00
class Connector(AbstractConnector):
2020-05-04 00:53:14 +00:00
''' interact with other instances '''
def __init__(self, identifier):
2020-05-10 19:56:59 +00:00
super().__init__(identifier)
2020-05-10 23:41:24 +00:00
self.key_mappings = [
Mapping('isbn_13', model=models.Edition),
Mapping('isbn_10', model=models.Edition),
Mapping('lccn', model=models.Work),
Mapping('oclc_number', model=models.Edition),
Mapping('openlibrary_key'),
Mapping('goodreads_key'),
Mapping('asin'),
]
self.book_mappings = self.key_mappings + [
Mapping('sort_title'),
Mapping('subtitle'),
Mapping('description'),
Mapping('languages'),
Mapping('series'),
Mapping('series_number'),
Mapping('subjects'),
Mapping('subject_places'),
Mapping('first_published_date'),
Mapping('published_date'),
Mapping('pages'),
Mapping('physical_format'),
Mapping('publishers'),
]
self.author_mappings = [
Mapping('born', remote_field='birth_date', formatter=get_date),
Mapping('died', remote_field='death_date', formatter=get_date),
Mapping('bio'),
]
2020-05-04 00:53:14 +00:00
2020-05-10 19:56:59 +00:00
def is_work_data(self, data):
return data['book_type'] == 'Work'
2020-03-28 19:55:53 +00:00
2020-05-10 19:56:59 +00:00
def get_edition_from_work_data(self, data):
return data['editions'][0]
2020-05-10 19:56:59 +00:00
def get_work_from_edition_date(self, data):
return data['work']
2020-05-10 19:56:59 +00:00
def get_authors_from_data(self, data):
for author_url in data.get('authors', []):
yield self.get_or_create_author(author_url)
2020-03-28 19:55:53 +00:00
2020-03-28 23:30:54 +00:00
def get_cover_from_data(self, data):
2020-05-09 19:59:06 +00:00
cover_data = data.get('attachment')
if not cover_data:
2020-05-09 19:53:55 +00:00
return None
2020-05-09 19:59:06 +00:00
cover_url = cover_data[0].get('url')
2020-05-09 19:53:55 +00:00
response = requests.get(cover_url)
if not response.ok:
response.raise_for_status()
2020-05-09 19:59:06 +00:00
image_name = str(uuid4()) + cover_url.split('.')[-1]
2020-05-09 19:53:55 +00:00
image_content = ContentFile(response.content)
return [image_name, image_content]
2020-05-04 00:53:14 +00:00
def get_or_create_author(self, remote_id):
2020-03-28 19:55:53 +00:00
''' load that author '''
try:
2020-05-04 00:53:14 +00:00
return models.Author.objects.get(remote_id=remote_id)
2020-03-28 19:55:53 +00:00
except ObjectDoesNotExist:
pass
data = get_data(remote_id)
2020-03-28 19:55:53 +00:00
# ingest a new author
2020-05-04 00:53:14 +00:00
author = models.Author(remote_id=remote_id)
2020-05-10 23:41:24 +00:00
author = update_from_mappings(author, data, self.author_mappings)
2020-03-28 19:55:53 +00:00
author.save()
return author
2020-05-10 19:56:59 +00:00
def parse_search_data(self, data):
return data
def format_search_result(self, search_result):
return SearchResult(**search_result)
def expand_book_data(self, book):
2020-05-09 20:36:10 +00:00
# TODO
pass