2020-09-17 20:02:52 +00:00
|
|
|
''' basics for an activitypub serializer '''
|
|
|
|
from dataclasses import dataclass, fields, MISSING
|
|
|
|
from json import JSONEncoder
|
|
|
|
|
2020-12-08 17:43:12 +00:00
|
|
|
from django.apps import apps
|
2020-12-21 22:25:10 +00:00
|
|
|
from django.db import IntegrityError, transaction
|
2020-11-23 21:43:46 +00:00
|
|
|
|
2020-12-03 20:35:57 +00:00
|
|
|
from bookwyrm.connectors import ConnectorException, get_data
|
2020-12-08 17:43:12 +00:00
|
|
|
from bookwyrm.tasks import app
|
2020-09-17 20:02:52 +00:00
|
|
|
|
2020-11-12 19:59:34 +00:00
|
|
|
class ActivitySerializerError(ValueError):
    ''' raised for routine problems while serializing or deserializing
    activitypub json; a ValueError subclass, so generic handlers for
    ValueError also catch it '''
|
|
|
|
|
|
|
|
|
2020-09-17 20:02:52 +00:00
|
|
|
class ActivityEncoder(JSONEncoder):
    ''' used to convert an Activity object into json '''

    def default(self, o):
        ''' serialize an otherwise unsupported object as its attribute dict

        Objects without an instance `__dict__` (sets, slotted objects, ...)
        are handed to JSONEncoder.default, which raises the TypeError that
        the json module expects for unserializable values. '''
        try:
            return o.__dict__
        except AttributeError:
            pass
        # defer to the base class so callers get the standard TypeError
        return super().default(o)
|
|
|
|
|
|
|
|
|
2020-11-01 18:13:51 +00:00
|
|
|
@dataclass
class Link:
    ''' a link object, used for tagging a book in a status '''
    # both of these are required when constructing a Link
    href: str
    name: str
    # activitypub type; subclasses override the default
    type: str = "Link"
|
|
|
|
|
2020-11-28 06:10:38 +00:00
|
|
|
|
2020-11-01 18:13:51 +00:00
|
|
|
@dataclass
class Mention(Link):
    ''' a Link subtype used when mentioning an actor; identical to Link
    except for the default type '''
    type: str = "Mention"
|
|
|
|
|
|
|
|
|
2020-09-17 20:02:52 +00:00
|
|
|
@dataclass
class Signature:
    ''' signature block; the type defaults to RsaSignature2017 '''
    # all three are required when constructing a Signature
    creator: str
    created: str
    signatureValue: str
    type: str = "RsaSignature2017"
|
|
|
|
|
2021-02-17 02:59:26 +00:00
|
|
|
def naive_parse(activity_objects, activity_json, serializer=None):
    ''' build an activity object out of a dict of activitypub json

    `activity_objects` maps activity type names to serializer callables; it
    is passed in as an argument because this navigates circular import
    issues. When no `serializer` is supplied, one is looked up using the
    `type` entry of `activity_json`. The chosen serializer is called with
    `activity_objects` plus every key of `activity_json` as keyword args.

    Raises ActivitySerializerError when the json has no `type` or the type
    is not present in `activity_objects`. '''
    if not serializer:
        if activity_json.get('publicKeyPem'):
            # ugh: anything carrying a publicKeyPem is treated as a PublicKey.
            # The type is set on a copy so the caller's dict is not mutated.
            activity_json = {**activity_json, 'type': 'PublicKey'}
        try:
            serializer = activity_objects[activity_json['type']]
        except KeyError as err:
            # covers both a missing `type` key and an unregistered type
            raise ActivitySerializerError(err) from err

    return serializer(activity_objects=activity_objects, **activity_json)
|
2020-09-17 20:02:52 +00:00
|
|
|
|
2021-02-16 04:49:23 +00:00
|
|
|
|
2020-09-17 20:02:52 +00:00
|
|
|
@dataclass(init=False)
class ActivityObject:
    ''' actor activitypub json '''
    id: str
    type: str

    def __init__(self, activity_objects=None, **kwargs):
        ''' this lets you pass in an object with fields that aren't in the
        dataclass, which it ignores. Any field in the dataclass is required or
        has a default value

        `activity_objects` is an optional mapping of type names to
        serializers, used to parse nested dicts by their own `type`.

        Raises ActivitySerializerError when a field with no default is
        absent (or given as None/MISSING). '''
        for field in fields(self):
            try:
                value = kwargs[field.name]
                # an explicit None/MISSING is treated the same as absent
                if value is None or value is MISSING:
                    raise KeyError()
                try:
                    is_subclass = issubclass(field.type, ActivityObject)
                except TypeError:
                    # field.type is not a plain class
                    is_subclass = False
                # serialize a model obj
                if hasattr(value, 'to_activity'):
                    value = value.to_activity()
                # parse a dict into the appropriate activity
                elif is_subclass and isinstance(value, dict):
                    if activity_objects:
                        value = naive_parse(activity_objects, value)
                    else:
                        # no registry to look the type up in, so fall back
                        # to the annotated type of this field
                        value = naive_parse(
                            activity_objects, value, serializer=field.type)
            except KeyError:
                if field.default is MISSING and \
                        field.default_factory is MISSING:
                    raise ActivitySerializerError(
                        'Missing required field: %s' % field.name)
                # NOTE(review): a field that only declares a default_factory
                # ends up set to MISSING here (the factory is never called);
                # to_model checks for MISSING, so confirm before changing
                value = field.default
            setattr(self, field.name, value)

    def to_model(self, model=None, instance=None, allow_create=True, save=True):
        ''' convert from an activity to a model instance

        model: model class to use; looked up from `self.type` when omitted
        instance: existing instance to update instead of searching for one
        allow_create: when False, return None rather than create an instance
        save: when False, return the populated instance without saving it

        Returns the model instance, or None when the model ignores this
        activity or nothing exists and creation is not allowed. Raises
        ActivitySerializerError when a simple field cannot be set or the
        save hits an IntegrityError. '''
        model = model or get_model_from_type(self.type)

        # only reject statuses if we're potentially creating them
        if allow_create and \
                hasattr(model, 'ignore_activity') and \
                model.ignore_activity(self):
            return None

        # check for an existing instance
        instance = instance or model.find_existing(self.serialize())

        if not instance and not allow_create:
            # so that we don't create when we want to delete or update
            return None
        instance = instance or model()

        for field in instance.simple_fields:
            try:
                field.set_field_from_activity(instance, self)
            except AttributeError as err:
                raise ActivitySerializerError(err) from err

        # image fields have to be set after other fields because they can save
        # too early and jank up users
        for field in instance.image_fields:
            field.set_field_from_activity(instance, self, save=save)

        if not save:
            return instance

        with transaction.atomic():
            # we can't set many to many and reverse fields on an unsaved object
            try:
                try:
                    instance.save(broadcast=False)
                except TypeError:
                    # this save() does not accept a `broadcast` argument
                    instance.save()
            except IntegrityError as err:
                raise ActivitySerializerError(err) from err

            # add many to many fields, which have to be set post-save
            for field in instance.many_to_many_fields:
                # mention books/users, for example
                field.set_field_from_activity(instance, self)

        # reversed relationships in the models
        for (model_field_name, activity_field_name) in \
                instance.deserialize_reverse_fields:
            # attachments on Status, for example
            values = getattr(self, activity_field_name)
            if values is None or values is MISSING:
                continue

            model_field = getattr(model, model_field_name)
            # creating a Work, model_field is 'editions'
            # creating a User, model field is 'key_pair'
            related_model = model_field.field.model
            related_field_name = model_field.field.name

            for item in values:
                # handed to the task by name/remote id, one call per item
                set_related_field.delay(
                    related_model.__name__,
                    instance.__class__.__name__,
                    related_field_name,
                    instance.remote_id,
                    item
                )
        return instance

    def serialize(self):
        ''' convert to dictionary with context attr

        Nested ActivityObject values are serialized recursively and
        attributes whose value is None are left out. '''
        data = {}
        for key, value in self.__dict__.items():
            if isinstance(value, ActivityObject):
                try:
                    value = value.serialize()
                except TypeError:
                    # best effort: keep the unserialized object
                    pass
            if value is not None:
                data[key] = value
        data['@context'] = 'https://www.w3.org/ns/activitystreams'
        return data
|
|
|
|
|
|
|
|
|
2020-12-08 17:43:12 +00:00
|
|
|
@app.task
@transaction.atomic
def set_related_field(
        model_name, origin_model_name, related_field_name,
        related_remote_id, data):
    ''' load reverse related fields (editions, attachments) without blocking

    model_name: name of the bookwyrm model to build from `data`
    origin_model_name: name of the bookwyrm model that triggered this task
    related_field_name: field on `model_name` pointing back at the origin
    related_remote_id: remote id of the origin instance
    data: either a remote id string or the activity data itself

    Raises ValueError when no origin instance has `related_remote_id`. '''
    model = apps.get_model('bookwyrm.%s' % model_name, require_ready=True)
    origin_model = apps.get_model(
        'bookwyrm.%s' % origin_model_name,
        require_ready=True
    )

    with transaction.atomic():
        if isinstance(data, str):
            # a remote id: use the local copy if there is one, else fetch it
            existing = model.find_existing_by_remote_id(data)
            if existing:
                data = existing.to_activity()
            else:
                data = get_data(data)
        activity = model.activity_serializer(**data)

        # this must exist because it's the object that triggered this function
        instance = origin_model.find_existing_by_remote_id(related_remote_id)
        if not instance:
            raise ValueError(
                'Invalid related remote id: %s' % related_remote_id)

        # set the origin's remote id on the activity so it will be there when
        # the model instance is created
        # edition.parentWork = instance, for example
        model_field = getattr(model, related_field_name)
        is_serialized = hasattr(model_field, 'activitypub_field')
        if is_serialized:
            setattr(
                activity,
                model_field.activitypub_field,
                instance.remote_id
            )
        item = activity.to_model()

        # to_model may return None (e.g. when the model ignores the
        # activity); there is nothing to attach in that case
        if item is None:
            return

        # if the related field isn't serialized (attachments on Status), then
        # we have to set it post-creation
        if not is_serialized:
            setattr(item, related_field_name, instance)
            item.save()
|
2020-12-08 17:43:12 +00:00
|
|
|
|
|
|
|
|
2021-02-16 19:04:13 +00:00
|
|
|
def get_model_from_type(activity_type):
    ''' find the model whose activity serializer has the given type

    Returns the first registered model that has an `activity_serializer`
    with a `type` equal to `activity_type`. Raises ActivitySerializerError
    when no model matches. '''
    for candidate in apps.get_models():
        if not hasattr(candidate, 'activity_serializer'):
            continue
        serializer = candidate.activity_serializer
        if hasattr(serializer, 'type') and serializer.type == activity_type:
            return candidate
    raise ActivitySerializerError(
        'No model found for activity type "%s"' % activity_type)
|
|
|
|
|
2021-02-17 02:59:26 +00:00
|
|
|
|
2021-02-16 19:04:13 +00:00
|
|
|
def resolve_remote_id(remote_id, model=None, refresh=False, save=True):
    ''' take a remote_id and return an instance, creating if necessary

    remote_id: the remote id to look up and, if needed, fetch
    model: model class to use; inferred from the fetched data's `type`
        when omitted
    refresh: when True, re-fetch and update even if an instance exists
    save: passed through to `to_model`

    Raises ActivitySerializerError when the remote host can't be reached. '''
    if model:  # a bonus check we can do if we already know the model
        result = model.find_existing_by_remote_id(remote_id)
        if result and not refresh:
            return result

    # load the data and create the object
    try:
        data = get_data(remote_id)
    except (ConnectorException, ConnectionError) as err:
        # model may still be None here, so don't assume it has a __name__
        model_name = getattr(model, '__name__', 'unknown')
        raise ActivitySerializerError(
            'Could not connect to host for remote_id in %s model: %s' % \
                (model_name, remote_id)) from err

    # determine the model implicitly, if not provided
    if not model:
        model = get_model_from_type(data.get('type'))

    # check for existing items with shared unique identifiers
    result = model.find_existing(data)
    if result and not refresh:
        return result

    item = model.activity_serializer(**data)
    # if we're refreshing, "result" will be set and we'll update it
    return item.to_model(model=model, instance=result, save=save)
|