mirror of
https://github.com/jointakahe/takahe.git
synced 2024-11-25 16:51:00 +00:00
770aa1531a
Fixes #187
483 lines
22 KiB
Python
483 lines
22 KiB
Python
import datetime
|
|
import os
|
|
import urllib.parse as urllib_parse
|
|
|
|
from dateutil import parser
|
|
from pyld import jsonld
|
|
from pyld.jsonld import JsonLdError
|
|
|
|
# Built-in JSON-LD context documents, served by builtin_document_loader().
#
# Keys are a context URL's hostname plus its path, with the scheme and any
# trailing slash removed. A key that starts with "*" is the fallback the
# loader tries when there is no exact hostname match, so it applies to that
# path on any host.
#
# Each value is returned by the loader unchanged and carries four entries:
# "contentType", "documentUrl", "contextUrl" and "document" (the context
# body itself).
schemas = {
    # ActivityStreams vocabulary
    "www.w3.org/ns/activitystreams": {
        "contentType": "application/ld+json",
        "documentUrl": "http://www.w3.org/ns/activitystreams",
        "contextUrl": None,
        "document": {
            "@context": {
                "@vocab": "_:",
                "xsd": "http://www.w3.org/2001/XMLSchema#",
                "as": "https://www.w3.org/ns/activitystreams#",
                "ldp": "http://www.w3.org/ns/ldp#",
                "vcard": "http://www.w3.org/2006/vcard/ns#",
                "id": "@id",
                "type": "@type",
                "Accept": "as:Accept",
                "Activity": "as:Activity",
                "IntransitiveActivity": "as:IntransitiveActivity",
                "Add": "as:Add",
                "Announce": "as:Announce",
                "Application": "as:Application",
                "Arrive": "as:Arrive",
                "Article": "as:Article",
                "Audio": "as:Audio",
                "Block": "as:Block",
                "Collection": "as:Collection",
                "CollectionPage": "as:CollectionPage",
                "Relationship": "as:Relationship",
                "Create": "as:Create",
                "Delete": "as:Delete",
                "Dislike": "as:Dislike",
                "Document": "as:Document",
                "Event": "as:Event",
                "Follow": "as:Follow",
                "Flag": "as:Flag",
                "Group": "as:Group",
                "Ignore": "as:Ignore",
                "Image": "as:Image",
                "Invite": "as:Invite",
                "Join": "as:Join",
                "Leave": "as:Leave",
                "Like": "as:Like",
                "Link": "as:Link",
                "Mention": "as:Mention",
                "Note": "as:Note",
                "Object": "as:Object",
                "Offer": "as:Offer",
                "OrderedCollection": "as:OrderedCollection",
                "OrderedCollectionPage": "as:OrderedCollectionPage",
                "Organization": "as:Organization",
                "Page": "as:Page",
                "Person": "as:Person",
                "Place": "as:Place",
                "Profile": "as:Profile",
                "Question": "as:Question",
                "Reject": "as:Reject",
                "Remove": "as:Remove",
                "Service": "as:Service",
                "TentativeAccept": "as:TentativeAccept",
                "TentativeReject": "as:TentativeReject",
                "Tombstone": "as:Tombstone",
                "Undo": "as:Undo",
                "Update": "as:Update",
                "Video": "as:Video",
                "View": "as:View",
                "Listen": "as:Listen",
                "Read": "as:Read",
                "Move": "as:Move",
                "Travel": "as:Travel",
                "IsFollowing": "as:IsFollowing",
                "IsFollowedBy": "as:IsFollowedBy",
                "IsContact": "as:IsContact",
                "IsMember": "as:IsMember",
                "subject": {"@id": "as:subject", "@type": "@id"},
                "relationship": {"@id": "as:relationship", "@type": "@id"},
                "actor": {"@id": "as:actor", "@type": "@id"},
                "attributedTo": {"@id": "as:attributedTo", "@type": "@id"},
                "attachment": {"@id": "as:attachment", "@type": "@id"},
                "bcc": {"@id": "as:bcc", "@type": "@id"},
                "bto": {"@id": "as:bto", "@type": "@id"},
                "cc": {"@id": "as:cc", "@type": "@id"},
                "context": {"@id": "as:context", "@type": "@id"},
                "current": {"@id": "as:current", "@type": "@id"},
                "first": {"@id": "as:first", "@type": "@id"},
                "generator": {"@id": "as:generator", "@type": "@id"},
                "icon": {"@id": "as:icon", "@type": "@id"},
                "image": {"@id": "as:image", "@type": "@id"},
                "inReplyTo": {"@id": "as:inReplyTo", "@type": "@id"},
                "items": {"@id": "as:items", "@type": "@id"},
                "instrument": {"@id": "as:instrument", "@type": "@id"},
                # Same IRI as "items", but held in an ordered @list container
                "orderedItems": {
                    "@id": "as:items",
                    "@type": "@id",
                    "@container": "@list",
                },
                "last": {"@id": "as:last", "@type": "@id"},
                "location": {"@id": "as:location", "@type": "@id"},
                "next": {"@id": "as:next", "@type": "@id"},
                "object": {"@id": "as:object", "@type": "@id"},
                "oneOf": {"@id": "as:oneOf", "@type": "@id"},
                "anyOf": {"@id": "as:anyOf", "@type": "@id"},
                "closed": {"@id": "as:closed", "@type": "xsd:dateTime"},
                "origin": {"@id": "as:origin", "@type": "@id"},
                "accuracy": {"@id": "as:accuracy", "@type": "xsd:float"},
                "prev": {"@id": "as:prev", "@type": "@id"},
                "preview": {"@id": "as:preview", "@type": "@id"},
                "replies": {"@id": "as:replies", "@type": "@id"},
                "result": {"@id": "as:result", "@type": "@id"},
                "audience": {"@id": "as:audience", "@type": "@id"},
                "partOf": {"@id": "as:partOf", "@type": "@id"},
                "tag": {"@id": "as:tag", "@type": "@id"},
                "target": {"@id": "as:target", "@type": "@id"},
                "to": {"@id": "as:to", "@type": "@id"},
                "url": {"@id": "as:url", "@type": "@id"},
                "altitude": {"@id": "as:altitude", "@type": "xsd:float"},
                "content": "as:content",
                "contentMap": {"@id": "as:content", "@container": "@language"},
                "name": "as:name",
                "nameMap": {"@id": "as:name", "@container": "@language"},
                "duration": {"@id": "as:duration", "@type": "xsd:duration"},
                "endTime": {"@id": "as:endTime", "@type": "xsd:dateTime"},
                "height": {"@id": "as:height", "@type": "xsd:nonNegativeInteger"},
                "href": {"@id": "as:href", "@type": "@id"},
                "hreflang": "as:hreflang",
                "latitude": {"@id": "as:latitude", "@type": "xsd:float"},
                "longitude": {"@id": "as:longitude", "@type": "xsd:float"},
                "mediaType": "as:mediaType",
                "published": {"@id": "as:published", "@type": "xsd:dateTime"},
                "radius": {"@id": "as:radius", "@type": "xsd:float"},
                "rel": "as:rel",
                "startIndex": {
                    "@id": "as:startIndex",
                    "@type": "xsd:nonNegativeInteger",
                },
                "startTime": {"@id": "as:startTime", "@type": "xsd:dateTime"},
                "summary": "as:summary",
                "summaryMap": {"@id": "as:summary", "@container": "@language"},
                "totalItems": {
                    "@id": "as:totalItems",
                    "@type": "xsd:nonNegativeInteger",
                },
                "units": "as:units",
                "updated": {"@id": "as:updated", "@type": "xsd:dateTime"},
                "width": {"@id": "as:width", "@type": "xsd:nonNegativeInteger"},
                "describes": {"@id": "as:describes", "@type": "@id"},
                "formerType": {"@id": "as:formerType", "@type": "@id"},
                "deleted": {"@id": "as:deleted", "@type": "xsd:dateTime"},
                # "inbox" is the one actor endpoint mapped into the ldp: namespace
                "inbox": {"@id": "ldp:inbox", "@type": "@id"},
                "outbox": {"@id": "as:outbox", "@type": "@id"},
                "following": {"@id": "as:following", "@type": "@id"},
                "followers": {"@id": "as:followers", "@type": "@id"},
                "streams": {"@id": "as:streams", "@type": "@id"},
                "preferredUsername": "as:preferredUsername",
                "endpoints": {"@id": "as:endpoints", "@type": "@id"},
                "uploadMedia": {"@id": "as:uploadMedia", "@type": "@id"},
                "proxyUrl": {"@id": "as:proxyUrl", "@type": "@id"},
                "liked": {"@id": "as:liked", "@type": "@id"},
                "oauthAuthorizationEndpoint": {
                    "@id": "as:oauthAuthorizationEndpoint",
                    "@type": "@id",
                },
                "oauthTokenEndpoint": {"@id": "as:oauthTokenEndpoint", "@type": "@id"},
                "provideClientKey": {"@id": "as:provideClientKey", "@type": "@id"},
                "signClientKey": {"@id": "as:signClientKey", "@type": "@id"},
                "sharedInbox": {"@id": "as:sharedInbox", "@type": "@id"},
                "Public": {"@id": "as:Public", "@type": "@id"},
                "source": "as:source",
                "likes": {"@id": "as:likes", "@type": "@id"},
                "shares": {"@id": "as:shares", "@type": "@id"},
                "alsoKnownAs": {"@id": "as:alsoKnownAs", "@type": "@id"},
            }
        },
    },
    # Security vocabulary (keys, signatures, encryption terms)
    "w3id.org/security/v1": {
        "contentType": "application/ld+json",
        "documentUrl": "http://w3id.org/security/v1",
        "contextUrl": None,
        "document": {
            "@context": {
                "id": "@id",
                "type": "@type",
                "dc": "http://purl.org/dc/terms/",
                "sec": "https://w3id.org/security#",
                "xsd": "http://www.w3.org/2001/XMLSchema#",
                "EcdsaKoblitzSignature2016": "sec:EcdsaKoblitzSignature2016",
                "Ed25519Signature2018": "sec:Ed25519Signature2018",
                "EncryptedMessage": "sec:EncryptedMessage",
                "GraphSignature2012": "sec:GraphSignature2012",
                "LinkedDataSignature2015": "sec:LinkedDataSignature2015",
                "LinkedDataSignature2016": "sec:LinkedDataSignature2016",
                "CryptographicKey": "sec:Key",
                "authenticationTag": "sec:authenticationTag",
                "canonicalizationAlgorithm": "sec:canonicalizationAlgorithm",
                "cipherAlgorithm": "sec:cipherAlgorithm",
                "cipherData": "sec:cipherData",
                "cipherKey": "sec:cipherKey",
                "created": {"@id": "dc:created", "@type": "xsd:dateTime"},
                "creator": {"@id": "dc:creator", "@type": "@id"},
                "digestAlgorithm": "sec:digestAlgorithm",
                "digestValue": "sec:digestValue",
                "domain": "sec:domain",
                "encryptionKey": "sec:encryptionKey",
                # "expiration" and "expires" both map to sec:expiration
                "expiration": {"@id": "sec:expiration", "@type": "xsd:dateTime"},
                "expires": {"@id": "sec:expiration", "@type": "xsd:dateTime"},
                "initializationVector": "sec:initializationVector",
                "iterationCount": "sec:iterationCount",
                "nonce": "sec:nonce",
                "normalizationAlgorithm": "sec:normalizationAlgorithm",
                "owner": {"@id": "sec:owner", "@type": "@id"},
                "password": "sec:password",
                "privateKey": {"@id": "sec:privateKey", "@type": "@id"},
                "privateKeyPem": "sec:privateKeyPem",
                "publicKey": {"@id": "sec:publicKey", "@type": "@id"},
                "publicKeyBase58": "sec:publicKeyBase58",
                "publicKeyPem": "sec:publicKeyPem",
                "publicKeyWif": "sec:publicKeyWif",
                "publicKeyService": {"@id": "sec:publicKeyService", "@type": "@id"},
                "revoked": {"@id": "sec:revoked", "@type": "xsd:dateTime"},
                "salt": "sec:salt",
                "signature": "sec:signature",
                # Note the IRI here is "signingAlgorithm", unlike the
                # identity/v1 entry below which uses "signatureAlgorithm"
                "signatureAlgorithm": "sec:signingAlgorithm",
                "signatureValue": "sec:signatureValue",
            }
        },
    },
    # Identity vocabulary (credentials, schema.org person/address terms,
    # plus a subset of the security terms)
    "w3id.org/identity/v1": {
        "contentType": "application/ld+json",
        "documentUrl": "http://w3id.org/identity/v1",
        "contextUrl": None,
        "document": {
            "@context": {
                "id": "@id",
                "type": "@type",
                "cred": "https://w3id.org/credentials#",
                "dc": "http://purl.org/dc/terms/",
                "identity": "https://w3id.org/identity#",
                "perm": "https://w3id.org/permissions#",
                "ps": "https://w3id.org/payswarm#",
                "rdf": "http://www.w3.org/1999/02/22-rdf-syntax-ns#",
                "rdfs": "http://www.w3.org/2000/01/rdf-schema#",
                "sec": "https://w3id.org/security#",
                "schema": "http://schema.org/",
                "xsd": "http://www.w3.org/2001/XMLSchema#",
                "Group": "https://www.w3.org/ns/activitystreams#Group",
                "claim": {"@id": "cred:claim", "@type": "@id"},
                "credential": {"@id": "cred:credential", "@type": "@id"},
                "issued": {"@id": "cred:issued", "@type": "xsd:dateTime"},
                "issuer": {"@id": "cred:issuer", "@type": "@id"},
                "recipient": {"@id": "cred:recipient", "@type": "@id"},
                "Credential": "cred:Credential",
                "CryptographicKeyCredential": "cred:CryptographicKeyCredential",
                "about": {"@id": "schema:about", "@type": "@id"},
                "address": {"@id": "schema:address", "@type": "@id"},
                "addressCountry": "schema:addressCountry",
                "addressLocality": "schema:addressLocality",
                "addressRegion": "schema:addressRegion",
                "comment": "rdfs:comment",
                "created": {"@id": "dc:created", "@type": "xsd:dateTime"},
                "creator": {"@id": "dc:creator", "@type": "@id"},
                "description": "schema:description",
                "email": "schema:email",
                "familyName": "schema:familyName",
                "givenName": "schema:givenName",
                "image": {"@id": "schema:image", "@type": "@id"},
                "label": "rdfs:label",
                "name": "schema:name",
                "postalCode": "schema:postalCode",
                "streetAddress": "schema:streetAddress",
                "title": "dc:title",
                "url": {"@id": "schema:url", "@type": "@id"},
                "Person": "schema:Person",
                "PostalAddress": "schema:PostalAddress",
                "Organization": "schema:Organization",
                "identityService": {"@id": "identity:identityService", "@type": "@id"},
                "idp": {"@id": "identity:idp", "@type": "@id"},
                "Identity": "identity:Identity",
                "paymentProcessor": "ps:processor",
                "preferences": {"@id": "ps:preferences", "@type": "@vocab"},
                "cipherAlgorithm": "sec:cipherAlgorithm",
                "cipherData": "sec:cipherData",
                "cipherKey": "sec:cipherKey",
                "digestAlgorithm": "sec:digestAlgorithm",
                "digestValue": "sec:digestValue",
                "domain": "sec:domain",
                "expires": {"@id": "sec:expiration", "@type": "xsd:dateTime"},
                "initializationVector": "sec:initializationVector",
                "member": {"@id": "schema:member", "@type": "@id"},
                "memberOf": {"@id": "schema:memberOf", "@type": "@id"},
                "nonce": "sec:nonce",
                "normalizationAlgorithm": "sec:normalizationAlgorithm",
                "owner": {"@id": "sec:owner", "@type": "@id"},
                "password": "sec:password",
                "privateKey": {"@id": "sec:privateKey", "@type": "@id"},
                "privateKeyPem": "sec:privateKeyPem",
                "publicKey": {"@id": "sec:publicKey", "@type": "@id"},
                "publicKeyPem": "sec:publicKeyPem",
                "publicKeyService": {"@id": "sec:publicKeyService", "@type": "@id"},
                "revoked": {"@id": "sec:revoked", "@type": "xsd:dateTime"},
                "signature": "sec:signature",
                "signatureAlgorithm": "sec:signatureAlgorithm",
                "signatureValue": "sec:signatureValue",
                "CryptographicKey": "sec:Key",
                "EncryptedMessage": "sec:EncryptedMessage",
                "GraphSignature2012": "sec:GraphSignature2012",
                "LinkedDataSignature2015": "sec:LinkedDataSignature2015",
                "accessControl": {"@id": "perm:accessControl", "@type": "@id"},
                "writePermission": {"@id": "perm:writePermission", "@type": "@id"},
            }
        },
    },
    # Wildcard entry: matches /schemas/litepub-0.1.jsonld on any hostname.
    "*/schemas/litepub-0.1.jsonld": {
        "contentType": "application/ld+json",
        # NOTE(review): this documentUrl is identical to the one on the
        # w3id.org/security/v1 entry above, which looks like a copy-paste
        # leftover — confirm what value is intended for a wildcard entry.
        "documentUrl": "http://w3id.org/security/v1",
        "contextUrl": None,
        "document": {
            # This context is a list: two referenced contexts (which the
            # table above also provides) followed by inline term definitions.
            "@context": [
                "https://www.w3.org/ns/activitystreams",
                "https://w3id.org/security/v1",
                {
                    "Emoji": "toot:Emoji",
                    "Hashtag": "as:Hashtag",
                    "PropertyValue": "schema:PropertyValue",
                    "atomUri": "ostatus:atomUri",
                    "conversation": {"@id": "ostatus:conversation", "@type": "@id"},
                    "discoverable": "toot:discoverable",
                    "manuallyApprovesFollowers": "as:manuallyApprovesFollowers",
                    "capabilities": "litepub:capabilities",
                    "ostatus": "http://ostatus.org#",
                    "schema": "http://schema.org#",
                    "toot": "http://joinmastodon.org/ns#",
                    "misskey": "https://misskey-hub.net/ns#",
                    "fedibird": "http://fedibird.com/ns#",
                    "value": "schema:value",
                    "sensitive": "as:sensitive",
                    "litepub": "http://litepub.social/ns#",
                    "invisible": "litepub:invisible",
                    "directMessage": "litepub:directMessage",
                    "listMessage": {"@id": "litepub:listMessage", "@type": "@id"},
                    "quoteUrl": "as:quoteUrl",
                    "quoteUri": "fedibird:quoteUri",
                    "oauthRegistrationEndpoint": {
                        "@id": "litepub:oauthRegistrationEndpoint",
                        "@type": "@id",
                    },
                    "EmojiReact": "litepub:EmojiReact",
                    "ChatMessage": "litepub:ChatMessage",
                    "alsoKnownAs": {"@id": "as:alsoKnownAs", "@type": "@id"},
                    "vcard": "http://www.w3.org/2006/vcard/ns#",
                    "formerRepresentations": "litepub:formerRepresentations",
                },
            ]
        },
    },
    # The document here is empty, so this entry defines no terms itself;
    # canonicalise() declares the "toot:" terms it uses inline in its own
    # context.
    "joinmastodon.org/ns": {
        "contentType": "application/ld+json",
        "documentUrl": "http://joinmastodon.org/ns",
        "contextUrl": None,
        "document": {},
    },
}
|
|
|
|
# strftime patterns for timestamp strings.
# Second precision with a literal "Z" suffix; used by format_ld_date().
DATETIME_FORMAT = "%Y-%m-%dT%H:%M:%SZ"
# Second precision with a literal "+00:00" offset instead of "Z".
DATETIME_TZ_FORMAT = "%Y-%m-%dT%H:%M:%S+00:00"
# Fractional seconds (%f) with a literal "Z" suffix.
DATETIME_MS_FORMAT = "%Y-%m-%dT%H:%M:%S.%fZ"
|
|
|
|
|
|
def builtin_document_loader(url: str, options: dict | None = None):
    """
    JSON-LD document loader that answers from the module-level ``schemas``
    table instead of retrieving the URL.

    The lookup key is the URL's hostname followed by its path with any
    trailing slash removed; the scheme is ignored. When there is no exact
    entry, a wildcard key of ``"*"`` plus the same path is tried, which lets
    a schema match on any host.

    ``options`` is part of the loader call signature but is not used here.

    Returns the matching ``schemas`` entry as-is (the same dict object on
    every call, so callers should treat it as read-only).

    Raises JsonLdError with code "loading document failed" when the URL has
    no hostname or when no built-in schema matches.
    """
    # Get URL without scheme
    pieces = urllib_parse.urlparse(url)
    if pieces.hostname is None:
        raise JsonLdError(
            f"No schema built-in for {url!r}",
            "jsonld.LoadDocumentError",
            code="loading document failed",
            cause="NoHostnameError",
        )
    path = pieces.path.rstrip("/")
    key = pieces.hostname + path
    # Exact host match first, then the any-host wildcard entry
    for candidate in (key, "*" + path):
        if candidate in schemas:
            return schemas[candidate]
    # Report the host-qualified key so the message says what was asked for,
    # not the wildcard fallback that was tried last.
    raise JsonLdError(
        f"No schema built-in for {key!r}",
        "jsonld.LoadDocumentError",
        code="loading document failed",
        cause="KeyError",
    )
|
|
|
|
|
|
def canonicalise(json_data: dict, include_security: bool = False) -> dict:
    """
    Given an ActivityPub JSON-LD document, round-trips it through the LD
    systems (expand, then compact) to end up in a canonicalised, compacted
    format.

    If the document has no "@context", the default context built below is
    supplied for the expansion step. The caller's dict is not modified; a
    shallow copy carrying the context is expanded instead.

    The result is always compacted against the default context. When
    ``include_security`` is true, "https://w3id.org/security/v1" is appended
    to that context.

    For most well-structured incoming data this won't actually do anything,
    but it's probably good to abide by the spec.

    Raises ValueError if ``json_data`` is not a dict.
    """
    if not isinstance(json_data, dict):
        raise ValueError("Pass decoded JSON data into LDDocument")
    context = [
        "https://www.w3.org/ns/activitystreams",
        {
            "blurhash": "toot:blurhash",
            "Emoji": "toot:Emoji",
            "focalPoint": {"@container": "@list", "@id": "toot:focalPoint"},
            "Hashtag": "as:Hashtag",
            "manuallyApprovesFollowers": "as:manuallyApprovesFollowers",
            "Public": "as:Public",
            "sensitive": "as:sensitive",
            "toot": "http://joinmastodon.org/ns#",
            "votersCount": "toot:votersCount",
        },
    ]
    if include_security:
        context.append("https://w3id.org/security/v1")
    if "@context" not in json_data:
        # Work on a copy so the caller's document is left untouched
        json_data = {**json_data, "@context": context}

    return jsonld.compact(jsonld.expand(json_data), context)
|
|
|
|
|
|
def get_list(container, key) -> list:
    """
    Looks up ``key`` in ``container`` and normalises the result to a list.

    JSON-LD values may be a single item or a list of items: a missing key
    gives an empty list, a list is returned as-is (the same object), and
    anything else is wrapped in a one-element list.
    """
    if key in container:
        found = container[key]
        return found if isinstance(found, list) else [found]
    return []
|
|
|
|
|
|
def format_ld_date(value: datetime.datetime) -> str:
    """
    Formats a datetime as a timestamp string using DATETIME_FORMAT.

    That format ends in a literal "Z", so a timezone-aware value is
    converted to UTC before formatting; otherwise a value carrying another
    offset would be written with the wrong instant. Naive values are
    formatted unchanged (they are taken to be UTC already).
    """
    if value.utcoffset() is not None:
        value = value.astimezone(datetime.timezone.utc)
    return value.strftime(DATETIME_FORMAT)
|
|
|
|
|
|
def parse_ld_date(value: str | None) -> datetime.datetime | None:
|
|
if value is None:
|
|
return None
|
|
return parser.isoparse(value).replace(microsecond=0)
|
|
|
|
|
|
def get_first_image_url(data) -> str | None:
|
|
"""
|
|
'icon' and 'image' fields might be a dict or a list. Return the first
|
|
'url' for something that looks to be for an image.
|
|
"""
|
|
if isinstance(data, list):
|
|
for itm in data:
|
|
if isinstance(itm, dict) and "url" in itm:
|
|
return itm["url"]
|
|
elif isinstance(data, dict):
|
|
return data.get("url")
|
|
return None
|
|
|
|
|
|
def media_type_from_filename(filename):
    """
    Guesses an image media type from a filename's extension.

    The extension is compared case-insensitively, so "photo.JPG" and
    "photo.jpg" give the same answer. Recognised extensions are .png,
    .jpg/.jpeg, .gif, .apng and .webp; anything else (including no
    extension at all) returns "application/octet-stream".
    """
    known_types = {
        ".png": "image/png",
        ".jpg": "image/jpeg",
        ".jpeg": "image/jpeg",
        ".gif": "image/gif",
        ".apng": "image/apng",
        ".webp": "image/webp",
    }
    _, extension = os.path.splitext(filename)
    # Extensions often arrive upper- or mixed-case, so normalise first
    return known_types.get(extension.lower(), "application/octet-stream")
|