From 0354e53eea491c9aeff605133d709c67879f86cf Mon Sep 17 00:00:00 2001
From: Joeri de Ruiter <jderuiter@noreply.github.com>
Date: Sun, 23 Jul 2023 20:50:44 +0200
Subject: [PATCH 1/8] Type annotations for utils

---
 bookwyrm/activitypub/base_activity.py |  21 +++--
 bookwyrm/activitypub/book.py          |  34 ++++----
 bookwyrm/models/author.py             |   4 +-
 bookwyrm/utils/cache.py               |   9 +-
 bookwyrm/utils/isni.py                | 116 ++++++++++++++++++--------
 bookwyrm/utils/log.py                 |   2 +-
 bookwyrm/utils/sanitizer.py           |   2 +-
 bookwyrm/utils/validate.py            |   4 +-
 mypy.ini                              |   4 +
 9 files changed, 130 insertions(+), 66 deletions(-)

diff --git a/bookwyrm/activitypub/base_activity.py b/bookwyrm/activitypub/base_activity.py
index c78b4f195..9e2545fc4 100644
--- a/bookwyrm/activitypub/base_activity.py
+++ b/bookwyrm/activitypub/base_activity.py
@@ -1,7 +1,10 @@
 """ basics for an activitypub serializer """
+from __future__ import annotations
 from dataclasses import dataclass, fields, MISSING
 from json import JSONEncoder
 import logging
+from typing import Optional, Type, TypeVar
+
 import requests
 
 from django.apps import apps
@@ -10,6 +13,7 @@ from django.utils.http import http_date
 
 from bookwyrm import models
 from bookwyrm.connectors import ConnectorException, get_data
+from bookwyrm.models.base_model import BookWyrmModel
 from bookwyrm.signatures import make_signature
 from bookwyrm.settings import DOMAIN, INSTANCE_ACTOR_USERNAME
 from bookwyrm.tasks import app, MISC
@@ -58,6 +62,9 @@ def naive_parse(activity_objects, activity_json, serializer=None):
     return serializer(activity_objects=activity_objects, **activity_json)
 
 
+TModel = TypeVar("TModel", bound=BookWyrmModel)
+
+
 @dataclass(init=False)
 class ActivityObject:
     """actor activitypub json"""
@@ -101,13 +108,13 @@ class ActivityObject:
     # pylint: disable=too-many-locals,too-many-branches,too-many-arguments
     def to_model(
         self,
-        model=None,
-        instance=None,
-        allow_create=True,
-        save=True,
-        overwrite=True,
-        allow_external_connections=True,
-    ):
+        model: Optional[Type[TModel]] = None,
+        instance: Optional[TModel] = None,
+        allow_create: bool = True,
+        save: bool = True,
+        overwrite: bool = True,
+        allow_external_connections: bool = True,
+    ) -> Optional[TModel]:
         """convert from an activity to a model instance. Args:
         model: the django model that this object is being converted to
             (will guess if not known)
diff --git a/bookwyrm/activitypub/book.py b/bookwyrm/activitypub/book.py
index d3aca4471..31543fcac 100644
--- a/bookwyrm/activitypub/book.py
+++ b/bookwyrm/activitypub/book.py
@@ -1,6 +1,6 @@
 """ book and author data """
 from dataclasses import dataclass, field
-from typing import List
+from typing import List, Optional
 
 from .base_activity import ActivityObject
 from .image import Document
@@ -11,17 +11,17 @@ from .image import Document
 class BookData(ActivityObject):
     """shared fields for all book data and authors"""
 
-    openlibraryKey: str = None
-    inventaireId: str = None
-    librarythingKey: str = None
-    goodreadsKey: str = None
-    bnfId: str = None
-    viaf: str = None
-    wikidata: str = None
-    asin: str = None
-    aasin: str = None
-    isfdb: str = None
-    lastEditedBy: str = None
+    openlibraryKey: Optional[str] = None
+    inventaireId: Optional[str] = None
+    librarythingKey: Optional[str] = None
+    goodreadsKey: Optional[str] = None
+    bnfId: Optional[str] = None
+    viaf: Optional[str] = None
+    wikidata: Optional[str] = None
+    asin: Optional[str] = None
+    aasin: Optional[str] = None
+    isfdb: Optional[str] = None
+    lastEditedBy: Optional[str] = None
     links: List[str] = field(default_factory=lambda: [])
     fileLinks: List[str] = field(default_factory=lambda: [])
 
@@ -83,11 +83,11 @@ class Author(BookData):
     """author of a book"""
 
     name: str
-    isni: str = None
-    viafId: str = None
-    gutenbergId: str = None
-    born: str = None
-    died: str = None
+    isni: Optional[str] = None
+    viafId: Optional[str] = None
+    gutenbergId: Optional[str] = None
+    born: Optional[str] = None
+    died: Optional[str] = None
     aliases: List[str] = field(default_factory=lambda: [])
     bio: str = ""
     wikipediaLink: str = ""
diff --git a/bookwyrm/models/author.py b/bookwyrm/models/author.py
index 5c0c087b2..981e3c0cc 100644
--- a/bookwyrm/models/author.py
+++ b/bookwyrm/models/author.py
@@ -1,5 +1,7 @@
 """ database schema for info about authors """
 import re
+from typing import Tuple, Any
+
 from django.contrib.postgres.indexes import GinIndex
 from django.db import models
 
@@ -38,7 +40,7 @@ class Author(BookDataModel):
     )
     bio = fields.HtmlField(null=True, blank=True)
 
-    def save(self, *args, **kwargs):
+    def save(self, *args: Tuple[Any, ...], **kwargs: dict[str, Any]) -> None:
         """normalize isni format"""
         if self.isni:
             self.isni = re.sub(r"\s", "", self.isni)
diff --git a/bookwyrm/utils/cache.py b/bookwyrm/utils/cache.py
index aebb8e754..5e896e621 100644
--- a/bookwyrm/utils/cache.py
+++ b/bookwyrm/utils/cache.py
@@ -1,8 +1,15 @@
 """ Custom handler for caching """
+from typing import Any, Callable, Tuple, Union
+
 from django.core.cache import cache
 
 
-def get_or_set(cache_key, function, *args, timeout=None):
+def get_or_set(
+    cache_key: str,
+    function: Callable[..., Any],
+    *args: Tuple[Any, ...],
+    timeout: Union[float, None] = None
+) -> Any:
     """Django's built-in get_or_set isn't cutting it"""
     value = cache.get(cache_key)
     if value is None:
diff --git a/bookwyrm/utils/isni.py b/bookwyrm/utils/isni.py
index 318de30ef..6c4200660 100644
--- a/bookwyrm/utils/isni.py
+++ b/bookwyrm/utils/isni.py
@@ -1,15 +1,24 @@
 """ISNI author checking utilities"""
 import xml.etree.ElementTree as ET
+from typing import Union, Optional
+
 import requests
 
 from bookwyrm import activitypub, models
 
 
-def request_isni_data(search_index, search_term, max_records=5):
+def get_element_text(element: Optional[ET.Element]) -> str:
+    """If the element is not None and there is a text attribute return this"""
+    if element is not None and element.text is not None:
+        return element.text
+    return ""
+
+
+def request_isni_data(search_index: str, search_term: str, max_records: int = 5) -> str:
     """Request data from the ISNI API"""
 
     search_string = f'{search_index}="{search_term}"'
-    query_params = {
+    query_params: dict[str, Union[str, int]] = {
         "query": search_string,
         "version": "1.1",
         "operation": "searchRetrieve",
@@ -26,41 +35,52 @@ def request_isni_data(search_index, search_term, max_records=5):
     return result.text
 
 
-def make_name_string(element):
+def make_name_string(element: ET.Element) -> str:
     """create a string of form 'personal_name surname'"""
 
     # NOTE: this will often be incorrect, many naming systems
     # list "surname" before personal name
     forename = element.find(".//forename")
     surname = element.find(".//surname")
-    if forename is not None:
-        return "".join([forename.text, " ", surname.text])
-    return surname.text
+
+    forename_text = get_element_text(forename)
+    surname_text = get_element_text(surname)
+
+    return "".join(
+        [forename_text, " " if forename_text and surname_text else "", surname_text]
+    )
 
 
-def get_other_identifier(element, code):
+def get_other_identifier(element: ET.Element, code: str) -> str:
     """Get other identifiers associated with an author from their ISNI record"""
 
     identifiers = element.findall(".//otherIdentifierOfIdentity")
     for section_head in identifiers:
         if (
-            section_head.find(".//type") is not None
-            and section_head.find(".//type").text == code
-            and section_head.find(".//identifier") is not None
+            (section_type := section_head.find(".//type")) is not None
+            and section_type.text is not None
+            and section_type.text == code
+            and (identifier := section_head.find(".//identifier")) is not None
+            and identifier.text is not None
         ):
-            return section_head.find(".//identifier").text
+            return identifier.text
 
     # if we can't find it in otherIdentifierOfIdentity,
     # try sources
     for source in element.findall(".//sources"):
-        code_of_source = source.find(".//codeOfSource")
-        if code_of_source is not None and code_of_source.text.lower() == code.lower():
-            return source.find(".//sourceIdentifier").text
+        if (
+            (code_of_source := source.find(".//codeOfSource")) is not None
+            and code_of_source.text is not None
+            and code_of_source.text.lower() == code.lower()
+            and (source_identifier := source.find(".//sourceIdentifier")) is not None
+            and source_identifier.text is not None
+        ):
+            return source_identifier.text
 
     return ""
 
 
-def get_external_information_uri(element, match_string):
+def get_external_information_uri(element: ET.Element, match_string: str) -> str:
     """Get URLs associated with an author from their ISNI record"""
 
     sources = element.findall(".//externalInformation")
@@ -69,14 +89,18 @@ def get_external_information_uri(element, match_string):
         uri = source.find(".//URI")
         if (
             uri is not None
+            and uri.text is not None
             and information is not None
+            and information.text is not None
             and information.text.lower() == match_string.lower()
         ):
             return uri.text
     return ""
 
 
-def find_authors_by_name(name_string, description=False):
+def find_authors_by_name(
+    name_string: str, description: bool = False
+) -> list[activitypub.Author]:
     """Query the ISNI database for possible author matches by name"""
 
     payload = request_isni_data("pica.na", name_string)
@@ -92,7 +116,11 @@ def find_authors_by_name(name_string, description=False):
         if not personal_name:
             continue
 
-        author = get_author_from_isni(element.find(".//isniUnformatted").text)
+        author = get_author_from_isni(
+            get_element_text(element.find(".//isniUnformatted"))
+        )
+        if author is None:
+            continue
 
         if bool(description):
 
@@ -111,22 +139,23 @@ def find_authors_by_name(name_string, description=False):
                 # some of the "titles" in ISNI are a little ...iffy
                 # @ is used by ISNI/OCLC to index the starting point ignoring stop words
                 # (e.g. "The @Government of no one")
-                title_elements = [
-                    e
-                    for e in titles
-                    if hasattr(e, "text") and not e.text.replace("@", "").isnumeric()
-                ]
-                if len(title_elements):
-                    author.bio = title_elements[0].text.replace("@", "")
-                else:
-                    author.bio = None
+                author.bio = ""
+                for title in titles:
+                    if (
+                        title is not None
+                        and hasattr(title, "text")
+                        and title.text is not None
+                        and not title.text.replace("@", "").isnumeric()
+                    ):
+                        author.bio = title.text.replace("@", "")
+                        break
 
         possible_authors.append(author)
 
     return possible_authors
 
 
-def get_author_from_isni(isni):
+def get_author_from_isni(isni: str) -> Optional[activitypub.Author]:
     """Find data to populate a new author record from their ISNI"""
 
     payload = request_isni_data("pica.isn", isni)
@@ -135,25 +164,32 @@ def get_author_from_isni(isni):
     # there should only be a single responseRecord
     # but let's use the first one just in case
     element = root.find(".//responseRecord")
-    name = make_name_string(element.find(".//forename/.."))
+    if element is None:
+        # TODO What if there is no responseRecord?
+        #  return empty Author or None, or raise Exception?
+        return None
+
+    name = (
+        make_name_string(forename)
+        if (forename := element.find(".//forename/..")) is not None
+        else ""
+    )
     viaf = get_other_identifier(element, "viaf")
     # use a set to dedupe aliases in ISNI
     aliases = set()
     aliases_element = element.findall(".//personalNameVariant")
     for entry in aliases_element:
         aliases.add(make_name_string(entry))
-    # aliases needs to be list not set
-    aliases = list(aliases)
-    bio = element.find(".//nameTitle")
-    bio = bio.text if bio is not None else ""
+    bio = get_element_text(element.find(".//nameTitle"))
     wikipedia = get_external_information_uri(element, "Wikipedia")
 
     author = activitypub.Author(
-        id=element.find(".//isniURI").text,
+        id=get_element_text(element.find(".//isniURI")),
         name=name,
         isni=isni,
         viafId=viaf,
-        aliases=aliases,
+        # aliases needs to be list not set
+        aliases=list(aliases),
         bio=bio,
         wikipediaLink=wikipedia,
     )
@@ -161,21 +197,27 @@ def get_author_from_isni(isni):
     return author
 
 
-def build_author_from_isni(match_value):
+def build_author_from_isni(match_value: str) -> dict[str, activitypub.Author]:
     """Build basic author class object from ISNI URL"""
 
     # if it is an isni value get the data
     if match_value.startswith("https://isni.org/isni/"):
         isni = match_value.replace("https://isni.org/isni/", "")
-        return {"author": get_author_from_isni(isni)}
+        author = get_author_from_isni(isni)
+        if author is not None:
+            return {"author": author}
     # otherwise it's a name string
     return {}
 
 
-def augment_author_metadata(author, isni):
+def augment_author_metadata(author: models.Author, isni: str) -> None:
     """Update any missing author fields from ISNI data"""
 
     isni_author = get_author_from_isni(isni)
+    if isni_author is None:
+        # TODO Should we just return or raise an exception to indicate a problem?
+        return
+
     isni_author.to_model(model=models.Author, instance=author, overwrite=False)
 
     # we DO want to overwrite aliases because we're adding them to the
diff --git a/bookwyrm/utils/log.py b/bookwyrm/utils/log.py
index 70f32ef03..7a4a2f898 100644
--- a/bookwyrm/utils/log.py
+++ b/bookwyrm/utils/log.py
@@ -10,7 +10,7 @@ class IgnoreVariableDoesNotExist(logging.Filter):
     these errors are not useful to us.
     """
 
-    def filter(self, record):
+    def filter(self, record: logging.LogRecord) -> bool:
         if record.exc_info:
             (_, err_value, _) = record.exc_info
             while err_value:
diff --git a/bookwyrm/utils/sanitizer.py b/bookwyrm/utils/sanitizer.py
index 2fd0ff4ff..4f5132c9e 100644
--- a/bookwyrm/utils/sanitizer.py
+++ b/bookwyrm/utils/sanitizer.py
@@ -2,7 +2,7 @@
 import bleach
 
 
-def clean(input_text):
+def clean(input_text: str) -> str:
     """Run through "bleach" """
     return bleach.clean(
         input_text,
diff --git a/bookwyrm/utils/validate.py b/bookwyrm/utils/validate.py
index b91add3ad..ed1b00b0e 100644
--- a/bookwyrm/utils/validate.py
+++ b/bookwyrm/utils/validate.py
@@ -1,8 +1,10 @@
 """Validations"""
+from typing import Optional
+
 from bookwyrm.settings import DOMAIN, USE_HTTPS
 
 
-def validate_url_domain(url):
+def validate_url_domain(url: str) -> Optional[str]:
     """Basic check that the URL starts with the instance domain name"""
     if not url:
         return None
diff --git a/mypy.ini b/mypy.ini
index 39f6863fe..ed7ad018d 100644
--- a/mypy.ini
+++ b/mypy.ini
@@ -10,6 +10,10 @@ django_settings_module = "bookwyrm.settings"
 ignore_errors = True
 implicit_reexport = True
 
+[mypy-bookwyrm.utils.*]
+ignore_errors = False
+disallow_untyped_calls = False
+
 [mypy-celerywyrm.*]
 ignore_errors = False
 

From ff8e4597e5192f197c15b02500d6d1b22afe25cb Mon Sep 17 00:00:00 2001
From: Joeri de Ruiter <jderuiter@noreply.github.com>
Date: Sun, 23 Jul 2023 20:50:44 +0200
Subject: [PATCH 2/8] Type annotations for utils

---
 bookwyrm/models/author.py  |   4 +-
 bookwyrm/utils/cache.py    |   9 ++-
 bookwyrm/utils/isni.py     | 116 +++++++++++++++++++++++++------------
 bookwyrm/utils/log.py      |   2 +-
 bookwyrm/utils/validate.py |   4 +-
 mypy.ini                   |   4 ++
 6 files changed, 98 insertions(+), 41 deletions(-)

diff --git a/bookwyrm/models/author.py b/bookwyrm/models/author.py
index 5c0c087b2..981e3c0cc 100644
--- a/bookwyrm/models/author.py
+++ b/bookwyrm/models/author.py
@@ -1,5 +1,7 @@
 """ database schema for info about authors """
 import re
+from typing import Tuple, Any
+
 from django.contrib.postgres.indexes import GinIndex
 from django.db import models
 
@@ -38,7 +40,7 @@ class Author(BookDataModel):
     )
     bio = fields.HtmlField(null=True, blank=True)
 
-    def save(self, *args, **kwargs):
+    def save(self, *args: Tuple[Any, ...], **kwargs: dict[str, Any]) -> None:
         """normalize isni format"""
         if self.isni:
             self.isni = re.sub(r"\s", "", self.isni)
diff --git a/bookwyrm/utils/cache.py b/bookwyrm/utils/cache.py
index aebb8e754..5e896e621 100644
--- a/bookwyrm/utils/cache.py
+++ b/bookwyrm/utils/cache.py
@@ -1,8 +1,15 @@
 """ Custom handler for caching """
+from typing import Any, Callable, Tuple, Union
+
 from django.core.cache import cache
 
 
-def get_or_set(cache_key, function, *args, timeout=None):
+def get_or_set(
+    cache_key: str,
+    function: Callable[..., Any],
+    *args: Tuple[Any, ...],
+    timeout: Union[float, None] = None
+) -> Any:
     """Django's built-in get_or_set isn't cutting it"""
     value = cache.get(cache_key)
     if value is None:
diff --git a/bookwyrm/utils/isni.py b/bookwyrm/utils/isni.py
index 318de30ef..6c4200660 100644
--- a/bookwyrm/utils/isni.py
+++ b/bookwyrm/utils/isni.py
@@ -1,15 +1,24 @@
 """ISNI author checking utilities"""
 import xml.etree.ElementTree as ET
+from typing import Union, Optional
+
 import requests
 
 from bookwyrm import activitypub, models
 
 
-def request_isni_data(search_index, search_term, max_records=5):
+def get_element_text(element: Optional[ET.Element]) -> str:
+    """If the element is not None and there is a text attribute return this"""
+    if element is not None and element.text is not None:
+        return element.text
+    return ""
+
+
+def request_isni_data(search_index: str, search_term: str, max_records: int = 5) -> str:
     """Request data from the ISNI API"""
 
     search_string = f'{search_index}="{search_term}"'
-    query_params = {
+    query_params: dict[str, Union[str, int]] = {
         "query": search_string,
         "version": "1.1",
         "operation": "searchRetrieve",
@@ -26,41 +35,52 @@ def request_isni_data(search_index, search_term, max_records=5):
     return result.text
 
 
-def make_name_string(element):
+def make_name_string(element: ET.Element) -> str:
     """create a string of form 'personal_name surname'"""
 
     # NOTE: this will often be incorrect, many naming systems
     # list "surname" before personal name
     forename = element.find(".//forename")
     surname = element.find(".//surname")
-    if forename is not None:
-        return "".join([forename.text, " ", surname.text])
-    return surname.text
+
+    forename_text = get_element_text(forename)
+    surname_text = get_element_text(surname)
+
+    return "".join(
+        [forename_text, " " if forename_text and surname_text else "", surname_text]
+    )
 
 
-def get_other_identifier(element, code):
+def get_other_identifier(element: ET.Element, code: str) -> str:
     """Get other identifiers associated with an author from their ISNI record"""
 
     identifiers = element.findall(".//otherIdentifierOfIdentity")
     for section_head in identifiers:
         if (
-            section_head.find(".//type") is not None
-            and section_head.find(".//type").text == code
-            and section_head.find(".//identifier") is not None
+            (section_type := section_head.find(".//type")) is not None
+            and section_type.text is not None
+            and section_type.text == code
+            and (identifier := section_head.find(".//identifier")) is not None
+            and identifier.text is not None
         ):
-            return section_head.find(".//identifier").text
+            return identifier.text
 
     # if we can't find it in otherIdentifierOfIdentity,
     # try sources
     for source in element.findall(".//sources"):
-        code_of_source = source.find(".//codeOfSource")
-        if code_of_source is not None and code_of_source.text.lower() == code.lower():
-            return source.find(".//sourceIdentifier").text
+        if (
+            (code_of_source := source.find(".//codeOfSource")) is not None
+            and code_of_source.text is not None
+            and code_of_source.text.lower() == code.lower()
+            and (source_identifier := source.find(".//sourceIdentifier")) is not None
+            and source_identifier.text is not None
+        ):
+            return source_identifier.text
 
     return ""
 
 
-def get_external_information_uri(element, match_string):
+def get_external_information_uri(element: ET.Element, match_string: str) -> str:
     """Get URLs associated with an author from their ISNI record"""
 
     sources = element.findall(".//externalInformation")
@@ -69,14 +89,18 @@ def get_external_information_uri(element, match_string):
         uri = source.find(".//URI")
         if (
             uri is not None
+            and uri.text is not None
             and information is not None
+            and information.text is not None
             and information.text.lower() == match_string.lower()
         ):
             return uri.text
     return ""
 
 
-def find_authors_by_name(name_string, description=False):
+def find_authors_by_name(
+    name_string: str, description: bool = False
+) -> list[activitypub.Author]:
     """Query the ISNI database for possible author matches by name"""
 
     payload = request_isni_data("pica.na", name_string)
@@ -92,7 +116,11 @@ def find_authors_by_name(name_string, description=False):
         if not personal_name:
             continue
 
-        author = get_author_from_isni(element.find(".//isniUnformatted").text)
+        author = get_author_from_isni(
+            get_element_text(element.find(".//isniUnformatted"))
+        )
+        if author is None:
+            continue
 
         if bool(description):
 
@@ -111,22 +139,23 @@ def find_authors_by_name(name_string, description=False):
                 # some of the "titles" in ISNI are a little ...iffy
                 # @ is used by ISNI/OCLC to index the starting point ignoring stop words
                 # (e.g. "The @Government of no one")
-                title_elements = [
-                    e
-                    for e in titles
-                    if hasattr(e, "text") and not e.text.replace("@", "").isnumeric()
-                ]
-                if len(title_elements):
-                    author.bio = title_elements[0].text.replace("@", "")
-                else:
-                    author.bio = None
+                author.bio = ""
+                for title in titles:
+                    if (
+                        title is not None
+                        and hasattr(title, "text")
+                        and title.text is not None
+                        and not title.text.replace("@", "").isnumeric()
+                    ):
+                        author.bio = title.text.replace("@", "")
+                        break
 
         possible_authors.append(author)
 
     return possible_authors
 
 
-def get_author_from_isni(isni):
+def get_author_from_isni(isni: str) -> Optional[activitypub.Author]:
     """Find data to populate a new author record from their ISNI"""
 
     payload = request_isni_data("pica.isn", isni)
@@ -135,25 +164,32 @@ def get_author_from_isni(isni):
     # there should only be a single responseRecord
     # but let's use the first one just in case
     element = root.find(".//responseRecord")
-    name = make_name_string(element.find(".//forename/.."))
+    if element is None:
+        # TODO What if there is no responseRecord?
+        #  return empty Author or None, or raise Exception?
+        return None
+
+    name = (
+        make_name_string(forename)
+        if (forename := element.find(".//forename/..")) is not None
+        else ""
+    )
     viaf = get_other_identifier(element, "viaf")
     # use a set to dedupe aliases in ISNI
     aliases = set()
     aliases_element = element.findall(".//personalNameVariant")
     for entry in aliases_element:
         aliases.add(make_name_string(entry))
-    # aliases needs to be list not set
-    aliases = list(aliases)
-    bio = element.find(".//nameTitle")
-    bio = bio.text if bio is not None else ""
+    bio = get_element_text(element.find(".//nameTitle"))
     wikipedia = get_external_information_uri(element, "Wikipedia")
 
     author = activitypub.Author(
-        id=element.find(".//isniURI").text,
+        id=get_element_text(element.find(".//isniURI")),
         name=name,
         isni=isni,
         viafId=viaf,
-        aliases=aliases,
+        # aliases needs to be list not set
+        aliases=list(aliases),
         bio=bio,
         wikipediaLink=wikipedia,
     )
@@ -161,21 +197,27 @@ def get_author_from_isni(isni):
     return author
 
 
-def build_author_from_isni(match_value):
+def build_author_from_isni(match_value: str) -> dict[str, activitypub.Author]:
     """Build basic author class object from ISNI URL"""
 
     # if it is an isni value get the data
     if match_value.startswith("https://isni.org/isni/"):
         isni = match_value.replace("https://isni.org/isni/", "")
-        return {"author": get_author_from_isni(isni)}
+        author = get_author_from_isni(isni)
+        if author is not None:
+            return {"author": author}
     # otherwise it's a name string
     return {}
 
 
-def augment_author_metadata(author, isni):
+def augment_author_metadata(author: models.Author, isni: str) -> None:
     """Update any missing author fields from ISNI data"""
 
     isni_author = get_author_from_isni(isni)
+    if isni_author is None:
+        # TODO Should we just return or raise an exception to indicate a problem?
+        return
+
     isni_author.to_model(model=models.Author, instance=author, overwrite=False)
 
     # we DO want to overwrite aliases because we're adding them to the
diff --git a/bookwyrm/utils/log.py b/bookwyrm/utils/log.py
index 70f32ef03..7a4a2f898 100644
--- a/bookwyrm/utils/log.py
+++ b/bookwyrm/utils/log.py
@@ -10,7 +10,7 @@ class IgnoreVariableDoesNotExist(logging.Filter):
     these errors are not useful to us.
     """
 
-    def filter(self, record):
+    def filter(self, record: logging.LogRecord) -> bool:
         if record.exc_info:
             (_, err_value, _) = record.exc_info
             while err_value:
diff --git a/bookwyrm/utils/validate.py b/bookwyrm/utils/validate.py
index b91add3ad..ed1b00b0e 100644
--- a/bookwyrm/utils/validate.py
+++ b/bookwyrm/utils/validate.py
@@ -1,8 +1,10 @@
 """Validations"""
+from typing import Optional
+
 from bookwyrm.settings import DOMAIN, USE_HTTPS
 
 
-def validate_url_domain(url):
+def validate_url_domain(url: str) -> Optional[str]:
     """Basic check that the URL starts with the instance domain name"""
     if not url:
         return None
diff --git a/mypy.ini b/mypy.ini
index 2a29e314f..f938cc7b6 100644
--- a/mypy.ini
+++ b/mypy.ini
@@ -13,6 +13,10 @@ implicit_reexport = True
 [mypy-bookwyrm.connectors.*]
 ignore_errors = False
 
+[mypy-bookwyrm.utils.*]
+ignore_errors = False
+disallow_untyped_calls = False
+
 [mypy-celerywyrm.*]
 ignore_errors = False
 

From 767cd146399fb40086eb2cd93bc2f7aa8512610b Mon Sep 17 00:00:00 2001
From: Joeri de Ruiter <jderuiter@users.noreply.github.com>
Date: Mon, 21 Aug 2023 13:10:12 +0200
Subject: [PATCH 3/8] Stricter checks for bookwyrm.utils

---
 mypy.ini | 1 -
 1 file changed, 1 deletion(-)

diff --git a/mypy.ini b/mypy.ini
index f938cc7b6..8eee0ba62 100644
--- a/mypy.ini
+++ b/mypy.ini
@@ -15,7 +15,6 @@ ignore_errors = False
 
 [mypy-bookwyrm.utils.*]
 ignore_errors = False
-disallow_untyped_calls = False
 
 [mypy-celerywyrm.*]
 ignore_errors = False

From 0f2c0c034db515cb8201d09143fb264797e6d6e7 Mon Sep 17 00:00:00 2001
From: Joeri de Ruiter <jderuiter@users.noreply.github.com>
Date: Mon, 21 Aug 2023 13:28:08 +0200
Subject: [PATCH 4/8] Removed TODOs. When data is invalid return None.

---
 bookwyrm/utils/isni.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/bookwyrm/utils/isni.py b/bookwyrm/utils/isni.py
index 6c4200660..e3b2c65f3 100644
--- a/bookwyrm/utils/isni.py
+++ b/bookwyrm/utils/isni.py
@@ -165,8 +165,6 @@ def get_author_from_isni(isni: str) -> Optional[activitypub.Author]:
     # but let's use the first one just in case
     element = root.find(".//responseRecord")
     if element is None:
-        # TODO What if there is no responseRecord?
-        #  return empty Author or None, or raise Exception?
         return None
 
     name = (
@@ -215,8 +213,7 @@ def augment_author_metadata(author: models.Author, isni: str) -> None:
 
     isni_author = get_author_from_isni(isni)
     if isni_author is None:
-        # TODO Should we just return or raise an exception to indicate a problem?
-        return
+        return None
 
     isni_author.to_model(model=models.Author, instance=author, overwrite=False)
 

From 2e88e73509f6b226e564697e2203981542603689 Mon Sep 17 00:00:00 2001
From: Joeri de Ruiter <jderuiter@users.noreply.github.com>
Date: Mon, 21 Aug 2023 14:00:09 +0200
Subject: [PATCH 5/8] Remove returned None to make pylint happy

---
 bookwyrm/utils/isni.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bookwyrm/utils/isni.py b/bookwyrm/utils/isni.py
index e3b2c65f3..0d0a86887 100644
--- a/bookwyrm/utils/isni.py
+++ b/bookwyrm/utils/isni.py
@@ -213,7 +213,7 @@ def augment_author_metadata(author: models.Author, isni: str) -> None:
 
     isni_author = get_author_from_isni(isni)
     if isni_author is None:
-        return None
+        return
 
     isni_author.to_model(model=models.Author, instance=author, overwrite=False)
 

From a5ede835b205e7c5ef920c2fb8ae18e5c7d91d11 Mon Sep 17 00:00:00 2001
From: Joeri de Ruiter <jderuiter@users.noreply.github.com>
Date: Wed, 13 Sep 2023 09:09:43 +0200
Subject: [PATCH 6/8] Dump dependencies related to typing

---
 requirements.txt | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

diff --git a/requirements.txt b/requirements.txt
index e8328b170..87b29fbd6 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -43,13 +43,14 @@ pytest-env==0.6.2
 pytest-xdist==2.3.0
 pytidylib==0.3.2
 pylint==2.14.0
-mypy==1.4.1
+mypy==1.5.1
 celery-types==0.18.0
-django-stubs[compatible-mypy]==4.2.3
-types-bleach==6.0.0.3
+django-stubs[compatible-mypy]==4.2.4
+types-bleach==6.0.0.4
 types-dataclasses==0.6.6
-types-Markdown==3.4.2.9
-types-Pillow==10.0.0.1
-types-psycopg2==2.9.21.10
-types-python-dateutil==2.8.19.13
-types-requests==2.31.0.1
+types-Markdown==3.4.2.10
+types-Pillow==10.0.0.3
+types-psycopg2==2.9.21.11
+types-python-dateutil==2.8.19.14
+types-requests==2.31.0.2
+types-requests==2.31.0.2

From a5cf912ae89e71af9cbb8e1d3257c6fc131ef9f1 Mon Sep 17 00:00:00 2001
From: Joeri de Ruiter <jderuiter@users.noreply.github.com>
Date: Wed, 13 Sep 2023 09:22:53 +0200
Subject: [PATCH 7/8] Fix some annotations

---
 bookwyrm/activitypub/base_activity.py | 5 ++++-
 bookwyrm/utils/cache.py               | 6 +++---
 2 files changed, 7 insertions(+), 4 deletions(-)

diff --git a/bookwyrm/activitypub/base_activity.py b/bookwyrm/activitypub/base_activity.py
index f7f4b216c..05e7d8a05 100644
--- a/bookwyrm/activitypub/base_activity.py
+++ b/bookwyrm/activitypub/base_activity.py
@@ -1,4 +1,5 @@
 """ basics for an activitypub serializer """
+from __future__ import annotations
 from dataclasses import dataclass, fields, MISSING
 from json import JSONEncoder
 import logging
@@ -72,7 +73,9 @@ class ActivityObject:
 
     def __init__(
         self,
-        activity_objects: Optional[list[str, base_model.BookWyrmModel]] = None,
+        activity_objects: Optional[
+            dict[str, Union[str, list[str], ActivityObject, base_model.BookWyrmModel]]
+        ] = None,
         **kwargs: Any,
     ):
         """this lets you pass in an object with fields that aren't in the
diff --git a/bookwyrm/utils/cache.py b/bookwyrm/utils/cache.py
index 5e896e621..c8262ef59 100644
--- a/bookwyrm/utils/cache.py
+++ b/bookwyrm/utils/cache.py
@@ -6,12 +6,12 @@ from django.core.cache import cache
 
 def get_or_set(
     cache_key: str,
-    function: Callable[..., Any],
+    function: Callable[..., str],
     *args: Tuple[Any, ...],
     timeout: Union[float, None] = None
-) -> Any:
+) -> str:
     """Django's built-in get_or_set isn't cutting it"""
-    value = cache.get(cache_key)
+    value = str(cache.get(cache_key))
     if value is None:
         value = function(*args)
         cache.set(cache_key, value, timeout=timeout)

From af5f71f5acdb2a8537f86220e97500b4ae568108 Mon Sep 17 00:00:00 2001
From: Joeri de Ruiter <jderuiter@users.noreply.github.com>
Date: Wed, 13 Sep 2023 10:21:30 +0200
Subject: [PATCH 8/8] Revert return type for get_or_set

---
 bookwyrm/utils/cache.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/bookwyrm/utils/cache.py b/bookwyrm/utils/cache.py
index c8262ef59..5e896e621 100644
--- a/bookwyrm/utils/cache.py
+++ b/bookwyrm/utils/cache.py
@@ -6,12 +6,12 @@ from django.core.cache import cache
 
 def get_or_set(
     cache_key: str,
-    function: Callable[..., str],
+    function: Callable[..., Any],
     *args: Tuple[Any, ...],
     timeout: Union[float, None] = None
-) -> str:
+) -> Any:
     """Django's built-in get_or_set isn't cutting it"""
-    value = str(cache.get(cache_key))
+    value = cache.get(cache_key)
     if value is None:
         value = function(*args)
         cache.set(cache_key, value, timeout=timeout)