Skip to content

Commit

Permalink
Make LazyRoleSet faster by reducing greedy lookups (#422)
Browse files Browse the repository at this point in the history
  • Loading branch information
jace authored Nov 3, 2023
1 parent 5a67126 commit 6395747
Show file tree
Hide file tree
Showing 2 changed files with 88 additions and 64 deletions.
133 changes: 75 additions & 58 deletions src/coaster/sqlalchemy/roles.py
Original file line number Diff line number Diff line change
Expand Up @@ -276,31 +276,38 @@ def _roles_via_relationship(
actor: t.Any,
relationship: t.Any,
actor_attr: t.Optional[ActorAttrType],
roles: t.Union[t.Set[str], LazyRoleSet],
wanted_roles: t.Set[str],
offer_map: t.Optional[RoleOfferMap],
) -> t.Union[t.Set[str], LazyRoleSet]:
) -> t.Set[str]:
"""Find roles granted via a relationship."""
relobj = None # Role-granting object found via the relationship

# There is no actor_attr. Check if the relationship is a RoleMixin and call
# roles_for to get offered roles, then remap using the offer map.
# If there is no actor_attr, check if the relationship is a RoleMixin and call
# roles_for to get offered roles, then remap using the offer map, subsetting the
# offer map to the wanted roles. The offer map may be larger than currently wanted,
# and lookups in the offered roles could be expensive.
if actor_attr is None:
if isinstance(relationship, RoleMixin):
offered_roles: t.Union[t.Set[str], LazyRoleSet]
offered_roles = relationship.roles_for(actor)
if offer_map is not None:
offered_roles = set(
offer_map_subset = {
original_role
for original_role, remapped_roles in offer_map.items()
if remapped_roles & wanted_roles
}
return set(
chain.from_iterable(
offer_map[role] for role in offered_roles if role in offer_map
offer_map[role] for role in offered_roles & offer_map_subset
)
)
return offered_roles
return offered_roles & wanted_roles
raise TypeError(
f"{relationship!r} is not a RoleMixin and no actor attribute was specified"
)

# We have a relationship. If it's a collection, find the item in it that relates
# to the actor.
# We have a relationship and an actor attribute on the relationship. If the
# relationship is a collection, find the item in it that relates to the actor.

# TODO: Support WriteOnlyCollection
if isinstance(relationship, QueryBase):
Expand Down Expand Up @@ -333,25 +340,30 @@ def _roles_via_relationship(

# We have a related object. Get roles from it
if isinstance(relobj, RoleGrantABC):
# If this object grants roles, get them. It may not grant the one we're looking
# for and that's okay. Grab the others
# If this object grants roles, get them
offered_roles = relobj.offered_roles
# But if we have an offer_map, remap the roles and only keep the ones
# specified in the map
if offer_map:
offered_roles = set(
# If we have an offer_map, remap the roles and only keep the ones
# specified in the map
offer_map_subset = {
original_role
for original_role, remapped_roles in offer_map.items()
if remapped_roles & wanted_roles
}
return set(
chain.from_iterable(
offer_map[role] for role in offered_roles if role in offer_map
offer_map[role] for role in offered_roles & offer_map_subset
)
)
return offered_roles
# Without an offer map, return the subset of offered roles and wanted roles
return offered_roles & wanted_roles
# Not a role granting object. Implies that the default roles are granted
# by its very existence.
return roles
return wanted_roles


class RoleGrantABC(metaclass=ABCMeta):
"""Base class for an object that grants roles to an actor."""
"""Base class for an object that grants roles to a subject."""

@property
@abstractmethod
Expand All @@ -377,7 +389,6 @@ class LazyRoleSet(abc.MutableSet):
'actor',
'_present',
'_not_present',
'_scanned_granted_via',
'_scanned_granted_by',
)

Expand All @@ -391,10 +402,6 @@ def __init__(
#: Roles the actor does not have
self._not_present: t.Set[str] = set()
# Relationships that have been scanned already
# Contains (relattr, actor_attr)
self._scanned_granted_via: t.Set[
t.Tuple[str, t.Optional[ActorAttrType]]
] = set()
self._scanned_granted_by: t.Set[str] = set() # Contains relattr

def __repr__(self) -> str: # pragma: no cover
Expand All @@ -419,10 +426,10 @@ def _role_is_present(self, role: str) -> bool:
self._not_present.add(role)
return False

# granted_via says a role may be granted by a secondary object that sits
# `granted_via` says a role may be granted by a secondary object that sits
# in a relationship between the current object and the actor. The secondary
# could be a direct attribute of the current object, or could be inside a
# list or query relationship. _roles_via_relationship will check.
# list or query relationship. `_roles_via_relationship` will check.
# The related object may grant roles in one of three ways:
# 1. By its mere existence (default).
# 2. By offering roles via an `offered_roles` property (see `RoleGrantABC`).
Expand All @@ -433,18 +440,21 @@ def _role_is_present(self, role: str) -> bool:
self.obj.__roles__[role].get('granted_via', {}).items()
):
offer_map = self.obj.__relationship_role_offer_map__.get(relattr)
if (relattr, actor_attr) not in self._scanned_granted_via:
relationship = self.obj._get_relationship(relattr)
if relationship is not None:
# Optimization: does the same relationship grant other roles
# via the same actor_attr? Gather those roles and check all
# of them together. However, we will use a single role
# offer map and not consult the one specified on the other
# roles. They are expected to be identical. This is
# guaranteed if the offer map was specified using
# `with_roles(grants_via=)` but not if specified directly
# in `__roles__[role]['granted_via']`.
possible_roles = {role}
relationship = self.obj._get_relationship(relattr)
if relationship is not None:
possibly_granted_roles = {role}
# Optimization: does the same relationship grant other roles via
# the same non-None `actor_attr`? Gather those roles and check
# all of them together. However, we will use a single role offer
# map and not consult the one specified on the other roles. They
# are expected to be identical. This is guaranteed if the offer
# map was specified using `with_roles(grants_via=)` but not if
# specified directly in `__roles__[role]['granted_via']`. If
# `actor_attr` is None, the relationship must be a `RoleMixin`
# instance that implements `roles_for` and returns a
# `LazyRoleSet` that does expensive lookups. That's no longer an
# optimization and the greedy grab should not be attempted.
if actor_attr is not None:
for arole, actions in self.obj.__roles__.items():
if (
arole != role
Expand All @@ -454,19 +464,18 @@ def _role_is_present(self, role: str) -> bool:
actions['granted_via'][relattr], actor_attr
)
):
possible_roles.add(arole)

granted_roles = _roles_via_relationship(
self.actor,
relationship,
actor_attr,
possible_roles,
offer_map,
)
self._present.update(granted_roles)
self._scanned_granted_via.add((relattr, actor_attr))
if role in granted_roles:
return True
possibly_granted_roles.add(arole)

granted_roles = _roles_via_relationship(
self.actor,
relationship,
actor_attr,
possibly_granted_roles,
offer_map,
)
self._present.update(granted_roles)
if role in granted_roles:
return True
# granted_by says a role is granted by the actor being present in a
# relationship
for relattr in self.obj.__roles__[role].get('granted_by', ()):
Expand All @@ -491,10 +500,12 @@ def _role_is_present(self, role: str) -> bool:

def _contents(self) -> t.Set[str]:
"""Return all available roles."""
# Populate cache
[ # pylint: disable=expression-not-assigned
self._role_is_present(role) for role in self.obj.__roles__
]
# Populate cache (TODO: cache this step to avoid repeat checks)
for role in self.obj.__roles__:
self._role_is_present(role)
# self._present may have roles that are not specified in self.obj.__roles__,
# notably implicit roles like `all` and `auth`. Therefore we must return the
# cache instead of capturing available roles in the loop above
return self._present

def __contains__(self, key: t.Any) -> bool:
Expand All @@ -508,8 +519,10 @@ def __len__(self) -> int:

def __bool__(self) -> bool:
# Make bool() faster than len() by using the cache first
return bool(self._present) or any(
self._role_is_present(role) for role in self.obj.__roles__
return (
True
if bool(self._present)
else any(self._role_is_present(role) for role in self.obj.__roles__)
)

def __eq__(self, other: t.Any) -> bool:
Expand All @@ -520,6 +533,10 @@ def __eq__(self, other: t.Any) -> bool:
def __ne__(self, other: t.Any) -> bool:
return not self.__eq__(other)

def __and__(self, other: t.Iterable[str]) -> t.Set[str]:
"""Faster implementation that avoids lazy lookups where not needed."""
return {role for role in other if self._role_is_present(role)}

def add(self, value: str) -> None:
"""Add role `value` to the set."""
self._present.add(value)
Expand Down Expand Up @@ -561,7 +578,7 @@ def copy(self) -> LazyRoleSet:
issubset = nary_op(abc.MutableSet.__le__)
issuperset = nary_op(abc.MutableSet.__ge__)
union = nary_op(abc.MutableSet.__or__)
intersection = nary_op(abc.MutableSet.__and__)
intersection = nary_op(__and__)
difference = nary_op(abc.MutableSet.__sub__)
symmetric_difference = nary_op(abc.MutableSet.__xor__)
update = nary_op(abc.MutableSet.__ior__)
Expand Down Expand Up @@ -610,7 +627,7 @@ def __repr__(self) -> str:
return f'DynamicAssociationProxy({self.rel!r}, {self.attr!r})'

@overload
def __get__(self, obj: None, cls: t.Type[_T]) -> te.Self:
def __get__(self, obj: None, cls: t.Type) -> te.Self:
...

@overload
Expand Down
19 changes: 13 additions & 6 deletions tests/coaster_tests/sqlalchemy_roles_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -244,6 +244,9 @@ class RoleGrantMany(BaseMixin, Model):
'secondary_role': {'granted_by': ['secondary_users']},
}

primary_users: DynamicMapped[RoleUser] = relationship(
lazy='dynamic', back_populates='doc'
)
secondary_users: Mapped[t.List[RoleUser]] = relationship(
secondary=granted_users, back_populates='secondary_docs'
)
Expand All @@ -258,9 +261,7 @@ class RoleUser(BaseMixin, Model):
sa.ForeignKey('role_grant_many.id')
)
doc: Mapped[t.Optional[RoleGrantMany]] = relationship(
RoleGrantMany,
foreign_keys=[doc_id],
backref=sa.orm.backref('primary_users', lazy='dynamic'),
foreign_keys=[doc_id], back_populates='primary_users'
)
secondary_docs: Mapped[t.List[RoleGrantMany]] = relationship(
RoleGrantMany, secondary=granted_users, back_populates='secondary_users'
Expand Down Expand Up @@ -1069,7 +1070,9 @@ def test_granted_via(self) -> None:

# From m2, roles2 has role1, role2 but not role3
assert 'role2' in roles2 # Granted in m2 via rel_lazy (only)
assert 'role1' in roles2._present # Granted in m2, auto discovered
assert 'role1' not in roles2._present # Granted in m2 separately
assert 'role1' in roles2
assert 'role1' in roles2._present # Cached after explicit lookup
assert 'role3' not in roles2._present # Not granted in m2, not discovered
assert 'role3' not in roles2._not_present # Not rejected either

Expand All @@ -1087,15 +1090,19 @@ def test_granted_via(self) -> None:
assert 'role3' not in roles4a._present
# role1 = False, role2 = True, role3 = True
assert 'role2' in roles4a # Discovered via rel_lazy
assert 'role3' in roles4a._present # This got cached despite not being rel_lazy
assert 'role3' not in roles4a._present # Not in rel_lazy, so not auto cached
assert 'role3' in roles4a
assert 'role3' in roles4a._present

roles4b = document.roles_for(u4)
# No roles cached yet
assert 'role2' not in roles4b._present
assert 'role3' not in roles4b._present
# role1 = False, role2 = True, role3 = True
assert 'role3' in roles4b # Discovered via rel_list
assert 'role2' in roles4b._present # This got cached despite not being rel_list
assert 'role2' not in roles4b._present # Not via rel_list, not auto-discovered
assert 'role2' in roles4b
assert 'role2' in roles4b._present

# The child model inherits remapped roles from document
# role1 is skipped even if present, while role2 and role3 are remapped
Expand Down

0 comments on commit 6395747

Please sign in to comment.