Source code for julee.domain.repositories.base
"""
Generic base repository protocol for common CRUD operations.
This module defines a generic BaseRepository protocol that captures the common
patterns shared across all domain repositories in the Capture, Extract,
Assemble, Publish workflow. This reduces code duplication while maintaining
type safety and clean interfaces.
All repository operations follow the same principles:
- **Idempotency**: All methods are designed to be idempotent and safe for
retry. Multiple calls with the same parameters will produce the same
result without unintended side effects.
- **Workflow Safety**: All operations are safe to call from deterministic
workflow contexts. Non-deterministic operations (like ID generation) are
explicitly delegated to activities.
- **Domain Objects**: Methods accept and return domain objects or primitives,
never framework-specific types.
In Temporal workflow contexts, these protocols are implemented by workflow
stubs that delegate to activities for durability and proper error handling.
"""
from typing import Protocol, Optional, runtime_checkable, TypeVar, List, Dict
from pydantic import BaseModel
# Type variable bound to Pydantic BaseModel for domain entities
[docs]
T = TypeVar("T", bound=BaseModel)
@runtime_checkable
[docs]
class BaseRepository(Protocol[T]):
"""Generic base repository protocol for common CRUD operations.
This protocol defines the common interface shared by all domain
repositories in the system. It uses generics to provide type safety
while eliminating code duplication.
Type Parameter:
T: The domain entity type (must extend Pydantic BaseModel)
"""
[docs]
async def get(self, entity_id: str) -> Optional[T]:
"""Retrieve an entity by ID.
Args:
entity_id: Unique entity identifier
Returns:
Entity if found, None otherwise
.. rubric:: Implementation Notes
- Must be idempotent: multiple calls return same result
- Should handle missing entities gracefully (return None)
- Loads complete entity with all relationships
"""
...
[docs]
async def get_many(self, entity_ids: List[str]) -> Dict[str, Optional[T]]:
"""Retrieve multiple entities by ID.
Args:
entity_ids: List of unique entity identifiers
Returns:
Dict mapping entity_id to entity (or None if not found)
.. rubric:: Implementation Notes
- Must be idempotent: multiple calls return same result
- Should handle missing entities gracefully (return None for missing)
- Implementations may optimize with batch operations or fall back
to individual get() calls
- Keys in returned dict correspond exactly to input entity_ids
- Missing entities have None values in the returned dict
.. rubric:: Workflow Context
In Temporal workflows, this method is implemented as an activity
to ensure batch operations are durably stored and consistent
across workflow replays.
"""
...
[docs]
async def save(self, entity: T) -> None:
"""Save an entity.
Args:
entity: Complete entity to save
.. rubric:: Implementation Notes
- Must be idempotent: saving same entity state is safe
- Should update the updated_at timestamp
- Must save complete entity with all relationships
- Handles both new entities and updates to existing ones
"""
...
[docs]
async def list_all(self) -> List[T]:
"""List all entities.
Returns:
List of all entities in the repository
.. rubric:: Implementation Notes
- Must be idempotent: multiple calls return same result
- Returns empty list if no entities exist
- Should return entities in a consistent order (e.g., by ID)
- For large datasets, consider pagination at the use case level
.. rubric:: Workflow Context
In Temporal workflows, this method is implemented as an activity
to ensure the list operation is durably stored and consistent
across workflow replays.
.. rubric:: Default Implementation
Base protocol provides a default that returns empty list.
Repository implementations should override this method as needed.
.. note::
This default implementation returns empty list to avoid
breaking existing repositories. Specific repositories should
implement proper list_all() functionality as needed.
"""
return []
[docs]
async def generate_id(self) -> str:
"""Generate a unique entity identifier.
This operation is non-deterministic and must be called from
workflow activities, not directly from workflow code.
Returns:
Unique entity ID string
.. rubric:: Implementation Notes
- Must generate globally unique identifiers
- May use UUIDs, database sequences, or distributed ID generators
- Should be fast and reliable
- Failure here should be rare but handled gracefully
.. rubric:: Workflow Context
In Temporal workflows, this method is implemented as an activity
to ensure the generated ID is durably stored and consistent
across workflow replays.
"""
...