feat(memory): #87 project setup & core architecture

Implements Sub-Issue #87 of Issue #62 (Agent Memory System).

Core infrastructure:
- memory/types.py: Type definitions for all memory types (Working, Episodic,
  Semantic, Procedural) with enums for MemoryType, ScopeLevel, Outcome
- memory/config.py: MemorySettings with MEM_ env prefix, thread-safe singleton
- memory/exceptions.py: Comprehensive exception hierarchy for memory operations
- memory/manager.py: MemoryManager facade with placeholder methods

Directory structure:
- working/: Working memory (Redis/in-memory) - to be implemented in #89
- episodic/: Episodic memory (experiences) - to be implemented in #90
- semantic/: Semantic memory (facts) - to be implemented in #91
- procedural/: Procedural memory (skills) - to be implemented in #92
- scoping/: Scope management - to be implemented in #93
- indexing/: Vector indexing - to be implemented in #94
- consolidation/: Memory consolidation - to be implemented in #95

Tests: 71 unit tests for config, types, and exceptions
Docs: implementation plan at docs/architecture/memory-system-plan.md

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
Commit 085a748929 (parent 4b149b8a52), 2026-01-05 01:27:36 +01:00
17 changed files with 3242 additions and 0 deletions


@@ -0,0 +1,136 @@
"""
Agent Memory System
Multi-tier cognitive memory for AI agents, providing:
- Working Memory: Session-scoped ephemeral state (Redis/In-memory)
- Episodic Memory: Experiential records of past tasks (PostgreSQL)
- Semantic Memory: Learned facts and knowledge (PostgreSQL + pgvector)
- Procedural Memory: Learned skills and procedures (PostgreSQL)
Usage:
from app.services.memory import (
MemoryManager,
MemorySettings,
get_memory_settings,
MemoryType,
ScopeLevel,
)
# Create a manager for a session
manager = MemoryManager.for_session(
session_id="sess-123",
project_id=uuid,
)
async with manager:
# Working memory
await manager.set_working("key", {"data": "value"})
value = await manager.get_working("key")
# Episodic memory
episode = await manager.record_episode(episode_data)
similar = await manager.search_episodes("query")
# Semantic memory
fact = await manager.store_fact(fact_data)
facts = await manager.search_facts("query")
# Procedural memory
procedure = await manager.record_procedure(procedure_data)
procedures = await manager.find_procedures("context")
"""
# Configuration
from .config import (
MemorySettings,
get_default_settings,
get_memory_settings,
reset_memory_settings,
)
# Exceptions
from .exceptions import (
CheckpointError,
EmbeddingError,
MemoryCapacityError,
MemoryConflictError,
MemoryConsolidationError,
MemoryError,
MemoryExpiredError,
MemoryNotFoundError,
MemoryRetrievalError,
MemoryScopeError,
MemorySerializationError,
MemoryStorageError,
)
# Manager
from .manager import MemoryManager
# Types
from .types import (
ConsolidationStatus,
ConsolidationType,
Episode,
EpisodeCreate,
Fact,
FactCreate,
MemoryItem,
MemoryStats,
MemoryStore,
MemoryType,
Outcome,
Procedure,
ProcedureCreate,
RetrievalResult,
ScopeContext,
ScopeLevel,
Step,
TaskState,
WorkingMemoryItem,
)
__all__ = [
"CheckpointError",
"ConsolidationStatus",
"ConsolidationType",
"EmbeddingError",
"Episode",
"EpisodeCreate",
"Fact",
"FactCreate",
"MemoryCapacityError",
"MemoryConflictError",
"MemoryConsolidationError",
# Exceptions
"MemoryError",
"MemoryExpiredError",
"MemoryItem",
# Manager
"MemoryManager",
"MemoryNotFoundError",
"MemoryRetrievalError",
"MemoryScopeError",
"MemorySerializationError",
# Configuration
"MemorySettings",
"MemoryStats",
"MemoryStorageError",
# Types - Abstract
"MemoryStore",
# Types - Enums
"MemoryType",
"Outcome",
"Procedure",
"ProcedureCreate",
"RetrievalResult",
# Types - Data Classes
"ScopeContext",
"ScopeLevel",
"Step",
"TaskState",
"WorkingMemoryItem",
"get_default_settings",
"get_memory_settings",
"reset_memory_settings",
]


@@ -0,0 +1,410 @@
"""
Memory System Configuration.
Provides Pydantic settings for the Agent Memory System,
including storage backends, capacity limits, and consolidation policies.
"""
import threading
from functools import lru_cache
from typing import Any
from pydantic import Field, field_validator, model_validator
from pydantic_settings import BaseSettings
class MemorySettings(BaseSettings):
"""
Configuration for the Agent Memory System.
All settings can be overridden via environment variables
with the MEM_ prefix.
"""
# Working Memory Settings
working_memory_backend: str = Field(
default="redis",
description="Backend for working memory: 'redis' or 'memory'",
)
working_memory_default_ttl_seconds: int = Field(
default=3600,
ge=60,
le=86400,
description="Default TTL for working memory items (1 hour default)",
)
working_memory_max_items_per_session: int = Field(
default=1000,
ge=100,
le=100000,
description="Maximum items per session in working memory",
)
working_memory_max_value_size_bytes: int = Field(
default=1048576, # 1MB
ge=1024,
le=104857600, # 100MB
description="Maximum size of a single value in working memory",
)
working_memory_checkpoint_enabled: bool = Field(
default=True,
description="Enable checkpointing for working memory recovery",
)
# Redis Settings (for working memory)
redis_url: str = Field(
default="redis://localhost:6379/0",
description="Redis connection URL",
)
redis_prefix: str = Field(
default="mem",
description="Redis key prefix for memory items",
)
redis_connection_timeout_seconds: int = Field(
default=5,
ge=1,
le=60,
description="Redis connection timeout",
)
# Episodic Memory Settings
episodic_max_episodes_per_project: int = Field(
default=10000,
ge=100,
le=1000000,
description="Maximum episodes to retain per project",
)
episodic_default_importance: float = Field(
default=0.5,
ge=0.0,
le=1.0,
description="Default importance score for new episodes",
)
episodic_retention_days: int = Field(
default=365,
ge=7,
le=3650,
description="Days to retain episodes before archival",
)
# Semantic Memory Settings
semantic_max_facts_per_project: int = Field(
default=50000,
ge=1000,
le=10000000,
description="Maximum facts to retain per project",
)
semantic_confidence_decay_days: int = Field(
default=90,
ge=7,
le=365,
description="Days until confidence decays by 50%",
)
semantic_min_confidence: float = Field(
default=0.1,
ge=0.0,
le=1.0,
description="Minimum confidence before fact is pruned",
)
# Procedural Memory Settings
procedural_max_procedures_per_project: int = Field(
default=1000,
ge=10,
le=100000,
description="Maximum procedures per project",
)
procedural_min_success_rate: float = Field(
default=0.3,
ge=0.0,
le=1.0,
description="Minimum success rate before procedure is pruned",
)
procedural_min_uses_before_suggest: int = Field(
default=3,
ge=1,
le=100,
description="Minimum uses before procedure is suggested",
)
# Embedding Settings
embedding_model: str = Field(
default="text-embedding-3-small",
description="Model to use for embeddings",
)
embedding_dimensions: int = Field(
default=1536,
ge=256,
le=4096,
description="Embedding vector dimensions",
)
embedding_batch_size: int = Field(
default=100,
ge=1,
le=1000,
description="Batch size for embedding generation",
)
embedding_cache_enabled: bool = Field(
default=True,
description="Enable caching of embeddings",
)
# Retrieval Settings
retrieval_default_limit: int = Field(
default=10,
ge=1,
le=100,
description="Default limit for retrieval queries",
)
retrieval_max_limit: int = Field(
default=100,
ge=10,
le=1000,
description="Maximum limit for retrieval queries",
)
retrieval_min_similarity: float = Field(
default=0.5,
ge=0.0,
le=1.0,
description="Minimum similarity score for retrieval",
)
# Consolidation Settings
consolidation_enabled: bool = Field(
default=True,
description="Enable automatic memory consolidation",
)
consolidation_batch_size: int = Field(
default=100,
ge=10,
le=1000,
description="Batch size for consolidation jobs",
)
consolidation_schedule_cron: str = Field(
default="0 3 * * *",
description="Cron expression for nightly consolidation (3 AM)",
)
consolidation_working_to_episodic_delay_minutes: int = Field(
default=30,
ge=5,
le=1440,
description="Minutes after session end before consolidating to episodic",
)
# Pruning Settings
pruning_enabled: bool = Field(
default=True,
description="Enable automatic memory pruning",
)
pruning_min_age_days: int = Field(
default=7,
ge=1,
le=365,
description="Minimum age before memory can be pruned",
)
pruning_importance_threshold: float = Field(
default=0.2,
ge=0.0,
le=1.0,
description="Importance threshold below which memory can be pruned",
)
# Caching Settings
cache_enabled: bool = Field(
default=True,
description="Enable caching for memory retrieval",
)
cache_ttl_seconds: int = Field(
default=300,
ge=10,
le=3600,
description="Cache TTL for retrieval results",
)
cache_max_items: int = Field(
default=10000,
ge=100,
le=1000000,
description="Maximum items in memory cache",
)
# Performance Settings
max_retrieval_time_ms: int = Field(
default=100,
ge=10,
le=5000,
description="Target maximum retrieval time in milliseconds",
)
parallel_retrieval: bool = Field(
default=True,
description="Enable parallel retrieval from multiple memory types",
)
max_parallel_retrievals: int = Field(
default=4,
ge=1,
le=10,
description="Maximum concurrent retrieval operations",
)
@field_validator("working_memory_backend")
@classmethod
def validate_backend(cls, v: str) -> str:
"""Validate working memory backend."""
valid_backends = {"redis", "memory"}
if v not in valid_backends:
raise ValueError(f"backend must be one of: {valid_backends}")
return v
@field_validator("embedding_model")
@classmethod
def validate_embedding_model(cls, v: str) -> str:
"""Validate embedding model name."""
valid_models = {
"text-embedding-3-small",
"text-embedding-3-large",
"text-embedding-ada-002",
}
if v not in valid_models:
raise ValueError(f"embedding_model must be one of: {valid_models}")
return v
@model_validator(mode="after")
def validate_limits(self) -> "MemorySettings":
"""Validate that limits are consistent."""
if self.retrieval_default_limit > self.retrieval_max_limit:
raise ValueError(
f"retrieval_default_limit ({self.retrieval_default_limit}) "
f"cannot exceed retrieval_max_limit ({self.retrieval_max_limit})"
)
return self
def get_working_memory_config(self) -> dict[str, Any]:
"""Get working memory configuration as a dictionary."""
return {
"backend": self.working_memory_backend,
"default_ttl_seconds": self.working_memory_default_ttl_seconds,
"max_items_per_session": self.working_memory_max_items_per_session,
"max_value_size_bytes": self.working_memory_max_value_size_bytes,
"checkpoint_enabled": self.working_memory_checkpoint_enabled,
}
def get_redis_config(self) -> dict[str, Any]:
"""Get Redis configuration as a dictionary."""
return {
"url": self.redis_url,
"prefix": self.redis_prefix,
"connection_timeout_seconds": self.redis_connection_timeout_seconds,
}
def get_embedding_config(self) -> dict[str, Any]:
"""Get embedding configuration as a dictionary."""
return {
"model": self.embedding_model,
"dimensions": self.embedding_dimensions,
"batch_size": self.embedding_batch_size,
"cache_enabled": self.embedding_cache_enabled,
}
def get_consolidation_config(self) -> dict[str, Any]:
"""Get consolidation configuration as a dictionary."""
return {
"enabled": self.consolidation_enabled,
"batch_size": self.consolidation_batch_size,
"schedule_cron": self.consolidation_schedule_cron,
"working_to_episodic_delay_minutes": (
self.consolidation_working_to_episodic_delay_minutes
),
}
def to_dict(self) -> dict[str, Any]:
"""Convert settings to dictionary for logging/debugging."""
return {
"working_memory": self.get_working_memory_config(),
"redis": self.get_redis_config(),
"episodic": {
"max_episodes_per_project": self.episodic_max_episodes_per_project,
"default_importance": self.episodic_default_importance,
"retention_days": self.episodic_retention_days,
},
"semantic": {
"max_facts_per_project": self.semantic_max_facts_per_project,
"confidence_decay_days": self.semantic_confidence_decay_days,
"min_confidence": self.semantic_min_confidence,
},
"procedural": {
"max_procedures_per_project": self.procedural_max_procedures_per_project,
"min_success_rate": self.procedural_min_success_rate,
"min_uses_before_suggest": self.procedural_min_uses_before_suggest,
},
"embedding": self.get_embedding_config(),
"retrieval": {
"default_limit": self.retrieval_default_limit,
"max_limit": self.retrieval_max_limit,
"min_similarity": self.retrieval_min_similarity,
},
"consolidation": self.get_consolidation_config(),
"pruning": {
"enabled": self.pruning_enabled,
"min_age_days": self.pruning_min_age_days,
"importance_threshold": self.pruning_importance_threshold,
},
"cache": {
"enabled": self.cache_enabled,
"ttl_seconds": self.cache_ttl_seconds,
"max_items": self.cache_max_items,
},
"performance": {
"max_retrieval_time_ms": self.max_retrieval_time_ms,
"parallel_retrieval": self.parallel_retrieval,
"max_parallel_retrievals": self.max_parallel_retrievals,
},
}
model_config = {
"env_prefix": "MEM_",
"env_file": ".env",
"env_file_encoding": "utf-8",
"case_sensitive": False,
"extra": "ignore",
}
# Thread-safe singleton pattern
_settings: MemorySettings | None = None
_settings_lock = threading.Lock()
def get_memory_settings() -> MemorySettings:
"""
Get the global MemorySettings instance.
Thread-safe with double-checked locking pattern.
Returns:
MemorySettings instance
"""
global _settings
if _settings is None:
with _settings_lock:
if _settings is None:
_settings = MemorySettings()
return _settings
def reset_memory_settings() -> None:
"""
Reset the global settings instance.
Primarily used for testing.
"""
global _settings
with _settings_lock:
_settings = None
@lru_cache(maxsize=1)
def get_default_settings() -> MemorySettings:
"""
Get default settings (cached).
Use this for read-only access to defaults.
For mutable access, use get_memory_settings().
"""
return MemorySettings()
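
For illustration, a minimal sketch of how the MEM_ prefix and the singleton interact, assuming standard pydantic-settings behavior (the variable values here are invented):

import os

from app.services.memory import get_memory_settings, reset_memory_settings

# Environment overrides use the MEM_ prefix and are case-insensitive.
os.environ["MEM_WORKING_MEMORY_BACKEND"] = "memory"
os.environ["MEM_RETRIEVAL_DEFAULT_LIMIT"] = "20"

reset_memory_settings()           # clear the cached singleton, as a test would
settings = get_memory_settings()  # re-reads the environment on construction
assert settings.working_memory_backend == "memory"
assert settings.retrieval_default_limit == 20

Note that get_default_settings() is cached separately via lru_cache, so it keeps returning the defaults it first built even after reset_memory_settings(); as its docstring says, use it only for read-only access.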


@@ -0,0 +1,10 @@
"""
Memory Consolidation
Transfers and extracts knowledge between memory tiers:
- Working -> Episodic
- Episodic -> Semantic
- Episodic -> Procedural
"""
# Will be populated in #95


@@ -0,0 +1,8 @@
"""
Episodic Memory
Experiential memory storing past task completions,
failures, and learnings.
"""
# Will be populated in #90


@@ -0,0 +1,206 @@
"""
Memory System Exceptions
Custom exception classes for the Agent Memory System.
"""
from typing import Any
from uuid import UUID
class MemoryError(Exception):
"""Base exception for all memory-related errors."""
def __init__(
self,
message: str,
*,
memory_type: str | None = None,
scope_type: str | None = None,
scope_id: str | None = None,
details: dict[str, Any] | None = None,
) -> None:
super().__init__(message)
self.message = message
self.memory_type = memory_type
self.scope_type = scope_type
self.scope_id = scope_id
self.details = details or {}
class MemoryNotFoundError(MemoryError):
"""Raised when a memory item is not found."""
def __init__(
self,
message: str = "Memory not found",
*,
memory_id: UUID | str | None = None,
key: str | None = None,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.memory_id = memory_id
self.key = key
class MemoryCapacityError(MemoryError):
"""Raised when memory capacity limits are exceeded."""
def __init__(
self,
message: str = "Memory capacity exceeded",
*,
current_size: int = 0,
max_size: int = 0,
item_count: int = 0,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.current_size = current_size
self.max_size = max_size
self.item_count = item_count
class MemoryExpiredError(MemoryError):
"""Raised when attempting to access expired memory."""
def __init__(
self,
message: str = "Memory has expired",
*,
key: str | None = None,
expired_at: str | None = None,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.key = key
self.expired_at = expired_at
class MemoryStorageError(MemoryError):
"""Raised when memory storage operations fail."""
def __init__(
self,
message: str = "Memory storage operation failed",
*,
operation: str | None = None,
backend: str | None = None,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.operation = operation
self.backend = backend
class MemorySerializationError(MemoryError):
"""Raised when memory serialization/deserialization fails."""
def __init__(
self,
message: str = "Memory serialization failed",
*,
content_type: str | None = None,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.content_type = content_type
class MemoryScopeError(MemoryError):
"""Raised when memory scope operations fail."""
def __init__(
self,
message: str = "Memory scope error",
*,
requested_scope: str | None = None,
allowed_scopes: list[str] | None = None,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.requested_scope = requested_scope
self.allowed_scopes = allowed_scopes or []
class MemoryConsolidationError(MemoryError):
"""Raised when memory consolidation fails."""
def __init__(
self,
message: str = "Memory consolidation failed",
*,
source_type: str | None = None,
target_type: str | None = None,
items_processed: int = 0,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.source_type = source_type
self.target_type = target_type
self.items_processed = items_processed
class MemoryRetrievalError(MemoryError):
"""Raised when memory retrieval fails."""
def __init__(
self,
message: str = "Memory retrieval failed",
*,
query: str | None = None,
retrieval_type: str | None = None,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.query = query
self.retrieval_type = retrieval_type
class EmbeddingError(MemoryError):
"""Raised when embedding generation fails."""
def __init__(
self,
message: str = "Embedding generation failed",
*,
content_length: int = 0,
model: str | None = None,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.content_length = content_length
self.model = model
class CheckpointError(MemoryError):
"""Raised when checkpoint operations fail."""
def __init__(
self,
message: str = "Checkpoint operation failed",
*,
checkpoint_id: str | None = None,
operation: str | None = None,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.checkpoint_id = checkpoint_id
self.operation = operation
class MemoryConflictError(MemoryError):
"""Raised when there's a conflict in memory (e.g., contradictory facts)."""
def __init__(
self,
message: str = "Memory conflict detected",
*,
conflicting_ids: list[str | UUID] | None = None,
conflict_type: str | None = None,
**kwargs: Any,
) -> None:
super().__init__(message, **kwargs)
self.conflicting_ids = conflicting_ids or []
self.conflict_type = conflict_type
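
For illustration, a short sketch of raising and handling these structured exceptions (the key and scope values are invented):

from app.services.memory import MemoryError, MemoryNotFoundError

try:
    raise MemoryNotFoundError(
        "task state missing",
        key="task:state",
        memory_type="working",
        scope_type="session",
        scope_id="sess-123",
    )
except MemoryError as exc:  # the package base class catches all of the above
    print(exc.message, exc.memory_type, exc.scope_type, exc.scope_id)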


@@ -0,0 +1,7 @@
"""
Memory Indexing
Vector embeddings and retrieval engine for memory search.
"""
# Will be populated in #94

View File

@@ -0,0 +1,606 @@
"""
Memory Manager
Facade for the Agent Memory System providing unified access
to all memory types and operations.
"""
import logging
from typing import Any
from uuid import UUID
from .config import MemorySettings, get_memory_settings
from .types import (
Episode,
EpisodeCreate,
Fact,
FactCreate,
MemoryStats,
MemoryType,
Outcome,
Procedure,
ProcedureCreate,
RetrievalResult,
ScopeContext,
ScopeLevel,
TaskState,
)
logger = logging.getLogger(__name__)
class MemoryManager:
"""
Unified facade for the Agent Memory System.
Provides a single entry point for all memory operations across
working, episodic, semantic, and procedural memory types.
Usage:
manager = MemoryManager.create()
# Working memory
await manager.set_working("key", {"data": "value"})
value = await manager.get_working("key")
# Episodic memory
episode = await manager.record_episode(episode_data)
similar = await manager.search_episodes("query")
# Semantic memory
fact = await manager.store_fact(fact_data)
facts = await manager.search_facts("query")
# Procedural memory
procedure = await manager.record_procedure(procedure_data)
procedures = await manager.find_procedures("context")
"""
def __init__(
self,
settings: MemorySettings,
scope: ScopeContext,
) -> None:
"""
Initialize the MemoryManager.
Args:
settings: Memory configuration settings
scope: The scope context for this manager instance
"""
self._settings = settings
self._scope = scope
self._initialized = False
# These will be initialized when the respective sub-modules are implemented
self._working_memory: Any | None = None
self._episodic_memory: Any | None = None
self._semantic_memory: Any | None = None
self._procedural_memory: Any | None = None
logger.debug(
"MemoryManager created for scope %s:%s",
scope.scope_type.value,
scope.scope_id,
)
@classmethod
def create(
cls,
scope_type: ScopeLevel = ScopeLevel.SESSION,
scope_id: str = "default",
parent_scope: ScopeContext | None = None,
settings: MemorySettings | None = None,
) -> "MemoryManager":
"""
Create a new MemoryManager instance.
Args:
scope_type: The scope level for this manager
scope_id: The scope identifier
parent_scope: Optional parent scope for inheritance
settings: Optional custom settings (uses global if not provided)
Returns:
A new MemoryManager instance
"""
if settings is None:
settings = get_memory_settings()
scope = ScopeContext(
scope_type=scope_type,
scope_id=scope_id,
parent=parent_scope,
)
return cls(settings=settings, scope=scope)
@classmethod
def for_session(
cls,
session_id: str,
agent_instance_id: UUID | None = None,
project_id: UUID | None = None,
) -> "MemoryManager":
"""
Create a MemoryManager for a specific session.
Builds the appropriate scope hierarchy based on provided IDs.
Args:
session_id: The session identifier
agent_instance_id: Optional agent instance ID
project_id: Optional project ID
Returns:
A MemoryManager configured for the session scope
"""
settings = get_memory_settings()
# Build scope hierarchy
parent: ScopeContext | None = None
if project_id:
parent = ScopeContext(
scope_type=ScopeLevel.PROJECT,
scope_id=str(project_id),
parent=ScopeContext(
scope_type=ScopeLevel.GLOBAL,
scope_id="global",
),
)
if agent_instance_id:
parent = ScopeContext(
scope_type=ScopeLevel.AGENT_INSTANCE,
scope_id=str(agent_instance_id),
parent=parent,
)
scope = ScopeContext(
scope_type=ScopeLevel.SESSION,
scope_id=session_id,
parent=parent,
)
return cls(settings=settings, scope=scope)
@property
def scope(self) -> ScopeContext:
"""Get the current scope context."""
return self._scope
@property
def settings(self) -> MemorySettings:
"""Get the memory settings."""
return self._settings
# =========================================================================
# Working Memory Operations
# =========================================================================
async def set_working(
self,
key: str,
value: Any,
ttl_seconds: int | None = None,
) -> None:
"""
Set a value in working memory.
Args:
key: The key to store the value under
value: The value to store (must be JSON serializable)
ttl_seconds: Optional TTL (uses default if not provided)
"""
# Placeholder - will be implemented in #89
logger.debug("set_working called for key=%s (not yet implemented)", key)
raise NotImplementedError("Working memory not yet implemented")
async def get_working(
self,
key: str,
default: Any = None,
) -> Any:
"""
Get a value from working memory.
Args:
key: The key to retrieve
default: Default value if key not found
Returns:
The stored value or default
"""
# Placeholder - will be implemented in #89
logger.debug("get_working called for key=%s (not yet implemented)", key)
raise NotImplementedError("Working memory not yet implemented")
async def delete_working(self, key: str) -> bool:
"""
Delete a value from working memory.
Args:
key: The key to delete
Returns:
True if the key was deleted, False if not found
"""
# Placeholder - will be implemented in #89
logger.debug("delete_working called for key=%s (not yet implemented)", key)
raise NotImplementedError("Working memory not yet implemented")
async def set_task_state(self, state: TaskState) -> None:
"""
Set the current task state in working memory.
Args:
state: The task state to store
"""
# Placeholder - will be implemented in #89
logger.debug(
"set_task_state called for task=%s (not yet implemented)",
state.task_id,
)
raise NotImplementedError("Working memory not yet implemented")
async def get_task_state(self) -> TaskState | None:
"""
Get the current task state from working memory.
Returns:
The current task state or None
"""
# Placeholder - will be implemented in #89
logger.debug("get_task_state called (not yet implemented)")
raise NotImplementedError("Working memory not yet implemented")
async def create_checkpoint(self) -> str:
"""
Create a checkpoint of the current working memory state.
Returns:
The checkpoint ID
"""
# Placeholder - will be implemented in #89
logger.debug("create_checkpoint called (not yet implemented)")
raise NotImplementedError("Working memory not yet implemented")
async def restore_checkpoint(self, checkpoint_id: str) -> None:
"""
Restore working memory from a checkpoint.
Args:
checkpoint_id: The checkpoint to restore from
"""
# Placeholder - will be implemented in #89
logger.debug(
"restore_checkpoint called for id=%s (not yet implemented)",
checkpoint_id,
)
raise NotImplementedError("Working memory not yet implemented")
# =========================================================================
# Episodic Memory Operations
# =========================================================================
async def record_episode(self, episode: EpisodeCreate) -> Episode:
"""
Record a new episode in episodic memory.
Args:
episode: The episode data to record
Returns:
The created episode with ID
"""
# Placeholder - will be implemented in #90
logger.debug(
"record_episode called for task=%s (not yet implemented)",
episode.task_type,
)
raise NotImplementedError("Episodic memory not yet implemented")
async def search_episodes(
self,
query: str,
limit: int | None = None,
) -> RetrievalResult[Episode]:
"""
Search for similar episodes.
Args:
query: The search query
limit: Maximum results to return
Returns:
Retrieval result with matching episodes
"""
# Placeholder - will be implemented in #90
logger.debug(
"search_episodes called for query=%s (not yet implemented)",
query[:50],
)
raise NotImplementedError("Episodic memory not yet implemented")
async def get_recent_episodes(
self,
limit: int = 10,
) -> list[Episode]:
"""
Get the most recent episodes.
Args:
limit: Maximum episodes to return
Returns:
List of recent episodes
"""
# Placeholder - will be implemented in #90
logger.debug("get_recent_episodes called (not yet implemented)")
raise NotImplementedError("Episodic memory not yet implemented")
async def get_episodes_by_outcome(
self,
outcome: Outcome,
limit: int = 10,
) -> list[Episode]:
"""
Get episodes by outcome.
Args:
outcome: The outcome to filter by
limit: Maximum episodes to return
Returns:
List of episodes with the specified outcome
"""
# Placeholder - will be implemented in #90
logger.debug(
"get_episodes_by_outcome called for outcome=%s (not yet implemented)",
outcome.value,
)
raise NotImplementedError("Episodic memory not yet implemented")
# =========================================================================
# Semantic Memory Operations
# =========================================================================
async def store_fact(self, fact: FactCreate) -> Fact:
"""
Store a new fact in semantic memory.
Args:
fact: The fact data to store
Returns:
The created fact with ID
"""
# Placeholder - will be implemented in #91
logger.debug(
"store_fact called for %s %s %s (not yet implemented)",
fact.subject,
fact.predicate,
fact.object,
)
raise NotImplementedError("Semantic memory not yet implemented")
async def search_facts(
self,
query: str,
limit: int | None = None,
) -> RetrievalResult[Fact]:
"""
Search for facts matching a query.
Args:
query: The search query
limit: Maximum results to return
Returns:
Retrieval result with matching facts
"""
# Placeholder - will be implemented in #91
logger.debug(
"search_facts called for query=%s (not yet implemented)",
query[:50],
)
raise NotImplementedError("Semantic memory not yet implemented")
async def get_facts_by_entity(
self,
entity: str,
limit: int = 20,
) -> list[Fact]:
"""
Get facts related to an entity.
Args:
entity: The entity to search for
limit: Maximum facts to return
Returns:
List of facts mentioning the entity
"""
# Placeholder - will be implemented in #91
logger.debug(
"get_facts_by_entity called for entity=%s (not yet implemented)",
entity,
)
raise NotImplementedError("Semantic memory not yet implemented")
async def reinforce_fact(self, fact_id: UUID) -> Fact:
"""
Reinforce a fact (increase confidence from repeated learning).
Args:
fact_id: The fact to reinforce
Returns:
The updated fact
"""
# Placeholder - will be implemented in #91
logger.debug(
"reinforce_fact called for id=%s (not yet implemented)",
fact_id,
)
raise NotImplementedError("Semantic memory not yet implemented")
# =========================================================================
# Procedural Memory Operations
# =========================================================================
async def record_procedure(self, procedure: ProcedureCreate) -> Procedure:
"""
Record a new procedure.
Args:
procedure: The procedure data to record
Returns:
The created procedure with ID
"""
# Placeholder - will be implemented in #92
logger.debug(
"record_procedure called for name=%s (not yet implemented)",
procedure.name,
)
raise NotImplementedError("Procedural memory not yet implemented")
async def find_procedures(
self,
context: str,
limit: int = 5,
) -> list[Procedure]:
"""
Find procedures matching the current context.
Args:
context: The context to match against
limit: Maximum procedures to return
Returns:
List of matching procedures sorted by success rate
"""
# Placeholder - will be implemented in #92
logger.debug(
"find_procedures called for context=%s (not yet implemented)",
context[:50],
)
raise NotImplementedError("Procedural memory not yet implemented")
async def record_procedure_outcome(
self,
procedure_id: UUID,
success: bool,
) -> None:
"""
Record the outcome of using a procedure.
Args:
procedure_id: The procedure that was used
success: Whether the procedure succeeded
"""
# Placeholder - will be implemented in #92
logger.debug(
"record_procedure_outcome called for id=%s success=%s (not yet implemented)",
procedure_id,
success,
)
raise NotImplementedError("Procedural memory not yet implemented")
# =========================================================================
# Cross-Memory Operations
# =========================================================================
async def recall(
self,
query: str,
memory_types: list[MemoryType] | None = None,
limit: int = 10,
) -> dict[MemoryType, list[Any]]:
"""
Recall memories across multiple memory types.
Args:
query: The search query
memory_types: Memory types to search (all if not specified)
limit: Maximum results per type
Returns:
Dictionary mapping memory types to results
"""
# Placeholder - will be implemented in #97 (Component Integration)
logger.debug("recall called for query=%s (not yet implemented)", query[:50])
raise NotImplementedError("Cross-memory recall not yet implemented")
async def get_stats(
self,
memory_type: MemoryType | None = None,
) -> list[MemoryStats]:
"""
Get memory statistics.
Args:
memory_type: Specific type or all if not specified
Returns:
List of statistics for requested memory types
"""
# Placeholder - will be implemented in #100 (Metrics & Observability)
logger.debug("get_stats called (not yet implemented)")
raise NotImplementedError("Memory stats not yet implemented")
# =========================================================================
# Lifecycle Operations
# =========================================================================
async def initialize(self) -> None:
"""
Initialize the memory manager and its backends.
Should be called before using the manager.
"""
if self._initialized:
logger.debug("MemoryManager already initialized")
return
logger.info(
"Initializing MemoryManager for scope %s:%s",
self._scope.scope_type.value,
self._scope.scope_id,
)
# TODO: Initialize backends when implemented
self._initialized = True
logger.info("MemoryManager initialized successfully")
async def close(self) -> None:
"""
Close the memory manager and release resources.
Should be called when done using the manager.
"""
if not self._initialized:
return
logger.info(
"Closing MemoryManager for scope %s:%s",
self._scope.scope_type.value,
self._scope.scope_id,
)
# TODO: Close backends when implemented
self._initialized = False
logger.info("MemoryManager closed successfully")
async def __aenter__(self) -> "MemoryManager":
"""Async context manager entry."""
await self.initialize()
return self
async def __aexit__(self, exc_type: Any, exc_val: Any, exc_tb: Any) -> None:
"""Async context manager exit."""
await self.close()
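
Because the storage-backed methods still raise NotImplementedError, the behavior exercisable in this commit is scope construction. For illustration (the UUIDs are invented):

from uuid import uuid4

from app.services.memory import MemoryManager

manager = MemoryManager.for_session(
    session_id="sess-123",
    agent_instance_id=uuid4(),
    project_id=uuid4(),
)
for scope in manager.scope.get_hierarchy():
    print(scope.to_key_prefix())
# global:global
# project:<project uuid>
# agent_instance:<agent instance uuid>
# session:sess-123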


@@ -0,0 +1,7 @@
"""
Procedural Memory
Learned skills and procedures from successful task patterns.
"""
# Will be populated in #92


@@ -0,0 +1,8 @@
"""
Memory Scoping
Hierarchical scoping for memory with inheritance:
Global -> Project -> Agent Type -> Agent Instance -> Session
"""
# Will be populated in #93


@@ -0,0 +1,8 @@
"""
Semantic Memory
Fact storage with triple format (subject, predicate, object)
and semantic search capabilities.
"""
# Will be populated in #91
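
For a concrete sense of the triple format, a FactCreate (defined in memory/types.py) might look like this; the values are invented:

from app.services.memory import FactCreate

fact = FactCreate(
    subject="project-alpha",
    predicate="uses_database",
    object="postgresql",
    confidence=0.9,
)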


@@ -0,0 +1,322 @@
"""
Memory System Types
Core type definitions and interfaces for the Agent Memory System.
"""
from abc import ABC, abstractmethod
from dataclasses import dataclass, field
from datetime import datetime
from enum import Enum
from typing import Any
from uuid import UUID
class MemoryType(str, Enum):
"""Types of memory in the agent memory system."""
WORKING = "working"
EPISODIC = "episodic"
SEMANTIC = "semantic"
PROCEDURAL = "procedural"
class ScopeLevel(str, Enum):
"""Hierarchical scoping levels for memory."""
GLOBAL = "global"
PROJECT = "project"
AGENT_TYPE = "agent_type"
AGENT_INSTANCE = "agent_instance"
SESSION = "session"
class Outcome(str, Enum):
"""Outcome of a task or episode."""
SUCCESS = "success"
FAILURE = "failure"
PARTIAL = "partial"
class ConsolidationStatus(str, Enum):
"""Status of a memory consolidation job."""
PENDING = "pending"
RUNNING = "running"
COMPLETED = "completed"
FAILED = "failed"
class ConsolidationType(str, Enum):
"""Types of memory consolidation."""
WORKING_TO_EPISODIC = "working_to_episodic"
EPISODIC_TO_SEMANTIC = "episodic_to_semantic"
EPISODIC_TO_PROCEDURAL = "episodic_to_procedural"
PRUNING = "pruning"
@dataclass
class ScopeContext:
"""Represents a memory scope with its hierarchy."""
scope_type: ScopeLevel
scope_id: str
parent: "ScopeContext | None" = None
def get_hierarchy(self) -> list["ScopeContext"]:
"""Get the full scope hierarchy from root to this scope."""
hierarchy: list[ScopeContext] = []
current: ScopeContext | None = self
while current is not None:
hierarchy.insert(0, current)
current = current.parent
return hierarchy
def to_key_prefix(self) -> str:
"""Convert scope to a key prefix for storage."""
return f"{self.scope_type.value}:{self.scope_id}"
@dataclass
class MemoryItem:
"""Base class for all memory items."""
id: UUID
memory_type: MemoryType
scope_type: ScopeLevel
scope_id: str
created_at: datetime
updated_at: datetime
metadata: dict[str, Any] = field(default_factory=dict)
def get_age_seconds(self) -> float:
"""Get the age of this memory item in seconds."""
return (datetime.now() - self.created_at).total_seconds()
@dataclass
class WorkingMemoryItem:
"""A key-value item in working memory."""
id: UUID
scope_type: ScopeLevel
scope_id: str
key: str
value: Any
expires_at: datetime | None = None
created_at: datetime = field(default_factory=datetime.now)
updated_at: datetime = field(default_factory=datetime.now)
def is_expired(self) -> bool:
"""Check if this item has expired."""
if self.expires_at is None:
return False
return datetime.now() > self.expires_at
@dataclass
class TaskState:
"""Current state of a task in working memory."""
task_id: str
task_type: str
description: str
status: str = "in_progress"
current_step: int = 0
total_steps: int = 0
progress_percent: float = 0.0
context: dict[str, Any] = field(default_factory=dict)
started_at: datetime = field(default_factory=datetime.now)
updated_at: datetime = field(default_factory=datetime.now)
@dataclass
class Episode:
"""An episodic memory - a recorded experience."""
id: UUID
project_id: UUID
agent_instance_id: UUID | None
agent_type_id: UUID | None
session_id: str
task_type: str
task_description: str
actions: list[dict[str, Any]]
context_summary: str
outcome: Outcome
outcome_details: str
duration_seconds: float
tokens_used: int
lessons_learned: list[str]
importance_score: float
embedding: list[float] | None
occurred_at: datetime
created_at: datetime
updated_at: datetime
@dataclass
class EpisodeCreate:
"""Data required to create a new episode."""
project_id: UUID
session_id: str
task_type: str
task_description: str
actions: list[dict[str, Any]]
context_summary: str
outcome: Outcome
outcome_details: str
duration_seconds: float
tokens_used: int
lessons_learned: list[str] = field(default_factory=list)
importance_score: float = 0.5
agent_instance_id: UUID | None = None
agent_type_id: UUID | None = None
@dataclass
class Fact:
"""A semantic memory fact - a piece of knowledge."""
id: UUID
project_id: UUID | None # None for global facts
subject: str
predicate: str
object: str
confidence: float
source_episode_ids: list[UUID]
first_learned: datetime
last_reinforced: datetime
reinforcement_count: int
embedding: list[float] | None
created_at: datetime
updated_at: datetime
@dataclass
class FactCreate:
"""Data required to create a new fact."""
subject: str
predicate: str
object: str
confidence: float = 0.8
project_id: UUID | None = None
source_episode_ids: list[UUID] = field(default_factory=list)
@dataclass
class Procedure:
"""A procedural memory - a learned skill or procedure."""
id: UUID
project_id: UUID | None
agent_type_id: UUID | None
name: str
trigger_pattern: str
steps: list[dict[str, Any]]
success_count: int
failure_count: int
last_used: datetime | None
embedding: list[float] | None
created_at: datetime
updated_at: datetime
@property
def success_rate(self) -> float:
"""Calculate the success rate of this procedure."""
total = self.success_count + self.failure_count
if total == 0:
return 0.0
return self.success_count / total
@dataclass
class ProcedureCreate:
"""Data required to create a new procedure."""
name: str
trigger_pattern: str
steps: list[dict[str, Any]]
project_id: UUID | None = None
agent_type_id: UUID | None = None
@dataclass
class Step:
"""A single step in a procedure."""
order: int
action: str
parameters: dict[str, Any] = field(default_factory=dict)
expected_outcome: str = ""
fallback_action: str | None = None
class MemoryStore[T: MemoryItem](ABC):
"""Abstract base class for memory storage backends."""
@abstractmethod
async def store(self, item: T) -> T:
"""Store a memory item."""
...
@abstractmethod
async def get(self, item_id: UUID) -> T | None:
"""Get a memory item by ID."""
...
@abstractmethod
async def delete(self, item_id: UUID) -> bool:
"""Delete a memory item."""
...
@abstractmethod
async def list(
self,
scope_type: ScopeLevel | None = None,
scope_id: str | None = None,
limit: int = 100,
offset: int = 0,
) -> list[T]:
"""List memory items with optional scope filtering."""
...
@abstractmethod
async def count(
self,
scope_type: ScopeLevel | None = None,
scope_id: str | None = None,
) -> int:
"""Count memory items with optional scope filtering."""
...
@dataclass
class RetrievalResult[T]:
"""Result of a memory retrieval operation."""
items: list[T]
total_count: int
query: str
retrieval_type: str
latency_ms: float
metadata: dict[str, Any] = field(default_factory=dict)
@dataclass
class MemoryStats:
"""Statistics about memory usage."""
memory_type: MemoryType
scope_type: ScopeLevel | None
scope_id: str | None
item_count: int
total_size_bytes: int
oldest_item_age_seconds: float
newest_item_age_seconds: float
avg_item_size_bytes: float
metadata: dict[str, Any] = field(default_factory=dict)
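
To make the MemoryStore contract concrete, here is a minimal dict-backed sketch using the types defined above (InMemoryStore is a hypothetical name, not part of this commit):

class InMemoryStore(MemoryStore[MemoryItem]):
    """Toy backend: a dict keyed by item ID, filtered by scope on list/count."""

    def __init__(self) -> None:
        self._items: dict[UUID, MemoryItem] = {}

    async def store(self, item: MemoryItem) -> MemoryItem:
        self._items[item.id] = item
        return item

    async def get(self, item_id: UUID) -> MemoryItem | None:
        return self._items.get(item_id)

    async def delete(self, item_id: UUID) -> bool:
        return self._items.pop(item_id, None) is not None

    async def list(
        self,
        scope_type: ScopeLevel | None = None,
        scope_id: str | None = None,
        limit: int = 100,
        offset: int = 0,
    ) -> list[MemoryItem]:
        matches = [
            item
            for item in self._items.values()
            if (scope_type is None or item.scope_type == scope_type)
            and (scope_id is None or item.scope_id == scope_id)
        ]
        return matches[offset : offset + limit]

    async def count(
        self,
        scope_type: ScopeLevel | None = None,
        scope_id: str | None = None,
    ) -> int:
        return len(await self.list(scope_type, scope_id, limit=len(self._items)))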


@@ -0,0 +1,8 @@
"""
Working Memory
Session-scoped ephemeral memory for current task state,
variables, and scratchpad.
"""
# Will be populated in #89