API Reference¶

`contextfs.core.ContextFS` ¶

Universal AI Memory Layer.

Provides: - Semantic search with RAG - Cross-repo namespace isolation - Session management - Git-aware context - Memory lineage (evolve, merge, split) - CORE FEATURE

Memory lineage works automatically based on .env configuration. Configure CONTEXTFS_BACKEND to select storage backend.

Source code in src/contextfs/core.py

class ContextFS:
    """
    Universal AI Memory Layer.

    Provides:
    - Semantic search with RAG
    - Cross-repo namespace isolation
    - Session management
    - Git-aware context
    - Memory lineage (evolve, merge, split) - CORE FEATURE

    Memory lineage works automatically based on .env configuration.
    Configure CONTEXTFS_BACKEND to select storage backend.
    """

    def __init__(
        self,
        data_dir: Path | None = None,
        namespace_id: str | None = None,
        auto_load: bool = True,
        auto_index: bool = True,
    ):
        """
        Initialize ContextFS.

        Args:
            data_dir: Data directory (default: ~/.contextfs)
            namespace_id: Default namespace (default: global or auto-detect from repo)
            auto_load: Load memories on startup
            auto_index: Auto-index repository on first memory save
        """
        self.config = get_config()
        self.data_dir = data_dir or self.config.data_dir
        self.data_dir.mkdir(parents=True, exist_ok=True)

        # Auto-detect namespace from current repo
        self._repo_path: Path | None = None
        if namespace_id is None:
            namespace_id, self._repo_path = self._detect_namespace_and_repo()
        self.namespace_id = namespace_id

        # Initialize storage using backend factory
        self._db_path = self.data_dir / self.config.sqlite_filename
        self._init_db()

        # Initialize RAG backend with configurable embedding backend
        # When chroma_host is set, uses HttpClient (server mode) instead of PersistentClient
        # When chroma_auto_server is True, auto-starts server on corruption
        self.rag = RAGBackend(
            data_dir=self.data_dir,
            embedding_model=self.config.embedding_model,
            embedding_backend=self.config.embedding_backend,
            use_gpu=self.config.use_gpu,
            parallel_workers=self.config.embedding_parallel_workers,
            chroma_host=self.config.chroma_host,
            chroma_port=self.config.chroma_port,
            chroma_auto_server=self.config.chroma_auto_server,
        )

        # Initialize FTS and Hybrid search backends
        from contextfs.fts import FTSBackend, HybridSearch

        self._fts = FTSBackend(self._db_path)
        self._hybrid = HybridSearch(fts_backend=self._fts, rag_backend=self.rag)

        # Initialize graph backend if configured
        self._graph = self._init_graph_backend()

        # Initialize unified storage router (keeps all backends in sync)
        self._storage = StorageRouter(
            db_path=self._db_path,
            rag_backend=self.rag,
            graph_backend=self._graph,
        )

        # Alias for backwards compatibility
        self.storage = self._storage

        # Initialize memory lineage (CORE FEATURE)
        self._lineage = MemoryLineage(self._storage, self._graph)

        # Auto-indexing
        self._auto_index = auto_index
        self._auto_indexer = None
        self._indexing_triggered = False

        # Current session
        self._current_session: Session | None = None

        # Auto-load memories
        if auto_load and self.config.auto_load_on_startup:
            self._load_startup_context()

    def _init_graph_backend(self):
        """Initialize graph backend based on configuration."""
        if not self.config.falkordb_enabled:
            return None

        try:
            from contextfs.graph_backend import FalkorDBBackend

            graph = FalkorDBBackend(
                host=self.config.falkordb_host,
                port=self.config.falkordb_port,
                password=self.config.falkordb_password,
                graph_name=self.config.falkordb_graph_name,
            )
            logger.info(
                f"FalkorDB graph backend enabled: {self.config.falkordb_host}:{self.config.falkordb_port}"
            )
            return graph
        except ImportError:
            logger.warning("FalkorDB not installed. Graph features using SQLite fallback.")
            return None
        except Exception as e:
            logger.warning(f"FalkorDB connection failed: {e}. Using SQLite fallback.")
            return None

    def _detect_namespace(self) -> str:
        """Detect namespace from current git repo or use global."""
        namespace_id, _ = self._detect_namespace_and_repo()
        return namespace_id

    def _detect_namespace_and_repo(self) -> tuple[str, Path | None]:
        """Detect namespace and repo path from current git repo."""
        cwd = Path.cwd()

        # Walk up to find .git
        for parent in [cwd] + list(cwd.parents):
            if (parent / ".git").exists():
                return Namespace.for_repo(str(parent)).id, parent

        return "global", None

    def _init_db(self) -> None:
        """Initialize SQLite database with Alembic migrations."""
        from contextfs.migrations.runner import run_migrations, stamp_database

        db_exists = self._db_path.exists()

        if db_exists:
            # Check if database has alembic_version table
            conn = sqlite3.connect(self._db_path)
            cursor = conn.cursor()
            cursor.execute(
                "SELECT name FROM sqlite_master WHERE type='table' AND name='alembic_version'"
            )
            has_alembic = cursor.fetchone() is not None
            conn.close()

            if not has_alembic:
                # Existing database without migrations - stamp it first
                logger.info("Stamping existing database with migration baseline")
                stamp_database(self._db_path, "001")

        # Run any pending migrations
        try:
            run_migrations(self._db_path)
        except Exception as e:
            logger.warning(f"Migration failed, falling back to legacy init: {e}")
            self._init_db_legacy()

    def _init_db_legacy(self) -> None:
        """Legacy database initialization (fallback)."""
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        # Memories table
        cursor.execute("""
            CREATE TABLE IF NOT EXISTS memories (
                id TEXT PRIMARY KEY,
                content TEXT NOT NULL,
                type TEXT NOT NULL,
                tags TEXT,
                summary TEXT,
                namespace_id TEXT NOT NULL,
                source_file TEXT,
                source_repo TEXT,
                source_tool TEXT,
                project TEXT,
                session_id TEXT,
                created_at TEXT NOT NULL,
                updated_at TEXT NOT NULL,
                metadata TEXT,
                structured_data TEXT,
                authoritative INTEGER DEFAULT 0
            )
        """)

        # Add structured_data column if it doesn't exist (for existing databases)
        try:
            cursor.execute("ALTER TABLE memories ADD COLUMN structured_data TEXT")
        except sqlite3.OperationalError:
            pass  # Column already exists

        # Add authoritative column if it doesn't exist (Phase 3)
        try:
            cursor.execute("ALTER TABLE memories ADD COLUMN authoritative INTEGER DEFAULT 0")
        except sqlite3.OperationalError:
            pass  # Column already exists

        # Sessions table
        cursor.execute("""
            CREATE TABLE IF NOT EXISTS sessions (
                id TEXT PRIMARY KEY,
                label TEXT,
                namespace_id TEXT NOT NULL,
                tool TEXT NOT NULL,
                repo_path TEXT,
                branch TEXT,
                started_at TEXT NOT NULL,
                ended_at TEXT,
                summary TEXT,
                metadata TEXT
            )
        """)

        # Messages table
        cursor.execute("""
            CREATE TABLE IF NOT EXISTS messages (
                id TEXT PRIMARY KEY,
                session_id TEXT NOT NULL,
                role TEXT NOT NULL,
                content TEXT NOT NULL,
                timestamp TEXT NOT NULL,
                metadata TEXT,
                FOREIGN KEY (session_id) REFERENCES sessions(id)
            )
        """)

        # Namespaces table
        cursor.execute("""
            CREATE TABLE IF NOT EXISTS namespaces (
                id TEXT PRIMARY KEY,
                name TEXT NOT NULL,
                parent_id TEXT,
                repo_path TEXT,
                created_at TEXT NOT NULL,
                metadata TEXT
            )
        """)

        # FTS for text search
        cursor.execute("""
            CREATE VIRTUAL TABLE IF NOT EXISTS memories_fts USING fts5(
                id, content, summary, tags,
                content='memories',
                content_rowid='rowid'
            )
        """)

        # Indexes
        cursor.execute(
            "CREATE INDEX IF NOT EXISTS idx_memories_namespace ON memories(namespace_id)"
        )
        cursor.execute("CREATE INDEX IF NOT EXISTS idx_memories_type ON memories(type)")
        cursor.execute(
            "CREATE INDEX IF NOT EXISTS idx_sessions_namespace ON sessions(namespace_id)"
        )
        cursor.execute("CREATE INDEX IF NOT EXISTS idx_sessions_label ON sessions(label)")

        conn.commit()
        conn.close()

    def _load_startup_context(self) -> None:
        """Load relevant context on startup."""
        # This could load recent memories, active session, etc.
        pass

    def check_and_repair_chromadb(self) -> bool:
        """Check if ChromaDB needs repair and rebuild if necessary.

        This is called automatically when corruption is detected during
        initialization. Returns True if repair was performed.
        """
        import logging

        logger = logging.getLogger(__name__)

        if not self.rag.needs_rebuild:
            return False

        logger.info("ChromaDB was auto-recovered from corruption. Rebuilding from SQLite...")

        try:
            # Rebuild ChromaDB from SQLite (our memories are safe there)
            stats = self.rebuild_chromadb()
            logger.info(f"ChromaDB rebuilt successfully: {stats.get('rebuilt', 0)} memories")
            self.rag.mark_rebuilt()
            return True
        except Exception as e:
            logger.error(f"Failed to rebuild ChromaDB: {e}")
            return False

    # ==================== Auto-Indexing ====================

    def _get_auto_indexer(self):
        """Lazy-load the auto-indexer."""
        if self._auto_indexer is None:
            from contextfs.autoindex import AutoIndexer

            self._auto_indexer = AutoIndexer(
                config=self.config,
                db_path=self._db_path,
            )
        return self._auto_indexer

    def _maybe_auto_index(self) -> dict | None:
        """
        Trigger auto-indexing on first memory save if applicable.

        Returns indexing stats if indexing occurred, None otherwise.
        """
        if not self._auto_index or self._indexing_triggered:
            return None

        if not self._repo_path or not self._repo_path.exists():
            return None

        self._indexing_triggered = True

        indexer = self._get_auto_indexer()

        # Check if already indexed
        if indexer.is_indexed(self.namespace_id):
            logger.debug(f"Namespace {self.namespace_id} already indexed")
            return None

        # Index repository
        logger.info(f"Auto-indexing repository: {self._repo_path}")

        def on_progress(current: int, total: int, file: str) -> None:
            if current % 10 == 0 or current == total:
                logger.info(f"Indexing: {current}/{total} - {file}")

        try:
            stats = indexer.index_repository(
                repo_path=self._repo_path,
                namespace_id=self.namespace_id,
                storage=self.storage,
                on_progress=on_progress,
                incremental=True,
            )
            logger.info(
                f"Auto-indexing complete: {stats['files_indexed']} files, "
                f"{stats['memories_created']} memories"
            )
            return stats
        except Exception as e:
            logger.warning(f"Auto-indexing failed: {e}")
            return None

    def _namespace_for_path(self, repo_path: Path) -> str:
        """Get namespace ID for a repository path."""
        from contextfs.schemas import Namespace

        return Namespace.for_repo(str(repo_path)).id

    def index_repository(
        self,
        repo_path: Path | None = None,
        on_progress: Callable[[int, int, str], None] | None = None,
        incremental: bool = True,
        project: str | None = None,
        source_repo: str | None = None,
        mode: str = "all",
    ) -> dict:
        """
        Manually index a repository to ChromaDB.

        Args:
            repo_path: Repository path (default: current repo)
            on_progress: Progress callback (current, total, file)
            incremental: Only index new/changed files
            project: Project name for grouping memories across repos
            source_repo: Repository name (default: repo directory name)
            mode: "all", "files_only", or "commits_only"

        Returns:
            Indexing statistics
        """
        from contextfs.autoindex import IndexMode

        path = repo_path or self._repo_path
        if not path:
            raise ValueError("No repository path available")

        # Use namespace derived from the repo being indexed, not ctx's namespace
        namespace_id = self._namespace_for_path(Path(path))

        # Default source_repo to directory name
        if source_repo is None:
            source_repo = Path(path).name

        # Convert string mode to IndexMode enum
        index_mode = IndexMode(mode) if isinstance(mode, str) else mode

        indexer = self._get_auto_indexer()
        return indexer.index_repository(
            repo_path=path,
            namespace_id=namespace_id,
            storage=self.storage,
            on_progress=on_progress,
            incremental=incremental,
            project=project,
            source_repo=source_repo,
            mode=index_mode,
        )

    def get_index_status(self, repo_path: Path | None = None):
        """Get indexing status for a repository.

        Args:
            repo_path: Repository path (default: current working directory's repo)
        """
        if repo_path:
            namespace_id = self._namespace_for_path(repo_path)
        else:
            # Detect from current working directory
            namespace_id, _ = self._detect_namespace_and_repo()
        return self._get_auto_indexer().get_status(namespace_id)

    def clear_index(self, repo_path: Path | None = None) -> None:
        """Clear indexing status for a repository.

        Args:
            repo_path: Repository path (default: current working directory's repo)
        """
        if repo_path:
            namespace_id = self._namespace_for_path(repo_path)
        else:
            namespace_id, _ = self._detect_namespace_and_repo()
        self._get_auto_indexer().clear_index(namespace_id)
        self._indexing_triggered = False

    def list_indexes(self) -> list:
        """List all indexed repositories."""
        return self._get_auto_indexer().list_all_indexes()

    def cleanup_indexes(self, dry_run: bool = False) -> dict:
        """
        Remove indexes for repositories that no longer exist on disk.

        Args:
            dry_run: If True, only report what would be deleted without deleting

        Returns:
            Dict with 'removed' (list of removed indexes) and 'kept' (list of valid indexes)
        """
        return self._get_auto_indexer().cleanup_stale_indexes(dry_run=dry_run)

    def delete_index(self, namespace_id: str | None = None, repo_path: str | None = None) -> bool:
        """
        Delete a specific index by namespace ID or repository path.

        Args:
            namespace_id: The namespace ID to delete
            repo_path: The repository path to delete

        Returns:
            True if deleted, False if not found
        """
        indexer = self._get_auto_indexer()
        if namespace_id:
            return indexer.delete_index(namespace_id)
        elif repo_path:
            return indexer.delete_index_by_path(repo_path)
        return False

    def update_repo_path(
        self,
        namespace_id: str | None = None,
        old_path: str | None = None,
        new_path: str | None = None,
    ) -> dict:
        """
        Update the repository path for an existing index.

        Use this when a repository has been moved to a new location.
        The namespace_id remains the same, preserving all indexed memories
        in both SQLite and ChromaDB.

        Args:
            namespace_id: The namespace ID to update (preferred)
            old_path: The old repository path to find the index (alternative)
            new_path: The new repository path

        Returns:
            Dict with status and updated info:
            - success: bool
            - namespace_id: str (if successful)
            - old_path: str (previous path)
            - new_path: str (updated path)
            - files_indexed, commits_indexed, memories_created: int (preserved counts)
        """
        indexer = self._get_auto_indexer()
        return indexer.update_repo_path(
            namespace_id=namespace_id,
            old_path=old_path,
            new_path=new_path,
        )

    def find_index_by_repo_name(self, repo_name: str) -> list[dict]:
        """
        Find indexes that match a repository name.

        Useful when you know the repo name but not the exact path.

        Args:
            repo_name: Repository directory name to search for

        Returns:
            List of matching indexes with their info
        """
        indexer = self._get_auto_indexer()
        return indexer.find_index_by_repo_name(repo_name)

    def migrate_namespace(
        self,
        old_namespace_id: str,
        new_namespace_id: str,
        new_source: str | None = None,
        new_remote_url: str | None = None,
    ) -> dict:
        """
        Migrate an index from one namespace ID to another.

        Updates all references in SQLite and ChromaDB to use the new namespace ID.
        Use this when converting from path-based to git-remote-based namespaces.

        Args:
            old_namespace_id: Current namespace ID
            new_namespace_id: New namespace ID to migrate to
            new_source: Namespace derivation source (explicit, git_remote, path)
            new_remote_url: Git remote URL if available

        Returns:
            Migration statistics
        """
        indexer = self._get_auto_indexer()
        return indexer.migrate_namespace(
            old_namespace_id=old_namespace_id,
            new_namespace_id=new_namespace_id,
            new_source=new_source,
            new_remote_url=new_remote_url,
            storage=self.storage,
        )

    def get_migration_candidates(self) -> list[dict]:
        """
        Find indexes that should be migrated from path-based to git-remote-based.

        Returns list of indexes where:
        - Current namespace is path-based (old format)
        - Repo has a git remote URL
        - New git-remote namespace would be different

        Returns:
            List of migration candidates with old/new namespace info
        """
        indexer = self._get_auto_indexer()
        return indexer.get_migration_candidates()

    def migrate_all_to_git_remote(self, dry_run: bool = False) -> dict:
        """
        Migrate all path-based namespaces to git-remote-based where possible.

        This makes namespaces portable across machines, enabling proper sync
        between developers with different local paths.

        Args:
            dry_run: If True, only report what would be migrated

        Returns:
            Migration summary with counts and any errors
        """
        indexer = self._get_auto_indexer()
        return indexer.migrate_all_to_git_remote(
            storage=self.storage,
            dry_run=dry_run,
        )

    def index_directory(
        self,
        root_dir: Path,
        max_depth: int = 5,
        on_progress: Callable[[int, int, str], None] | None = None,
        on_repo_start: Callable[[str, str | None], None] | None = None,
        on_repo_complete: Callable[[str, dict], None] | None = None,
        incremental: bool = True,
        project_override: str | None = None,
        repo_filter: Callable[[Path], bool] | None = None,
    ) -> dict:
        """
        Recursively scan a directory for git repos and index each.

        Args:
            root_dir: Root directory to scan for git repositories
            max_depth: Maximum directory depth to search (default: 5)
            on_progress: Progress callback for file indexing (current, total, file)
            on_repo_start: Callback when starting a repo (repo_name, project)
            on_repo_complete: Callback when repo completes (repo_name, stats)
            incremental: Only index new/changed files
            project_override: Override auto-detected project name for all repos
            repo_filter: Optional callback to filter repos (return True to include)

        Returns:
            Summary statistics including repos found, files indexed, etc.
        """
        indexer = self._get_auto_indexer()
        return indexer.index_directory(
            root_dir=root_dir,
            storage=self.storage,
            max_depth=max_depth,
            on_progress=on_progress,
            on_repo_start=on_repo_start,
            on_repo_complete=on_repo_complete,
            incremental=incremental,
            project_override=project_override,
            repo_filter=repo_filter,
        )

    def discover_repos(self, root_dir: Path, max_depth: int = 5) -> list[dict]:
        """
        Discover git repositories without indexing them.

        Args:
            root_dir: Root directory to scan
            max_depth: Maximum directory depth to search

        Returns:
            List of repo info dicts with path, name, project, suggested_tags
        """
        from contextfs.autoindex import discover_git_repos

        return discover_git_repos(root_dir, max_depth=max_depth)

    # ==================== Memory Operations ====================

    def save(
        self,
        content: str,
        type: MemoryType = MemoryType.FACT,
        tags: list[str] | None = None,
        summary: str | None = None,
        namespace_id: str | None = None,
        source_tool: str | None = None,
        source_repo: str | None = None,
        project: str | None = None,
        metadata: dict | None = None,
        created_at: datetime | None = None,
        updated_at: datetime | None = None,
        id: str | None = None,
        structured_data: dict | None = None,
        authoritative: bool = False,
    ) -> Memory:
        """
        Save content to memory.

        Args:
            content: Content to save
            type: Memory type
            tags: Tags for categorization
            summary: Brief summary
            namespace_id: Namespace (default: current)
            source_tool: Tool that created memory (claude-code, claude-desktop, gemini, etc.)
            source_repo: Repository name/path
            project: Project name for grouping memories across repos
            metadata: Additional metadata
            created_at: Original creation timestamp (for sync, defaults to now)
            updated_at: Original update timestamp (for sync, defaults to now)
            id: Memory ID (for sync, auto-generated if not provided)
            structured_data: Optional structured data validated against TYPE_SCHEMAS
            authoritative: Whether this is the authoritative/canonical version in a lineage

        Returns:
            Saved Memory object
        """
        # Trigger auto-indexing on first save (indexes codebase to ChromaDB)
        self._maybe_auto_index()

        # Auto-detect source_repo from repo_path
        if source_repo is None and self._repo_path:
            source_repo = self._repo_path.name

        # Auto-set project from source_repo if not provided
        if project is None and source_repo:
            project = source_repo

        # Check for duplicate by content hash (skip if already exists)
        content_hash = hashlib.sha256(content.encode()).hexdigest()[:16]
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()
        cursor.execute(
            "SELECT id FROM memories WHERE content_hash = ? AND namespace_id = ?",
            (content_hash, namespace_id or self.namespace_id),
        )
        existing = cursor.fetchone()
        if existing and id is None:
            # Return existing memory instead of creating duplicate
            conn.close()
            return self.recall(existing[0])  # type: ignore

        memory_kwargs = {
            "content": content,
            "type": type,
            "tags": tags or [],
            "summary": summary,
            "namespace_id": namespace_id or self.namespace_id,
            "source_tool": source_tool,
            "source_repo": source_repo,
            "project": project,
            "session_id": self._current_session.id if self._current_session else None,
            "metadata": metadata or {},
            "created_at": created_at or datetime.now(timezone.utc),
            "updated_at": updated_at or datetime.now(timezone.utc),
            "structured_data": structured_data,
            "authoritative": authoritative,
            "content_hash": content_hash,
        }
        if id is not None:
            memory_kwargs["id"] = id
        memory = Memory(**memory_kwargs)
        conn.close()

        # Save to SQLite
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        # Get vector_clock from metadata if available (for sync consistency)
        vector_clock = None
        if memory.metadata and memory.metadata.get("_vector_clock"):
            vector_clock = json.dumps(memory.metadata["_vector_clock"])

        cursor.execute(
            """
            INSERT OR REPLACE INTO memories (id, content, type, tags, summary, namespace_id,
                                  source_file, source_repo, source_tool, project, session_id, created_at, updated_at, metadata, structured_data, authoritative, content_hash, vector_clock)
            VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
        """,
            (
                memory.id,
                memory.content,
                memory.type.value,
                json.dumps(memory.tags),
                memory.summary,
                memory.namespace_id,
                memory.source_file,
                memory.source_repo,
                memory.source_tool,
                memory.project,
                memory.session_id,
                memory.created_at.isoformat(),
                memory.updated_at.isoformat(),
                json.dumps(memory.metadata),
                json.dumps(memory.structured_data) if memory.structured_data is not None else None,
                1 if memory.authoritative else 0,
                content_hash,
                vector_clock,
            ),
        )

        # Update session's memories_created list if we have an active session
        if (
            self._current_session
            and memory.session_id
            and memory.id not in self._current_session.memories_created
        ):
            self._current_session.memories_created.append(memory.id)
            # Update session in database
            cursor.execute(
                "UPDATE sessions SET memories_created = ? WHERE id = ?",
                (json.dumps(self._current_session.memories_created), self._current_session.id),
            )

        # Update FTS index
        # For content-linked FTS (content='memories'), we need to use the special rebuild command
        # First try the direct approach, fall back to rebuild if it fails
        try:
            # Get the rowid for this memory
            cursor.execute("SELECT rowid FROM memories WHERE id = ?", (memory.id,))
            row = cursor.fetchone()
            if row:
                rowid = row[0]
                # Delete old FTS entry using the special 'delete' command
                try:
                    cursor.execute(
                        "INSERT INTO memories_fts(memories_fts, rowid) VALUES('delete', ?)",
                        (rowid,),
                    )
                except sqlite3.OperationalError:
                    pass  # May not exist yet
                # Insert new FTS entry
                cursor.execute(
                    """
                    INSERT INTO memories_fts(rowid, id, content, summary, tags, type, namespace_id, source_repo, source_tool, project)
                    VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
                    """,
                    (
                        rowid,
                        memory.id,
                        memory.content,
                        memory.summary,
                        " ".join(memory.tags),
                        memory.type.value if hasattr(memory.type, "value") else memory.type,
                        memory.namespace_id,
                        memory.source_repo,
                        memory.source_tool,
                        memory.project,
                    ),
                )
        except sqlite3.DatabaseError:
            # If FTS is corrupted, rebuild it
            try:
                cursor.execute("INSERT INTO memories_fts(memories_fts) VALUES('rebuild')")
            except sqlite3.DatabaseError:
                pass  # FTS rebuild failed, will be handled later

        conn.commit()
        conn.close()

        # Add to RAG index
        self.rag.add_memory(memory)

        # Auto-link to related memories
        self._auto_link_references(memory)

        return memory

    def save_batch(
        self,
        memories: list[Memory],
        skip_rag: bool = False,
    ) -> int:
        """
        Save multiple memories in a single transaction for efficiency.

        Used by sync operations to bulk-insert pulled memories.

        Args:
            memories: List of Memory objects to save
            skip_rag: If True, skip adding to RAG index (caller will rebuild)

        Returns:
            Number of memories saved
        """
        if not memories:
            return 0

        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        # Get existing content hashes to skip duplicates
        existing_hashes: set[str] = set()
        cursor.execute("SELECT content_hash FROM memories WHERE content_hash IS NOT NULL")
        for row in cursor.fetchall():
            existing_hashes.add(row[0])

        count = 0
        for memory in memories:
            try:
                # Compute content hash for duplicate detection
                content_hash = hashlib.sha256(memory.content.encode()).hexdigest()[:16]

                # Skip if content already exists (unless sync is providing specific ID)
                if content_hash in existing_hashes and not skip_rag:
                    # skip_rag=True indicates sync operation, allow ID-based upsert
                    continue

                # Get vector_clock from metadata if available
                vector_clock = None
                if memory.metadata and memory.metadata.get("_vector_clock"):
                    vector_clock = json.dumps(memory.metadata["_vector_clock"])

                cursor.execute(
                    """
                    INSERT OR REPLACE INTO memories (id, content, type, tags, summary, namespace_id,
                                      source_file, source_repo, source_tool, project, session_id, created_at, updated_at, metadata, structured_data, authoritative, content_hash, vector_clock)
                    VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
                    """,
                    (
                        memory.id,
                        memory.content,
                        memory.type.value if hasattr(memory.type, "value") else memory.type,
                        json.dumps(memory.tags),
                        memory.summary,
                        memory.namespace_id,
                        memory.source_file,
                        memory.source_repo,
                        memory.source_tool,
                        memory.project,
                        memory.session_id,
                        memory.created_at.isoformat()
                        if hasattr(memory.created_at, "isoformat")
                        else memory.created_at,
                        memory.updated_at.isoformat()
                        if hasattr(memory.updated_at, "isoformat")
                        else memory.updated_at,
                        json.dumps(memory.metadata) if memory.metadata else "{}",
                        json.dumps(memory.structured_data)
                        if memory.structured_data is not None
                        else None,
                        1 if getattr(memory, "authoritative", False) else 0,
                        content_hash,
                        vector_clock,
                    ),
                )
                existing_hashes.add(content_hash)
                count += 1
            except Exception as e:
                logger.warning(f"Failed to save memory {memory.id}: {e}")

        # Commit all changes
        conn.commit()

        # Rebuild FTS index once (much faster than individual updates)
        try:
            cursor.execute("INSERT INTO memories_fts(memories_fts) VALUES('rebuild')")
            conn.commit()
        except sqlite3.DatabaseError as e:
            logger.warning(f"FTS rebuild failed: {e}")

        conn.close()

        # Add to RAG index in batch
        if not skip_rag:
            for memory in memories:
                try:
                    self.rag.add_memory(memory)
                except Exception as e:
                    logger.warning(f"Failed to add memory {memory.id} to RAG: {e}")

        return count

    def search(
        self,
        query: str,
        limit: int = 10,
        type: MemoryType | None = None,
        tags: list[str] | None = None,
        namespace_id: str | None = None,
        source_tool: str | None = None,
        source_repo: str | None = None,
        project: str | None = None,
        cross_repo: bool = False,
        mode: str = "hybrid",
        use_semantic: bool | None = None,  # Deprecated, use mode instead
    ) -> list[SearchResult]:
        """
        Search memories.

        Args:
            query: Search query
            limit: Maximum results
            type: Filter by type
            tags: Filter by tags
            namespace_id: Filter by namespace (None with cross_repo=True searches all)
            source_tool: Filter by source tool (claude-code, claude-desktop, gemini, etc.)
            source_repo: Filter by source repository name
            project: Filter by project name (groups memories across repos)
            cross_repo: If True, search across all namespaces/repos
            mode: Search mode - "hybrid" (default), "semantic", "keyword", "smart"
                  - hybrid: Combines FTS + RAG using Reciprocal Rank Fusion
                  - semantic: RAG vector search only (good for conceptual queries)
                  - keyword: FTS5 keyword search only (fast, good for exact terms)
                  - smart: Routes to optimal backend based on memory type
            use_semantic: DEPRECATED - use mode="semantic" or mode="keyword" instead

        Returns:
            List of SearchResult objects
        """
        import re

        # Handle deprecated use_semantic parameter
        if use_semantic is not None:
            mode = "semantic" if use_semantic else "keyword"

        # Auto-detect memory ID pattern (8+ hex chars)
        # If query looks like a memory ID, use recall() instead of vector search
        if re.match(r"^[a-f0-9]{8,}$", query.lower().strip()):
            memory = self.recall(query.strip())
            if memory:
                # Check type filter if specified
                if type and memory.type != type:
                    return []
                return [SearchResult(memory=memory, score=1.0)]
            # If not found by ID, fall through to regular search

        # For cross-repo or project search, don't filter by namespace
        effective_namespace = (
            None if (cross_repo or project) else (namespace_id or self.namespace_id)
        )

        # Determine fetch limit (over-fetch for post-filtering)
        fetch_limit = limit * 2 if (source_tool or source_repo or project) else limit

        # Execute search based on mode
        if mode == "semantic":
            results = self.rag.search(
                query=query,
                limit=fetch_limit,
                type=type,
                tags=tags,
                namespace_id=effective_namespace,
            )
        elif mode == "keyword":
            results = self._fts.search(
                query=query,
                limit=fetch_limit,
                type=type,
                tags=tags,
                namespace_id=effective_namespace,
            )
        elif mode == "smart":
            results = self._hybrid.smart_search(
                query=query,
                limit=fetch_limit,
                type=type,
                tags=tags,
                namespace_id=effective_namespace,
            )
        else:  # Default: hybrid
            results = self._hybrid.search(
                query=query,
                limit=fetch_limit,
                type=type,
                tags=tags,
                namespace_id=effective_namespace,
            )

        # Post-filter by source_tool, source_repo, and project if specified
        if source_tool or source_repo or project:
            filtered = []
            for r in results:
                if source_tool and r.memory.source_tool != source_tool:
                    continue
                if source_repo and r.memory.source_repo != source_repo:
                    continue
                if project and r.memory.project != project:
                    continue
                filtered.append(r)
            results = filtered[:limit]

        return results

    def search_global(
        self,
        query: str,
        limit: int = 10,
        type: MemoryType | None = None,
        source_tool: str | None = None,
        source_repo: str | None = None,
    ) -> list[SearchResult]:
        """
        Search memories across all repos and namespaces.

        Args:
            query: Search query
            limit: Maximum results
            type: Filter by type
            source_tool: Filter by source tool
            source_repo: Filter by source repository

        Returns:
            List of SearchResult objects from all repos
        """
        return self.search(
            query=query,
            limit=limit,
            type=type,
            source_tool=source_tool,
            source_repo=source_repo,
            cross_repo=True,
        )

    def list_repos(self) -> list[dict]:
        """
        List all repositories with memories.

        Returns:
            List of dicts with repo info (name, namespace_id, memory_count)
        """
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        cursor.execute("""
            SELECT DISTINCT source_repo, namespace_id, COUNT(*) as count
            FROM memories
            WHERE source_repo IS NOT NULL
            GROUP BY source_repo, namespace_id
            ORDER BY count DESC
        """)

        repos = []
        for row in cursor.fetchall():
            repos.append(
                {
                    "source_repo": row[0],
                    "namespace_id": row[1],
                    "memory_count": row[2],
                }
            )

        conn.close()
        return repos

    def list_tools(self) -> list[dict]:
        """
        List all source tools with memories.

        Returns:
            List of dicts with tool info (name, memory_count)
        """
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        cursor.execute("""
            SELECT DISTINCT source_tool, COUNT(*) as count
            FROM memories
            WHERE source_tool IS NOT NULL
            GROUP BY source_tool
            ORDER BY count DESC
        """)

        tools = []
        for row in cursor.fetchall():
            tools.append(
                {
                    "source_tool": row[0],
                    "memory_count": row[1],
                }
            )

        conn.close()
        return tools

    def list_projects(self) -> list[dict]:
        """
        List all projects with memories.

        Returns:
            List of dicts with project info (name, repos, memory_count)
        """
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        cursor.execute("""
            SELECT project, GROUP_CONCAT(DISTINCT source_repo) as repos, COUNT(*) as count
            FROM memories
            WHERE project IS NOT NULL
            GROUP BY project
            ORDER BY count DESC
        """)

        projects = []
        for row in cursor.fetchall():
            projects.append(
                {
                    "project": row[0],
                    "repos": row[1].split(",") if row[1] else [],
                    "memory_count": row[2],
                }
            )

        conn.close()
        return projects

    def search_project(
        self,
        project: str,
        query: str | None = None,
        limit: int = 10,
        type: MemoryType | None = None,
    ) -> list[SearchResult]:
        """
        Search memories within a project (across all repos in the project).

        Args:
            project: Project name
            query: Optional search query (if None, returns recent memories)
            limit: Maximum results
            type: Filter by type

        Returns:
            List of SearchResult objects
        """
        if query:
            return self.search(
                query=query,
                limit=limit,
                type=type,
                project=project,
                cross_repo=True,
            )
        else:
            # Return recent memories for project
            conn = sqlite3.connect(self._db_path)
            cursor = conn.cursor()

            sql = "SELECT * FROM memories WHERE project = ? AND deleted_at IS NULL"
            params = [project]

            if type:
                sql += " AND type = ?"
                params.append(type.value)

            sql += f" ORDER BY created_at DESC LIMIT {limit}"

            cursor.execute(sql, params)
            rows = cursor.fetchall()
            conn.close()

            return [SearchResult(memory=self._row_to_memory(row), score=1.0) for row in rows]

    def _fts_search(
        self,
        query: str,
        limit: int,
        type: MemoryType | None,
        tags: list[str] | None,
        namespace_id: str | None,
    ) -> list[SearchResult]:
        """Full-text search fallback."""
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        sql = """
            SELECT m.* FROM memories m
            JOIN memories_fts fts ON m.id = fts.id
            WHERE memories_fts MATCH ? AND m.deleted_at IS NULL
        """
        params = [query]

        if namespace_id:
            sql += " AND m.namespace_id = ?"
            params.append(namespace_id)

        if type:
            sql += " AND m.type = ?"
            params.append(type.value)

        sql += f" LIMIT {limit}"

        cursor.execute(sql, params)
        rows = cursor.fetchall()
        conn.close()

        results = []
        for row in rows:
            memory = self._row_to_memory(row)
            results.append(SearchResult(memory=memory, score=0.8))

        return results

    def recall(self, memory_id: str) -> Memory | None:
        """
        Recall a specific memory by ID.

        Checks SQLite first, then falls back to ChromaDB for indexed memories.

        Args:
            memory_id: Memory ID (can be partial, at least 8 chars)

        Returns:
            Memory or None
        """
        # Use StorageRouter for unified recall (SQLite + ChromaDB fallback)
        return self.storage.recall(memory_id)

    def list_recent(
        self,
        limit: int = 10,
        type: MemoryType | None = None,
        namespace_id: str | None = None,
        source_tool: str | None = None,
        project: str | None = None,
    ) -> list[Memory]:
        """List recent memories."""
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        sql = "SELECT * FROM memories WHERE deleted_at IS NULL"
        params: list = []

        if namespace_id:
            sql += " AND namespace_id = ?"
            params.append(namespace_id)

        if type:
            sql += " AND type = ?"
            params.append(type.value)

        if source_tool:
            sql += " AND source_tool = ?"
            params.append(source_tool)

        if project:
            sql += " AND project = ?"
            params.append(project)

        sql += f" ORDER BY created_at DESC LIMIT {limit}"

        cursor.execute(sql, params)
        rows = cursor.fetchall()
        conn.close()

        return [self._row_to_memory(row) for row in rows]

    def delete(self, memory_id: str, hard_delete: bool = False) -> bool:
        """Soft-delete a memory (sets deleted_at timestamp).

        Args:
            memory_id: ID of memory to delete (supports partial matching)
            hard_delete: If True, permanently remove instead of soft-delete

        Returns:
            True if memory was deleted, False if not found
        """
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        # Support partial ID matching
        cursor.execute("SELECT id FROM memories WHERE id LIKE ?", (f"{memory_id}%",))
        row = cursor.fetchone()
        if not row:
            conn.close()
            return False

        full_id = row[0]

        if hard_delete:
            # Permanently delete memory
            cursor.execute("DELETE FROM memories WHERE id = ?", (full_id,))
            deleted = cursor.rowcount > 0
        else:
            # Soft delete - set deleted_at timestamp for sync propagation
            now = datetime.now(timezone.utc).isoformat()
            cursor.execute(
                "UPDATE memories SET deleted_at = ?, updated_at = ? WHERE id = ? AND deleted_at IS NULL",
                (now, now, full_id),
            )
            deleted = cursor.rowcount > 0

        conn.commit()
        conn.close()

        if deleted:
            # Clean up edges after releasing the connection to avoid "database is locked"
            if hard_delete:
                self._storage._delete_edges_for_memory(full_id)
            else:
                self._storage._soft_delete_edges_for_memory(full_id)

            self.rag.remove_memory(full_id)

        return deleted

    def update(
        self,
        memory_id: str,
        content: str | None = None,
        type: MemoryType | None = None,
        tags: list[str] | None = None,
        summary: str | None = None,
        project: str | None = None,
        metadata: dict | None = None,
        authoritative: bool | None = None,
    ) -> Memory | None:
        """
        Update an existing memory.

        Args:
            memory_id: Memory ID (can be partial, at least 8 chars)
            content: New content (optional)
            type: New type (optional)
            tags: New tags (optional)
            summary: New summary (optional)
            project: New project (optional)
            metadata: New metadata (optional)
            authoritative: New authoritative flag (optional)

        Returns:
            Updated Memory or None if not found
        """
        # First, recall the existing memory
        memory = self.recall(memory_id)
        if not memory:
            return None

        # Update fields if provided
        if content is not None:
            memory.content = content
        if type is not None:
            memory.type = type
        if tags is not None:
            memory.tags = tags
        if summary is not None:
            memory.summary = summary
        if project is not None:
            memory.project = project
        if metadata is not None:
            memory.metadata = metadata
        if authoritative is not None:
            memory.authoritative = authoritative

        memory.updated_at = datetime.now(timezone.utc)

        # Update in database
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        cursor.execute(
            """
            UPDATE memories SET
                content = ?,
                type = ?,
                tags = ?,
                summary = ?,
                project = ?,
                updated_at = ?,
                metadata = ?,
                authoritative = ?
            WHERE id = ?
        """,
            (
                memory.content,
                memory.type.value,
                json.dumps(memory.tags),
                memory.summary,
                memory.project,
                memory.updated_at.isoformat(),
                json.dumps(memory.metadata),
                1 if memory.authoritative else 0,
                memory.id,
            ),
        )

        # Update FTS
        cursor.execute("DELETE FROM memories_fts WHERE id = ?", (memory.id,))
        cursor.execute(
            """
            INSERT INTO memories_fts (id, content, summary, tags)
            VALUES (?, ?, ?, ?)
        """,
            (memory.id, memory.content, memory.summary, " ".join(memory.tags)),
        )

        conn.commit()
        conn.close()

        # Update RAG index
        self.rag.remove_memory(memory.id)
        self.rag.add_memory(memory)

        return memory

    def _row_to_memory(self, row) -> Memory:
        """Convert database row to Memory object."""
        # DB schema (after migration 002):
        # id, content, type, tags, summary, namespace_id, source_file,
        # source_repo, source_tool, project, session_id, created_at,
        # updated_at, metadata
        return Memory(
            id=row[0],
            content=row[1],
            type=MemoryType(row[2]),
            tags=json.loads(row[3]) if row[3] else [],
            summary=row[4],
            namespace_id=row[5],
            source_file=row[6],
            source_repo=row[7],
            source_tool=row[8],
            project=row[9],
            session_id=row[10],
            created_at=datetime.fromisoformat(row[11]),
            updated_at=datetime.fromisoformat(row[12]),
            metadata=json.loads(row[13]) if row[13] else {},
        )

    # ==================== Memory Lineage Operations (CORE FEATURE) ====================

    def evolve(
        self,
        memory_id: str,
        new_content: str,
        summary: str | None = None,
        preserve_tags: bool | None = None,
        additional_tags: list[str] | None = None,
    ) -> Memory:
        """
        Evolve a memory by creating an updated version while preserving history.

        The original memory remains unchanged. A new memory is created with
        an EVOLVED_FROM relationship to the original. This is a CORE FEATURE
        that tracks memory changes over time.

        Args:
            memory_id: ID of memory to evolve
            new_content: Updated content for new memory
            summary: Optional new summary
            preserve_tags: Whether to copy tags (default from config)
            additional_tags: Additional tags for new memory

        Returns:
            New evolved Memory object

        Example:
            >>> mem = ctx.save("Initial documentation")
            >>> evolved = ctx.evolve(mem.id, "Updated documentation with examples")
            >>> # Original still exists, evolved has EVOLVED_FROM relationship
        """
        if preserve_tags is None:
            preserve_tags = self.config.lineage_preserve_tags

        return self._lineage.evolve(
            memory_id=memory_id,
            new_content=new_content,
            summary=summary,
            preserve_tags=preserve_tags,
            additional_tags=additional_tags,
        )

    def merge(
        self,
        memory_ids: list[str],
        merged_content: str | None = None,
        summary: str | None = None,
        strategy: str | MergeStrategy | None = None,
        memory_type: MemoryType | None = None,
    ) -> Memory:
        """
        Merge multiple memories into a single memory.

        Creates a new memory with MERGED_FROM relationships to all originals.
        Original memories are not modified. This is a CORE FEATURE for
        consolidating related information.

        Args:
            memory_ids: List of memory IDs to merge (minimum 2)
            merged_content: Content for merged memory (auto-generated if None)
            summary: Summary for merged memory
            strategy: Merge strategy (union, intersection, latest, oldest)
            memory_type: Type for merged memory

        Returns:
            New merged Memory object

        Example:
            >>> m1 = ctx.save("Auth uses JWT")
            >>> m2 = ctx.save("Auth requires 2FA")
            >>> merged = ctx.merge([m1.id, m2.id], summary="Auth documentation")
        """
        # Convert string strategy to enum
        if strategy is None:
            strategy = MergeStrategy(self.config.lineage_merge_strategy.value)
        elif isinstance(strategy, str):
            strategy = MergeStrategy(strategy)

        return self._lineage.merge(
            memory_ids=memory_ids,
            merged_content=merged_content,
            summary=summary,
            strategy=strategy,
            memory_type=memory_type,
        )

    def split(
        self,
        memory_id: str,
        parts: list[str],
        summaries: list[str] | None = None,
        preserve_tags: bool | None = None,
    ) -> list[Memory]:
        """
        Split a memory into multiple parts.

        Creates new memories with SPLIT_FROM relationships to the original.
        Original memory is not modified. This is a CORE FEATURE for
        breaking down complex information.

        Args:
            memory_id: ID of memory to split
            parts: List of content strings for each part (minimum 2)
            summaries: Optional summaries for each part
            preserve_tags: Whether to copy tags from original

        Returns:
            List of new Memory objects

        Example:
            >>> mem = ctx.save("Auth: JWT tokens. Sessions expire in 1h. 2FA required.")
            >>> parts = ctx.split(mem.id, [
            ...     "Auth uses JWT tokens",
            ...     "Sessions expire in 1 hour",
            ...     "2FA is required",
            ... ])
        """
        if preserve_tags is None:
            preserve_tags = self.config.lineage_preserve_tags

        return self._lineage.split(
            memory_id=memory_id,
            parts=parts,
            summaries=summaries,
            preserve_tags=preserve_tags,
        )

    def get_lineage(
        self,
        memory_id: str,
        direction: str = "both",
    ) -> dict[str, Any]:
        """
        Get the evolution lineage of a memory.

        Traces EVOLVED_FROM, MERGED_FROM, SPLIT_FROM relationships to
        find ancestors and descendants. This is a CORE FEATURE for
        understanding memory history.

        Args:
            memory_id: Memory ID to trace
            direction: "ancestors", "descendants", or "both"

        Returns:
            Dict with:
                - root: ID of original ancestor
                - memory: Current memory object
                - ancestors: List of ancestor memories with depths
                - descendants: List of descendant memories with depths
                - timeline: Chronologically ordered history

        Example:
            >>> lineage = ctx.get_lineage("abc123")
            >>> print(f"Root: {lineage['root']}")
            >>> for a in lineage['ancestors']:
            ...     print(f"  <- {a['memory_id']} ({a['relation']})")
        """
        return self._lineage.get_history(memory_id)

    def get_authoritative(self, memory_id: str) -> Memory | None:
        """
        Find the authoritative memory in a lineage chain.

        Traverses the lineage of the given memory to find the one marked
        as authoritative. If no memory is marked authoritative, returns None.

        Args:
            memory_id: Any memory ID in the lineage chain

        Returns:
            The authoritative Memory object, or None if no authoritative version exists

        Example:
            >>> auth = ctx.get_authoritative("abc123")
            >>> if auth:
            ...     print(f"Authoritative: {auth.id}")
        """
        # Get the full lineage
        lineage = self.get_lineage(memory_id)
        if not lineage:
            return None

        # Check current memory
        memory = lineage.get("memory")
        if memory and memory.authoritative:
            return memory

        # Check ancestors
        for ancestor in lineage.get("ancestors", []):
            ancestor_id = ancestor.get("memory_id") or ancestor.get("id")
            if ancestor_id:
                ancestor_mem = self.recall(ancestor_id)
                if ancestor_mem and ancestor_mem.authoritative:
                    return ancestor_mem

        # Check descendants
        for descendant in lineage.get("descendants", []):
            desc_id = descendant.get("memory_id") or descendant.get("id")
            if desc_id:
                desc_mem = self.recall(desc_id)
                if desc_mem and desc_mem.authoritative:
                    return desc_mem

        return None

    def set_authoritative(
        self,
        memory_id: str,
        exclusive: bool = True,
    ) -> Memory | None:
        """
        Mark a memory as the authoritative version in its lineage.

        Args:
            memory_id: Memory ID to mark as authoritative
            exclusive: If True, unmarks all other memories in the lineage chain

        Returns:
            Updated Memory object, or None if memory not found

        Example:
            >>> auth = ctx.set_authoritative("abc123")
            >>> print(f"{auth.id} is now authoritative")
        """
        memory = self.recall(memory_id)
        if not memory:
            return None

        # If exclusive, unmark other authoritative memories in lineage
        if exclusive:
            lineage = self.get_lineage(memory_id)
            if lineage:
                # Unmark ancestors
                for ancestor in lineage.get("ancestors", []):
                    ancestor_id = ancestor.get("memory_id") or ancestor.get("id")
                    if ancestor_id and ancestor_id != memory_id:
                        ancestor_mem = self.recall(ancestor_id)
                        if ancestor_mem and ancestor_mem.authoritative:
                            self._unset_authoritative(ancestor_id)

                # Unmark descendants
                for descendant in lineage.get("descendants", []):
                    desc_id = descendant.get("memory_id") or descendant.get("id")
                    if desc_id and desc_id != memory_id:
                        desc_mem = self.recall(desc_id)
                        if desc_mem and desc_mem.authoritative:
                            self._unset_authoritative(desc_id)

        # Mark the target memory as authoritative
        return self.update(memory_id=memory_id, authoritative=True)

    def _unset_authoritative(self, memory_id: str) -> None:
        """Unmark a memory as authoritative (internal helper)."""
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()
        cursor.execute(
            "UPDATE memories SET authoritative = 0 WHERE id = ?",
            (memory_id,),
        )
        conn.commit()
        conn.close()

    def search_authoritative(
        self,
        query: str,
        limit: int = 10,
        **kwargs: Any,
    ) -> list[SearchResult]:
        """
        Search only authoritative memories.

        Args:
            query: Search query
            limit: Maximum results
            **kwargs: Additional search filters

        Returns:
            List of SearchResult containing only authoritative memories
        """
        # Get more results than needed, then filter to authoritative
        results = self.search(query, limit=limit * 3, **kwargs)
        authoritative_results = [r for r in results if r.memory.authoritative]
        return authoritative_results[:limit]

    def link(
        self,
        from_memory_id: str,
        to_memory_id: str,
        relation: str | EdgeRelation = EdgeRelation.REFERENCES,
        weight: float = 1.0,
        bidirectional: bool = False,
    ) -> bool:
        """
        Create a relationship link between two memories.

        Args:
            from_memory_id: Source memory ID
            to_memory_id: Target memory ID
            relation: Type of relationship (default: REFERENCES)
            weight: Relationship strength (0.0-1.0)
            bidirectional: Whether to create inverse edge

        Returns:
            True if link created successfully

        Example:
            >>> ctx.link("mem1", "mem2", relation="references")
            >>> ctx.link("auth_doc", "login_doc", relation="related_to", bidirectional=True)
        """
        if isinstance(relation, str):
            relation = EdgeRelation(relation)

        # Resolve partial IDs
        from_mem = self._storage.recall(from_memory_id)
        to_mem = self._storage.recall(to_memory_id)

        if not from_mem or not to_mem:
            return False

        # Use storage router directly (has SQLite fallback)
        # validate=False because we already confirmed both memories exist via recall()
        edge = self._storage.add_edge(
            from_id=from_mem.id,
            to_id=to_mem.id,
            relation=relation,
            weight=weight,
            validate=False,
        )

        # Create bidirectional edge if requested
        if bidirectional and edge:
            inverse_relation = self._get_inverse_relation(relation)
            self._storage.add_edge(
                from_id=to_mem.id,
                to_id=from_mem.id,
                relation=inverse_relation,
                weight=weight,
                validate=False,
            )

        return edge is not None

    def _get_inverse_relation(self, relation: EdgeRelation) -> EdgeRelation:
        """Get inverse relation for bidirectional links."""
        return EdgeRelation.get_inverse(relation)

    def get_related(
        self,
        memory_id: str,
        relation: str | EdgeRelation | None = None,
        max_depth: int = 1,
    ) -> list[dict[str, Any]]:
        """
        Find memories related to a given memory.

        Uses graph traversal to find connected memories.

        Args:
            memory_id: Starting memory ID
            relation: Filter by relation type (None = all)
            max_depth: Maximum traversal depth

        Returns:
            List of related memories with relationship info

        Example:
            >>> related = ctx.get_related("auth_doc", max_depth=2)
            >>> for r in related:
            ...     print(f"{r['memory'].id}: {r['relation']} (depth {r['depth']})")
        """
        if isinstance(relation, str):
            relation = EdgeRelation(relation)

        # Resolve partial ID
        mem = self._storage.recall(memory_id)
        if not mem:
            return []

        # Use storage router directly (has SQLite fallback)
        results = self._storage.get_related(
            memory_id=mem.id,
            relation=relation,
            max_depth=max_depth,
        )

        # Convert GraphTraversalResult to dict format
        return [
            {
                "id": r.memory.id,
                "memory": r.memory,
                "relation": r.relation.value,
                "depth": r.depth,
                "content": r.memory.content,
                "summary": r.memory.summary,
            }
            for r in results
        ]

    def has_graph(self) -> bool:
        """Check if graph backend is available for advanced lineage operations."""
        return self._graph is not None or self._storage.has_graph()

    # ==================== Auto-Linking ====================

    def _auto_link_references(self, memory: Memory) -> list[dict[str, Any]]:
        """
        Automatically detect and create links from a saved memory.

        Uses semantic similarity to find related memories and creates
        RELATED_TO links automatically. Also detects explicit memory ID
        references in content.

        Args:
            memory: The newly saved memory to auto-link

        Returns:
            List of created links with id, relation, and method
        """
        import re

        if not self.config.auto_link_enabled:
            return []

        linked: list[dict[str, Any]] = []
        linked_ids: set[str] = set()

        # 1. Semantic similarity search (primary method)
        try:
            # Search for similar memories using content
            search_text = memory.summary or memory.content[:500]
            results = self.search(
                search_text,
                limit=self.config.auto_link_max + 2,  # Extra to filter self
                cross_repo=False,  # Stay within same namespace
            )

            for r in results:
                # Skip self
                if r.memory.id == memory.id:
                    continue
                # Check threshold
                if r.score < self.config.auto_link_threshold:
                    continue
                # Limit links
                if len(linked) >= self.config.auto_link_max:
                    break

                # Create link
                self.link(
                    from_memory_id=memory.id,
                    to_memory_id=r.memory.id,
                    relation=EdgeRelation.RELATED_TO,
                )
                linked.append(
                    {
                        "id": r.memory.id,
                        "relation": "related_to",
                        "score": r.score,
                        "method": "semantic",
                    }
                )
                linked_ids.add(r.memory.id)

        except Exception as e:
            logger.debug(f"Semantic auto-link failed: {e}")

        # 2. Explicit memory ID detection (secondary method)
        id_pattern = r"\b([a-f0-9]{8,})\b"
        matches = re.findall(id_pattern, memory.content.lower())

        for potential_id in set(matches):
            # Skip self-reference
            if memory.id.lower().startswith(potential_id):
                continue
            # Skip already linked
            if any(lid.lower().startswith(potential_id) for lid in linked_ids):
                continue

            # Verify memory exists
            target = self.recall(potential_id)
            if target and target.id not in linked_ids:
                # Detect relation type from context
                relation = self._detect_relation_type(memory.content, potential_id)
                self.link(
                    from_memory_id=memory.id,
                    to_memory_id=target.id,
                    relation=relation,
                )
                linked.append(
                    {
                        "id": target.id,
                        "relation": relation.value,
                        "method": "id_reference",
                    }
                )
                linked_ids.add(target.id)

        return linked

    def _detect_relation_type(self, content: str, memory_id: str) -> EdgeRelation:
        """
        Detect relation type from keywords near a memory ID reference.

        Args:
            content: Full content text
            memory_id: The memory ID found in content

        Returns:
            Appropriate EdgeRelation based on surrounding context
        """
        content_lower = content.lower()
        idx = content_lower.find(memory_id[:8].lower())
        if idx == -1:
            return EdgeRelation.REFERENCES

        # Get context before the memory ID (50 chars)
        context = content_lower[max(0, idx - 50) : idx]

        # Keyword to relation mapping
        keyword_relations = {
            ("fix", "fixed", "fixes", "resolved", "resolves"): EdgeRelation.SUPERSEDES,
            ("supersede", "supersedes", "update", "updates", "replace"): EdgeRelation.SUPERSEDES,
            ("related", "see also", "similar", "like"): EdgeRelation.RELATED_TO,
            ("depend", "depends", "requires", "needs", "require"): EdgeRelation.DEPENDS_ON,
            ("contradict", "conflicts", "conflict", "disagree"): EdgeRelation.CONTRADICTS,
            ("implement", "implements", "implementation"): EdgeRelation.IMPLEMENTS,
            ("part of", "belongs to", "component"): EdgeRelation.PART_OF,
            ("caused by", "because of", "due to"): EdgeRelation.CAUSED_BY,
        }

        for keywords, relation in keyword_relations.items():
            if any(kw in context for kw in keywords):
                return relation

        return EdgeRelation.REFERENCES

    # ==================== Session Operations ====================

    def _get_device_name(self) -> str:
        """Get the device name (hostname)."""
        import socket

        try:
            return socket.gethostname()
        except Exception:
            return "unknown"

    def start_session(
        self,
        tool: str = "contextfs",
        label: str | None = None,
        repo_path: str | None = None,
        branch: str | None = None,
    ) -> Session:
        """Start a new session."""
        # End current session if exists
        if self._current_session:
            self.end_session()

        session = Session(
            tool=tool,
            label=label,
            namespace_id=self.namespace_id,
            repo_path=repo_path or str(Path.cwd()),
            branch=branch or self._get_current_branch(),
            device_name=self._get_device_name(),
        )

        # Save to database
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        cursor.execute(
            """
            INSERT INTO sessions (id, label, namespace_id, tool, repo_path, branch,
                                  started_at, ended_at, summary, metadata,
                                  device_name, memories_created)
            VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
        """,
            (
                session.id,
                session.label,
                session.namespace_id,
                session.tool,
                session.repo_path,
                session.branch,
                session.started_at.isoformat(),
                None,
                None,
                json.dumps(session.metadata),
                session.device_name,
                json.dumps(session.memories_created),
            ),
        )

        conn.commit()
        conn.close()

        self._current_session = session
        return session

    def end_session(self, generate_summary: bool = True) -> None:
        """End the current session."""
        if not self._current_session:
            return

        self._current_session.end()

        # Update in database
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        cursor.execute(
            """
            UPDATE sessions SET ended_at = ?, summary = ?, memories_created = ?
            WHERE id = ?
        """,
            (
                self._current_session.ended_at.isoformat(),
                self._current_session.summary,
                json.dumps(self._current_session.memories_created),
                self._current_session.id,
            ),
        )

        conn.commit()
        conn.close()

        # Save session as episodic memory
        if generate_summary and self._current_session.messages:
            self.save(
                content=self._format_session_summary(),
                type=MemoryType.EPISODIC,
                tags=["session", self._current_session.tool],
                summary=f"Session {self._current_session.id[:8]}",
                metadata={"session_id": self._current_session.id},
            )

        self._current_session = None

    def add_message(self, role: str, content: str) -> SessionMessage:
        """Add a message to current session."""
        if not self._current_session:
            self.start_session()

        msg = self._current_session.add_message(role, content)

        # Save to database
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        cursor.execute(
            """
            INSERT INTO messages (id, session_id, role, content, timestamp, metadata)
            VALUES (?, ?, ?, ?, ?, ?)
        """,
            (
                msg.id,
                self._current_session.id,
                msg.role,
                msg.content,
                msg.timestamp.isoformat(),
                json.dumps(msg.metadata),
            ),
        )

        conn.commit()
        conn.close()

        return msg

    def load_session(
        self,
        session_id: str | None = None,
        label: str | None = None,
    ) -> Session | None:
        """Load a session by ID or label."""
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        columns = """id, label, namespace_id, tool, repo_path, branch, started_at, ended_at,
                     summary, metadata, device_name, memories_created"""

        if session_id:
            cursor.execute(f"SELECT {columns} FROM sessions WHERE id LIKE ?", (f"{session_id}%",))
        elif label:
            cursor.execute(f"SELECT {columns} FROM sessions WHERE label = ?", (label,))
        else:
            return None

        row = cursor.fetchone()
        if not row:
            conn.close()
            return None

        session = Session(
            id=row[0],
            label=row[1],
            namespace_id=row[2],
            tool=row[3],
            repo_path=row[4],
            branch=row[5],
            started_at=datetime.fromisoformat(row[6]),
            ended_at=datetime.fromisoformat(row[7]) if row[7] else None,
            summary=row[8],
            metadata=json.loads(row[9]) if row[9] else {},
            device_name=row[10],
            memories_created=json.loads(row[11]) if row[11] else [],
        )

        # Load messages
        cursor.execute(
            "SELECT * FROM messages WHERE session_id = ? ORDER BY timestamp", (session.id,)
        )
        for msg_row in cursor.fetchall():
            session.messages.append(
                SessionMessage(
                    id=msg_row[0],
                    role=msg_row[2],
                    content=msg_row[3],
                    timestamp=datetime.fromisoformat(msg_row[4]),
                    metadata=json.loads(msg_row[5]) if msg_row[5] else {},
                )
            )

        conn.close()
        return session

    def list_sessions(
        self,
        limit: int = 10,
        offset: int = 0,
        tool: str | None = None,
        label: str | None = None,
        all_namespaces: bool = False,
    ) -> list[Session]:
        """List recent sessions."""
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        columns = """id, label, namespace_id, tool, repo_path, branch, started_at, ended_at,
                     summary, metadata, device_name, memories_created"""

        if all_namespaces:
            sql = f"SELECT {columns} FROM sessions WHERE 1=1"
            params: list = []
        else:
            sql = f"SELECT {columns} FROM sessions WHERE namespace_id = ?"
            params = [self.namespace_id]

        if tool:
            sql += " AND tool = ?"
            params.append(tool)

        if label:
            sql += " AND label LIKE ?"
            params.append(f"%{label}%")

        sql += f" ORDER BY started_at DESC LIMIT {limit} OFFSET {offset}"

        cursor.execute(sql, params)
        rows = cursor.fetchall()
        conn.close()

        sessions = []
        for row in rows:
            sessions.append(
                Session(
                    id=row[0],
                    label=row[1],
                    namespace_id=row[2],
                    tool=row[3],
                    repo_path=row[4],
                    branch=row[5],
                    started_at=datetime.fromisoformat(row[6]),
                    ended_at=datetime.fromisoformat(row[7]) if row[7] else None,
                    summary=row[8],
                    metadata=json.loads(row[9]) if row[9] else {},
                    device_name=row[10],
                    memories_created=json.loads(row[11]) if row[11] else [],
                )
            )

        return sessions

    def update_session(
        self,
        session_id: str,
        label: str | None = None,
        summary: str | None = None,
    ) -> Session | None:
        """
        Update an existing session.

        Args:
            session_id: Session ID (can be partial)
            label: New label (optional)
            summary: New summary (optional)

        Returns:
            Updated Session or None if not found
        """
        session = self.load_session(session_id=session_id)
        if not session:
            return None

        # Update fields if provided
        if label is not None:
            session.label = label
        if summary is not None:
            session.summary = summary

        # Update in database
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        cursor.execute(
            """
            UPDATE sessions SET label = ?, summary = ?
            WHERE id = ?
        """,
            (session.label, session.summary, session.id),
        )

        conn.commit()
        conn.close()

        return session

    def delete_session(self, session_id: str) -> bool:
        """
        Delete a session and its messages.

        Args:
            session_id: Session ID (can be partial)

        Returns:
            True if deleted, False if not found
        """
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        # Support partial ID matching
        cursor.execute("SELECT id FROM sessions WHERE id LIKE ?", (f"{session_id}%",))
        row = cursor.fetchone()
        if not row:
            conn.close()
            return False

        full_id = row[0]

        # Delete messages first
        cursor.execute("DELETE FROM messages WHERE session_id = ?", (full_id,))

        # Delete session
        cursor.execute("DELETE FROM sessions WHERE id = ?", (full_id,))
        deleted = cursor.rowcount > 0

        conn.commit()
        conn.close()

        return deleted

    def _format_session_summary(self) -> str:
        """Format session messages for episodic memory."""
        if not self._current_session:
            return ""

        lines = [f"Session with {self._current_session.tool}"]
        for msg in self._current_session.messages[-10:]:  # Last 10 messages
            lines.append(f"{msg.role}: {msg.content[:200]}...")

        return "\n".join(lines)

    def _get_current_branch(self) -> str | None:
        """Get current git branch."""
        try:
            head_path = Path.cwd() / ".git" / "HEAD"
            if head_path.exists():
                content = head_path.read_text().strip()
                if content.startswith("ref: refs/heads/"):
                    return content[16:]
        except Exception:
            pass
        return None

    # ==================== Context Helpers ====================

    def get_context_for_task(self, task: str, limit: int = 5) -> list[str]:
        """Get relevant context strings for a task."""
        results = self.search(task, limit=limit)
        return [r.memory.to_context_string() for r in results]

    def get_current_session(self) -> Session | None:
        """Get current active session."""
        return self._current_session

    # ==================== Cleanup ====================

    def reset_chromadb(self) -> bool:
        """
        Reset the ChromaDB database.

        Use this when ChromaDB becomes corrupted (e.g., after version upgrades).
        This will delete all vector embeddings but SQLite data remains intact.
        After reset, you should re-index to rebuild the ChromaDB database.

        Returns:
            True if reset successful, False otherwise
        """
        return self.rag.reset_database()

    def rebuild_chromadb(
        self,
        on_progress: callable = None,
    ) -> dict:
        """
        Rebuild ChromaDB from SQLite data.

        Use this to restore search capability after ChromaDB corruption
        without needing to re-index from source files.

        This is MUCH faster than re-indexing because:
        - No file scanning needed
        - No file content processing
        - Memories already exist in SQLite

        Args:
            on_progress: Callback for progress updates (current, total)

        Returns:
            Statistics dict with count of memories rebuilt
        """
        return self.storage.rebuild_chromadb_from_sqlite(on_progress=on_progress)

    def reindex_all_repos(
        self,
        incremental: bool = True,
        mode: str = "all",
        on_progress: Callable[[str, int, int], None] | None = None,
    ) -> dict:
        """
        Reindex all repositories that have been previously indexed.

        Uses stored repo paths from index_status table to reindex.
        Useful for rebuilding indexes after ChromaDB corruption or upgrades.

        Args:
            incremental: Only index new/changed files (default: True)
            mode: "all", "files_only", or "commits_only"
            on_progress: Callback (repo_name, current_repo, total_repos)

        Returns:
            Statistics dict with repos processed, files indexed, etc.
        """
        # Get repo paths from index_status table
        conn = sqlite3.connect(self._db_path)
        cursor = conn.cursor()

        # Check if index_status table exists
        cursor.execute("SELECT name FROM sqlite_master WHERE type='table' AND name='index_status'")
        if not cursor.fetchone():
            conn.close()
            return {
                "success": True,
                "repos_found": 0,
                "repos_indexed": 0,
                "repos_failed": 0,
                "total_files": 0,
                "total_memories": 0,
                "errors": [],
            }

        cursor.execute("""
            SELECT namespace_id, repo_path
            FROM index_status
            WHERE repo_path IS NOT NULL AND repo_path != ''
        """)

        repos = []
        for row in cursor.fetchall():
            repos.append(
                {
                    "namespace_id": row[0],
                    "repo_path": row[1],
                }
            )

        conn.close()

        if not repos:
            return {
                "success": True,
                "repos_found": 0,
                "repos_indexed": 0,
                "repos_failed": 0,
                "total_files": 0,
                "total_memories": 0,
                "errors": [],
            }

        successful = 0
        failed = 0
        total_files = 0
        total_memories = 0
        errors = []

        for i, repo_info in enumerate(repos):
            repo_path = Path(repo_info["repo_path"])
            repo_name = repo_path.name

            if on_progress:
                on_progress(repo_name, i + 1, len(repos))

            # Verify path exists and is a git repo
            if not repo_path.exists():
                errors.append(f"{repo_name}: Path no longer exists: {repo_path}")
                failed += 1
                continue

            if not (repo_path / ".git").exists():
                errors.append(f"{repo_name}: Not a git repository: {repo_path}")
                failed += 1
                continue

            try:
                result = self.index_repository(
                    repo_path=repo_path,
                    incremental=incremental,
                    mode=mode,
                )
                total_files += result.get("files_indexed", 0)
                total_memories += result.get("memories_created", 0)
                successful += 1
            except Exception as e:
                errors.append(f"{repo_name}: {e!s}")
                failed += 1

        return {
            "success": failed == 0,
            "repos_found": len(repos),
            "repos_indexed": successful,
            "repos_failed": failed,
            "total_files": total_files,
            "total_memories": total_memories,
            "errors": errors,
        }

    def close(self) -> None:
        """Clean shutdown."""
        if self._current_session:
            self.end_session()
        if self._fts:
            self._fts.close()
        if self.rag:
            self.rag.close()

    def __enter__(self):
        """Context manager entry."""
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        """Context manager exit - ensure cleanup."""
        self.close()
        return False

`init(data_dir=None, namespace_id=None, auto_load=True, auto_index=True)` ¶

Initialize ContextFS.

Parameters:

Name	Type	Description	Default
`data_dir`	`Path \| None`	Data directory (default: ~/.contextfs)	`None`
`namespace_id`	`str \| None`	Default namespace (default: global or auto-detect from repo)	`None`
`auto_load`	`bool`	Load memories on startup	`True`
`auto_index`	`bool`	Auto-index repository on first memory save	`True`

Source code in src/contextfs/core.py

def __init__(
    self,
    data_dir: Path | None = None,
    namespace_id: str | None = None,
    auto_load: bool = True,
    auto_index: bool = True,
):
    """
    Initialize ContextFS.

    Args:
        data_dir: Data directory (default: ~/.contextfs)
        namespace_id: Default namespace (default: global or auto-detect from repo)
        auto_load: Load memories on startup
        auto_index: Auto-index repository on first memory save
    """
    self.config = get_config()
    self.data_dir = data_dir or self.config.data_dir
    self.data_dir.mkdir(parents=True, exist_ok=True)

    # Auto-detect namespace from current repo
    self._repo_path: Path | None = None
    if namespace_id is None:
        namespace_id, self._repo_path = self._detect_namespace_and_repo()
    self.namespace_id = namespace_id

    # Initialize storage using backend factory
    self._db_path = self.data_dir / self.config.sqlite_filename
    self._init_db()

    # Initialize RAG backend with configurable embedding backend
    # When chroma_host is set, uses HttpClient (server mode) instead of PersistentClient
    # When chroma_auto_server is True, auto-starts server on corruption
    self.rag = RAGBackend(
        data_dir=self.data_dir,
        embedding_model=self.config.embedding_model,
        embedding_backend=self.config.embedding_backend,
        use_gpu=self.config.use_gpu,
        parallel_workers=self.config.embedding_parallel_workers,
        chroma_host=self.config.chroma_host,
        chroma_port=self.config.chroma_port,
        chroma_auto_server=self.config.chroma_auto_server,
    )

    # Initialize FTS and Hybrid search backends
    from contextfs.fts import FTSBackend, HybridSearch

    self._fts = FTSBackend(self._db_path)
    self._hybrid = HybridSearch(fts_backend=self._fts, rag_backend=self.rag)

    # Initialize graph backend if configured
    self._graph = self._init_graph_backend()

    # Initialize unified storage router (keeps all backends in sync)
    self._storage = StorageRouter(
        db_path=self._db_path,
        rag_backend=self.rag,
        graph_backend=self._graph,
    )

    # Alias for backwards compatibility
    self.storage = self._storage

    # Initialize memory lineage (CORE FEATURE)
    self._lineage = MemoryLineage(self._storage, self._graph)

    # Auto-indexing
    self._auto_index = auto_index
    self._auto_indexer = None
    self._indexing_triggered = False

    # Current session
    self._current_session: Session | None = None

    # Auto-load memories
    if auto_load and self.config.auto_load_on_startup:
        self._load_startup_context()

`save(content, type=MemoryType.FACT, tags=None, summary=None, namespace_id=None, source_tool=None, source_repo=None, project=None, metadata=None, created_at=None, updated_at=None, id=None, structured_data=None, authoritative=False)` ¶

Save content to memory.

Parameters:

Name	Type	Description	Default
`content`	`str`	Content to save	required
`type`	`MemoryType`	Memory type	`FACT`
`tags`	`list[str] \| None`	Tags for categorization	`None`
`summary`	`str \| None`	Brief summary	`None`
`namespace_id`	`str \| None`	Namespace (default: current)	`None`
`source_tool`	`str \| None`	Tool that created memory (claude-code, claude-desktop, gemini, etc.)	`None`
`source_repo`	`str \| None`	Repository name/path	`None`
`project`	`str \| None`	Project name for grouping memories across repos	`None`
`metadata`	`dict \| None`	Additional metadata	`None`
`created_at`	`datetime \| None`	Original creation timestamp (for sync, defaults to now)	`None`
`updated_at`	`datetime \| None`	Original update timestamp (for sync, defaults to now)	`None`
`id`	`str \| None`	Memory ID (for sync, auto-generated if not provided)	`None`
`structured_data`	`dict \| None`	Optional structured data validated against TYPE_SCHEMAS	`None`
`authoritative`	`bool`	Whether this is the authoritative/canonical version in a lineage	`False`

Returns:

Type	Description
`Memory`	Saved Memory object

Source code in src/contextfs/core.py

def save(
    self,
    content: str,
    type: MemoryType = MemoryType.FACT,
    tags: list[str] | None = None,
    summary: str | None = None,
    namespace_id: str | None = None,
    source_tool: str | None = None,
    source_repo: str | None = None,
    project: str | None = None,
    metadata: dict | None = None,
    created_at: datetime | None = None,
    updated_at: datetime | None = None,
    id: str | None = None,
    structured_data: dict | None = None,
    authoritative: bool = False,
) -> Memory:
    """
    Save content to memory.

    Args:
        content: Content to save
        type: Memory type
        tags: Tags for categorization
        summary: Brief summary
        namespace_id: Namespace (default: current)
        source_tool: Tool that created memory (claude-code, claude-desktop, gemini, etc.)
        source_repo: Repository name/path
        project: Project name for grouping memories across repos
        metadata: Additional metadata
        created_at: Original creation timestamp (for sync, defaults to now)
        updated_at: Original update timestamp (for sync, defaults to now)
        id: Memory ID (for sync, auto-generated if not provided)
        structured_data: Optional structured data validated against TYPE_SCHEMAS
        authoritative: Whether this is the authoritative/canonical version in a lineage

    Returns:
        Saved Memory object
    """
    # Trigger auto-indexing on first save (indexes codebase to ChromaDB)
    self._maybe_auto_index()

    # Auto-detect source_repo from repo_path
    if source_repo is None and self._repo_path:
        source_repo = self._repo_path.name

    # Auto-set project from source_repo if not provided
    if project is None and source_repo:
        project = source_repo

    # Check for duplicate by content hash (skip if already exists)
    content_hash = hashlib.sha256(content.encode()).hexdigest()[:16]
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()
    cursor.execute(
        "SELECT id FROM memories WHERE content_hash = ? AND namespace_id = ?",
        (content_hash, namespace_id or self.namespace_id),
    )
    existing = cursor.fetchone()
    if existing and id is None:
        # Return existing memory instead of creating duplicate
        conn.close()
        return self.recall(existing[0])  # type: ignore

    memory_kwargs = {
        "content": content,
        "type": type,
        "tags": tags or [],
        "summary": summary,
        "namespace_id": namespace_id or self.namespace_id,
        "source_tool": source_tool,
        "source_repo": source_repo,
        "project": project,
        "session_id": self._current_session.id if self._current_session else None,
        "metadata": metadata or {},
        "created_at": created_at or datetime.now(timezone.utc),
        "updated_at": updated_at or datetime.now(timezone.utc),
        "structured_data": structured_data,
        "authoritative": authoritative,
        "content_hash": content_hash,
    }
    if id is not None:
        memory_kwargs["id"] = id
    memory = Memory(**memory_kwargs)
    conn.close()

    # Save to SQLite
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()

    # Get vector_clock from metadata if available (for sync consistency)
    vector_clock = None
    if memory.metadata and memory.metadata.get("_vector_clock"):
        vector_clock = json.dumps(memory.metadata["_vector_clock"])

    cursor.execute(
        """
        INSERT OR REPLACE INTO memories (id, content, type, tags, summary, namespace_id,
                              source_file, source_repo, source_tool, project, session_id, created_at, updated_at, metadata, structured_data, authoritative, content_hash, vector_clock)
        VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
    """,
        (
            memory.id,
            memory.content,
            memory.type.value,
            json.dumps(memory.tags),
            memory.summary,
            memory.namespace_id,
            memory.source_file,
            memory.source_repo,
            memory.source_tool,
            memory.project,
            memory.session_id,
            memory.created_at.isoformat(),
            memory.updated_at.isoformat(),
            json.dumps(memory.metadata),
            json.dumps(memory.structured_data) if memory.structured_data is not None else None,
            1 if memory.authoritative else 0,
            content_hash,
            vector_clock,
        ),
    )

    # Update session's memories_created list if we have an active session
    if (
        self._current_session
        and memory.session_id
        and memory.id not in self._current_session.memories_created
    ):
        self._current_session.memories_created.append(memory.id)
        # Update session in database
        cursor.execute(
            "UPDATE sessions SET memories_created = ? WHERE id = ?",
            (json.dumps(self._current_session.memories_created), self._current_session.id),
        )

    # Update FTS index
    # For content-linked FTS (content='memories'), we need to use the special rebuild command
    # First try the direct approach, fall back to rebuild if it fails
    try:
        # Get the rowid for this memory
        cursor.execute("SELECT rowid FROM memories WHERE id = ?", (memory.id,))
        row = cursor.fetchone()
        if row:
            rowid = row[0]
            # Delete old FTS entry using the special 'delete' command
            try:
                cursor.execute(
                    "INSERT INTO memories_fts(memories_fts, rowid) VALUES('delete', ?)",
                    (rowid,),
                )
            except sqlite3.OperationalError:
                pass  # May not exist yet
            # Insert new FTS entry
            cursor.execute(
                """
                INSERT INTO memories_fts(rowid, id, content, summary, tags, type, namespace_id, source_repo, source_tool, project)
                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
                """,
                (
                    rowid,
                    memory.id,
                    memory.content,
                    memory.summary,
                    " ".join(memory.tags),
                    memory.type.value if hasattr(memory.type, "value") else memory.type,
                    memory.namespace_id,
                    memory.source_repo,
                    memory.source_tool,
                    memory.project,
                ),
            )
    except sqlite3.DatabaseError:
        # If FTS is corrupted, rebuild it
        try:
            cursor.execute("INSERT INTO memories_fts(memories_fts) VALUES('rebuild')")
        except sqlite3.DatabaseError:
            pass  # FTS rebuild failed, will be handled later

    conn.commit()
    conn.close()

    # Add to RAG index
    self.rag.add_memory(memory)

    # Auto-link to related memories
    self._auto_link_references(memory)

    return memory

`update(memory_id, content=None, type=None, tags=None, summary=None, project=None, metadata=None, authoritative=None)` ¶

Update an existing memory.

Parameters:

Name	Type	Description	Default
`memory_id`	`str`	Memory ID (can be partial, at least 8 chars)	required
`content`	`str \| None`	New content (optional)	`None`
`type`	`MemoryType \| None`	New type (optional)	`None`
`tags`	`list[str] \| None`	New tags (optional)	`None`
`summary`	`str \| None`	New summary (optional)	`None`
`project`	`str \| None`	New project (optional)	`None`
`metadata`	`dict \| None`	New metadata (optional)	`None`
`authoritative`	`bool \| None`	New authoritative flag (optional)	`None`

Returns:

Type	Description
`Memory \| None`	Updated Memory or None if not found

Source code in src/contextfs/core.py

def update(
    self,
    memory_id: str,
    content: str | None = None,
    type: MemoryType | None = None,
    tags: list[str] | None = None,
    summary: str | None = None,
    project: str | None = None,
    metadata: dict | None = None,
    authoritative: bool | None = None,
) -> Memory | None:
    """
    Update an existing memory.

    Args:
        memory_id: Memory ID (can be partial, at least 8 chars)
        content: New content (optional)
        type: New type (optional)
        tags: New tags (optional)
        summary: New summary (optional)
        project: New project (optional)
        metadata: New metadata (optional)
        authoritative: New authoritative flag (optional)

    Returns:
        Updated Memory or None if not found
    """
    # First, recall the existing memory
    memory = self.recall(memory_id)
    if not memory:
        return None

    # Update fields if provided
    if content is not None:
        memory.content = content
    if type is not None:
        memory.type = type
    if tags is not None:
        memory.tags = tags
    if summary is not None:
        memory.summary = summary
    if project is not None:
        memory.project = project
    if metadata is not None:
        memory.metadata = metadata
    if authoritative is not None:
        memory.authoritative = authoritative

    memory.updated_at = datetime.now(timezone.utc)

    # Update in database
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()

    cursor.execute(
        """
        UPDATE memories SET
            content = ?,
            type = ?,
            tags = ?,
            summary = ?,
            project = ?,
            updated_at = ?,
            metadata = ?,
            authoritative = ?
        WHERE id = ?
    """,
        (
            memory.content,
            memory.type.value,
            json.dumps(memory.tags),
            memory.summary,
            memory.project,
            memory.updated_at.isoformat(),
            json.dumps(memory.metadata),
            1 if memory.authoritative else 0,
            memory.id,
        ),
    )

    # Update FTS
    cursor.execute("DELETE FROM memories_fts WHERE id = ?", (memory.id,))
    cursor.execute(
        """
        INSERT INTO memories_fts (id, content, summary, tags)
        VALUES (?, ?, ?, ?)
    """,
        (memory.id, memory.content, memory.summary, " ".join(memory.tags)),
    )

    conn.commit()
    conn.close()

    # Update RAG index
    self.rag.remove_memory(memory.id)
    self.rag.add_memory(memory)

    return memory

`search(query, limit=10, type=None, tags=None, namespace_id=None, source_tool=None, source_repo=None, project=None, cross_repo=False, mode='hybrid', use_semantic=None)` ¶

Search memories.

Parameters:

Name	Type	Description	Default
`query`	`str`	Search query	required
`limit`	`int`	Maximum results	`10`
`type`	`MemoryType \| None`	Filter by type	`None`
`tags`	`list[str] \| None`	Filter by tags	`None`
`namespace_id`	`str \| None`	Filter by namespace (None with cross_repo=True searches all)	`None`
`source_tool`	`str \| None`	Filter by source tool (claude-code, claude-desktop, gemini, etc.)	`None`
`source_repo`	`str \| None`	Filter by source repository name	`None`
`project`	`str \| None`	Filter by project name (groups memories across repos)	`None`
`cross_repo`	`bool`	If True, search across all namespaces/repos	`False`
`mode`	`str`	Search mode - "hybrid" (default), "semantic", "keyword", "smart" - hybrid: Combines FTS + RAG using Reciprocal Rank Fusion - semantic: RAG vector search only (good for conceptual queries) - keyword: FTS5 keyword search only (fast, good for exact terms) - smart: Routes to optimal backend based on memory type	`'hybrid'`
`use_semantic`	`bool \| None`	DEPRECATED - use mode="semantic" or mode="keyword" instead	`None`

Returns:

Type	Description
`list[SearchResult]`	List of SearchResult objects

Source code in src/contextfs/core.py

def search(
    self,
    query: str,
    limit: int = 10,
    type: MemoryType | None = None,
    tags: list[str] | None = None,
    namespace_id: str | None = None,
    source_tool: str | None = None,
    source_repo: str | None = None,
    project: str | None = None,
    cross_repo: bool = False,
    mode: str = "hybrid",
    use_semantic: bool | None = None,  # Deprecated, use mode instead
) -> list[SearchResult]:
    """
    Search memories.

    Args:
        query: Search query
        limit: Maximum results
        type: Filter by type
        tags: Filter by tags
        namespace_id: Filter by namespace (None with cross_repo=True searches all)
        source_tool: Filter by source tool (claude-code, claude-desktop, gemini, etc.)
        source_repo: Filter by source repository name
        project: Filter by project name (groups memories across repos)
        cross_repo: If True, search across all namespaces/repos
        mode: Search mode - "hybrid" (default), "semantic", "keyword", "smart"
              - hybrid: Combines FTS + RAG using Reciprocal Rank Fusion
              - semantic: RAG vector search only (good for conceptual queries)
              - keyword: FTS5 keyword search only (fast, good for exact terms)
              - smart: Routes to optimal backend based on memory type
        use_semantic: DEPRECATED - use mode="semantic" or mode="keyword" instead

    Returns:
        List of SearchResult objects
    """
    import re

    # Handle deprecated use_semantic parameter
    if use_semantic is not None:
        mode = "semantic" if use_semantic else "keyword"

    # Auto-detect memory ID pattern (8+ hex chars)
    # If query looks like a memory ID, use recall() instead of vector search
    if re.match(r"^[a-f0-9]{8,}$", query.lower().strip()):
        memory = self.recall(query.strip())
        if memory:
            # Check type filter if specified
            if type and memory.type != type:
                return []
            return [SearchResult(memory=memory, score=1.0)]
        # If not found by ID, fall through to regular search

    # For cross-repo or project search, don't filter by namespace
    effective_namespace = (
        None if (cross_repo or project) else (namespace_id or self.namespace_id)
    )

    # Determine fetch limit (over-fetch for post-filtering)
    fetch_limit = limit * 2 if (source_tool or source_repo or project) else limit

    # Execute search based on mode
    if mode == "semantic":
        results = self.rag.search(
            query=query,
            limit=fetch_limit,
            type=type,
            tags=tags,
            namespace_id=effective_namespace,
        )
    elif mode == "keyword":
        results = self._fts.search(
            query=query,
            limit=fetch_limit,
            type=type,
            tags=tags,
            namespace_id=effective_namespace,
        )
    elif mode == "smart":
        results = self._hybrid.smart_search(
            query=query,
            limit=fetch_limit,
            type=type,
            tags=tags,
            namespace_id=effective_namespace,
        )
    else:  # Default: hybrid
        results = self._hybrid.search(
            query=query,
            limit=fetch_limit,
            type=type,
            tags=tags,
            namespace_id=effective_namespace,
        )

    # Post-filter by source_tool, source_repo, and project if specified
    if source_tool or source_repo or project:
        filtered = []
        for r in results:
            if source_tool and r.memory.source_tool != source_tool:
                continue
            if source_repo and r.memory.source_repo != source_repo:
                continue
            if project and r.memory.project != project:
                continue
            filtered.append(r)
        results = filtered[:limit]

    return results

`recall(memory_id)` ¶

Recall a specific memory by ID.

Checks SQLite first, then falls back to ChromaDB for indexed memories.

Parameters:

Name	Type	Description	Default
`memory_id`	`str`	Memory ID (can be partial, at least 8 chars)	required

Returns:

Type	Description
`Memory \| None`	Memory or None

Source code in src/contextfs/core.py

def recall(self, memory_id: str) -> Memory | None:
    """
    Recall a specific memory by ID.

    Checks SQLite first, then falls back to ChromaDB for indexed memories.

    Args:
        memory_id: Memory ID (can be partial, at least 8 chars)

    Returns:
        Memory or None
    """
    # Use StorageRouter for unified recall (SQLite + ChromaDB fallback)
    return self.storage.recall(memory_id)

`delete(memory_id, hard_delete=False)` ¶

Soft-delete a memory (sets deleted_at timestamp).

Parameters:

Name	Type	Description	Default
`memory_id`	`str`	ID of memory to delete (supports partial matching)	required
`hard_delete`	`bool`	If True, permanently remove instead of soft-delete	`False`

Returns:

Type	Description
`bool`	True if memory was deleted, False if not found

Source code in src/contextfs/core.py

def delete(self, memory_id: str, hard_delete: bool = False) -> bool:
    """Soft-delete a memory (sets deleted_at timestamp).

    Args:
        memory_id: ID of memory to delete (supports partial matching)
        hard_delete: If True, permanently remove instead of soft-delete

    Returns:
        True if memory was deleted, False if not found
    """
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()

    # Support partial ID matching
    cursor.execute("SELECT id FROM memories WHERE id LIKE ?", (f"{memory_id}%",))
    row = cursor.fetchone()
    if not row:
        conn.close()
        return False

    full_id = row[0]

    if hard_delete:
        # Permanently delete memory
        cursor.execute("DELETE FROM memories WHERE id = ?", (full_id,))
        deleted = cursor.rowcount > 0
    else:
        # Soft delete - set deleted_at timestamp for sync propagation
        now = datetime.now(timezone.utc).isoformat()
        cursor.execute(
            "UPDATE memories SET deleted_at = ?, updated_at = ? WHERE id = ? AND deleted_at IS NULL",
            (now, now, full_id),
        )
        deleted = cursor.rowcount > 0

    conn.commit()
    conn.close()

    if deleted:
        # Clean up edges after releasing the connection to avoid "database is locked"
        if hard_delete:
            self._storage._delete_edges_for_memory(full_id)
        else:
            self._storage._soft_delete_edges_for_memory(full_id)

        self.rag.remove_memory(full_id)

    return deleted

`list_recent(limit=10, type=None, namespace_id=None, source_tool=None, project=None)` ¶

List recent memories.

Source code in src/contextfs/core.py

def list_recent(
    self,
    limit: int = 10,
    type: MemoryType | None = None,
    namespace_id: str | None = None,
    source_tool: str | None = None,
    project: str | None = None,
) -> list[Memory]:
    """List recent memories."""
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()

    sql = "SELECT * FROM memories WHERE deleted_at IS NULL"
    params: list = []

    if namespace_id:
        sql += " AND namespace_id = ?"
        params.append(namespace_id)

    if type:
        sql += " AND type = ?"
        params.append(type.value)

    if source_tool:
        sql += " AND source_tool = ?"
        params.append(source_tool)

    if project:
        sql += " AND project = ?"
        params.append(project)

    sql += f" ORDER BY created_at DESC LIMIT {limit}"

    cursor.execute(sql, params)
    rows = cursor.fetchall()
    conn.close()

    return [self._row_to_memory(row) for row in rows]

`index_repository(repo_path=None, on_progress=None, incremental=True, project=None, source_repo=None, mode='all')` ¶

Manually index a repository to ChromaDB.

Parameters:

Name	Type	Description	Default
`repo_path`	`Path \| None`	Repository path (default: current repo)	`None`
`on_progress`	`Callable[[int, int, str], None] \| None`	Progress callback (current, total, file)	`None`
`incremental`	`bool`	Only index new/changed files	`True`
`project`	`str \| None`	Project name for grouping memories across repos	`None`
`source_repo`	`str \| None`	Repository name (default: repo directory name)	`None`
`mode`	`str`	"all", "files_only", or "commits_only"	`'all'`

Returns:

Type	Description
`dict`	Indexing statistics

Source code in src/contextfs/core.py

def index_repository(
    self,
    repo_path: Path | None = None,
    on_progress: Callable[[int, int, str], None] | None = None,
    incremental: bool = True,
    project: str | None = None,
    source_repo: str | None = None,
    mode: str = "all",
) -> dict:
    """
    Manually index a repository to ChromaDB.

    Args:
        repo_path: Repository path (default: current repo)
        on_progress: Progress callback (current, total, file)
        incremental: Only index new/changed files
        project: Project name for grouping memories across repos
        source_repo: Repository name (default: repo directory name)
        mode: "all", "files_only", or "commits_only"

    Returns:
        Indexing statistics
    """
    from contextfs.autoindex import IndexMode

    path = repo_path or self._repo_path
    if not path:
        raise ValueError("No repository path available")

    # Use namespace derived from the repo being indexed, not ctx's namespace
    namespace_id = self._namespace_for_path(Path(path))

    # Default source_repo to directory name
    if source_repo is None:
        source_repo = Path(path).name

    # Convert string mode to IndexMode enum
    index_mode = IndexMode(mode) if isinstance(mode, str) else mode

    indexer = self._get_auto_indexer()
    return indexer.index_repository(
        repo_path=path,
        namespace_id=namespace_id,
        storage=self.storage,
        on_progress=on_progress,
        incremental=incremental,
        project=project,
        source_repo=source_repo,
        mode=index_mode,
    )

`get_index_status(repo_path=None)` ¶

Get indexing status for a repository.

Parameters:

Name	Type	Description	Default
`repo_path`	`Path \| None`	Repository path (default: current working directory's repo)	`None`

Source code in src/contextfs/core.py

def get_index_status(self, repo_path: Path | None = None):
    """Get indexing status for a repository.

    Args:
        repo_path: Repository path (default: current working directory's repo)
    """
    if repo_path:
        namespace_id = self._namespace_for_path(repo_path)
    else:
        # Detect from current working directory
        namespace_id, _ = self._detect_namespace_and_repo()
    return self._get_auto_indexer().get_status(namespace_id)

`clear_index(repo_path=None)` ¶

Clear indexing status for a repository.

Parameters:

Name	Type	Description	Default
`repo_path`	`Path \| None`	Repository path (default: current working directory's repo)	`None`

Source code in src/contextfs/core.py

def clear_index(self, repo_path: Path | None = None) -> None:
    """Clear indexing status for a repository.

    Args:
        repo_path: Repository path (default: current working directory's repo)
    """
    if repo_path:
        namespace_id = self._namespace_for_path(repo_path)
    else:
        namespace_id, _ = self._detect_namespace_and_repo()
    self._get_auto_indexer().clear_index(namespace_id)
    self._indexing_triggered = False

`start_session(tool='contextfs', label=None, repo_path=None, branch=None)` ¶

Start a new session.

Source code in src/contextfs/core.py

def start_session(
    self,
    tool: str = "contextfs",
    label: str | None = None,
    repo_path: str | None = None,
    branch: str | None = None,
) -> Session:
    """Start a new session."""
    # End current session if exists
    if self._current_session:
        self.end_session()

    session = Session(
        tool=tool,
        label=label,
        namespace_id=self.namespace_id,
        repo_path=repo_path or str(Path.cwd()),
        branch=branch or self._get_current_branch(),
        device_name=self._get_device_name(),
    )

    # Save to database
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()

    cursor.execute(
        """
        INSERT INTO sessions (id, label, namespace_id, tool, repo_path, branch,
                              started_at, ended_at, summary, metadata,
                              device_name, memories_created)
        VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
    """,
        (
            session.id,
            session.label,
            session.namespace_id,
            session.tool,
            session.repo_path,
            session.branch,
            session.started_at.isoformat(),
            None,
            None,
            json.dumps(session.metadata),
            session.device_name,
            json.dumps(session.memories_created),
        ),
    )

    conn.commit()
    conn.close()

    self._current_session = session
    return session

`end_session(generate_summary=True)` ¶

End the current session.

Source code in src/contextfs/core.py

def end_session(self, generate_summary: bool = True) -> None:
    """End the current session."""
    if not self._current_session:
        return

    self._current_session.end()

    # Update in database
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()

    cursor.execute(
        """
        UPDATE sessions SET ended_at = ?, summary = ?, memories_created = ?
        WHERE id = ?
    """,
        (
            self._current_session.ended_at.isoformat(),
            self._current_session.summary,
            json.dumps(self._current_session.memories_created),
            self._current_session.id,
        ),
    )

    conn.commit()
    conn.close()

    # Save session as episodic memory
    if generate_summary and self._current_session.messages:
        self.save(
            content=self._format_session_summary(),
            type=MemoryType.EPISODIC,
            tags=["session", self._current_session.tool],
            summary=f"Session {self._current_session.id[:8]}",
            metadata={"session_id": self._current_session.id},
        )

    self._current_session = None

`update_session(session_id, label=None, summary=None)` ¶

Update an existing session.

Parameters:

Name	Type	Description	Default
`session_id`	`str`	Session ID (can be partial)	required
`label`	`str \| None`	New label (optional)	`None`
`summary`	`str \| None`	New summary (optional)	`None`

Returns:

Type	Description
`Session \| None`	Updated Session or None if not found

Source code in src/contextfs/core.py

def update_session(
    self,
    session_id: str,
    label: str | None = None,
    summary: str | None = None,
) -> Session | None:
    """
    Update an existing session.

    Args:
        session_id: Session ID (can be partial)
        label: New label (optional)
        summary: New summary (optional)

    Returns:
        Updated Session or None if not found
    """
    session = self.load_session(session_id=session_id)
    if not session:
        return None

    # Update fields if provided
    if label is not None:
        session.label = label
    if summary is not None:
        session.summary = summary

    # Update in database
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()

    cursor.execute(
        """
        UPDATE sessions SET label = ?, summary = ?
        WHERE id = ?
    """,
        (session.label, session.summary, session.id),
    )

    conn.commit()
    conn.close()

    return session

`delete_session(session_id)` ¶

Delete a session and its messages.

Parameters:

Name	Type	Description	Default
`session_id`	`str`	Session ID (can be partial)	required

Returns:

Type	Description
`bool`	True if deleted, False if not found

Source code in src/contextfs/core.py

def delete_session(self, session_id: str) -> bool:
    """
    Delete a session and its messages.

    Args:
        session_id: Session ID (can be partial)

    Returns:
        True if deleted, False if not found
    """
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()

    # Support partial ID matching
    cursor.execute("SELECT id FROM sessions WHERE id LIKE ?", (f"{session_id}%",))
    row = cursor.fetchone()
    if not row:
        conn.close()
        return False

    full_id = row[0]

    # Delete messages first
    cursor.execute("DELETE FROM messages WHERE session_id = ?", (full_id,))

    # Delete session
    cursor.execute("DELETE FROM sessions WHERE id = ?", (full_id,))
    deleted = cursor.rowcount > 0

    conn.commit()
    conn.close()

    return deleted

`get_current_session()` ¶

Get current active session.

Source code in src/contextfs/core.py

def get_current_session(self) -> Session | None:
    """Get current active session."""
    return self._current_session

`list_sessions(limit=10, offset=0, tool=None, label=None, all_namespaces=False)` ¶

List recent sessions.

Source code in src/contextfs/core.py

def list_sessions(
    self,
    limit: int = 10,
    offset: int = 0,
    tool: str | None = None,
    label: str | None = None,
    all_namespaces: bool = False,
) -> list[Session]:
    """List recent sessions."""
    conn = sqlite3.connect(self._db_path)
    cursor = conn.cursor()

    columns = """id, label, namespace_id, tool, repo_path, branch, started_at, ended_at,
                 summary, metadata, device_name, memories_created"""

    if all_namespaces:
        sql = f"SELECT {columns} FROM sessions WHERE 1=1"
        params: list = []
    else:
        sql = f"SELECT {columns} FROM sessions WHERE namespace_id = ?"
        params = [self.namespace_id]

    if tool:
        sql += " AND tool = ?"
        params.append(tool)

    if label:
        sql += " AND label LIKE ?"
        params.append(f"%{label}%")

    sql += f" ORDER BY started_at DESC LIMIT {limit} OFFSET {offset}"

    cursor.execute(sql, params)
    rows = cursor.fetchall()
    conn.close()

    sessions = []
    for row in rows:
        sessions.append(
            Session(
                id=row[0],
                label=row[1],
                namespace_id=row[2],
                tool=row[3],
                repo_path=row[4],
                branch=row[5],
                started_at=datetime.fromisoformat(row[6]),
                ended_at=datetime.fromisoformat(row[7]) if row[7] else None,
                summary=row[8],
                metadata=json.loads(row[9]) if row[9] else {},
                device_name=row[10],
                memories_created=json.loads(row[11]) if row[11] else [],
            )
        )

    return sessions

`contextfs.schemas.Memory` ¶

Bases: BaseModel

A single memory item.

Supports optional structured_data for type-specific schema validation. When structured_data is provided, it is validated against TYPE_SCHEMAS for the memory's type. This enables typed memory with enforced structure.

Source code in src/contextfs/schemas.py

class Memory(BaseModel):
    """
    A single memory item.

    Supports optional structured_data for type-specific schema validation.
    When structured_data is provided, it is validated against TYPE_SCHEMAS
    for the memory's type. This enables typed memory with enforced structure.
    """

    id: str = Field(default_factory=lambda: str(uuid.uuid4())[:12])
    content: str
    type: MemoryType = MemoryType.FACT
    tags: list[str] = Field(default_factory=list)
    summary: str | None = None

    # Typed structured data (validated against TYPE_SCHEMAS)
    structured_data: dict[str, Any] | None = Field(
        default=None,
        description="Optional structured data validated against the type's JSON schema",
    )

    # Namespace for cross-repo support
    namespace_id: str = "global"

    # Timestamps
    created_at: datetime = Field(default_factory=datetime.now)
    updated_at: datetime = Field(default_factory=datetime.now)

    # Source tracking
    source_file: str | None = None
    source_repo: str | None = None
    source_tool: str | None = None  # claude-code, claude-desktop, gemini, chatgpt, etc.
    project: str | None = None  # Project name for grouping memories across repos
    session_id: str | None = None

    # Metadata
    metadata: dict[str, Any] = Field(default_factory=dict)

    # Authoritative flag (Phase 3)
    # Marks this memory as the canonical/official version in a lineage chain
    authoritative: bool = Field(
        default=False,
        description="Whether this is the authoritative/canonical version in a lineage",
    )

    # Embedding (populated by RAG backend)
    embedding: list[float] | None = None

    @model_validator(mode="after")
    def validate_structured_data_schema(self) -> "Memory":
        """Validate structured_data against the type's JSON schema if provided."""
        if self.structured_data is not None:
            type_value = self.type.value if isinstance(self.type, MemoryType) else self.type
            is_valid, error = validate_structured_data(type_value, self.structured_data)
            if not is_valid:
                raise ValueError(
                    f"structured_data validation failed for type '{type_value}': {error}"
                )
        return self

    def to_context_string(self) -> str:
        """Format for context injection."""
        prefix = f"[{self.type.value}]"
        if self.summary:
            return f"{prefix} {self.summary}: {self.content[:200]}..."
        return f"{prefix} {self.content[:300]}..."

    def get_structured_field(self, field: str, default: Any = None) -> Any:
        """Get a field from structured_data with a default value."""
        if self.structured_data is None:
            return default
        return self.structured_data.get(field, default)

    @property
    def typed_data(self) -> TypedStructuredData | dict[str, Any] | None:
        """
        Get structured_data as a typed Pydantic model if available.

        Returns the appropriate typed model (DecisionData, ErrorData, etc.)
        if the memory type has a corresponding class, otherwise returns
        the raw dict or None.
        """
        if self.structured_data is None:
            return None
        type_value = self.type.value if isinstance(self.type, MemoryType) else self.type
        return parse_structured_data(type_value, self.structured_data)

    # Factory methods for creating typed memories
    @classmethod
    def decision(
        cls,
        content: str,
        decision: str,
        rationale: str | None = None,
        alternatives: list[str] | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a decision memory with typed structured_data."""
        structured = {"decision": decision}
        if rationale:
            structured["rationale"] = rationale
        if alternatives:
            structured["alternatives"] = alternatives
        return cls(
            content=content,
            type=MemoryType.DECISION,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def procedural(
        cls,
        content: str,
        steps: list[str],
        title: str | None = None,
        prerequisites: list[str] | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a procedural memory with typed structured_data."""
        structured: dict[str, Any] = {"steps": steps}
        if title:
            structured["title"] = title
        if prerequisites:
            structured["prerequisites"] = prerequisites
        return cls(
            content=content,
            type=MemoryType.PROCEDURAL,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def error(
        cls,
        content: str,
        error_type: str,
        message: str,
        file: str | None = None,
        line: int | None = None,
        resolution: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create an error memory with typed structured_data."""
        structured: dict[str, Any] = {"error_type": error_type, "message": message}
        if file:
            structured["file"] = file
        if line:
            structured["line"] = line
        if resolution:
            structured["resolution"] = resolution
        return cls(
            content=content,
            type=MemoryType.ERROR,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def api(
        cls,
        content: str,
        endpoint: str,
        method: str | None = None,
        parameters: list[dict[str, Any]] | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create an API memory with typed structured_data."""
        structured: dict[str, Any] = {"endpoint": endpoint}
        if method:
            structured["method"] = method
        if parameters:
            structured["parameters"] = parameters
        return cls(
            content=content,
            type=MemoryType.API,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def todo(
        cls,
        content: str,
        title: str,
        status: str | None = None,
        priority: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a todo memory with typed structured_data."""
        structured: dict[str, Any] = {"title": title}
        if status:
            structured["status"] = status
        if priority:
            structured["priority"] = priority
        return cls(
            content=content,
            type=MemoryType.TODO,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def fact(
        cls,
        content: str,
        category: str | None = None,
        source: str | None = None,
        confidence: float | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a fact memory with typed structured_data."""
        structured: dict[str, Any] = {}
        if category:
            structured["category"] = category
        if source:
            structured["source"] = source
        if confidence is not None:
            structured["confidence"] = confidence
        return cls(
            content=content,
            type=MemoryType.FACT,
            structured_data=structured if structured else None,
            **kwargs,
        )

    @classmethod
    def episodic(
        cls,
        content: str,
        session_type: str | None = None,
        participants: list[str] | None = None,
        outcome: str | None = None,
        tool: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create an episodic memory with typed structured_data."""
        structured: dict[str, Any] = {}
        if session_type:
            structured["session_type"] = session_type
        if participants:
            structured["participants"] = participants
        if outcome:
            structured["outcome"] = outcome
        if tool:
            structured["tool"] = tool
        return cls(
            content=content,
            type=MemoryType.EPISODIC,
            structured_data=structured if structured else None,
            **kwargs,
        )

    @classmethod
    def user(
        cls,
        content: str,
        preference_key: str,
        preference_value: str | None = None,
        scope: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a user preference memory with typed structured_data."""
        structured: dict[str, Any] = {"preference_key": preference_key}
        if preference_value:
            structured["preference_value"] = preference_value
        if scope:
            structured["scope"] = scope
        return cls(
            content=content,
            type=MemoryType.USER,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def code(
        cls,
        content: str,
        language: str | None = None,
        purpose: str | None = None,
        file_path: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a code memory with typed structured_data."""
        structured: dict[str, Any] = {}
        if language:
            structured["language"] = language
        if purpose:
            structured["purpose"] = purpose
        if file_path:
            structured["file_path"] = file_path
        return cls(
            content=content,
            type=MemoryType.CODE,
            structured_data=structured if structured else None,
            **kwargs,
        )

    @classmethod
    def commit(
        cls,
        content: str,
        sha: str | None = None,
        author: str | None = None,
        message: str | None = None,
        files_changed: list[str] | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a commit memory with typed structured_data."""
        structured: dict[str, Any] = {}
        if sha:
            structured["sha"] = sha
            structured["short_sha"] = sha[:7] if len(sha) >= 7 else sha
        if author:
            structured["author"] = author
        if message:
            structured["message"] = message
        if files_changed:
            structured["files_changed"] = files_changed
        return cls(
            content=content,
            type=MemoryType.COMMIT,
            structured_data=structured if structured else None,
            **kwargs,
        )

    @classmethod
    def doc(
        cls,
        content: str,
        doc_type: str | None = None,
        title: str | None = None,
        url: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a documentation reference memory with typed structured_data."""
        structured: dict[str, Any] = {}
        if doc_type:
            structured["doc_type"] = doc_type
        if title:
            structured["title"] = title
        if url:
            structured["url"] = url
        return cls(
            content=content,
            type=MemoryType.DOC,
            structured_data=structured if structured else None,
            **kwargs,
        )

    # =========================================================================
    # Workflow/Agent Factory Methods
    # =========================================================================

    @classmethod
    def workflow(
        cls,
        content: str,
        name: str,
        status: str = "draft",
        description: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a workflow memory with typed structured_data."""
        structured: dict[str, Any] = {"name": name, "status": status}
        if description:
            structured["description"] = description
        return cls(
            content=content,
            type=MemoryType.WORKFLOW,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def task(
        cls,
        content: str,
        name: str,
        workflow_id: str | None = None,
        status: str = "pending",
        assigned_agent: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a task memory with typed structured_data."""
        structured: dict[str, Any] = {"name": name, "status": status}
        if workflow_id:
            structured["workflow_id"] = workflow_id
        if assigned_agent:
            structured["assigned_agent"] = assigned_agent
        return cls(
            content=content,
            type=MemoryType.TASK,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def step(
        cls,
        content: str,
        task_id: str,
        step_number: int = 0,
        action: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a step memory with typed structured_data."""
        structured: dict[str, Any] = {"task_id": task_id, "step_number": step_number}
        if action:
            structured["action"] = action
        return cls(
            content=content,
            type=MemoryType.STEP,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def agent_run(
        cls,
        content: str,
        agent_name: str,
        model: str | None = None,
        status: str = "running",
        workflow_id: str | None = None,
        task_id: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create an agent run memory with typed structured_data."""
        structured: dict[str, Any] = {"agent_name": agent_name, "status": status}
        if model:
            structured["model"] = model
        if workflow_id:
            structured["workflow_id"] = workflow_id
        if task_id:
            structured["task_id"] = task_id
        return cls(
            content=content,
            type=MemoryType.AGENT_RUN,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def issue(
        cls,
        content: str,
        title: str,
        severity: str | None = None,
        status: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create an issue memory with typed structured_data."""
        structured: dict[str, Any] = {"title": title}
        if severity:
            structured["severity"] = severity
        if status:
            structured["status"] = status
        return cls(
            content=content,
            type=MemoryType.ISSUE,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def schema_def(
        cls,
        content: str,
        name: str,
        schema_type: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a schema memory with typed structured_data.

        Note: Named schema_def to avoid conflict with Pydantic's schema() method.
        """
        structured: dict[str, Any] = {"name": name}
        if schema_type:
            structured["schema_type"] = schema_type
        return cls(
            content=content,
            type=MemoryType.SCHEMA,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def test_case(
        cls,
        content: str,
        name: str,
        test_type: str | None = None,
        status: str | None = None,
        file: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a test memory with typed structured_data.

        Note: Named test_case to avoid conflict with pytest.
        """
        structured: dict[str, Any] = {"name": name}
        if test_type:
            structured["test_type"] = test_type
        if status:
            structured["status"] = status
        if file:
            structured["file"] = file
        return cls(
            content=content,
            type=MemoryType.TEST,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def review(
        cls,
        content: str,
        pr_number: int,
        reviewer: str | None = None,
        status: str = "pending",
        **kwargs: Any,
    ) -> "Memory":
        """Create a review memory with typed structured_data."""
        structured: dict[str, Any] = {"pr_number": pr_number, "status": status}
        if reviewer:
            structured["reviewer"] = reviewer
        return cls(
            content=content,
            type=MemoryType.REVIEW,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def release(
        cls,
        content: str,
        version: str,
        date: str | None = None,
        changes: list[str] | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a release memory with typed structured_data."""
        structured: dict[str, Any] = {"version": version}
        if date:
            structured["date"] = date
        if changes:
            structured["changes"] = changes
        return cls(
            content=content,
            type=MemoryType.RELEASE,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def config(
        cls,
        content: str,
        name: str,
        environment: str | None = None,
        settings: dict[str, Any] | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a config memory with typed structured_data."""
        structured: dict[str, Any] = {"name": name}
        if environment:
            structured["environment"] = environment
        if settings:
            structured["settings"] = settings
        return cls(
            content=content,
            type=MemoryType.CONFIG,
            structured_data=structured,
            **kwargs,
        )

    @classmethod
    def dependency(
        cls,
        content: str,
        name: str,
        version: str = "unknown",
        dep_type: str | None = None,
        **kwargs: Any,
    ) -> "Memory":
        """Create a dependency memory with typed structured_data."""
        structured: dict[str, Any] = {"name": name, "version": version}
        if dep_type:
            structured["dep_type"] = dep_type
        return cls(
            content=content,
            type=MemoryType.DEPENDENCY,
            structured_data=structured,
            **kwargs,
        )

    # =========================================================================
    # Formal Type System Integration
    # =========================================================================

    def as_typed(self, schema_type: type) -> "Mem":
        """
        Convert to schema-indexed Mem[S] type for type-safe structured_data access.

        This method wraps the Memory in a Mem[S] container that provides:
        - Type-safe access to structured_data via the .data property
        - Schema validation ensuring structured_data matches type S
        - Generic type parameter for static type checking

        Args:
            schema_type: The schema type (must be BaseSchema subclass).

        Returns:
            Mem[S] wrapper around this memory.

        Raises:
            ValueError: If structured_data doesn't match schema.

        Example:
            >>> from contextfs.schemas import DecisionData
            >>> memory = Memory.decision("DB choice", decision="PostgreSQL")
            >>> typed = memory.as_typed(DecisionData)
            >>> typed.data.decision  # Type-safe: str
            'PostgreSQL'
        """
        from contextfs.types.memory import Mem

        return Mem.wrap(self, schema_type)

    def as_versioned(self, schema_type: type) -> "VersionedMem":
        """
        Get versioned wrapper with timeline support for evolution tracking.

        This method wraps the Memory in a VersionedMem[S] container that provides:
        - Timeline of version entries with ChangeReason tracking
        - Type-safe evolution operations
        - Integration with memory lineage system

        Args:
            schema_type: The schema type (must be BaseSchema subclass).

        Returns:
            VersionedMem[S] wrapper with timeline support.

        Example:
            >>> from contextfs.schemas import DecisionData
            >>> from contextfs.types import ChangeReason
            >>> memory = Memory.decision("DB choice", decision="PostgreSQL")
            >>> versioned = memory.as_versioned(DecisionData)
            >>> versioned.evolve(
            ...     DecisionData(decision="SQLite"),
            ...     reason=ChangeReason.CORRECTION
            ... )
        """
        from contextfs.types.versioned import VersionedMem

        return VersionedMem.from_memory(self, schema_type)

`typed_data` `property` ¶

Get structured_data as a typed Pydantic model if available.

Returns the appropriate typed model (DecisionData, ErrorData, etc.) if the memory type has a corresponding class, otherwise returns the raw dict or None.

`agent_run(content, agent_name, model=None, status='running', workflow_id=None, task_id=None, **kwargs)` `classmethod` ¶

Create an agent run memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def agent_run(
    cls,
    content: str,
    agent_name: str,
    model: str | None = None,
    status: str = "running",
    workflow_id: str | None = None,
    task_id: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create an agent run memory with typed structured_data."""
    structured: dict[str, Any] = {"agent_name": agent_name, "status": status}
    if model:
        structured["model"] = model
    if workflow_id:
        structured["workflow_id"] = workflow_id
    if task_id:
        structured["task_id"] = task_id
    return cls(
        content=content,
        type=MemoryType.AGENT_RUN,
        structured_data=structured,
        **kwargs,
    )

`api(content, endpoint, method=None, parameters=None, **kwargs)` `classmethod` ¶

Create an API memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def api(
    cls,
    content: str,
    endpoint: str,
    method: str | None = None,
    parameters: list[dict[str, Any]] | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create an API memory with typed structured_data."""
    structured: dict[str, Any] = {"endpoint": endpoint}
    if method:
        structured["method"] = method
    if parameters:
        structured["parameters"] = parameters
    return cls(
        content=content,
        type=MemoryType.API,
        structured_data=structured,
        **kwargs,
    )

`as_typed(schema_type)` ¶

Convert to schema-indexed Mem[S] type for type-safe structured_data access.

This method wraps the Memory in a Mem[S] container that provides: - Type-safe access to structured_data via the .data property - Schema validation ensuring structured_data matches type S - Generic type parameter for static type checking

Parameters:

Name	Type	Description	Default
`schema_type`	`type`	The schema type (must be BaseSchema subclass).	required

Returns:

Type	Description
`Mem`	Mem[S] wrapper around this memory.

Raises:

Type	Description
`ValueError`	If structured_data doesn't match schema.

Example

from contextfs.schemas import DecisionData memory = Memory.decision("DB choice", decision="PostgreSQL") typed = memory.as_typed(DecisionData) typed.data.decision # Type-safe: str 'PostgreSQL'

Source code in src/contextfs/schemas.py

def as_typed(self, schema_type: type) -> "Mem":
    """
    Convert to schema-indexed Mem[S] type for type-safe structured_data access.

    This method wraps the Memory in a Mem[S] container that provides:
    - Type-safe access to structured_data via the .data property
    - Schema validation ensuring structured_data matches type S
    - Generic type parameter for static type checking

    Args:
        schema_type: The schema type (must be BaseSchema subclass).

    Returns:
        Mem[S] wrapper around this memory.

    Raises:
        ValueError: If structured_data doesn't match schema.

    Example:
        >>> from contextfs.schemas import DecisionData
        >>> memory = Memory.decision("DB choice", decision="PostgreSQL")
        >>> typed = memory.as_typed(DecisionData)
        >>> typed.data.decision  # Type-safe: str
        'PostgreSQL'
    """
    from contextfs.types.memory import Mem

    return Mem.wrap(self, schema_type)

`as_versioned(schema_type)` ¶

Get versioned wrapper with timeline support for evolution tracking.

This method wraps the Memory in a VersionedMem[S] container that provides: - Timeline of version entries with ChangeReason tracking - Type-safe evolution operations - Integration with memory lineage system

Parameters:

Name	Type	Description	Default
`schema_type`	`type`	The schema type (must be BaseSchema subclass).	required

Returns:

Type	Description
`VersionedMem`	VersionedMem[S] wrapper with timeline support.

Example

from contextfs.schemas import DecisionData from contextfs.types import ChangeReason memory = Memory.decision("DB choice", decision="PostgreSQL") versioned = memory.as_versioned(DecisionData) versioned.evolve( ... DecisionData(decision="SQLite"), ... reason=ChangeReason.CORRECTION ... )

Source code in src/contextfs/schemas.py

def as_versioned(self, schema_type: type) -> "VersionedMem":
    """
    Get versioned wrapper with timeline support for evolution tracking.

    This method wraps the Memory in a VersionedMem[S] container that provides:
    - Timeline of version entries with ChangeReason tracking
    - Type-safe evolution operations
    - Integration with memory lineage system

    Args:
        schema_type: The schema type (must be BaseSchema subclass).

    Returns:
        VersionedMem[S] wrapper with timeline support.

    Example:
        >>> from contextfs.schemas import DecisionData
        >>> from contextfs.types import ChangeReason
        >>> memory = Memory.decision("DB choice", decision="PostgreSQL")
        >>> versioned = memory.as_versioned(DecisionData)
        >>> versioned.evolve(
        ...     DecisionData(decision="SQLite"),
        ...     reason=ChangeReason.CORRECTION
        ... )
    """
    from contextfs.types.versioned import VersionedMem

    return VersionedMem.from_memory(self, schema_type)

`code(content, language=None, purpose=None, file_path=None, **kwargs)` `classmethod` ¶

Create a code memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def code(
    cls,
    content: str,
    language: str | None = None,
    purpose: str | None = None,
    file_path: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a code memory with typed structured_data."""
    structured: dict[str, Any] = {}
    if language:
        structured["language"] = language
    if purpose:
        structured["purpose"] = purpose
    if file_path:
        structured["file_path"] = file_path
    return cls(
        content=content,
        type=MemoryType.CODE,
        structured_data=structured if structured else None,
        **kwargs,
    )

`commit(content, sha=None, author=None, message=None, files_changed=None, **kwargs)` `classmethod` ¶

Create a commit memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def commit(
    cls,
    content: str,
    sha: str | None = None,
    author: str | None = None,
    message: str | None = None,
    files_changed: list[str] | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a commit memory with typed structured_data."""
    structured: dict[str, Any] = {}
    if sha:
        structured["sha"] = sha
        structured["short_sha"] = sha[:7] if len(sha) >= 7 else sha
    if author:
        structured["author"] = author
    if message:
        structured["message"] = message
    if files_changed:
        structured["files_changed"] = files_changed
    return cls(
        content=content,
        type=MemoryType.COMMIT,
        structured_data=structured if structured else None,
        **kwargs,
    )

`config(content, name, environment=None, settings=None, **kwargs)` `classmethod` ¶

Create a config memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def config(
    cls,
    content: str,
    name: str,
    environment: str | None = None,
    settings: dict[str, Any] | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a config memory with typed structured_data."""
    structured: dict[str, Any] = {"name": name}
    if environment:
        structured["environment"] = environment
    if settings:
        structured["settings"] = settings
    return cls(
        content=content,
        type=MemoryType.CONFIG,
        structured_data=structured,
        **kwargs,
    )

`decision(content, decision, rationale=None, alternatives=None, **kwargs)` `classmethod` ¶

Create a decision memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def decision(
    cls,
    content: str,
    decision: str,
    rationale: str | None = None,
    alternatives: list[str] | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a decision memory with typed structured_data."""
    structured = {"decision": decision}
    if rationale:
        structured["rationale"] = rationale
    if alternatives:
        structured["alternatives"] = alternatives
    return cls(
        content=content,
        type=MemoryType.DECISION,
        structured_data=structured,
        **kwargs,
    )

`dependency(content, name, version='unknown', dep_type=None, **kwargs)` `classmethod` ¶

Create a dependency memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def dependency(
    cls,
    content: str,
    name: str,
    version: str = "unknown",
    dep_type: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a dependency memory with typed structured_data."""
    structured: dict[str, Any] = {"name": name, "version": version}
    if dep_type:
        structured["dep_type"] = dep_type
    return cls(
        content=content,
        type=MemoryType.DEPENDENCY,
        structured_data=structured,
        **kwargs,
    )

`doc(content, doc_type=None, title=None, url=None, **kwargs)` `classmethod` ¶

Create a documentation reference memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def doc(
    cls,
    content: str,
    doc_type: str | None = None,
    title: str | None = None,
    url: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a documentation reference memory with typed structured_data."""
    structured: dict[str, Any] = {}
    if doc_type:
        structured["doc_type"] = doc_type
    if title:
        structured["title"] = title
    if url:
        structured["url"] = url
    return cls(
        content=content,
        type=MemoryType.DOC,
        structured_data=structured if structured else None,
        **kwargs,
    )

`episodic(content, session_type=None, participants=None, outcome=None, tool=None, **kwargs)` `classmethod` ¶

Create an episodic memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def episodic(
    cls,
    content: str,
    session_type: str | None = None,
    participants: list[str] | None = None,
    outcome: str | None = None,
    tool: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create an episodic memory with typed structured_data."""
    structured: dict[str, Any] = {}
    if session_type:
        structured["session_type"] = session_type
    if participants:
        structured["participants"] = participants
    if outcome:
        structured["outcome"] = outcome
    if tool:
        structured["tool"] = tool
    return cls(
        content=content,
        type=MemoryType.EPISODIC,
        structured_data=structured if structured else None,
        **kwargs,
    )

`error(content, error_type, message, file=None, line=None, resolution=None, **kwargs)` `classmethod` ¶

Create an error memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def error(
    cls,
    content: str,
    error_type: str,
    message: str,
    file: str | None = None,
    line: int | None = None,
    resolution: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create an error memory with typed structured_data."""
    structured: dict[str, Any] = {"error_type": error_type, "message": message}
    if file:
        structured["file"] = file
    if line:
        structured["line"] = line
    if resolution:
        structured["resolution"] = resolution
    return cls(
        content=content,
        type=MemoryType.ERROR,
        structured_data=structured,
        **kwargs,
    )

`fact(content, category=None, source=None, confidence=None, **kwargs)` `classmethod` ¶

Create a fact memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def fact(
    cls,
    content: str,
    category: str | None = None,
    source: str | None = None,
    confidence: float | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a fact memory with typed structured_data."""
    structured: dict[str, Any] = {}
    if category:
        structured["category"] = category
    if source:
        structured["source"] = source
    if confidence is not None:
        structured["confidence"] = confidence
    return cls(
        content=content,
        type=MemoryType.FACT,
        structured_data=structured if structured else None,
        **kwargs,
    )

`get_structured_field(field, default=None)` ¶

Get a field from structured_data with a default value.

Source code in src/contextfs/schemas.py

def get_structured_field(self, field: str, default: Any = None) -> Any:
    """Get a field from structured_data with a default value."""
    if self.structured_data is None:
        return default
    return self.structured_data.get(field, default)

`issue(content, title, severity=None, status=None, **kwargs)` `classmethod` ¶

Create an issue memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def issue(
    cls,
    content: str,
    title: str,
    severity: str | None = None,
    status: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create an issue memory with typed structured_data."""
    structured: dict[str, Any] = {"title": title}
    if severity:
        structured["severity"] = severity
    if status:
        structured["status"] = status
    return cls(
        content=content,
        type=MemoryType.ISSUE,
        structured_data=structured,
        **kwargs,
    )

`procedural(content, steps, title=None, prerequisites=None, **kwargs)` `classmethod` ¶

Create a procedural memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def procedural(
    cls,
    content: str,
    steps: list[str],
    title: str | None = None,
    prerequisites: list[str] | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a procedural memory with typed structured_data."""
    structured: dict[str, Any] = {"steps": steps}
    if title:
        structured["title"] = title
    if prerequisites:
        structured["prerequisites"] = prerequisites
    return cls(
        content=content,
        type=MemoryType.PROCEDURAL,
        structured_data=structured,
        **kwargs,
    )

`release(content, version, date=None, changes=None, **kwargs)` `classmethod` ¶

Create a release memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def release(
    cls,
    content: str,
    version: str,
    date: str | None = None,
    changes: list[str] | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a release memory with typed structured_data."""
    structured: dict[str, Any] = {"version": version}
    if date:
        structured["date"] = date
    if changes:
        structured["changes"] = changes
    return cls(
        content=content,
        type=MemoryType.RELEASE,
        structured_data=structured,
        **kwargs,
    )

`review(content, pr_number, reviewer=None, status='pending', **kwargs)` `classmethod` ¶

Create a review memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def review(
    cls,
    content: str,
    pr_number: int,
    reviewer: str | None = None,
    status: str = "pending",
    **kwargs: Any,
) -> "Memory":
    """Create a review memory with typed structured_data."""
    structured: dict[str, Any] = {"pr_number": pr_number, "status": status}
    if reviewer:
        structured["reviewer"] = reviewer
    return cls(
        content=content,
        type=MemoryType.REVIEW,
        structured_data=structured,
        **kwargs,
    )

`schema_def(content, name, schema_type=None, **kwargs)` `classmethod` ¶

Create a schema memory with typed structured_data.

Note: Named schema_def to avoid conflict with Pydantic's schema() method.

Source code in src/contextfs/schemas.py

@classmethod
def schema_def(
    cls,
    content: str,
    name: str,
    schema_type: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a schema memory with typed structured_data.

    Note: Named schema_def to avoid conflict with Pydantic's schema() method.
    """
    structured: dict[str, Any] = {"name": name}
    if schema_type:
        structured["schema_type"] = schema_type
    return cls(
        content=content,
        type=MemoryType.SCHEMA,
        structured_data=structured,
        **kwargs,
    )

`step(content, task_id, step_number=0, action=None, **kwargs)` `classmethod` ¶

Create a step memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def step(
    cls,
    content: str,
    task_id: str,
    step_number: int = 0,
    action: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a step memory with typed structured_data."""
    structured: dict[str, Any] = {"task_id": task_id, "step_number": step_number}
    if action:
        structured["action"] = action
    return cls(
        content=content,
        type=MemoryType.STEP,
        structured_data=structured,
        **kwargs,
    )

`task(content, name, workflow_id=None, status='pending', assigned_agent=None, **kwargs)` `classmethod` ¶

Create a task memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def task(
    cls,
    content: str,
    name: str,
    workflow_id: str | None = None,
    status: str = "pending",
    assigned_agent: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a task memory with typed structured_data."""
    structured: dict[str, Any] = {"name": name, "status": status}
    if workflow_id:
        structured["workflow_id"] = workflow_id
    if assigned_agent:
        structured["assigned_agent"] = assigned_agent
    return cls(
        content=content,
        type=MemoryType.TASK,
        structured_data=structured,
        **kwargs,
    )

`test_case(content, name, test_type=None, status=None, file=None, **kwargs)` `classmethod` ¶

Create a test memory with typed structured_data.

Note: Named test_case to avoid conflict with pytest.

Source code in src/contextfs/schemas.py

@classmethod
def test_case(
    cls,
    content: str,
    name: str,
    test_type: str | None = None,
    status: str | None = None,
    file: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a test memory with typed structured_data.

    Note: Named test_case to avoid conflict with pytest.
    """
    structured: dict[str, Any] = {"name": name}
    if test_type:
        structured["test_type"] = test_type
    if status:
        structured["status"] = status
    if file:
        structured["file"] = file
    return cls(
        content=content,
        type=MemoryType.TEST,
        structured_data=structured,
        **kwargs,
    )

`to_context_string()` ¶

Format for context injection.

Source code in src/contextfs/schemas.py

def to_context_string(self) -> str:
    """Format for context injection."""
    prefix = f"[{self.type.value}]"
    if self.summary:
        return f"{prefix} {self.summary}: {self.content[:200]}..."
    return f"{prefix} {self.content[:300]}..."

`todo(content, title, status=None, priority=None, **kwargs)` `classmethod` ¶

Create a todo memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def todo(
    cls,
    content: str,
    title: str,
    status: str | None = None,
    priority: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a todo memory with typed structured_data."""
    structured: dict[str, Any] = {"title": title}
    if status:
        structured["status"] = status
    if priority:
        structured["priority"] = priority
    return cls(
        content=content,
        type=MemoryType.TODO,
        structured_data=structured,
        **kwargs,
    )

`user(content, preference_key, preference_value=None, scope=None, **kwargs)` `classmethod` ¶

Create a user preference memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def user(
    cls,
    content: str,
    preference_key: str,
    preference_value: str | None = None,
    scope: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a user preference memory with typed structured_data."""
    structured: dict[str, Any] = {"preference_key": preference_key}
    if preference_value:
        structured["preference_value"] = preference_value
    if scope:
        structured["scope"] = scope
    return cls(
        content=content,
        type=MemoryType.USER,
        structured_data=structured,
        **kwargs,
    )

`validate_structured_data_schema()` ¶

Validate structured_data against the type's JSON schema if provided.

Source code in src/contextfs/schemas.py

@model_validator(mode="after")
def validate_structured_data_schema(self) -> "Memory":
    """Validate structured_data against the type's JSON schema if provided."""
    if self.structured_data is not None:
        type_value = self.type.value if isinstance(self.type, MemoryType) else self.type
        is_valid, error = validate_structured_data(type_value, self.structured_data)
        if not is_valid:
            raise ValueError(
                f"structured_data validation failed for type '{type_value}': {error}"
            )
    return self

`workflow(content, name, status='draft', description=None, **kwargs)` `classmethod` ¶

Create a workflow memory with typed structured_data.

Source code in src/contextfs/schemas.py

@classmethod
def workflow(
    cls,
    content: str,
    name: str,
    status: str = "draft",
    description: str | None = None,
    **kwargs: Any,
) -> "Memory":
    """Create a workflow memory with typed structured_data."""
    structured: dict[str, Any] = {"name": name, "status": status}
    if description:
        structured["description"] = description
    return cls(
        content=content,
        type=MemoryType.WORKFLOW,
        structured_data=structured,
        **kwargs,
    )

`contextfs.schemas.MemoryType` ¶

Bases: str, Enum

Types of memories.

Source code in src/contextfs/schemas.py

class MemoryType(str, Enum):
    """Types of memories."""

    # Core types
    FACT = "fact"  # Static facts, configurations
    DECISION = "decision"  # Architectural/design decisions
    PROCEDURAL = "procedural"  # How-to procedures
    EPISODIC = "episodic"  # Session/conversation memories
    USER = "user"  # User preferences
    CODE = "code"  # Code snippets
    ERROR = "error"  # Runtime errors, stack traces
    COMMIT = "commit"  # Git commit history

    # Extended types
    TODO = "todo"  # Tasks, work items
    ISSUE = "issue"  # Bugs, problems, tickets
    API = "api"  # API endpoints, contracts
    SCHEMA = "schema"  # Data models, DB schemas
    TEST = "test"  # Test cases, coverage
    REVIEW = "review"  # PR feedback, code reviews
    RELEASE = "release"  # Changelogs, versions
    CONFIG = "config"  # Environment configs
    DEPENDENCY = "dependency"  # Package versions
    DOC = "doc"  # Documentation

    # Workflow/Agent types
    WORKFLOW = "workflow"  # Workflow definitions
    TASK = "task"  # Individual workflow tasks
    STEP = "step"  # Execution steps within tasks
    AGENT_RUN = "agent_run"  # LLM agent execution records

`contextfs.schemas.SearchResult` ¶

Bases: BaseModel

Search result with relevance score.

Source code in src/contextfs/schemas.py

class SearchResult(BaseModel):
    """Search result with relevance score."""

    memory: Memory
    score: float = Field(ge=0.0, le=1.0)
    highlights: list[str] = Field(default_factory=list)
    source: str | None = None  # "fts", "rag", or "hybrid"

`contextfs.schemas.Session` ¶

Bases: BaseModel

A conversation session.

Source code in src/contextfs/schemas.py

class Session(BaseModel):
    """A conversation session."""

    id: str = Field(default_factory=lambda: str(uuid.uuid4()))
    label: str | None = None
    namespace_id: str = "global"

    # Tool that created session
    tool: str = "contextfs"  # claude-code, gemini, codex, etc.

    # Device tracking
    device_name: str | None = None  # hostname or user-friendly device name

    # Git context
    repo_path: str | None = None
    branch: str | None = None

    # Messages
    messages: list[SessionMessage] = Field(default_factory=list)

    # Timestamps
    started_at: datetime = Field(default_factory=datetime.now)
    ended_at: datetime | None = None

    # Generated summary
    summary: str | None = None

    # Memories created during this session (IDs)
    memories_created: list[str] = Field(default_factory=list)

    metadata: dict[str, Any] = Field(default_factory=dict)

    def add_message(self, role: str, content: str) -> SessionMessage:
        msg = SessionMessage(role=role, content=content)
        self.messages.append(msg)
        return msg

    def end(self) -> None:
        self.ended_at = datetime.now(timezone.utc)

`contextfs.schemas.Namespace` ¶

Bases: BaseModel

Namespace for cross-repo memory isolation.

Hierarchy: - global: Shared across all repos - org/team: Shared within organization - repo: Specific to repository - session: Specific to session

Namespace ID derivation priority: 1. Explicit ID from .contextfs/config.yaml (highest priority) 2. Git remote URL (portable across machines) 3. Local path fallback (not portable, for repos without remotes)

Source code in src/contextfs/schemas.py

class Namespace(BaseModel):
    """
    Namespace for cross-repo memory isolation.

    Hierarchy:
    - global: Shared across all repos
    - org/team: Shared within organization
    - repo: Specific to repository
    - session: Specific to session

    Namespace ID derivation priority:
    1. Explicit ID from .contextfs/config.yaml (highest priority)
    2. Git remote URL (portable across machines)
    3. Local path fallback (not portable, for repos without remotes)
    """

    id: str = Field(default_factory=lambda: str(uuid.uuid4())[:12])
    name: str
    parent_id: str | None = None
    repo_path: str | None = None
    remote_url: str | None = None  # Git remote URL if available
    source: str | None = None  # How namespace was derived (explicit, git_remote, path)
    created_at: datetime = Field(default_factory=datetime.now)
    metadata: dict[str, Any] = Field(default_factory=dict)

    @classmethod
    def global_ns(cls) -> "Namespace":
        return cls(id="global", name="global")

    @classmethod
    def for_repo(cls, repo_path: str, use_path_fallback: bool = True) -> "Namespace":
        """
        Create namespace for a repository.

        Derivation priority:
        1. Explicit namespace_id from .contextfs/config.yaml
        2. Git remote origin URL (portable across machines)
        3. Local path (fallback, not portable)

        Args:
            repo_path: Path to the repository
            use_path_fallback: If False, return None when no remote URL found

        Returns:
            Namespace object with stable ID
        """
        from pathlib import Path

        resolved_path = str(Path(repo_path).resolve())
        repo_name = resolved_path.split("/")[-1]

        # 1. Check for explicit namespace in .contextfs/config.yaml
        explicit_id = _read_contextfs_namespace(resolved_path)
        if explicit_id:
            return cls(
                id=explicit_id,
                name=repo_name,
                repo_path=resolved_path,
                source=NamespaceSource.EXPLICIT,
            )

        # 2. Try git remote URL (portable across machines)
        remote_url = _get_git_remote_url(resolved_path)
        if remote_url:
            normalized_url = _normalize_git_url(remote_url)
            repo_id = hashlib.sha256(normalized_url.encode()).hexdigest()[:12]
            return cls(
                id=f"repo-{repo_id}",
                name=repo_name,
                repo_path=resolved_path,
                remote_url=remote_url,
                source=NamespaceSource.GIT_REMOTE,
            )

        # 3. Fallback to path-based (not portable, but works for local-only repos)
        if use_path_fallback:
            repo_id = hashlib.sha256(resolved_path.encode()).hexdigest()[:12]
            return cls(
                id=f"local-{repo_id}",
                name=repo_name,
                repo_path=resolved_path,
                source=NamespaceSource.PATH,
            )

        return None

    @classmethod
    def for_repo_legacy(cls, repo_path: str) -> "Namespace":
        """
        Legacy path-based namespace generation.

        Use this only for migration purposes or when you specifically
        need the old path-based behavior.
        """
        from pathlib import Path

        resolved_path = str(Path(repo_path).resolve())
        repo_id = hashlib.sha256(resolved_path.encode()).hexdigest()[:12]
        return cls(
            id=f"repo-{repo_id}",
            name=resolved_path.split("/")[-1],
            repo_path=resolved_path,
            source=NamespaceSource.PATH,
        )

`for_repo(repo_path, use_path_fallback=True)` `classmethod` ¶

Create namespace for a repository.

Derivation priority: 1. Explicit namespace_id from .contextfs/config.yaml 2. Git remote origin URL (portable across machines) 3. Local path (fallback, not portable)

Parameters:

Name	Type	Description	Default
`repo_path`	`str`	Path to the repository	required
`use_path_fallback`	`bool`	If False, return None when no remote URL found	`True`

Returns:

Type	Description
`Namespace`	Namespace object with stable ID

Source code in src/contextfs/schemas.py

@classmethod
def for_repo(cls, repo_path: str, use_path_fallback: bool = True) -> "Namespace":
    """
    Create namespace for a repository.

    Derivation priority:
    1. Explicit namespace_id from .contextfs/config.yaml
    2. Git remote origin URL (portable across machines)
    3. Local path (fallback, not portable)

    Args:
        repo_path: Path to the repository
        use_path_fallback: If False, return None when no remote URL found

    Returns:
        Namespace object with stable ID
    """
    from pathlib import Path

    resolved_path = str(Path(repo_path).resolve())
    repo_name = resolved_path.split("/")[-1]

    # 1. Check for explicit namespace in .contextfs/config.yaml
    explicit_id = _read_contextfs_namespace(resolved_path)
    if explicit_id:
        return cls(
            id=explicit_id,
            name=repo_name,
            repo_path=resolved_path,
            source=NamespaceSource.EXPLICIT,
        )

    # 2. Try git remote URL (portable across machines)
    remote_url = _get_git_remote_url(resolved_path)
    if remote_url:
        normalized_url = _normalize_git_url(remote_url)
        repo_id = hashlib.sha256(normalized_url.encode()).hexdigest()[:12]
        return cls(
            id=f"repo-{repo_id}",
            name=repo_name,
            repo_path=resolved_path,
            remote_url=remote_url,
            source=NamespaceSource.GIT_REMOTE,
        )

    # 3. Fallback to path-based (not portable, but works for local-only repos)
    if use_path_fallback:
        repo_id = hashlib.sha256(resolved_path.encode()).hexdigest()[:12]
        return cls(
            id=f"local-{repo_id}",
            name=repo_name,
            repo_path=resolved_path,
            source=NamespaceSource.PATH,
        )

    return None

`for_repo_legacy(repo_path)` `classmethod` ¶

Legacy path-based namespace generation.

Use this only for migration purposes or when you specifically need the old path-based behavior.

Source code in src/contextfs/schemas.py

@classmethod
def for_repo_legacy(cls, repo_path: str) -> "Namespace":
    """
    Legacy path-based namespace generation.

    Use this only for migration purposes or when you specifically
    need the old path-based behavior.
    """
    from pathlib import Path

    resolved_path = str(Path(repo_path).resolve())
    repo_id = hashlib.sha256(resolved_path.encode()).hexdigest()[:12]
    return cls(
        id=f"repo-{repo_id}",
        name=resolved_path.split("/")[-1],
        repo_path=resolved_path,
        source=NamespaceSource.PATH,
    )

API Reference¶

contextfs.core.ContextFS ¶

__init__(data_dir=None, namespace_id=None, auto_load=True, auto_index=True) ¶

save(content, type=MemoryType.FACT, tags=None, summary=None, namespace_id=None, source_tool=None, source_repo=None, project=None, metadata=None, created_at=None, updated_at=None, id=None, structured_data=None, authoritative=False) ¶

update(memory_id, content=None, type=None, tags=None, summary=None, project=None, metadata=None, authoritative=None) ¶

search(query, limit=10, type=None, tags=None, namespace_id=None, source_tool=None, source_repo=None, project=None, cross_repo=False, mode='hybrid', use_semantic=None) ¶

recall(memory_id) ¶

delete(memory_id, hard_delete=False) ¶

list_recent(limit=10, type=None, namespace_id=None, source_tool=None, project=None) ¶

index_repository(repo_path=None, on_progress=None, incremental=True, project=None, source_repo=None, mode='all') ¶

get_index_status(repo_path=None) ¶

clear_index(repo_path=None) ¶

start_session(tool='contextfs', label=None, repo_path=None, branch=None) ¶

end_session(generate_summary=True) ¶

update_session(session_id, label=None, summary=None) ¶

delete_session(session_id) ¶

get_current_session() ¶

list_sessions(limit=10, offset=0, tool=None, label=None, all_namespaces=False) ¶

contextfs.schemas.Memory ¶

typed_data property ¶

agent_run(content, agent_name, model=None, status='running', workflow_id=None, task_id=None, **kwargs) classmethod ¶

api(content, endpoint, method=None, parameters=None, **kwargs) classmethod ¶

as_typed(schema_type) ¶

as_versioned(schema_type) ¶

code(content, language=None, purpose=None, file_path=None, **kwargs) classmethod ¶

commit(content, sha=None, author=None, message=None, files_changed=None, **kwargs) classmethod ¶

config(content, name, environment=None, settings=None, **kwargs) classmethod ¶

decision(content, decision, rationale=None, alternatives=None, **kwargs) classmethod ¶

dependency(content, name, version='unknown', dep_type=None, **kwargs) classmethod ¶

doc(content, doc_type=None, title=None, url=None, **kwargs) classmethod ¶

episodic(content, session_type=None, participants=None, outcome=None, tool=None, **kwargs) classmethod ¶

error(content, error_type, message, file=None, line=None, resolution=None, **kwargs) classmethod ¶

fact(content, category=None, source=None, confidence=None, **kwargs) classmethod ¶

get_structured_field(field, default=None) ¶

issue(content, title, severity=None, status=None, **kwargs) classmethod ¶

procedural(content, steps, title=None, prerequisites=None, **kwargs) classmethod ¶

release(content, version, date=None, changes=None, **kwargs) classmethod ¶

review(content, pr_number, reviewer=None, status='pending', **kwargs) classmethod ¶

schema_def(content, name, schema_type=None, **kwargs) classmethod ¶

step(content, task_id, step_number=0, action=None, **kwargs) classmethod ¶

task(content, name, workflow_id=None, status='pending', assigned_agent=None, **kwargs) classmethod ¶

test_case(content, name, test_type=None, status=None, file=None, **kwargs) classmethod ¶

to_context_string() ¶

todo(content, title, status=None, priority=None, **kwargs) classmethod ¶

user(content, preference_key, preference_value=None, scope=None, **kwargs) classmethod ¶

validate_structured_data_schema() ¶

workflow(content, name, status='draft', description=None, **kwargs) classmethod ¶

contextfs.schemas.MemoryType ¶

contextfs.schemas.SearchResult ¶

contextfs.schemas.Session ¶

contextfs.schemas.Namespace ¶

for_repo(repo_path, use_path_fallback=True) classmethod ¶

for_repo_legacy(repo_path) classmethod ¶

`contextfs.core.ContextFS` ¶

`init(data_dir=None, namespace_id=None, auto_load=True, auto_index=True)` ¶

`save(content, type=MemoryType.FACT, tags=None, summary=None, namespace_id=None, source_tool=None, source_repo=None, project=None, metadata=None, created_at=None, updated_at=None, id=None, structured_data=None, authoritative=False)` ¶

`update(memory_id, content=None, type=None, tags=None, summary=None, project=None, metadata=None, authoritative=None)` ¶

`search(query, limit=10, type=None, tags=None, namespace_id=None, source_tool=None, source_repo=None, project=None, cross_repo=False, mode='hybrid', use_semantic=None)` ¶

`recall(memory_id)` ¶

`delete(memory_id, hard_delete=False)` ¶

`list_recent(limit=10, type=None, namespace_id=None, source_tool=None, project=None)` ¶

`index_repository(repo_path=None, on_progress=None, incremental=True, project=None, source_repo=None, mode='all')` ¶

`get_index_status(repo_path=None)` ¶

`clear_index(repo_path=None)` ¶

`start_session(tool='contextfs', label=None, repo_path=None, branch=None)` ¶

`end_session(generate_summary=True)` ¶

`update_session(session_id, label=None, summary=None)` ¶

`delete_session(session_id)` ¶

`get_current_session()` ¶

`list_sessions(limit=10, offset=0, tool=None, label=None, all_namespaces=False)` ¶

`contextfs.schemas.Memory` ¶

`typed_data` `property` ¶

`agent_run(content, agent_name, model=None, status='running', workflow_id=None, task_id=None, **kwargs)` `classmethod` ¶

`api(content, endpoint, method=None, parameters=None, **kwargs)` `classmethod` ¶

`as_typed(schema_type)` ¶

`as_versioned(schema_type)` ¶

`code(content, language=None, purpose=None, file_path=None, **kwargs)` `classmethod` ¶

`commit(content, sha=None, author=None, message=None, files_changed=None, **kwargs)` `classmethod` ¶

`config(content, name, environment=None, settings=None, **kwargs)` `classmethod` ¶

`decision(content, decision, rationale=None, alternatives=None, **kwargs)` `classmethod` ¶

`dependency(content, name, version='unknown', dep_type=None, **kwargs)` `classmethod` ¶

`doc(content, doc_type=None, title=None, url=None, **kwargs)` `classmethod` ¶

`episodic(content, session_type=None, participants=None, outcome=None, tool=None, **kwargs)` `classmethod` ¶

`error(content, error_type, message, file=None, line=None, resolution=None, **kwargs)` `classmethod` ¶

`fact(content, category=None, source=None, confidence=None, **kwargs)` `classmethod` ¶

`get_structured_field(field, default=None)` ¶

`issue(content, title, severity=None, status=None, **kwargs)` `classmethod` ¶

`procedural(content, steps, title=None, prerequisites=None, **kwargs)` `classmethod` ¶

`release(content, version, date=None, changes=None, **kwargs)` `classmethod` ¶

`review(content, pr_number, reviewer=None, status='pending', **kwargs)` `classmethod` ¶

`schema_def(content, name, schema_type=None, **kwargs)` `classmethod` ¶

`step(content, task_id, step_number=0, action=None, **kwargs)` `classmethod` ¶

`task(content, name, workflow_id=None, status='pending', assigned_agent=None, **kwargs)` `classmethod` ¶

`test_case(content, name, test_type=None, status=None, file=None, **kwargs)` `classmethod` ¶

`to_context_string()` ¶

`todo(content, title, status=None, priority=None, **kwargs)` `classmethod` ¶

`user(content, preference_key, preference_value=None, scope=None, **kwargs)` `classmethod` ¶

`validate_structured_data_schema()` ¶

`workflow(content, name, status='draft', description=None, **kwargs)` `classmethod` ¶

`contextfs.schemas.MemoryType` ¶

`contextfs.schemas.SearchResult` ¶

`contextfs.schemas.Session` ¶

`contextfs.schemas.Namespace` ¶

`for_repo(repo_path, use_path_fallback=True)` `classmethod` ¶

`for_repo_legacy(repo_path)` `classmethod` ¶