model_reference_manager

Singleton manager for model reference lifecycle: backend selection, caching, and the public API.

TModelRecord `module-attribute`

# Generic type variable bounded by GenericModelRecord (accepts it or any subclass).
TModelRecord = TypeVar(
    "TModelRecord", bound=GenericModelRecord
)

`__all__` `module-attribute`

# Names exported by a star-import of this module.
__all__ = [
    "DeferredPrefetchHandle",
    "ModelReferenceManager",
    "PrefetchStrategy",
]

PrefetchStrategy

Bases: StrEnum

Controls when and how the manager fetches model references.

Source code in src/horde_model_reference/model_reference_manager.py

class PrefetchStrategy(StrEnum):
    """Controls when and how the manager fetches model references.

    Members are string-valued (``StrEnum``), so a plain string such as ``"sync"``
    can be converted with ``PrefetchStrategy("sync")``. Iteration order follows the
    declaration order below.
    """

    LAZY = "lazy"
    """Defer backend fetches until first access (legacy lazy_mode=True behavior)."""

    SYNC = "sync"
    """Immediately fetch all categories on the calling thread during initialization."""

    DEFERRED = "deferred"
    """Expose a handle the caller can trigger later (sync or async) without blocking init."""

    ASYNC = "async"
    """Automatically schedule a background async warm-up when an event loop is available."""

    NONE = "none"
    """Skip all automatic warm-up; callers must invoke caching helpers manually."""

LAZY `class-attribute` `instance-attribute`

LAZY = 'lazy'

Defer backend fetches until first access (legacy lazy_mode=True behavior).

SYNC `class-attribute` `instance-attribute`

SYNC = 'sync'

Immediately fetch all categories on the calling thread during initialization.

DEFERRED `class-attribute` `instance-attribute`

DEFERRED = 'deferred'

Expose a handle the caller can trigger later (sync or async) without blocking init.

ASYNC `class-attribute` `instance-attribute`

ASYNC = 'async'

Automatically schedule a background async warm-up when an event loop is available.

NONE `class-attribute` `instance-attribute`

NONE = 'none'

Skip all automatic warm-up; callers must invoke caching helpers manually.

ModelReferenceManager

Singleton class for downloading and reading model reference files.

This class is responsible for managing the lifecycle of model reference files, including downloading, caching, and providing access to the model references.

Uses a pluggable backend architecture to support different data sources (GitHub, database, etc.).

Settings on initialization (base_path, backend, prefetch_strategy, etc.) are only set on the first instantiation (e.g. ModelReferenceManager(base_path=...)). Subsequent instantiations will return the same instance.

Retrieve all model references with get_all_model_references_or_none().

Source code in src/horde_model_reference/model_reference_manager.py

class ModelReferenceManager:
    """Singleton class for downloading and reading model reference files.

    This class is responsible for managing the lifecycle of model reference files,
    including downloading, caching, and providing access to the model references.

    Uses a pluggable backend architecture to support different data sources (GitHub, database, etc.).

    Settings on initialization (base_path, backend, prefetch_strategy, etc.) are only set on the first
    instantiation (e.g. `ModelReferenceManager(base_path=...)`). Subsequent instantiations will return
    the same instance.

    Retrieve all model references with `get_all_model_references_or_none()`.
    """

    backend: ModelReferenceBackend
    """The backend provider for model reference data."""
    _cached_records: dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]
    """Cache of pydantic model records by category."""

    # Class-level defaults. ``__new__`` assigns the real values on the singleton
    # instance when it is first created.
    _instance: ModelReferenceManager | None = None
    _replicate_mode: ReplicateMode = ReplicateMode.REPLICA
    _offline: bool = False
    _prefetch_strategy: PrefetchStrategy = PrefetchStrategy.SYNC
    _deferred_prefetch_handle: DeferredPrefetchHandle | None = None
    _async_prefetch_task: asyncio.Task[None] | None = None
    _provider_registry: ModelProviderRegistry
    # The following are only populated when the backend reports ``supports_writes()``.
    _audit_writer: AuditTrailWriter | None = None
    _pending_queue_service: PendingQueueService | None = None
    _group_alias_store: GroupAliasStore | None = None
    _group_family_store: GroupFamilyStore | None = None
    _group_schema_store: GroupSchemaStore | None = None

    # Re-entrant lock defined on the class; guards singleton creation/reset and
    # access to the pydantic record cache.
    _lock: RLock = RLock()

    @classmethod
    def get_instance(cls) -> ModelReferenceManager:
        """Return the already-created singleton.

        Unlike calling the class, this never creates an instance.

        Returns:
            ModelReferenceManager: The existing singleton instance.

        Raises:
            RuntimeError: If no instance has been created yet.

        """
        with cls._lock:
            existing = cls._instance

        if existing is not None:
            return existing
        raise RuntimeError("ModelReferenceManager instance has not been created yet.")

    @classmethod
    def has_instance(cls) -> bool:
        """Report whether the singleton currently exists.

        Returns:
            bool: True when an instance has been created (and not reset), else False.

        """
        with cls._lock:
            exists = cls._instance is not None
        return exists

    @classmethod
    def reset(cls) -> None:
        """Drop the singleton so the next instantiation builds a fresh manager.

        Meant for tests and development only; production code is expected to keep
        the singleton alive for the lifetime of the process.

        Any deferred prefetch handle is discarded and a still-running async
        prefetch task is cancelled before the instance reference is cleared.
        """
        with cls._lock:
            current = cls._instance
            if current is None:
                # Nothing to tear down.
                return

            current._deferred_prefetch_handle = None

            pending_task = current._async_prefetch_task
            if pending_task is not None and not pending_task.done():
                pending_task.cancel()
                current._async_prefetch_task = None

            cls._instance = None

    @staticmethod
    def _create_backend(
        base_path: str | Path,
        replicate_mode: ReplicateMode,
        audit_writer: AuditTrailWriter | None,
        offline: bool = False,
    ) -> ModelReferenceBackend:
        """Build the backend matching the requested mode and the global settings.

        Selection order:

        1. ``offline=True``: ``LocalReadOnlyBackend`` (no downloads).
        2. ``ReplicateMode.PRIMARY``: ``FileSystemBackend``, seeded from GitHub when
           seeding is enabled and category files are missing, and wrapped in
           ``RedisBackend`` when Redis is enabled.
        3. Anything else: ``HTTPBackend`` when a PRIMARY API URL is configured,
           otherwise a bare ``GitHubBackend``.

        Args:
            base_path: Base path for model reference files.
            replicate_mode: The replication mode.
            audit_writer: Optional audit writer used by write-capable backends.
            offline: If True, return a read-only local-disk backend that never downloads,
                regardless of replicate_mode. Used by subprocesses whose parent owns downloading.

        Returns:
            ModelReferenceBackend: The configured backend instance.

        """
        settings = horde_model_reference_settings

        logger.debug(
            f"Creating backend with replicate_mode={replicate_mode}, base_path={base_path}, offline={offline}",
        )

        if offline:
            logger.info("Using LocalReadOnlyBackend (offline=True); references are read from disk, never downloaded")
            return LocalReadOnlyBackend(
                base_path=base_path,
                cache_ttl_seconds=settings.cache_ttl_seconds,
            )

        if replicate_mode == ReplicateMode.PRIMARY:
            logger.debug("Creating backend for PRIMARY mode")

            # When seeding is enabled the constructor skips its own metadata
            # population; it is run explicitly below once the files are in place.
            seeding_enabled = bool(settings.github_seed_enabled)

            primary_backend = FileSystemBackend(
                base_path=base_path,
                cache_ttl_seconds=settings.cache_ttl_seconds,
                replicate_mode=ReplicateMode.PRIMARY,
                skip_startup_metadata_population=seeding_enabled,
                audit_writer=audit_writer,
            )

            if seeding_enabled:
                logger.info("GitHub seeding enabled for PRIMARY mode")

                category_paths = primary_backend.get_all_category_file_paths()
                missing_categories = [
                    cat for cat, path in category_paths.items() if path is None or not path.exists()
                ]

                if missing_categories:
                    logger.info(f"Missing categories detected: {missing_categories}. Seeding from GitHub...")

                    seed_source = GitHubBackend(
                        base_path=base_path,
                        replicate_mode=ReplicateMode.PRIMARY,
                    )
                    seed_source.fetch_all_categories(force_refresh=True)
                    logger.info("GitHub seeding completed")

                    logger.info("Populating metadata after GitHub seeding")
                else:
                    logger.debug("All files exist, skipping GitHub seeding")
                    logger.info("Running metadata population check (seeding was skipped)")

                # Metadata population runs in both cases because the constructor skipped it.
                primary_backend.ensure_all_metadata_populated()

            if settings.redis.use_redis:
                # Imported lazily so the Redis backend is only loaded when it is used.
                from horde_model_reference.backends.redis_backend import RedisBackend

                logger.info("Wrapping FileSystemBackend with RedisBackend for distributed caching")
                return RedisBackend(
                    file_backend=primary_backend,
                    redis_settings=settings.redis,
                    cache_ttl_seconds=settings.cache_ttl_seconds,
                )

            logger.info("Using FileSystemBackend for single-worker PRIMARY deployment")
            return primary_backend

        logger.debug("Creating backend for REPLICA mode")

        replica_github = GitHubBackend(
            base_path=base_path,
            replicate_mode=ReplicateMode.REPLICA,
        )

        if not settings.primary_api_url:
            logger.info("Using GitHubBackend only (no PRIMARY API configured)")
            return replica_github

        logger.info(f"Using HTTPBackend with PRIMARY API: {settings.primary_api_url}")
        return HTTPBackend(
            primary_api_url=settings.primary_api_url,
            github_backend=replica_github,
            cache_ttl_seconds=settings.cache_ttl_seconds,
            timeout_seconds=settings.primary_api_timeout,
            enable_github_fallback=settings.enable_github_fallback,
        )

    def __new__(
        cls,
        *,
        backend: ModelReferenceBackend | None = None,
        base_path: str | Path = horde_model_reference_paths.base_path,
        replicate_mode: ReplicateMode = horde_model_reference_settings.replicate_mode,
        prefetch_strategy: PrefetchStrategy = PrefetchStrategy.LAZY,
        offline: bool = horde_model_reference_settings.offline,
    ) -> ModelReferenceManager:
        """Create a new instance of ModelReferenceManager.

        Uses the singleton pattern to ensure only one instance exists to avoid multiple downloads and conversions.
        Subsequent instantiations will return the same instance, and an attempt to re-instantiate with different
        settings will raise an exception.

        If first-time initialization fails (backend creation, mode validation, or the initial prefetch
        raises), the partially built instance is discarded so that a later call can retry cleanly instead
        of finding a half-initialized singleton.

        Args:
            backend: The backend to use for fetching model references.
                If None, automatically selects the appropriate backend based on replicate_mode and settings:
                - PRIMARY mode: FileSystemBackend (optionally wrapped with RedisBackend if configured)
                - REPLICA mode: HTTPBackend (if PRIMARY API URL configured) or GitHubBackend (fallback)
                Defaults to None.
            base_path: The base path to use for storing model reference files.
                Only used if backend is None. Defaults to horde_model_reference_paths.base_path.
            replicate_mode: The replicate mode to use.
                - PRIMARY: Local filesystem is source of truth
                - REPLICA: Fetch from PRIMARY API or GitHub
                Only used if backend is None. Defaults to horde_model_reference_settings.replicate_mode.
            prefetch_strategy: Controls whether initial cache warm-up is skipped (LAZY/NONE),
                performed synchronously, deferred, or executed via background async task.
                Plain strings are coerced to ``PrefetchStrategy``. Defaults to PrefetchStrategy.LAZY.
            offline: If True, read references from local disk only via LocalReadOnlyBackend and never
                download (no GitHub / PRIMARY API / Redis), regardless of replicate_mode. Intended for
                subprocesses whose parent already downloaded the reference files.
                Defaults to horde_model_reference_settings.offline.

        Returns:
            ModelReferenceManager: The singleton instance of ModelReferenceManager.

        Raises:
            ValueError: If prefetch_strategy is not a valid ``PrefetchStrategy`` value.
            RuntimeError: If the backend's replicate mode does not match the requested one, or if an
                attempt is made to re-instantiate with different settings (the arguments of every call,
                including defaults, are compared against the existing instance).

        """
        if not isinstance(prefetch_strategy, PrefetchStrategy):
            try:
                prefetch_strategy = PrefetchStrategy(prefetch_strategy)
            except ValueError as exc:  # pragma: no cover - defensive branch
                raise ValueError(
                    f"prefetch_strategy must be one of: {', '.join(strategy.value for strategy in PrefetchStrategy)}"
                ) from exc

        with cls._lock:
            existing = cls._instance

            if existing is None:
                instance = super().__new__(cls)
                # Publish the instance before initialising it (as before), but roll the
                # publication back on any failure so the singleton is never left half-built.
                cls._instance = instance
                try:
                    audit_writer: AuditTrailWriter | None = None
                    if horde_model_reference_settings.audit.enabled:
                        audit_writer = AuditTrailWriter(
                            root_path=horde_model_reference_paths.audit_path,
                            max_file_size_bytes=horde_model_reference_settings.audit.max_segment_bytes,
                        )

                    if backend is None:
                        backend = cls._create_backend(
                            base_path=base_path,
                            replicate_mode=replicate_mode,
                            audit_writer=audit_writer,
                            offline=offline,
                        )

                    # Offline backends are REPLICA-shaped regardless of the requested mode; align the
                    # manager's recorded mode to the backend so the mode-match check below holds and
                    # downstream code does not assume PRIMARY write capability.
                    if offline:
                        replicate_mode = backend.replicate_mode

                    backend_mode = backend.replicate_mode
                    if backend_mode != replicate_mode:
                        raise RuntimeError(
                            "Backend replicate_mode does not match requested ModelReferenceManager configuration. "
                            f"Backend mode: {backend_mode}, requested mode: {replicate_mode}."
                        )

                    instance.backend = backend
                    instance._replicate_mode = replicate_mode
                    instance._offline = offline

                    # Write-side collaborators only exist for backends that accept writes.
                    if backend.supports_writes():
                        instance._audit_writer = audit_writer
                        instance._pending_queue_service = cls._build_pending_queue_service(
                            audit_writer=audit_writer,
                        )
                        instance._group_alias_store = GroupAliasStore(
                            file_path=horde_model_reference_paths.group_aliases_path,
                        )
                        instance._group_family_store = GroupFamilyStore(
                            file_path=horde_model_reference_paths.group_families_path,
                        )
                        instance._group_schema_store = GroupSchemaStore(
                            file_path=horde_model_reference_paths.group_schemas_path,
                            alias_store=instance._group_alias_store,
                        )
                    else:
                        instance._audit_writer = None
                        instance._pending_queue_service = None
                        instance._group_alias_store = None
                        instance._group_family_store = None
                        instance._group_schema_store = None

                    instance._cached_records = {}
                    instance._deferred_prefetch_handle = None
                    instance._async_prefetch_task = None
                    instance._provider_registry = ModelProviderRegistry()

                    # Register invalidation callback so backend can notify us when cache is stale
                    instance.backend.register_invalidation_callback(instance._on_backend_invalidated)

                    instance._apply_prefetch_strategy(strategy=prefetch_strategy)
                except BaseException:
                    # Initialization failed: un-publish the broken instance and let the error propagate.
                    if cls._instance is instance:
                        cls._instance = None
                    raise

                return instance

            if backend is not None and backend is not existing.backend:
                raise RuntimeError(
                    "ModelReferenceManager is a singleton and has already been instantiated "
                    "with a different backend."
                )
            if offline != existing._offline:
                raise RuntimeError(
                    "ModelReferenceManager is a singleton and has already been instantiated with a different "
                    f"offline setting.\nExisting offline={existing._offline}; new offline={offline}."
                )
            # In offline mode the recorded replicate_mode comes from the backend, so it is not compared.
            if not offline and replicate_mode != existing._replicate_mode:
                raise RuntimeError(
                    "ModelReferenceManager is a singleton and has already been instantiated with different "
                    "settings.\nExisting settings: "
                    f"replicate_mode={existing._replicate_mode}.\n"
                    "New settings: "
                    f"replicate_mode={replicate_mode}."
                )
            if prefetch_strategy != existing._prefetch_strategy:
                raise RuntimeError(
                    "ModelReferenceManager is a singleton and has already been instantiated with different "
                    "settings."
                    f"\nExisting prefetch_strategy={existing._prefetch_strategy.value};"
                    f" new prefetch_strategy={prefetch_strategy.value}."
                )

            return existing

    def _apply_prefetch_strategy(self, *, strategy: PrefetchStrategy) -> None:
        """Record ``strategy`` and perform whatever warm-up it calls for.

        Any previously stored deferred handle or async task reference is cleared first.

        Args:
            strategy: The prefetch strategy to apply.

        Raises:
            ValueError: If ``strategy`` is not one of the known strategies.

        """
        self._prefetch_strategy = strategy
        self._deferred_prefetch_handle = None
        self._async_prefetch_task = None

        if strategy in (PrefetchStrategy.LAZY, PrefetchStrategy.NONE):
            # Nothing to warm up front for these strategies.
            logger.debug(f"prefetch skipped because strategy={strategy.value}")
        elif strategy is PrefetchStrategy.SYNC:
            self._fetch_from_backend_if_needed(force_refresh=False)
        elif strategy is PrefetchStrategy.DEFERRED:
            self._deferred_prefetch_handle = DeferredPrefetchHandle(manager=self, force_refresh=False)
            logger.info(
                "Deferred prefetch handle created; call run_sync/run_async to warm caches without blocking",
            )
        elif strategy is PrefetchStrategy.ASYNC:
            self._schedule_async_prefetch(force_refresh=False)
        else:
            raise ValueError(f"Unsupported prefetch strategy: {strategy}")

    def _on_backend_invalidated(self, category: MODEL_REFERENCE_CATEGORY) -> None:
        """Handle a backend notification that a category's data is stale.

        Registered with the backend as its invalidation callback; drops the matching
        pydantic records so they stay in sync with the backend.

        Args:
            category: The category that was invalidated.

        """
        logger.debug(f"Backend invalidated category {category}, clearing pydantic cache")
        self._invalidate_cache(category=category)

    def _invalidate_cache(self, category: MODEL_REFERENCE_CATEGORY | None = None) -> None:
        """Drop cached pydantic records, either for one category or for all of them.

        Args:
            category: The single category to drop. When None, the whole cache is replaced
                with an empty dict.

        """
        with self._lock:
            if category is not None:
                logger.debug(f"Invalidating cached pydantic records for category: {category}.")
                # pop with a default so an uncached category is a no-op.
                self._cached_records.pop(category, None)
                return

            logger.debug("Invalidating entire cached pydantic records.")
            self._cached_records = {}

    def invalidate_category_cache(self, category: MODEL_REFERENCE_CATEGORY) -> None:
        """Explicitly invalidate cached data for a category.

        Public wrapper around ``_invalidate_cache`` for a single category.

        Intended for use by the apply workflow after a successful backend write,
        so stale data is never served regardless of backend callback timing.

        Args:
            category: The category whose cache should be dropped.

        """
        self._invalidate_cache(category)

    def _fetch_from_backend_if_needed(
        self,
        force_refresh: bool,
    ) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None]:
        """Ask the backend for every category and return its raw result.

        Args:
            force_refresh: Whether to force refresh all categories.

        Returns:
            The mapping returned by the backend's ``fetch_all_categories``.

        """
        fetched = self.backend.fetch_all_categories(force_refresh=force_refresh)
        return fetched

    async def _fetch_from_backend_if_needed_async(
        self,
        force_refresh: bool,
        httpx_client: httpx.AsyncClient | None,
    ) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None]:
        """Ask the backend for every category via its async API and return the raw result.

        Args:
            force_refresh: Whether to force refresh all categories.
            httpx_client: An optional httpx async client to use.

        Returns:
            The mapping returned by the backend's ``fetch_all_categories_async``.

        """
        fetched = await self.backend.fetch_all_categories_async(
            force_refresh=force_refresh,
            httpx_client=httpx_client,
        )
        return fetched

    @staticmethod
    def _build_pending_queue_service(
        *,
        audit_writer: AuditTrailWriter | None,
    ) -> PendingQueueService | None:
        """Build the pending queue service, or return None when the feature is disabled.

        Args:
            audit_writer: Optional audit writer handed to the service.

        Returns:
            A ``PendingQueueService`` backed by a store rooted at the configured pending
            queue path, or None when the pending queue setting is disabled.

        """
        if horde_model_reference_settings.pending_queue.enabled:
            # Imported lazily, only when the feature is enabled.
            from horde_model_reference.pending_queue.service import PendingQueueService
            from horde_model_reference.pending_queue.store import PendingQueueStore

            queue_store = PendingQueueStore(root_path=horde_model_reference_paths.pending_queue_path)
            return PendingQueueService(store=queue_store, audit_writer=audit_writer)

        return None

    @property
    def prefetch_strategy(self) -> PrefetchStrategy:
        """Return the prefetch strategy recorded for this manager.

        The value is stored by ``_apply_prefetch_strategy``.
        """
        return self._prefetch_strategy

    @property
    def offline(self) -> bool:
        """Return whether this manager reads from local disk only (never downloads).

        Reflects the ``offline`` flag recorded when the singleton was created.
        """
        return self._offline

    @property
    def pending_queue_service(self) -> PendingQueueService | None:
        """Return the pending queue service, or ``None`` when it is unavailable.

        It is ``None`` when the backend does not support writes or when the pending
        queue setting is disabled.
        """
        return self._pending_queue_service

    @property
    def group_alias_store(self) -> GroupAliasStore | None:
        """Return the group alias store, or ``None`` when the backend does not support writes."""
        return self._group_alias_store

    @property
    def group_family_store(self) -> GroupFamilyStore | None:
        """Return the related-group family store, or ``None`` when the backend does not support writes."""
        return self._group_family_store

    @property
    def group_schema_store(self) -> GroupSchemaStore | None:
        """Return the group schema store, or ``None`` when the backend does not support writes."""
        return self._group_schema_store

    @property
    def deferred_prefetch_handle(self) -> DeferredPrefetchHandle | None:
        """Handle that callers can use to trigger a deferred eager fetch.

        ``None`` when no handle has been created (for example with the LAZY, NONE or
        SYNC strategies, unless ``create_deferred_prefetch_handle`` was called).
        """
        return self._deferred_prefetch_handle

    @property
    def is_warm(self) -> bool:
        """Tell whether every category has an entry in the in-memory record cache.

        Only the in-memory cache is inspected; the backend is not consulted. A category
        cached as ``None`` (e.g. managed elsewhere or empty) still counts as loaded, so
        ``False`` means at least one category has no cache entry at all. Useful for
        asserting readiness after a warm-up (e.g. ``PrefetchStrategy.ASYNC`` or
        :meth:`ensure_ready_async`) instead of relying on a log line.
        """
        with self._lock:
            loaded = self._cached_records
            for category in MODEL_REFERENCE_CATEGORY:
                if category not in loaded:
                    return False
            return True

    @property
    def prefetch_pending(self) -> bool:
        """Tell whether a deferred warm-up is waiting for the caller to trigger it.

        ``True`` requires all of: a :class:`DeferredPrefetchHandle` is stored, no async
        prefetch task has been recorded, and the cache is not warm. In that state the
        caller must run the handle (``run_sync`` / ``run_async``) to warm the cache.
        This makes the ``PrefetchStrategy.ASYNC`` "no running event loop" degrade
        discoverable beyond the logged warning.
        """
        if self._deferred_prefetch_handle is None:
            return False
        if self._async_prefetch_task is not None:
            return False
        return not self.is_warm

    def create_deferred_prefetch_handle(
        self,
        *,
        force_refresh: bool = False,
    ) -> DeferredPrefetchHandle:
        """Build a new deferred prefetch handle bound to this manager and remember it.

        The new handle replaces any handle previously stored on the manager.

        Args:
            force_refresh: Whether the handle should bypass backend caches.

        Returns:
            DeferredPrefetchHandle: Handle that can execute the warm-up later.

        """
        self._deferred_prefetch_handle = DeferredPrefetchHandle(manager=self, force_refresh=force_refresh)
        return self._deferred_prefetch_handle

    def _schedule_async_prefetch(self, *, force_refresh: bool) -> None:
        """Schedule an async cache warm-up when an event loop is available.

        A deferred handle is always created first. When a running event loop exists the
        handle's ``run_async`` coroutine is scheduled on it as a task; otherwise only the
        handle is exposed so the caller can run it manually.

        Args:
            force_refresh: Whether the warm-up should bypass backend caches.

        """
        handle = self.create_deferred_prefetch_handle(force_refresh=force_refresh)

        try:
            loop = asyncio.get_running_loop()
        except RuntimeError:
            logger.warning(
                "PrefetchStrategy.ASYNC requested but no running event loop detected; "
                "exposing deferred handle for manual execution instead.",
            )
            self._async_prefetch_task = None
            return

        logger.info("Scheduling asynchronous prefetch warm-up task")
        task = loop.create_task(handle.run_async())
        self._async_prefetch_task = task

        def _log_completion(completed: asyncio.Task[None]) -> None:
            # A cancelled task (e.g. cancelled by ``reset``) is not a failure. Calling
            # ``result()``/``exception()`` on it would raise CancelledError, which is a
            # BaseException and would escape this callback.
            if completed.cancelled():
                logger.debug("Deferred async prefetch task was cancelled")
                return

            exc = completed.exception()
            if exc is not None:  # pragma: no cover - best-effort logging
                # f-string formatting, matching every other log call in this module.
                logger.error(f"Deferred async prefetch failed: {exc}")

        task.add_done_callback(_log_completion)

    async def warm_cache_async(
        self,
        *,
        force_refresh: bool = False,
        httpx_client: httpx.AsyncClient | None = None,
    ) -> None:
        """Warm cached pydantic records using backend async APIs.

        Delegates to ``get_all_model_references_or_none_async`` and discards its result.

        Args:
            force_refresh: Whether to bypass backend caches while warming. Forwarded as
                ``overwrite_existing``.
            httpx_client: Optional shared async client for HTTP backends.

        """
        await self.get_all_model_references_or_none_async(
            overwrite_existing=force_refresh,
            httpx_client=httpx_client,
        )

    def ensure_ready(self, *, overwrite_existing: bool = False) -> None:
        """Ensure cached references exist synchronously (sync mirror of :meth:`ensure_ready_async`).

        Useful for warming the cache up-front from synchronous code - or for completing
        a deferred ``PrefetchStrategy.ASYNC`` warm-up that degraded because no event loop
        was running at construction. After this returns, :attr:`is_warm` is expected to be
        ``True`` (this relies on ``get_all_model_references_or_none`` caching every category).

        Delegates to ``get_all_model_references_or_none`` and discards its result.

        Args:
            overwrite_existing: Whether to bypass backend caches while warming.

        """
        self.get_all_model_references_or_none(overwrite_existing=overwrite_existing)

    async def ensure_ready_async(
        self,
        *,
        overwrite_existing: bool = False,
        httpx_client: httpx.AsyncClient | None = None,
    ) -> None:
        """Ensure cached references exist by delegating to ``warm_cache_async``.

        Args:
            overwrite_existing: Whether to bypass backend caches while warming. Forwarded
                to ``warm_cache_async`` as ``force_refresh``.
            httpx_client: Optional shared async client for HTTP backends.

        """
        await self.warm_cache_async(force_refresh=overwrite_existing, httpx_client=httpx_client)

    def supports_metadata(self) -> bool:
        """Return whether the active backend tracks per-category metadata.

        Simply forwards the backend's own ``supports_metadata()`` answer.

        Metadata (timestamps, operation counts) is typically only available in PRIMARY
        mode; REPLICA backends return ``False``. Check this before relying on
        :meth:`get_metadata` / :meth:`last_updated` returning a value.
        """
        return self.backend.supports_metadata()

    def get_metadata(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        *,
        raise_if_unsupported: bool = False,
    ) -> CategoryMetadata | None:
        """Fetch per-category metadata from the backend when it supports metadata.

        A first-class manager accessor so library consumers do not need to reach into
        ``manager.backend`` and check ``supports_metadata()`` themselves.

        Args:
            category: The category to fetch metadata for.
            raise_if_unsupported: When ``True``, raise ``NotImplementedError`` instead of
                returning ``None`` if the backend does not support metadata.

        Returns:
            The category metadata, or ``None`` when unsupported (and not raising).

        Raises:
            NotImplementedError: If the backend lacks metadata support and
                ``raise_if_unsupported`` is ``True``.

        """
        if self.backend.supports_metadata():
            return self.backend.get_metadata(category)

        if raise_if_unsupported:
            raise NotImplementedError(f"{type(self.backend).__name__} does not support metadata tracking")
        return None

    async def get_metadata_async(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        *,
        raise_if_unsupported: bool = False,
    ) -> CategoryMetadata | None:
        """Async counterpart to :meth:`get_metadata`.

        Args:
            category: The category to fetch metadata for.
            raise_if_unsupported: When ``True``, raise ``NotImplementedError`` instead of
                returning ``None`` if the backend does not support metadata.

        Returns:
            The category metadata, or ``None`` when unsupported (and not raising).

        Raises:
            NotImplementedError: If the backend lacks metadata support and
                ``raise_if_unsupported`` is ``True``.

        """
        if self.backend.supports_metadata():
            return await self.backend.get_metadata_async(category)

        if raise_if_unsupported:
            raise NotImplementedError(f"{type(self.backend).__name__} does not support metadata tracking")
        return None

    def last_updated(self, category: MODEL_REFERENCE_CATEGORY) -> int | None:
        """Return the ``last_updated`` value from the category's metadata, if any.

        A convenience over :meth:`get_metadata` for cheap change-detection polling by
        library consumers.

        Args:
            category: The category to inspect.

        Returns:
            The ``last_updated`` unix timestamp, or ``None`` when no metadata is
            available (for example when the backend does not track metadata).

        """
        metadata = self.get_metadata(category)
        if metadata is None:
            return None
        return metadata.last_updated

    @staticmethod
    def _file_json_dict_to_model_reference(
        category: MODEL_REFERENCE_CATEGORY,
        file_json_dict: dict[str, Any] | None,
        safe_mode: bool = False,
    ) -> dict[str, GenericModelRecord] | None:
        """Validate a raw JSON dict into pydantic records keyed by record name.

        The record class is looked up per category, falling back to ``GenericModelRecord``.
        The input's own keys are ignored; the result is keyed by each validated record's
        ``name``, so a later entry with the same name replaces an earlier one.

        Args:
            category: The target model reference category to convert.
            file_json_dict: The dict object representing the model reference.
            safe_mode: Whether to raise exceptions on failure. If False, exceptions are caught,
                logged, and None is returned. Defaults to False.

        Returns:
            dict[str, GenericModelRecord] | None: The records keyed by name, or None when the
                input is None, the category is managed elsewhere, or conversion failed
                (with ``safe_mode`` False).

        """
        if file_json_dict is None:
            logger.warning(f"File dict json is None for {category}.")
            return None

        if category in categories_managed_elsewhere:
            logger.info(f"Skipping conversion for category: {category} (managed elsewhere)")
            return None

        try:
            record_type = MODEL_RECORD_TYPE_LOOKUP.get(category, GenericModelRecord)
            validated_records = (record_type.model_validate(raw_entry) for raw_entry in file_json_dict.values())
            return {record.name: record for record in validated_records}
        except Exception as e:
            if safe_mode:
                raise e
            logger.exception(f"Failed to convert file dict JSON to model reference for {category}: {e}")
            return None

    @staticmethod
    def model_reference_to_json_dict(
        model_reference: dict[str, GenericModelRecord],
        safe_mode: bool = False,
    ) -> dict[str, Any] | None:
        """Dump every record of a model reference into a plain ``name -> dict`` mapping.

        Each record is serialised with ``model_dump(exclude_unset=True)``.

        Args:
            model_reference: The model reference object to serialise.
            safe_mode: When ``True``, serialisation errors propagate to the caller.
                When ``False`` (default), they are logged and ``None`` is returned.
                Prefer `model_reference_to_json_dict_safe()` for a non-optional
                return type if you intend to use this.

        Returns:
            dict | None: The serialised mapping, or None if conversion failed with
                *safe_mode* disabled.

        Raises:
            ValueError: If *model_reference* is ``None`` (regardless of *safe_mode*).

        """
        if model_reference is None:
            raise ValueError("model_reference cannot be None")

        try:
            json_dict: dict[str, Any] = {}
            for model_name, model_record in model_reference.items():
                json_dict[model_name] = model_record.model_dump(exclude_unset=True)
            return json_dict
        except Exception as e:
            if safe_mode:
                raise e
            logger.exception(f"Failed to convert model reference to JSON: {e}")
            return None

    @staticmethod
    def model_reference_to_json_dict_safe(
        model_reference: dict[str, GenericModelRecord],
    ) -> dict[str, Any]:
        """Serialise a model reference to a JSON dictionary, never returning ``None``.

        Delegates to :meth:`model_reference_to_json_dict` with ``safe_mode=True`` so
        that conversion errors propagate instead of being swallowed.

        Args:
            model_reference: The model reference object.

        Returns:
            dict: The dict representing the model reference.

        Raises:
            RuntimeError: If the delegate unexpectedly returns ``None`` without raising.

        """
        converted = ModelReferenceManager.model_reference_to_json_dict(model_reference, safe_mode=True)
        if converted is not None:
            return converted

        raise RuntimeError("Conversion to JSON dict failed in safe mode, but no exception was raised.")

    def _get_all_cached_model_references(
        self,
        safe_mode: bool = False,
    ) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]:
        """Return a shallow copy of the cached pydantic model references.

        The copy is taken while holding ``self._lock``. *safe_mode* is accepted for
        signature parity with the callers but is not consulted here.

        Returns:
            dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]: A new
                top-level dict mapping categories to the cached per-category objects
                (the inner mappings are shared with the cache, not copied).

        """
        with self._lock:
            cached = self._cached_records
            logger.debug(f"Returning {len(cached)} cached pydantic model references.")
            snapshot = dict(cached)
        return snapshot

    def _evaluate_cache_state(
        self,
        *,
        overwrite_existing: bool,
        safe_mode: bool,
    ) -> tuple[
        bool,
        dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None],
        list[MODEL_REFERENCE_CATEGORY],
    ]:
        """Decide whether the cache can be served as-is and which categories must be reloaded.

        Returns:
            A ``(use_cache, cached_result, categories_to_load)`` triple. When
            ``use_cache`` is ``True`` the second element is a copy of the cache and
            the list is empty. Otherwise the second element is an empty dict and the
            list names every category that is absent from the cache, cached as
            ``None``, flagged by ``backend.needs_refresh``, or (when
            *overwrite_existing* is set) simply every category.

        """
        with self._lock:
            # Ask the backend about every category up front, before inspecting the cache.
            stale_by_category = {
                category: self.backend.needs_refresh(category) for category in MODEL_REFERENCE_CATEGORY
            }
            every_category_present = all(category in self._cached_records for category in MODEL_REFERENCE_CATEGORY)
            refresh_required = overwrite_existing or any(stale_by_category.values())

            # Presence is judged by key only: a category cached as None still counts as cached here.
            if every_category_present and not refresh_required:
                logger.debug("Using fully cached pydantic model references.")
                return True, self._get_all_cached_model_references(safe_mode=safe_mode), []

            # ``.get(...) is None`` covers both "key missing" and "cached as None".
            pending: list[MODEL_REFERENCE_CATEGORY] = [
                category
                for category in MODEL_REFERENCE_CATEGORY
                if overwrite_existing or self._cached_records.get(category) is None or stale_by_category[category]
            ]
            return False, {}, pending

    def _load_categories_from_payload(
        self,
        *,
        categories_to_load: Iterable[MODEL_REFERENCE_CATEGORY],
        payload: dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None] | None,
        overwrite_existing: bool,
        safe_mode: bool,
    ) -> None:
        """Populate the record cache for the requested categories from a backend payload.

        Categories present in *payload* are taken from it; any that are absent are
        fetched individually via ``backend.fetch_category``. Every resulting raw
        mapping is then converted with :meth:`_file_json_dict_to_model_reference`
        and stored in ``self._cached_records`` while holding ``self._lock``.

        Args:
            categories_to_load: Categories whose cache entries should be (re)built.
            payload: Raw per-category JSON from the backend; ``None`` is treated as empty.
            overwrite_existing: Forwarded as ``force_refresh`` to per-category fetches.
            safe_mode: Forwarded to the conversion helper.

        """
        available = payload or {}
        resolved: dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None] = {}
        absent: list[MODEL_REFERENCE_CATEGORY] = []

        for category in categories_to_load:
            if category not in available:
                absent.append(category)
                continue
            resolved[category] = available[category]

        if absent:
            logger.debug(
                "Backend payload missing %d categories; falling back to per-category fetch: %s",
                len(absent),
                absent,
            )
            # The per-category fetches run before the lock is taken below.
            resolved.update(
                (category, self.backend.fetch_category(category, force_refresh=overwrite_existing))
                for category in absent
            )

        with self._lock:
            for category, raw_json in resolved.items():
                self._cached_records[category] = self._file_json_dict_to_model_reference(
                    category,
                    raw_json,
                    safe_mode=safe_mode,
                )

    def get_all_model_references_or_none(
        self,
        overwrite_existing: bool = False,
        *,
        safe_mode: bool = False,
    ) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]:
        """Return every cached category mapped to its model reference, refreshing as needed.

        A value may be None when the corresponding model reference could not be found
        or parsed.

        Args:
            overwrite_existing: Whether to force a redownload of all model reference files.
                Defaults to False.
            safe_mode: Whether to raise exceptions on failure. If False, exceptions are caught
                and None is stored for that category. Defaults to False. Use
                `get_all_model_references()` for a non-optional value type.

        Returns:
            dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]: A mapping of model reference
                categories to their corresponding model reference objects.

        """
        cache_is_current, cached_snapshot, stale_categories = self._evaluate_cache_state(
            overwrite_existing=overwrite_existing,
            safe_mode=safe_mode,
        )
        if cache_is_current:
            return cached_snapshot

        logger.debug("Fetching model references from backend as needed.")
        fetched_payload = self._fetch_from_backend_if_needed(force_refresh=overwrite_existing)

        if not stale_categories:
            return self._get_all_cached_model_references(safe_mode=safe_mode)

        logger.debug("Loading %d model reference categories: %s", len(stale_categories), stale_categories)
        self._load_categories_from_payload(
            categories_to_load=stale_categories,
            payload=fetched_payload,
            overwrite_existing=overwrite_existing,
            safe_mode=safe_mode,
        )
        return self._get_all_cached_model_references(safe_mode=safe_mode)

    def _build_safe_reference_view(
        self,
        all_references: dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None],
    ) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]:
        """Produce a ``None``-free view of *all_references*, logging what was missing.

        Args:
            all_references: Mapping of categories to model reference dicts or None.

        Returns:
            dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]: Mapping where
            ``None`` entries are replaced by empty dicts. ``None`` entries whose
            category is in ``categories_managed_elsewhere`` are omitted entirely and
            are not reported as missing.

        """
        safe_view: dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]] = {}
        unresolved: list[MODEL_REFERENCE_CATEGORY] = []

        for category, reference in all_references.items():
            if reference is None:
                if category in categories_managed_elsewhere:
                    # Expected to be absent here: neither reported nor included.
                    continue
                unresolved.append(category)
                reference = {}
            safe_view[category] = reference

        if unresolved:
            logger.error(f"Missing model references for categories: {unresolved}")

        return safe_view

    def get_all_model_references(
        self,
        overwrite_existing: bool = False,
    ) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]:
        """Return a mapping of all model reference categories to their model reference objects.

        Values are never ``None``. This method does **not** raise when a model reference
        file could not be found or parsed: the result of
        :meth:`get_all_model_references_or_none` (called with its default
        ``safe_mode=False``) is passed through :meth:`_build_safe_reference_view`,
        which replaces each ``None`` entry with an empty dict and logs an error
        listing the affected categories. ``None`` entries for categories in
        ``categories_managed_elsewhere`` are left out of the result.

        If you need to distinguish "missing" from "empty", use
        `get_all_model_references_or_none()` instead.

        Args:
            overwrite_existing: Whether to force a redownload of all model reference files.
                Defaults to False.

        Returns:
            dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]: A mapping of model reference
                categories to their corresponding model reference objects, with empty
                dicts substituted for missing categories.

        """
        all_references = self.get_all_model_references_or_none(overwrite_existing=overwrite_existing)
        return self._build_safe_reference_view(all_references)

    async def get_all_model_references_or_none_async(
        self,
        overwrite_existing: bool = False,
        *,
        safe_mode: bool = False,
        httpx_client: httpx.AsyncClient | None = None,
    ) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]:
        """Asynchronously return all model references; values may be ``None``.

        Follows the same steps as :meth:`get_all_model_references_or_none`, except the
        bulk backend fetch is awaited via ``_fetch_from_backend_if_needed_async``.

        Args:
            overwrite_existing: Whether to force backend refresh.
            safe_mode: Whether to propagate conversion errors.
            httpx_client: Optional shared async client for HTTP backends.

        Returns:
            dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]: Possibly
            sparse mapping keyed by category.

        """
        cache_is_current, cached_snapshot, stale_categories = self._evaluate_cache_state(
            overwrite_existing=overwrite_existing,
            safe_mode=safe_mode,
        )
        if cache_is_current:
            return cached_snapshot

        logger.debug("Asynchronously fetching model references from backend as needed.")
        fetched_payload = await self._fetch_from_backend_if_needed_async(
            force_refresh=overwrite_existing,
            httpx_client=httpx_client,
        )

        if not stale_categories:
            return self._get_all_cached_model_references(safe_mode=safe_mode)

        logger.debug("Loading %d model reference categories via async payload", len(stale_categories))
        self._load_categories_from_payload(
            categories_to_load=stale_categories,
            payload=fetched_payload,
            overwrite_existing=overwrite_existing,
            safe_mode=safe_mode,
        )
        return self._get_all_cached_model_references(safe_mode=safe_mode)

    async def get_all_model_references_async(
        self,
        overwrite_existing: bool = False,
        *,
        httpx_client: httpx.AsyncClient | None = None,
    ) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]:
        """Return all model references asynchronously, with empty dicts for missing categories.

        This method does **not** raise when a category is missing or failed to parse.
        The result of :meth:`get_all_model_references_or_none_async` (called with its
        default ``safe_mode=False``) is passed through
        :meth:`_build_safe_reference_view`, which replaces each ``None`` entry with an
        empty dict and logs an error listing the affected categories. ``None`` entries
        for categories in ``categories_managed_elsewhere`` are left out of the result.

        Args:
            overwrite_existing: Whether to force backend refresh.
            httpx_client: Optional shared async client for HTTP backends.

        Returns:
            dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]: Mapping with
            empty dicts substituted for missing categories.

        """
        all_references = await self.get_all_model_references_or_none_async(
            overwrite_existing=overwrite_existing,
            httpx_client=httpx_client,
        )
        return self._build_safe_reference_view(all_references)

    def get_model_reference_or_none(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        overwrite_existing: bool = False,
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> dict[str, GenericModelRecord] | None:
        """Return the model reference for one category, or ``None`` if unavailable.

        Args:
            category: The category to retrieve.
            overwrite_existing: Whether to force a redownload. Defaults to False.
            source: Which source(s) to read from. Defaults to canonical horde data
                (:data:`~horde_model_reference.source_consts.HORDE_SOURCE_ID`). Pass
                ``"any"`` to merge all registered providers, or a provider id / sequence
                of ids to select specific third-party sources. On name collisions the
                canonical (or earlier-listed) source wins.

        Returns:
            dict[str, GenericModelRecord] | None: The model reference object for the category,
                or None if not found.

        """
        if not self._is_canonical_only(source):
            # Anything other than the plain canonical selector goes through the merge path.
            return self._merge_sourced_reference(category, source, overwrite_existing=overwrite_existing)

        canonical_references = self.get_all_model_references_or_none(overwrite_existing=overwrite_existing)
        return canonical_references.get(category)

    async def get_model_reference_or_none_async(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        overwrite_existing: bool = False,
        *,
        httpx_client: httpx.AsyncClient | None = None,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> dict[str, GenericModelRecord] | None:
        """Asynchronously return one category's model reference, or ``None`` if unavailable.

        Args:
            category: Target category to load.
            overwrite_existing: Whether to force backend refresh.
            httpx_client: Optional shared async client for HTTP backends.
            source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

        Returns:
            dict[str, GenericModelRecord] | None: Mapping of model names or None.

        """
        if not self._is_canonical_only(source):
            # Anything other than the plain canonical selector goes through the merge path.
            return await self._merge_sourced_reference_async(
                category,
                source,
                overwrite_existing=overwrite_existing,
                httpx_client=httpx_client,
            )

        canonical_references = await self.get_all_model_references_or_none_async(
            overwrite_existing=overwrite_existing,
            httpx_client=httpx_client,
        )
        return canonical_references.get(category)

    # Typed overloads for ``get_model_reference``: a literal category narrows the
    # declared record type of the returned mapping for static type checkers.
    # The category-specific overloads below do not declare ``source``; a call that
    # passes ``source`` can only match the final, general overload, whose values are
    # typed as ``GenericModelRecord``.
    @overload
    def get_model_reference(
        self,
        category: Literal[MODEL_REFERENCE_CATEGORY.audio_generation],
        overwrite_existing: bool = False,
    ) -> dict[str, AudioGenerationModelRecord]: ...

    @overload
    def get_model_reference(
        self,
        category: Literal[MODEL_REFERENCE_CATEGORY.blip],
        overwrite_existing: bool = False,
    ) -> dict[str, BlipModelRecord]: ...

    @overload
    def get_model_reference(
        self,
        category: Literal[MODEL_REFERENCE_CATEGORY.clip],
        overwrite_existing: bool = False,
    ) -> dict[str, ClipModelRecord]: ...

    @overload
    def get_model_reference(
        self,
        category: Literal[MODEL_REFERENCE_CATEGORY.codeformer],
        overwrite_existing: bool = False,
    ) -> dict[str, CodeformerModelRecord]: ...

    @overload
    def get_model_reference(
        self,
        category: Literal[MODEL_REFERENCE_CATEGORY.controlnet],
        overwrite_existing: bool = False,
    ) -> dict[str, ControlNetModelRecord]: ...

    @overload
    def get_model_reference(
        self,
        category: Literal[MODEL_REFERENCE_CATEGORY.image_generation],
        overwrite_existing: bool = False,
    ) -> dict[str, ImageGenerationModelRecord]: ...

    @overload
    def get_model_reference(
        self,
        category: Literal[MODEL_REFERENCE_CATEGORY.text_generation],
        overwrite_existing: bool = False,
    ) -> dict[str, TextGenerationModelRecord]: ...

    # General fallback: any category, optional ``source`` selector, generic record type.
    @overload
    def get_model_reference(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        overwrite_existing: bool = False,
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> dict[str, GenericModelRecord]: ...

    def get_model_reference(
        self,
        category: MODEL_REFERENCE_CATEGORY = MODEL_REFERENCE_CATEGORY.image_generation,
        overwrite_existing: bool = False,
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> Mapping[str, GenericModelRecord]:
        """Return the model reference for one category, raising when it is unavailable.

        Strict counterpart to `get_model_reference_or_none()`; use that method if a
        missing model reference should be tolerated.

        Args:
            category: The category to retrieve. Defaults to ``image_generation``.
            overwrite_existing: Whether to force a redownload. Defaults to False.
            source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

        Returns:
            Mapping[str, GenericModelRecord]: The model reference object for the category.

        Raises:
            RuntimeError: If :meth:`get_model_reference_or_none` returns ``None``.

        """
        found_reference = self.get_model_reference_or_none(
            category,
            overwrite_existing=overwrite_existing,
            source=source,
        )
        if found_reference is not None:
            return found_reference

        raise RuntimeError(f"Model reference for category {category} not found or could not be parsed.")

    async def get_model_reference_async(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        overwrite_existing: bool = False,
        *,
        httpx_client: httpx.AsyncClient | None = None,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> dict[str, GenericModelRecord]:
        """Asynchronously return one category's model reference, raising when unavailable.

        Args:
            category: Target category to load.
            overwrite_existing: Whether to force backend refresh.
            httpx_client: Optional shared async client for HTTP backends.
            source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

        Returns:
            dict[str, GenericModelRecord]: Mapping of model names for the category.

        Raises:
            RuntimeError: If the category is missing or could not be parsed.

        """
        found_reference = await self.get_model_reference_or_none_async(
            category,
            overwrite_existing=overwrite_existing,
            httpx_client=httpx_client,
            source=source,
        )
        if found_reference is not None:
            return found_reference

        raise RuntimeError(f"Model reference for category {category} not found or could not be parsed.")

    def get_model_or_none(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        model_name: str,
        overwrite_existing: bool = False,
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> GenericModelRecord | None:
        """Look up a single model record by name within a category.

        Args:
            category: The category to retrieve.
            model_name: The name of the model within the category.
            overwrite_existing: Whether to force a redownload. Defaults to False.
            source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

        Returns:
            GenericModelRecord | None: The model record, or None if either the
                category reference or the model itself is not found.

        """
        category_reference = self.get_model_reference_or_none(
            category,
            overwrite_existing=overwrite_existing,
            source=source,
        )
        return None if category_reference is None else category_reference.get(model_name)

    def get_model(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        model_name: str,
        overwrite_existing: bool = False,
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> GenericModelRecord:
        """Look up a single model record by name, raising when it cannot be found.

        Strict counterpart to `get_model_or_none()`; use that method if a missing
        model should be tolerated.

        Args:
            category: The category to retrieve.
            model_name: The name of the model within the category.
            overwrite_existing: Whether to force a redownload. Defaults to False.
            source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

        Returns:
            GenericModelRecord: The model record.

        Raises:
            RuntimeError: If the category reference is unavailable (raised by
                :meth:`get_model_reference`) or *model_name* is not in it.

        """
        category_reference = self.get_model_reference(
            category,
            overwrite_existing=overwrite_existing,
            source=source,
        )
        found_record = category_reference.get(model_name)
        if found_record is not None:
            return found_record

        raise RuntimeError(f"Model {model_name} not found in category {category}.")

    def get_raw_model_reference_json(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        overwrite_existing: bool = False,
    ) -> dict[str, Any] | None:
        """Return a category's raw JSON dict straight from the backend.

        No pydantic models are built; the call is forwarded to
        ``backend.fetch_category``. Suited to API endpoints that need fast JSON
        responses.

        Args:
            category: The category to retrieve.
            overwrite_existing: Whether to force a redownload (forwarded as
                ``force_refresh``). Defaults to False.

        Returns:
            dict[str, Any] | None: The raw JSON dict for the category, or None if not found.

        """
        raw_category_json = self.backend.fetch_category(category, force_refresh=overwrite_existing)
        return raw_category_json

    def get_raw_model_json(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        model_name: str,
        overwrite_existing: bool = False,
    ) -> dict[str, Any] | None:
        """Return one model's raw JSON dict straight from the backend.

        No pydantic models are built; the category is fetched through
        ``backend.fetch_category`` and the model is looked up by name in the
        result. Suited to API endpoints that need fast JSON responses.

        Args:
            category: The category to retrieve.
            model_name: The name of the model within the category.
            overwrite_existing: Whether to force a redownload (forwarded as
                ``force_refresh``). Defaults to False.

        Returns:
            dict[str, Any] | None: The raw JSON dict for the model, or None if the
                category or the model is not found.

        """
        raw_category_json = self.backend.fetch_category(category, force_refresh=overwrite_existing)
        return None if raw_category_json is None else raw_category_json.get(model_name)

    def _get_typed_models(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        *,
        record_type: type[TModelRecord],
    ) -> dict[str, TModelRecord]:
        """Return the category's records as a new dict, verified to be *record_type* instances.

        Args:
            category: The category to load via :meth:`get_model_reference`.
            record_type: The record class every entry is expected to be an instance of.

        Returns:
            A fresh ``name -> record`` dict (empty when the category has no records).

        Raises:
            RuntimeError: On the first record that is not an instance of *record_type*.

        """
        category_reference = self.get_model_reference(category)

        # An empty reference simply falls through the loop and yields an empty dict.
        verified: dict[str, TModelRecord] = {}
        for record_name, candidate in category_reference.items():
            if isinstance(candidate, record_type):
                verified[record_name] = candidate
                continue
            raise RuntimeError(
                f"Some records in {category.value} category are not {record_type.__name__} instances."
            )

        return verified

    @property
    def provider_registry(self) -> ModelProviderRegistry:
        """Expose the third-party model provider registry held by this manager."""
        registry = self._provider_registry
        return registry

    def register_provider(self, provider: ModelProvider, *, replace: bool = False) -> None:
        """Add a third-party :class:`ModelProvider` to this manager's registry.

        The call is forwarded unchanged to the registry's ``register`` method.

        Args:
            provider: The provider to register.
            replace: If ``True``, replace an existing provider with the same source id.

        Raises:
            ValueError: If the source id is reserved/empty, or already registered and
                *replace* is ``False``.

        """
        registry = self._provider_registry
        registry.register(provider, replace=replace)

    def unregister_provider(self, source_id: str) -> bool:
        """Drop the provider registered under *source_id* from the registry.

        Args:
            source_id: The source id whose provider should be removed.

        Returns:
            bool: The registry's ``unregister`` result: ``True`` if a provider was
                removed, ``False`` otherwise.

        """
        was_removed = self._provider_registry.unregister(source_id)
        return was_removed

    def list_providers(self) -> list[str]:
        """List the source ids of every registered provider, in registration order."""
        registered_ids = self._provider_registry.source_ids()
        return registered_ids

    def get_provider(self, source_id: str) -> ModelProvider | None:
        """Look up the provider registered under *source_id*; ``None`` when there is none."""
        registered_provider = self._provider_registry.get(source_id)
        return registered_provider

    def _resolve_ordered_source_ids(
        self,
        selectors: list[str],
    ) -> list[str]:
        """Expand *selectors* into concrete source ids, ordered and without duplicates.

        Each selector keeps its **position**, so callers decide collision precedence
        (the first source to supply a name wins in the later ``setdefault`` merge).
        The canonical source (:data:`HORDE_SOURCE_ID`) gets no special placement: it
        stays wherever the selector lists it, so ``["pending", "horde"]`` lets the
        ``"pending"`` provider override canonical data, while the default
        ``["horde"]`` is canonical-only.

        ``ANY_SOURCE`` expands to the canonical source **first**, followed by every
        registered provider in registration order, which keeps the historical
        "canonical wins" default for ``"any"``. A provider id that is named
        explicitly but not registered raises ``ValueError``; ids that come from
        expanding ``ANY_SOURCE`` are the live registry contents and never raise.
        """
        candidates: list[str] = []

        for selector in selectors:
            if selector == ANY_SOURCE:
                candidates.append(HORDE_SOURCE_ID)
                candidates.extend(self._provider_registry.source_ids())
            elif selector == HORDE_SOURCE_ID:
                candidates.append(HORDE_SOURCE_ID)
            elif self._provider_registry.has(selector):
                candidates.append(selector)
            else:
                raise ValueError(
                    f"No provider registered under source id {selector!r}. "
                    f"Registered providers: {self._provider_registry.source_ids()}.",
                )

        # dict keys keep insertion order, so this retains the first occurrence of each id.
        return list(dict.fromkeys(candidates))

    @staticmethod
    def _is_canonical_only(source: SourceSelector) -> bool:
        """Tell whether *source* normalizes to exactly the canonical source (the default)."""
        normalized = normalize_source_selector(source)
        return normalized == [HORDE_SOURCE_ID]

    def _gather_sourced_records(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        source: SourceSelector,
        *,
        overwrite_existing: bool = False,
    ) -> tuple[list[GenericModelRecord], list[str], dict[str, SourceOutcome]]:
        """Gather *category* records from each selected source, with a parallel list of source ids.

        Sources are visited in **selector order** (the canonical source is read at
        its own position rather than always first), so the first source providing a
        given name wins in a later ``setdefault`` merge. Duplicate names are kept on
        purpose so callers/queries can detect collisions. A provider that raises is
        logged and skipped (error isolation); one that does not serve the category
        or returns nothing is skipped silently.

        Returns:
            ``(records, sources, status)`` where ``sources[i]`` is the source id that
            supplied ``records[i]`` and ``status`` maps every *selected* source id to
            ``"ok"``, ``"empty"`` or ``"error"``, letting callers tell a failed source
            from one that simply had nothing for this category.
        """
        ordered_ids = self._resolve_ordered_source_ids(normalize_source_selector(source))

        records: list[GenericModelRecord] = []
        sources: list[str] = []
        status: dict[str, SourceOutcome] = {}

        for source_id in ordered_ids:
            # Start pessimistic; upgraded to "ok" or "error" below.
            status[source_id] = "empty"

            if source_id == HORDE_SOURCE_ID:
                found = self.get_all_model_references_or_none(
                    overwrite_existing=overwrite_existing,
                ).get(category)
                label = HORDE_SOURCE_ID
            else:
                provider = self._provider_registry.get(source_id)
                if provider is None:  # pragma: no cover - guarded by _resolve_ordered_source_ids
                    continue
                if not provider.serves_category(category):
                    continue
                try:
                    found = provider.fetch_category(category, force_refresh=overwrite_existing)
                except Exception as exc:
                    status[source_id] = "error"
                    logger.error(
                        f"Provider {source_id!r} raised while fetching category {category.value!r}; skipping: {exc}",
                    )
                    continue
                label = source_id

            if not found:
                continue

            status[source_id] = "ok"
            new_records = list(found.values())
            records.extend(new_records)
            # Keep ``sources`` index-aligned with ``records``.
            sources.extend([label] * len(new_records))

        return records, sources, status

    def _merge_sourced_reference(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        source: SourceSelector,
        *,
        overwrite_existing: bool = False,
    ) -> dict[str, GenericModelRecord] | None:
        """Merge the records gathered across *source* into one ``name -> record`` mapping.

        Records arrive in the order produced by :meth:`_gather_sourced_records`; on a
        name collision the first record seen is kept and later ones are ignored.

        Returns ``None`` only when no source produced any records for the category,
        preserving the ``*_or_none`` contract.
        """
        gathered_records, gathered_sources, _status = self._gather_sourced_records(
            category,
            source,
            overwrite_existing=overwrite_existing,
        )
        if not gathered_records:
            return None

        merged: dict[str, GenericModelRecord] = {}
        # strict=True doubles as a check that records and sources stayed index-aligned.
        for candidate, _origin in zip(gathered_records, gathered_sources, strict=True):
            if candidate.name not in merged:
                merged[candidate.name] = candidate
        return merged

    async def _gather_sourced_records_async(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        source: SourceSelector,
        *,
        overwrite_existing: bool = False,
        httpx_client: httpx.AsyncClient | None = None,
    ) -> tuple[list[GenericModelRecord], list[str], dict[str, SourceOutcome]]:
        """Collect records for *category* from every selected source using async fetches.

        Async counterpart to :meth:`_gather_sourced_records`. Sources are visited in the
        order produced by ``_resolve_ordered_source_ids``.

        Args:
            category: The category to gather records for.
            source: Source selector; normalized and resolved to an ordered id list.
            overwrite_existing: Passed to the canonical fetch as ``overwrite_existing``
                and to providers as ``force_refresh``.
            httpx_client: Optional client forwarded to the canonical async fetch only.

        Returns:
            A ``(records, sources, status)`` triple. ``records`` and ``sources`` are
            index-aligned (one source id per record); ``status`` maps every visited
            source id to ``"ok"``, ``"empty"`` or ``"error"``.

        """
        source_ids = self._resolve_ordered_source_ids(normalize_source_selector(source))

        collected: list[GenericModelRecord] = []
        origins: list[str] = []
        outcomes: dict[str, SourceOutcome] = {}

        for source_id in source_ids:
            # Start pessimistic; upgraded to "ok" or "error" further down.
            outcomes[source_id] = "empty"

            if source_id == HORDE_SOURCE_ID:
                everything = await self.get_all_model_references_or_none_async(
                    overwrite_existing=overwrite_existing,
                    httpx_client=httpx_client,
                )
                fetched = everything.get(category)
                label = HORDE_SOURCE_ID
            else:
                provider = self._provider_registry.get(source_id)
                if provider is None:  # pragma: no cover - guarded by _resolve_ordered_source_ids
                    continue
                if not provider.serves_category(category):
                    continue
                try:
                    fetched = await provider.fetch_category_async(category, force_refresh=overwrite_existing)
                except Exception as exc:
                    # A failing provider is recorded and skipped; remaining sources still run.
                    outcomes[source_id] = "error"
                    logger.error(
                        f"Provider {source_id!r} raised while fetching category {category.value!r}; skipping: {exc}",
                    )
                    continue
                label = source_id

            if not fetched:
                continue

            outcomes[source_id] = "ok"
            for item in fetched.values():
                collected.append(item)
                origins.append(label)

        return collected, origins, outcomes

    async def _merge_sourced_reference_async(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        source: SourceSelector,
        *,
        overwrite_existing: bool = False,
        httpx_client: httpx.AsyncClient | None = None,
    ) -> dict[str, GenericModelRecord] | None:
        """Async counterpart to :meth:`_merge_sourced_reference`."""
        records, sources, _status = await self._gather_sourced_records_async(
            category,
            source,
            overwrite_existing=overwrite_existing,
            httpx_client=httpx_client,
        )
        if not records:
            return None

        merged: dict[str, GenericModelRecord] = {}
        for record, _source in zip(records, sources, strict=True):
            merged.setdefault(record.name, record)
        return merged

    # Typed overloads for ``query``: each ``Literal`` category (its string value or the
    # matching enum member) is paired with the query-builder type returned for it.
    #
    # The three domain categories resolve to dedicated query classes.
    @overload
    def query(
        self,
        category: Literal["image_generation", MODEL_REFERENCE_CATEGORY.image_generation],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ImageGenerationQuery: ...

    @overload
    def query(
        self,
        category: Literal["text_generation", MODEL_REFERENCE_CATEGORY.text_generation],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> TextModelQuery: ...

    @overload
    def query(
        self,
        category: Literal["controlnet", MODEL_REFERENCE_CATEGORY.controlnet],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ControlNetQuery: ...

    # The remaining named categories resolve to ``ModelQuery`` parameterized with the
    # category's record class and ``GenericFieldName``.
    @overload
    def query(  # pyrefly: ignore[inconsistent-overload]
        self,
        category: Literal["blip", MODEL_REFERENCE_CATEGORY.blip],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[BlipModelRecord, GenericFieldName]: ...

    @overload
    def query(  # pyrefly: ignore[inconsistent-overload]
        self,
        category: Literal["clip", MODEL_REFERENCE_CATEGORY.clip],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[ClipModelRecord, GenericFieldName]: ...

    @overload
    def query(  # pyrefly: ignore[inconsistent-overload]
        self,
        category: Literal["codeformer", MODEL_REFERENCE_CATEGORY.codeformer],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[CodeformerModelRecord, GenericFieldName]: ...

    @overload
    def query(  # pyrefly: ignore[inconsistent-overload]
        self,
        category: Literal["esrgan", MODEL_REFERENCE_CATEGORY.esrgan],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[EsrganModelRecord, GenericFieldName]: ...

    @overload
    def query(  # pyrefly: ignore[inconsistent-overload]
        self,
        category: Literal["gfpgan", MODEL_REFERENCE_CATEGORY.gfpgan],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[GfpganModelRecord, GenericFieldName]: ...

    @overload
    def query(  # pyrefly: ignore[inconsistent-overload]
        self,
        category: Literal["safety_checker", MODEL_REFERENCE_CATEGORY.safety_checker],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[SafetyCheckerModelRecord, GenericFieldName]: ...

    @overload
    def query(  # pyrefly: ignore[inconsistent-overload]
        self,
        category: Literal["audio_generation", MODEL_REFERENCE_CATEGORY.audio_generation],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[AudioGenerationModelRecord, GenericFieldName]: ...

    @overload
    def query(  # pyrefly: ignore[inconsistent-overload]
        self,
        category: Literal["video_generation", MODEL_REFERENCE_CATEGORY.video_generation],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[VideoGenerationModelRecord, GenericFieldName]: ...

    @overload
    def query(  # pyrefly: ignore[inconsistent-overload]
        self,
        category: Literal["miscellaneous", MODEL_REFERENCE_CATEGORY.miscellaneous],
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[MiscellaneousModelRecord, GenericFieldName]: ...

    # Catch-all for categories that are not known statically (any enum member or a
    # plain string); it returns the broadest ``ModelQuery`` parameterization.
    @overload
    def query(
        self,
        category: MODEL_REFERENCE_CATEGORY | str,
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> ModelQuery[
        GenericModelRecord, GenericFieldName | ImageGenFieldName | TextGenFieldName | ControlNetFieldName
    ]: ...

    def query(
        self,
        category: MODEL_REFERENCE_CATEGORY | str,
        *,
        source: SourceSelector = HORDE_SOURCE_ID,
    ) -> (
        ImageGenerationQuery
        | TextModelQuery
        | ControlNetQuery
        | ModelQuery[GenericModelRecord, GenericFieldName | ImageGenFieldName | TextGenFieldName | ControlNetFieldName]
    ):
        """Build the query object for one model reference category.

        This is the single entry point for filtering, sorting, and aggregating model
        records. The builder is typed to the category's record class; the three
        domain categories (image generation, text generation, controlnet) return the
        enriched ``ImageGenerationQuery``, ``TextModelQuery`` and ``ControlNetQuery``
        subclasses, and every other category returns a plain ``ModelQuery``.

        Args:
            category: The category to query, given either as a
                :class:`~horde_model_reference.meta_consts.MODEL_REFERENCE_CATEGORY`
                member (recommended, for precise return typing) or as its string value.
            source: Which source(s) to include. Defaults to canonical horde data
                (:data:`~horde_model_reference.source_consts.HORDE_SOURCE_ID`). Pass
                ``"any"`` to merge all registered providers, or a provider id / ordered
                sequence of ids. When more than one source is selected, results are
                de-duplicated by name (canonical / earlier-listed source wins); use
                :meth:`~horde_model_reference.query.ModelQuery.duplicate_names` to detect
                collisions and :meth:`~horde_model_reference.query.ModelQuery.where_source`
                to filter by provenance.

        Returns:
            A ``ModelQuery`` (or typed subclass) ready for chaining filters.

        """
        resolved = MODEL_REFERENCE_CATEGORY(category)
        # Canonical-only selections use the ``build_*`` helpers; anything else goes
        # through the source-aware gather so provenance and per-source status are kept.
        multi_source = not self._is_canonical_only(source)

        if resolved == MODEL_REFERENCE_CATEGORY.image_generation:
            if multi_source:
                image_rows, image_origins, image_outcomes = self._gather_typed_sourced(
                    resolved,
                    record_type=ImageGenerationModelRecord,
                    source=source,
                )
                return ImageGenerationQuery(
                    image_rows,
                    ImageGenerationModelRecord,
                    sources=image_origins,
                    source_status=image_outcomes,
                )
            return build_image_query(
                self._get_typed_models(resolved, record_type=ImageGenerationModelRecord),
            )

        if resolved == MODEL_REFERENCE_CATEGORY.text_generation:
            if multi_source:
                text_rows, text_origins, text_outcomes = self._gather_typed_sourced(
                    resolved,
                    record_type=TextGenerationModelRecord,
                    source=source,
                )
                return TextModelQuery(
                    text_rows,
                    TextGenerationModelRecord,
                    sources=text_origins,
                    source_status=text_outcomes,
                )
            return build_text_query(
                self._get_typed_models(resolved, record_type=TextGenerationModelRecord),
            )

        if resolved == MODEL_REFERENCE_CATEGORY.controlnet:
            if multi_source:
                controlnet_rows, controlnet_origins, controlnet_outcomes = self._gather_typed_sourced(
                    resolved,
                    record_type=ControlNetModelRecord,
                    source=source,
                )
                return ControlNetQuery(
                    controlnet_rows,
                    ControlNetModelRecord,
                    sources=controlnet_origins,
                    source_status=controlnet_outcomes,
                )
            return build_controlnet_query(
                self._get_typed_models(resolved, record_type=ControlNetModelRecord),
            )

        # Every other category uses the generic builder with its looked-up record class.
        fallback_type = MODEL_RECORD_TYPE_LOOKUP.get(resolved, GenericModelRecord)
        if multi_source:
            generic_rows, generic_origins, generic_outcomes = self._gather_typed_sourced(
                resolved,
                record_type=fallback_type,
                source=source,
            )
            return ModelQuery(
                generic_rows,
                fallback_type,
                sources=generic_origins,
                source_status=generic_outcomes,
            )
        return build_query(self._get_typed_models(resolved, record_type=fallback_type), fallback_type)

    def _gather_typed_sourced(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        *,
        record_type: type[TModelRecord],
        source: SourceSelector,
    ) -> tuple[list[TModelRecord], list[str], dict[str, SourceOutcome]]:
        """Gather the sourced records for *category* and check each one's type.

        Args:
            category: The category to gather records for.
            record_type: The class every gathered record must be an instance of.
            source: Source selector forwarded to :meth:`_gather_sourced_records`.

        Returns:
            The type-checked records, the source list aligned with them, and the
            per-source status mapping, exactly as produced by the gather step.

        Raises:
            RuntimeError: If any source supplies a record that is not an instance of
                *record_type* (or a subclass of it).

        """
        gathered, origins, outcomes = self._gather_sourced_records(category, source)

        checked: list[TModelRecord] = []
        for candidate in gathered:
            if isinstance(candidate, record_type):
                checked.append(candidate)
                continue
            # The first offending record aborts the whole gather.
            raise RuntimeError(
                f"A source for category {category.value} supplied record {candidate.name!r} "
                f"that is not a {record_type.__name__} instance.",
            )
        return checked, origins, outcomes

    def query_all(
        self,
    ) -> ModelQuery[GenericModelRecord, GenericFieldName | ImageGenFieldName | TextGenFieldName | ControlNetFieldName]:
        """Build a single query over the records of every category.

        Returns:
            A ``ModelQuery[GenericModelRecord]`` built from the mapping returned by
            :meth:`get_all_model_references`.

        """
        return build_cross_category_query(self.get_all_model_references())

    # Maps a model reference category to the model-type string handed to the Horde API
    # integration as ``model_type``. ``get_popular_models`` returns an empty list for
    # any category that is missing from this mapping.
    _CATEGORY_TO_HORDE_TYPE: ClassVar[dict[MODEL_REFERENCE_CATEGORY, HordeModelType]] = {
        MODEL_REFERENCE_CATEGORY.image_generation: "image",
        MODEL_REFERENCE_CATEGORY.text_generation: "text",
    }

    async def get_popular_models(
        self,
        category: MODEL_REFERENCE_CATEGORY,
        *,
        limit: int = 10,
        sort_by: Literal["worker_count", "usage_day", "usage_month", "usage_total"] = "worker_count",
        include_workers: bool = False,
    ) -> list[PopularModelResult]:
        """Rank the models of *category* by live Horde popularity metrics.

        Requires the Horde public API to be reachable. Only the ``image_generation``
        and ``text_generation`` categories have Horde API data; any other category
        yields an empty list, as does a category with no model reference available.

        Args:
            category: Model category to rank.
            limit: Maximum number of results.
            sort_by: Metric to rank by.
            include_workers: Whether to fetch per-worker details (slower).

        Returns:
            A list of ``PopularModelResult`` sorted by the chosen metric, highest first.

        """
        # Imported lazily, inside the call, rather than at module import time.
        from horde_model_reference.integrations.data_merger import (
            CombinedModelStatistics,
            PopularModelResult,
            merge_category_with_horde_data,
        )
        from horde_model_reference.integrations.horde_api_integration import HordeAPIIntegration

        horde_type: HordeModelType | None = self._CATEGORY_TO_HORDE_TYPE.get(category)
        if horde_type is None:
            return []

        model_reference = self.get_model_reference_or_none(category)
        if model_reference is None:
            return []

        api = HordeAPIIntegration()
        status_by_name, stats_by_name, workers_by_name = await api.get_combined_data_indexed(
            model_type=horde_type,
            include_workers=include_workers,
        )

        combined_by_name = merge_category_with_horde_data(
            model_names=model_reference.keys(),
            horde_status=status_by_name,
            horde_stats=stats_by_name,
            workers=workers_by_name,
        )

        def _metric(entry: tuple[str, Any]) -> float:
            """Return the ranking value for one ``(name, stats)`` pair; 0.0 when unavailable."""
            _model_name, combined = entry
            if not isinstance(combined, CombinedModelStatistics):
                return 0.0
            if sort_by == "worker_count":
                return float(combined.worker_count)
            if combined.usage_stats is None:
                return 0.0
            if sort_by == "usage_day":
                return float(combined.usage_stats.day)
            if sort_by == "usage_month":
                return float(combined.usage_stats.month)
            # Only "usage_total" remains.
            return float(combined.usage_stats.total)

        top_entries = sorted(combined_by_name.items(), key=_metric, reverse=True)[:limit]

        # Names without a record in the reference are dropped from the output.
        return [
            PopularModelResult(
                name=model_name,
                record=record.model_dump(mode="json", exclude_none=True),
                stats=combined,
            )
            for model_name, combined in top_entries
            if (record := model_reference.get(model_name)) is not None
        ]

backend `instance-attribute`

backend: ModelReferenceBackend

The backend provider for model reference data.

_cached_records `instance-attribute`

_cached_records: dict[
    MODEL_REFERENCE_CATEGORY,
    dict[str, GenericModelRecord] | None,
]

Cache of pydantic model records by category.

_instance `class-attribute` `instance-attribute`

_instance: ModelReferenceManager | None = None

_replicate_mode `class-attribute` `instance-attribute`

_replicate_mode: ReplicateMode = REPLICA

_offline `class-attribute` `instance-attribute`

_offline: bool = False

_prefetch_strategy `class-attribute` `instance-attribute`

_prefetch_strategy: PrefetchStrategy = SYNC

_deferred_prefetch_handle `class-attribute` `instance-attribute`

_deferred_prefetch_handle: DeferredPrefetchHandle | None = (
    None
)

_async_prefetch_task `class-attribute` `instance-attribute`

_async_prefetch_task: Task[None] | None = None

_provider_registry `instance-attribute`

_provider_registry: ModelProviderRegistry

_audit_writer `class-attribute` `instance-attribute`

_audit_writer: AuditTrailWriter | None = None

_pending_queue_service `class-attribute` `instance-attribute`

_pending_queue_service: PendingQueueService | None = None

_group_alias_store `class-attribute` `instance-attribute`

_group_alias_store: GroupAliasStore | None = None

_group_family_store `class-attribute` `instance-attribute`

_group_family_store: GroupFamilyStore | None = None

_group_schema_store `class-attribute` `instance-attribute`

_group_schema_store: GroupSchemaStore | None = None

_lock `class-attribute` `instance-attribute`

_lock: RLock = RLock()

prefetch_strategy `property`

prefetch_strategy: PrefetchStrategy

Return the prefetch strategy originally configured for this manager.

offline `property`

offline: bool

Return whether this manager reads from local disk only (never downloads).

pending_queue_service `property`

pending_queue_service: PendingQueueService | None

Return the pending queue service when queueing is enabled.

group_alias_store `property`

group_alias_store: GroupAliasStore | None

Return the group alias store when in PRIMARY mode.

group_family_store `property`

group_family_store: GroupFamilyStore | None

Return the related-group family store when in PRIMARY mode.

group_schema_store `property`

group_schema_store: GroupSchemaStore | None

Return the group schema store when in PRIMARY mode.

deferred_prefetch_handle `property`

deferred_prefetch_handle: DeferredPrefetchHandle | None

Handle that callers can use to trigger a deferred eager fetch.

is_warm `property`

is_warm: bool

Return whether every category has been loaded into the in-memory cache.

This is a pure in-memory check (it does not consult the backend). Use it to assert readiness after a warm-up (e.g. PrefetchStrategy.ASYNC or ensure_ready_async()) instead of relying on a log line. A category cached as None (e.g. managed elsewhere or empty) still counts as loaded; False means at least one category has never been fetched.

prefetch_pending `property`

prefetch_pending: bool

Return whether a deferred warm-up is exposed but has not yet made the cache warm.

True means a DeferredPrefetchHandle is available and no async prefetch task is running, yet the cache is not warm, so the caller must trigger the handle (run_sync / run_async) to warm it. This makes the PrefetchStrategy.ASYNC "no running event loop" degradation discoverable beyond the logged warning.

provider_registry `property`

provider_registry: ModelProviderRegistry

Return the registry of third-party model providers owned by this manager.

_CATEGORY_TO_HORDE_TYPE `class-attribute`

_CATEGORY_TO_HORDE_TYPE: dict[
    MODEL_REFERENCE_CATEGORY, HordeModelType
] = {image_generation: "image", text_generation: "text"}

get_instance `classmethod`

get_instance() -> ModelReferenceManager

Get the singleton instance of ModelReferenceManager.

Returns:

ModelReferenceManager ( ModelReferenceManager ) –

The singleton instance.

Raises:

RuntimeError –

If the instance has not been created yet.

Source code in src/horde_model_reference/model_reference_manager.py

@classmethod
def get_instance(cls) -> ModelReferenceManager:
    """Return the existing singleton, failing if none has been created.

    The class-level lock is held while the singleton slot is read.

    Returns:
        ModelReferenceManager: The singleton instance.

    Raises:
        RuntimeError: If the instance has not been created yet.

    """
    with cls._lock:
        current = cls._instance
        if current is not None:
            return current
        raise RuntimeError("ModelReferenceManager instance has not been created yet.")

has_instance `classmethod`

has_instance() -> bool

Check if the singleton instance has been created.

Returns:

bool ( bool ) –

True if the instance exists, False otherwise.

Source code in src/horde_model_reference/model_reference_manager.py

@classmethod
def has_instance(cls) -> bool:
    """Report whether the singleton slot is currently populated.

    The class-level lock is held while the slot is read.

    Returns:
        bool: True if the instance exists, False otherwise.

    """
    with cls._lock:
        if cls._instance is None:
            return False
        return True

reset `classmethod`

reset() -> None

Destroy the singleton instance so a fresh one can be created.

Intended for testing and development only. Production code should not call this - the singleton is designed to live for the process lifetime.

Source code in src/horde_model_reference/model_reference_manager.py

@classmethod
def reset(cls) -> None:
    """Discard the singleton so that a new one can be constructed.

    Intended for testing and development only. Production code should not
    call this - the singleton is designed to live for the process lifetime.

    While holding the class-level lock, the deferred prefetch handle is dropped,
    an unfinished async prefetch task is cancelled and detached, and the
    singleton slot is cleared. Does nothing when no instance exists.
    """
    with cls._lock:
        current = cls._instance
        if current is not None:
            if current._deferred_prefetch_handle is not None:
                current._deferred_prefetch_handle = None

            pending = current._async_prefetch_task
            # Only a task that is still running is cancelled and detached.
            if pending is not None and not pending.done():
                pending.cancel()
                current._async_prefetch_task = None

            cls._instance = None

_create_backend `staticmethod`

_create_backend(
    base_path: str | Path,
    replicate_mode: ReplicateMode,
    audit_writer: AuditTrailWriter | None,
    offline: bool = False,
) -> ModelReferenceBackend

Create the appropriate backend based on mode and settings.

Parameters:

base_path (str | Path) –

Base path for model reference files.
replicate_mode (ReplicateMode) –

The replication mode.
audit_writer (AuditTrailWriter | None) –

Optional audit writer used by write-capable backends.
offline (bool, default: False ) –

If True, return a read-only local-disk backend that never downloads, regardless of replicate_mode. Used by subprocesses whose parent owns downloading.

Returns:

ModelReferenceBackend ( ModelReferenceBackend ) –

The configured backend instance.

Source code in src/horde_model_reference/model_reference_manager.py

@staticmethod
def _create_backend(
    base_path: str | Path,
    replicate_mode: ReplicateMode,
    audit_writer: AuditTrailWriter | None,
    offline: bool = False,
) -> ModelReferenceBackend:
    """Build the backend that matches the requested mode and the current settings.

    Selection order:

    1. ``offline`` - a ``LocalReadOnlyBackend``, regardless of ``replicate_mode``.
    2. Any mode other than PRIMARY - an ``HTTPBackend`` wrapping a ``GitHubBackend``
       when a PRIMARY API URL is configured, otherwise the bare ``GitHubBackend``.
    3. PRIMARY - a ``FileSystemBackend`` (seeded from GitHub first when seeding is
       enabled and category files are missing), wrapped in a ``RedisBackend`` when
       Redis is enabled in settings.

    Args:
        base_path: Base path for model reference files.
        replicate_mode: The replication mode.
        audit_writer: Optional audit writer used by write-capable backends.
        offline: If True, return a read-only local-disk backend that never downloads,
            regardless of replicate_mode. Used by subprocesses whose parent owns downloading.

    Returns:
        ModelReferenceBackend: The configured backend instance.

    """
    settings = horde_model_reference_settings
    logger.debug(
        f"Creating backend with replicate_mode={replicate_mode}, base_path={base_path}, offline={offline}",
    )

    if offline:
        logger.info("Using LocalReadOnlyBackend (offline=True); references are read from disk, never downloaded")
        return LocalReadOnlyBackend(
            base_path=base_path,
            cache_ttl_seconds=settings.cache_ttl_seconds,
        )

    if replicate_mode != ReplicateMode.PRIMARY:
        logger.debug("Creating backend for REPLICA mode")

        replica_github = GitHubBackend(
            base_path=base_path,
            replicate_mode=ReplicateMode.REPLICA,
        )

        if not settings.primary_api_url:
            logger.info("Using GitHubBackend only (no PRIMARY API configured)")
            return replica_github

        logger.info(f"Using HTTPBackend with PRIMARY API: {settings.primary_api_url}")
        return HTTPBackend(
            primary_api_url=settings.primary_api_url,
            github_backend=replica_github,
            cache_ttl_seconds=settings.cache_ttl_seconds,
            timeout_seconds=settings.primary_api_timeout,
            enable_github_fallback=settings.enable_github_fallback,
        )

    logger.debug("Creating backend for PRIMARY mode")

    # With seeding enabled, the backend is told to skip its startup metadata
    # population; it is run explicitly below once the seed check has finished.
    defer_metadata = True if settings.github_seed_enabled else False

    primary_fs = FileSystemBackend(
        base_path=base_path,
        cache_ttl_seconds=settings.cache_ttl_seconds,
        replicate_mode=ReplicateMode.PRIMARY,
        skip_startup_metadata_population=defer_metadata,
        audit_writer=audit_writer,
    )

    if settings.github_seed_enabled:
        logger.info("GitHub seeding enabled for PRIMARY mode")

        category_paths = primary_fs.get_all_category_file_paths()
        absent = [cat for cat, path in category_paths.items() if path is None or not path.exists()]

        if absent:
            logger.info(f"Missing categories detected: {absent}. Seeding from GitHub...")

            seeder = GitHubBackend(
                base_path=base_path,
                replicate_mode=ReplicateMode.PRIMARY,
            )
            seeder.fetch_all_categories(force_refresh=True)
            logger.info("GitHub seeding completed")

            logger.info("Populating metadata after GitHub seeding")
        else:
            logger.debug("All files exist, skipping GitHub seeding")
            logger.info("Running metadata population check (seeding was skipped)")

        # Metadata population runs on both paths, seeded or not.
        primary_fs.ensure_all_metadata_populated()

    if not settings.redis.use_redis:
        logger.info("Using FileSystemBackend for single-worker PRIMARY deployment")
        return primary_fs

    # Imported only on the path that actually uses Redis.
    from horde_model_reference.backends.redis_backend import RedisBackend

    logger.info("Wrapping FileSystemBackend with RedisBackend for distributed caching")
    return RedisBackend(
        file_backend=primary_fs,
        redis_settings=settings.redis,
        cache_ttl_seconds=settings.cache_ttl_seconds,
    )

__new__

__new__(
    *,
    backend: ModelReferenceBackend | None = None,
    base_path: str
    | Path = horde_model_reference_paths.base_path,
    replicate_mode: ReplicateMode = horde_model_reference_settings.replicate_mode,
    prefetch_strategy: PrefetchStrategy = PrefetchStrategy.LAZY,
    offline: bool = horde_model_reference_settings.offline,
) -> ModelReferenceManager

Create a new instance of ModelReferenceManager.

Uses the singleton pattern to ensure only one instance exists to avoid multiple downloads and conversions. Subsequent instantiations will return the same instance, and an attempt to re-instantiate with different settings will raise an exception.

Parameters:

backend (ModelReferenceBackend | None, default: None ) –

The backend to use for fetching model references. If None, the appropriate backend is selected automatically based on replicate_mode and settings: in PRIMARY mode, FileSystemBackend (optionally wrapped with RedisBackend if configured); in REPLICA mode, HTTPBackend (if a PRIMARY API URL is configured) or GitHubBackend (fallback). Defaults to None.
base_path (str | Path, default: base_path ) –

The base path to use for storing model reference files. Only used if backend is None. Defaults to horde_model_reference_paths.base_path.
replicate_mode (ReplicateMode, default: replicate_mode ) –

The replicate mode to use: PRIMARY (the local filesystem is the source of truth) or REPLICA (fetch from the PRIMARY API or GitHub). Only used if backend is None. Defaults to horde_model_reference_settings.replicate_mode.
prefetch_strategy (PrefetchStrategy, default: LAZY ) –

Controls whether initial cache warm-up is skipped (LAZY/NONE), performed synchronously, deferred, or executed via background async task. Defaults to PrefetchStrategy.LAZY.
offline (bool, default: offline ) –

If True, read references from local disk only via LocalReadOnlyBackend and never download (no GitHub / PRIMARY API / Redis), regardless of replicate_mode. Intended for subprocesses whose parent already downloaded the reference files. Defaults to horde_model_reference_settings.offline.

Returns:

ModelReferenceManager ( ModelReferenceManager ) –

The singleton instance of ModelReferenceManager.

Raises:

RuntimeError –

If an attempt is made to re-instantiate with different settings.

Source code in src/horde_model_reference/model_reference_manager.py

def __new__(
    cls,
    *,
    backend: ModelReferenceBackend | None = None,
    base_path: str | Path = horde_model_reference_paths.base_path,
    replicate_mode: ReplicateMode = horde_model_reference_settings.replicate_mode,
    prefetch_strategy: PrefetchStrategy = PrefetchStrategy.LAZY,
    offline: bool = horde_model_reference_settings.offline,
) -> ModelReferenceManager:
    """Create a new instance of ModelReferenceManager.

    Uses the singleton pattern to ensure only one instance exists to avoid multiple downloads and conversions.
    Subsequent instantiations will return the same instance, and an attempt to re-instantiate with different
    settings will raise an exception.

    The singleton is only registered once its backend, replicate mode and supporting stores have been set up
    successfully. If that setup raises, no instance is registered and a later call starts from scratch.

    Args:
        backend: The backend to use for fetching model references.
            If None, automatically selects the appropriate backend based on replicate_mode and settings:
            - PRIMARY mode: FileSystemBackend (optionally wrapped with RedisBackend if configured)
            - REPLICA mode: HTTPBackend (if PRIMARY API URL configured) or GitHubBackend (fallback)
            Defaults to None.
        base_path: The base path to use for storing model reference files.
            Only used if backend is None. Defaults to horde_model_reference_paths.base_path.
        replicate_mode: The replicate mode to use.
            - PRIMARY: Local filesystem is source of truth
            - REPLICA: Fetch from PRIMARY API or GitHub
            Only used if backend is None. Defaults to horde_model_reference_settings.replicate_mode.
        prefetch_strategy: Controls whether initial cache warm-up is skipped (LAZY/NONE),
            performed synchronously, deferred, or executed via background async task.
            Values that are not already a PrefetchStrategy are coerced with ``PrefetchStrategy(value)``.
            Defaults to PrefetchStrategy.LAZY.
        offline: If True, read references from local disk only via LocalReadOnlyBackend and never
            download (no GitHub / PRIMARY API / Redis), regardless of replicate_mode. Intended for
            subprocesses whose parent already downloaded the reference files.
            Defaults to horde_model_reference_settings.offline.

    Returns:
        ModelReferenceManager: The singleton instance of ModelReferenceManager.

    Raises:
        ValueError: If prefetch_strategy cannot be coerced to a PrefetchStrategy member.
        RuntimeError: If the backend's replicate mode does not match the requested mode, or if an
            attempt is made to re-instantiate with a different backend, offline flag, replicate mode
            or prefetch strategy.

    """
    if not isinstance(prefetch_strategy, PrefetchStrategy):
        try:
            prefetch_strategy = PrefetchStrategy(prefetch_strategy)
        except ValueError as exc:  # pragma: no cover - defensive branch
            raise ValueError(
                f"prefetch_strategy must be one of: {', '.join(strategy.value for strategy in PrefetchStrategy)}"
            ) from exc

    with cls._lock:
        if not cls._instance:
            # Configure a local object and publish it as the singleton only after the fallible
            # setup below has succeeded. Publishing first would leave a half-initialised
            # singleton behind whenever backend creation or mode validation raised, and every
            # later construction would then fail on the missing attributes.
            instance = super().__new__(cls)

            audit_writer: AuditTrailWriter | None = None
            if horde_model_reference_settings.audit.enabled:
                audit_writer = AuditTrailWriter(
                    root_path=horde_model_reference_paths.audit_path,
                    max_file_size_bytes=horde_model_reference_settings.audit.max_segment_bytes,
                )

            if backend is None:
                backend = cls._create_backend(
                    base_path=base_path,
                    replicate_mode=replicate_mode,
                    audit_writer=audit_writer,
                    offline=offline,
                )

            # Offline backends are REPLICA-shaped regardless of the requested mode; align the
            # manager's recorded mode to the backend so the mode-match assertion below holds and
            # downstream code does not assume PRIMARY write capability.
            if offline:
                replicate_mode = backend.replicate_mode

            backend_mode = backend.replicate_mode
            if backend_mode != replicate_mode:
                raise RuntimeError(
                    "Backend replicate_mode does not match requested ModelReferenceManager configuration. "
                    f"Backend mode: {backend_mode}, requested mode: {replicate_mode}."
                )

            instance.backend = backend
            instance._replicate_mode = replicate_mode
            instance._offline = offline
            if backend.supports_writes():
                # Write-side collaborators are only built for backends that accept writes.
                instance._audit_writer = audit_writer
                instance._pending_queue_service = cls._build_pending_queue_service(
                    audit_writer=audit_writer,
                )
                instance._group_alias_store = GroupAliasStore(
                    file_path=horde_model_reference_paths.group_aliases_path,
                )
                instance._group_family_store = GroupFamilyStore(
                    file_path=horde_model_reference_paths.group_families_path,
                )
                instance._group_schema_store = GroupSchemaStore(
                    file_path=horde_model_reference_paths.group_schemas_path,
                    alias_store=instance._group_alias_store,
                )
            else:
                instance._audit_writer = None
                instance._pending_queue_service = None
                instance._group_alias_store = None
                instance._group_family_store = None
                instance._group_schema_store = None
            instance._cached_records = {}
            instance._deferred_prefetch_handle = None
            instance._async_prefetch_task = None
            instance._provider_registry = ModelProviderRegistry()

            # Register invalidation callback so backend can notify us when cache is stale
            instance.backend.register_invalidation_callback(instance._on_backend_invalidated)

            # Publish before the warm-up: a failed prefetch still leaves a usable, fully
            # configured singleton, as it did before this change.
            cls._instance = instance
            instance._apply_prefetch_strategy(strategy=prefetch_strategy)
        else:
            if backend is not None and backend is not cls._instance.backend:
                raise RuntimeError(
                    "ModelReferenceManager is a singleton and has already been instantiated "
                    "with a different backend."
                )
            if offline != cls._instance._offline:
                raise RuntimeError(
                    "ModelReferenceManager is a singleton and has already been instantiated with a different "
                    f"offline setting.\nExisting offline={cls._instance._offline}; new offline={offline}."
                )
            # The replicate mode is only compared for online managers: offline managers record
            # the backend's mode rather than the requested one (see the first-construction branch).
            if not offline and replicate_mode != cls._instance._replicate_mode:
                raise RuntimeError(
                    "ModelReferenceManager is a singleton and has already been instantiated with different "
                    "settings.\nExisting settings: "
                    f"replicate_mode={cls._instance._replicate_mode}.\n"
                    "New settings: "
                    f"replicate_mode={replicate_mode}."
                )
            if prefetch_strategy != cls._instance._prefetch_strategy:
                raise RuntimeError(
                    "ModelReferenceManager is a singleton and has already been instantiated with different "
                    "settings."
                    f"\nExisting prefetch_strategy={cls._instance._prefetch_strategy.value};"
                    f" new prefetch_strategy={prefetch_strategy.value}."
                )

    return cls._instance

_apply_prefetch_strategy

_apply_prefetch_strategy(
    *, strategy: PrefetchStrategy
) -> None

Apply the configured prefetch strategy once the backend is available.

Source code in src/horde_model_reference/model_reference_manager.py

def _apply_prefetch_strategy(self, *, strategy: PrefetchStrategy) -> None:
    """Record ``strategy`` on the manager and carry out the warm-up it asks for.

    Any previously stored deferred handle or async task reference is cleared first.

    Args:
        strategy: The prefetch strategy to apply.

    Raises:
        ValueError: If ``strategy`` matches none of the handled strategies.

    """
    self._prefetch_strategy = strategy
    self._deferred_prefetch_handle = None
    self._async_prefetch_task = None

    if strategy in (PrefetchStrategy.LAZY, PrefetchStrategy.NONE):
        # Nothing is fetched up-front for these strategies.
        logger.debug(f"prefetch skipped because strategy={strategy.value}")
    elif strategy is PrefetchStrategy.SYNC:
        # Blocking fetch on the calling thread.
        self._fetch_from_backend_if_needed(force_refresh=False)
    elif strategy is PrefetchStrategy.DEFERRED:
        # Only a handle is stored; the caller decides when to run it.
        self._deferred_prefetch_handle = DeferredPrefetchHandle(manager=self, force_refresh=False)
        logger.info(
            "Deferred prefetch handle created; call run_sync/run_async to warm caches without blocking",
        )
    elif strategy is PrefetchStrategy.ASYNC:
        self._schedule_async_prefetch(force_refresh=False)
    else:
        raise ValueError(f"Unsupported prefetch strategy: {strategy}")

_on_backend_invalidated

_on_backend_invalidated(
    category: MODEL_REFERENCE_CATEGORY,
) -> None

Callback invoked by the backend when a category's cache is invalidated.

This ensures the pydantic model cache stays in sync with backend invalidations.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The category that was invalidated.

Source code in src/horde_model_reference/model_reference_manager.py

def _on_backend_invalidated(self, category: MODEL_REFERENCE_CATEGORY) -> None:
    """Handle a backend notification that a category's data has been invalidated.

    Drops the manager's cached pydantic records for that category so they are not
    served after the backend has invalidated its own copy.

    Args:
        category: The category that was invalidated.

    """
    logger.debug(f"Backend invalidated category {category}, clearing pydantic cache")
    self._invalidate_cache(category=category)

_invalidate_cache

_invalidate_cache(
    category: MODEL_REFERENCE_CATEGORY | None = None,
) -> None

Invalidate the cached pydantic model references.

Parameters:

category (MODEL_REFERENCE_CATEGORY | None, default: None ) –

If provided, only invalidate the specific category. If None, invalidate the entire cache.

Source code in src/horde_model_reference/model_reference_manager.py

def _invalidate_cache(self, category: MODEL_REFERENCE_CATEGORY | None = None) -> None:
    """Drop cached pydantic model references, for one category or for all of them.

    Args:
        category: The category to drop from the cache. When None, the whole cache
            is replaced with an empty dict.

    """
    with self._lock:
        if category is not None:
            logger.debug(f"Invalidating cached pydantic records for category: {category}.")
            # pop with a default so an uncached category is a no-op rather than a KeyError
            self._cached_records.pop(category, None)
            return

        logger.debug("Invalidating entire cached pydantic records.")
        self._cached_records = {}

invalidate_category_cache

invalidate_category_cache(
    category: MODEL_REFERENCE_CATEGORY,
) -> None

Explicitly invalidate cached data for a category.

Intended for use by the apply workflow after a successful backend write, so stale data is never served regardless of backend callback timing.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The category whose cache should be dropped.

Source code in src/horde_model_reference/model_reference_manager.py

def invalidate_category_cache(self, category: MODEL_REFERENCE_CATEGORY) -> None:
    """Drop the cached records for ``category`` on request.

    Public entry point over the internal cache invalidation. Intended for the apply
    workflow to call after a successful backend write, so stale data is not served
    regardless of when the backend's own invalidation callback fires.

    Args:
        category: The category whose cache should be dropped.

    """
    self._invalidate_cache(category=category)

_fetch_from_backend_if_needed

_fetch_from_backend_if_needed(
    force_refresh: bool,
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None]

Fetch references from backend if needed.

Parameters:

force_refresh (bool) –

Whether to force refresh all categories.

Source code in src/horde_model_reference/model_reference_manager.py

def _fetch_from_backend_if_needed(
    self,
    force_refresh: bool,
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None]:
    """Ask the backend for every category's raw payload.

    Args:
        force_refresh: Whether to force refresh all categories; forwarded to the backend as-is.

    Returns:
        Whatever the backend's ``fetch_all_categories`` returns.

    """
    backend = self.backend
    all_payloads = backend.fetch_all_categories(force_refresh=force_refresh)
    return all_payloads

_fetch_from_backend_if_needed_async `async`

_fetch_from_backend_if_needed_async(
    force_refresh: bool, httpx_client: AsyncClient | None
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None]

Asynchronously fetch references from backend if needed.

Parameters:

force_refresh (bool) –

Whether to force refresh all categories.
httpx_client (AsyncClient | None) –

An optional httpx async client to use.

Source code in src/horde_model_reference/model_reference_manager.py

async def _fetch_from_backend_if_needed_async(
    self,
    force_refresh: bool,
    httpx_client: httpx.AsyncClient | None,
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None]:
    """Ask the backend for every category's raw payload without blocking the event loop.

    Args:
        force_refresh: Whether to force refresh all categories; forwarded to the backend as-is.
        httpx_client: An optional httpx async client, forwarded to the backend as-is.

    Returns:
        Whatever the backend's ``fetch_all_categories_async`` resolves to.

    """
    pending_fetch = self.backend.fetch_all_categories_async(
        force_refresh=force_refresh,
        httpx_client=httpx_client,
    )
    return await pending_fetch

_build_pending_queue_service `staticmethod`

_build_pending_queue_service(
    *, audit_writer: AuditTrailWriter | None
) -> PendingQueueService | None

Create the pending queue service when enabled.

Source code in src/horde_model_reference/model_reference_manager.py

@staticmethod
def _build_pending_queue_service(
    *,
    audit_writer: AuditTrailWriter | None,
) -> PendingQueueService | None:
    """Build the pending queue service, or return None when the queue is disabled in settings.

    Args:
        audit_writer: Audit trail writer handed to the service; may be None.

    Returns:
        A PendingQueueService backed by a store rooted at the configured pending queue
        path, or None when ``pending_queue.enabled`` is false.

    """
    if horde_model_reference_settings.pending_queue.enabled:
        # The pending-queue modules are only imported when the feature is switched on.
        from horde_model_reference.pending_queue.service import PendingQueueService
        from horde_model_reference.pending_queue.store import PendingQueueStore

        queue_store = PendingQueueStore(root_path=horde_model_reference_paths.pending_queue_path)
        return PendingQueueService(store=queue_store, audit_writer=audit_writer)

    return None

create_deferred_prefetch_handle

create_deferred_prefetch_handle(
    *, force_refresh: bool = False
) -> DeferredPrefetchHandle

Create a deferred prefetch handle tied to this manager.

Parameters:

force_refresh (bool, default: False ) –

Whether the handle should bypass backend caches.

Returns:

DeferredPrefetchHandle ( DeferredPrefetchHandle ) –

Handle that can execute the warm-up later.

Source code in src/horde_model_reference/model_reference_manager.py

def create_deferred_prefetch_handle(
    self,
    *,
    force_refresh: bool = False,
) -> DeferredPrefetchHandle:
    """Build a deferred prefetch handle bound to this manager and remember it.

    The new handle replaces whatever handle the manager was previously holding.

    Args:
        force_refresh: Whether the handle should bypass backend caches.

    Returns:
        DeferredPrefetchHandle: Handle that can execute the warm-up later.

    """
    self._deferred_prefetch_handle = DeferredPrefetchHandle(manager=self, force_refresh=force_refresh)
    return self._deferred_prefetch_handle

_schedule_async_prefetch

_schedule_async_prefetch(*, force_refresh: bool) -> None

Schedule an async cache warm-up when an event loop is available.

Source code in src/horde_model_reference/model_reference_manager.py

def _schedule_async_prefetch(self, *, force_refresh: bool) -> None:
    """Schedule an async cache warm-up when an event loop is available.

    A deferred prefetch handle is always created and stored on the manager. When an
    event loop is running, the handle's ``run_async`` coroutine is scheduled on it
    and the resulting task is kept in ``_async_prefetch_task``. When no loop is
    running, a warning is logged, no task is created, and the stored handle is left
    for the caller to run manually.

    Args:
        force_refresh: Whether the warm-up should bypass backend caches.

    """
    handle = self.create_deferred_prefetch_handle(force_refresh=force_refresh)

    try:
        loop = asyncio.get_running_loop()
    except RuntimeError:
        # get_running_loop raises RuntimeError when called outside a running loop.
        logger.warning(
            "PrefetchStrategy.ASYNC requested but no running event loop detected; "
            "exposing deferred handle for manual execution instead.",
        )
        self._async_prefetch_task = None
        return

    logger.info("Scheduling asynchronous prefetch warm-up task")
    task = loop.create_task(handle.run_async())
    self._async_prefetch_task = task

    def _log_completion(completed: asyncio.Task[None]) -> None:
        # A cancelled task raises CancelledError from result()/exception(). That is a
        # BaseException, so it must be checked for explicitly or it escapes the callback.
        if completed.cancelled():
            logger.debug("Deferred async prefetch task was cancelled before completion")
            return

        failure = completed.exception()
        if failure is not None:
            # Best-effort logging only; f-string to match the rest of the file's log calls.
            logger.error(f"Deferred async prefetch failed: {failure}")

    task.add_done_callback(_log_completion)

warm_cache_async `async`

warm_cache_async(
    *,
    force_refresh: bool = False,
    httpx_client: AsyncClient | None = None,
) -> None

Warm cached pydantic records using backend async APIs.

Parameters:

force_refresh (bool, default: False ) –

Whether to bypass backend caches while warming.
httpx_client (AsyncClient | None, default: None ) –

Optional shared async client for HTTP backends.

Source code in src/horde_model_reference/model_reference_manager.py

async def warm_cache_async(
    self,
    *,
    force_refresh: bool = False,
    httpx_client: httpx.AsyncClient | None = None,
) -> None:
    """Populate the cached pydantic records through the async retrieval path.

    Delegates to ``get_all_model_references_or_none_async`` and discards its result.

    Args:
        force_refresh: Whether to bypass backend caches while warming; passed on as
            ``overwrite_existing``.
        httpx_client: Optional shared async client for HTTP backends.

    """
    warm_up = self.get_all_model_references_or_none_async(
        overwrite_existing=force_refresh,
        httpx_client=httpx_client,
    )
    await warm_up

ensure_ready

ensure_ready(*, overwrite_existing: bool = False) -> None

Ensure cached references exist synchronously (sync mirror of :meth:ensure_ready_async).

Useful for warming the cache up-front from synchronous code - or for completing a deferred PrefetchStrategy.ASYNC warm-up that degraded because no event loop was running at construction. After this returns, :attr:is_warm is True.

Parameters:

overwrite_existing (bool, default: False ) –

Whether to bypass backend caches while warming.

Source code in src/horde_model_reference/model_reference_manager.py

def ensure_ready(self, *, overwrite_existing: bool = False) -> None:
    """Load all model references synchronously (sync counterpart of :meth:`ensure_ready_async`).

    Lets synchronous code warm the cache up-front, for example after a
    ``PrefetchStrategy.ASYNC`` warm-up was not scheduled because no event loop was
    running at construction.

    Args:
        overwrite_existing: Whether to bypass backend caches while warming.

    """
    # Only the loading side effect matters here; the returned mapping is discarded.
    _ = self.get_all_model_references_or_none(overwrite_existing=overwrite_existing)

ensure_ready_async `async`

ensure_ready_async(
    *,
    overwrite_existing: bool = False,
    httpx_client: AsyncClient | None = None,
) -> None

Ensure cached references exist by delegating to warm_cache_async.

Parameters:

overwrite_existing (bool, default: False ) –

Whether to bypass backend caches while warming.
httpx_client (AsyncClient | None, default: None ) –

Optional shared async client for HTTP backends.

Source code in src/horde_model_reference/model_reference_manager.py

async def ensure_ready_async(
    self,
    *,
    overwrite_existing: bool = False,
    httpx_client: httpx.AsyncClient | None = None,
) -> None:
    """Load all model references asynchronously by delegating to ``warm_cache_async``.

    Args:
        overwrite_existing: Whether to bypass backend caches while warming; passed on
            as ``force_refresh``.
        httpx_client: Optional shared async client for HTTP backends.

    """
    warm_up = self.warm_cache_async(force_refresh=overwrite_existing, httpx_client=httpx_client)
    await warm_up

supports_metadata

supports_metadata() -> bool

Return whether the active backend tracks per-category metadata.

Metadata (timestamps, operation counts) is typically only available in PRIMARY mode; REPLICA backends return False. Check this before relying on :meth:get_metadata / :meth:last_updated returning a value.

Source code in src/horde_model_reference/model_reference_manager.py

def supports_metadata(self) -> bool:
    """Report whether the active backend tracks per-category metadata.

    Simply relays the backend's own ``supports_metadata()`` answer. Check this before
    relying on :meth:`get_metadata` / :meth:`last_updated` returning a value.
    """
    active_backend = self.backend
    return active_backend.supports_metadata()

get_metadata

get_metadata(
    category: MODEL_REFERENCE_CATEGORY,
    *,
    raise_if_unsupported: bool = False,
) -> CategoryMetadata | None

Return per-category metadata, or None when the backend cannot provide it.

A first-class manager accessor so library consumers do not need to reach into manager.backend and contend with backend-varying supports_metadata().

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The category to fetch metadata for.
raise_if_unsupported (bool, default: False ) –

When True, raise NotImplementedError instead of returning None if the backend does not support metadata.

Returns:

CategoryMetadata | None –

The category metadata, or None when unsupported (and not raising).

Source code in src/horde_model_reference/model_reference_manager.py

def get_metadata(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    *,
    raise_if_unsupported: bool = False,
) -> CategoryMetadata | None:
    """Fetch metadata for ``category`` from the backend, if the backend tracks any.

    Gives callers a manager-level accessor so they need not inspect
    ``manager.backend`` and its ``supports_metadata()`` themselves.

    Args:
        category: The category to fetch metadata for.
        raise_if_unsupported: When ``True``, an unsupported backend results in
            ``NotImplementedError`` rather than a ``None`` return.

    Returns:
        The backend's metadata for the category, or ``None`` when the backend does
        not support metadata and ``raise_if_unsupported`` is false.

    Raises:
        NotImplementedError: If the backend does not support metadata and
            ``raise_if_unsupported`` is true.

    """
    if self.backend.supports_metadata():
        return self.backend.get_metadata(category)

    if raise_if_unsupported:
        raise NotImplementedError(f"{type(self.backend).__name__} does not support metadata tracking")

    return None

get_metadata_async `async`

get_metadata_async(
    category: MODEL_REFERENCE_CATEGORY,
    *,
    raise_if_unsupported: bool = False,
) -> CategoryMetadata | None

Async counterpart to :meth:get_metadata.

Source code in src/horde_model_reference/model_reference_manager.py

async def get_metadata_async(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    *,
    raise_if_unsupported: bool = False,
) -> CategoryMetadata | None:
    """Fetch metadata for ``category`` asynchronously (async counterpart to :meth:`get_metadata`).

    Args:
        category: The category to fetch metadata for.
        raise_if_unsupported: When ``True``, an unsupported backend results in
            ``NotImplementedError`` rather than a ``None`` return.

    Returns:
        The backend's metadata for the category, or ``None`` when the backend does
        not support metadata and ``raise_if_unsupported`` is false.

    Raises:
        NotImplementedError: If the backend does not support metadata and
            ``raise_if_unsupported`` is true.

    """
    if self.backend.supports_metadata():
        return await self.backend.get_metadata_async(category)

    if raise_if_unsupported:
        raise NotImplementedError(f"{type(self.backend).__name__} does not support metadata tracking")

    return None

last_updated

last_updated(
    category: MODEL_REFERENCE_CATEGORY,
) -> int | None

Return the unix timestamp of the category's last update, or None.

Convenience over :meth:get_metadata for cheap change-detection polling by library consumers. Returns None when the backend does not track metadata.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The category to inspect.

Returns:

int | None –

The last_updated unix timestamp, or None when unavailable.

Source code in src/horde_model_reference/model_reference_manager.py

def last_updated(self, category: MODEL_REFERENCE_CATEGORY) -> int | None:
    """Look up when ``category`` was last updated.

    A shortcut over :meth:`get_metadata` for callers that only want the timestamp,
    for example to poll cheaply for changes.

    Args:
        category: The category to inspect.

    Returns:
        The ``last_updated`` value from the category's metadata, or ``None`` when
        :meth:`get_metadata` returns no metadata.

    """
    metadata = self.get_metadata(category)
    if metadata is None:
        return None
    return metadata.last_updated

_file_json_dict_to_model_reference `staticmethod`

_file_json_dict_to_model_reference(
    category: MODEL_REFERENCE_CATEGORY,
    file_json_dict: dict[str, Any] | None,
    safe_mode: bool = False,
) -> dict[str, GenericModelRecord] | None

Return a model reference object from a JSON dictionary, or None if conversion failed.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The target model reference category to convert.
file_json_dict (dict[str, Any] | None) –

The dict object representing the model reference.
safe_mode (bool, default: False ) –

Whether to raise exceptions on failure. If False, exceptions are caught and None is returned. Defaults to False.

Returns:

dict[str, GenericModelRecord] | None –

dict[str, GenericModelRecord] | None: The dict representing the model reference, or None if conversion failed.

Source code in src/horde_model_reference/model_reference_manager.py

@staticmethod
def _file_json_dict_to_model_reference(
    category: MODEL_REFERENCE_CATEGORY,
    file_json_dict: dict[str, Any] | None,
    safe_mode: bool = False,
) -> dict[str, GenericModelRecord] | None:
    """Validate a raw JSON dict into pydantic records keyed by record name.

    Args:
        category: The target model reference category to convert. It selects the
            record type, falling back to ``GenericModelRecord`` when the category has
            no entry in the lookup.
        file_json_dict: The dict object representing the model reference. Only its
            values are validated; the resulting mapping is keyed by each record's
            ``name``.
        safe_mode: When True, a conversion failure is re-raised. When False, it is
            logged and None is returned. Defaults to False.

    Returns:
        dict[str, GenericModelRecord] | None: The validated records, or None when the
            input is None, the category is managed elsewhere, or conversion failed
            with ``safe_mode`` off.

    """
    if file_json_dict is None:
        logger.warning(f"File dict json is None for {category}.")
        return None

    if category in categories_managed_elsewhere:
        logger.info(f"Skipping conversion for category: {category} (managed elsewhere)")
        return None

    try:
        record_type = MODEL_RECORD_TYPE_LOOKUP.get(category, GenericModelRecord)
        validated_records = (record_type.model_validate(raw_record) for raw_record in file_json_dict.values())
        # Later records overwrite earlier ones that share a name.
        return {record.name: record for record in validated_records}
    except Exception as e:
        if safe_mode:
            raise e
        logger.exception(f"Failed to convert file dict JSON to model reference for {category}: {e}")
        return None

model_reference_to_json_dict `staticmethod`

model_reference_to_json_dict(
    model_reference: dict[str, GenericModelRecord],
    safe_mode: bool = False,
) -> dict[str, Any] | None

Return a JSON dictionary from a model reference object, or None if conversion failed.

Parameters:

model_reference (dict[str, GenericModelRecord]) –

The model reference object.
safe_mode (bool, default: False ) –

Whether to raise exceptions on failure. If True, exceptions are re-raised; if False, they are caught, logged, and None is returned. Prefer model_reference_to_json_dict_safe() when you want the raising behavior, since its return type is not optional and gives better type hinting. Defaults to False.

Returns:

dict[str, Any] | None –

dict | None: The dict representing the model reference, or None if conversion failed.

Source code in src/horde_model_reference/model_reference_manager.py

@staticmethod
def model_reference_to_json_dict(
    model_reference: dict[str, GenericModelRecord],
    safe_mode: bool = False,
) -> dict[str, Any] | None:
    """Return a JSON dictionary from a model reference object, or None if conversion failed.

    Args:
        model_reference: The model reference object.
        safe_mode: Whether to raise exceptions on failure. If False, exceptions are caught
            and None is returned. Use `model_reference_to_json_dict_safe()` for the better type hinting if you
            intend to use this. Defaults to False.

    Returns:
        dict | None: The dict representing the model reference, or None if conversion failed.

    """
    if model_reference is None:
        raise ValueError("model_reference cannot be None")

    try:
        return {
            name: record.model_dump(
                exclude_unset=True,
            )
            for name, record in model_reference.items()
        }
    except Exception as e:
        if not safe_mode:
            logger.exception(f"Failed to convert model reference to JSON: {e}")
            return None

        raise e

model_reference_to_json_dict_safe `staticmethod`

model_reference_to_json_dict_safe(
    model_reference: dict[str, GenericModelRecord],
) -> dict[str, Any]

Return a JSON dictionary from a model reference object.

Raises an exception if conversion fails.

Parameters:

model_reference (dict[str, GenericModelRecord]) –

The model reference object.

Returns:

dict ( dict[str, Any] ) –

The dict representing the model reference.

Source code in src/horde_model_reference/model_reference_manager.py

@staticmethod
def model_reference_to_json_dict_safe(
    model_reference: dict[str, GenericModelRecord],
) -> dict[str, Any]:
    """Dump a model reference into a plain dict, raising instead of returning None.

    Calls ``model_reference_to_json_dict`` with ``safe_mode=True``, so conversion
    errors propagate to the caller.

    Args:
        model_reference: The model reference object.

    Returns:
        dict: The dict representing the model reference.

    Raises:
        RuntimeError: If the conversion returned None without raising.

    """
    converted = ModelReferenceManager.model_reference_to_json_dict(model_reference, safe_mode=True)

    if converted is not None:
        return converted

    raise RuntimeError("Conversion to JSON dict failed in safe mode, but no exception was raised.")

_get_all_cached_model_references

_get_all_cached_model_references(
    safe_mode: bool = False,
) -> dict[
    MODEL_REFERENCE_CATEGORY,
    dict[str, GenericModelRecord] | None,
]

Get all cached pydantic model references.

Returns:

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None] –

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]: A mapping of model reference categories to their corresponding pydantic model objects.

Source code in src/horde_model_reference/model_reference_manager.py

def _get_all_cached_model_references(
    self,
    safe_mode: bool = False,
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]:
    """Return a shallow copy of the cached pydantic model references.

    Args:
        safe_mode: Accepted for signature parity with the other accessors; this
            method does not read it.

    Returns:
        dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]: A new dict mapping each
            cached category to its records. The per-category values are the cached objects themselves.

    """
    with self._lock:
        cached_count = len(self._cached_records)
        logger.debug(f"Returning {cached_count} cached pydantic model references.")
        snapshot = dict(self._cached_records)
        return snapshot

_evaluate_cache_state

_evaluate_cache_state(
    *, overwrite_existing: bool, safe_mode: bool
) -> tuple[
    bool,
    dict[
        MODEL_REFERENCE_CATEGORY,
        dict[str, GenericModelRecord] | None,
    ],
    list[MODEL_REFERENCE_CATEGORY],
]

Return whether cached data can be reused plus categories needing refresh.

Source code in src/horde_model_reference/model_reference_manager.py

def _evaluate_cache_state(
    self,
    *,
    overwrite_existing: bool,
    safe_mode: bool,
) -> tuple[
    bool,
    dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None],
    list[MODEL_REFERENCE_CATEGORY],
]:
    """Decide whether the cache can be served as-is, and if not, which categories to load.

    Args:
        overwrite_existing: When true, the cache is never reused and every category
            is listed for loading.
        safe_mode: Forwarded to the cached-references accessor on the reuse path.

    Returns:
        A 3-tuple ``(reusable, cached, categories_to_load)``. When the cache is
        reusable it is ``(True, <copy of the cache>, [])``. Otherwise it is
        ``(False, {}, <categories to load>)``.

    """
    with self._lock:
        stale_by_category = {
            category: self.backend.needs_refresh(category) for category in MODEL_REFERENCE_CATEGORY
        }
        every_category_cached = all(category in self._cached_records for category in MODEL_REFERENCE_CATEGORY)
        # A forced overwrite counts as needing a reload, as does any stale category.
        reload_required = overwrite_existing or any(stale_by_category.values())

        if every_category_cached and not reload_required:
            logger.debug("Using fully cached pydantic model references.")
            return True, self._get_all_cached_model_references(safe_mode=safe_mode), []

        # On this path a category is loaded when forced, stale, absent from the cache,
        # or cached as None (``.get`` covers both of the last two).
        categories_to_load = [
            category
            for category in MODEL_REFERENCE_CATEGORY
            if overwrite_existing or self._cached_records.get(category) is None or stale_by_category[category]
        ]

        return False, {}, categories_to_load

_load_categories_from_payload

_load_categories_from_payload(
    *,
    categories_to_load: Iterable[MODEL_REFERENCE_CATEGORY],
    payload: dict[
        MODEL_REFERENCE_CATEGORY, dict[str, Any] | None
    ]
    | None,
    overwrite_existing: bool,
    safe_mode: bool,
) -> None

Convert backend payload into cached pydantic models for selected categories.

Source code in src/horde_model_reference/model_reference_manager.py

def _load_categories_from_payload(
    self,
    *,
    categories_to_load: Iterable[MODEL_REFERENCE_CATEGORY],
    payload: dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None] | None,
    overwrite_existing: bool,
    safe_mode: bool,
) -> None:
    """Turn raw backend JSON into cached model references for the requested categories.

    Categories present in *payload* are taken from it directly. Any requested category
    absent from *payload* is fetched individually through ``self.backend.fetch_category``.
    The converted results are then written to ``self._cached_records`` under ``self._lock``.

    Args:
        categories_to_load: Categories whose cache entries should be (re)built.
        payload: Raw JSON keyed by category; ``None`` or empty is treated as containing nothing.
        overwrite_existing: Passed as ``force_refresh`` to the per-category fallback fetch.
        safe_mode: Forwarded to ``_file_json_dict_to_model_reference``.

    """
    available = payload or {}
    staged: dict[MODEL_REFERENCE_CATEGORY, dict[str, Any] | None] = {}
    absent: list[MODEL_REFERENCE_CATEGORY] = []

    # Single pass: *categories_to_load* may be a one-shot iterable.
    for category in categories_to_load:
        if category not in available:
            absent.append(category)
            continue
        staged[category] = available[category]

    if absent:
        logger.debug(
            "Backend payload missing %d categories; falling back to per-category fetch: %s",
            len(absent),
            absent,
        )
        # Fallback fetches are appended after the categories supplied by the payload.
        staged.update(
            (category, self.backend.fetch_category(category, force_refresh=overwrite_existing))
            for category in absent
        )

    with self._lock:
        for category, raw_json in staged.items():
            self._cached_records[category] = self._file_json_dict_to_model_reference(
                category,
                raw_json,
                safe_mode=safe_mode,
            )

get_all_model_references_or_none

get_all_model_references_or_none(
    overwrite_existing: bool = False,
    *,
    safe_mode: bool = False,
) -> dict[
    MODEL_REFERENCE_CATEGORY,
    dict[str, GenericModelRecord] | None,
]

Return a mapping of all model reference categories to their corresponding model reference objects.

Note that values may be None if the model reference file could not be found or parsed.

Parameters:

overwrite_existing (bool, default: False ) –

Whether to force a redownload of all model reference files. Defaults to False.
safe_mode (bool, default: False ) –

Whether to raise exceptions on failure. If False, exceptions are caught and None is returned for that category. Defaults to False. Use get_all_model_references() for the better type hinting if you intend to use this.

Returns:

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None] –

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]: A mapping of model reference categories to their corresponding model reference objects.

Source code in src/horde_model_reference/model_reference_manager.py

def get_all_model_references_or_none(
    self,
    overwrite_existing: bool = False,
    *,
    safe_mode: bool = False,
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]:
    """Return every model reference category mapped to its records, or to ``None``.

    A value is ``None`` when the model reference file for that category could not be
    found or parsed.

    Args:
        overwrite_existing: Whether to force a redownload of all model reference files.
            Defaults to False.
        safe_mode: Whether to raise exceptions on failure. If False, exceptions are caught
            and None is returned for that category. Defaults to False. Prefer
            `get_all_model_references()` when you want a return type without ``None`` values.

    Returns:
        dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]: A mapping of model
            reference categories to their corresponding model reference objects.

    """
    cache_hit, cached_view, pending_categories = self._evaluate_cache_state(
        overwrite_existing=overwrite_existing,
        safe_mode=safe_mode,
    )
    if cache_hit:
        return cached_view

    logger.debug("Fetching model references from backend as needed.")
    fetched_payload = self._fetch_from_backend_if_needed(force_refresh=overwrite_existing)

    # Nothing to convert: serve whatever the cache currently holds.
    if not pending_categories:
        return self._get_all_cached_model_references(safe_mode=safe_mode)

    logger.debug("Loading %d model reference categories: %s", len(pending_categories), pending_categories)
    self._load_categories_from_payload(
        categories_to_load=pending_categories,
        payload=fetched_payload,
        overwrite_existing=overwrite_existing,
        safe_mode=safe_mode,
    )
    return self._get_all_cached_model_references(safe_mode=safe_mode)

_build_safe_reference_view

_build_safe_reference_view(
    all_references: dict[
        MODEL_REFERENCE_CATEGORY,
        dict[str, GenericModelRecord] | None,
    ],
) -> dict[
    MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]
]

Convert a possibly sparse reference view into a safe mapping with logging.

Parameters:

all_references (dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]) –

Mapping of categories to model reference dicts or None.

Returns:

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]] –

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]: Mapping where missing categories map to empty dicts.

Source code in src/horde_model_reference/model_reference_manager.py

def _build_safe_reference_view(
    self,
    all_references: dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None],
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]:
    """Produce a ``None``-free copy of a reference mapping, logging what was missing.

    Args:
        all_references: Mapping of categories to model reference dicts or None.

    Returns:
        dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]: Categories with a
        reference keep it. Categories whose reference is ``None`` map to an empty dict,
        except those listed in ``categories_managed_elsewhere``, which are left out of
        the result and not reported.

    """
    safe_references: dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]] = {}
    missing_references: list[MODEL_REFERENCE_CATEGORY] = []

    for category in all_references:
        records = all_references[category]
        if records is not None:
            safe_references[category] = records
            continue
        if category in categories_managed_elsewhere:
            # No placeholder and no error report for these categories.
            continue
        missing_references.append(category)
        safe_references[category] = {}

    if missing_references:
        logger.error(f"Missing model references for categories: {missing_references}")

    return safe_references

get_all_model_references

get_all_model_references(
    overwrite_existing: bool = False,
) -> dict[
    MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]
]

Return a mapping of all model reference categories to their corresponding model reference objects.

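Categories whose model reference file could not be found or parsed are logged as errors and returned as empty dicts rather than None (categories managed elsewhere are left out instead). If you need to tell missing model references apart from empty ones, use get_all_model_references_or_none() instead.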

Parameters:

overwrite_existing (bool, default: False ) –

Whether to force a redownload of all model reference files. Defaults to False.

Returns:

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]] –

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]: A mapping of model reference categories to their corresponding model reference objects.

Source code in src/horde_model_reference/model_reference_manager.py

def get_all_model_references(
    self,
    overwrite_existing: bool = False,
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]:
    """Return a mapping of all model reference categories to their model reference objects.

    The data comes from `get_all_model_references_or_none()` (called with its default
    ``safe_mode``) and is then passed through `_build_safe_reference_view()`. Categories
    whose reference is ``None`` are therefore not reported by raising here: they are
    logged as an error and returned as an empty dict, except categories listed in
    ``categories_managed_elsewhere``, which are left out of the result. If you need to
    tell a missing reference apart from an empty one, use
    `get_all_model_references_or_none()` instead.

    Args:
        overwrite_existing: Whether to force a redownload of all model reference files.
            Defaults to False.

    Returns:
        dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]: A mapping of model reference
            categories to their corresponding model reference objects, with no ``None`` values.

    """
    all_references = self.get_all_model_references_or_none(overwrite_existing=overwrite_existing)
    return self._build_safe_reference_view(all_references)

get_all_model_references_or_none_async `async`

get_all_model_references_or_none_async(
    overwrite_existing: bool = False,
    *,
    safe_mode: bool = False,
    httpx_client: AsyncClient | None = None,
) -> dict[
    MODEL_REFERENCE_CATEGORY,
    dict[str, GenericModelRecord] | None,
]

Return model references asynchronously without enforcing presence.

Parameters:

overwrite_existing (bool, default: False ) –

Whether to force backend refresh.
safe_mode (bool, default: False ) –

Whether to propagate conversion errors.
httpx_client (AsyncClient | None, default: None ) –

Optional shared async client for HTTP backends.

Returns:

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None] –

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]: Possibly sparse mapping keyed by category.

Source code in src/horde_model_reference/model_reference_manager.py

async def get_all_model_references_or_none_async(
    self,
    overwrite_existing: bool = False,
    *,
    safe_mode: bool = False,
    httpx_client: httpx.AsyncClient | None = None,
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]:
    """Asynchronously return all model references; values may be ``None``.

    Only the backend fetch is awaited. Cache evaluation and payload conversion use the
    same synchronous helpers as `get_all_model_references_or_none()`.

    Args:
        overwrite_existing: Whether to force backend refresh.
        safe_mode: Whether to propagate conversion errors.
        httpx_client: Optional shared async client for HTTP backends.

    Returns:
        dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord] | None]: Possibly
        sparse mapping keyed by category.

    """
    cache_hit, cached_view, pending_categories = self._evaluate_cache_state(
        overwrite_existing=overwrite_existing,
        safe_mode=safe_mode,
    )
    if cache_hit:
        return cached_view

    logger.debug("Asynchronously fetching model references from backend as needed.")
    fetched_payload = await self._fetch_from_backend_if_needed_async(
        force_refresh=overwrite_existing,
        httpx_client=httpx_client,
    )

    # Nothing to convert: serve whatever the cache currently holds.
    if not pending_categories:
        return self._get_all_cached_model_references(safe_mode=safe_mode)

    logger.debug("Loading %d model reference categories via async payload", len(pending_categories))
    self._load_categories_from_payload(
        categories_to_load=pending_categories,
        payload=fetched_payload,
        overwrite_existing=overwrite_existing,
        safe_mode=safe_mode,
    )
    return self._get_all_cached_model_references(safe_mode=safe_mode)

get_all_model_references_async `async`

get_all_model_references_async(
    overwrite_existing: bool = False,
    *,
    httpx_client: AsyncClient | None = None,
) -> dict[
    MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]
]

Return all model references asynchronously, substituting empty dicts for missing categories.

Parameters:

overwrite_existing (bool, default: False ) –

Whether to force backend refresh.
httpx_client (AsyncClient | None, default: None ) –

Optional shared async client for HTTP backends.

Returns:

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]] –

dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]: Mapping with empty dicts substituted for missing categories.

Source code in src/horde_model_reference/model_reference_manager.py

async def get_all_model_references_async(
    self,
    overwrite_existing: bool = False,
    *,
    httpx_client: httpx.AsyncClient | None = None,
) -> dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]:
    """Return all model references asynchronously, with no ``None`` values.

    The data comes from `get_all_model_references_or_none_async()` (called with its
    default ``safe_mode``) and is then passed through `_build_safe_reference_view()`.
    Categories whose reference is ``None`` are not reported by raising here: they are
    logged as an error and returned as an empty dict, except categories listed in
    ``categories_managed_elsewhere``, which are left out of the result.

    Args:
        overwrite_existing: Whether to force backend refresh.
        httpx_client: Optional shared async client for HTTP backends.

    Returns:
        dict[MODEL_REFERENCE_CATEGORY, dict[str, GenericModelRecord]]: Mapping with
        empty dicts substituted for missing categories.

    """
    all_references = await self.get_all_model_references_or_none_async(
        overwrite_existing=overwrite_existing,
        httpx_client=httpx_client,
    )
    return self._build_safe_reference_view(all_references)

get_model_reference_or_none

get_model_reference_or_none(
    category: MODEL_REFERENCE_CATEGORY,
    overwrite_existing: bool = False,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> dict[str, GenericModelRecord] | None

Return the model reference object for a specific category.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The category to retrieve.
overwrite_existing (bool, default: False ) –

Whether to force a redownload. Defaults to False.
source (SourceSelector, default: HORDE_SOURCE_ID ) –

Which source(s) to read from. Defaults to canonical horde data (:data:~horde_model_reference.source_consts.HORDE_SOURCE_ID). Pass "any" to merge all registered providers, or a provider id / sequence of ids to select specific third-party sources. On name collisions the canonical (or earlier-listed) source wins.

Returns:

dict[str, GenericModelRecord] | None –

dict[str, GenericModelRecord] | None: The model reference object for the category, or None if not found.

Source code in src/horde_model_reference/model_reference_manager.py

def get_model_reference_or_none(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    overwrite_existing: bool = False,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> dict[str, GenericModelRecord] | None:
    """Look up the model reference for one category, tolerating absence.

    Args:
        category: The category to retrieve.
        overwrite_existing: Whether to force a redownload. Defaults to False.
        source: Which source(s) to read from. Defaults to canonical horde data
            (:data:`~horde_model_reference.source_consts.HORDE_SOURCE_ID`). Pass
            ``"any"`` to merge all registered providers, or a provider id / sequence
            of ids to select specific third-party sources. On name collisions the
            canonical (or earlier-listed) source wins.

    Returns:
        dict[str, GenericModelRecord] | None: The model reference object for the category,
            or None if not found.

    """
    # Any selector that is not canonical-only goes through the merge helper.
    if not self._is_canonical_only(source):
        return self._merge_sourced_reference(category, source, overwrite_existing=overwrite_existing)

    canonical_references = self.get_all_model_references_or_none(overwrite_existing=overwrite_existing)
    return canonical_references.get(category)

get_model_reference_or_none_async `async`

get_model_reference_or_none_async(
    category: MODEL_REFERENCE_CATEGORY,
    overwrite_existing: bool = False,
    *,
    httpx_client: AsyncClient | None = None,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> dict[str, GenericModelRecord] | None

Return a single category's references asynchronously without strict enforcement.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

Target category to load.
overwrite_existing (bool, default: False ) –

Whether to force backend refresh.
httpx_client (AsyncClient | None, default: None ) –

Optional shared async client for HTTP backends.
source (SourceSelector, default: HORDE_SOURCE_ID ) –

Which source(s) to read from. See :meth:get_model_reference_or_none.

Returns:

dict[str, GenericModelRecord] | None –

dict[str, GenericModelRecord] | None: Mapping of model names or None.

Source code in src/horde_model_reference/model_reference_manager.py

async def get_model_reference_or_none_async(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    overwrite_existing: bool = False,
    *,
    httpx_client: httpx.AsyncClient | None = None,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> dict[str, GenericModelRecord] | None:
    """Asynchronously look up the model reference for one category, tolerating absence.

    Args:
        category: Target category to load.
        overwrite_existing: Whether to force backend refresh.
        httpx_client: Optional shared async client for HTTP backends.
        source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

    Returns:
        dict[str, GenericModelRecord] | None: Mapping of model names or None.

    """
    # Any selector that is not canonical-only goes through the async merge helper.
    if not self._is_canonical_only(source):
        return await self._merge_sourced_reference_async(
            category,
            source,
            overwrite_existing=overwrite_existing,
            httpx_client=httpx_client,
        )

    canonical_references = await self.get_all_model_references_or_none_async(
        overwrite_existing=overwrite_existing,
        httpx_client=httpx_client,
    )
    return canonical_references.get(category)

get_model_reference

get_model_reference(
    category: Literal[audio_generation],
    overwrite_existing: bool = False,
) -> dict[str, AudioGenerationModelRecord]

get_model_reference(
    category: Literal[blip],
    overwrite_existing: bool = False,
) -> dict[str, BlipModelRecord]

get_model_reference(
    category: Literal[clip],
    overwrite_existing: bool = False,
) -> dict[str, ClipModelRecord]

get_model_reference(
    category: Literal[codeformer],
    overwrite_existing: bool = False,
) -> dict[str, CodeformerModelRecord]

get_model_reference(
    category: Literal[controlnet],
    overwrite_existing: bool = False,
) -> dict[str, ControlNetModelRecord]

get_model_reference(
    category: Literal[image_generation],
    overwrite_existing: bool = False,
) -> dict[str, ImageGenerationModelRecord]

get_model_reference(
    category: Literal[text_generation],
    overwrite_existing: bool = False,
) -> dict[str, TextGenerationModelRecord]

get_model_reference(
    category: MODEL_REFERENCE_CATEGORY,
    overwrite_existing: bool = False,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> dict[str, GenericModelRecord]

get_model_reference(
    category: MODEL_REFERENCE_CATEGORY = MODEL_REFERENCE_CATEGORY.image_generation,
    overwrite_existing: bool = False,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> Mapping[str, GenericModelRecord]

Return the model reference object for a specific category.

Raises an exception if the model reference could not be found or parsed. If you want to allow missing model references, use get_model_reference_or_none() instead.

Parameters:

category (MODEL_REFERENCE_CATEGORY, default: image_generation ) –

The category to retrieve.
overwrite_existing (bool, default: False ) –

Whether to force a redownload. Defaults to False.
source (SourceSelector, default: HORDE_SOURCE_ID ) –

Which source(s) to read from. See :meth:get_model_reference_or_none.

Returns:

Mapping[str, GenericModelRecord] –

Mapping[str, GenericModelRecord]: The model reference object for the category.

Source code in src/horde_model_reference/model_reference_manager.py

def get_model_reference(
    self,
    category: MODEL_REFERENCE_CATEGORY = MODEL_REFERENCE_CATEGORY.image_generation,
    overwrite_existing: bool = False,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> Mapping[str, GenericModelRecord]:
    """Return the model reference for one category, insisting that it exists.

    This is the strict counterpart of `get_model_reference_or_none()`; use that method
    if a missing model reference should be tolerated.

    Args:
        category: The category to retrieve.
        overwrite_existing: Whether to force a redownload. Defaults to False.
        source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

    Returns:
        Mapping[str, GenericModelRecord]: The model reference object for the category.

    Raises:
        RuntimeError: If the lookup for the category yields ``None``.

    """
    found_reference = self.get_model_reference_or_none(
        category,
        overwrite_existing=overwrite_existing,
        source=source,
    )
    if found_reference is not None:
        return found_reference

    raise RuntimeError(f"Model reference for category {category} not found or could not be parsed.")

get_model_reference_async `async`

get_model_reference_async(
    category: MODEL_REFERENCE_CATEGORY,
    overwrite_existing: bool = False,
    *,
    httpx_client: AsyncClient | None = None,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> dict[str, GenericModelRecord]

Return a single category's references asynchronously, raising if missing.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

Target category to load.
overwrite_existing (bool, default: False ) –

Whether to force backend refresh.
httpx_client (AsyncClient | None, default: None ) –

Optional shared async client for HTTP backends.
source (SourceSelector, default: HORDE_SOURCE_ID ) –

Which source(s) to read from. See :meth:get_model_reference_or_none.

Returns:

dict[str, GenericModelRecord] –

dict[str, GenericModelRecord]: Mapping of model names for the category.

Raises:

RuntimeError –

If the category is missing or could not be parsed.

Source code in src/horde_model_reference/model_reference_manager.py

async def get_model_reference_async(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    overwrite_existing: bool = False,
    *,
    httpx_client: httpx.AsyncClient | None = None,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> dict[str, GenericModelRecord]:
    """Asynchronously return the model reference for one category, insisting that it exists.

    Args:
        category: Target category to load.
        overwrite_existing: Whether to force backend refresh.
        httpx_client: Optional shared async client for HTTP backends.
        source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

    Returns:
        dict[str, GenericModelRecord]: Mapping of model names for the category.

    Raises:
        RuntimeError: If the category is missing or could not be parsed.

    """
    found_reference = await self.get_model_reference_or_none_async(
        category,
        overwrite_existing=overwrite_existing,
        httpx_client=httpx_client,
        source=source,
    )
    if found_reference is not None:
        return found_reference

    raise RuntimeError(f"Model reference for category {category} not found or could not be parsed.")

get_model_or_none

get_model_or_none(
    category: MODEL_REFERENCE_CATEGORY,
    model_name: str,
    overwrite_existing: bool = False,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> GenericModelRecord | None

Return a specific model from a category.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The category to retrieve.
model_name (str) –

The name of the model within the category.
overwrite_existing (bool, default: False ) –

Whether to force a redownload. Defaults to False.
source (SourceSelector, default: HORDE_SOURCE_ID ) –

Which source(s) to read from. See :meth:get_model_reference_or_none.

Returns:

GenericModelRecord | None –

GenericModelRecord | None: The model record, or None if not found.

Source code in src/horde_model_reference/model_reference_manager.py

def get_model_or_none(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    model_name: str,
    overwrite_existing: bool = False,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> GenericModelRecord | None:
    """Look up a single model record by name, tolerating absence.

    Args:
        category: The category to retrieve.
        model_name: The name of the model within the category.
        overwrite_existing: Whether to force a redownload. Defaults to False.
        source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

    Returns:
        GenericModelRecord | None: The model record, or None when either the category
            reference or the named model is not found.

    """
    category_records = self.get_model_reference_or_none(
        category,
        overwrite_existing=overwrite_existing,
        source=source,
    )
    return None if category_records is None else category_records.get(model_name)

get_model

get_model(
    category: MODEL_REFERENCE_CATEGORY,
    model_name: str,
    overwrite_existing: bool = False,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> GenericModelRecord

Return a specific model from a category.

Raises an exception if the model could not be found or parsed. If you want to allow missing models, use get_model_or_none() instead.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The category to retrieve.
model_name (str) –

The name of the model within the category.
overwrite_existing (bool, default: False ) –

Whether to force a redownload. Defaults to False.
source (SourceSelector, default: HORDE_SOURCE_ID ) –

Which source(s) to read from. See :meth:get_model_reference_or_none.

Returns:

GenericModelRecord ( GenericModelRecord ) –

The model record.

Source code in src/horde_model_reference/model_reference_manager.py

def get_model(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    model_name: str,
    overwrite_existing: bool = False,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> GenericModelRecord:
    """Return a single model record by name, insisting that it exists.

    This is the strict counterpart of `get_model_or_none()`; use that method if a
    missing model should be tolerated.

    Args:
        category: The category to retrieve.
        model_name: The name of the model within the category.
        overwrite_existing: Whether to force a redownload. Defaults to False.
        source: Which source(s) to read from. See :meth:`get_model_reference_or_none`.

    Returns:
        GenericModelRecord: The model record.

    Raises:
        RuntimeError: If *model_name* is not present in the category's reference. Errors
            raised by `get_model_reference()` for the category itself also propagate.

    """
    category_records = self.get_model_reference(
        category,
        overwrite_existing=overwrite_existing,
        source=source,
    )

    found_record = category_records.get(model_name)
    if found_record is not None:
        return found_record

    raise RuntimeError(f"Model {model_name} not found in category {category}.")

get_raw_model_reference_json

get_raw_model_reference_json(
    category: MODEL_REFERENCE_CATEGORY,
    overwrite_existing: bool = False,
) -> dict[str, Any] | None

Return the raw JSON dict for a specific category without pydantic validation.

This method delegates to the backend to fetch the raw JSON data directly, avoiding the overhead of creating pydantic models. Ideal for API endpoints that need fast JSON responses.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The category to retrieve.
overwrite_existing (bool, default: False ) –

Whether to force a redownload. Defaults to False.

Returns:

dict[str, Any] | None –

dict[str, Any] | None: The raw JSON dict for the category, or None if not found.

Source code in src/horde_model_reference/model_reference_manager.py

def get_raw_model_reference_json(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    overwrite_existing: bool = False,
) -> dict[str, Any] | None:
    """Fetch a category's raw JSON dict straight from the backend.

    No pydantic models are built; the backend's result is handed back unchanged, which
    suits API endpoints that need fast JSON responses.

    Args:
        category: The category to retrieve.
        overwrite_existing: Whether to force a redownload. Defaults to False.

    Returns:
        dict[str, Any] | None: The raw JSON dict for the category, or None if not found.

    """
    raw_category_json = self.backend.fetch_category(category, force_refresh=overwrite_existing)
    return raw_category_json

get_raw_model_json

get_raw_model_json(
    category: MODEL_REFERENCE_CATEGORY,
    model_name: str,
    overwrite_existing: bool = False,
) -> dict[str, Any] | None

Return the raw JSON dict for a specific model in a category without pydantic validation.

This method delegates to the backend to fetch the raw JSON data directly, avoiding the overhead of creating pydantic models. Ideal for API endpoints that need fast JSON responses.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

The category to retrieve.
model_name (str) –

The name of the model within the category.
overwrite_existing (bool, default: False ) –

Whether to force a redownload. Defaults to False.

Returns:

dict[str, Any] | None –

dict[str, Any] | None: The raw JSON dict for the model, or None if not found.

Source code in src/horde_model_reference/model_reference_manager.py

def get_raw_model_json(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    model_name: str,
    overwrite_existing: bool = False,
) -> dict[str, Any] | None:
    """Fetch one model's raw JSON dict straight from the backend.

    No pydantic models are built; the category's raw JSON is fetched from the backend
    and the entry for *model_name* is picked out of it, which suits API endpoints that
    need fast JSON responses.

    Args:
        category: The category to retrieve.
        model_name: The name of the model within the category.
        overwrite_existing: Whether to force a redownload. Defaults to False.

    Returns:
        dict[str, Any] | None: The raw JSON dict for the model, or None if either the
            category or the model is not found.

    """
    raw_category_json = self.backend.fetch_category(category, force_refresh=overwrite_existing)
    return None if raw_category_json is None else raw_category_json.get(model_name)

_get_typed_models

_get_typed_models(
    category: MODEL_REFERENCE_CATEGORY,
    *,
    record_type: type[TModelRecord],
) -> dict[str, TModelRecord]

Return a typed mapping for the requested category.

Source code in src/horde_model_reference/model_reference_manager.py

def _get_typed_models(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    *,
    record_type: type[TModelRecord],
) -> dict[str, TModelRecord]:
    """Return the category's records as a dict narrowed to *record_type*.

    Args:
        category: The category to load via `get_model_reference()`.
        record_type: The record class every entry is expected to be an instance of.

    Returns:
        dict[str, TModelRecord]: A new dict of the category's records; empty when the
        category has no records.

    Raises:
        RuntimeError: As soon as a record that is not a *record_type* instance is met.

    """
    category_records = self.get_model_reference(category)
    if not category_records:
        return {}

    narrowed: dict[str, TModelRecord] = {}
    for model_name, candidate in category_records.items():
        if isinstance(candidate, record_type):
            narrowed[model_name] = candidate
            continue
        raise RuntimeError(
            f"Some records in {category.value} category are not {record_type.__name__} instances."
        )

    return narrowed

register_provider

register_provider(
    provider: ModelProvider, *, replace: bool = False
) -> None

Register a third-party :class:ModelProvider for use in reads/queries.

Parameters:

provider (ModelProvider) –

The provider to register.
replace (bool, default: False ) –

If True, replace an existing provider with the same source id.

Raises:

ValueError –

If the source id is reserved/empty, or already registered and replace is False.

Source code in src/horde_model_reference/model_reference_manager.py

def register_provider(
    self,
    provider: ModelProvider,
    *,
    replace: bool = False,
) -> None:
    """Add a third-party :class:`ModelProvider` to this manager's provider registry.

    The call is delegated to the registry's ``register`` method.

    Args:
        provider: The provider to register.
        replace: If ``True``, replace an existing provider with the same source id.

    Raises:
        ValueError: If the source id is reserved/empty, or already registered and
            *replace* is ``False``.

    """
    registry = self._provider_registry
    registry.register(provider, replace=replace)

unregister_provider

unregister_provider(source_id: str) -> bool

Remove the provider registered under source_id.

Returns:

bool ( bool ) –

True if a provider was removed, False otherwise.

Source code in src/horde_model_reference/model_reference_manager.py

def unregister_provider(self, source_id: str) -> bool:
    """Drop the provider registered under *source_id* from the provider registry.

    Args:
        source_id: Source id of the provider to remove.

    Returns:
        bool: ``True`` if a provider was removed, ``False`` otherwise (the registry's
        ``unregister`` result is returned as-is).

    """
    was_removed = self._provider_registry.unregister(source_id)
    return was_removed

list_providers

list_providers() -> list[str]

Return the source ids of all registered providers (registration order).

Source code in src/horde_model_reference/model_reference_manager.py

def list_providers(self) -> list[str]:
    """List the source id of every registered provider (registration order)."""
    provider_ids = self._provider_registry.source_ids()
    return provider_ids

get_provider

get_provider(source_id: str) -> ModelProvider | None

Return the provider registered under source_id, or None.

Source code in src/horde_model_reference/model_reference_manager.py

def get_provider(self, source_id: str) -> ModelProvider | None:
    """Look up the provider registered under *source_id*; ``None`` when there is none."""
    provider = self._provider_registry.get(source_id)
    return provider

_resolve_ordered_source_ids

_resolve_ordered_source_ids(
    selectors: list[str],
) -> list[str]

Return an ordered, de-duplicated list of concrete source ids to read.

Unlike a canonical-first split, this preserves each selector's position so callers control collision precedence (earlier sources win during the setdefault merge). The canonical source (`HORDE_SOURCE_ID`) is treated as just another id and keeps its position wherever it appears in the selector, so ["pending", "horde"] lets the "pending" provider override canonical, while the default ["horde"] is canonical-only.

ANY_SOURCE expands to the canonical source first, then every registered provider in registration order, preserving the historical "canonical wins" default for "any". Explicitly named, unregistered provider ids raise ValueError; ids discovered via ANY_SOURCE are simply the live set and never raise.

Source code in src/horde_model_reference/model_reference_manager.py

def _resolve_ordered_source_ids(
    self,
    selectors: list[str],
) -> list[str]:
    """Expand *selectors* into the concrete source ids to read, in order, without repeats.

    Each selector contributes ids at its own **position**, so the caller decides
    collision precedence (earlier sources win during the ``setdefault`` merge).
    The canonical source (:data:`HORDE_SOURCE_ID`) gets no special placement: it
    keeps its position wherever it appears, so ``["pending", "horde"]`` lets the
    ``"pending"`` provider override canonical, while the default ``["horde"]`` is
    canonical-only.

    ``ANY_SOURCE`` expands to the canonical source **first**, followed by every
    registered provider in registration order, which keeps the historical
    "canonical wins" default for ``"any"``.

    Args:
        selectors: Source ids and/or ``ANY_SOURCE``, in precedence order.

    Returns:
        The resolved source ids; an id that appears more than once is kept only
        at its first position.

    Raises:
        ValueError: If an explicitly named id is neither the canonical source nor
            a registered provider. Ids discovered through ``ANY_SOURCE`` are the
            live registry contents and never raise.

    """
    registry = self._provider_registry
    # An insertion-ordered dict serves as both the ordered result and the "seen" set.
    resolved: dict[str, None] = {}

    for selector in selectors:
        if selector == ANY_SOURCE:
            candidates = [HORDE_SOURCE_ID, *registry.source_ids()]
        elif selector == HORDE_SOURCE_ID:
            candidates = [HORDE_SOURCE_ID]
        elif registry.has(selector):
            candidates = [selector]
        else:
            raise ValueError(
                f"No provider registered under source id {selector!r}. "
                f"Registered providers: {registry.source_ids()}.",
            )

        for source_id in candidates:
            # setdefault leaves an already-seen id at its original position.
            resolved.setdefault(source_id, None)

    return list(resolved)

_is_canonical_only `staticmethod`

_is_canonical_only(source: SourceSelector) -> bool

Return whether source selects canonical data exclusively (the default).

Source code in src/horde_model_reference/model_reference_manager.py

@staticmethod
def _is_canonical_only(source: SourceSelector) -> bool:
    """Tell whether *source* normalizes to exactly the canonical source (the default)."""
    normalized = normalize_source_selector(source)
    return normalized == [HORDE_SOURCE_ID]

_gather_sourced_records

_gather_sourced_records(
    category: MODEL_REFERENCE_CATEGORY,
    source: SourceSelector,
    *,
    overwrite_existing: bool = False,
) -> tuple[
    list[GenericModelRecord],
    list[str],
    dict[str, SourceOutcome],
]

Collect records and aligned source ids for category from the selected sources.

Records are returned in selector order (the canonical source is read at its position in the selector rather than always first), so the first source to provide a given name wins during the setdefault merge. Duplicates are intentionally retained so callers/queries can detect collisions. A provider raising or returning None is logged and skipped (error isolation).

The third return value maps every selected source id to its outcome ("ok" / "empty" / "error") so callers can distinguish a source that failed from one that simply had nothing for this category.

Source code in src/horde_model_reference/model_reference_manager.py

def _gather_sourced_records(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    source: SourceSelector,
    *,
    overwrite_existing: bool = False,
) -> tuple[list[GenericModelRecord], list[str], dict[str, SourceOutcome]]:
    """Collect the records for *category* from every selected source, with provenance.

    Sources are visited in the order produced by
    :meth:`_resolve_ordered_source_ids`, so the returned records follow
    **selector order** and the canonical source is read at its own position
    rather than always first. Name collisions are not resolved here: duplicates
    stay in the list so callers/queries can detect them, or merge them
    first-source-wins. A provider that raises is logged and skipped (error
    isolation); a provider that returns nothing is skipped as well.

    Args:
        category: The category to read.
        source: The source selector to normalize and resolve.
        overwrite_existing: Forwarded to the canonical read as
            ``overwrite_existing`` and to providers as ``force_refresh``.

    Returns:
        A ``(records, sources, status)`` tuple. ``sources[i]`` is the source id
        that supplied ``records[i]``. ``status`` maps every *selected* source id
        to ``"ok"``, ``"empty"`` or ``"error"``, so a failed source can be told
        apart from one that simply had nothing for this category.

    Raises:
        ValueError: Propagated from :meth:`_resolve_ordered_source_ids` when an
            explicitly named provider id is not registered.

    """
    source_ids = self._resolve_ordered_source_ids(normalize_source_selector(source))

    gathered: list[GenericModelRecord] = []
    origins: list[str] = []
    outcomes: dict[str, SourceOutcome] = {}

    def _absorb(origin: str, batch: list[GenericModelRecord]) -> None:
        # Extend both lists together so origins[i] always describes gathered[i].
        outcomes[origin] = "ok"
        gathered.extend(batch)
        origins.extend([origin] * len(batch))

    for source_id in source_ids:
        # Every selected source starts as "empty"; only a successful, non-empty
        # read or a raised exception changes that.
        outcomes[source_id] = "empty"

        if source_id == HORDE_SOURCE_ID:
            all_references = self.get_all_model_references_or_none(
                overwrite_existing=overwrite_existing,
            )
            canonical = all_references.get(category)
            if canonical:
                _absorb(HORDE_SOURCE_ID, list(canonical.values()))
            continue

        provider = self._provider_registry.get(source_id)
        if provider is None:  # pragma: no cover - guarded by _resolve_ordered_source_ids
            continue
        if not provider.serves_category(category):
            continue

        try:
            provided = provider.fetch_category(category, force_refresh=overwrite_existing)
        except Exception as exc:
            outcomes[source_id] = "error"
            logger.error(
                f"Provider {source_id!r} raised while fetching category {category.value!r}; skipping: {exc}",
            )
            continue

        if provided:
            _absorb(source_id, list(provided.values()))

    return gathered, origins, outcomes

_merge_sourced_reference

_merge_sourced_reference(
    category: MODEL_REFERENCE_CATEGORY,
    source: SourceSelector,
    *,
    overwrite_existing: bool = False,
) -> dict[str, GenericModelRecord] | None

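Return a merged name -> record mapping across source, where the first source in selector order wins a name collision (canonical data wins only when the canonical source is listed first, as it is for "any").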

Returns None only when no source produced any records for the category, preserving the *_or_none contract.

Source code in src/horde_model_reference/model_reference_manager.py

def _merge_sourced_reference(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    source: SourceSelector,
    *,
    overwrite_existing: bool = False,
) -> dict[str, GenericModelRecord] | None:
    """Return a first-source-wins merged ``name -> record`` mapping across *source*.

    Records come from :meth:`_gather_sourced_records` in selector order and the
    first record seen for a name is kept. Canonical data therefore wins a
    collision only when the canonical source precedes the colliding provider in
    the selector (as it does for ``"any"``); ``["pending", "horde"]`` lets the
    ``"pending"`` provider win instead.

    Args:
        category: The category to read.
        source: The source selector to gather from.
        overwrite_existing: Forwarded unchanged to :meth:`_gather_sourced_records`.

    Returns:
        The merged mapping, keyed by record name in first-seen order, or ``None``
        only when no source produced any records for the category (preserving the
        ``*_or_none`` contract).

    """
    # Only the records matter for the merge; provenance and per-source status
    # are intentionally discarded here.
    records, _sources, _status = self._gather_sourced_records(
        category,
        source,
        overwrite_existing=overwrite_existing,
    )
    if not records:
        return None

    merged: dict[str, GenericModelRecord] = {}
    for record in records:
        # setdefault keeps the earliest record for a name, i.e. the earlier source wins.
        merged.setdefault(record.name, record)
    return merged

_gather_sourced_records_async `async`

_gather_sourced_records_async(
    category: MODEL_REFERENCE_CATEGORY,
    source: SourceSelector,
    *,
    overwrite_existing: bool = False,
    httpx_client: AsyncClient | None = None,
) -> tuple[
    list[GenericModelRecord],
    list[str],
    dict[str, SourceOutcome],
]

Async counterpart to `_gather_sourced_records`, using each provider's async fetch.

Source code in src/horde_model_reference/model_reference_manager.py

async def _gather_sourced_records_async(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    source: SourceSelector,
    *,
    overwrite_existing: bool = False,
    httpx_client: httpx.AsyncClient | None = None,
) -> tuple[list[GenericModelRecord], list[str], dict[str, SourceOutcome]]:
    """Collect the records for *category* from every selected source, awaiting each read.

    Async counterpart to :meth:`_gather_sourced_records`: sources are visited one
    after another in resolved selector order, duplicates are retained, and a
    provider that raises is logged and skipped.

    Args:
        category: The category to read.
        source: The source selector to normalize and resolve.
        overwrite_existing: Forwarded to the canonical read as
            ``overwrite_existing`` and to providers as ``force_refresh``.
        httpx_client: Passed only to the canonical read; providers are not given it.

    Returns:
        A ``(records, sources, status)`` tuple in which ``sources[i]`` is the
        source id that supplied ``records[i]`` and ``status`` maps every selected
        source id to ``"ok"``, ``"empty"`` or ``"error"``.

    """
    source_ids = self._resolve_ordered_source_ids(normalize_source_selector(source))

    gathered: list[GenericModelRecord] = []
    origins: list[str] = []
    outcomes: dict[str, SourceOutcome] = {}

    def _absorb(origin: str, batch: list[GenericModelRecord]) -> None:
        # Extend both lists together so origins[i] always describes gathered[i].
        outcomes[origin] = "ok"
        gathered.extend(batch)
        origins.extend([origin] * len(batch))

    for source_id in source_ids:
        # Every selected source starts as "empty"; only a successful, non-empty
        # read or a raised exception changes that.
        outcomes[source_id] = "empty"

        if source_id == HORDE_SOURCE_ID:
            all_references = await self.get_all_model_references_or_none_async(
                overwrite_existing=overwrite_existing,
                httpx_client=httpx_client,
            )
            canonical = all_references.get(category)
            if canonical:
                _absorb(HORDE_SOURCE_ID, list(canonical.values()))
            continue

        provider = self._provider_registry.get(source_id)
        if provider is None:  # pragma: no cover - guarded by _resolve_ordered_source_ids
            continue
        if not provider.serves_category(category):
            continue

        try:
            provided = await provider.fetch_category_async(category, force_refresh=overwrite_existing)
        except Exception as exc:
            outcomes[source_id] = "error"
            logger.error(
                f"Provider {source_id!r} raised while fetching category {category.value!r}; skipping: {exc}",
            )
            continue

        if provided:
            _absorb(source_id, list(provided.values()))

    return gathered, origins, outcomes

_merge_sourced_reference_async `async`

_merge_sourced_reference_async(
    category: MODEL_REFERENCE_CATEGORY,
    source: SourceSelector,
    *,
    overwrite_existing: bool = False,
    httpx_client: AsyncClient | None = None,
) -> dict[str, GenericModelRecord] | None

Async counterpart to `_merge_sourced_reference`.

Source code in src/horde_model_reference/model_reference_manager.py

async def _merge_sourced_reference_async(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    source: SourceSelector,
    *,
    overwrite_existing: bool = False,
    httpx_client: httpx.AsyncClient | None = None,
) -> dict[str, GenericModelRecord] | None:
    """Return a first-source-wins merged ``name -> record`` mapping across *source*.

    Async counterpart to :meth:`_merge_sourced_reference`. Records come from
    :meth:`_gather_sourced_records_async` in selector order and the first record
    seen for a name is kept, so canonical data wins a collision only when the
    canonical source precedes the colliding provider in the selector.

    Args:
        category: The category to read.
        source: The source selector to gather from.
        overwrite_existing: Forwarded unchanged to the async gather.
        httpx_client: Forwarded unchanged to the async gather.

    Returns:
        The merged mapping, keyed by record name in first-seen order, or ``None``
        only when no source produced any records for the category.

    """
    # Only the records matter for the merge; provenance and per-source status
    # are intentionally discarded here.
    records, _sources, _status = await self._gather_sourced_records_async(
        category,
        source,
        overwrite_existing=overwrite_existing,
        httpx_client=httpx_client,
    )
    if not records:
        return None

    merged: dict[str, GenericModelRecord] = {}
    for record in records:
        # setdefault keeps the earliest record for a name, i.e. the earlier source wins.
        merged.setdefault(record.name, record)
    return merged

query

query(
    category: Literal["image_generation", image_generation],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ImageGenerationQuery

query(
    category: Literal["text_generation", text_generation],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> TextModelQuery

query(
    category: Literal["controlnet", controlnet],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ControlNetQuery

query(
    category: Literal["blip", blip],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[BlipModelRecord, GenericFieldName]

query(
    category: Literal["clip", clip],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[ClipModelRecord, GenericFieldName]

query(
    category: Literal["codeformer", codeformer],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[CodeformerModelRecord, GenericFieldName]

query(
    category: Literal["esrgan", esrgan],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[EsrganModelRecord, GenericFieldName]

query(
    category: Literal["gfpgan", gfpgan],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[GfpganModelRecord, GenericFieldName]

query(
    category: Literal["safety_checker", safety_checker],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[SafetyCheckerModelRecord, GenericFieldName]

query(
    category: Literal["audio_generation", audio_generation],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[
    AudioGenerationModelRecord, GenericFieldName
]

query(
    category: Literal["video_generation", video_generation],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[
    VideoGenerationModelRecord, GenericFieldName
]

query(
    category: Literal["miscellaneous", miscellaneous],
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[MiscellaneousModelRecord, GenericFieldName]

query(
    category: MODEL_REFERENCE_CATEGORY | str,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> ModelQuery[
    GenericModelRecord,
    GenericFieldName
    | ImageGenFieldName
    | TextGenFieldName
    | ControlNetFieldName,
]

query(
    category: MODEL_REFERENCE_CATEGORY | str,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> (
    ImageGenerationQuery
    | TextModelQuery
    | ControlNetQuery
    | ModelQuery[
        GenericModelRecord,
        GenericFieldName
        | ImageGenFieldName
        | TextGenFieldName
        | ControlNetFieldName,
    ]
)

Return the query builder for a single category.

This is the single entry point for filtering, sorting, and aggregating model records. The returned builder is typed to the category's record class; the three domain categories return enriched subclasses with extra helpers (ImageGenerationQuery, TextModelQuery, ControlNetQuery).

Parameters:

category (MODEL_REFERENCE_CATEGORY | str) –

The model reference category to query, as the `MODEL_REFERENCE_CATEGORY` member from `horde_model_reference.meta_consts` (recommended, for precise return typing) or its string value.
source (SourceSelector, default: HORDE_SOURCE_ID ) –

Which source(s) to include. Defaults to canonical horde data (`HORDE_SOURCE_ID` from `horde_model_reference.source_consts`). Pass "any" to merge all registered providers, or a provider id / ordered sequence of ids. When more than one source is selected, results are de-duplicated by name (canonical / earlier-listed source wins); use `ModelQuery.duplicate_names` to detect collisions and `ModelQuery.where_source` to filter by provenance.

Returns:

ImageGenerationQuery | TextModelQuery | ControlNetQuery | ModelQuery[GenericModelRecord, GenericFieldName | ImageGenFieldName | TextGenFieldName | ControlNetFieldName] –

A ModelQuery (or typed subclass) ready for chaining filters.

Source code in src/horde_model_reference/model_reference_manager.py

def query(
    self,
    category: MODEL_REFERENCE_CATEGORY | str,
    *,
    source: SourceSelector = HORDE_SOURCE_ID,
) -> (
    ImageGenerationQuery
    | TextModelQuery
    | ControlNetQuery
    | ModelQuery[GenericModelRecord, GenericFieldName | ImageGenFieldName | TextGenFieldName | ControlNetFieldName]
):
    """Return the query builder for a single category.

    This is the single entry point for filtering, sorting, and aggregating model
    records. The returned builder is typed to the category's record class; the
    three domain categories return enriched subclasses with extra helpers
    (``ImageGenerationQuery``, ``TextModelQuery``, ``ControlNetQuery``).

    Args:
        category: The model reference category to query, as the
            :class:`~horde_model_reference.meta_consts.MODEL_REFERENCE_CATEGORY`
            member (recommended, for precise return typing) or its string value.
        source: Which source(s) to include. Defaults to canonical horde data
            (:data:`~horde_model_reference.source_consts.HORDE_SOURCE_ID`). Pass
            ``"any"`` to merge all registered providers, or a provider id / ordered
            sequence of ids. When more than one source is selected, results are
            de-duplicated by name (canonical / earlier-listed source wins); use
            :meth:`~horde_model_reference.query.ModelQuery.duplicate_names` to detect
            collisions and :meth:`~horde_model_reference.query.ModelQuery.where_source`
            to filter by provenance.

    Returns:
        A ``ModelQuery`` (or typed subclass) ready for chaining filters.

    """
    category = MODEL_REFERENCE_CATEGORY(category)
    canonical_only = self._is_canonical_only(source)

    if category == MODEL_REFERENCE_CATEGORY.image_generation:
        if canonical_only:
            return build_image_query(
                self._get_typed_models(category, record_type=ImageGenerationModelRecord),
            )
        img_records, img_sources, img_status = self._gather_typed_sourced(
            category,
            record_type=ImageGenerationModelRecord,
            source=source,
        )
        return ImageGenerationQuery(
            img_records,
            ImageGenerationModelRecord,
            sources=img_sources,
            source_status=img_status,
        )

    if category == MODEL_REFERENCE_CATEGORY.text_generation:
        if canonical_only:
            return build_text_query(
                self._get_typed_models(category, record_type=TextGenerationModelRecord),
            )
        txt_records, txt_sources, txt_status = self._gather_typed_sourced(
            category,
            record_type=TextGenerationModelRecord,
            source=source,
        )
        return TextModelQuery(
            txt_records,
            TextGenerationModelRecord,
            sources=txt_sources,
            source_status=txt_status,
        )

    if category == MODEL_REFERENCE_CATEGORY.controlnet:
        if canonical_only:
            return build_controlnet_query(
                self._get_typed_models(category, record_type=ControlNetModelRecord),
            )
        cn_records, cn_sources, cn_status = self._gather_typed_sourced(
            category,
            record_type=ControlNetModelRecord,
            source=source,
        )
        return ControlNetQuery(
            cn_records,
            ControlNetModelRecord,
            sources=cn_sources,
            source_status=cn_status,
        )

    record_type = MODEL_RECORD_TYPE_LOOKUP.get(category, GenericModelRecord)
    if canonical_only:
        return build_query(self._get_typed_models(category, record_type=record_type), record_type)
    sourced_records, sourced_sources, sourced_status = self._gather_typed_sourced(
        category,
        record_type=record_type,
        source=source,
    )
    return ModelQuery(sourced_records, record_type, sources=sourced_sources, source_status=sourced_status)

_gather_typed_sourced

_gather_typed_sourced(
    category: MODEL_REFERENCE_CATEGORY,
    *,
    record_type: type[TModelRecord],
    source: SourceSelector,
) -> tuple[
    list[TModelRecord], list[str], dict[str, SourceOutcome]
]

Gather records (and aligned sources) for category, validating their type.

Raises:

RuntimeError –

If any source supplies a record that is not an instance of record_type (or a subclass of it).

Source code in src/horde_model_reference/model_reference_manager.py

def _gather_typed_sourced(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    *,
    record_type: type[TModelRecord],
    source: SourceSelector,
) -> tuple[list[TModelRecord], list[str], dict[str, SourceOutcome]]:
    """Gather the sourced records for *category* and check each against *record_type*.

    The records, aligned source ids and per-source status come straight from
    :meth:`_gather_sourced_records`; only the record list is rebuilt, after every
    element has passed the ``isinstance`` check.

    Args:
        category: The category to read.
        record_type: The record class (or a base class) every record must be an
            instance of.
        source: The source selector to gather from.

    Returns:
        A ``(records, sources, status)`` tuple with ``records`` narrowed to
        *record_type*.

    Raises:
        RuntimeError: If any source supplies a record that is not an instance of
            *record_type* (or a subclass of it). The first offending record aborts
            the gather.

    """
    records, sources, status = self._gather_sourced_records(category, source)

    validated: list[TModelRecord] = []
    for candidate in records:
        if isinstance(candidate, record_type):
            validated.append(candidate)
            continue
        raise RuntimeError(
            f"A source for category {category.value} supplied record {candidate.name!r} "
            f"that is not a {record_type.__name__} instance.",
        )

    return validated, sources, status

query_all

query_all() -> ModelQuery[
    GenericModelRecord,
    GenericFieldName
    | ImageGenFieldName
    | TextGenFieldName
    | ControlNetFieldName,
]

Return a query builder spanning all categories.

Returns:

ModelQuery[GenericModelRecord, GenericFieldName | ImageGenFieldName | TextGenFieldName | ControlNetFieldName] –

A ModelQuery[GenericModelRecord] over every cached record.

Source code in src/horde_model_reference/model_reference_manager.py

def query_all(
    self,
) -> ModelQuery[GenericModelRecord, GenericFieldName | ImageGenFieldName | TextGenFieldName | ControlNetFieldName]:
    """Build a single query object covering the records of all categories.

    Returns:
        A ``ModelQuery[GenericModelRecord]`` built by ``build_cross_category_query``
        from the result of :meth:`get_all_model_references`.

    """
    return build_cross_category_query(self.get_all_model_references())

get_popular_models `async`

get_popular_models(
    category: MODEL_REFERENCE_CATEGORY,
    *,
    limit: int = 10,
    sort_by: Literal[
        "worker_count",
        "usage_day",
        "usage_month",
        "usage_total",
    ] = "worker_count",
    include_workers: bool = False,
) -> list[PopularModelResult]

Return models ranked by live Horde popularity metrics.

Requires the Horde public API to be reachable. Only image_generation and text_generation categories have Horde API data; other categories return an empty list.

Parameters:

category (MODEL_REFERENCE_CATEGORY) –

Model category to rank.
limit (int, default: 10 ) –

Maximum number of results.
sort_by (Literal['worker_count', 'usage_day', 'usage_month', 'usage_total'], default: 'worker_count' ) –

Metric to rank by.
include_workers (bool, default: False ) –

Whether to fetch per-worker details (slower).

Returns:

list[PopularModelResult] –

A list of PopularModelResult sorted by the chosen metric.

Source code in src/horde_model_reference/model_reference_manager.py

async def get_popular_models(
    self,
    category: MODEL_REFERENCE_CATEGORY,
    *,
    limit: int = 10,
    sort_by: Literal["worker_count", "usage_day", "usage_month", "usage_total"] = "worker_count",
    include_workers: bool = False,
) -> list[PopularModelResult]:
    """Rank the models of *category* by live Horde popularity metrics.

    Requires the Horde public API to be reachable. A category with no entry in
    ``_CATEGORY_TO_HORDE_TYPE``, or with no model reference available, yields an
    empty list without contacting the API.

    Args:
        category: Model category to rank.
        limit: Maximum number of results. The ranking is cut to this length
            before names without a reference record are dropped, so fewer
            results may come back.
        sort_by: Metric to rank by, highest first. Entries without the requested
            data rank as ``0.0``.
        include_workers: Whether to fetch per-worker details (slower).

    Returns:
        A list of ``PopularModelResult`` sorted by the chosen metric.

    """
    from horde_model_reference.integrations.data_merger import (
        CombinedModelStatistics,
        PopularModelResult,
        merge_category_with_horde_data,
    )
    from horde_model_reference.integrations.horde_api_integration import HordeAPIIntegration

    horde_type: HordeModelType | None = self._CATEGORY_TO_HORDE_TYPE.get(category)
    if horde_type is None:
        return []

    reference = self.get_model_reference_or_none(category)
    if reference is None:
        return []

    status_by_model, stats_by_model, workers_by_model = await HordeAPIIntegration().get_combined_data_indexed(
        model_type=horde_type,
        include_workers=include_workers,
    )

    combined = merge_category_with_horde_data(
        model_names=reference.keys(),
        horde_status=status_by_model,
        horde_stats=stats_by_model,
        workers=workers_by_model,
    )

    # Any value other than the day/month options falls through to the total.
    usage_field = {"usage_day": "day", "usage_month": "month"}.get(sort_by, "total")

    def _metric(entry: tuple[str, Any]) -> float:
        candidate = entry[1]
        if not isinstance(candidate, CombinedModelStatistics):
            return 0.0
        if sort_by == "worker_count":
            return float(candidate.worker_count)
        usage = candidate.usage_stats
        return 0.0 if usage is None else float(getattr(usage, usage_field))

    top_entries = sorted(combined.items(), key=_metric, reverse=True)[:limit]

    return [
        PopularModelResult(
            name=model_name,
            record=model_record.model_dump(mode="json", exclude_none=True),
            stats=model_stats,
        )
        for model_name, model_stats in top_entries
        if (model_record := reference.get(model_name)) is not None
    ]

DeferredPrefetchHandle

Bases: Awaitable[None]

Encapsulates a deferred eager fetch for a ModelReferenceManager.

Source code in src/horde_model_reference/model_reference_manager.py

class DeferredPrefetchHandle(Awaitable[None]):
    """A warm-up for a `ModelReferenceManager` that the caller triggers later.

    The handle only remembers the manager and the refresh flag. Nothing is
    fetched until ``run_sync()`` or ``run_async()`` is called, or the handle is
    awaited.
    """

    def __init__(
        self,
        *,
        manager: ModelReferenceManager,
        force_refresh: bool,
    ) -> None:
        """Remember the target manager and whether the warm-up should force a refresh."""
        self._manager, self._force_refresh = manager, force_refresh

    @property
    def force_refresh(self) -> bool:
        """Whether executing this handle forces a backend refresh."""
        return self._force_refresh

    def run_sync(self) -> None:
        """Run the deferred warm-up now, blocking the current thread.

        Delegates to :meth:`ModelReferenceManager.ensure_ready`, which warms the
        manager's converted-record cache (not just the backend layer) so the next
        read is served without a backend fetch or pydantic conversion - leaving
        :attr:`ModelReferenceManager.is_warm` ``True`` afterwards.
        """
        manager = self._manager
        manager.ensure_ready(overwrite_existing=self._force_refresh)

    async def run_async(
        self,
        *,
        httpx_client: httpx.AsyncClient | None = None,
    ) -> None:
        """Run the deferred warm-up asynchronously, warming the manager's record cache.

        Args:
            httpx_client: Optional client forwarded to
                :meth:`ModelReferenceManager.ensure_ready_async`.
        """
        manager = self._manager
        await manager.ensure_ready_async(
            overwrite_existing=self._force_refresh,
            httpx_client=httpx_client,
        )

    def __await__(self) -> Generator[Any]:
        """Make ``await handle`` equivalent to ``await handle.run_async()``."""
        warm_up = self.run_async()
        return warm_up.__await__()

_manager `instance-attribute`

_manager = manager

_force_refresh `instance-attribute`

_force_refresh = force_refresh

force_refresh `property`

force_refresh: bool

Whether this handle forces a backend refresh when executed.

`__init__`

__init__(
    *, manager: ModelReferenceManager, force_refresh: bool
) -> None

Store the manager reference and desired refresh semantics.

Source code in src/horde_model_reference/model_reference_manager.py

def __init__(
    self,
    *,
    manager: ModelReferenceManager,
    force_refresh: bool,
) -> None:
    """Remember the target manager and whether the warm-up should force a refresh."""
    self._manager, self._force_refresh = manager, force_refresh

run_sync

run_sync() -> None

Execute the deferred warm-up synchronously on the current thread.

Warms the manager's converted-record cache (not just the backend layer) so the next read is served without a backend fetch or pydantic conversion, leaving `ModelReferenceManager.is_warm` set to `True` afterwards.

Source code in src/horde_model_reference/model_reference_manager.py

def run_sync(self) -> None:
    """Run the deferred warm-up now, blocking the current thread.

    Delegates to :meth:`ModelReferenceManager.ensure_ready`, which warms the
    manager's converted-record cache (not just the backend layer) so the next
    read is served without a backend fetch or pydantic conversion - leaving
    :attr:`ModelReferenceManager.is_warm` ``True`` afterwards.
    """
    manager = self._manager
    manager.ensure_ready(overwrite_existing=self._force_refresh)

run_async `async`

run_async(
    *, httpx_client: AsyncClient | None = None
) -> None

Execute the deferred warm-up asynchronously, warming the manager's record cache.

Source code in src/horde_model_reference/model_reference_manager.py

async def run_async(
    self,
    *,
    httpx_client: httpx.AsyncClient | None = None,
) -> None:
    """Run the deferred warm-up asynchronously, warming the manager's record cache.

    Args:
        httpx_client: Optional client forwarded to
            :meth:`ModelReferenceManager.ensure_ready_async`.
    """
    manager = self._manager
    await manager.ensure_ready_async(
        overwrite_existing=self._force_refresh,
        httpx_client=httpx_client,
    )

`__await__`

__await__() -> Generator[Any]

Allow awaiting the handle directly as sugar for run_async().

Source code in src/horde_model_reference/model_reference_manager.py

def __await__(self) -> Generator[Any]:
    """Make the handle itself awaitable; ``await handle`` is shorthand for ``await handle.run_async()``.

    The coroutine is created with ``run_async``'s default arguments and its
    own ``__await__`` iterator is returned.
    """
    warm_up = self.run_async()
    return warm_up.__await__()

model_reference_manager

TModelRecord module-attribute

__all__ module-attribute

PrefetchStrategy

LAZY class-attribute instance-attribute

SYNC class-attribute instance-attribute

DEFERRED class-attribute instance-attribute

ASYNC class-attribute instance-attribute

NONE class-attribute instance-attribute

ModelReferenceManager

backend instance-attribute

_cached_records instance-attribute

_instance class-attribute instance-attribute

_replicate_mode class-attribute instance-attribute

_offline class-attribute instance-attribute

_prefetch_strategy class-attribute instance-attribute

_deferred_prefetch_handle class-attribute instance-attribute

_async_prefetch_task class-attribute instance-attribute

_provider_registry instance-attribute

_audit_writer class-attribute instance-attribute

_pending_queue_service class-attribute instance-attribute

_group_alias_store class-attribute instance-attribute

_group_family_store class-attribute instance-attribute

_group_schema_store class-attribute instance-attribute

_lock class-attribute instance-attribute

prefetch_strategy property

offline property

pending_queue_service property

group_alias_store property

group_family_store property

group_schema_store property

deferred_prefetch_handle property

is_warm property

prefetch_pending property

provider_registry property

_CATEGORY_TO_HORDE_TYPE class-attribute

get_instance classmethod

has_instance classmethod

reset classmethod

_create_backend staticmethod

__new__

_apply_prefetch_strategy

_on_backend_invalidated

_invalidate_cache

invalidate_category_cache

_fetch_from_backend_if_needed

_fetch_from_backend_if_needed_async async

_build_pending_queue_service staticmethod

create_deferred_prefetch_handle

_schedule_async_prefetch

warm_cache_async async

ensure_ready

ensure_ready_async async

supports_metadata

get_metadata

get_metadata_async async

last_updated

_file_json_dict_to_model_reference staticmethod

model_reference_to_json_dict staticmethod

model_reference_to_json_dict_safe staticmethod

_get_all_cached_model_references

_evaluate_cache_state

_load_categories_from_payload

get_all_model_references_or_none

_build_safe_reference_view

get_all_model_references

get_all_model_references_or_none_async async

get_all_model_references_async async

get_model_reference_or_none

get_model_reference_or_none_async async

get_model_reference

get_model_reference_async async

get_model_or_none

get_model

get_raw_model_reference_json

get_raw_model_json

_get_typed_models

register_provider

unregister_provider

list_providers

TModelRecord `module-attribute`

__all__ `module-attribute`

LAZY `class-attribute` `instance-attribute`

SYNC `class-attribute` `instance-attribute`

DEFERRED `class-attribute` `instance-attribute`

ASYNC `class-attribute` `instance-attribute`

NONE `class-attribute` `instance-attribute`

backend `instance-attribute`

_cached_records `instance-attribute`

_instance `class-attribute` `instance-attribute`

_replicate_mode `class-attribute` `instance-attribute`

_offline `class-attribute` `instance-attribute`

_prefetch_strategy `class-attribute` `instance-attribute`

_deferred_prefetch_handle `class-attribute` `instance-attribute`

_async_prefetch_task `class-attribute` `instance-attribute`

_provider_registry `instance-attribute`

_audit_writer `class-attribute` `instance-attribute`

_pending_queue_service `class-attribute` `instance-attribute`

_group_alias_store `class-attribute` `instance-attribute`

_group_family_store `class-attribute` `instance-attribute`

_group_schema_store `class-attribute` `instance-attribute`

_lock `class-attribute` `instance-attribute`

prefetch_strategy `property`

offline `property`

pending_queue_service `property`

group_alias_store `property`

group_family_store `property`

group_schema_store `property`

deferred_prefetch_handle `property`

is_warm `property`

prefetch_pending `property`

provider_registry `property`

_CATEGORY_TO_HORDE_TYPE `class-attribute`

get_instance `classmethod`

has_instance `classmethod`

reset `classmethod`

_create_backend `staticmethod`

__new__

_fetch_from_backend_if_needed_async `async`

_build_pending_queue_service `staticmethod`

warm_cache_async `async`

ensure_ready_async `async`

get_metadata_async `async`

_file_json_dict_to_model_reference `staticmethod`

model_reference_to_json_dict `staticmethod`

model_reference_to_json_dict_safe `staticmethod`

get_all_model_references_or_none_async `async`

get_all_model_references_async `async`

get_model_reference_or_none_async `async`

get_model_reference_async `async`

_is_canonical_only `staticmethod`

_gather_sourced_records_async `async`

_merge_sourced_reference_async `async`

get_popular_models `async`

_manager `instance-attribute`

_force_refresh `instance-attribute`

force_refresh `property`

__init__

run_async `async`

__await__