Core-Readout Models — Full Module

For the main API reference with class details, see the Models overview.

This page shows the complete module contents.

BaseCoreReadout

BaseCoreReadout(
    core: Core,
    readout: MultiReadoutBase,
    learning_rate: float,
    loss: Module | None = None,
    validation_loss: Module | None = None,
    data_info: dict[str, Any] | None = None,
)

Bases: LightningModule

Base module for models combining a shared core and a multi-session readout. All models following the Core Readout pattern should inherit from this class.

This LightningModule encapsulates a model made of a shared core and a flexible multi-session readout, suitable for training across-session architectures. It defines training, validation, and testing steps, provides hooks for optimizer and scheduler configuration, and methods for handling data info and visualization.

Initializes a BaseCoreReadout module.

PARAMETER	DESCRIPTION
`core`	The shared feature extraction core network. TYPE: `Core`
`readout`	The multi-session readout module mapping core features to neuron outputs per session. TYPE: `MultiReadoutBase`
`learning_rate`	Learning rate for network training. TYPE: `float`
`loss`	Loss function for training. Defaults to PoissonLoss3d if None. TYPE: `Module` DEFAULT: `None`
`validation_loss`	Loss used to compute correlation performance metric. Defaults to CorrelationLoss3d (avg=True) if None. TYPE: `Module` DEFAULT: `None`
`data_info`	Dictionary containing data-specific metadata, such as input_shape, session neuron counts, etc. If None, defaults to empty dict. TYPE: `dict[str, Any]` DEFAULT: `None`

Source code in openretina/models/core_readout.py

def __init__(
    self,
    core: Core,
    readout: MultiReadoutBase,
    learning_rate: float,
    loss: nn.Module | None = None,
    validation_loss: nn.Module | None = None,
    data_info: dict[str, Any] | None = None,
):
    """
    Initializes a BaseCoreReadout module.

    Args:
        core (Core): The shared feature extraction core network.
        readout (MultiReadoutBase): The multi-session readout module mapping core features to neuron outputs
            per session.
        learning_rate (float): Learning rate for network training.
        loss (nn.Module, optional): Loss function for training. Defaults to PoissonLoss3d if None.
        validation_loss (nn.Module, optional): Loss used to compute correlation performance metric.
            Defaults to CorrelationLoss3d (avg=True) if None.
        data_info (dict[str, Any], optional): Dictionary containing data-specific metadata, such as input_shape,
            session neuron counts, etc. If None, defaults to empty dict.
    """
    super().__init__()

    self.core = core
    self.readout = readout
    self.learning_rate = learning_rate
    self.loss = loss if loss is not None else PoissonLoss3d()
    self.validation_loss = validation_loss if validation_loss is not None else CorrelationLoss3d(avg=True)
    if data_info is None:
        data_info = {}
    self.data_info = data_info

    # Finally, save hyperparameters without logging them to the logger objects for now
    self.save_hyperparameters(logger=False)

pretrained_cfg `property`

pretrained_cfg: dict[str, Any]

Alias for data_info, following timm (Pytorch Image Models) conventions.

save_weight_visualizations

save_weight_visualizations(
    folder_path: str,
    file_format: str = "jpg",
    state_suffix: str = "",
) -> None

Save weight visualizations for core and readout modules.

PARAMETER	DESCRIPTION
`folder_path`	Base directory to save visualizations TYPE: `str`
`file_format`	Image format for saved files TYPE: `str` DEFAULT: `'jpg'`
`state_suffix`	Optional suffix for state identification TYPE: `str` DEFAULT: `''`

Source code in openretina/models/core_readout.py

def save_weight_visualizations(self, folder_path: str, file_format: str = "jpg", state_suffix: str = "") -> None:
    """
    Save weight visualizations for core and readout modules.

    Args:
        folder_path: Base directory to save visualizations
        file_format: Image format for saved files
        state_suffix: Optional suffix for state identification
    """

    # Helper function to call save_weight_visualizations with dynamic parameter support
    def _call_save_viz(module: Any, subfolder: str) -> None:
        full_path = os.path.join(folder_path, subfolder)

        # Check if the method supports state_suffix parameter
        if "state_suffix" in inspect.signature(module.save_weight_visualizations).parameters:
            kwargs = {"state_suffix": state_suffix}
        else:
            kwargs = {}

        module.save_weight_visualizations(full_path, file_format, **kwargs)

    _call_save_viz(self.core, "weights_core")
    _call_save_viz(self.readout, "weights_readout")

update_model_data_info

update_model_data_info(data_info: dict[str, Any]) -> None

To update relevant model attributes when loading a (trained) model and training it with new data only.

Source code in openretina/models/core_readout.py

def update_model_data_info(self, data_info: dict[str, Any]) -> None:
    """To update relevant model attributes when loading a (trained) model and training it with new data only."""
    # update model.data_info and n_neurons_dict with the new data info
    for key in data_info.keys():
        if key == "input_shape":
            assert all(self.data_info[key][dim] == data_info[key][dim] for dim in range(len(data_info[key]))), (
                f"Input shapes don't match: model has {self.data_info[key]}, new data has {data_info[key]}"
            )
        else:
            self.data_info[key].update(data_info[key])

    # update saved hyperparameters (so that the model can be loaded from checkpoint correctly)
    if hasattr(self, "hparams"):
        self.hparams["n_neurons_dict"] = self.data_info["n_neurons_dict"]
        self.hparams["data_info"] = self.data_info

UnifiedCoreReadout

UnifiedCoreReadout(
    in_shape: Int[tuple, "channels time height width"],
    n_neurons_dict: dict[str, int],
    core: DictConfig,
    readout: DictConfig,
    hidden_channels: tuple[int, ...]
    | Iterable[int]
    | None = None,
    learning_rate: float = 0.001,
    loss: Module | DictConfig | None = None,
    validation_loss: Module | DictConfig | None = None,
    data_info: dict[str, Any] | None = None,
    optimizer: DictConfig | None = None,
    lr_scheduler: DictConfig | None = None,
)

Bases: BaseCoreReadout

A flexible core-readout model for multi-session neural data, designed for Hydra config workflows.

This class is the recommended entry point for defining core-readout models via config files using Hydra. It allows unified instantiation of arbitrary core and readout modules, specified via DictConfig, enabling rapid experimentation and extensibility. Supports all multi-session settings, custom core/readout combinations, and integration with configuration-driven pipelines (including hyperparameter optimization).

Initializes a UnifiedCoreReadout for multi-session configurable neural modeling via Hydra configs.

PARAMETER	DESCRIPTION
`in_shape`	Input shape as (channels, time, height, width) for the core module. TYPE: `tuple[int, int, int, int]`
`hidden_channels`	List of hidden channels for the core; used in core config initialization. TYPE: `Iterable[int]` DEFAULT: `None`
`n_neurons_dict`	Mapping from session/dataset identifier to neuron count for each session. TYPE: `dict[str, int]`
`core`	Hydra config for instantiating the core module (should specify class and params). TYPE: `DictConfig`
`readout`	Hydra config for the readout module (specifies type and custom session-aware params). TYPE: `DictConfig`
`learning_rate`	Learning rate for model training. Defaults to 0.001. TYPE: `float` DEFAULT: `0.001`
`loss`	Loss function for training. Defaults to PoissonLoss3d if None. TYPE: `Module` DEFAULT: `None`
`validation_loss`	Loss used to compute correlation performance metric. Defaults to CorrelationLoss3d(avg=True) if None. TYPE: `Module` DEFAULT: `None`
`data_info`	Additional metadata dictionary, e.g., with input shape and neuron mapping. TYPE: `dict[str, Any]` DEFAULT: `None`
`optimizer`	Hydra config for optimizer instantiation. If None, defaults to AdamW. TYPE: `DictConfig` DEFAULT: `None`
`lr_scheduler`	Hydra config for learning rate scheduler. If None, defaults to ReduceLROnPlateau. TYPE: `DictConfig` DEFAULT: `None`

Source code in openretina/models/core_readout.py

def __init__(
    self,
    in_shape: Int[tuple, "channels time height width"],
    n_neurons_dict: dict[str, int],
    core: DictConfig,
    readout: DictConfig,
    hidden_channels: tuple[int, ...] | Iterable[int] | None = None,
    learning_rate: float = 0.001,
    loss: nn.Module | DictConfig | None = None,
    validation_loss: nn.Module | DictConfig | None = None,
    data_info: dict[str, Any] | None = None,
    optimizer: DictConfig | None = None,
    lr_scheduler: DictConfig | None = None,
):
    """
    Initializes a UnifiedCoreReadout for multi-session configurable neural modeling via Hydra configs.

    Args:
        in_shape (tuple[int, int, int, int]):
            Input shape as (channels, time, height, width) for the core module.
        hidden_channels (Iterable[int]):
            List of hidden channels for the core; used in core config initialization.
        n_neurons_dict (dict[str, int]):
            Mapping from session/dataset identifier to neuron count for each session.
        core (DictConfig):
            Hydra config for instantiating the core module (should specify class and params).
        readout (DictConfig):
            Hydra config for the readout module (specifies type and custom session-aware params).
        learning_rate (float, optional):
            Learning rate for model training. Defaults to 0.001.
        loss (nn.Module, optional):
            Loss function for training. Defaults to PoissonLoss3d if None.
        validation_loss (nn.Module, optional):
            Loss used to compute correlation performance metric. Defaults to CorrelationLoss3d(avg=True) if None.
        data_info (dict[str, Any], optional):
            Additional metadata dictionary, e.g., with input shape and neuron mapping.
        optimizer (DictConfig, optional):
            Hydra config for optimizer instantiation. If None, defaults to AdamW.
        lr_scheduler (DictConfig, optional):
            Hydra config for learning rate scheduler. If None, defaults to ReduceLROnPlateau.
    """
    # Make sure in_shape and hidden_channels are a tuple
    # (with hydra configs they can be a `omegaconf.listconfig.ListConfig`).
    # This lead to an error when logging hyperparameters with the csv logger during training.
    in_shape = tuple(in_shape)
    if hidden_channels is not None:
        hidden_channels = tuple(hidden_channels)
        core.channels = (in_shape[0], *hidden_channels)

    core_module = hydra.utils.instantiate(
        core,
        n_neurons_dict=n_neurons_dict,
    )

    # determine input_shape of readout if it is not already present
    if "in_shape" not in readout:
        in_shape_readout = self.compute_readout_input_shape(in_shape, core_module)
        readout["in_shape"] = (in_shape_readout[0],) + tuple(in_shape_readout[1:])

    # Extract mean_activity_dict from data_info if available
    mean_activity_dict = None if data_info is None else data_info.get("mean_activity_dict")

    readout_module = hydra.utils.instantiate(
        readout,
        n_neurons_dict=n_neurons_dict,
        mean_activity_dict=mean_activity_dict,
    )

    if loss is not None and isinstance(loss, DictConfig):
        loss_module = hydra.utils.instantiate(loss)
    else:
        loss_module = loss

    if validation_loss is not None and isinstance(validation_loss, DictConfig):
        validation_loss_module = hydra.utils.instantiate(validation_loss)
    else:
        validation_loss_module = validation_loss

    # Store optimizer and scheduler configs for use in configure_optimizers
    self.optimizer_config = optimizer
    self.lr_scheduler_config = lr_scheduler

    super().__init__(
        core=core_module,
        readout=readout_module,
        learning_rate=learning_rate,
        loss=loss_module,
        validation_loss=validation_loss_module,
        data_info=data_info,
    )

configure_optimizers

configure_optimizers()

Configure optimizers and schedulers using Hydra configs.

This method overrides BaseCoreReadout.configure_optimizers() to use configurable optimizers and schedulers via the utility functions.

Source code in openretina/models/core_readout.py

def configure_optimizers(self):
    """
    Configure optimizers and schedulers using Hydra configs.

    This method overrides BaseCoreReadout.configure_optimizers() to use
    configurable optimizers and schedulers via the utility functions.
    """

    # Instantiate optimizer using utility function
    optimizer = instantiate_optimizer(
        self.optimizer_config,
        self.parameters(),
        self.learning_rate,
    )

    # Instantiate scheduler using utility function
    scheduler_dict = instantiate_scheduler(
        self.lr_scheduler_config,
        optimizer,
        self.learning_rate,
        trainer=getattr(self, "trainer", None),
    )

    return {
        "optimizer": optimizer,
        "lr_scheduler": scheduler_dict,
    }

ExampleCoreReadout

ExampleCoreReadout(
    in_shape: Int[tuple, "channels time height width"],
    hidden_channels: Iterable[int],
    temporal_kernel_sizes: Iterable[int],
    spatial_kernel_sizes: Iterable[int],
    n_neurons_dict: dict[str, int],
    core_gamma_input: float = 0.0,
    core_gamma_hidden: float = 0.0,
    core_gamma_in_sparse: float = 0.0,
    core_gamma_temporal: float = 40.0,
    core_input_padding: bool
    | str
    | int
    | tuple[int, int, int] = False,
    core_hidden_padding: bool
    | str
    | int
    | tuple[int, int, int] = True,
    readout_scale: bool = True,
    readout_bias: bool = True,
    readout_gaussian_masks: bool = True,
    readout_gaussian_mean_scale: float = 6.0,
    readout_gaussian_var_scale: float = 4.0,
    readout_positive: bool = True,
    readout_gamma: float = 0.4,
    readout_gamma_masks: float = 0.0,
    readout_reg_avg: bool = False,
    learning_rate: float = 0.01,
    cut_first_n_frames_in_core: int = 30,
    dropout_rate: float = 0.0,
    maxpool_every_n_layers: Optional[int] = None,
    downsample_input_kernel_size: Optional[
        tuple[int, int, int]
    ] = None,
    convolution_type: str = "custom_separable",
    color_squashing_weights: tuple[float, ...]
    | None = None,
    data_info: dict[str, Any] | None = None,
)

Bases: BaseCoreReadout

Example implementation of a custom Core-Readout model, using a convolutional core and a Gaussian readout.

This class serves as a guide for constructing custom Core-Readout models without using the unified Hydra configuration system and the UnifiedCoreReadout class. Use this model as a reference if you wish to instantiate or design core/readout units directly in code rather than through configuration files. For most workflows, especially those using Hydra, UnifiedCoreReadout is preferred for maximum flexibility.

N.B., this class is provided as a reference example.

Source code in openretina/models/core_readout.py

def __init__(
    self,
    in_shape: Int[tuple, "channels time height width"],
    hidden_channels: Iterable[int],
    temporal_kernel_sizes: Iterable[int],
    spatial_kernel_sizes: Iterable[int],
    n_neurons_dict: dict[str, int],
    core_gamma_input: float = 0.0,
    core_gamma_hidden: float = 0.0,
    core_gamma_in_sparse: float = 0.0,
    core_gamma_temporal: float = 40.0,
    core_input_padding: bool | str | int | tuple[int, int, int] = False,
    core_hidden_padding: bool | str | int | tuple[int, int, int] = True,
    readout_scale: bool = True,
    readout_bias: bool = True,
    readout_gaussian_masks: bool = True,
    readout_gaussian_mean_scale: float = 6.0,
    readout_gaussian_var_scale: float = 4.0,
    readout_positive: bool = True,
    readout_gamma: float = 0.4,
    readout_gamma_masks: float = 0.0,
    readout_reg_avg: bool = False,
    learning_rate: float = 0.01,
    cut_first_n_frames_in_core: int = 30,
    dropout_rate: float = 0.0,
    maxpool_every_n_layers: Optional[int] = None,
    downsample_input_kernel_size: Optional[tuple[int, int, int]] = None,
    convolution_type: str = "custom_separable",
    color_squashing_weights: tuple[float, ...] | None = None,
    data_info: dict[str, Any] | None = None,
):
    warnings.warn(
        "You are using ExampleCoreReadout, which is intended as a reference/example class for custom "
        "core-readout model implementations. For most configuration-driven workflows, especially if you "
        "use Hydra, consider using UnifiedCoreReadout instead, or writing your own class that inherits "
        "from BaseCoreReadout.",
        UserWarning,
        stacklevel=2,
    )
    core = SimpleCoreWrapper(
        channels=(in_shape[0], *hidden_channels),
        temporal_kernel_sizes=tuple(temporal_kernel_sizes),
        spatial_kernel_sizes=tuple(spatial_kernel_sizes),
        gamma_input=core_gamma_input,
        gamma_temporal=core_gamma_temporal,
        gamma_in_sparse=core_gamma_in_sparse,
        gamma_hidden=core_gamma_hidden,
        cut_first_n_frames=cut_first_n_frames_in_core,
        dropout_rate=dropout_rate,
        maxpool_every_n_layers=maxpool_every_n_layers,
        downsample_input_kernel_size=downsample_input_kernel_size,
        input_padding=core_input_padding,
        color_squashing_weights=color_squashing_weights,
        hidden_padding=core_hidden_padding,
        convolution_type=convolution_type,
    )

    # Run one forward pass to determine output shape of core
    in_shape_readout = self.compute_readout_input_shape(in_shape, core)
    LOGGER.info(f"{in_shape_readout=}")

    readout = MultiGaussianMaskReadout(
        in_shape_readout,
        n_neurons_dict,
        readout_scale,
        readout_bias,
        readout_gaussian_mean_scale,
        readout_gaussian_var_scale,
        readout_positive,
        readout_gamma,
        readout_gamma_masks,
        readout_reg_avg,
    )

    super().__init__(core=core, readout=readout, learning_rate=learning_rate, data_info=data_info)

on_load_checkpoint

on_load_checkpoint(checkpoint) -> None

To support legacy models that use bias_param instead of bias in their readout layers.

Source code in openretina/models/core_readout.py

def on_load_checkpoint(self, checkpoint) -> None:
    """To support legacy models that use `bias_param` instead of `bias` in their readout layers."""
    state_dict = checkpoint["state_dict"]

    readout_bias_keys = [k for k in state_dict.keys() if k.startswith("readout.") and k.endswith(".bias_param")]
    for key in readout_bias_keys:
        new_key = key.removesuffix(".bias_param") + ".bias"
        state_dict[new_key] = state_dict.pop(key)
    if len(readout_bias_keys) > 0:
        LOGGER.warning(f"Renamed the following readout bias keys: {readout_bias_keys}")

load_core_readout_from_remote

load_core_readout_from_remote(
    model_name: str,
    device: str,
    cache_directory_path: str | PathLike | None = None,
) -> BaseCoreReadout

Download and load a pre-trained core-readout model by name. Falls back to legacy ExampleCoreReadout format.

Source code in openretina/models/core_readout.py

def load_core_readout_from_remote(
    model_name: str,
    device: str,
    cache_directory_path: str | os.PathLike | None = None,
) -> BaseCoreReadout:
    """Download and load a pre-trained core-readout model by name. Falls back to legacy ExampleCoreReadout format."""
    if cache_directory_path is None:
        cache_directory_path = get_cache_directory()
    if model_name not in _MODEL_NAME_TO_REMOTE_LOCATION:
        raise ValueError(
            f"Model name {model_name} not supported for download yet. "
            f"The following names are supported: {sorted(_MODEL_NAME_TO_REMOTE_LOCATION.keys())}"
        )
    remote_path = _MODEL_NAME_TO_REMOTE_LOCATION[model_name]
    local_path = get_local_file_path(remote_path, cache_directory_path)
    try:
        return UnifiedCoreReadout.load_from_checkpoint(local_path, map_location=device)
    except:  # noqa: E722
        # Support for legacy ExampleCoreReadout model
        return ExampleCoreReadout.load_from_checkpoint(local_path, map_location=device)

load_core_readout_model

load_core_readout_model(
    model_path_or_name: str,
    device: str,
    cache_directory_path: str | PathLike | None = None,
) -> BaseCoreReadout

Load a core-readout model from a local path or remote name. Tries known remote names first, then local paths.

Source code in openretina/models/core_readout.py

def load_core_readout_model(
    model_path_or_name: str,
    device: str,
    cache_directory_path: str | os.PathLike | None = None,
) -> BaseCoreReadout:
    """Load a core-readout model from a local path or remote name. Tries known remote names first, then local paths."""
    if cache_directory_path is None:
        cache_directory_path = get_cache_directory()
    if model_path_or_name in _MODEL_NAME_TO_REMOTE_LOCATION:
        return load_core_readout_from_remote(model_path_or_name, device)

    local_path = get_local_file_path(model_path_or_name, cache_directory_path)
    try:
        return UnifiedCoreReadout.load_from_checkpoint(local_path, map_location=device)
    except:  # noqa: E722
        # Support for legacy ExampleCoreReadout model
        return ExampleCoreReadout.load_from_checkpoint(local_path, map_location=device)

Core-Readout Models — Full Module

BaseCoreReadout

pretrained_cfg property

save_weight_visualizations

update_model_data_info

UnifiedCoreReadout

configure_optimizers

ExampleCoreReadout

on_load_checkpoint

load_core_readout_from_remote

load_core_readout_model

pretrained_cfg `property`