Maheswaranathan et al. 2023 Dataset

Primate and mouse retinal ganglion cell responses to natural scenes, originally published in Maheswaranathan et al. (2023): Interpreting the retinal neural code for natural scenes: From computations to neurons, Neuron.

Dataset: purl.stanford.edu/rk663dm5577

Stimuli

stimuli

Minimal stimulus loading utilities to train a model on the data used in Maheswaranathan et al. 2023

Paper: https://doi.org/10.1016/j.neuron.2023.06.007 Data: https://doi.org/10.25740/rk663dm5577

OpenRetina provides a mirror of the dataset on huggingface: https://huggingface.co/datasets/open-retina/open-retina/resolve/main/baccus_lab/maheswaranathan_2023/neural_code_data.zip

load_all_stimuli

load_all_stimuli(
    base_data_path: str | PathLike,
    stim_type: Literal[
        "naturalscene", "whitenoise"
    ] = "naturalscene",
    normalize_stimuli: bool = True,
) -> dict[str, MoviesTrainTestSplit]

Load all stimuli from sessions within subfolders in a given base data path.

The base data path should point to the location of the neural_code_data folder. (See https://doi.org/10.25740/rk663dm5577 for dataset download).

Alternatively, base_data_path can point directly to our huggingface mirror of the dataset, which will then be downloaded and extracted automatically to the openretina cache directory. https://huggingface.co/datasets/open-retina/open-retina/resolve/main/baccus_lab/maheswaranathan_2023/neural_code_data.zip

Source code in openretina/data_io/maheswaranathan_2023/stimuli.py

def load_all_stimuli(
    base_data_path: str | os.PathLike,
    stim_type: Literal["naturalscene", "whitenoise"] = "naturalscene",
    normalize_stimuli: bool = True,
) -> dict[str, MoviesTrainTestSplit]:
    """
    Collect the train/test stimulus movies of every session found below a base data path.

    `base_data_path` is expected to be the location of the `neural_code_data` folder
    (see https://doi.org/10.25740/rk663dm5577 for the dataset download).

    Alternatively, base_data_path can point directly to our huggingface mirror of the dataset, which will then
    be downloaded and extracted automatically to the openretina cache directory.
    https://huggingface.co/datasets/open-retina/open-retina/resolve/main/baccus_lab/maheswaranathan_2023/neural_code_data.zip

    Args:
        base_data_path: Location of the dataset; resolved through `get_local_file_path`.
        stim_type: Only recording files whose name ends in `{stim_type}.h5` are loaded.
        normalize_stimuli: If True, the movies are passed through `normalize_train_test_movies` and the
            returned statistics are stored with them. If False, the movies are kept as loaded and the
            stored statistics are None.

    Returns:
        A dictionary mapping each session folder name to its `MoviesTrainTestSplit`.
    """
    # Resolve data path
    local_root = get_local_file_path(str(base_data_path))
    sessions_root = os.path.join(local_root, "ganglion_cell_data")
    wanted_suffix = f"{stim_type}.h5"

    # Every sub-directory of the sessions root is treated as one recording session
    session_names = [entry.name for entry in os.scandir(os.fspath(sessions_root)) if entry.is_dir()]

    movies_by_session = {}
    for session_name in session_names:
        session_dir = os.path.normpath(os.path.join(sessions_root, session_name))

        for file_name in os.listdir(session_dir):
            # Skip everything that is not a recording of the requested stimulus type
            if not str(file_name).endswith(wanted_suffix):
                continue

            recording_file = os.path.join(session_dir, file_name)
            print(f"Loading stimuli from {recording_file}")

            # Load video stimuli and prepend the channel dimension
            train_movie = load_dataset_from_h5(recording_file, "/train/stimulus")[None, ...]
            test_movie = load_dataset_from_h5(recording_file, "/test/stimulus")[None, ...]

            if normalize_stimuli:
                train_movie, test_movie, stats = normalize_train_test_movies(train_movie, test_movie)
                mean_used, std_used = stats["norm_mean"], stats["norm_std"]
            else:
                mean_used, std_used = None, None

            movies_by_session[str(session_name)] = MoviesTrainTestSplit(
                train=train_movie,
                test=test_movie,
                stim_id=stim_type,
                random_sequences=None,
                norm_mean=mean_used,
                norm_std=std_used,
            )

    return movies_by_session

Responses

responses

Minimal responses loading utilities to train a model on the data used in Maheswaranathan et al. 2023

Paper: https://doi.org/10.1016/j.neuron.2023.06.007 Data: https://doi.org/10.25740/rk663dm5577

OpenRetina provides a mirror of the dataset on huggingface: https://huggingface.co/datasets/open-retina/open-retina/resolve/main/baccus_lab/maheswaranathan_2023/neural_code_data.zip

load_test_repeats_for_session

load_test_repeats_for_session(
    session_path: str | PathLike,
    response_type: Literal[
        "firing_rate_5ms",
        "firing_rate_10ms",
        "firing_rate_20ms",
    ] = "firing_rate_20ms",
    fr_normalization: float = 1,
) -> Float[ndarray, "repeats neurons test_time"]

Load test response repeats for a single session.

Source code in openretina/data_io/maheswaranathan_2023/responses.py

def load_test_repeats_for_session(
    session_path: str | os.PathLike,
    response_type: Literal["firing_rate_5ms", "firing_rate_10ms", "firing_rate_20ms"] = "firing_rate_20ms",
    fr_normalization: float = 1,
) -> Float[np.ndarray, "repeats neurons test_time"]:
    """
    Load test response repeats for a single session.

    Args:
        session_path: Path to the h5 recording file of the session; it is opened read-only.
        response_type: Name of the dataset looked up under `test/repeats`.
        fr_normalization: Divisor applied to the loaded repeats. It is applied regardless of which of the
            two file layouts is encountered, so the result is scaled the same way in both cases.

    Returns:
        The test repeats arranged as (repeats, neurons, time), divided by `fr_normalization`.
    """

    with h5py.File(session_path, "r") as f:
        repeats_group = f["test/repeats"]
        # There are two possible ways in which the files can be structured

        # 1. Repeats are saved with different response types
        if response_type in repeats_group.keys():
            stacked_repeats: Float[np.ndarray, "repeats neurons time"] = repeats_group[response_type][...]  # type: ignore
        # 2. Repeats are saved with only one response type, by cell id
        else:
            # Order the per-cell datasets by the integer that follows "cell" in their name
            cell_ids = sorted(
                (key for key in repeats_group.keys() if "cell" in key),
                key=lambda x: int(x.split("cell")[-1]),
            )
            per_cell = np.stack([repeats_group[cell_id][...] for cell_id in cell_ids], axis=0)  # type: ignore

            stacked_repeats = rearrange(per_cell, "neurons repeats time -> repeats neurons time")

    # Normalise once, after either branch, so both file layouts return identically scaled data
    return stacked_repeats / fr_normalization

load_all_responses

load_all_responses(
    base_data_path: str | PathLike,
    response_type: Literal[
        "firing_rate_5ms",
        "firing_rate_10ms",
        "firing_rate_20ms",
    ] = "firing_rate_20ms",
    stim_type: Literal[
        "naturalscene", "whitenoise"
    ] = "naturalscene",
    fr_normalization: float = 1,
) -> dict[str, ResponsesTrainTestSplit]

Load all neural responses from sessions within subfolders in a given base data path.

The base data path should point to the location of the neural_code_data folder. (See https://doi.org/10.25740/rk663dm5577 for dataset download).

Alternatively, base_data_path can point directly to our huggingface mirror of the dataset, which will then be downloaded and extracted automatically to the openretina cache directory. https://huggingface.co/datasets/open-retina/open-retina/resolve/main/baccus_lab/maheswaranathan_2023/neural_code_data.zip

Source code in openretina/data_io/maheswaranathan_2023/responses.py

def load_all_responses(
    base_data_path: str | os.PathLike,
    response_type: Literal["firing_rate_5ms", "firing_rate_10ms", "firing_rate_20ms"] = "firing_rate_20ms",
    stim_type: Literal["naturalscene", "whitenoise"] = "naturalscene",
    fr_normalization: float = 1,
) -> dict[str, ResponsesTrainTestSplit]:
    """
    Collect the train/test neural responses of every session found below a base data path.

    `base_data_path` is expected to be the location of the `neural_code_data` folder
    (see https://doi.org/10.25740/rk663dm5577 for the dataset download).

    Alternatively, base_data_path can point directly to our huggingface mirror of the dataset, which will then
    be downloaded and extracted automatically to the openretina cache directory.
    https://huggingface.co/datasets/open-retina/open-retina/resolve/main/baccus_lab/maheswaranathan_2023/neural_code_data.zip

    Args:
        base_data_path: Location of the dataset; resolved through `get_local_file_path`.
        response_type: Name of the response dataset read from `/train/response/` and `/test/response/`.
        stim_type: Only recording files whose name ends in `{stim_type}.h5` are loaded.
        fr_normalization: Divisor applied to the train and test responses; also forwarded to
            `load_test_repeats_for_session` for the per-trial test responses.

    Returns:
        A dictionary mapping each session folder name to its `ResponsesTrainTestSplit`.
    """
    # Resolve data path
    local_root = get_local_file_path(str(base_data_path))
    sessions_root = os.path.join(local_root, "ganglion_cell_data")
    wanted_suffix = f"{stim_type}.h5"

    # Every sub-directory of the sessions root is treated as one recording session
    session_names = [entry.name for entry in os.scandir(os.fspath(sessions_root)) if entry.is_dir()]

    responses_by_session = {}
    for session_name in session_names:
        session_dir = os.path.join(sessions_root, session_name)

        for file_name in os.listdir(session_dir):
            # Skip everything that is not a recording of the requested stimulus type
            if not str(file_name).endswith(wanted_suffix):
                continue

            recording_file = os.path.join(session_dir, file_name)
            print(f"Loading responses from {recording_file}")

            # Load neural responses
            train_responses = load_dataset_from_h5(recording_file, f"/train/response/{response_type}")
            test_responses = load_dataset_from_h5(recording_file, f"/test/response/{response_type}")

            # The first axis of both arrays is compared as the neuron count
            assert train_responses.shape[0] == test_responses.shape[0], (
                "Train and test responses should have the same number of neurons."
            )

            scaled_train = train_responses / fr_normalization
            scaled_test = test_responses / fr_normalization
            repeats = load_test_repeats_for_session(recording_file, response_type, fr_normalization)

            responses_by_session[str(session_name)] = ResponsesTrainTestSplit(
                train=scaled_train,
                test=scaled_test,
                stim_id=stim_type,
                test_by_trial=repeats,
            )

    return responses_by_session