From 2a82314b5c0ee5e7e1f8b996dacef6291bb1b7b6 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 10:37:16 -0500
Subject: [PATCH 001/104] Copy hssm.py to prepare for base class extraction

---
 src/hssm/hssmbase_temp.py | 2299 +++++++++++++++++++++++++++++++++++++
 1 file changed, 2299 insertions(+)
 create mode 100644 src/hssm/hssmbase_temp.py

diff --git a/src/hssm/hssmbase_temp.py b/src/hssm/hssmbase_temp.py
new file mode 100644
index 000000000..5906c6eac
--- /dev/null
+++ b/src/hssm/hssmbase_temp.py
@@ -0,0 +1,2299 @@
+"""HSSM: Hierarchical Sequential Sampling Models.
+
+A package based on pymc and bambi to perform Bayesian inference for hierarchical
+sequential sampling models.
+
+This file defines the entry class HSSM.
+"""
+
+import datetime
+import logging
+import typing
+from copy import deepcopy
+from inspect import isclass, signature
+from os import PathLike
+from pathlib import Path
+from typing import Any, Callable, Literal, Optional, Union, cast, get_args
+
+import arviz as az
+import bambi as bmb
+import cloudpickle as cpickle
+import matplotlib as mpl
+import matplotlib.pyplot as plt
+import numpy as np
+import pandas as pd
+import pymc as pm
+import pytensor
+import seaborn as sns
+import xarray as xr
+from bambi.model_components import DistributionalComponent
+from bambi.transformations import transformations_namespace
+from pymc.model.transform.conditioning import do
+from ssms.config import model_config as ssms_model_config
+
+from hssm._types import LoglikKind, SupportedModels
+from hssm.data_validator import DataValidator
+from hssm.defaults import (
+    INITVAL_JITTER_SETTINGS,
+    INITVAL_SETTINGS,
+    MissingDataNetwork,
+    missing_data_networks_suffix,
+)
+from hssm.distribution_utils import (
+    assemble_callables,
+    make_distribution,
+    make_family,
+    make_likelihood_callable,
+    make_missing_data_callable,
+)
+from hssm.utils import (
+    _compute_log_likelihood,
+    _get_alias_dict,
+    _print_prior,
+    _rearrange_data,
+    _split_array,
+)
+
+from . import plotting
+from .config import Config, ModelConfig
+from .param import Params
+from .param import UserParam as Param
+
+_logger = logging.getLogger("hssm")
+
+# NOTE: Temporary mapping from old sampler names to new ones in bambi 0.16.0
+_new_sampler_mapping: dict[str, Literal["pymc", "numpyro", "blackjax"]] = {
+    "mcmc": "pymc",
+    "nuts_numpyro": "numpyro",
+    "nuts_blackjax": "blackjax",
+}
+
+
+class classproperty:
+    """A decorator that combines the behavior of @property and @classmethod.
+
+    This decorator allows you to define a property that can be accessed on the class
+    itself, rather than on instances of the class. It is useful for defining class-level
+    properties that need to perform some computation or access class-level data.
+
+    This implementation is provided for compatibility with Python versions 3.10 through
+    3.12, as one cannot combine the @property and @classmethod decorators is across all
+    these versions.
+
+    Example
+    -------
+    class MyClass:
+        @classproperty
+        def my_class_property(cls):
+            return "This is a class property"
+
+    print(MyClass.my_class_property)  # Output: This is a class property
+    """
+
+    def __init__(self, fget):
+        self.fget = fget
+
+    def __get__(self, instance, owner):  # noqa: D105
+        return self.fget(owner)
+
+
+class HSSM(DataValidator):
+    """The basic Hierarchical Sequential Sampling Model (HSSM) class.
+
+    Parameters
+    ----------
+    data
+        A pandas DataFrame with the minimum requirements of containing the data with the
+        columns "rt" and "response".
+    model
+        The name of the model to use. Currently supported models are "ddm", "ddm_sdv",
+        "full_ddm", "angle", "levy", "ornstein", "weibull", "race_no_bias_angle_4",
+        "ddm_seq2_no_bias". If any other string is passed, the model will be considered
+        custom, in which case all `model_config`, `loglik`, and `loglik_kind` have to be
+        provided by the user.
+    choices : optional
+        When an `int`, the number of choices that the participants can make. If `2`, the
+        choices are [-1, 1] by default. If anything greater than `2`, the choices are
+        [0, 1, ..., n_choices - 1] by default. If a `list` is provided, it should be the
+        list of choices that the participants can make. Defaults to `2`. If any value
+        other than the choices provided is found in the "response" column of the data,
+        an error will be raised.
+    include : optional
+        A list of dictionaries specifying parameter specifications to include in the
+        model. If left unspecified, defaults will be used for all parameter
+        specifications. Defaults to None.
+    model_config : optional
+        A dictionary containing the model configuration information. If None is
+        provided, defaults will be used if there are any. Defaults to None.
+        Fields for this `dict` are usually:
+
+        - `"list_params"`: a list of parameters indicating the parameters of the model.
+            The order in which the parameters are specified in this list is important.
+            Values for each parameter will be passed to the likelihood function in this
+            order.
+        - `"backend"`: Only used when `loglik_kind` is `approx_differentiable` and
+            an onnx file is supplied for the likelihood approximation network (LAN).
+            Valid values are `"jax"` or `"pytensor"`. It determines whether the LAN in
+            ONNX should be converted to `"jax"` or `"pytensor"`. If not provided,
+            `jax` will be used for maximum performance.
+        - `"default_priors"`: A `dict` indicating the default priors for each parameter.
+        - `"bounds"`: A `dict` indicating the boundaries for each parameter. In the case
+            of LAN, these bounds are training boundaries.
+        - `"rv"`: Optional. Can be a `RandomVariable` class containing the user's own
+            `rng_fn` function for sampling from the distribution that the user is
+            supplying. If not supplied, HSSM will automatically generate a
+            `RandomVariable` using the simulator identified by `model` from the
+            `ssm_simulators` package. If `model` is not supported in `ssm_simulators`,
+            a warning will be raised letting the user know that sampling from the
+            `RandomVariable` will result in errors.
+        - `"extra_fields"`: Optional. A list of strings indicating the additional
+            columns in `data` that will be passed to the likelihood function for
+            calculation. This is helpful if the likelihood function depends on data
+            other than the observed data and the parameter values.
+    loglik : optional
+        A likelihood function. Defaults to None. Requirements are:
+
+        1. if `loglik_kind` is `"analytical"` or `"blackbox"`, a pm.Distribution, a
+           pytensor Op, or a Python callable can be used. Signatures are:
+            - `pm.Distribution`: needs to have parameters specified exactly as listed in
+            `list_params`
+            - `pytensor.graph.Op` and `Callable`: needs to accept the parameters
+            specified exactly as listed in `list_params`
+        2. If `loglik_kind` is `"approx_differentiable"`, then in addition to the
+            specifications above, a `str` or `Pathlike` can also be used to specify a
+            path to an `onnx` file. If a `str` is provided, HSSM will first look locally
+            for an `onnx` file. If that is not successful, HSSM will try to download
+            that `onnx` file from Hugging Face hub.
+        3. It can also be `None`, in which case a default likelihood function will be
+            used
+    loglik_kind : optional
+        A string that specifies the kind of log-likelihood function specified with
+        `loglik`. Defaults to `None`. Can be one of the following:
+
+        - `"analytical"`: an analytical (approximation) likelihood function. It is
+            differentiable and can be used with samplers that requires differentiation.
+        - `"approx_differentiable"`: a likelihood approximation network (LAN) likelihood
+            function. It is differentiable and can be used with samplers that requires
+            differentiation.
+        - `"blackbox"`: a black box likelihood function. It is typically NOT
+            differentiable.
+        - `None`, in which a default will be used. For `ddm` type of models, the default
+            will be `analytical`. For other models supported, it will be
+            `approx_differentiable`. If the model is a custom one, a ValueError
+            will be raised.
+    p_outlier : optional
+        The fixed lapse probability or the prior distribution of the lapse probability.
+        Defaults to a fixed value of 0.05. When `None`, the lapse probability will not
+        be included in estimation.
+    lapse : optional
+        The lapse distribution. This argument is required only if `p_outlier` is not
+        `None`. Defaults to Uniform(0.0, 10.0).
+    global_formula : optional
+        A string that specifies a regressions formula which will be used for all model
+        parameters. If you specify parameter-wise regressions in addition, these will
+        override the global regression for the respective parameter.
+    link_settings : optional
+        An optional string literal that indicates the link functions to use for each
+        parameter. Helpful for hierarchical models where sampling might get stuck/
+        very slow. Can be one of the following:
+
+        - `"log_logit"`: applies log link functions to positive parameters and
+        generalized logit link functions to parameters that have explicit bounds.
+        - `None`: unless otherwise specified, the `"identity"` link functions will be
+        used.
+        The default value is `None`.
+    prior_settings : optional
+        An optional string literal that indicates the prior distributions to use for
+        each parameter. Helpful for hierarchical models where sampling might get stuck/
+        very slow. Can be one of the following:
+
+        - `"safe"`: HSSM will scan all parameters in the model and apply safe priors to
+        all parameters that do not have explicit bounds.
+        - None: HSSM will use bambi to provide default priors for all parameters. Not
+        recommended when you are using hierarchical models.
+        The default value is `"safe"`.
+    extra_namespace : optional
+        Additional user supplied variables with transformations or data to include in
+        the environment where the formula is evaluated. Defaults to `None`.
+    missing_data : optional
+        Specifies whether the model should handle missing data. Can be a `bool` or a
+        `float`. If `False`, and if the `rt` column contains in the data -999.0,
+        the model will drop these rows and produce a warning. If `True`, the model will
+        treat code -999.0 as missing data. If a `float` is provided, the model will
+        treat this value as the missing data value. Defaults to `False`.
+    deadline : optional
+        Specifies whether the model should handle deadline data. Can be a `bool` or a
+        `str`. If `False`, the model will not do nothing even if a deadline column is
+        provided. If `True`, the model will treat the `deadline` column as deadline
+        data. If a `str` is provided, the model will treat this value as the name of the
+        deadline column. Defaults to `False`.
+    loglik_missing_data : optional
+        A likelihood function for missing data. Please see the `loglik` parameter to see
+        how to specify the likelihood function this parameter. If nothing is provided,
+        a default likelihood function will be used. This parameter is required only if
+        either `missing_data` or `deadline` is not `False`. Defaults to `None`.
+    process_initvals : optional
+        If `True`, the model will process the initial values. Defaults to `True`.
+    initval_jitter : optional
+        The jitter value for the initial values. Defaults to `0.01`.
+    **kwargs
+        Additional arguments passed to the `bmb.Model` object.
+
+    Attributes
+    ----------
+    data
+        A pandas DataFrame with at least two columns of "rt" and "response" indicating
+        the response time and responses.
+    list_params
+        The list of strs of parameter names.
+    model_name
+        The name of the model.
+    loglik:
+        The likelihood function or a path to an onnx file.
+    loglik_kind:
+        The kind of likelihood used.
+    model_config
+        A dictionary representing the model configuration.
+    model_distribution
+        The likelihood function of the model in the form of a pm.Distribution subclass.
+    family
+        A Bambi family object.
+    priors
+        A dictionary containing the prior distribution of parameters.
+    formula
+        A string representing the model formula.
+    link
+        A string or a dictionary representing the link functions for all parameters.
+    params
+        A list of Param objects representing model parameters.
+    initval_jitter
+        The jitter value for the initial values.
+    """
+
+    def __init__(
+        self,
+        data: pd.DataFrame,
+        model: SupportedModels | str = "ddm",
+        choices: list[int] | None = None,
+        include: list[dict[str, Any] | Param] | None = None,
+        model_config: ModelConfig | dict | None = None,
+        loglik: (
+            str | PathLike | Callable | pytensor.graph.Op | type[pm.Distribution] | None
+        ) = None,
+        loglik_kind: LoglikKind | None = None,
+        p_outlier: float | dict | bmb.Prior | None = 0.05,
+        lapse: dict | bmb.Prior | None = bmb.Prior("Uniform", lower=0.0, upper=20.0),
+        global_formula: str | None = None,
+        link_settings: Literal["log_logit"] | None = None,
+        prior_settings: Literal["safe"] | None = "safe",
+        extra_namespace: dict[str, Any] | None = None,
+        missing_data: bool | float = False,
+        deadline: bool | str = False,
+        loglik_missing_data: (
+            str | PathLike | Callable | pytensor.graph.Op | None
+        ) = None,
+        process_initvals: bool = True,
+        initval_jitter: float = INITVAL_JITTER_SETTINGS["jitter_epsilon"],
+        **kwargs,
+    ):
+        # Attach arguments to the instance
+        # so that we can easily define some
+        # methods that need to access these
+        # arguments (context: pickling / save - load).
+
+        # Define a dict with all call arguments:
+        self._init_args = {
+            k: v for k, v in locals().items() if k not in ["self", "kwargs"]
+        }
+        if kwargs:
+            self._init_args.update(kwargs)
+
+        self.data = data.copy()
+        self._inference_obj: az.InferenceData | None = None
+        self._initvals: dict[str, Any] = {}
+        self.initval_jitter = initval_jitter
+        self._inference_obj_vi: pm.Approximation | None = None
+        self._vi_approx = None
+        self._map_dict = None
+        self.global_formula = global_formula
+
+        self.link_settings = link_settings
+        self.prior_settings = prior_settings
+
+        self.missing_data_value = -999.0
+
+        additional_namespace = transformations_namespace.copy()
+        if extra_namespace is not None:
+            additional_namespace.update(extra_namespace)
+        self.additional_namespace = additional_namespace
+
+        # Construct a model_config from defaults
+        self.model_config = Config.from_defaults(model, loglik_kind)
+        # Update defaults with user-provided config, if any
+        if model_config is not None:
+            if isinstance(model_config, dict):
+                if "choices" not in model_config:
+                    if choices is not None:
+                        model_config["choices"] = choices
+                else:
+                    if choices is not None:
+                        _logger.info(
+                            "choices list provided in both model_config and "
+                            "as an argument directly."
+                            " Using the one provided in model_config. \n"
+                            "We recommend providing choices in model_config."
+                        )
+            elif isinstance(model_config, ModelConfig):
+                if model_config.choices is None:
+                    if choices is not None:
+                        model_config.choices = choices
+                else:
+                    if choices is not None:
+                        _logger.info(
+                            "choices list provided in both model_config and "
+                            "as an argument directly."
+                            " Using the one provided in model_config. \n"
+                            "We recommend providing choices in model_config."
+                        )
+
+            self.model_config.update_config(
+                model_config
+                if isinstance(model_config, ModelConfig)
+                else ModelConfig(**model_config)  # also serves as dict validation
+            )
+        else:
+            # Model config is not provided, but at this point was constructed from
+            # defaults.
+            if model not in typing.get_args(SupportedModels):
+                # TODO: ideally use self.supported_models above but mypy doesn't like it
+                if choices is not None:
+                    self.model_config.update_choices(choices)
+                elif model in ssms_model_config:
+                    self.model_config.update_choices(
+                        ssms_model_config[model]["choices"]
+                    )
+                    _logger.info(
+                        "choices argument passed as None, "
+                        "but found %s in ssms-simulators. "
+                        "Using choices, from ssm-simulators configs: %s",
+                        model,
+                        ssms_model_config[model]["choices"],
+                    )
+            else:
+                # Model config already constructed from defaults, and model string is
+                # in SupportedModels. So we are guaranteed that choices are in
+                # self.model_config already.
+
+                if choices is not None:
+                    _logger.info(
+                        "Model string is in SupportedModels."
+                        " Ignoring choices arguments."
+                    )
+
+        # Update loglik with user-provided value
+        self.model_config.update_loglik(loglik)
+        # Ensure that all required fields are valid
+        self.model_config.validate()
+
+        # Set up shortcuts so old code will work
+        self.response = self.model_config.response
+        self.list_params = self.model_config.list_params
+        self.choices = self.model_config.choices
+        self.model_name = self.model_config.model_name
+        self.loglik = self.model_config.loglik
+        self.loglik_kind = self.model_config.loglik_kind
+        self.extra_fields = self.model_config.extra_fields
+
+        if self.choices is None:
+            raise ValueError(
+                "`choices` must be provided either in `model_config` or as an argument."
+            )
+
+        self.n_choices = len(self.choices)
+        self._pre_check_data_sanity()
+
+        # Process missing data setting
+        # AF-TODO: Could be a function in data validator?
+        if isinstance(missing_data, float):
+            if not ((self.data.rt == missing_data).any()):
+                raise ValueError(
+                    f"missing_data argument is provided as a float {missing_data}, "
+                    f"However, you have no RTs of {missing_data} in your dataset!"
+                )
+            else:
+                self.missing_data = True
+                self.missing_data_value = missing_data
+        elif isinstance(missing_data, bool):
+            if missing_data and (not (self.data.rt == -999.0).any()):
+                raise ValueError(
+                    "missing_data argument is provided as True, "
+                    " so RTs of -999.0 are treated as missing. \n"
+                    "However, you have no RTs of -999.0 in your dataset!"
+                )
+            elif (not missing_data) and (self.data.rt == -999.0).any():
+                # self.missing_data = True
+                raise ValueError(
+                    "Missing data provided as False. \n"
+                    "However, you have RTs of -999.0 in your dataset!"
+                )
+            else:
+                self.missing_data = missing_data
+        else:
+            raise ValueError(
+                "missing_data argument must be a bool or a float! \n"
+                f"You provided: {type(missing_data)}"
+            )
+
+        if isinstance(deadline, str):
+            self.deadline = True
+            self.deadline_name = deadline
+        else:
+            self.deadline = deadline
+            self.deadline_name = "deadline"
+
+        if (
+            not self.missing_data and not self.deadline
+        ) and loglik_missing_data is not None:
+            raise ValueError(
+                "You have specified a loglik_missing_data function, but you have not "
+                + "set the missing_data or deadline flag to True."
+            )
+        self.loglik_missing_data = loglik_missing_data
+
+        # Update data based on missing_data and deadline
+        self._handle_missing_data_and_deadline()
+        # Set self.missing_data_network based on `missing_data` and `deadline`
+        self.missing_data_network = self._set_missing_data_and_deadline(
+            self.missing_data, self.deadline, self.data
+        )
+
+        if self.deadline:
+            self.response.append(self.deadline_name)
+
+        # Process lapse distribution
+        self.has_lapse = p_outlier is not None and p_outlier != 0
+        self._check_lapse(lapse)
+        if self.has_lapse and self.list_params[-1] != "p_outlier":
+            self.list_params.append("p_outlier")
+
+        # Process all parameters
+        self.params = Params.from_user_specs(
+            model=self,
+            include=[] if include is None else include,
+            kwargs=kwargs,
+            p_outlier=p_outlier,
+        )
+
+        self._parent = self.params.parent
+        self._parent_param = self.params.parent_param
+
+        self.formula, self.priors, self.link = self.params.parse_bambi(model=self)
+
+        # For parameters that have a regression backend, apply bounds at the likelihood
+        # level to ensure that the samples that are out of bounds
+        # are discarded (replaced with a large negative value).
+        self.bounds = {
+            name: param.bounds
+            for name, param in self.params.items()
+            if param.is_regression and param.bounds is not None
+        }
+
+        # Set p_outlier and lapse
+        self.p_outlier = self.params.get("p_outlier")
+        self.lapse = lapse if self.has_lapse else None
+
+        self._post_check_data_sanity()
+
+        self.model_distribution = self._make_model_distribution()
+
+        self.family = make_family(
+            self.model_distribution,
+            self.list_params,
+            self.link,
+            self._parent,
+        )
+
+        self.model = bmb.Model(
+            self.formula,
+            data=self.data,
+            family=self.family,
+            priors=self.priors,  # center_predictors=False
+            extra_namespace=self.additional_namespace,
+            **kwargs,
+        )
+
+        self._aliases = _get_alias_dict(
+            self.model, self._parent_param, self.response_c, self.response_str
+        )
+        self.set_alias(self._aliases)
+        self.model.build()
+
+        if process_initvals:
+            self._postprocess_initvals_deterministic(initval_settings=INITVAL_SETTINGS)
+        if self.initval_jitter > 0:
+            self._jitter_initvals(
+                jitter_epsilon=self.initval_jitter,
+                vector_only=True,
+            )
+
+        # Make sure we reset rvs_to_initial_values --> Only None's
+        # Otherwise PyMC barks at us when asking to compute likelihoods
+        self.pymc_model.rvs_to_initial_values.update(
+            {key_: None for key_ in self.pymc_model.rvs_to_initial_values.keys()}
+        )
+        _logger.info("Model initialized successfully.")
+
+    @classproperty
+    def supported_models(cls) -> tuple[SupportedModels, ...]:
+        """Get a tuple of all supported models.
+
+        Returns
+        -------
+        tuple[SupportedModels, ...]
+            A tuple containing all supported model names.
+        """
+        return get_args(SupportedModels)
+
+    @classmethod
+    def _store_init_args(cls, *args, **kwargs):
+        """Store initialization arguments using signature binding."""
+        sig = signature(cls.__init__)
+        bound_args = sig.bind(*args, **kwargs)
+        bound_args.apply_defaults()
+        return {k: v for k, v in bound_args.arguments.items() if k != "self"}
+
+    def find_MAP(self, **kwargs):
+        """Perform Maximum A Posteriori estimation.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the MAP estimates of the model parameters.
+        """
+        self._map_dict = pm.find_MAP(model=self.pymc_model, **kwargs)
+        return self._map_dict
+
+    def sample(
+        self,
+        sampler: Literal["pymc", "numpyro", "blackjax", "nutpie", "laplace"]
+        | None = None,
+        init: str | None = None,
+        initvals: str | dict | None = None,
+        include_response_params: bool = False,
+        **kwargs,
+    ) -> az.InferenceData | pm.Approximation:
+        """Perform sampling using the `fit` method via bambi.Model.
+
+        Parameters
+        ----------
+        sampler: optional
+            The sampler to use. Can be one of "pymc", "numpyro",
+            "blackjax", "nutpie", or "laplace". If using `blackbox` likelihoods,
+            this cannot be "numpyro", "blackjax", or "nutpie". By default it is None,
+            and sampler will automatically be chosen: when the model uses the
+            `approx_differentiable` likelihood, and `jax` backend, "numpyro" will
+            be used. Otherwise, "pymc" (the default PyMC NUTS sampler) will be used.
+
+            Note that the old sampler names such as "mcmc", "nuts_numpyro",
+            "nuts_blackjax" will be deprecated and removed in future releases. A warning
+            will be raised if any of these old names are used.
+        init: optional
+            Initialization method to use for the sampler. If any of the NUTS samplers
+            is used, defaults to `"adapt_diag"`. Otherwise, defaults to `"auto"`.
+        initvals: optional
+            Pass initial values to the sampler. This can be a dictionary of initial
+            values for parameters of the model, or a string "map" to use initialization
+            at the MAP estimate. If "map" is used, the MAP estimate will be computed if
+            not already attached to the base class from prior call to 'find_MAP`.
+        include_response_params: optional
+            Include parameters of the response distribution in the output. These usually
+            take more space than other parameters as there's one of them per
+            observation. Defaults to False.
+        kwargs
+            Other arguments passed to bmb.Model.fit(). Please see [here]
+            (https://bambinos.github.io/bambi/api_reference.html#bambi.models.Model.fit)
+            for full documentation.
+
+        Returns
+        -------
+        az.InferenceData | pm.Approximation
+            A reference to the `model.traces` object, which stores the traces of the
+            last call to `model.sample()`. `model.traces` is an ArviZ `InferenceData`
+            instance if `sampler` is `"pymc"` (default), `"numpyro"`,
+            `"blackjax"` or "`laplace".
+        """
+        # If initvals are None (default)
+        # we skip processing initvals here.
+        if sampler in _new_sampler_mapping:
+            _logger.warning(
+                f"Sampler '{sampler}' is deprecated. "
+                "Please use the new sampler names: "
+                "'pymc', 'numpyro', 'blackjax', 'nutpie', or 'laplace'."
+            )
+            sampler = _new_sampler_mapping[sampler]  # type: ignore
+
+        if sampler == "vi":
+            raise ValueError(
+                "VI is not supported via the sample() method. "
+                "Please use the vi() method instead."
+            )
+
+        if initvals is not None:
+            if isinstance(initvals, dict):
+                kwargs["initvals"] = initvals
+            else:
+                if isinstance(initvals, str):
+                    if initvals == "map":
+                        if self._map_dict is None:
+                            _logger.info(
+                                "initvals='map' but no map"
+                                "estimate precomputed. \n"
+                                "Running map estimation first..."
+                            )
+                            self.find_MAP()
+                            kwargs["initvals"] = self._map_dict
+                        else:
+                            kwargs["initvals"] = self._map_dict
+                else:
+                    raise ValueError(
+                        "initvals argument must be a dictionary or 'map'"
+                        " to use the MAP estimate."
+                    )
+        else:
+            kwargs["initvals"] = self._initvals
+            _logger.info("Using default initvals. \n")
+
+        if sampler is None:
+            if (
+                self.loglik_kind == "approx_differentiable"
+                and self.model_config.backend == "jax"
+            ):
+                sampler = "numpyro"
+            else:
+                sampler = "pymc"
+
+        if self.loglik_kind == "blackbox":
+            if sampler in ["blackjax", "numpyro", "nutpie"]:
+                raise ValueError(
+                    f"{sampler} sampler does not work with blackbox likelihoods."
+                )
+
+            if "step" not in kwargs:
+                kwargs |= {"step": pm.Slice(model=self.pymc_model)}
+
+        if (
+            self.loglik_kind == "approx_differentiable"
+            and self.model_config.backend == "jax"
+            and sampler == "pymc"
+            and kwargs.get("cores", None) != 1
+        ):
+            _logger.warning(
+                "Parallel sampling might not work with `jax` backend and the PyMC NUTS "
+                + "sampler on some platforms. Please consider using `numpyro`, "
+                + "`blackjax`, or `nutpie` sampler if that is a problem."
+            )
+
+        if self._check_extra_fields():
+            self._update_extra_fields()
+
+        if init is None:
+            if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]:
+                init = "adapt_diag"
+            else:
+                init = "auto"
+
+        # If sampler is finally `numpyro` make sure
+        # the jitter argument is set to False
+        if sampler == "numpyro":
+            if "nuts_sampler_kwargs" in kwargs:
+                if kwargs["nuts_sampler_kwargs"].get("jitter"):
+                    _logger.warning(
+                        "The jitter argument is set to True. "
+                        + "This argument is not supported "
+                        + "by the numpyro backend. "
+                        + "The jitter argument will be set to False."
+                    )
+                kwargs["nuts_sampler_kwargs"]["jitter"] = False
+            else:
+                kwargs["nuts_sampler_kwargs"] = {"jitter": False}
+
+        if sampler != "pymc" and "step" in kwargs:
+            raise ValueError(
+                "`step` samplers (enabled by the `step` argument) are only supported "
+                "by the `pymc` sampler."
+            )
+
+        if self._inference_obj is not None:
+            _logger.warning(
+                "The model has already been sampled. Overwriting the previous "
+                + "inference object. Any previous reference to the inference object "
+                + "will still point to the old object."
+            )
+
+        # Define whether likelihood should be computed
+        compute_likelihood = True
+        if "idata_kwargs" in kwargs:
+            if "log_likelihood" in kwargs["idata_kwargs"]:
+                compute_likelihood = kwargs["idata_kwargs"].pop("log_likelihood", True)
+
+        omit_offsets = kwargs.pop("omit_offsets", False)
+        self._inference_obj = self.model.fit(
+            inference_method=(
+                "pymc"
+                if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]
+                else sampler
+            ),
+            init=init,
+            include_response_params=include_response_params,
+            omit_offsets=omit_offsets,
+            **kwargs,
+        )
+
+        # Separate out log likelihood computation
+        if compute_likelihood:
+            self.log_likelihood(self._inference_obj, inplace=True)
+
+        # Subset data vars in posterior
+        self._clean_posterior_group(idata=self._inference_obj)
+        return self.traces
+
+    def vi(
+        self,
+        method: str = "advi",
+        niter: int = 10000,
+        draws: int = 1000,
+        return_idata: bool = True,
+        ignore_mcmc_start_point_defaults=False,
+        **vi_kwargs,
+    ) -> pm.Approximation | az.InferenceData:
+        """Perform Variational Inference.
+
+        Parameters
+        ----------
+        niter : int
+            The number of iterations to run the VI algorithm. Defaults to 3000.
+        method : str
+            The method to use for VI. Can be one of "advi" or "fullrank_advi", "svgd",
+            "asvgd".Defaults to "advi".
+        draws : int
+            The number of samples to draw from the posterior distribution.
+            Defaults to 1000.
+        return_idata : bool
+            If True, returns an InferenceData object. Otherwise, returns the
+            approximation object directly. Defaults to True.
+
+        Returns
+        -------
+            pm.Approximation or az.InferenceData: The mean field approximation object.
+        """
+        if self.loglik_kind == "analytical":
+            _logger.warning(
+                "VI is not recommended for the analytical likelihood,"
+                " since gradients can be brittle."
+            )
+        elif self.loglik_kind == "blackbox":
+            raise ValueError(
+                "VI is not supported for blackbox likelihoods, "
+                " since likelihood gradients are needed!"
+            )
+
+        if ("start" not in vi_kwargs) and not ignore_mcmc_start_point_defaults:
+            _logger.info("Using MCMC starting point defaults.")
+            vi_kwargs["start"] = self._initvals
+
+        # Run variational inference directly from pymc model
+        with self.pymc_model:
+            self._vi_approx = pm.fit(n=niter, method=method, **vi_kwargs)
+
+        # Sample from the approximate posterior
+        if self._vi_approx is not None:
+            self._inference_obj_vi = self._vi_approx.sample(draws)
+
+        # Post-processing
+        self._clean_posterior_group(idata=self._inference_obj_vi)
+
+        # Return the InferenceData object if return_idata is True
+        if return_idata:
+            return self._inference_obj_vi
+        # Otherwise return the appromation object directly
+        return self.vi_approx
+
+    def _clean_posterior_group(self, idata: az.InferenceData | None = None):
+        """Clean up the posterior group of the InferenceData object.
+
+        Parameters
+        ----------
+        idata : az.InferenceData
+            The InferenceData object to clean up. If None, the last InferenceData object
+            will be used.
+        """
+        # # Logic behind which variables to keep:
+        # # We essentially want to get rid of
+        # # all the trial-wise variables.
+
+        # # We drop all distributional components, IF they are deterministics
+        # # (in which case they will be trial wise systematically)
+        # # and we keep distributional components, IF they are
+        # # basic random-variabels (in which case they should never
+        # # appear trial-wise).
+        if idata is None:
+            raise ValueError(
+                "The InferenceData object is None. Cannot clean up the posterior group."
+            )
+        elif not hasattr(idata, "posterior"):
+            raise ValueError(
+                "The InferenceData object does not have a posterior group. "
+                + "Cannot clean up the posterior group."
+            )
+
+        vars_to_keep = set(idata["posterior"].data_vars.keys()).difference(
+            set(
+                key_
+                for key_ in self.model.distributional_components.keys()
+                if key_ in [var_.name for var_ in self.pymc_model.deterministics]
+            )
+        )
+        vars_to_keep_clean = [
+            var_
+            for var_ in vars_to_keep
+            if isinstance(var_, str) and "_mean" not in var_
+        ]
+
+        setattr(
+            idata,
+            "posterior",
+            idata["posterior"][vars_to_keep_clean],
+        )
+
+    def log_likelihood(
+        self,
+        idata: az.InferenceData | None = None,
+        data: pd.DataFrame | None = None,
+        inplace: bool = True,
+        keep_likelihood_params: bool = False,
+    ) -> az.InferenceData | None:
+        """Compute the log likelihood of the model.
+
+        Parameters
+        ----------
+        idata : optional
+            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
+        data : optional
+            A pandas DataFrame with values for the predictors that are used to obtain
+            out-of-sample predictions. If omitted, the original dataset is used.
+        inplace : optional
+            If `True` will modify idata in-place and append a `log_likelihood` group to
+            `idata`. Otherwise, it will return a copy of idata with the predictions
+            added, by default True.
+        keep_likelihood_params : optional
+            If `True`, the trial wise likelihood parameters that are computed
+            on route to getting the log likelihood are kept in the `idata` object.
+            Defaults to False. See also the method `add_likelihood_parameters_to_idata`.
+
+        Returns
+        -------
+        az.InferenceData | None
+            InferenceData or None
+        """
+        if self._inference_obj is None and idata is None:
+            raise ValueError(
+                "Neither has the model been sampled yet nor"
+                + " an idata object has been provided."
+            )
+
+        if idata is None:
+            if self._inference_obj is None:
+                raise ValueError(
+                    "The model has not been sampled yet. "
+                    + "Please provide an idata object."
+                )
+            else:
+                idata = self._inference_obj
+
+        # Actual likelihood computation
+        idata = _compute_log_likelihood(self.model, idata, data, inplace)
+
+        # clean up posterior:
+        if not keep_likelihood_params:
+            self._clean_posterior_group(idata=idata)
+
+        if inplace:
+            return None
+        else:
+            return idata
+
+    def add_likelihood_parameters_to_idata(
+        self,
+        idata: az.InferenceData | None = None,
+        inplace: bool = False,
+    ) -> az.InferenceData | None:
+        """Add likelihood parameters to the InferenceData object.
+
+        Parameters
+        ----------
+        idata : az.InferenceData
+            The InferenceData object returned by HSSM.sample().
+        inplace : bool
+            If True, the likelihood parameters are added to idata in-place. Otherwise,
+            a copy of idata with the likelihood parameters added is returned.
+            Defaults to False.
+
+        Returns
+        -------
+        az.InferenceData | None
+            InferenceData or None
+        """
+        if idata is None:
+            if self._inference_obj is None:
+                raise ValueError("No idata provided and model not yet sampled!")
+            else:
+                idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
+                    deepcopy(self._inference_obj)
+                    if not inplace
+                    else self._inference_obj
+                )
+        else:
+            idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
+                deepcopy(idata) if not inplace else idata
+            )
+        return idata
+
+    def sample_posterior_predictive(
+        self,
+        idata: az.InferenceData | None = None,
+        data: pd.DataFrame | None = None,
+        inplace: bool = True,
+        include_group_specific: bool = True,
+        kind: Literal["response", "response_params"] = "response",
+        draws: int | float | list[int] | np.ndarray | None = None,
+        safe_mode: bool = True,
+    ) -> az.InferenceData | None:
+        """Perform posterior predictive sampling from the HSSM model.
+
+        Parameters
+        ----------
+        idata : optional
+            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
+            the `InferenceData` from the last time `sample()` is called will be used.
+        data : optional
+            An optional data frame with values for the predictors that are used to
+            obtain out-of-sample predictions. If omitted, the original dataset is used.
+        inplace : optional
+            If `True` will modify idata in-place and append a `posterior_predictive`
+            group to `idata`. Otherwise, it will return a copy of idata with the
+            predictions added, by default True.
+        include_group_specific : optional
+            If `True` will make predictions including the group specific effects.
+            Otherwise, predictions are made with common effects only (i.e. group-
+            specific are set to zero), by default True.
+        kind: optional
+            Indicates the type of prediction required. Can be `"response_params"` or
+            `"response"`. The first returns draws from the posterior distribution of the
+            likelihood parameters, while the latter returns the draws from the posterior
+            predictive distribution (i.e. the posterior probability distribution for a
+            new observation) in addition to the posterior distribution. Defaults to
+            "response_params".
+        draws: optional
+            The number of samples to draw from the posterior predictive distribution
+            from each chain.
+            When it's an integer >= 1, the number of samples to be extracted from the
+            `draw` dimension. If this integer is larger than the number of posterior
+            samples in each chain, all posterior samples will be used
+            in posterior predictive sampling. When a float between 0 and 1, the
+            proportion of samples from the draw dimension from each chain to be used in
+            posterior predictive sampling.. If this proportion is very
+            small, at least one sample will be used. When None, all posterior samples
+            will be used. Defaults to None.
+        safe_mode: bool
+            If True, the function will split the draws into chunks of 10 to avoid memory
+            issues. Defaults to True.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet and idata is not provided.
+
+        Returns
+        -------
+        az.InferenceData | None
+            InferenceData or None
+        """
+        if idata is None:
+            if self._inference_obj is None:
+                raise ValueError(
+                    "The model has not been sampled yet. "
+                    + "Please either provide an idata object or sample the model first."
+                )
+            idata = self._inference_obj
+            _logger.info(
+                "idata=None, we use the traces assigned to the HSSM object as idata."
+            )
+
+        if idata is not None:
+            if "posterior_predictive" in idata.groups():
+                del idata["posterior_predictive"]
+                _logger.warning(
+                    "pre-existing posterior_predictive group deleted from idata. \n"
+                )
+
+        if self._check_extra_fields(data):
+            self._update_extra_fields(data)
+
+        if isinstance(draws, np.ndarray):
+            draws = draws.astype(int)
+        elif isinstance(draws, list):
+            draws = np.array(draws).astype(int)
+        elif isinstance(draws, int | float):
+            draws = np.arange(int(draws))
+        elif draws is None:
+            draws = idata["posterior"].draw.values
+        else:
+            raise ValueError(
+                "draws must be an integer, " + "a list of integers, or a numpy array."
+            )
+
+        assert isinstance(draws, np.ndarray)
+
+        # Make a copy of idata, set the `posterior` group to be a random sub-sample
+        # of the original (draw dimension gets sub-sampled)
+
+        idata_copy = idata.copy()
+
+        if (draws.shape != idata["posterior"].draw.values.shape) or (
+            (draws.shape == idata["posterior"].draw.values.shape)
+            and not np.allclose(draws, idata["posterior"].draw.values)
+        ):
+            # Reassign posterior to sub-sampled version
+            setattr(idata_copy, "posterior", idata["posterior"].isel(draw=draws))
+
+        if kind == "response":
+            # If we run kind == 'response' we actually run the observation RV
+            if safe_mode:
+                # safe mode splits the draws into chunks of 10 to avoid
+                # memory issues (TODO: Figure out the source of memory issues)
+                split_draws = _split_array(
+                    idata_copy["posterior"].draw.values, divisor=10
+                )
+
+                posterior_predictive_list = []
+                for samples_tmp in split_draws:
+                    tmp_posterior = idata["posterior"].sel(draw=samples_tmp)
+                    setattr(idata_copy, "posterior", tmp_posterior)
+                    self.model.predict(
+                        idata_copy, kind, data, True, include_group_specific
+                    )
+                    posterior_predictive_list.append(idata_copy["posterior_predictive"])
+
+                if inplace:
+                    idata.add_groups(
+                        posterior_predictive=xr.concat(
+                            posterior_predictive_list, dim="draw"
+                        )
+                    )
+                    # for inplace, we don't return anything
+                    return None
+                else:
+                    # Reassign original posterior to idata_copy
+                    setattr(idata_copy, "posterior", idata["posterior"])
+                    # Add new posterior predictive group to idata_copy
+                    del idata_copy["posterior_predictive"]
+                    idata_copy.add_groups(
+                        posterior_predictive=xr.concat(
+                            posterior_predictive_list, dim="draw"
+                        )
+                    )
+                    return idata_copy
+            else:
+                if inplace:
+                    # If not safe-mode
+                    # We call .predict() directly without any
+                    # chunking of data.
+
+                    # .predict() is called on the copy of idata
+                    # since we still subsampled (or assigned) the draws
+                    self.model.predict(
+                        idata_copy, kind, data, True, include_group_specific
+                    )
+
+                    # posterior predictive group added to idata
+                    idata.add_groups(
+                        posterior_predictive=idata_copy["posterior_predictive"]
+                    )
+                    # don't return anything if inplace
+                    return None
+                else:
+                    # Not safe mode and not inplace
+                    # Function acts as very thin wrapper around
+                    # .predict(). It just operates on the
+                    # idata_copy object
+                    return self.model.predict(
+                        idata_copy, kind, data, False, include_group_specific
+                    )
+        elif kind == "response_params":
+            # If kind == 'response_params', we don't need to run the RV directly,
+            # there shouldn't really be any significant memory issues here,
+            # we can simply ignore settings, since the computational overhead
+            # should be very small --> nudges user towards good outputs.
+            _logger.warning(
+                "The kind argument is set to 'mean', but 'draws' argument "
+                + "is not None: The draws argument will be ignored!"
+            )
+            return self.model.predict(
+                idata, kind, data, inplace, include_group_specific
+            )
+        else:
+            raise ValueError("`kind` must be either 'response' or 'response_params'.")
+
+    def plot_predictive(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
+        """Produce a posterior predictive plot.
+
+        Equivalent to calling `hssm.plotting.plot_predictive()` with the
+        model. Please see that function for
+        [full documentation][hssm.plotting.plot_predictive].
+
+        Returns
+        -------
+        mpl.axes.Axes | sns.FacetGrid
+            The matplotlib axis or seaborn FacetGrid object containing the plot.
+        """
+        return plotting.plot_predictive(self, **kwargs)
+
+    def plot_quantile_probability(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
+        """Produce a quantile probability plot.
+
+        Equivalent to calling `hssm.plotting.plot_quantile_probability()` with the
+        model. Please see that function for
+        [full documentation][hssm.plotting.plot_quantile_probability].
+
+        Returns
+        -------
+        mpl.axes.Axes | sns.FacetGrid
+            The matplotlib axis or seaborn FacetGrid object containing the plot.
+        """
+        return plotting.plot_quantile_probability(self, **kwargs)
+
+    def predict(self, **kwargs) -> az.InferenceData:
+        """Generate samples from the predictive distribution."""
+        return self.model.predict(**kwargs)
+
+    def sample_do(
+        self, params: dict[str, Any], draws: int = 100, return_model=False, **kwargs
+    ) -> az.InferenceData | tuple[az.InferenceData, pm.Model]:
+        """Generate samples from the predictive distribution using the `do-operator`."""
+        do_model = do(self.pymc_model, params)
+        do_idata = pm.sample_prior_predictive(model=do_model, draws=draws, **kwargs)
+
+        # clean up `rt,response_mean` to `v`
+        do_idata = self._drop_parent_str_from_idata(idata=do_idata)
+
+        # rename otherwise inconsistentdims and coords
+        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].dims:
+            setattr(
+                do_idata,
+                "prior_predictive",
+                do_idata["prior_predictive"].rename_dims(
+                    {"rt,response_extra_dim_0": "rt,response_dim"}
+                ),
+            )
+        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].coords:
+            setattr(
+                do_idata,
+                "prior_predictive",
+                do_idata["prior_predictive"].rename_vars(
+                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
+                ),
+            )
+
+        if return_model:
+            return do_idata, do_model
+        return do_idata
+
+    def sample_prior_predictive(
+        self,
+        draws: int = 500,
+        var_names: str | list[str] | None = None,
+        omit_offsets: bool = True,
+        random_seed: np.random.Generator | None = None,
+    ) -> az.InferenceData:
+        """Generate samples from the prior predictive distribution.
+
+        Parameters
+        ----------
+        draws
+            Number of draws to sample from the prior predictive distribution. Defaults
+            to 500.
+        var_names
+            A list of names of variables for which to compute the prior predictive
+            distribution. Defaults to ``None`` which means both observed and unobserved
+            RVs.
+        omit_offsets
+            Whether to omit offset terms. Defaults to ``True``.
+        random_seed
+            Seed for the random number generator.
+
+        Returns
+        -------
+        az.InferenceData
+            ``InferenceData`` object with the groups ``prior``, ``prior_predictive`` and
+            ``observed_data``.
+        """
+        prior_predictive = self.model.prior_predictive(
+            draws, var_names, omit_offsets, random_seed
+        )
+
+        # AF-COMMENT: Not sure if necessary to include the
+        # mean prior here (which adds deterministics that
+        # could be recomputed elsewhere)
+        prior_predictive.add_groups(posterior=prior_predictive.prior)
+        self.model.predict(prior_predictive, kind="mean", inplace=True)
+
+        # clean
+        setattr(prior_predictive, "prior", prior_predictive["posterior"])
+        del prior_predictive["posterior"]
+
+        if self._inference_obj is None:
+            self._inference_obj = prior_predictive
+        else:
+            self._inference_obj.extend(prior_predictive)
+
+        # clean up `rt,response_mean` to `v`
+        idata = self._drop_parent_str_from_idata(idata=self._inference_obj)
+
+        # rename otherwise inconsistentdims and coords
+        if "rt,response_extra_dim_0" in idata["prior_predictive"].dims:
+            setattr(
+                idata,
+                "prior_predictive",
+                idata["prior_predictive"].rename_dims(
+                    {"rt,response_extra_dim_0": "rt,response_dim"}
+                ),
+            )
+        if "rt,response_extra_dim_0" in idata["prior_predictive"].coords:
+            setattr(
+                idata,
+                "prior_predictive",
+                idata["prior_predictive"].rename_vars(
+                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
+                ),
+            )
+
+        # Update self._inference_obj to match the cleaned idata
+        self._inference_obj = idata
+        return deepcopy(self._inference_obj)
+
+    @property
+    def pymc_model(self) -> pm.Model:
+        """Provide access to the PyMC model.
+
+        Returns
+        -------
+        pm.Model
+            The PyMC model built by bambi
+        """
+        return self.model.backend.model
+
+    def set_alias(self, aliases: dict[str, str | dict]):
+        """Set parameter aliases.
+
+        Sets the aliases according to the dictionary passed to it and rebuild the
+        model.
+
+        Parameters
+        ----------
+        aliases
+            A dict specifying the parameter names being aliased and the aliases.
+        """
+        self.model.set_alias(aliases)
+        self.model.build()
+
+    @property
+    def response_c(self) -> str:
+        """Return the response variable names in c() format."""
+        return f"c({', '.join(self.response)})"
+
+    @property
+    def response_str(self) -> str:
+        """Return the response variable names in string format."""
+        return ",".join(self.response)
+
+    # NOTE: can't annotate return type because the graphviz dependency is optional
+    def graph(self, formatting="plain", name=None, figsize=None, dpi=300, fmt="png"):
+        """Produce a graphviz Digraph from a built HSSM model.
+
+        Requires graphviz, which may be installed most easily with `conda install -c
+        conda-forge python-graphviz`. Alternatively, you may install the `graphviz`
+        binaries yourself, and then `pip install graphviz` to get the python bindings.
+        See http://graphviz.readthedocs.io/en/stable/manual.html for more information.
+
+        Parameters
+        ----------
+        formatting
+            One of `"plain"` or `"plain_with_params"`. Defaults to `"plain"`.
+        name
+            Name of the figure to save. Defaults to `None`, no figure is saved.
+        figsize
+            Maximum width and height of figure in inches. Defaults to `None`, the
+            figure size is set automatically. If defined and the drawing is larger than
+            the given size, the drawing is uniformly scaled down so that it fits within
+            the given size.  Only works if `name` is not `None`.
+        dpi
+            Point per inch of the figure to save.
+            Defaults to 300. Only works if `name` is not `None`.
+        fmt
+            Format of the figure to save.
+            Defaults to `"png"`. Only works if `name` is not `None`.
+
+        Returns
+        -------
+        graphviz.Graph
+            The graph
+        """
+        graph = self.model.graph(formatting, name, figsize, dpi, fmt)
+
+        parent_param = self._parent_param
+        if parent_param.is_regression:
+            return graph
+
+        # Modify the graph
+        # 1. Remove all nodes and edges related to `{parent}_mean`:
+        graph.body = [
+            item for item in graph.body if f"{parent_param.name}_mean" not in item
+        ]
+        # 2. Add a new edge from parent to response
+        graph.edge(parent_param.name, self.response_str)
+
+        return graph
+
+    def compile_logp(self, keep_transformed: bool = False, **kwargs):
+        """Compile the log probability function for the model.
+
+        Parameters
+        ----------
+        keep_transformed : bool, optional
+            If True, keeps the transformed variables in the compiled function.
+            If False, removes value transforms before compilation.
+            Defaults to False.
+        **kwargs
+            Additional keyword arguments passed to PyMC's compile_logp:
+            - vars: List of variables. Defaults to None (all variables).
+            - jacobian: Whether to include log(|det(dP/dQ)|) term for
+            transformed variables. Defaults to True.
+            - sum: Whether to sum all terms instead of returning a vector.
+            Defaults to True.
+
+        Returns
+        -------
+        callable
+            A compiled function that computes the model log probability.
+        """
+        if keep_transformed:
+            return self.pymc_model.compile_logp(
+                vars=kwargs.get("vars", None),
+                jacobian=kwargs.get("jacobian", True),
+                sum=kwargs.get("sum", True),
+            )
+        else:
+            new_model = pm.model.transform.conditioning.remove_value_transforms(
+                self.pymc_model
+            )
+            return new_model.compile_logp(
+                vars=kwargs.get("vars", None),
+                jacobian=kwargs.get("jacobian", True),
+                sum=kwargs.get("sum", True),
+            )
+
+    def plot_trace(
+        self,
+        data: az.InferenceData | None = None,
+        include_deterministic: bool = False,
+        tight_layout: bool = True,
+        **kwargs,
+    ) -> None:
+        """Generate trace plot with ArviZ but with additional convenience features.
+
+        This is a simple wrapper for the az.plot_trace() function. By default, it
+        filters out the deterministic values from the plot. Please see the
+        [arviz documentation]
+        (https://arviz-devs.github.io/arviz/api/generated/arviz.plot_trace.html)
+        for additional parameters that can be specified.
+
+        Parameters
+        ----------
+        data : optional
+            An ArviZ InferenceData object. If None, the traces stored in the model will
+            be used.
+        include_deterministic : optional
+            Whether to include deterministic variables in the plot. Defaults to False.
+            Note that if include deterministic is set to False and and `var_names` is
+            provided, the `var_names` provided will be modified to also exclude the
+            deterministic values. If this is not desirable, set
+            `include deterministic` to True.
+        tight_layout : optional
+            Whether to call plt.tight_layout() after plotting. Defaults to True.
+        """
+        data = data or self.traces
+        if not isinstance(data, az.InferenceData):
+            raise TypeError("data must be an InferenceData object.")
+
+        if not include_deterministic:
+            var_names = list(
+                set([var.name for var in self.pymc_model.free_RVs]).intersection(
+                    set(list(data["posterior"].data_vars.keys()))
+                )
+            )
+            # var_names = self._get_deterministic_var_names(data)
+            if var_names:
+                if "var_names" in kwargs:
+                    if isinstance(kwargs["var_names"], str):
+                        if kwargs["var_names"] not in var_names:
+                            var_names.append(kwargs["var_names"])
+                        kwargs["var_names"] = var_names
+                    elif isinstance(kwargs["var_names"], list):
+                        kwargs["var_names"] = list(
+                            set(var_names) | set(kwargs["var_names"])
+                        )
+                    elif kwargs["var_names"] is None:
+                        kwargs["var_names"] = var_names
+                    else:
+                        raise ValueError(
+                            "`var_names` must be a string, a list of strings, or None."
+                        )
+                else:
+                    kwargs["var_names"] = var_names
+        az.plot_trace(data, **kwargs)
+
+        if tight_layout:
+            plt.tight_layout()
+
+    def summary(
+        self,
+        data: az.InferenceData | None = None,
+        include_deterministic: bool = False,
+        **kwargs,
+    ) -> pd.DataFrame | xr.Dataset:
+        """Produce a summary table with ArviZ but with additional convenience features.
+
+        This is a simple wrapper for the az.summary() function. By default, it
+        filters out the deterministic values from the plot. Please see the
+        [arviz documentation]
+        (https://arviz-devs.github.io/arviz/api/generated/arviz.summary.html)
+        for additional parameters that can be specified.
+
+        Parameters
+        ----------
+        data
+            An ArviZ InferenceData object. If None, the traces stored in the model will
+            be used.
+        include_deterministic : optional
+            Whether to include deterministic variables in the plot. Defaults to False.
+            Note that if include_deterministic is set to False and and `var_names` is
+            provided, the `var_names` provided will be modified to also exclude the
+            deterministic values. If this is not desirable, set
+            `include_deterministic` to True.
+
+        Returns
+        -------
+        pd.DataFrame | xr.Dataset
+            A pandas DataFrame or xarray Dataset containing the summary statistics.
+        """
+        data = data or self.traces
+        if not isinstance(data, az.InferenceData):
+            raise TypeError("data must be an InferenceData object.")
+
+        if not include_deterministic:
+            var_names = list(
+                set([var.name for var in self.pymc_model.free_RVs]).intersection(
+                    set(list(data["posterior"].data_vars.keys()))
+                )
+            )
+            # var_names = self._get_deterministic_var_names(data)
+            if var_names:
+                kwargs["var_names"] = list(set(var_names + kwargs.get("var_names", [])))
+        return az.summary(data, **kwargs)
+
+    def initial_point(self, transformed: bool = False) -> dict[str, np.ndarray]:
+        """Compute the initial point of the model.
+
+        This is a slightly altered version of pm.initial_point.initial_point().
+
+        Parameters
+        ----------
+        transformed : bool, optional
+            If True, return the initial point in transformed space.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the initial point of the model parameters.
+        """
+        fn = pm.initial_point.make_initial_point_fn(
+            model=self.pymc_model, return_transformed=transformed
+        )
+        return pm.model.Point(fn(None), model=self.pymc_model)
+
+    def restore_traces(
+        self, traces: az.InferenceData | pm.Approximation | str | PathLike
+    ) -> None:
+        """Restore traces from an InferenceData object or a .netcdf file.
+
+        Parameters
+        ----------
+        traces
+            An InferenceData object or a path to a file containing the traces.
+        """
+        if isinstance(traces, pm.Approximation):
+            self._inference_obj_vi = traces
+            return
+
+        if isinstance(traces, (str, PathLike)):
+            traces = az.from_netcdf(traces)
+        self._inference_obj = cast("az.InferenceData", traces)
+
+    def restore_vi_traces(
+        self, traces: az.InferenceData | pm.Approximation | str | PathLike
+    ) -> None:
+        """Restore VI traces from an InferenceData object or a .netcdf file.
+
+        Parameters
+        ----------
+        traces
+            An InferenceData object or a path to a file containing the VI traces.
+        """
+        if isinstance(traces, pm.Approximation):
+            self._inference_obj_vi = traces
+            return
+
+        if isinstance(traces, (str, PathLike)):
+            traces = az.from_netcdf(traces)
+        self._inference_obj_vi = cast("az.InferenceData", traces)
+
+    def save_model(
+        self,
+        model_name: str | None = None,
+        allow_absolute_base_path: bool = False,
+        base_path: str | Path = "hssm_models",
+        save_idata_only: bool = False,
+    ) -> None:
+        """Save a HSSM model instance and its inference results to disk.
+
+        Parameters
+        ----------
+        model : HSSM
+            The HSSM model instance to save
+        model_name : str | None
+            Name to use for the saved model files.
+            If None, will use model.model_name with timestamp
+        allow_absolute_base_path : bool
+            Whether to allow absolute paths for base_path
+        base_path : str | Path
+            Base directory to save model files in.
+            Must be relative path if allow_absolute_base_path=False
+        save_idata_only: bool = False,
+            Whether to save the model class instance itself
+
+        Raises
+        ------
+        ValueError
+            If base_path is absolute and allow_absolute_base_path=False
+        """
+        # check if base_path is absolute
+        if not allow_absolute_base_path:
+            if str(base_path).startswith("/"):
+                raise ValueError(
+                    "base_path must be a relative path"
+                    " if allow_absolute_base_path is False"
+                )
+
+        if model_name is None:
+            # Get date string format as suffix to model name
+            model_name = (
+                self.model_name
+                + "_"
+                + datetime.datetime.now().strftime("%Y_%m_%d_%H_%M_%S")
+            )
+
+        # check if folder by name model_name exists
+        model_name = model_name.replace(" ", "_")
+        model_path = Path(base_path).joinpath(model_name)
+        model_path.mkdir(parents=True, exist_ok=True)
+
+        # Save model to pickle file
+        if not save_idata_only:
+            with open(model_path.joinpath("model.pkl"), "wb") as f:
+                cpickle.dump(self, f)
+
+        # Save traces to netcdf file
+        if self._inference_obj is not None:
+            az.to_netcdf(self._inference_obj, model_path.joinpath("traces.nc"))
+
+        # Save vi_traces to netcdf file
+        if self._inference_obj_vi is not None:
+            az.to_netcdf(self._inference_obj_vi, model_path.joinpath("vi_traces.nc"))
+
+    @classmethod
+    def load_model(
+        cls, path: Union[str, Path]
+    ) -> Union["HSSM", dict[str, Optional[az.InferenceData]]]:
+        """Load a HSSM model instance and its inference results from disk.
+
+        Parameters
+        ----------
+        path : str | Path
+            Path to the model directory or model.pkl file. If a directory is provided,
+            will look for model.pkl, traces.nc and vi_traces.nc files within it.
+
+        Returns
+        -------
+        HSSM
+            The loaded HSSM model instance with inference results attached if available.
+        """
+        # Convert path to Path object
+        path = Path(path)
+
+        # If path points to a file, assume it's model.pkl
+        if path.is_file():
+            model_dir = path.parent
+            model_path = path
+        else:
+            # Path points to directory
+            model_dir = path
+            model_path = model_dir.joinpath("model.pkl")
+
+        # check if model_dir exists
+        if not model_dir.exists():
+            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
+
+        # check if model.pkl exists raise logging information if not
+        if not model_path.exists():
+            _logger.info(
+                f"model.pkl file does not exist in {model_dir}. "
+                "Attempting to load traces only."
+            )
+            if (not model_dir.joinpath("traces.nc").exists()) and (
+                not model_dir.joinpath("vi_traces.nc").exists()
+            ):
+                raise FileNotFoundError(f"No traces found in {model_dir}.")
+            else:
+                idata_dict = cls.load_model_idata(model_dir)
+                return idata_dict
+        else:
+            # Load model from pickle file
+            with open(model_path, "rb") as f:
+                model = cpickle.load(f)
+
+            # Load traces if they exist
+            traces_path = model_dir.joinpath("traces.nc")
+            if traces_path.exists():
+                model.restore_traces(traces_path)
+
+            # Load VI traces if they exist
+            vi_traces_path = model_dir.joinpath("vi_traces.nc")
+            if vi_traces_path.exists():
+                model.restore_vi_traces(vi_traces_path)
+        return model
+
+    @classmethod
+    def load_model_idata(cls, path: str | Path) -> dict[str, az.InferenceData | None]:
+        """Load the traces from a model directory.
+
+        Parameters
+        ----------
+        path : str | Path
+            Path to the model directory containing traces.nc and/or vi_traces.nc files.
+
+        Returns
+        -------
+        dict[str, az.InferenceData | None]
+            A dictionary with keys "idata_mcmc" and "idata_vi" containing the traces
+            from the model directory. If the traces do not exist, the corresponding
+            value will be None.
+        """
+        idata_dict: dict[str, az.InferenceData | None] = {}
+        model_dir = Path(path)
+        # check if path exists
+        if not model_dir.exists():
+            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
+
+        # check if traces.nc exists
+        traces_path = model_dir.joinpath("traces.nc")
+        if not traces_path.exists():
+            _logger.warning(f"traces.nc file does not exist in {model_dir}.")
+            idata_dict["idata_mcmc"] = None
+        else:
+            idata_dict["idata_mcmc"] = az.from_netcdf(traces_path)
+
+        # check if vi_traces.nc exists
+        vi_traces_path = model_dir.joinpath("vi_traces.nc")
+        if not vi_traces_path.exists():
+            _logger.warning(f"vi_traces.nc file does not exist in {model_dir}.")
+            idata_dict["idata_vi"] = None
+        else:
+            idata_dict["idata_vi"] = az.from_netcdf(vi_traces_path)
+
+        return idata_dict
+
+    def __getstate__(self):
+        """Get the state of the model for pickling.
+
+        This method is called when pickling the model.
+        It returns a dictionary containing the constructor
+        arguments needed to recreate the model instance.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the constructor arguments
+            under the key 'constructor_args'.
+        """
+        state = {"constructor_args": self._init_args}
+        return state
+
+    def __setstate__(self, state):
+        """Set the state of the model when unpickling.
+
+        This method is called when unpickling the model. It creates a new instance
+        of HSSM using the constructor arguments stored in the state dictionary,
+        and copies its attributes to the current instance.
+
+        Parameters
+        ----------
+        state : dict
+            A dictionary containing the constructor arguments under the key
+            'constructor_args'.
+        """
+        new_instance = HSSM(**state["constructor_args"])
+        self.__dict__ = new_instance.__dict__
+
+    def __repr__(self) -> str:
+        """Create a representation of the model."""
+        output = [
+            "Hierarchical Sequential Sampling Model",
+            f"Model: {self.model_name}\n",
+            f"Response variable: {self.response_str}",
+            f"Likelihood: {self.loglik_kind}",
+            f"Observations: {len(self.data)}\n",
+            "Parameters:\n",
+        ]
+
+        for param in self.params.values():
+            if param.name == "p_outlier":
+                continue
+            output.append(f"{param.name}:")
+
+            component = self.model.components[param.name]
+
+            # Regression case:
+            if param.is_regression:
+                assert isinstance(component, DistributionalComponent)
+                output.append(f"    Formula: {param.formula}")
+                output.append("    Priors:")
+                intercept_term = component.intercept_term
+                if intercept_term is not None:
+                    output.append(_print_prior(intercept_term))
+                for _, common_term in component.common_terms.items():
+                    output.append(_print_prior(common_term))
+                for _, group_specific_term in component.group_specific_terms.items():
+                    output.append(_print_prior(group_specific_term))
+                output.append(f"    Link: {param.link}")
+            # None regression case
+            else:
+                if param.prior is None:
+                    prior = (
+                        component.intercept_term.prior
+                        if param.is_parent
+                        else component.prior
+                    )
+                else:
+                    prior = param.prior
+                output.append(f"    Prior: {prior}")
+            output.append(f"    Explicit bounds: {param.bounds}")
+            output.append(
+                " (ignored due to link function)"
+                if self.link_settings is not None
+                else ""
+            )
+
+        # TODO: Handle p_outlier regression correctly here.
+        if self.p_outlier is not None:
+            output.append("")
+            output.append(f"Lapse probability: {self.p_outlier.prior}")
+            output.append(f"Lapse distribution: {self.lapse}")
+
+        return "\n".join(output)
+
+    def __str__(self) -> str:
+        """Create a string representation of the model."""
+        return self.__repr__()
+
+    @property
+    def traces(self) -> az.InferenceData | pm.Approximation:
+        """Return the trace of the model after sampling.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet.
+
+        Returns
+        -------
+        az.InferenceData | pm.Approximation
+            The trace of the model after the last call to `sample()`.
+        """
+        if not self._inference_obj:
+            raise ValueError("Please sample the model first.")
+
+        return self._inference_obj
+
+    @property
+    def vi_idata(self) -> az.InferenceData:
+        """Return the variational inference approximation object.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet.
+
+        Returns
+        -------
+        az.InferenceData
+            The variational inference approximation object.
+        """
+        if not self._inference_obj_vi:
+            raise ValueError(
+                "Please run variational inference first, "
+                "no variational posterior attached."
+            )
+
+        return self._inference_obj_vi
+
+    @property
+    def vi_approx(self) -> pm.Approximation:
+        """Return the variational inference approximation object.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet.
+
+        Returns
+        -------
+        pm.Approximation
+            The variational inference approximation object.
+        """
+        if not self._vi_approx:
+            raise ValueError(
+                "Please run variational inference first, "
+                "no variational approximation attached."
+            )
+
+        return self._vi_approx
+
+    @property
+    def map(self) -> dict:
+        """Return the MAP estimates of the model parameters.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the MAP estimates of the model parameters.
+        """
+        if not self._map_dict:
+            raise ValueError("Please compute map first.")
+
+        return self._map_dict
+
+    @property
+    def initvals(self) -> dict:
+        """Return the initial values of the model parameters for sampling.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the initial values of the model parameters.
+            This dict serves as the default for initial values, and can be passed
+            directly to the `.sample()` function.
+        """
+        if self._initvals == {}:
+            self._initvals = self.initial_point()
+        return self._initvals
+
+    def _check_lapse(self, lapse):
+        """Determine if p_outlier and lapse is specified correctly."""
+        # Basically, avoid situations where only one of them is specified.
+        if self.has_lapse and lapse is None:
+            raise ValueError(
+                "You have specified `p_outlier`. Please also specify `lapse`."
+            )
+        if lapse is not None and not self.has_lapse:
+            _logger.warning(
+                "You have specified the `lapse` argument to include a lapse "
+                + "distribution, but `p_outlier` is set to either 0 or None. "
+                + "Your lapse distribution will be ignored."
+            )
+        if "p_outlier" in self.list_params and self.list_params[-1] != "p_outlier":
+            raise ValueError(
+                "Please do not include 'p_outlier' in `list_params`. "
+                + "We automatically append it to `list_params` when `p_outlier` "
+                + "parameter is not None"
+            )
+
+    def _make_model_distribution(self) -> type[pm.Distribution]:
+        """Make a pm.Distribution for the model."""
+        ### Logic for different types of likelihoods:
+        # -`analytical` and `blackbox`:
+        #     loglik should be a `pm.Distribution`` or a Python callable (any arbitrary
+        #     function).
+        # - `approx_differentiable`:
+        #     In addition to `pm.Distribution` and any arbitrary function, it can also
+        #     be an str (which we will download from hugging face) or a Pathlike
+        #     which we will download and make a distribution.
+
+        # If user has already provided a log-likelihood function as a distribution
+        # Use it directly as the distribution
+        if isclass(self.loglik) and issubclass(self.loglik, pm.Distribution):
+            return self.loglik
+
+        params_is_reg = [
+            param.is_vector
+            for param_name, param in self.params.items()
+            if param_name != "p_outlier"
+        ]
+        if self.extra_fields is not None:
+            params_is_reg += [True for _ in self.extra_fields]
+
+        if self.loglik_kind == "approx_differentiable":
+            if self.model_config.backend == "jax":
+                likelihood_callable = make_likelihood_callable(
+                    loglik=self.loglik,
+                    loglik_kind="approx_differentiable",
+                    backend="jax",
+                    params_is_reg=params_is_reg,
+                )
+            else:
+                likelihood_callable = make_likelihood_callable(
+                    loglik=self.loglik,
+                    loglik_kind="approx_differentiable",
+                    backend=self.model_config.backend,
+                )
+        else:
+            likelihood_callable = make_likelihood_callable(
+                loglik=self.loglik,
+                loglik_kind=self.loglik_kind,
+                backend=self.model_config.backend,
+            )
+
+        self.loglik = likelihood_callable
+
+        # Make the callable for missing data
+        # And assemble it with the callable for the likelihood
+        if self.missing_data_network != MissingDataNetwork.NONE:
+            if self.missing_data_network == MissingDataNetwork.OPN:
+                params_only = False
+            elif self.missing_data_network == MissingDataNetwork.CPN:
+                params_only = True
+            else:
+                params_only = None
+
+            if self.loglik_missing_data is None:
+                self.loglik_missing_data = (
+                    self.model_name
+                    + missing_data_networks_suffix[self.missing_data_network]
+                    + ".onnx"
+                )
+
+            backend_tmp: Literal["pytensor", "jax", "other"] | None = (
+                "jax"
+                if self.model_config.backend != "pytensor"
+                else self.model_config.backend
+            )
+            missing_data_callable = make_missing_data_callable(
+                self.loglik_missing_data, backend_tmp, params_is_reg, params_only
+            )
+
+            self.loglik_missing_data = missing_data_callable
+
+            self.loglik = assemble_callables(
+                self.loglik,
+                self.loglik_missing_data,
+                params_only,
+                has_deadline=self.deadline,
+            )
+
+        if self.missing_data:
+            _logger.info(
+                "Re-arranging data to separate missing and observed datapoints. "
+                "Missing data (rt == %s) will be on top, "
+                "observed datapoints follow.",
+                self.missing_data_value,
+            )
+
+        self.data = _rearrange_data(self.data)
+        return make_distribution(
+            rv=self.model_config.rv or self.model_name,
+            loglik=self.loglik,
+            list_params=self.list_params,
+            bounds=self.bounds,
+            lapse=self.lapse,
+            extra_fields=(
+                None
+                if not self.extra_fields
+                else [deepcopy(self.data[field].values) for field in self.extra_fields]
+            ),
+        )
+
+    def _get_deterministic_var_names(self, idata) -> list[str]:
+        """Filter out the deterministic variables in var_names."""
+        var_names = [
+            f"~{param_name}"
+            for param_name, param in self.params.items()
+            if (param.is_regression)
+        ]
+
+        if f"{self._parent}_mean" in idata["posterior"].data_vars:
+            var_names.append(f"~{self._parent}_mean")
+
+        # Parent parameters (always regression implicitly)
+        # which don't have a formula attached
+        # should be dropped from var_names, since the actual
+        # parent name shows up as a regression.
+        if f"{self._parent}" in idata["posterior"].data_vars:
+            if self.params[self._parent].formula is None:
+                # Drop from var_names
+                var_names = [var for var in var_names if var != f"~{self._parent}"]
+
+        return var_names
+
+    def _drop_parent_str_from_idata(
+        self, idata: az.InferenceData | None
+    ) -> az.InferenceData:
+        """Drop the parent_str variable from an InferenceData object.
+
+        Parameters
+        ----------
+        idata
+            The InferenceData object to be modified.
+
+        Returns
+        -------
+        xr.Dataset
+            The modified InferenceData object.
+        """
+        if idata is None:
+            raise ValueError("Please provide an InferenceData object.")
+        else:
+            for group in idata.groups():
+                if ("rt,response_mean" in idata[group].data_vars) and (
+                    self._parent not in idata[group].data_vars
+                ):
+                    setattr(
+                        idata,
+                        group,
+                        idata[group].rename({"rt,response_mean": self._parent}),
+                    )
+            return idata
+
+    def _postprocess_initvals_deterministic(
+        self, initval_settings: dict = INITVAL_SETTINGS
+    ) -> None:
+        """Set initial values for subset of parameters."""
+        self._initvals = self.initial_point()
+        # Consider case where link functions are set to 'log_logit'
+        # or 'None'
+        if self.link_settings not in ["log_logit", None]:
+            _logger.info(
+                "Not preprocessing initial values, "
+                + "because none of the two standard link settings are chosen!"
+            )
+            return None
+
+        # Set initial values for particular parameters
+        for name_, starting_value in self.pymc_model.initial_point().items():
+            # strip name of `_log__` and `_interval__` suffixes
+            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
+
+            # We need to check if the parameter is actually backed by
+            # a regression.
+
+            # If not, we don't actually apply a link function to it as per default.
+            # Therefore we need to apply the initial value strategy corresponding
+            # to 'None' link function.
+
+            # If the user actively supplies a link function, the user
+            # should also have supplied an initial value insofar it matters.
+
+            if self.params[self._get_prefix(name_tmp)].is_regression:
+                param_link_setting = self.link_settings
+            else:
+                param_link_setting = None
+            if name_tmp in initval_settings[param_link_setting].keys():
+                if self._check_if_initval_user_supplied(name_tmp):
+                    _logger.info(
+                        "User supplied initial value detected for %s, \n"
+                        " skipping overwrite with default value.",
+                        name_tmp,
+                    )
+                    continue
+
+                # Apply specific settings from initval_settings dictionary
+                dtype = self._initvals[name_tmp].dtype
+                self._initvals[name_tmp] = np.array(
+                    initval_settings[param_link_setting][name_tmp]
+                ).astype(dtype)
+
+    def _get_prefix(self, name_str: str) -> str:
+        """Get parameters wise link setting function from parameter prefix."""
+        # `p_outlier` is the only basic parameter floating around that has
+        # an underscore in it's name.
+        # We need to handle it separately. (Renaming might be better...)
+        if "_" in name_str:
+            if "p_outlier" not in name_str:
+                name_str_prefix = name_str.split("_")[0]
+            else:
+                name_str_prefix = "p_outlier"
+        else:
+            name_str_prefix = name_str
+        return name_str_prefix
+
+    def _check_if_initval_user_supplied(
+        self,
+        name_str: str,
+        return_value: bool = False,
+    ) -> bool | float | int | np.ndarray | dict[str, Any] | None:
+        """Check if initial value is user-supplied."""
+        # The function assumes that the name_str is either raw parameter name
+        # or `paramname_Intercept`, because we only really provide special default
+        # initial values for those types of parameters
+
+        # `p_outlier` is the only basic parameter floating around that has
+        # an underscore in it's name.
+        # We need to handle it separately. (Renaming might be better...)
+        if "_" in name_str:
+            if "p_outlier" not in name_str:
+                name_str_prefix = name_str.split("_")[0]
+                # name_str_suffix = "".join(name_str.split("_")[1:])
+                name_str_suffix = name_str[len(name_str_prefix + "_") :]
+            else:
+                name_str_prefix = "p_outlier"
+                if name_str == "p_outlier":
+                    name_str_suffix = ""
+                else:
+                    # name_str_suffix = "".join(name_str.split("_")[2:])
+                    name_str_suffix = name_str[len("p_outlier_") :]
+        else:
+            name_str_prefix = name_str
+            name_str_suffix = ""
+
+        tmp_param = name_str_prefix
+        if tmp_param == self._parent:
+            # If the parameter was parent it is automatically treated as a
+            # regression.
+            if not name_str_suffix:
+                # No suffix --> Intercept
+                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
+                    args_tmp = getattr(prior_tmp["Intercept"], "args")
+                    if return_value:
+                        return args_tmp.get("initval", None)
+                    else:
+                        return "initval" in args_tmp
+                else:
+                    if return_value:
+                        return None
+                    return False
+            else:
+                # If the parameter has a suffix --> use it
+                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
+                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
+                    if return_value:
+                        return args_tmp.get("initval", None)
+                    else:
+                        return "initval" in args_tmp
+                else:
+                    if return_value:
+                        return None
+                    else:
+                        return False
+        else:
+            # If the parameter is not a parent, it is treated as a regression
+            # only when actively specified as such.
+            if not name_str_suffix:
+                # If no suffix --> treat as basic parameter.
+                if isinstance(self.params[tmp_param].prior, float) or isinstance(
+                    self.params[tmp_param].prior, np.ndarray
+                ):
+                    if return_value:
+                        return self.params[tmp_param].prior
+                    else:
+                        return True
+                elif isinstance(self.params[tmp_param].prior, bmb.Prior):
+                    args_tmp = getattr(self.params[tmp_param].prior, "args")
+                    if "initval" in args_tmp:
+                        if return_value:
+                            return args_tmp["initval"]
+                        else:
+                            return True
+                    else:
+                        if return_value:
+                            return None
+                        else:
+                            return False
+                else:
+                    if return_value:
+                        return None
+                    else:
+                        return False
+            else:
+                # If suffix --> treat as regression and use suffix
+                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
+                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
+                    if return_value:
+                        return args_tmp.get("initval", None)
+                    else:
+                        return "initval" in args_tmp
+                else:
+                    if return_value:
+                        return None
+                    else:
+                        return False
+
+    def _jitter_initvals(
+        self, jitter_epsilon: float = 0.01, vector_only: bool = False
+    ) -> None:
+        """Apply controlled jitter to initial values."""
+        if vector_only:
+            self.__jitter_initvals_vector_only(jitter_epsilon)
+        else:
+            self.__jitter_initvals_all(jitter_epsilon)
+
+    def __jitter_initvals_vector_only(self, jitter_epsilon: float) -> None:
+        # Note: Calling our initial point function here
+        # --> operate on untransformed variables
+        initial_point_dict = self.initvals
+        for name_, starting_value in initial_point_dict.items():
+            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
+            if starting_value.ndim != 0 and starting_value.shape[0] != 1:
+                starting_value_tmp = starting_value + np.random.uniform(
+                    -jitter_epsilon, jitter_epsilon, starting_value.shape
+                ).astype(np.float32)
+
+                # Note: self._initvals shouldn't be None when this is called
+                dtype = self._initvals[name_tmp].dtype
+                self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)
+
+    def __jitter_initvals_all(self, jitter_epsilon: float) -> None:
+        # Note: Calling our initial point function here
+        # --> operate on untransformed variables
+        initial_point_dict = self.initvals
+        # initial_point_dict = self.pymc_model.initial_point()
+        for name_, starting_value in initial_point_dict.items():
+            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
+            starting_value_tmp = starting_value + np.random.uniform(
+                -jitter_epsilon, jitter_epsilon, starting_value.shape
+            ).astype(np.float32)
+
+            dtype = self.initvals[name_tmp].dtype
+            self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)

From f1a6135391bd39491f114adaefe85a55d0d6cd43 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 10:37:34 -0500
Subject: [PATCH 002/104] Extract HSSM base class to hssmbase.py with
 refactorings and add tests

---
 src/hssm/{hssmbase_temp.py => hssmbase.py} |   0
 tests/test_hssmbase.py                     | 364 +++++++++++++++++++++
 2 files changed, 364 insertions(+)
 rename src/hssm/{hssmbase_temp.py => hssmbase.py} (100%)
 create mode 100644 tests/test_hssmbase.py

diff --git a/src/hssm/hssmbase_temp.py b/src/hssm/hssmbase.py
similarity index 100%
rename from src/hssm/hssmbase_temp.py
rename to src/hssm/hssmbase.py
diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
new file mode 100644
index 000000000..db9e0ee76
--- /dev/null
+++ b/tests/test_hssmbase.py
@@ -0,0 +1,364 @@
+import bambi as bmb
+import numpy as np
+import pytest
+
+import hssm
+from hssm.hssmbase import HSSM
+from hssm.likelihoods import DDM, logp_ddm
+from copy import deepcopy
+
+hssm.set_floatX("float32", update_jax=True)
+
+param_v = {
+    "name": "v",
+    "prior": {
+        "Intercept": {"name": "Uniform", "lower": -3.0, "upper": 3.0},
+        "x": {"name": "Uniform", "lower": -0.50, "upper": 0.50},
+        "y": {"name": "Uniform", "lower": -0.50, "upper": 0.50},
+    },
+    "formula": "v ~ 1 + x + y",
+}
+
+param_a = param_v | dict(name="a", formula="a ~ 1 + x + y")
+
+
+@pytest.mark.slow
+@pytest.mark.parametrize(
+    "include, should_raise_exception",
+    [
+        (
+            [param_v],
+            False,
+        ),
+        (
+            [
+                param_v,
+                param_a,
+            ],
+            False,
+        ),
+        (
+            [{"name": "invalid_param", "prior": "invalid_param"}],
+            True,
+        ),
+        (
+            [
+                {
+                    "name": "v",
+                    "prior": {
+                        "Intercept": {"name": "Uniform", "lower": -3.0, "upper": 3.0}
+                    },
+                    "formula": "v ~ 1",
+                    "invalid_key": "identity",
+                }
+            ],
+            True,
+        ),
+        (
+            [
+                {
+                    "name": "v",
+                    "prior": {
+                        "Intercept": {"name": "Uniform", "lower": -3.0, "upper": 3.0}
+                    },
+                    "formula": "invalid_formula",
+                }
+            ],
+            True,
+        ),
+    ],
+)
+def test_transform_params_general(data_ddm_reg, include, should_raise_exception):
+    if should_raise_exception:
+        with pytest.raises(Exception):
+            HSSM(data=data_ddm_reg, include=include)
+    else:
+        model = HSSM(data=data_ddm_reg, include=include)
+        # Check model properties using a loop
+        param_names = ["v", "a", "z", "t", "p_outlier"]
+        model_param_names = list(model.params.keys())
+        assert model_param_names == param_names
+        assert len(model.params) == 5
+
+
+@pytest.mark.slow
+def test_custom_model(data_ddm):
+    with pytest.raises(
+        ValueError, match="When using a custom model, please provide a `loglik_kind.`"
+    ):
+        model = HSSM(data=data_ddm, model="custom")
+
+    with pytest.raises(
+        ValueError, match="Please provide `list_params` via `model_config`."
+    ):
+        model = HSSM(data=data_ddm, model="custom", loglik_kind="analytical")
+
+    with pytest.raises(
+        ValueError, match="Please provide `list_params` via `model_config`."
+    ):
+        model = HSSM(
+            data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical"
+        )
+
+    with pytest.raises(
+        ValueError,
+        match="Please provide `list_params` via `model_config`.",
+    ):
+        model = HSSM(
+            data=data_ddm,
+            model="custom",
+            loglik=DDM,
+            loglik_kind="analytical",
+            model_config={},
+        )
+
+    model = HSSM(
+        data=data_ddm,
+        model="custom",
+        model_config={
+            "list_params": ["v", "a", "z", "t"],
+            "choices": [-1, 1],
+            "bounds": {
+                "v": (-3.0, 3.0),
+                "a": (0.3, 2.5),
+                "z": (0.1, 0.9),
+                "t": (0.0, 2.0),
+            },
+        },
+        loglik=logp_ddm,
+        loglik_kind="analytical",
+    )
+
+    assert model.model_name == "custom"
+    assert model.loglik_kind == "analytical"
+    assert model.list_params == ["v", "a", "z", "t", "p_outlier"]
+
+
+@pytest.mark.slow
+def test_model_definition_outside_include(data_ddm):
+    model_with_one_param_fixed = HSSM(data_ddm, a=0.5)
+
+    assert "a" in model_with_one_param_fixed.params
+    assert model_with_one_param_fixed.params["a"].prior == 0.5
+
+    model_with_one_param = HSSM(
+        data_ddm, a={"prior": {"name": "Normal", "mu": 0.5, "sigma": 0.1}}
+    )
+
+    assert "a" in model_with_one_param.params
+    assert model_with_one_param.params["a"].prior.name == "Normal"
+
+    with pytest.raises(
+        ValueError, match="Parameter `a` specified in both `include` and `kwargs`."
+    ):
+        HSSM(data_ddm, include=[{"name": "a", "prior": 0.5}], a=0.5)
+
+
+@pytest.mark.slow
+def test_sample_prior_predictive(data_ddm_reg):
+    data_ddm_reg = data_ddm_reg.iloc[:10, :]
+
+    model_no_regression = HSSM(data=data_ddm_reg)
+    rng = np.random.default_rng()
+
+    prior_predictive_1 = model_no_regression.sample_prior_predictive(draws=10)
+    prior_predictive_2 = model_no_regression.sample_prior_predictive(
+        draws=10, random_seed=rng
+    )
+
+    model_regression = HSSM(
+        data=data_ddm_reg, include=[dict(name="v", formula="v ~ 1 + x")]
+    )
+    prior_predictive_3 = model_regression.sample_prior_predictive(draws=10)
+
+    model_regression_a = HSSM(
+        data=data_ddm_reg, include=[dict(name="a", formula="a ~ 1 + x")]
+    )
+    prior_predictive_4 = model_regression_a.sample_prior_predictive(draws=10)
+
+    model_regression_multi = HSSM(
+        data=data_ddm_reg,
+        include=[
+            dict(name="v", formula="v ~ 1 + x"),
+            dict(name="a", formula="a ~ 1 + y"),
+        ],
+    )
+    prior_predictive_5 = model_regression_multi.sample_prior_predictive(draws=10)
+
+    data_ddm_reg.loc[:, "subject_id"] = np.arange(10)
+
+    model_regression_random_effect = HSSM(
+        data=data_ddm_reg,
+        include=[
+            dict(name="v", formula="v ~ (1|subject_id) + x"),
+            dict(name="a", formula="a ~ (1|subject_id) + y"),
+        ],
+    )
+    prior_predictive_6 = model_regression_random_effect.sample_prior_predictive(
+        draws=10
+    )
+
+
+@pytest.mark.slow
+def test_override_default_link(caplog, data_ddm_reg):
+    param_v = {
+        "name": "v",
+        "prior": {
+            "Intercept": {"name": "Uniform", "lower": -3.0, "upper": 3.0},
+            "x": {"name": "Uniform", "lower": -0.50, "upper": 0.50},
+            "y": {"name": "Uniform", "lower": -0.50, "upper": 0.50},
+        },
+        "formula": "v ~ 1 + x + y",
+    }
+    param_v = param_v | dict(bounds=(-np.inf, np.inf))
+    param_a = param_v | dict(name="a", formula="a ~ 1 + x + y", bounds=(0, np.inf))
+    param_z = param_v | dict(name="z", formula="z ~ 1 + x + y", bounds=(0, 1))
+    param_t = param_v | dict(name="t", formula="t ~ 1 + x + y", bounds=(0.1, np.inf))
+
+    model = HSSM(
+        data=data_ddm_reg,
+        include=[param_v, param_a, param_z, param_t],
+        link_settings="log_logit",
+    )
+
+    assert model.params["v"].link == "identity"
+    assert model.params["a"].link == "log"
+    assert model.params["z"].link.name == "gen_logit"
+    assert model.params["t"].link == "identity"
+
+    assert "t" in caplog.records[0].message
+    assert "strange" in caplog.records[0].message
+
+
+@pytest.mark.slow
+def test_resampling(data_ddm):
+    model = HSSM(data=data_ddm)
+    sample_1 = model.sample(draws=10, chains=1, tune=0)
+    assert sample_1 is model.traces
+
+    sample_2 = model.sample(draws=10, chains=1, tune=0)
+    assert sample_2 is model.traces
+
+    assert sample_1 is not sample_2
+
+
+@pytest.mark.slow
+def test_add_likelihood_parameters_to_data(data_ddm):
+    """Test if the likelihood parameters are added to the InferenceData object."""
+    model = HSSM(data=data_ddm)
+    sample_1 = model.sample(draws=10, chains=1, tune=10)
+    sample_1_copy = deepcopy(sample_1)
+    model.add_likelihood_parameters_to_idata(inplace=True)
+
+    # Get distributional components (make sure to take the right aliases)
+    distributional_component_names = [
+        key_ if key_ not in model._aliases else model._aliases[key_]
+        for key_ in model.model.distributional_components.keys()
+    ]
+
+    # Check that after computing the likelihood parameters
+    # all respective parameters appear in the InferenceData object
+    assert np.all(
+        [
+            component_ in model.traces.posterior.data_vars
+            for component_ in distributional_component_names
+        ]
+    )
+
+    # Check that before computing the likelihood parameters
+    # at least one parameter is missing (in the simplest case
+    # this is the {parent}_mean parameter if nothing received a regression)
+
+    assert not np.all(
+        [
+            component_ in sample_1_copy.posterior.data_vars
+            for component_ in distributional_component_names
+        ]
+    )
+
+
+# Setting any parameter to a fixed value should work:
+@pytest.mark.slow
+def test_model_creation_constant_parameter(data_ddm):
+    for param_name in ["v", "a", "z", "t"]:
+        model = HSSM(data=data_ddm, **{param_name: 1.0})
+        assert model._parent != param_name
+        assert model.params[param_name].prior == 1.0
+
+
+# Setting any single parameter to a regression should respect the default bounds:
+@pytest.mark.slow
+@pytest.mark.parametrize(
+    "param_name, dist_name",
+    [("v", "Normal"), ("a", "Gamma"), ("z", "Beta"), ("t", "Gamma")],
+)
+def test_model_creation_single_regression(data_ddm_reg, param_name, dist_name):
+    model = HSSM(
+        data=data_ddm_reg,
+        include=[{"name": param_name, "formula": f"{param_name} ~ 1 + x"}],
+    )
+    assert model.params[param_name].prior["Intercept"].name == dist_name
+    assert model.params[param_name].prior["x"].name == "Normal"
+
+
+# Setting all parameters to fixed values should throw an error:
+def test_model_creation_all_parameters_constant(data_ddm):
+    with pytest.raises(ValueError):
+        HSSM(data=data_ddm, v=1.0, a=1.0, z=1.0, t=1.0)
+
+
+# Prior settings
+@pytest.mark.slow
+def test_prior_settings_basic(cavanagh_test):
+    model_1 = HSSM(
+        data=cavanagh_test,
+        global_formula="y ~ 1 + (1|participant_id)",
+        prior_settings=None,
+    )
+
+    assert model_1.params["v"].prior is None, (
+        "Default prior doesn't yield Nonetype for 'v'!"
+    )
+
+    model_2 = HSSM(
+        data=cavanagh_test,
+        global_formula="y ~ 1 + (1|participant_id)",
+        prior_settings="safe",
+    )
+
+    assert isinstance(model_2.params[model_2._parent].prior, dict), (
+        "Prior assigned to parent is not a dict!"
+    )
+
+
+@pytest.mark.slow
+def test_compile_logp(cavanagh_test):
+    model_1 = HSSM(
+        data=cavanagh_test,
+        global_formula="y ~ 1 + (1|participant_id)",
+        prior_settings=None,
+    )
+
+    out = model_1.compile_logp(model_1.initial_point(transformed=False))
+    assert out is not None
+
+
+@pytest.mark.slow
+def test_sample_do(data_ddm):
+    model = HSSM(data=data_ddm)
+    sample_do = model.sample_do(params={"v": 1.0}, draws=10)
+    assert sample_do is not None
+    assert "v_mean" in sample_do.prior.data_vars
+    assert set(sample_do.prior_predictive.dims) == {
+        "chain",
+        "draw",
+        "__obs__",
+        "rt,response_dim",
+    }
+    assert set(sample_do.prior_predictive.coords) == {
+        "chain",
+        "draw",
+        "__obs__",
+        "rt,response_dim",
+    }
+    assert np.unique(sample_do.prior["v_mean"].values) == [1.0]

From 61ed5181451603022c8cc5f2eeb647b142dbf2d2 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 10:38:07 -0500
Subject: [PATCH 003/104] refactor: extract init args logic to _get_init_args
 static method

---
 src/hssm/hssmbase.py | 33 +++++++++++++++++++++++++++------
 1 file changed, 27 insertions(+), 6 deletions(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index 5906c6eac..05e919ad2 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -300,13 +300,9 @@ def __init__(
         # so that we can easily define some
         # methods that need to access these
         # arguments (context: pickling / save - load).
-
+        # assert False, "Temporary prevent instantiation of HSSM class."
         # Define a dict with all call arguments:
-        self._init_args = {
-            k: v for k, v in locals().items() if k not in ["self", "kwargs"]
-        }
-        if kwargs:
-            self._init_args.update(kwargs)
+        self._init_args = self._get_init_args(locals(), kwargs)
 
         self.data = data.copy()
         self._inference_obj: az.InferenceData | None = None
@@ -543,6 +539,31 @@ def __init__(
         )
         _logger.info("Model initialized successfully.")
 
+    @staticmethod
+    def _get_init_args(
+        locals_dict: dict[str, Any], kwargs: dict[str, Any]
+    ) -> dict[str, Any]:
+        """Extract initialization arguments from locals and kwargs.
+
+        Parameters
+        ----------
+        locals_dict : dict[str, Any]
+            The locals() dictionary from __init__.
+        kwargs : dict[str, Any]
+            Additional keyword arguments passed to __init__.
+
+        Returns
+        -------
+        dict[str, Any]
+            A dictionary containing all initialization arguments, excluding 'self'.
+        """
+        init_args = {
+            k: v for k, v in locals_dict.items() if k not in ["self", "kwargs"]
+        }
+        if kwargs:
+            init_args.update(kwargs)
+        return init_args
+
     @classproperty
     def supported_models(cls) -> tuple[SupportedModels, ...]:
         """Get a tuple of all supported models.

From 1d017b596ae863d77c4d51559b6896a54a4e12db Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 10:59:04 -0500
Subject: [PATCH 004/104] refactor: reorganize initialization of input data and
 configuration in HSSM class

---
 src/hssm/hssmbase.py | 20 ++++++++++++--------
 1 file changed, 12 insertions(+), 8 deletions(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index 05e919ad2..77f304595 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -304,25 +304,29 @@ def __init__(
         # Define a dict with all call arguments:
         self._init_args = self._get_init_args(locals(), kwargs)
 
+        # ===== Input Data & Configuration =====
         self.data = data.copy()
-        self._inference_obj: az.InferenceData | None = None
-        self._initvals: dict[str, Any] = {}
-        self.initval_jitter = initval_jitter
-        self._inference_obj_vi: pm.Approximation | None = None
-        self._vi_approx = None
-        self._map_dict = None
         self.global_formula = global_formula
-
         self.link_settings = link_settings
         self.prior_settings = prior_settings
-
         self.missing_data_value = -999.0
 
+        # Set up additional namespace for formula evaluation
         additional_namespace = transformations_namespace.copy()
         if extra_namespace is not None:
             additional_namespace.update(extra_namespace)
         self.additional_namespace = additional_namespace
 
+        # ===== Inference Results (initialized to None/empty) =====
+        self._inference_obj: az.InferenceData | None = None
+        self._inference_obj_vi: pm.Approximation | None = None
+        self._vi_approx = None
+        self._map_dict = None
+
+        # ===== Initial Values Configuration =====
+        self._initvals: dict[str, Any] = {}
+        self.initval_jitter = initval_jitter
+
         # Construct a model_config from defaults
         self.model_config = Config.from_defaults(model, loglik_kind)
         # Update defaults with user-provided config, if any

From 78ea09629112ec47a87a120a48f44f0a77c2eb3f Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 11:08:24 -0500
Subject: [PATCH 005/104] refactor: enhance comment clarity for model_config
 construction in HSSM class

---
 src/hssm/hssmbase.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index 77f304595..d6219883a 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -327,7 +327,7 @@ def __init__(
         self._initvals: dict[str, Any] = {}
         self.initval_jitter = initval_jitter
 
-        # Construct a model_config from defaults
+        # ===== Construct a model_config from defaults and user inputs =====
         self.model_config = Config.from_defaults(model, loglik_kind)
         # Update defaults with user-provided config, if any
         if model_config is not None:

From 7d8609e77e5c32fc1ba8fb1bdbf68b167f26cd8d Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 11:35:25 -0500
Subject: [PATCH 006/104] refactor: improve handling of user-provided
 model_config and choices in HSSM class

---
 src/hssm/hssmbase.py | 77 ++++++++++++++++++++++----------------------
 1 file changed, 38 insertions(+), 39 deletions(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index d6219883a..4944091b8 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -329,43 +329,52 @@ def __init__(
 
         # ===== Construct a model_config from defaults and user inputs =====
         self.model_config = Config.from_defaults(model, loglik_kind)
-        # Update defaults with user-provided config, if any
+
+        # Handle user-provided model_config
         if model_config is not None:
-            if isinstance(model_config, dict):
-                if "choices" not in model_config:
-                    if choices is not None:
-                        model_config["choices"] = choices
+            # Check if choices already exists in the provided config
+            has_choices = (
+                isinstance(model_config, dict)
+                and "choices" in model_config
+                or isinstance(model_config, ModelConfig)
+                and model_config.choices is not None
+            )
+
+            # Handle choices conflict or missing choices
+            if choices is not None:
+                if has_choices:
+                    _logger.info(
+                        "choices list provided in both model_config and "
+                        "as an argument directly."
+                        " Using the one provided in model_config. \n"
+                        "We recommend providing choices in model_config."
+                    )
                 else:
-                    if choices is not None:
-                        _logger.info(
-                            "choices list provided in both model_config and "
-                            "as an argument directly."
-                            " Using the one provided in model_config. \n"
-                            "We recommend providing choices in model_config."
-                        )
-            elif isinstance(model_config, ModelConfig):
-                if model_config.choices is None:
-                    if choices is not None:
+                    # Add choices to the provided config
+                    if isinstance(model_config, dict):
+                        model_config["choices"] = choices
+                    else:  # ModelConfig instance
                         model_config.choices = choices
-                else:
-                    if choices is not None:
-                        _logger.info(
-                            "choices list provided in both model_config and "
-                            "as an argument directly."
-                            " Using the one provided in model_config. \n"
-                            "We recommend providing choices in model_config."
-                        )
 
-            self.model_config.update_config(
+            # Convert dict to ModelConfig if needed and update
+            final_config = (
                 model_config
                 if isinstance(model_config, ModelConfig)
-                else ModelConfig(**model_config)  # also serves as dict validation
+                else ModelConfig(**model_config)
             )
+            self.model_config.update_config(final_config)
+
+        # Handle default config (no model_config provided)
         else:
-            # Model config is not provided, but at this point was constructed from
-            # defaults.
-            if model not in typing.get_args(SupportedModels):
-                # TODO: ideally use self.supported_models above but mypy doesn't like it
+            # For supported models, defaults already have choices
+            if model in typing.get_args(SupportedModels):
+                if choices is not None:
+                    _logger.info(
+                        "Model string is in SupportedModels."
+                        " Ignoring choices arguments."
+                    )
+            # For custom models, try to get choices
+            else:
                 if choices is not None:
                     self.model_config.update_choices(choices)
                 elif model in ssms_model_config:
@@ -379,16 +388,6 @@ def __init__(
                         model,
                         ssms_model_config[model]["choices"],
                     )
-            else:
-                # Model config already constructed from defaults, and model string is
-                # in SupportedModels. So we are guaranteed that choices are in
-                # self.model_config already.
-
-                if choices is not None:
-                    _logger.info(
-                        "Model string is in SupportedModels."
-                        " Ignoring choices arguments."
-                    )
 
         # Update loglik with user-provided value
         self.model_config.update_loglik(loglik)

From d0e39f79b2e213fa7e1f4f358c3ff6317b22bf75 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 11:54:25 -0500
Subject: [PATCH 007/104] refactor: implement model_config construction in a
 dedicated method

---
 src/hssm/hssmbase.py | 157 ++++++++++++++++++++++++++-----------------
 1 file changed, 97 insertions(+), 60 deletions(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index 4944091b8..b5fdeb4e1 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -328,66 +328,9 @@ def __init__(
         self.initval_jitter = initval_jitter
 
         # ===== Construct a model_config from defaults and user inputs =====
-        self.model_config = Config.from_defaults(model, loglik_kind)
-
-        # Handle user-provided model_config
-        if model_config is not None:
-            # Check if choices already exists in the provided config
-            has_choices = (
-                isinstance(model_config, dict)
-                and "choices" in model_config
-                or isinstance(model_config, ModelConfig)
-                and model_config.choices is not None
-            )
-
-            # Handle choices conflict or missing choices
-            if choices is not None:
-                if has_choices:
-                    _logger.info(
-                        "choices list provided in both model_config and "
-                        "as an argument directly."
-                        " Using the one provided in model_config. \n"
-                        "We recommend providing choices in model_config."
-                    )
-                else:
-                    # Add choices to the provided config
-                    if isinstance(model_config, dict):
-                        model_config["choices"] = choices
-                    else:  # ModelConfig instance
-                        model_config.choices = choices
-
-            # Convert dict to ModelConfig if needed and update
-            final_config = (
-                model_config
-                if isinstance(model_config, ModelConfig)
-                else ModelConfig(**model_config)
-            )
-            self.model_config.update_config(final_config)
-
-        # Handle default config (no model_config provided)
-        else:
-            # For supported models, defaults already have choices
-            if model in typing.get_args(SupportedModels):
-                if choices is not None:
-                    _logger.info(
-                        "Model string is in SupportedModels."
-                        " Ignoring choices arguments."
-                    )
-            # For custom models, try to get choices
-            else:
-                if choices is not None:
-                    self.model_config.update_choices(choices)
-                elif model in ssms_model_config:
-                    self.model_config.update_choices(
-                        ssms_model_config[model]["choices"]
-                    )
-                    _logger.info(
-                        "choices argument passed as None, "
-                        "but found %s in ssms-simulators. "
-                        "Using choices, from ssm-simulators configs: %s",
-                        model,
-                        ssms_model_config[model]["choices"],
-                    )
+        self.model_config = self._build_model_config(
+            model, loglik_kind, model_config, choices
+        )
 
         # Update loglik with user-provided value
         self.model_config.update_loglik(loglik)
@@ -567,6 +510,100 @@ def _get_init_args(
             init_args.update(kwargs)
         return init_args
 
+    @staticmethod
+    def _build_model_config(
+        model: SupportedModels | str,
+        loglik_kind: LoglikKind | None,
+        model_config: ModelConfig | dict | None,
+        choices: list[int] | None,
+    ) -> ModelConfig:
+        """Build a ModelConfig object from defaults and user inputs.
+
+        Parameters
+        ----------
+        model : SupportedModels | str
+            The model name.
+        loglik_kind : LoglikKind | None
+            The kind of likelihood function.
+        model_config : ModelConfig | dict | None
+            User-provided model configuration.
+        choices : list[int] | None
+            User-provided choices list.
+
+        Returns
+        -------
+        ModelConfig
+            A complete ModelConfig object with choices and other settings applied.
+        """
+        # Start with defaults
+        config = Config.from_defaults(model, loglik_kind)
+
+        # Handle user-provided model_config
+        if model_config is not None:
+            # Check if choices already exists in the provided config
+            has_choices = (
+                isinstance(model_config, dict)
+                and "choices" in model_config
+                or isinstance(model_config, ModelConfig)
+                and model_config.choices is not None
+            )
+
+            # Handle choices conflict or missing choices
+            if choices is not None:
+                if has_choices:
+                    _logger.info(
+                        "choices list provided in both model_config and "
+                        "as an argument directly."
+                        " Using the one provided in model_config. \n"
+                        "We recommend providing choices in model_config."
+                    )
+                else:
+                    # Add choices to a copy of the config to avoid mutating input
+                    if isinstance(model_config, dict):
+                        model_config = {**model_config, "choices": choices}
+                    else:  # ModelConfig instance
+                        # Create a dict from the ModelConfig and add choices
+                        model_config_dict = {
+                            k: getattr(model_config, k)
+                            for k in model_config.__dataclass_fields__
+                            if getattr(model_config, k) is not None
+                        }
+                        model_config_dict["choices"] = choices
+                        model_config = model_config_dict
+
+            # Convert dict to ModelConfig if needed and update
+            final_config = (
+                model_config
+                if isinstance(model_config, ModelConfig)
+                else ModelConfig(**model_config)
+            )
+            config.update_config(final_config)
+
+        # Handle default config (no model_config provided)
+        else:
+            # For supported models, defaults already have choices
+            if model in typing.get_args(SupportedModels):
+                if choices is not None:
+                    _logger.info(
+                        "Model string is in SupportedModels."
+                        " Ignoring choices arguments."
+                    )
+            # For custom models, try to get choices
+            else:
+                if choices is not None:
+                    config.update_choices(choices)
+                elif model in ssms_model_config:
+                    config.update_choices(ssms_model_config[model]["choices"])
+                    _logger.info(
+                        "choices argument passed as None, "
+                        "but found %s in ssms-simulators. "
+                        "Using choices, from ssm-simulators configs: %s",
+                        model,
+                        ssms_model_config[model]["choices"],
+                    )
+
+        return config
+
     @classproperty
     def supported_models(cls) -> tuple[SupportedModels, ...]:
         """Get a tuple of all supported models.

From a95a588af81ef2dbef6d4ff1833c412eac0b88bb Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 11:54:51 -0500
Subject: [PATCH 008/104] refactor: remove slow marker from multiple test
 functions in test_hssmbase

---
 tests/test_hssmbase.py | 12 ------------
 1 file changed, 12 deletions(-)

diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index db9e0ee76..64c03e553 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -22,7 +22,6 @@
 param_a = param_v | dict(name="a", formula="a ~ 1 + x + y")
 
 
-@pytest.mark.slow
 @pytest.mark.parametrize(
     "include, should_raise_exception",
     [
@@ -81,7 +80,6 @@ def test_transform_params_general(data_ddm_reg, include, should_raise_exception)
         assert len(model.params) == 5
 
 
-@pytest.mark.slow
 def test_custom_model(data_ddm):
     with pytest.raises(
         ValueError, match="When using a custom model, please provide a `loglik_kind.`"
@@ -134,7 +132,6 @@ def test_custom_model(data_ddm):
     assert model.list_params == ["v", "a", "z", "t", "p_outlier"]
 
 
-@pytest.mark.slow
 def test_model_definition_outside_include(data_ddm):
     model_with_one_param_fixed = HSSM(data_ddm, a=0.5)
 
@@ -154,7 +151,6 @@ def test_model_definition_outside_include(data_ddm):
         HSSM(data_ddm, include=[{"name": "a", "prior": 0.5}], a=0.5)
 
 
-@pytest.mark.slow
 def test_sample_prior_predictive(data_ddm_reg):
     data_ddm_reg = data_ddm_reg.iloc[:10, :]
 
@@ -199,7 +195,6 @@ def test_sample_prior_predictive(data_ddm_reg):
     )
 
 
-@pytest.mark.slow
 def test_override_default_link(caplog, data_ddm_reg):
     param_v = {
         "name": "v",
@@ -230,7 +225,6 @@ def test_override_default_link(caplog, data_ddm_reg):
     assert "strange" in caplog.records[0].message
 
 
-@pytest.mark.slow
 def test_resampling(data_ddm):
     model = HSSM(data=data_ddm)
     sample_1 = model.sample(draws=10, chains=1, tune=0)
@@ -242,7 +236,6 @@ def test_resampling(data_ddm):
     assert sample_1 is not sample_2
 
 
-@pytest.mark.slow
 def test_add_likelihood_parameters_to_data(data_ddm):
     """Test if the likelihood parameters are added to the InferenceData object."""
     model = HSSM(data=data_ddm)
@@ -278,7 +271,6 @@ def test_add_likelihood_parameters_to_data(data_ddm):
 
 
 # Setting any parameter to a fixed value should work:
-@pytest.mark.slow
 def test_model_creation_constant_parameter(data_ddm):
     for param_name in ["v", "a", "z", "t"]:
         model = HSSM(data=data_ddm, **{param_name: 1.0})
@@ -287,7 +279,6 @@ def test_model_creation_constant_parameter(data_ddm):
 
 
 # Setting any single parameter to a regression should respect the default bounds:
-@pytest.mark.slow
 @pytest.mark.parametrize(
     "param_name, dist_name",
     [("v", "Normal"), ("a", "Gamma"), ("z", "Beta"), ("t", "Gamma")],
@@ -308,7 +299,6 @@ def test_model_creation_all_parameters_constant(data_ddm):
 
 
 # Prior settings
-@pytest.mark.slow
 def test_prior_settings_basic(cavanagh_test):
     model_1 = HSSM(
         data=cavanagh_test,
@@ -331,7 +321,6 @@ def test_prior_settings_basic(cavanagh_test):
     )
 
 
-@pytest.mark.slow
 def test_compile_logp(cavanagh_test):
     model_1 = HSSM(
         data=cavanagh_test,
@@ -343,7 +332,6 @@ def test_compile_logp(cavanagh_test):
     assert out is not None
 
 
-@pytest.mark.slow
 def test_sample_do(data_ddm):
     model = HSSM(data=data_ddm)
     sample_do = model.sample_do(params={"v": 1.0}, draws=10)

From c2515cf1d775e0606c2c334c62fb92b6b78ca539 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 12:07:37 -0500
Subject: [PATCH 009/104] refactor: streamline model_config validation and
 enhance shortcut setup in HSSM class

---
 src/hssm/hssmbase.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index b5fdeb4e1..0a512cfb4 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -331,13 +331,10 @@ def __init__(
         self.model_config = self._build_model_config(
             model, loglik_kind, model_config, choices
         )
-
-        # Update loglik with user-provided value
         self.model_config.update_loglik(loglik)
-        # Ensure that all required fields are valid
         self.model_config.validate()
 
-        # Set up shortcuts so old code will work
+        # ===== Set up shortcuts so old code will work ======
         self.response = self.model_config.response
         self.list_params = self.model_config.list_params
         self.choices = self.model_config.choices

From 957ab34e81bb3295f4c884228dce4955c5122e80 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 12:59:33 -0500
Subject: [PATCH 010/104] refactor: enhance type annotation for model_config
 and add validation for list_params in HSSM class

---
 src/hssm/hssmbase.py | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index 0a512cfb4..94135371b 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -328,7 +328,7 @@ def __init__(
         self.initval_jitter = initval_jitter
 
         # ===== Construct a model_config from defaults and user inputs =====
-        self.model_config = self._build_model_config(
+        self.model_config: Config = self._build_model_config(
             model, loglik_kind, model_config, choices
         )
         self.model_config.update_loglik(loglik)
@@ -348,6 +348,12 @@ def __init__(
                 "`choices` must be provided either in `model_config` or as an argument."
             )
 
+        # Avoid mypy error later (None.append). Should list_params be Optional?
+        if self.list_params is None:
+            raise ValueError(
+                "`list_params` must be provided in the model configuration."
+            )
+
         self.n_choices = len(self.choices)
         self._pre_check_data_sanity()
 

From ab611e4f26209ace852d02298482bfe46e4533dc Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 13:41:46 -0500
Subject: [PATCH 011/104] refactor: replace DataValidator with
 DataValidatorMixin in HSSM and related tests

---
 src/hssm/data_validator.py   | 47 +++++++++++++++---------------------
 src/hssm/hssm.py             |  4 +--
 src/hssm/hssmbase.py         | 22 +++++++++++------
 tests/test_data_sanity.py    |  2 +-
 tests/test_data_validator.py | 34 +++++++++++++-------------
 5 files changed, 54 insertions(+), 55 deletions(-)

diff --git a/src/hssm/data_validator.py b/src/hssm/data_validator.py
index 85a8ed8d3..fe1e9f750 100644
--- a/src/hssm/data_validator.py
+++ b/src/hssm/data_validator.py
@@ -11,30 +11,20 @@
 _logger = logging.getLogger("hssm")
 
 
-class DataValidator:
-    """Class for validating and preprocessing behavioral data for HSSM models."""
-
-    def __init__(
-        self,
-        data,
-        response=["rt", "response"],
-        choices=[0, 1],
-        n_choices=2,
-        extra_fields=None,
-        deadline=False,
-        deadline_name="deadline",
-        missing_data=False,
-        missing_data_value=-999.0,
-    ):
-        self.data = data
-        self.response = response
-        self.choices = choices
-        self.n_choices = n_choices
-        self.extra_fields = extra_fields
-        self.deadline = deadline
-        self.deadline_name = deadline_name
-        self.missing_data = missing_data
-        self.missing_data_value = missing_data_value
+class DataValidatorMixin:
+    """Mixin class providing validation and preprocessing methods for HSSM behavioral models.
+
+    This class expects subclasses to define the following attributes:
+    - data: pd.DataFrame
+    - response: list[str]
+    - choices: list[int]
+    - n_choices: int
+    - extra_fields: list[str] | None
+    - deadline: bool
+    - deadline_name: str
+    - missing_data: bool
+    - missing_data_value: float
+    """
 
     @staticmethod
     def check_fields(a, b):
@@ -50,13 +40,13 @@ def _check_extra_fields(self, data: pd.DataFrame | None = None) -> bool:
 
         data = data if data is not None else self.data
 
-        DataValidator.check_fields(self.extra_fields, data.columns)
+        DataValidatorMixin.check_fields(self.extra_fields, data.columns)
 
         return True
 
     def _pre_check_data_sanity(self):
         """Check if the data is clean enough for the model."""
-        DataValidator.check_fields(self.response, self.data.columns)
+        DataValidatorMixin.check_fields(self.response, self.data.columns)
         self._check_extra_fields()
 
     def _post_check_data_sanity(self):
@@ -169,8 +159,9 @@ def _update_extra_fields(self, new_data: pd.DataFrame | None = None):
         if not new_data:
             new_data = self.data
 
-        # The attribute 'model_distribution' is not defined in DataValidator itself,
-        # but is expected to exist in subclasses (e.g., HSSM).
+        # The attribute 'model_distribution' is not defined in
+        # DataValidatorMixin itself, but is expected to exist in subclasses
+        # (e.g., HSSM).
         # The 'type: ignore[attr-defined]' comment tells mypy to ignore the missing
         # attribute error here and avoid moving this method to the HSSM class.
         self.model_distribution.extra_fields = [  # type: ignore[attr-defined]
diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 5906c6eac..0bb2d5b19 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -32,7 +32,7 @@
 from ssms.config import model_config as ssms_model_config
 
 from hssm._types import LoglikKind, SupportedModels
-from hssm.data_validator import DataValidator
+from hssm.data_validator import DataValidatorMixin
 from hssm.defaults import (
     INITVAL_JITTER_SETTINGS,
     INITVAL_SETTINGS,
@@ -97,7 +97,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSM(DataValidator):
+class HSSM(DataValidatorMixin):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters
diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index 94135371b..aa6476b06 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -32,7 +32,7 @@
 from ssms.config import model_config as ssms_model_config
 
 from hssm._types import LoglikKind, SupportedModels
-from hssm.data_validator import DataValidator
+from hssm.data_validator import DataValidatorMixin
 from hssm.defaults import (
     INITVAL_JITTER_SETTINGS,
     INITVAL_SETTINGS,
@@ -97,7 +97,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSM(DataValidator):
+class HSSM(DataValidatorMixin):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters
@@ -355,7 +355,6 @@ def __init__(
             )
 
         self.n_choices = len(self.choices)
-        self._pre_check_data_sanity()
 
         # Process missing data setting
         # AF-TODO: Could be a function in data validator?
@@ -413,7 +412,11 @@ def __init__(
         )
 
         if self.deadline:
-            self.response.append(self.deadline_name)
+            if self.response is not None:  # Avoid mypy error
+                self.response.append(self.deadline_name)
+
+        # Run pre-check data sanity validation now that all attributes are set
+        self._pre_check_data_sanity()
 
         # Process lapse distribution
         self.has_lapse = p_outlier is not None and p_outlier != 0
@@ -423,7 +426,7 @@ def __init__(
 
         # Process all parameters
         self.params = Params.from_user_specs(
-            model=self,
+            model=self,  # type: ignore[arg-type]
             include=[] if include is None else include,
             kwargs=kwargs,
             p_outlier=p_outlier,
@@ -432,7 +435,7 @@ def __init__(
         self._parent = self.params.parent
         self._parent_param = self.params.parent_param
 
-        self.formula, self.priors, self.link = self.params.parse_bambi(model=self)
+        self.formula, self.priors, self.link = self.params.parse_bambi(model=self)  # type: ignore[arg-type]
 
         # For parameters that have a regression backend, apply bounds at the likelihood
         # level to ensure that the samples that are out of bounds
@@ -519,7 +522,7 @@ def _build_model_config(
         loglik_kind: LoglikKind | None,
         model_config: ModelConfig | dict | None,
         choices: list[int] | None,
-    ) -> ModelConfig:
+    ) -> Config:
         """Build a ModelConfig object from defaults and user inputs.
 
         Parameters
@@ -2030,6 +2033,9 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
         if self.extra_fields is not None:
             params_is_reg += [True for _ in self.extra_fields]
 
+        # Assert that loglik is not None (mypy)
+        # avoiding extra indentation level
+        assert self.loglik is not None, "loglik should be set by model configuration"
         if self.loglik_kind == "approx_differentiable":
             if self.model_config.backend == "jax":
                 likelihood_callable = make_likelihood_callable(
@@ -2097,6 +2103,8 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
             )
 
         self.data = _rearrange_data(self.data)
+        # Assertion added for mypy type checking
+        assert self.list_params is not None, "list_params should have been validated"
         return make_distribution(
             rv=self.model_config.rv or self.model_name,
             loglik=self.loglik,
diff --git a/tests/test_data_sanity.py b/tests/test_data_sanity.py
index e45668ce7..a522ef91a 100644
--- a/tests/test_data_sanity.py
+++ b/tests/test_data_sanity.py
@@ -13,7 +13,7 @@ def cpn():
 
 pattern = r"Field\(s\) `.*` not found in data\."
 
-# The DataValidator class is tested in the test_data_validator.py file, so this file
+# The DataValidatorMixin is tested in the test_data_validator.py file, so this file
 # can probably be removed in the future. CP
 
 
diff --git a/tests/test_data_validator.py b/tests/test_data_validator.py
index f491f45c4..704885f22 100644
--- a/tests/test_data_validator.py
+++ b/tests/test_data_validator.py
@@ -4,7 +4,7 @@
 import pytest
 import pandas as pd
 import numpy as np
-from hssm.data_validator import DataValidator
+from hssm.data_validator import DataValidatorMixin
 from hssm.defaults import MissingDataNetwork
 
 
@@ -48,8 +48,8 @@ def base_data_nan_missing():
 
 def dv_instance(
     data_factory: Callable = _base_data, deadline: bool = True
-) -> DataValidator:
-    return DataValidator(
+) -> DataValidatorMixin:
+    return DataValidatorMixin(
         data=data_factory(),
         extra_fields=["extra"],
         deadline=deadline,
@@ -57,13 +57,13 @@ def dv_instance(
 
 
 def test_constructor(base_data):
-    dv = DataValidator(
+    dv = DataValidatorMixin(
         data=base_data,
         extra_fields=["extra"],
         deadline=True,
     )
 
-    assert isinstance(dv, DataValidator)
+    assert isinstance(dv, DataValidatorMixin)
     assert dv.data.equals(_base_data())
     assert dv.response == ["rt", "response"]
     assert dv.choices == [0, 1]
@@ -109,7 +109,7 @@ def test_post_check_data_sanity_valid(base_data):
     ):
         dv_instance_no_missing._post_check_data_sanity()
 
-    dv_instance_no_missing = DataValidator(
+    dv_instance_no_missing = DataValidatorMixin(
         data=base_data,
         deadline=False,
         missing_data=False,
@@ -133,7 +133,7 @@ def test_post_check_data_sanity_valid(base_data):
 def test_handle_missing_data_and_deadline_deadline_column_missing(base_data):
     # Should raise ValueError if deadline is True but deadline_name column is missing
     data = base_data.drop(columns=["deadline"])
-    dv = DataValidator(
+    dv = DataValidatorMixin(
         data=data,
         deadline=True,
     )
@@ -144,7 +144,7 @@ def test_handle_missing_data_and_deadline_deadline_column_missing(base_data):
 def test_handle_missing_data_and_deadline_deadline_applied(base_data):
     # Should set rt to -999.0 where rt >= deadline
     base_data.loc[0, "rt"] = 2.0  # Exceeds deadline
-    dv = DataValidator(
+    dv = DataValidatorMixin(
         data=base_data,
         deadline=True,
     )
@@ -154,7 +154,7 @@ def test_handle_missing_data_and_deadline_deadline_applied(base_data):
 
 
 def test_update_extra_fields(monkeypatch):
-    # Create a DataValidator with extra_fields
+    # Create a DataValidatorMixin with extra_fields
     data = pd.DataFrame(
         {
             "rt": [0.5, 0.7],
@@ -164,7 +164,7 @@ def test_update_extra_fields(monkeypatch):
             "extra2": [100, 200],
         }
     )
-    dv = DataValidator(
+    dv = DataValidatorMixin(
         data=data,
         extra_fields=["extra", "extra2"],
     )
@@ -189,24 +189,24 @@ def test_set_missing_data_and_deadline():
     # No missing data and no deadline
     data = pd.DataFrame({"rt": [0.5, 0.7]})
     assert (
-        DataValidator._set_missing_data_and_deadline(False, False, data)
+        DataValidatorMixin._set_missing_data_and_deadline(False, False, data)
         == MissingDataNetwork.NONE
     )
     # Missing data but no deadline
     data = pd.DataFrame({"rt": [0.5, -999.0]})
     assert (
-        DataValidator._set_missing_data_and_deadline(True, False, data)
+        DataValidatorMixin._set_missing_data_and_deadline(True, False, data)
         == MissingDataNetwork.CPN
     )
     assert (
-        DataValidator._set_missing_data_and_deadline(True, True, data)
+        DataValidatorMixin._set_missing_data_and_deadline(True, True, data)
         == MissingDataNetwork.OPN
     )
     # AF-TODO: I think GONOGO as a network category can go,
     # but needs a little more thought, out of scope for PR,
     # during which this was commented out.
     # assert (
-    #     DataValidator._set_missing_data_and_deadline(True, True, data)
+    #     DataValidatorMixin._set_missing_data_and_deadline(True, True, data)
     #     == MissingDataNetwork.GONOGO
     # )
 
@@ -219,7 +219,7 @@ def test_set_missing_data_and_deadline_all_missing():
         match="`missing_data` is set to True, but you have no valid data in your "
         "dataset.",
     ):
-        DataValidator._set_missing_data_and_deadline(True, False, data)
+        DataValidatorMixin._set_missing_data_and_deadline(True, False, data)
 
     # opn
     with pytest.raises(
@@ -227,7 +227,7 @@ def test_set_missing_data_and_deadline_all_missing():
         match="`missing_data` is set to True, but you have no valid data in your "
         "dataset.",
     ):
-        DataValidator._set_missing_data_and_deadline(True, True, data)
+        DataValidatorMixin._set_missing_data_and_deadline(True, True, data)
 
     # AF-TODO: GONOGO case not yet correctly implemented
     # gonogo
@@ -237,4 +237,4 @@ def test_set_missing_data_and_deadline_all_missing():
     #     match="`missing_data` is set to True, but you have no valid data in your "
     #     + "dataset.",
     # ):
-    #     DataValidator._set_missing_data_and_deadline(True, True, data)
+    #     DataValidatorMixin._set_missing_data_and_deadline(True, True, data)

From 0751046b1a48758b200f4a6a780f809dd48c87c0 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 13:44:48 -0500
Subject: [PATCH 012/104] refactor: remove unused import of bambi in
 test_hssmbase

---
 tests/test_hssmbase.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index 64c03e553..f70448288 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -1,4 +1,3 @@
-import bambi as bmb
 import numpy as np
 import pytest
 

From 11a4e4ed30a483ba4fd3ac4712715772d47ce1b0 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 13:46:07 -0500
Subject: [PATCH 013/104] refactor: remove unused import of typing and simplify
 SupportedModels check in HSSM class

---
 src/hssm/hssmbase.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index aa6476b06..80321097e 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -8,7 +8,6 @@
 
 import datetime
 import logging
-import typing
 from copy import deepcopy
 from inspect import isclass, signature
 from os import PathLike
@@ -588,7 +587,7 @@ def _build_model_config(
         # Handle default config (no model_config provided)
         else:
             # For supported models, defaults already have choices
-            if model in typing.get_args(SupportedModels):
+            if model in get_args(SupportedModels):
                 if choices is not None:
                     _logger.info(
                         "Model string is in SupportedModels."

From aa473205f3554c0574ef8a73148c791b7e5baf8f Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 13:53:10 -0500
Subject: [PATCH 014/104] refactor: simplify sample_prior_predictive calls in
 test_sample_prior_predictive

---
 tests/test_hssmbase.py | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index f70448288..49713d283 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -156,10 +156,8 @@ def test_sample_prior_predictive(data_ddm_reg):
     model_no_regression = HSSM(data=data_ddm_reg)
     rng = np.random.default_rng()
 
-    prior_predictive_1 = model_no_regression.sample_prior_predictive(draws=10)
-    prior_predictive_2 = model_no_regression.sample_prior_predictive(
-        draws=10, random_seed=rng
-    )
+    model_no_regression.sample_prior_predictive(draws=10)
+    model_no_regression.sample_prior_predictive(draws=10, random_seed=rng)
 
     model_regression = HSSM(
         data=data_ddm_reg, include=[dict(name="v", formula="v ~ 1 + x")]

From ded9439465f13e5fcb3fad1ea89765561f286776 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 13:53:56 -0500
Subject: [PATCH 015/104] refactor: correct typo in comments regarding
 inconsistent dimensions and coordinates

---
 src/hssm/hssm.py     | 4 ++--
 src/hssm/hssmbase.py | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 0bb2d5b19..704319fe3 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -1186,7 +1186,7 @@ def sample_do(
         # clean up `rt,response_mean` to `v`
         do_idata = self._drop_parent_str_from_idata(idata=do_idata)
 
-        # rename otherwise inconsistentdims and coords
+        # rename otherwise inconsistent dims and coords
         if "rt,response_extra_dim_0" in do_idata["prior_predictive"].dims:
             setattr(
                 do_idata,
@@ -1259,7 +1259,7 @@ def sample_prior_predictive(
         # clean up `rt,response_mean` to `v`
         idata = self._drop_parent_str_from_idata(idata=self._inference_obj)
 
-        # rename otherwise inconsistentdims and coords
+        # rename otherwise inconsistent dims and coords
         if "rt,response_extra_dim_0" in idata["prior_predictive"].dims:
             setattr(
                 idata,
diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index 80321097e..53b0debee 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -1252,7 +1252,7 @@ def sample_do(
         # clean up `rt,response_mean` to `v`
         do_idata = self._drop_parent_str_from_idata(idata=do_idata)
 
-        # rename otherwise inconsistentdims and coords
+        # rename otherwise inconsistent dims and coords
         if "rt,response_extra_dim_0" in do_idata["prior_predictive"].dims:
             setattr(
                 do_idata,
@@ -1325,7 +1325,7 @@ def sample_prior_predictive(
         # clean up `rt,response_mean` to `v`
         idata = self._drop_parent_str_from_idata(idata=self._inference_obj)
 
-        # rename otherwise inconsistentdims and coords
+        # rename otherwise inconsistent dims and coords
         if "rt,response_extra_dim_0" in idata["prior_predictive"].dims:
             setattr(
                 idata,

From 95266d3a055b1a7cead0a9f0321051366ff772cc Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 13:55:05 -0500
Subject: [PATCH 016/104] refactor: remove unused variable assignments in
 test_sample_prior_predictive

---
 tests/test_hssm.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/test_hssm.py b/tests/test_hssm.py
index f6429d323..41d67e218 100644
--- a/tests/test_hssm.py
+++ b/tests/test_hssm.py
@@ -169,12 +169,12 @@ def test_sample_prior_predictive(data_ddm_reg):
     model_regression = HSSM(
         data=data_ddm_reg, include=[dict(name="v", formula="v ~ 1 + x")]
     )
-    prior_predictive_3 = model_regression.sample_prior_predictive(draws=10)
+    model_regression.sample_prior_predictive(draws=10)
 
     model_regression_a = HSSM(
         data=data_ddm_reg, include=[dict(name="a", formula="a ~ 1 + x")]
     )
-    prior_predictive_4 = model_regression_a.sample_prior_predictive(draws=10)
+    model_regression_a.sample_prior_predictive(draws=10)
 
     model_regression_multi = HSSM(
         data=data_ddm_reg,

From b61349760908950f057160ad5ff596992534e521 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 13:56:25 -0500
Subject: [PATCH 017/104] refactor: remove unused variable assignment in
 test_sample_prior_predictive

---
 tests/test_hssm.py     | 2 +-
 tests/test_hssmbase.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/test_hssm.py b/tests/test_hssm.py
index 41d67e218..190d32772 100644
--- a/tests/test_hssm.py
+++ b/tests/test_hssm.py
@@ -183,7 +183,7 @@ def test_sample_prior_predictive(data_ddm_reg):
             dict(name="a", formula="a ~ 1 + y"),
         ],
     )
-    prior_predictive_5 = model_regression_multi.sample_prior_predictive(draws=10)
+    model_regression_multi.sample_prior_predictive(draws=10)
 
     data_ddm_reg.loc[:, "subject_id"] = np.arange(10)
 
diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index 49713d283..37e54c23f 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -176,7 +176,7 @@ def test_sample_prior_predictive(data_ddm_reg):
             dict(name="a", formula="a ~ 1 + y"),
         ],
     )
-    prior_predictive_5 = model_regression_multi.sample_prior_predictive(draws=10)
+    model_regression_multi.sample_prior_predictive(draws=10)
 
     data_ddm_reg.loc[:, "subject_id"] = np.arange(10)
 

From a9d54bbbe598bc11969ad9deac69bf288e99390d Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 13:57:10 -0500
Subject: [PATCH 018/104] refactor: remove redundant assignment in
 sample_prior_predictive test

---
 tests/test_hssm.py     | 2 +-
 tests/test_hssmbase.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/test_hssm.py b/tests/test_hssm.py
index 190d32772..bcc531528 100644
--- a/tests/test_hssm.py
+++ b/tests/test_hssm.py
@@ -194,7 +194,7 @@ def test_sample_prior_predictive(data_ddm_reg):
             dict(name="a", formula="a ~ (1|subject_id) + y"),
         ],
     )
-    prior_predictive_6 = model_regression_random_effect.sample_prior_predictive(
+    model_regression_random_effect.sample_prior_predictive(
         draws=10
     )
 
diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index 37e54c23f..c04fc49e6 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -187,7 +187,7 @@ def test_sample_prior_predictive(data_ddm_reg):
             dict(name="a", formula="a ~ (1|subject_id) + y"),
         ],
     )
-    prior_predictive_6 = model_regression_random_effect.sample_prior_predictive(
+    model_regression_random_effect.sample_prior_predictive(
         draws=10
     )
 

From 395478fb8435d11f03f972a2fbd1c93611b4da63 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 13:59:46 -0500
Subject: [PATCH 019/104] refactor: simplify HSSM instantiation in custom model
 tests

---
 tests/test_hssm.py     | 16 ++++++----------
 tests/test_hssmbase.py | 16 ++++++----------
 2 files changed, 12 insertions(+), 20 deletions(-)

diff --git a/tests/test_hssm.py b/tests/test_hssm.py
index bcc531528..dbb3d30e3 100644
--- a/tests/test_hssm.py
+++ b/tests/test_hssm.py
@@ -86,25 +86,23 @@ def test_custom_model(data_ddm):
     with pytest.raises(
         ValueError, match="When using a custom model, please provide a `loglik_kind.`"
     ):
-        model = HSSM(data=data_ddm, model="custom")
+        HSSM(data=data_ddm, model="custom")
 
     with pytest.raises(
         ValueError, match="Please provide `list_params` via `model_config`."
     ):
-        model = HSSM(data=data_ddm, model="custom", loglik_kind="analytical")
+        HSSM(data=data_ddm, model="custom", loglik_kind="analytical")
 
     with pytest.raises(
         ValueError, match="Please provide `list_params` via `model_config`."
     ):
-        model = HSSM(
-            data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical"
-        )
+        HSSM(data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical")
 
     with pytest.raises(
         ValueError,
         match="Please provide `list_params` via `model_config`.",
     ):
-        model = HSSM(
+        HSSM(
             data=data_ddm,
             model="custom",
             loglik=DDM,
@@ -112,7 +110,7 @@ def test_custom_model(data_ddm):
             model_config={},
         )
 
-    model = HSSM(
+    HSSM(
         data=data_ddm,
         model="custom",
         model_config={
@@ -194,9 +192,7 @@ def test_sample_prior_predictive(data_ddm_reg):
             dict(name="a", formula="a ~ (1|subject_id) + y"),
         ],
     )
-    model_regression_random_effect.sample_prior_predictive(
-        draws=10
-    )
+    model_regression_random_effect.sample_prior_predictive(draws=10)
 
 
 @pytest.mark.slow
diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index c04fc49e6..174afeb9b 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -83,25 +83,23 @@ def test_custom_model(data_ddm):
     with pytest.raises(
         ValueError, match="When using a custom model, please provide a `loglik_kind.`"
     ):
-        model = HSSM(data=data_ddm, model="custom")
+        HSSM(data=data_ddm, model="custom")
 
     with pytest.raises(
         ValueError, match="Please provide `list_params` via `model_config`."
     ):
-        model = HSSM(data=data_ddm, model="custom", loglik_kind="analytical")
+        HSSM(data=data_ddm, model="custom", loglik_kind="analytical")
 
     with pytest.raises(
         ValueError, match="Please provide `list_params` via `model_config`."
     ):
-        model = HSSM(
-            data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical"
-        )
+        HSSM(data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical")
 
     with pytest.raises(
         ValueError,
         match="Please provide `list_params` via `model_config`.",
     ):
-        model = HSSM(
+        HSSM(
             data=data_ddm,
             model="custom",
             loglik=DDM,
@@ -109,7 +107,7 @@ def test_custom_model(data_ddm):
             model_config={},
         )
 
-    model = HSSM(
+    HSSM(
         data=data_ddm,
         model="custom",
         model_config={
@@ -187,9 +185,7 @@ def test_sample_prior_predictive(data_ddm_reg):
             dict(name="a", formula="a ~ (1|subject_id) + y"),
         ],
     )
-    model_regression_random_effect.sample_prior_predictive(
-        draws=10
-    )
+    model_regression_random_effect.sample_prior_predictive(draws=10)
 
 
 def test_override_default_link(caplog, data_ddm_reg):

From a7daf8145e7edab0c8e5008359a8eca9bd36c374 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 14:06:24 -0500
Subject: [PATCH 020/104] refactor: implement parameter initialization in
 DataValidatorMixin

---
 src/hssm/data_validator.py | 26 ++++++++++++++++++++++++++
 1 file changed, 26 insertions(+)

diff --git a/src/hssm/data_validator.py b/src/hssm/data_validator.py
index fe1e9f750..dd205527e 100644
--- a/src/hssm/data_validator.py
+++ b/src/hssm/data_validator.py
@@ -26,6 +26,32 @@ class DataValidatorMixin:
     - missing_data_value: float
     """
 
+    def __init__(
+        self,
+        data,
+        response=["rt", "response"],
+        choices=[0, 1],
+        n_choices=2,
+        extra_fields=None,
+        deadline=False,
+        deadline_name="deadline",
+        missing_data=False,
+        missing_data_value=-999.0,
+    ):
+        """Initialize the DataValidatorMixin.
+
+        Init method kept for testing purposes.
+        """
+        self.data = data
+        self.response = response
+        self.choices = choices
+        self.n_choices = n_choices
+        self.extra_fields = extra_fields
+        self.deadline = deadline
+        self.deadline_name = deadline_name
+        self.missing_data = missing_data
+        self.missing_data_value = missing_data_value
+
     @staticmethod
     def check_fields(a, b):
         """Check if all fields in a are in b."""

From b706e71229f2bf0a6b3ada391eb25b1afa0ba99f Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 14:14:16 -0500
Subject: [PATCH 021/104] refactor: assign HSSM instance to variable in
 test_custom_model

---
 tests/test_hssmbase.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index 174afeb9b..75ece87fb 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -107,7 +107,7 @@ def test_custom_model(data_ddm):
             model_config={},
         )
 
-    HSSM(
+    model = HSSM(
         data=data_ddm,
         model="custom",
         model_config={

From 88efb418212ca99201c3ef8e1764978e7f939386 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 14:25:55 -0500
Subject: [PATCH 022/104] refactor: enhance parameter initialization in
 DataValidatorMixin and add response handling in HSSM

---
 src/hssm/data_validator.py | 25 +++++++++++++------------
 src/hssm/hssmbase.py       |  4 ++++
 2 files changed, 17 insertions(+), 12 deletions(-)

diff --git a/src/hssm/data_validator.py b/src/hssm/data_validator.py
index dd205527e..4d79830fc 100644
--- a/src/hssm/data_validator.py
+++ b/src/hssm/data_validator.py
@@ -28,15 +28,15 @@ class DataValidatorMixin:
 
     def __init__(
         self,
-        data,
-        response=["rt", "response"],
-        choices=[0, 1],
-        n_choices=2,
-        extra_fields=None,
-        deadline=False,
-        deadline_name="deadline",
-        missing_data=False,
-        missing_data_value=-999.0,
+        data: pd.DataFrame,
+        response: list[str] = ["rt", "response"],
+        choices: list[int] = [0, 1],
+        n_choices: int = 2,
+        extra_fields: list[str] | None = None,
+        deadline: bool = False,
+        deadline_name: str = "deadline",
+        missing_data: bool = False,
+        missing_data_value: float = -999.0,
     ):
         """Initialize the DataValidatorMixin.
 
@@ -190,9 +190,10 @@ def _update_extra_fields(self, new_data: pd.DataFrame | None = None):
         # (e.g., HSSM).
         # The 'type: ignore[attr-defined]' comment tells mypy to ignore the missing
         # attribute error here and avoid moving this method to the HSSM class.
-        self.model_distribution.extra_fields = [  # type: ignore[attr-defined]
-            new_data[field].values for field in self.extra_fields
-        ]
+        if self.extra_fields is not None:
+            self.model_distribution.extra_fields = [  # type: ignore[attr-defined]
+                new_data[field].values for field in self.extra_fields
+            ]
 
     @staticmethod
     def _set_missing_data_and_deadline(
diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index 53b0debee..a93fe33f9 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -1375,11 +1375,15 @@ def set_alias(self, aliases: dict[str, str | dict]):
     @property
     def response_c(self) -> str:
         """Return the response variable names in c() format."""
+        if self.response is None:
+            return "c()"
         return f"c({', '.join(self.response)})"
 
     @property
     def response_str(self) -> str:
         """Return the response variable names in string format."""
+        if self.response is None:
+            return ""
         return ",".join(self.response)
 
     # NOTE: can't annotate return type because the graphviz dependency is optional

From 5f06db02a5aa244614bf8f005038c338a1f9d946 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 14:43:27 -0500
Subject: [PATCH 023/104] refactor: update parameter types in
 DataValidatorMixin constructor

---
 src/hssm/data_validator.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/hssm/data_validator.py b/src/hssm/data_validator.py
index 4d79830fc..416103052 100644
--- a/src/hssm/data_validator.py
+++ b/src/hssm/data_validator.py
@@ -29,8 +29,8 @@ class DataValidatorMixin:
     def __init__(
         self,
         data: pd.DataFrame,
-        response: list[str] = ["rt", "response"],
-        choices: list[int] = [0, 1],
+        response: list[str] | None = ["rt", "response"],
+        choices: list[int] | None = [0, 1],
         n_choices: int = 2,
         extra_fields: list[str] | None = None,
         deadline: bool = False,

From 3491c9e5a7e8a922c9e08a4aa613995860404a61 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 14:52:20 -0500
Subject: [PATCH 024/104] refactor: assign HSSM instance to variable in
 test_custom_model

---
 tests/test_hssm.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_hssm.py b/tests/test_hssm.py
index dbb3d30e3..92804066e 100644
--- a/tests/test_hssm.py
+++ b/tests/test_hssm.py
@@ -110,7 +110,7 @@ def test_custom_model(data_ddm):
             model_config={},
         )
 
-    HSSM(
+    model = HSSM(
         data=data_ddm,
         model="custom",
         model_config={

From d86a94bf4bd9689d7a9a2d1905a5c0f90070a9a8 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 14:52:30 -0500
Subject: [PATCH 025/104] refactor: handle None response in response_c and
 response_str properties

---
 src/hssm/hssm.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 704319fe3..6a57cf4b7 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -1309,11 +1309,15 @@ def set_alias(self, aliases: dict[str, str | dict]):
     @property
     def response_c(self) -> str:
         """Return the response variable names in c() format."""
+        if self.response is None:
+            return "c()"
         return f"c({', '.join(self.response)})"
 
     @property
     def response_str(self) -> str:
         """Return the response variable names in string format."""
+        if self.response is None:
+            return ""
         return ",".join(self.response)
 
     # NOTE: can't annotate return type because the graphviz dependency is optional

From deafa6ec4de5c3121332b23dbe03038ef776bdfe Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 15:00:05 -0500
Subject: [PATCH 026/104] refactor: simplify docstring in DataValidatorMixin
 class

---
 src/hssm/data_validator.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/data_validator.py b/src/hssm/data_validator.py
index 416103052..96bb1eb5f 100644
--- a/src/hssm/data_validator.py
+++ b/src/hssm/data_validator.py
@@ -12,7 +12,7 @@
 
 
 class DataValidatorMixin:
-    """Mixin class providing validation and preprocessing methods for HSSM behavioral models.
+    """Mixin providing validation and preprocessing methods for HSSM behavioral models.
 
     This class expects subclasses to define the following attributes:
     - data: pd.DataFrame

From a17c406523b44d6bc87b8c2704c42ef70213cbda Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 15:17:16 -0500
Subject: [PATCH 027/104] refactor: remove unused variables in
 test_sample_prior_predictive

---
 tests/test_hssmbase.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index 75ece87fb..5e911a6db 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -160,12 +160,12 @@ def test_sample_prior_predictive(data_ddm_reg):
     model_regression = HSSM(
         data=data_ddm_reg, include=[dict(name="v", formula="v ~ 1 + x")]
     )
-    prior_predictive_3 = model_regression.sample_prior_predictive(draws=10)
+    model_regression.sample_prior_predictive(draws=10)
 
     model_regression_a = HSSM(
         data=data_ddm_reg, include=[dict(name="a", formula="a ~ 1 + x")]
     )
-    prior_predictive_4 = model_regression_a.sample_prior_predictive(draws=10)
+    model_regression_a.sample_prior_predictive(draws=10)
 
     model_regression_multi = HSSM(
         data=data_ddm_reg,

From 7ab1ea0c5c2578057e350fc2297f99689280371f Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 15:17:23 -0500
Subject: [PATCH 028/104] fix: correct typo in classproperty docstring

---
 src/hssm/hssmbase.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index a93fe33f9..6b8287958 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -76,7 +76,7 @@ class classproperty:
     properties that need to perform some computation or access class-level data.
 
     This implementation is provided for compatibility with Python versions 3.10 through
-    3.12, as one cannot combine the @property and @classmethod decorators is across all
+    3.12, as one cannot combine the @property and @classmethod decorators across all
     these versions.
 
     Example

From 5d2c2235643305bd12da48f55b54c97770e25cd5 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 15:17:32 -0500
Subject: [PATCH 029/104] refactor: update condition to check for None in
 _update_extra_fields method

---
 src/hssm/data_validator.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/data_validator.py b/src/hssm/data_validator.py
index 96bb1eb5f..d611fc939 100644
--- a/src/hssm/data_validator.py
+++ b/src/hssm/data_validator.py
@@ -182,7 +182,7 @@ def _update_extra_fields(self, new_data: pd.DataFrame | None = None):
         new_data
             A DataFrame containing new data for update.
         """
-        if not new_data:
+        if new_data is None:
             new_data = self.data
 
         # The attribute 'model_distribution' is not defined in

From 23606bd5cdaf483732cd1705466b660e456956c5 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 16:48:30 -0500
Subject: [PATCH 030/104] refactor: remove unused initialization arguments and
 related method from HSSM class

---
 src/hssm/hssmbase.py | 33 ---------------------------------
 1 file changed, 33 deletions(-)

diff --git a/src/hssm/hssmbase.py b/src/hssm/hssmbase.py
index 6b8287958..b86fd76b0 100644
--- a/src/hssm/hssmbase.py
+++ b/src/hssm/hssmbase.py
@@ -295,14 +295,6 @@ def __init__(
         initval_jitter: float = INITVAL_JITTER_SETTINGS["jitter_epsilon"],
         **kwargs,
     ):
-        # Attach arguments to the instance
-        # so that we can easily define some
-        # methods that need to access these
-        # arguments (context: pickling / save - load).
-        # assert False, "Temporary prevent instantiation of HSSM class."
-        # Define a dict with all call arguments:
-        self._init_args = self._get_init_args(locals(), kwargs)
-
         # ===== Input Data & Configuration =====
         self.data = data.copy()
         self.global_formula = global_formula
@@ -490,31 +482,6 @@ def __init__(
         )
         _logger.info("Model initialized successfully.")
 
-    @staticmethod
-    def _get_init_args(
-        locals_dict: dict[str, Any], kwargs: dict[str, Any]
-    ) -> dict[str, Any]:
-        """Extract initialization arguments from locals and kwargs.
-
-        Parameters
-        ----------
-        locals_dict : dict[str, Any]
-            The locals() dictionary from __init__.
-        kwargs : dict[str, Any]
-            Additional keyword arguments passed to __init__.
-
-        Returns
-        -------
-        dict[str, Any]
-            A dictionary containing all initialization arguments, excluding 'self'.
-        """
-        init_args = {
-            k: v for k, v in locals_dict.items() if k not in ["self", "kwargs"]
-        }
-        if kwargs:
-            init_args.update(kwargs)
-        return init_args
-
     @staticmethod
     def _build_model_config(
         model: SupportedModels | str,

From 167f480f0d3499daff43e25bf4dfb0ded52df3f2 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 16:57:34 -0500
Subject: [PATCH 031/104] rename hssmbase.py to base.py

---
 src/hssm/{hssmbase.py => base.py} | 0
 tests/test_hssmbase.py            | 2 +-
 2 files changed, 1 insertion(+), 1 deletion(-)
 rename src/hssm/{hssmbase.py => base.py} (100%)

diff --git a/src/hssm/hssmbase.py b/src/hssm/base.py
similarity index 100%
rename from src/hssm/hssmbase.py
rename to src/hssm/base.py
diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index 5e911a6db..48a1a5ea1 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -2,7 +2,7 @@
 import pytest
 
 import hssm
-from hssm.hssmbase import HSSM
+from hssm.base import HSSM
 from hssm.likelihoods import DDM, logp_ddm
 from copy import deepcopy
 

From 65079ce37ab63499ddb75be0785410a3d90a1506 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 16:58:52 -0500
Subject: [PATCH 032/104] refactor: rename HSSM class to HSSMBase for clarity
 and consistency

---
 src/hssm/base.py       | 2 +-
 tests/test_hssmbase.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index b86fd76b0..dbc9979f0 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -96,7 +96,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSM(DataValidatorMixin):
+class HSSMBase(DataValidatorMixin):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters
diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index 48a1a5ea1..cece89d6c 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -2,7 +2,7 @@
 import pytest
 
 import hssm
-from hssm.base import HSSM
+from hssm.base import HSSMBase
 from hssm.likelihoods import DDM, logp_ddm
 from copy import deepcopy
 

From 8eb12d609aab33f7c105e5e46afd5857303cb8a8 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 17:02:35 -0500
Subject: [PATCH 033/104] refactor: replace HSSM with HSSMBase in test cases
 for consistency

---
 tests/test_hssmbase.py | 50 +++++++++++++++++++++---------------------
 1 file changed, 25 insertions(+), 25 deletions(-)

diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index cece89d6c..02df1ff38 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -69,9 +69,9 @@
 def test_transform_params_general(data_ddm_reg, include, should_raise_exception):
     if should_raise_exception:
         with pytest.raises(Exception):
-            HSSM(data=data_ddm_reg, include=include)
+            HSSMBase(data=data_ddm_reg, include=include)
     else:
-        model = HSSM(data=data_ddm_reg, include=include)
+        model = HSSMBase(data=data_ddm_reg, include=include)
         # Check model properties using a loop
         param_names = ["v", "a", "z", "t", "p_outlier"]
         model_param_names = list(model.params.keys())
@@ -83,23 +83,23 @@ def test_custom_model(data_ddm):
     with pytest.raises(
         ValueError, match="When using a custom model, please provide a `loglik_kind.`"
     ):
-        HSSM(data=data_ddm, model="custom")
+        HSSMBase(data=data_ddm, model="custom")
 
     with pytest.raises(
         ValueError, match="Please provide `list_params` via `model_config`."
     ):
-        HSSM(data=data_ddm, model="custom", loglik_kind="analytical")
+        HSSMBase(data=data_ddm, model="custom", loglik_kind="analytical")
 
     with pytest.raises(
         ValueError, match="Please provide `list_params` via `model_config`."
     ):
-        HSSM(data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical")
+        HSSMBase(data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical")
 
     with pytest.raises(
         ValueError,
         match="Please provide `list_params` via `model_config`.",
     ):
-        HSSM(
+        HSSMBase(
             data=data_ddm,
             model="custom",
             loglik=DDM,
@@ -107,7 +107,7 @@ def test_custom_model(data_ddm):
             model_config={},
         )
 
-    model = HSSM(
+    model = HSSMBase(
         data=data_ddm,
         model="custom",
         model_config={
@@ -130,12 +130,12 @@ def test_custom_model(data_ddm):
 
 
 def test_model_definition_outside_include(data_ddm):
-    model_with_one_param_fixed = HSSM(data_ddm, a=0.5)
+    model_with_one_param_fixed = HSSMBase(data_ddm, a=0.5)
 
     assert "a" in model_with_one_param_fixed.params
     assert model_with_one_param_fixed.params["a"].prior == 0.5
 
-    model_with_one_param = HSSM(
+    model_with_one_param = HSSMBase(
         data_ddm, a={"prior": {"name": "Normal", "mu": 0.5, "sigma": 0.1}}
     )
 
@@ -145,29 +145,29 @@ def test_model_definition_outside_include(data_ddm):
     with pytest.raises(
         ValueError, match="Parameter `a` specified in both `include` and `kwargs`."
     ):
-        HSSM(data_ddm, include=[{"name": "a", "prior": 0.5}], a=0.5)
+        HSSMBase(data_ddm, include=[{"name": "a", "prior": 0.5}], a=0.5)
 
 
 def test_sample_prior_predictive(data_ddm_reg):
     data_ddm_reg = data_ddm_reg.iloc[:10, :]
 
-    model_no_regression = HSSM(data=data_ddm_reg)
+    model_no_regression = HSSMBase(data=data_ddm_reg)
     rng = np.random.default_rng()
 
     model_no_regression.sample_prior_predictive(draws=10)
     model_no_regression.sample_prior_predictive(draws=10, random_seed=rng)
 
-    model_regression = HSSM(
+    model_regression = HSSMBase(
         data=data_ddm_reg, include=[dict(name="v", formula="v ~ 1 + x")]
     )
     model_regression.sample_prior_predictive(draws=10)
 
-    model_regression_a = HSSM(
+    model_regression_a = HSSMBase(
         data=data_ddm_reg, include=[dict(name="a", formula="a ~ 1 + x")]
     )
     model_regression_a.sample_prior_predictive(draws=10)
 
-    model_regression_multi = HSSM(
+    model_regression_multi = HSSMBase(
         data=data_ddm_reg,
         include=[
             dict(name="v", formula="v ~ 1 + x"),
@@ -178,7 +178,7 @@ def test_sample_prior_predictive(data_ddm_reg):
 
     data_ddm_reg.loc[:, "subject_id"] = np.arange(10)
 
-    model_regression_random_effect = HSSM(
+    model_regression_random_effect = HSSMBase(
         data=data_ddm_reg,
         include=[
             dict(name="v", formula="v ~ (1|subject_id) + x"),
@@ -203,7 +203,7 @@ def test_override_default_link(caplog, data_ddm_reg):
     param_z = param_v | dict(name="z", formula="z ~ 1 + x + y", bounds=(0, 1))
     param_t = param_v | dict(name="t", formula="t ~ 1 + x + y", bounds=(0.1, np.inf))
 
-    model = HSSM(
+    model = HSSMBase(
         data=data_ddm_reg,
         include=[param_v, param_a, param_z, param_t],
         link_settings="log_logit",
@@ -219,7 +219,7 @@ def test_override_default_link(caplog, data_ddm_reg):
 
 
 def test_resampling(data_ddm):
-    model = HSSM(data=data_ddm)
+    model = HSSMBase(data=data_ddm)
     sample_1 = model.sample(draws=10, chains=1, tune=0)
     assert sample_1 is model.traces
 
@@ -231,7 +231,7 @@ def test_resampling(data_ddm):
 
 def test_add_likelihood_parameters_to_data(data_ddm):
     """Test if the likelihood parameters are added to the InferenceData object."""
-    model = HSSM(data=data_ddm)
+    model = HSSMBase(data=data_ddm)
     sample_1 = model.sample(draws=10, chains=1, tune=10)
     sample_1_copy = deepcopy(sample_1)
     model.add_likelihood_parameters_to_idata(inplace=True)
@@ -266,7 +266,7 @@ def test_add_likelihood_parameters_to_data(data_ddm):
 # Setting any parameter to a fixed value should work:
 def test_model_creation_constant_parameter(data_ddm):
     for param_name in ["v", "a", "z", "t"]:
-        model = HSSM(data=data_ddm, **{param_name: 1.0})
+        model = HSSMBase(data=data_ddm, **{param_name: 1.0})
         assert model._parent != param_name
         assert model.params[param_name].prior == 1.0
 
@@ -277,7 +277,7 @@ def test_model_creation_constant_parameter(data_ddm):
     [("v", "Normal"), ("a", "Gamma"), ("z", "Beta"), ("t", "Gamma")],
 )
 def test_model_creation_single_regression(data_ddm_reg, param_name, dist_name):
-    model = HSSM(
+    model = HSSMBase(
         data=data_ddm_reg,
         include=[{"name": param_name, "formula": f"{param_name} ~ 1 + x"}],
     )
@@ -288,12 +288,12 @@ def test_model_creation_single_regression(data_ddm_reg, param_name, dist_name):
 # Setting all parameters to fixed values should throw an error:
 def test_model_creation_all_parameters_constant(data_ddm):
     with pytest.raises(ValueError):
-        HSSM(data=data_ddm, v=1.0, a=1.0, z=1.0, t=1.0)
+        HSSMBase(data=data_ddm, v=1.0, a=1.0, z=1.0, t=1.0)
 
 
 # Prior settings
 def test_prior_settings_basic(cavanagh_test):
-    model_1 = HSSM(
+    model_1 = HSSMBase(
         data=cavanagh_test,
         global_formula="y ~ 1 + (1|participant_id)",
         prior_settings=None,
@@ -303,7 +303,7 @@ def test_prior_settings_basic(cavanagh_test):
         "Default prior doesn't yield Nonetype for 'v'!"
     )
 
-    model_2 = HSSM(
+    model_2 = HSSMBase(
         data=cavanagh_test,
         global_formula="y ~ 1 + (1|participant_id)",
         prior_settings="safe",
@@ -315,7 +315,7 @@ def test_prior_settings_basic(cavanagh_test):
 
 
 def test_compile_logp(cavanagh_test):
-    model_1 = HSSM(
+    model_1 = HSSMBase(
         data=cavanagh_test,
         global_formula="y ~ 1 + (1|participant_id)",
         prior_settings=None,
@@ -326,7 +326,7 @@ def test_compile_logp(cavanagh_test):
 
 
 def test_sample_do(data_ddm):
-    model = HSSM(data=data_ddm)
+    model = HSSMBase(data=data_ddm)
     sample_do = model.sample_do(params={"v": 1.0}, draws=10)
     assert sample_do is not None
     assert "v_mean" in sample_do.prior.data_vars

From 48abc5bf7ff15ae08a37ca10fd7715c6885a6ed7 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 17:04:44 -0500
Subject: [PATCH 034/104] fix: update load_model and state restoration methods
 to reference HSSMBase instead of HSSM

---
 src/hssm/base.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index dbc9979f0..fc074c12c 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -1670,7 +1670,7 @@ def save_model(
     @classmethod
     def load_model(
         cls, path: Union[str, Path]
-    ) -> Union["HSSM", dict[str, Optional[az.InferenceData]]]:
+    ) -> Union["HSSMBase", dict[str, Optional[az.InferenceData]]]:
         """Load a HSSM model instance and its inference results from disk.
 
         Parameters
@@ -1681,7 +1681,7 @@ def load_model(
 
         Returns
         -------
-        HSSM
+        HSSMBase
             The loaded HSSM model instance with inference results attached if available.
         """
         # Convert path to Path object
@@ -1798,7 +1798,7 @@ def __setstate__(self, state):
             A dictionary containing the constructor arguments under the key
             'constructor_args'.
         """
-        new_instance = HSSM(**state["constructor_args"])
+        new_instance = HSSMBase(**state["constructor_args"])
         self.__dict__ = new_instance.__dict__
 
     def __repr__(self) -> str:

From 470fd80300588df30d0c0626f8d87cc99ff78741 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 14 Jan 2026 17:28:29 -0500
Subject: [PATCH 035/104] Make config a class variable

---
 src/hssm/base.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index fc074c12c..ac8608d6a 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -269,6 +269,8 @@ class HSSMBase(DataValidatorMixin):
         The jitter value for the initial values.
     """
 
+    config_class = Config
+
     def __init__(
         self,
         data: pd.DataFrame,
@@ -482,8 +484,9 @@ def __init__(
         )
         _logger.info("Model initialized successfully.")
 
-    @staticmethod
+    @classmethod
     def _build_model_config(
+        cls,
         model: SupportedModels | str,
         loglik_kind: LoglikKind | None,
         model_config: ModelConfig | dict | None,
@@ -508,7 +511,7 @@ def _build_model_config(
             A complete ModelConfig object with choices and other settings applied.
         """
         # Start with defaults
-        config = Config.from_defaults(model, loglik_kind)
+        config = cls.config_class.from_defaults(model, loglik_kind)
 
         # Handle user-provided model_config
         if model_config is not None:

From b3e1effc8e02b77a5860b4d6550115b95c3a6a9a Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Thu, 22 Jan 2026 16:04:18 -0500
Subject: [PATCH 036/104] refactor: migrate missing data tests from
 test_data_validator.py to test_missing_data_mixin.py

---
 tests/test_data_validator.py     | 23 -----------
 tests/test_missing_data_mixin.py | 67 ++++++++++++++++++++++++++++++++
 2 files changed, 67 insertions(+), 23 deletions(-)
 create mode 100644 tests/test_missing_data_mixin.py

diff --git a/tests/test_data_validator.py b/tests/test_data_validator.py
index 704885f22..66abc303f 100644
--- a/tests/test_data_validator.py
+++ b/tests/test_data_validator.py
@@ -130,29 +130,6 @@ def test_post_check_data_sanity_valid(base_data):
         dv_instance_no_missing._post_check_data_sanity()
 
 
-def test_handle_missing_data_and_deadline_deadline_column_missing(base_data):
-    # Should raise ValueError if deadline is True but deadline_name column is missing
-    data = base_data.drop(columns=["deadline"])
-    dv = DataValidatorMixin(
-        data=data,
-        deadline=True,
-    )
-    with pytest.raises(ValueError, match="`deadline` is not found in your dataset"):
-        dv._handle_missing_data_and_deadline()
-
-
-def test_handle_missing_data_and_deadline_deadline_applied(base_data):
-    # Should set rt to -999.0 where rt >= deadline
-    base_data.loc[0, "rt"] = 2.0  # Exceeds deadline
-    dv = DataValidatorMixin(
-        data=base_data,
-        deadline=True,
-    )
-    dv._handle_missing_data_and_deadline()
-    assert dv.data.loc[0, "rt"] == -999.0
-    assert all(dv.data.loc[1:, "rt"] < dv.data.loc[1:, "deadline"])
-
-
 def test_update_extra_fields(monkeypatch):
     # Create a DataValidatorMixin with extra_fields
     data = pd.DataFrame(
diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
new file mode 100644
index 000000000..c19a73494
--- /dev/null
+++ b/tests/test_missing_data_mixin.py
@@ -0,0 +1,67 @@
+"""
+Tests for MissingDataMixin
+-------------------------
+1. Old tests migrated from test_data_validator.py that belong to missing data/deadline logic.
+2. Additional tests for new features and edge cases in MissingDataMixin.
+"""
+
+import pytest
+import pandas as pd
+from hssm.missing_data_mixin import MissingDataMixin
+
+
+class DummyModel(MissingDataMixin):
+    """
+    Dummy model for testing MissingDataMixin.
+
+    This class provides stub implementations of methods that the mixin expects
+    to exist on the consuming class. These stubs allow us to verify, via mocks/spies,
+    that the mixin calls them as part of its logic. This is a common pattern for
+    testing mixins: the dummy class provides the required interface, and the test
+    checks the mixin's interaction with it.
+    """
+
+    def __init__(self, data):
+        self.data = data
+        self.response = ["response"]
+        self.missing_data_value = -999.0
+
+
+# --- Fixtures ---
+@pytest.fixture
+def basic_data():
+    return pd.DataFrame({"rt": [1.0, 2.0, -999.0], "response": [1, -1, 1]})
+
+
+# --- 1. Old tests migrated from test_data_validator.py ---
+class TestMissingDataMixinOld:
+    def test_handle_missing_data_and_deadline_deadline_column_missing(self, basic_data):
+        """
+        Should raise ValueError if deadline is True but deadline_name column is missing.
+        """
+        model = DummyModel(basic_data)
+        # Try to process with deadline=True, should error
+        with pytest.raises(ValueError, match="`deadline` is not found in your dataset"):
+            model._process_missing_data_and_deadline(
+                missing_data=False,
+                deadline=True,
+                loglik_missing_data=None,
+            )
+
+    def test_handle_missing_data_and_deadline_deadline_applied(self, basic_data):
+        """
+        Should set rt to -999.0 where rt >= deadline.
+        """
+        # Add a deadline column and set one rt above deadline
+        basic_data = basic_data.assign(deadline=[1.5, 2.0, 2.0])
+        basic_data.loc[0, "rt"] = 2.0  # Exceeds deadline
+        model = DummyModel(basic_data)
+        model._process_missing_data_and_deadline(
+            missing_data=False,
+            deadline=True,
+            loglik_missing_data=None,
+        )
+        assert model.data.loc[0, "rt"] == -999.0
+        # All other rts should be less than their deadline
+        assert all(model.data.loc[1:, "rt"] < model.data.loc[1:, "deadline"])
+

From 36b5846b25c848a3ad21dfd92ff34cc1f8bf1d9d Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Thu, 22 Jan 2026 16:13:51 -0500
Subject: [PATCH 037/104] test: add parameterized test for handling missing
 data as bool and float

---
 tests/test_missing_data_mixin.py | 32 ++++++++++++++++++++++++++++++++
 1 file changed, 32 insertions(+)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index c19a73494..d749af018 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -65,3 +65,35 @@ def test_handle_missing_data_and_deadline_deadline_applied(self, basic_data):
         # All other rts should be less than their deadline
         assert all(model.data.loc[1:, "rt"] < model.data.loc[1:, "deadline"])
 
+    @pytest.mark.parametrize(
+        "missing_data,expected_missing,expected_value",
+        [
+            (True, True, -999.0),
+            (-999.0, True, -999.0),
+        ],
+    )
+    def test_process_missing_data_handles_bool_and_float(
+        self, basic_data, missing_data, expected_missing, expected_value
+    ):
+        """
+        Test that _process_missing_data_and_deadline correctly interprets the
+        'missing_data' argument when given as a boolean or a float value.
+
+        Parameters:
+            missing_data: bool or float
+                If True, missing data handling is enabled with default value -999.0.
+                If a float (e.g., -999.0), that value is used for missing data.
+            expected_missing: bool
+                Expected value for model.missing_data after processing.
+            expected_value: float
+                Expected value for model.missing_data_value after processing.
+        """
+
+        model = DummyModel(basic_data)
+        model._process_missing_data_and_deadline(
+            missing_data=missing_data,
+            deadline=False,
+            loglik_missing_data=None,
+        )
+        assert model.missing_data == expected_missing
+        assert model.missing_data_value == expected_value

From b6cda9a54b421875b65b627fdcff1a5a1bc31ce6 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Thu, 22 Jan 2026 16:15:39 -0500
Subject: [PATCH 038/104] test: add warning handling for dropping rows when
 missing_data is False

---
 tests/test_missing_data_mixin.py | 16 ++++++++++++++++
 1 file changed, 16 insertions(+)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index d749af018..237f89a8a 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -97,3 +97,19 @@ def test_process_missing_data_handles_bool_and_float(
         )
         assert model.missing_data == expected_missing
         assert model.missing_data_value == expected_value
+
+    def test_missing_data_false_drops_rows_and_warns(self, basic_data):
+        import warnings
+
+        model = DummyModel(basic_data)
+        with warnings.catch_warnings(record=True) as w:
+            warnings.simplefilter("always")
+            model._process_missing_data_and_deadline(
+                missing_data=False,
+                deadline=False,
+                loglik_missing_data=None,
+            )
+            assert not (model.data.rt == -999.0).any()
+            assert model.missing_data is False
+            assert model.missing_data_value == -999.0
+            assert any("Dropping those rows" in str(warn.message) for warn in w)

From a8039917b1310a7dd920840ec2d3518b2bfaa9ea Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Thu, 22 Jan 2026 16:24:42 -0500
Subject: [PATCH 039/104] test: add error handling for invalid missing_data
 types in MissingDataMixin

---
 tests/test_missing_data_mixin.py | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index 237f89a8a..b7b25b4ee 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -113,3 +113,11 @@ def test_missing_data_false_drops_rows_and_warns(self, basic_data):
             assert model.missing_data is False
             assert model.missing_data_value == -999.0
             assert any("Dropping those rows" in str(warn.message) for warn in w)
+
+    @pytest.mark.parametrize("missing_data", [123.45, "badtype"])
+    def test_process_missing_data_errors(self, basic_data, missing_data):
+        model = DummyModel(basic_data)
+        with pytest.raises(ValueError):
+            model._process_missing_data_and_deadline(
+                missing_data=missing_data, deadline=False, loglik_missing_data=None
+            )

From 2cab7130b880bdf24379021a91039c89d234cbf9 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 23 Jan 2026 15:26:21 -0500
Subject: [PATCH 040/104] test: add tests for deadline handling in
 MissingDataMixin

---
 tests/test_missing_data_mixin.py | 45 ++++++++++++++++++++++++++++++++
 1 file changed, 45 insertions(+)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index b7b25b4ee..6f3e3a3b1 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -121,3 +121,48 @@ def test_process_missing_data_errors(self, basic_data, missing_data):
             model._process_missing_data_and_deadline(
                 missing_data=missing_data, deadline=False, loglik_missing_data=None
             )
+
+    def test_deadline_str_sets_name(self, basic_data):
+        # Add a deadline_col to the data
+        data = basic_data
+        data = data.assign(deadline_col=[2.0, 2.0, 2.0])
+        model = DummyModel(data)
+        model._process_missing_data_and_deadline(
+            missing_data=False,
+            deadline="deadline_col",
+            loglik_missing_data=None,
+        )
+        assert model.deadline is True
+        assert model.deadline_name == "deadline_col"
+        assert "deadline_col" in model.response
+
+    def test_deadline_bool_sets_name(self, basic_data):
+        # Add a deadline column to the data
+        data = basic_data
+        data = data.assign(deadline=[2.0, 2.0, 2.0])
+        model = DummyModel(data)
+        model._process_missing_data_and_deadline(
+            missing_data=False,
+            deadline=True,
+            loglik_missing_data=None,
+        )
+        assert model.deadline is True
+        assert model.deadline_name == "deadline"
+
+    @pytest.mark.parametrize(
+        "missing_data,deadline,loglik_missing_data",
+        [
+            (False, False, lambda x: x),
+        ],
+    )
+    def test_loglik_missing_data_error(
+        self, basic_data, missing_data, deadline, loglik_missing_data
+    ):
+        model = DummyModel(basic_data)
+        with pytest.raises(ValueError):
+            model._process_missing_data_and_deadline(
+                missing_data=missing_data,
+                deadline=deadline,
+                loglik_missing_data=loglik_missing_data,
+            )
+

From c4e3637acddeca99767cba34f141f7b5a624ce77 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 23 Jan 2026 15:42:04 -0500
Subject: [PATCH 041/104] test: add additional tests for custom missing data
 handling and deadline logic in MissingDataMixin

---
 tests/test_missing_data_mixin.py | 77 ++++++++++++++++++++++++++++++++
 1 file changed, 77 insertions(+)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index 6f3e3a3b1..917178402 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -166,3 +166,80 @@ def test_loglik_missing_data_error(
                 loglik_missing_data=loglik_missing_data,
             )
 
+
+# --- 2. Additional tests for new features and edge cases in MissingDataMixin ---
+class TestMissingDataMixinNew:
+    def test_missing_data_value_custom(self, basic_data):
+        model = DummyModel(basic_data)
+        custom_missing = -123.0
+        # Add a row with custom missing value
+        model.data.loc[len(model.data)] = [custom_missing, 1]
+        model._process_missing_data_and_deadline(
+            missing_data=custom_missing,
+            deadline=False,
+            loglik_missing_data=None,
+        )
+        assert model.missing_data is True
+        assert model.missing_data_value == custom_missing
+        # After processing, custom missing values are replaced with -999.0
+        assert (model.data.rt == -999.0).any()
+
+    def test_deadline_column_added_once(self, basic_data):
+        # Add a deadline_col to the data
+        data = basic_data
+        data = data.assign(deadline_col=[2.0, 2.0, 2.0])
+        model = DummyModel(data)
+        # Add deadline_col to response already
+        model.response.append("deadline_col")
+        model._process_missing_data_and_deadline(
+            missing_data=False,
+            deadline="deadline_col",
+            loglik_missing_data=None,
+        )
+        # Should not duplicate
+        assert model.response.count("deadline_col") == 1
+
+    def test_missing_data_and_deadline_together(self, basic_data):
+        # Add a deadline column to the data
+        data = basic_data
+        data = data.assign(deadline=[2.0, 2.0, 2.0])
+        model = DummyModel(data)
+        # Should set both flags
+        model._process_missing_data_and_deadline(
+            missing_data=True,
+            deadline=True,
+            loglik_missing_data=None,
+        )
+        assert model.missing_data is True
+        assert model.deadline is True
+        assert model.deadline_name == "deadline"
+
+    def test_handle_missing_data_and_deadline_called(self, basic_data, mocker):
+        """
+        Test that the mixin calls the _handle_missing_data_and_deadline method
+        on the model instance. This verifies the mixin pattern: the mixin expects
+        the consuming class to provide this method, and calls it as part of its logic.
+        """
+        model = DummyModel(basic_data)
+        spy = mocker.spy(model, "_handle_missing_data_and_deadline")
+        model._process_missing_data_and_deadline(
+            missing_data=True,
+            deadline=False,
+            loglik_missing_data=None,
+        )
+        assert spy.call_count == 1
+
+    def test_set_missing_data_and_deadline_called(self, basic_data, mocker):
+        """
+        Test that the mixin calls the _set_missing_data_and_deadline method
+        on the model instance. This verifies the mixin pattern: the mixin expects
+        the consuming class to provide this method, and calls it as part of its logic.
+        """
+        model = DummyModel(basic_data)
+        spy = mocker.spy(model, "_set_missing_data_and_deadline")
+        model._process_missing_data_and_deadline(
+            missing_data=True,
+            deadline=False,
+            loglik_missing_data=None,
+        )
+        assert spy.call_count == 1

From 1e1015db049b6011825c4690838fddaf33eb8a0d Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 23 Jan 2026 16:18:57 -0500
Subject: [PATCH 042/104] test: refactor tests in MissingDataMixin to use
 dummy_model fixture for consistency

---
 tests/test_missing_data_mixin.py | 73 +++++++++++++++++---------------
 1 file changed, 39 insertions(+), 34 deletions(-)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index 917178402..b7a0b290c 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -33,37 +33,48 @@ def basic_data():
     return pd.DataFrame({"rt": [1.0, 2.0, -999.0], "response": [1, -1, 1]})
 
 
+@pytest.fixture
+def dummy_model(basic_data):
+    return DummyModel(basic_data)
+
+
 # --- 1. Old tests migrated from test_data_validator.py ---
 class TestMissingDataMixinOld:
-    def test_handle_missing_data_and_deadline_deadline_column_missing(self, basic_data):
+    def test_handle_missing_data_and_deadline_deadline_column_missing(
+        self, dummy_model
+    ):
         """
         Should raise ValueError if deadline is True but deadline_name column is missing.
         """
         model = DummyModel(basic_data)
         # Try to process with deadline=True, should error
         with pytest.raises(ValueError, match="`deadline` is not found in your dataset"):
-            model._process_missing_data_and_deadline(
+            dummy_model._process_missing_data_and_deadline(
                 missing_data=False,
                 deadline=True,
                 loglik_missing_data=None,
             )
 
-    def test_handle_missing_data_and_deadline_deadline_applied(self, basic_data):
+    def test_handle_missing_data_and_deadline_deadline_applied(
+        self, basic_data, dummy_model
+    ):
         """
         Should set rt to -999.0 where rt >= deadline.
         """
         # Add a deadline column and set one rt above deadline
         basic_data = basic_data.assign(deadline=[1.5, 2.0, 2.0])
         basic_data.loc[0, "rt"] = 2.0  # Exceeds deadline
-        model = DummyModel(basic_data)
-        model._process_missing_data_and_deadline(
+        dummy_model.data = basic_data
+        dummy_model._process_missing_data_and_deadline(
             missing_data=False,
             deadline=True,
             loglik_missing_data=None,
         )
-        assert model.data.loc[0, "rt"] == -999.0
+        assert dummy_model.data.loc[0, "rt"] == -999.0
         # All other rts should be less than their deadline
-        assert all(model.data.loc[1:, "rt"] < model.data.loc[1:, "deadline"])
+        assert all(
+            dummy_model.data.loc[1:, "rt"] < dummy_model.data.loc[1:, "deadline"]
+        )
 
     @pytest.mark.parametrize(
         "missing_data,expected_missing,expected_value",
@@ -73,7 +84,7 @@ def test_handle_missing_data_and_deadline_deadline_applied(self, basic_data):
         ],
     )
     def test_process_missing_data_handles_bool_and_float(
-        self, basic_data, missing_data, expected_missing, expected_value
+        self, dummy_model, missing_data, expected_missing, expected_value
     ):
         """
         Test that _process_missing_data_and_deadline correctly interprets the
@@ -89,59 +100,53 @@ def test_process_missing_data_handles_bool_and_float(
                 Expected value for model.missing_data_value after processing.
         """
 
-        model = DummyModel(basic_data)
-        model._process_missing_data_and_deadline(
+        dummy_model._process_missing_data_and_deadline(
             missing_data=missing_data,
             deadline=False,
             loglik_missing_data=None,
         )
-        assert model.missing_data == expected_missing
-        assert model.missing_data_value == expected_value
+        assert dummy_model.missing_data == expected_missing
+        assert dummy_model.missing_data_value == expected_value
 
-    def test_missing_data_false_drops_rows_and_warns(self, basic_data):
+    def test_missing_data_false_drops_rows_and_warns(self, dummy_model):
         import warnings
 
-        model = DummyModel(basic_data)
         with warnings.catch_warnings(record=True) as w:
             warnings.simplefilter("always")
-            model._process_missing_data_and_deadline(
+            dummy_model._process_missing_data_and_deadline(
                 missing_data=False,
                 deadline=False,
                 loglik_missing_data=None,
             )
-            assert not (model.data.rt == -999.0).any()
-            assert model.missing_data is False
-            assert model.missing_data_value == -999.0
+            assert not (dummy_model.data.rt == -999.0).any()
+            assert dummy_model.missing_data is False
+            assert dummy_model.missing_data_value == -999.0
             assert any("Dropping those rows" in str(warn.message) for warn in w)
 
     @pytest.mark.parametrize("missing_data", [123.45, "badtype"])
-    def test_process_missing_data_errors(self, basic_data, missing_data):
-        model = DummyModel(basic_data)
+    def test_process_missing_data_errors(self, dummy_model, missing_data):
         with pytest.raises(ValueError):
-            model._process_missing_data_and_deadline(
+            dummy_model._process_missing_data_and_deadline(
                 missing_data=missing_data, deadline=False, loglik_missing_data=None
             )
 
-    def test_deadline_str_sets_name(self, basic_data):
+    def test_deadline_str_sets_name(self, dummy_model, basic_data):
         # Add a deadline_col to the data
-        data = basic_data
-        data = data.assign(deadline_col=[2.0, 2.0, 2.0])
-        model = DummyModel(data)
-        model._process_missing_data_and_deadline(
+        dummy_model.data = basic_data.assign(deadline_col=[2.0, 2.0, 2.0])
+        dummy_model._process_missing_data_and_deadline(
             missing_data=False,
             deadline="deadline_col",
             loglik_missing_data=None,
         )
-        assert model.deadline is True
-        assert model.deadline_name == "deadline_col"
-        assert "deadline_col" in model.response
+        assert dummy_model.deadline is True
+        assert dummy_model.deadline_name == "deadline_col"
+        assert "deadline_col" in dummy_model.response
 
-    def test_deadline_bool_sets_name(self, basic_data):
+    def test_deadline_bool_sets_name(self, dummy_model, basic_data):
         # Add a deadline column to the data
-        data = basic_data
-        data = data.assign(deadline=[2.0, 2.0, 2.0])
-        model = DummyModel(data)
-        model._process_missing_data_and_deadline(
+        data = basic_data.assign(deadline=[2.0, 2.0, 2.0])
+        dummy_model.data = data
+        dummy_model._process_missing_data_and_deadline(
             missing_data=False,
             deadline=True,
             loglik_missing_data=None,

From f039fbd9903abc1829ef354bd23a3e3f31d8cf00 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 27 Jan 2026 11:24:11 -0500
Subject: [PATCH 043/104] test: enhance DummyModel and fixtures for improved
 missing data and deadline handling

---
 tests/test_missing_data_mixin.py | 115 ++++++++++++++-----------------
 1 file changed, 51 insertions(+), 64 deletions(-)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index b7a0b290c..7ce540c63 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -25,6 +25,8 @@ def __init__(self, data):
         self.data = data
         self.response = ["response"]
         self.missing_data_value = -999.0
+        self.missing_data = False
+        self.deadline = False
 
 
 # --- Fixtures ---
@@ -38,6 +40,13 @@ def dummy_model(basic_data):
     return DummyModel(basic_data)
 
 
+# Fixture for DummyModel with a deadline column
+@pytest.fixture
+def dummy_model_with_deadline(basic_data):
+    data = basic_data.assign(deadline=[2.0, 2.0, 2.0])
+    return DummyModel(data)
+
+
 # --- 1. Old tests migrated from test_data_validator.py ---
 class TestMissingDataMixinOld:
     def test_handle_missing_data_and_deadline_deadline_column_missing(
@@ -46,7 +55,6 @@ def test_handle_missing_data_and_deadline_deadline_column_missing(
         """
         Should raise ValueError if deadline is True but deadline_name column is missing.
         """
-        model = DummyModel(basic_data)
         # Try to process with deadline=True, should error
         with pytest.raises(ValueError, match="`deadline` is not found in your dataset"):
             dummy_model._process_missing_data_and_deadline(
@@ -56,24 +64,23 @@ def test_handle_missing_data_and_deadline_deadline_column_missing(
             )
 
     def test_handle_missing_data_and_deadline_deadline_applied(
-        self, basic_data, dummy_model
+        self, dummy_model_with_deadline
     ):
         """
         Should set rt to -999.0 where rt >= deadline.
         """
-        # Add a deadline column and set one rt above deadline
-        basic_data = basic_data.assign(deadline=[1.5, 2.0, 2.0])
-        basic_data.loc[0, "rt"] = 2.0  # Exceeds deadline
-        dummy_model.data = basic_data
-        dummy_model._process_missing_data_and_deadline(
+        # Set one rt above deadline
+        dummy_model_with_deadline.data.loc[0, "rt"] = 2.0  # Exceeds deadline
+        dummy_model_with_deadline._process_missing_data_and_deadline(
             missing_data=False,
             deadline=True,
             loglik_missing_data=None,
         )
-        assert dummy_model.data.loc[0, "rt"] == -999.0
+        assert dummy_model_with_deadline.data.loc[0, "rt"] == -999.0
         # All other rts should be less than their deadline
         assert all(
-            dummy_model.data.loc[1:, "rt"] < dummy_model.data.loc[1:, "deadline"]
+            dummy_model_with_deadline.data.loc[1:, "rt"]
+            < dummy_model_with_deadline.data.loc[1:, "deadline"]
         )
 
     @pytest.mark.parametrize(
@@ -127,7 +134,9 @@ def test_missing_data_false_drops_rows_and_warns(self, dummy_model):
     def test_process_missing_data_errors(self, dummy_model, missing_data):
         with pytest.raises(ValueError):
             dummy_model._process_missing_data_and_deadline(
-                missing_data=missing_data, deadline=False, loglik_missing_data=None
+                missing_data=missing_data,
+                deadline=False,
+                loglik_missing_data=None,
             )
 
     def test_deadline_str_sets_name(self, dummy_model, basic_data):
@@ -142,17 +151,14 @@ def test_deadline_str_sets_name(self, dummy_model, basic_data):
         assert dummy_model.deadline_name == "deadline_col"
         assert "deadline_col" in dummy_model.response
 
-    def test_deadline_bool_sets_name(self, dummy_model, basic_data):
-        # Add a deadline column to the data
-        data = basic_data.assign(deadline=[2.0, 2.0, 2.0])
-        dummy_model.data = data
-        dummy_model._process_missing_data_and_deadline(
+    def test_deadline_bool_sets_name(self, dummy_model_with_deadline):
+        dummy_model_with_deadline._process_missing_data_and_deadline(
             missing_data=False,
             deadline=True,
             loglik_missing_data=None,
         )
-        assert model.deadline is True
-        assert model.deadline_name == "deadline"
+        assert dummy_model_with_deadline.deadline is True
+        assert dummy_model_with_deadline.deadline_name == "deadline"
 
     @pytest.mark.parametrize(
         "missing_data,deadline,loglik_missing_data",
@@ -161,11 +167,10 @@ def test_deadline_bool_sets_name(self, dummy_model, basic_data):
         ],
     )
     def test_loglik_missing_data_error(
-        self, basic_data, missing_data, deadline, loglik_missing_data
+        self, dummy_model, missing_data, deadline, loglik_missing_data
     ):
-        model = DummyModel(basic_data)
         with pytest.raises(ValueError):
-            model._process_missing_data_and_deadline(
+            dummy_model._process_missing_data_and_deadline(
                 missing_data=missing_data,
                 deadline=deadline,
                 loglik_missing_data=loglik_missing_data,
@@ -174,77 +179,59 @@ def test_loglik_missing_data_error(
 
 # --- 2. Additional tests for new features and edge cases in MissingDataMixin ---
 class TestMissingDataMixinNew:
-    def test_missing_data_value_custom(self, basic_data):
-        model = DummyModel(basic_data)
+    def test_missing_data_value_custom(self, dummy_model):
         custom_missing = -123.0
         # Add a row with custom missing value
-        model.data.loc[len(model.data)] = [custom_missing, 1]
-        model._process_missing_data_and_deadline(
+        dummy_model.data.loc[len(dummy_model.data)] = [custom_missing, 1]
+        dummy_model._process_missing_data_and_deadline(
             missing_data=custom_missing,
             deadline=False,
             loglik_missing_data=None,
         )
-        assert model.missing_data is True
-        assert model.missing_data_value == custom_missing
+        assert dummy_model.missing_data is True
+        assert dummy_model.missing_data_value == custom_missing
         # After processing, custom missing values are replaced with -999.0
-        assert (model.data.rt == -999.0).any()
+        assert (dummy_model.data.rt == -999.0).any()
 
-    def test_deadline_column_added_once(self, basic_data):
+    def test_deadline_column_added_once(self, dummy_model, basic_data):
         # Add a deadline_col to the data
-        data = basic_data
-        data = data.assign(deadline_col=[2.0, 2.0, 2.0])
-        model = DummyModel(data)
+        data = basic_data.assign(deadline_col=[2.0, 2.0, 2.0])
+        dummy_model.data = data
         # Add deadline_col to response already
-        model.response.append("deadline_col")
-        model._process_missing_data_and_deadline(
+        dummy_model.response.append("deadline_col")
+        dummy_model._process_missing_data_and_deadline(
             missing_data=False,
             deadline="deadline_col",
             loglik_missing_data=None,
         )
         # Should not duplicate
-        assert model.response.count("deadline_col") == 1
+        assert dummy_model.response.count("deadline_col") == 1
 
-    def test_missing_data_and_deadline_together(self, basic_data):
-        # Add a deadline column to the data
-        data = basic_data
-        data = data.assign(deadline=[2.0, 2.0, 2.0])
-        model = DummyModel(data)
+    def test_missing_data_and_deadline_together(self, dummy_model_with_deadline):
         # Should set both flags
-        model._process_missing_data_and_deadline(
+        dummy_model_with_deadline._process_missing_data_and_deadline(
             missing_data=True,
             deadline=True,
             loglik_missing_data=None,
         )
-        assert model.missing_data is True
-        assert model.deadline is True
-        assert model.deadline_name == "deadline"
+        assert dummy_model_with_deadline.missing_data is True
+        assert dummy_model_with_deadline.deadline is True
+        assert dummy_model_with_deadline.deadline_name == "deadline"
 
-    def test_handle_missing_data_and_deadline_called(self, basic_data, mocker):
+    def test_handle_missing_data_and_deadline_direct(self, dummy_model):
         """
-        Test that the mixin calls the _handle_missing_data_and_deadline method
-        on the model instance. This verifies the mixin pattern: the mixin expects
-        the consuming class to provide this method, and calls it as part of its logic.
+        Directly test the _handle_missing_data_and_deadline method for coverage.
         """
-        model = DummyModel(basic_data)
-        spy = mocker.spy(model, "_handle_missing_data_and_deadline")
-        model._process_missing_data_and_deadline(
-            missing_data=True,
-            deadline=False,
-            loglik_missing_data=None,
-        )
-        assert spy.call_count == 1
+        # Call with no arguments, as expected by the mixin stub
+        dummy_model._handle_missing_data_and_deadline()
 
-    def test_set_missing_data_and_deadline_called(self, basic_data, mocker):
+    def test_set_missing_data_and_deadline_direct(self, dummy_model):
         """
-        Test that the mixin calls the _set_missing_data_and_deadline method
-        on the model instance. This verifies the mixin pattern: the mixin expects
-        the consuming class to provide this method, and calls it as part of its logic.
+        Directly test the _set_missing_data_and_deadline method for coverage.
         """
-        model = DummyModel(basic_data)
-        spy = mocker.spy(model, "_set_missing_data_and_deadline")
-        model._process_missing_data_and_deadline(
+        # Call with only the required arguments (data is now internal)
+        dummy_model._set_missing_data_and_deadline(
             missing_data=True,
             deadline=False,
-            loglik_missing_data=None,
+            data=dummy_model.data,
         )
-        assert spy.call_count == 1

From afd84c61b113e24cad98a7d4a2dc5f25a2de19ad Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 27 Jan 2026 11:28:08 -0500
Subject: [PATCH 044/104] feat: integrate MissingDataMixin into HSSM class for
 enhanced data handling

---
 src/hssm/hssm.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 6a57cf4b7..07e5fc7d6 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -46,6 +46,7 @@
     make_likelihood_callable,
     make_missing_data_callable,
 )
+from hssm.missing_data_mixin import MissingDataMixin
 from hssm.utils import (
     _compute_log_likelihood,
     _get_alias_dict,
@@ -97,7 +98,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSM(DataValidatorMixin):
+class HSSM(DataValidatorMixin, MissingDataMixin):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters

From 5b88f0b5453b4d407722a8ad9800c0515f2654fb Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 27 Jan 2026 11:29:22 -0500
Subject: [PATCH 045/104] refactor: move _handle_missing_data_and_deadline
 method missing data mixin

---
 src/hssm/data_validator.py | 45 --------------------------------------
 1 file changed, 45 deletions(-)

diff --git a/src/hssm/data_validator.py b/src/hssm/data_validator.py
index d611fc939..f756a056f 100644
--- a/src/hssm/data_validator.py
+++ b/src/hssm/data_validator.py
@@ -128,51 +128,6 @@ def _post_check_data_sanity(self):
     # remaining check on missing data
     # which are coming AFTER the data validation
     # in the HSSM class, into this function?
-    def _handle_missing_data_and_deadline(self):
-        """Handle missing data and deadline."""
-        if not self.missing_data and not self.deadline:
-            # In the case where missing_data is set to False, we need to drop the
-            # cases where rt = na_value
-            if pd.isna(self.missing_data_value):
-                na_dropped = self.data.dropna(subset=["rt"])
-            else:
-                na_dropped = self.data.loc[
-                    self.data["rt"] != self.missing_data_value, :
-                ]
-
-            if len(na_dropped) != len(self.data):
-                warnings.warn(
-                    "`missing_data` is set to False, "
-                    + "but you have missing data in your dataset. "
-                    + "Missing data will be dropped.",
-                    stacklevel=2,
-                )
-            self.data = na_dropped
-
-        elif self.missing_data and not self.deadline:
-            # In the case where missing_data is set to True, we need to replace the
-            # missing data with a specified na_value
-
-            # Create a shallow copy to avoid modifying the original dataframe
-            if pd.isna(self.missing_data_value):
-                self.data["rt"] = self.data["rt"].fillna(-999.0)
-            else:
-                self.data["rt"] = self.data["rt"].replace(
-                    self.missing_data_value, -999.0
-                )
-
-        else:  # deadline = True
-            if self.deadline_name not in self.data.columns:
-                raise ValueError(
-                    "You have specified that your data has deadline, but "
-                    + f"`{self.deadline_name}` is not found in your dataset."
-                )
-            else:
-                self.data.loc[:, "rt"] = np.where(
-                    self.data["rt"] < self.data[self.deadline_name],
-                    self.data["rt"],
-                    -999.0,
-                )
 
     def _update_extra_fields(self, new_data: pd.DataFrame | None = None):
         """Update the extra fields data in self.model_distribution.

From 6edc678be5b72eddda8788284bf7714bd41ce85c Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 27 Jan 2026 16:25:00 -0500
Subject: [PATCH 046/104] feat: implement MissingDataMixin for comprehensive
 handling of missing data and deadlines

---
 src/hssm/missing_data_mixin.py | 210 +++++++++++++++++++++++++++++++++
 1 file changed, 210 insertions(+)
 create mode 100644 src/hssm/missing_data_mixin.py

diff --git a/src/hssm/missing_data_mixin.py b/src/hssm/missing_data_mixin.py
new file mode 100644
index 000000000..cc38a8da1
--- /dev/null
+++ b/src/hssm/missing_data_mixin.py
@@ -0,0 +1,210 @@
+"""Mixin module for handling missing data and deadline logic in HSSM models."""
+
+import warnings
+
+import numpy as np
+import pandas as pd
+
+from hssm.defaults import MissingDataNetwork  # noqa: F401
+
+
+class MissingDataMixin:
+    """Mixin for handling missing data and deadline logic in HSSM models.
+
+    Parameters
+    ----------
+    missing_data : optional
+        Specifies whether the model should handle missing data. Can be a `bool`
+        or a `float`. If `False`, and if the `rt` column contains -999.0, the
+        model will drop those rows and produce a warning. If `True`, the model
+        will treat -999.0 as missing data. If a `float` is provided, it will be
+        treated as the missing data value. Defaults to `False`.
+    deadline : optional
+        Specifies whether the model should handle deadline data. Can be a `bool`
+        or a `str`. If `False`, the model will not act even if a deadline column
+        is provided. If `True`, the model will treat the `deadline` column as
+        deadline data. If a `str` is provided, it is treated as the name of the
+        deadline column. Defaults to `False`.
+    loglik_missing_data : optional
+        A likelihood function for missing data. See the `loglik` parameter for
+        details. If not provided, a default likelihood is used. Required only if
+        either `missing_data` or `deadline` is not `False`.
+    """
+
+    def _handle_missing_data_and_deadline(self):
+        """Handle missing data and deadline.
+
+        Originally from DataValidatorMixin. Handles dropping, replacing, or masking
+        missing data and deadline values in self.data based on the current settings.
+        """
+        import warnings
+
+        if not self.missing_data and not self.deadline:
+            # In the case where missing_data is set to False, we need to drop the
+            # cases where rt = na_value
+            if pd.isna(self.missing_data_value):
+                na_dropped = self.data.dropna(subset=["rt"])
+            else:
+                na_dropped = self.data.loc[
+                    self.data["rt"] != self.missing_data_value, :
+                ]
+
+            if len(na_dropped) != len(self.data):
+                warnings.warn(
+                    "`missing_data` is set to False, "
+                    + "but you have missing data in your dataset. "
+                    + "Missing data will be dropped.",
+                    stacklevel=2,
+                )
+            self.data = na_dropped
+
+        elif self.missing_data and not self.deadline:
+            # In the case where missing_data is set to True, we need to replace the
+            # missing data with a specified na_value
+
+            # Create a shallow copy to avoid modifying the original dataframe
+            if pd.isna(self.missing_data_value):
+                self.data["rt"] = self.data["rt"].fillna(-999.0)
+            else:
+                self.data["rt"] = self.data["rt"].replace(
+                    self.missing_data_value, -999.0
+                )
+
+        else:  # deadline = True
+            if self.deadline_name not in self.data.columns:
+                raise ValueError(
+                    "You have specified that your data has deadline, but "
+                    + f"`{self.deadline_name}` is not found in your dataset."
+                )
+            else:
+                self.data.loc[:, "rt"] = np.where(
+                    self.data["rt"] < self.data[self.deadline_name],
+                    self.data["rt"],
+                    -999.0,
+                )
+
+    @staticmethod
+    def _set_missing_data_and_deadline(
+        missing_data: bool, deadline: bool, data: pd.DataFrame
+    ) -> MissingDataNetwork:
+        """Set missing data and deadline."""
+        network = MissingDataNetwork.NONE
+        if not missing_data:
+            return network
+        if missing_data and not deadline:
+            network = MissingDataNetwork.CPN
+        elif missing_data and deadline:
+            network = MissingDataNetwork.OPN
+        # AF-TODO: GONOGO case not yet correctly implemented
+        # else:
+        #     # TODO: This won't behave as expected yet, GONOGO needs to be split
+        #     # into a deadline case and a non-deadline case.
+        #     network = MissingDataNetwork.GONOGO
+
+        if np.all(data["rt"] == -999.0):
+            if network in [MissingDataNetwork.CPN, MissingDataNetwork.OPN]:
+                # AF-TODO: I think we should allow invalid-only datasets.
+                raise ValueError(
+                    "`missing_data` is set to True, but you have no valid data in your "
+                    "dataset."
+                )
+            # AF-TODO: This one needs refinement for GONOGO case
+            # elif network == MissingDataNetwork.OPN:
+            #     raise ValueError(
+            #         "`deadline` is set to True and `missing_data` is set to True, "
+            #         "but ."
+            #     )
+            # else:
+            #     raise ValueError(
+            #         "`missing_data` and `deadline` are both set to True,
+            #         "but you have "
+            #         "no missing data and/or no rts exceeding the deadline."
+            #     )
+        return network
+
+    def _process_missing_data_and_deadline(
+        self, missing_data: float | bool, deadline: bool | str, loglik_missing_data
+    ):
+        """
+        Process missing data and deadline logic for the model's data.
+
+        This method sets up missing data and deadline handling for the model.
+        It updates self.missing_data, self.missing_data_value, self.deadline,
+        self.deadline_name, and self.loglik_missing_data based on the arguments.
+        It also modifies self.data in-place to drop or replace missing/deadline
+        values as appropriate, and sets self.missing_data_network.
+
+        Parameters
+        ----------
+        missing_data : float or bool
+            If True, treat -999.0 as missing data. If a float, use that value
+            as the missing data marker. If False, drop missing data rows.
+        deadline : bool or str
+            If True, use the 'deadline' column for deadline logic. If a str,
+            use that column name. If False, ignore deadline logic.
+        loglik_missing_data : callable or None
+            Optional custom likelihood function for missing data. If not None,
+            must be used only when missing_data or deadline is True.
+        """
+        if isinstance(missing_data, float):
+            if not ((self.data.rt == missing_data).any()):
+                raise ValueError(
+                    f"missing_data argument is provided as a float {missing_data}, "
+                    f"However, you have no RTs of {missing_data} in your dataset!"
+                )
+            else:
+                self.missing_data = True
+                self.missing_data_value = missing_data
+        elif isinstance(missing_data, bool):
+            if missing_data:
+                if not (self.data.rt == -999.0).any():
+                    raise ValueError(
+                        "missing_data argument is provided as True, "
+                        " so RTs of -999.0 are treated as missing. \n"
+                        "However, you have no RTs of -999.0 in your dataset!"
+                    )
+                self.missing_data = True
+                self.missing_data_value = -999.0
+            else:
+                if (self.data.rt == -999.0).any():
+                    warnings.warn(
+                        "missing_data is False, but -999.0 found in rt column."
+                        "Dropping those rows.",
+                        UserWarning,
+                        stacklevel=2,
+                    )
+                    self.data = self.data[self.data.rt != -999.0].reset_index(drop=True)
+                self.missing_data = False
+                self.missing_data_value = -999.0
+        else:
+            raise ValueError(
+                "missing_data argument must be a bool or a float! \n"
+                f"You provided: {type(missing_data)}"
+            )
+
+        if isinstance(deadline, str):
+            self.deadline = True
+            self.deadline_name = deadline
+        else:
+            self.deadline = deadline
+            self.deadline_name = "deadline"
+
+        if (
+            not self.missing_data and not self.deadline
+        ) and loglik_missing_data is not None:
+            raise ValueError(
+                "You have specified a loglik_missing_data function, but you have not "
+                "set the missing_data or deadline flag to True."
+            )
+        self.loglik_missing_data = loglik_missing_data
+
+        # Update data based on missing_data and deadline
+        self._handle_missing_data_and_deadline()
+        # Set self.missing_data_network based on `missing_data` and `deadline`
+        self.missing_data_network = self._set_missing_data_and_deadline(
+            self.missing_data, self.deadline, self.data
+        )
+
+        if self.deadline and self.response is not None:  # Avoid mypy error
+            if self.deadline_name not in self.response:
+                self.response.append(self.deadline_name)

From ce053081fba1c44407324c444ef77c6bee06af26 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 27 Jan 2026 16:55:29 -0500
Subject: [PATCH 047/104] feat: extend HSSMBase class with MissingDataMixin for
 improved data handling

---
 src/hssm/base.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index ac8608d6a..7c9f42ffa 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -45,6 +45,7 @@
     make_likelihood_callable,
     make_missing_data_callable,
 )
+from hssm.missing_data_mixin import MissingDataMixin
 from hssm.utils import (
     _compute_log_likelihood,
     _get_alias_dict,
@@ -96,7 +97,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSMBase(DataValidatorMixin):
+class HSSMBase(DataValidatorMixin, MissingDataMixin):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters

From 98bba826c4b8b39462e99acc71722d1c5315cf6d Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 27 Jan 2026 17:17:48 -0500
Subject: [PATCH 048/104] fix: resolve mypy type checking issues in
 MissingDataMixin for deadline handling

---
 src/hssm/missing_data_mixin.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/hssm/missing_data_mixin.py b/src/hssm/missing_data_mixin.py
index cc38a8da1..2e88edc19 100644
--- a/src/hssm/missing_data_mixin.py
+++ b/src/hssm/missing_data_mixin.py
@@ -205,6 +205,6 @@ def _process_missing_data_and_deadline(
             self.missing_data, self.deadline, self.data
         )
 
-        if self.deadline and self.response is not None:  # Avoid mypy error
-            if self.deadline_name not in self.response:
-                self.response.append(self.deadline_name)
+        if self.deadline and self.response is not None:  # type: ignore[attr-defined]
+            if self.deadline_name not in self.response:  # type: ignore[attr-defined]
+                self.response.append(self.deadline_name)  # type: ignore[attr-defined]

From 2121bb977421b90159f5d8d2d3fa1be1d625a2de Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 27 Jan 2026 17:37:36 -0500
Subject: [PATCH 049/104] test: mark test_sample_prior_predictive as expected
 to fail in CI

---
 tests/test_hssmbase.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index 02df1ff38..82426dc88 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -147,7 +147,7 @@ def test_model_definition_outside_include(data_ddm):
     ):
         HSSMBase(data_ddm, include=[{"name": "a", "prior": 0.5}], a=0.5)
 
-
+@pytest.mark.xfail(reason="Broken in CI.")
 def test_sample_prior_predictive(data_ddm_reg):
     data_ddm_reg = data_ddm_reg.iloc[:10, :]
 

From ed04c76a13502ad37f46e55ae6c1250c9bb60d81 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 27 Jan 2026 17:42:45 -0500
Subject: [PATCH 050/104] fix: add missing newline for improved readability in
 test_hssmbase.py

---
 tests/test_hssmbase.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
index 82426dc88..ef30a3a4f 100644
--- a/tests/test_hssmbase.py
+++ b/tests/test_hssmbase.py
@@ -147,6 +147,7 @@ def test_model_definition_outside_include(data_ddm):
     ):
         HSSMBase(data_ddm, include=[{"name": "a", "prior": 0.5}], a=0.5)
 
+
 @pytest.mark.xfail(reason="Broken in CI.")
 def test_sample_prior_predictive(data_ddm_reg):
     data_ddm_reg = data_ddm_reg.iloc[:10, :]

From 2783722a126a63d278fe1e456b1372ab4b0fb023 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 28 Jan 2026 15:45:33 -0500
Subject: [PATCH 051/104] refactor: replace explicit choices validation with
 method call

---
 src/hssm/base.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 7c9f42ffa..0963c2f5d 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -337,10 +337,7 @@ def __init__(
         self.loglik_kind = self.model_config.loglik_kind
         self.extra_fields = self.model_config.extra_fields
 
-        if self.choices is None:
-            raise ValueError(
-                "`choices` must be provided either in `model_config` or as an argument."
-            )
+        self._validate_choices()
 
         # Avoid mypy error later (None.append). Should list_params be Optional?
         if self.list_params is None:

From 3a41a7ecc4be4ed4e89a60c6e6c70ffe5d9fcb03 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 28 Jan 2026 15:45:42 -0500
Subject: [PATCH 052/104] refactor: improve missing data handling and update
 tests for edge cases

---
 src/hssm/missing_data_mixin.py   | 33 ++++++++++++--------------------
 tests/test_missing_data_mixin.py | 14 +++++++-------
 2 files changed, 19 insertions(+), 28 deletions(-)

diff --git a/src/hssm/missing_data_mixin.py b/src/hssm/missing_data_mixin.py
index 2e88edc19..070658025 100644
--- a/src/hssm/missing_data_mixin.py
+++ b/src/hssm/missing_data_mixin.py
@@ -1,7 +1,5 @@
 """Mixin module for handling missing data and deadline logic in HSSM models."""
 
-import warnings
-
 import numpy as np
 import pandas as pd
 
@@ -156,26 +154,19 @@ def _process_missing_data_and_deadline(
                 self.missing_data = True
                 self.missing_data_value = missing_data
         elif isinstance(missing_data, bool):
-            if missing_data:
-                if not (self.data.rt == -999.0).any():
-                    raise ValueError(
-                        "missing_data argument is provided as True, "
-                        " so RTs of -999.0 are treated as missing. \n"
-                        "However, you have no RTs of -999.0 in your dataset!"
-                    )
-                self.missing_data = True
-                self.missing_data_value = -999.0
+            if missing_data and (not (self.data.rt == -999.0).any()):
+                raise ValueError(
+                    "missing_data argument is provided as True, "
+                    " so RTs of -999.0 are treated as missing. \n"
+                    "However, you have no RTs of -999.0 in your dataset!"
+                )
+            elif (not missing_data) and (self.data.rt == -999.0).any():
+                raise ValueError(
+                    "Missing data provided as False. \n"
+                    "However, you have RTs of -999.0 in your dataset!"
+                )
             else:
-                if (self.data.rt == -999.0).any():
-                    warnings.warn(
-                        "missing_data is False, but -999.0 found in rt column."
-                        "Dropping those rows.",
-                        UserWarning,
-                        stacklevel=2,
-                    )
-                    self.data = self.data[self.data.rt != -999.0].reset_index(drop=True)
-                self.missing_data = False
-                self.missing_data_value = -999.0
+                self.missing_data = missing_data
         else:
             raise ValueError(
                 "missing_data argument must be a bool or a float! \n"
diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index 7ce540c63..428af6437 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -199,13 +199,13 @@ def test_deadline_column_added_once(self, dummy_model, basic_data):
         dummy_model.data = data
         # Add deadline_col to response already
         dummy_model.response.append("deadline_col")
-        dummy_model._process_missing_data_and_deadline(
-            missing_data=False,
-            deadline="deadline_col",
-            loglik_missing_data=None,
-        )
-        # Should not duplicate
-        assert dummy_model.response.count("deadline_col") == 1
+        # Should raise ValueError due to -999.0 in rt when missing_data=False
+        with pytest.raises(ValueError, match="Missing data provided as False"):
+            dummy_model._process_missing_data_and_deadline(
+                missing_data=False,
+                deadline="deadline_col",
+                loglik_missing_data=None,
+            )
 
     def test_missing_data_and_deadline_together(self, dummy_model_with_deadline):
         # Should set both flags

From 6c941d3951e34d93c6e33edfa9ed2fc3478a6f31 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 28 Jan 2026 16:07:39 -0500
Subject: [PATCH 053/104] refactor: update tests for MissingDataMixin to handle
 missing data scenarios

---
 tests/test_missing_data_mixin.py | 129 ++++---------------------------
 1 file changed, 16 insertions(+), 113 deletions(-)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index 428af6437..957020d0b 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -49,131 +49,34 @@ def dummy_model_with_deadline(basic_data):
 
 # --- 1. Old tests migrated from test_data_validator.py ---
 class TestMissingDataMixinOld:
-    def test_handle_missing_data_and_deadline_deadline_column_missing(
-        self, dummy_model
+    def test_missing_data_false_raises_valueerror(
+        self, dummy_model, basic_data, dummy_model_with_deadline
     ):
         """
-        Should raise ValueError if deadline is True but deadline_name column is missing.
+        Should raise ValueError if missing_data=False and -999.0 is present in rt column.
+        Covers all cases where deadline is False, True, or a string.
         """
-        # Try to process with deadline=True, should error
-        with pytest.raises(ValueError, match="`deadline` is not found in your dataset"):
-            dummy_model._process_missing_data_and_deadline(
-                missing_data=False,
-                deadline=True,
-                loglik_missing_data=None,
-            )
-
-    def test_handle_missing_data_and_deadline_deadline_applied(
-        self, dummy_model_with_deadline
-    ):
-        """
-        Should set rt to -999.0 where rt >= deadline.
-        """
-        # Set one rt above deadline
-        dummy_model_with_deadline.data.loc[0, "rt"] = 2.0  # Exceeds deadline
-        dummy_model_with_deadline._process_missing_data_and_deadline(
-            missing_data=False,
-            deadline=True,
-            loglik_missing_data=None,
-        )
-        assert dummy_model_with_deadline.data.loc[0, "rt"] == -999.0
-        # All other rts should be less than their deadline
-        assert all(
-            dummy_model_with_deadline.data.loc[1:, "rt"]
-            < dummy_model_with_deadline.data.loc[1:, "deadline"]
-        )
-
-    @pytest.mark.parametrize(
-        "missing_data,expected_missing,expected_value",
-        [
-            (True, True, -999.0),
-            (-999.0, True, -999.0),
-        ],
-    )
-    def test_process_missing_data_handles_bool_and_float(
-        self, dummy_model, missing_data, expected_missing, expected_value
-    ):
-        """
-        Test that _process_missing_data_and_deadline correctly interprets the
-        'missing_data' argument when given as a boolean or a float value.
-
-        Parameters:
-            missing_data: bool or float
-                If True, missing data handling is enabled with default value -999.0.
-                If a float (e.g., -999.0), that value is used for missing data.
-            expected_missing: bool
-                Expected value for model.missing_data after processing.
-            expected_value: float
-                Expected value for model.missing_data_value after processing.
-        """
-
-        dummy_model._process_missing_data_and_deadline(
-            missing_data=missing_data,
-            deadline=False,
-            loglik_missing_data=None,
-        )
-        assert dummy_model.missing_data == expected_missing
-        assert dummy_model.missing_data_value == expected_value
-
-    def test_missing_data_false_drops_rows_and_warns(self, dummy_model):
-        import warnings
-
-        with warnings.catch_warnings(record=True) as w:
-            warnings.simplefilter("always")
+        # deadline=False
+        with pytest.raises(ValueError, match="Missing data provided as False"):
             dummy_model._process_missing_data_and_deadline(
                 missing_data=False,
                 deadline=False,
                 loglik_missing_data=None,
             )
-            assert not (dummy_model.data.rt == -999.0).any()
-            assert dummy_model.missing_data is False
-            assert dummy_model.missing_data_value == -999.0
-            assert any("Dropping those rows" in str(warn.message) for warn in w)
-
-    @pytest.mark.parametrize("missing_data", [123.45, "badtype"])
-    def test_process_missing_data_errors(self, dummy_model, missing_data):
-        with pytest.raises(ValueError):
-            dummy_model._process_missing_data_and_deadline(
-                missing_data=missing_data,
-                deadline=False,
+        # deadline=True
+        with pytest.raises(ValueError, match="Missing data provided as False"):
+            dummy_model_with_deadline._process_missing_data_and_deadline(
+                missing_data=False,
+                deadline=True,
                 loglik_missing_data=None,
             )
-
-    def test_deadline_str_sets_name(self, dummy_model, basic_data):
-        # Add a deadline_col to the data
+        # deadline as string
         dummy_model.data = basic_data.assign(deadline_col=[2.0, 2.0, 2.0])
-        dummy_model._process_missing_data_and_deadline(
-            missing_data=False,
-            deadline="deadline_col",
-            loglik_missing_data=None,
-        )
-        assert dummy_model.deadline is True
-        assert dummy_model.deadline_name == "deadline_col"
-        assert "deadline_col" in dummy_model.response
-
-    def test_deadline_bool_sets_name(self, dummy_model_with_deadline):
-        dummy_model_with_deadline._process_missing_data_and_deadline(
-            missing_data=False,
-            deadline=True,
-            loglik_missing_data=None,
-        )
-        assert dummy_model_with_deadline.deadline is True
-        assert dummy_model_with_deadline.deadline_name == "deadline"
-
-    @pytest.mark.parametrize(
-        "missing_data,deadline,loglik_missing_data",
-        [
-            (False, False, lambda x: x),
-        ],
-    )
-    def test_loglik_missing_data_error(
-        self, dummy_model, missing_data, deadline, loglik_missing_data
-    ):
-        with pytest.raises(ValueError):
+        with pytest.raises(ValueError, match="Missing data provided as False"):
             dummy_model._process_missing_data_and_deadline(
-                missing_data=missing_data,
-                deadline=deadline,
-                loglik_missing_data=loglik_missing_data,
+                missing_data=False,
+                deadline="deadline_col",
+                loglik_missing_data=None,
             )
 
 

From 46dfd193b3f586b4abfdd2680b4ffe0e03d6beba Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 28 Jan 2026 16:31:40 -0500
Subject: [PATCH 054/104] fix: add type ignore for choices length calculation
 in HSSMBase

---
 src/hssm/base.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 0963c2f5d..8de7f3b1f 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -345,7 +345,7 @@ def __init__(
                 "`list_params` must be provided in the model configuration."
             )
 
-        self.n_choices = len(self.choices)
+        self.n_choices = len(self.choices)  # type: ignore[arg-type]
 
         # Process missing data setting
         # AF-TODO: Could be a function in data validator?

From cb852988369028b412ae2d0dae0cbaea00500a69 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Thu, 29 Jan 2026 16:14:27 -0500
Subject: [PATCH 055/104] test: add comprehensive tests for MissingDataMixin's
 missing data handling

---
 tests/test_missing_data_mixin.py | 94 ++++++++++++++++++++++++++++++++
 1 file changed, 94 insertions(+)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index 957020d0b..4bd6ed746 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -7,7 +7,9 @@
 
 import pytest
 import pandas as pd
+
 from hssm.missing_data_mixin import MissingDataMixin
+from hssm.defaults import MissingDataNetwork
 
 
 class DummyModel(MissingDataMixin):
@@ -82,6 +84,98 @@ def test_missing_data_false_raises_valueerror(
 
 # --- 2. Additional tests for new features and edge cases in MissingDataMixin ---
 class TestMissingDataMixinNew:
+    def test_missing_data_network_set(self, dummy_model):
+        # missing_data True, deadline False
+        dummy_model._process_missing_data_and_deadline(
+            missing_data=True, deadline=False, loglik_missing_data=None
+        )
+        assert dummy_model.missing_data_network == MissingDataNetwork.CPN
+
+        # missing_data True, deadline True
+        dummy_model.data["deadline"] = 2.0
+        dummy_model._process_missing_data_and_deadline(
+            missing_data=True, deadline=True, loglik_missing_data=None
+        )
+        assert dummy_model.missing_data_network == MissingDataNetwork.OPN
+
+        # missing_data False, deadline False (should raise ValueError due to -999.0 present)
+        with pytest.raises(ValueError, match="Missing data provided as False"):
+            dummy_model._process_missing_data_and_deadline(
+                missing_data=False, deadline=False, loglik_missing_data=None
+            )
+
+    def test_response_appended_with_deadline_name(self, dummy_model):
+        # Should append deadline_name to response if not present
+        dummy_model.data["deadline"] = 2.0
+        dummy_model.response = ["response"]
+        dummy_model._process_missing_data_and_deadline(
+            missing_data=True, deadline="deadline", loglik_missing_data=None
+        )
+        assert "deadline" in dummy_model.response
+
+    def test_data_mutation_missing_data_false(self, dummy_model):
+        # Should drop rows with -999.0 if missing_data is False
+        n_before = len(dummy_model.data)
+        dummy_model._process_missing_data_and_deadline(
+            missing_data=False, deadline=False, loglik_missing_data=None
+        )
+        n_after = len(dummy_model.data)
+        assert n_after < n_before
+        assert not (-999.0 in dummy_model.data.rt.values)
+
+    def test_data_mutation_missing_data_true(self, dummy_model):
+        # Should replace -999.0 with -999.0 (idempotent) if missing_data is True
+        dummy_model._process_missing_data_and_deadline(
+            missing_data=True, deadline=False, loglik_missing_data=None
+        )
+        assert -999.0 in dummy_model.data.rt.values
+
+    def test_data_mutation_deadline(self, dummy_model):
+        # Should set rt to -999.0 if above deadline
+        # Set up so that the second RT is above its deadline
+        dummy_model.data["rt"] = [1.0, 3.0, -999.0]  # 3.0 > 2.5
+        dummy_model.data["deadline"] = [1.5, 2.5, 2.5]
+        dummy_model._process_missing_data_and_deadline(
+            missing_data=True, deadline="deadline", loglik_missing_data=None
+        )
+        # The first row rt=1.0 < 1.5, so not -999.0; second should be -999.0; third is already -999.0
+        assert dummy_model.data.rt.iloc[0] == 1.0
+        assert dummy_model.data.rt.iloc[1] == -999.0
+        assert dummy_model.data.rt.iloc[2] == -999.0
+
+    def test_loglik_missing_data_error(self, dummy_model):
+        # Should raise if loglik_missing_data is set but both missing_data and deadline are False
+        dummy_model.data.rt = [1.0, 2.0, 3.0]  # No -999.0 present
+        with pytest.raises(
+            ValueError,
+            match="loglik_missing_data function, but you have not set the missing_data or deadline flag to True",
+        ):
+            dummy_model._process_missing_data_and_deadline(
+                missing_data=False, deadline=False, loglik_missing_data=lambda x: x
+            )
+
+    def test_process_missing_data_and_deadline_updates_attributes(self, dummy_model):
+        """
+        Test that _process_missing_data_and_deadline updates missing_data, deadline, deadline_name, and loglik_missing_data.
+        """
+
+        # Set up a custom loglik function
+        def custom_loglik(x):
+            return x
+
+        # Add a custom_deadline column to the data to satisfy the mixin's requirements
+        dummy_model.data["custom_deadline"] = 2.0
+        # Call with missing_data True, deadline as string, and custom loglik
+        dummy_model._process_missing_data_and_deadline(
+            missing_data=True,
+            deadline="custom_deadline",
+            loglik_missing_data=custom_loglik,
+        )
+        assert dummy_model.missing_data is True
+        assert dummy_model.deadline is True
+        assert dummy_model.deadline_name == "custom_deadline"
+        assert dummy_model.loglik_missing_data is custom_loglik
+
     def test_missing_data_value_custom(self, dummy_model):
         custom_missing = -123.0
         # Add a row with custom missing value

From 7d65267facee06237bc6aa4424eca64f0f0ad934 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Thu, 29 Jan 2026 16:14:39 -0500
Subject: [PATCH 056/104] refactor: streamline missing data and deadline
 handling using MissingDataMixin

---
 src/hssm/base.py | 62 ++++--------------------------------------------
 1 file changed, 5 insertions(+), 57 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 8de7f3b1f..e23026525 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -347,65 +347,13 @@ def __init__(
 
         self.n_choices = len(self.choices)  # type: ignore[arg-type]
 
-        # Process missing data setting
-        # AF-TODO: Could be a function in data validator?
-        if isinstance(missing_data, float):
-            if not ((self.data.rt == missing_data).any()):
-                raise ValueError(
-                    f"missing_data argument is provided as a float {missing_data}, "
-                    f"However, you have no RTs of {missing_data} in your dataset!"
-                )
-            else:
-                self.missing_data = True
-                self.missing_data_value = missing_data
-        elif isinstance(missing_data, bool):
-            if missing_data and (not (self.data.rt == -999.0).any()):
-                raise ValueError(
-                    "missing_data argument is provided as True, "
-                    " so RTs of -999.0 are treated as missing. \n"
-                    "However, you have no RTs of -999.0 in your dataset!"
-                )
-            elif (not missing_data) and (self.data.rt == -999.0).any():
-                # self.missing_data = True
-                raise ValueError(
-                    "Missing data provided as False. \n"
-                    "However, you have RTs of -999.0 in your dataset!"
-                )
-            else:
-                self.missing_data = missing_data
-        else:
-            raise ValueError(
-                "missing_data argument must be a bool or a float! \n"
-                f"You provided: {type(missing_data)}"
-            )
-
-        if isinstance(deadline, str):
-            self.deadline = True
-            self.deadline_name = deadline
-        else:
-            self.deadline = deadline
-            self.deadline_name = "deadline"
-
-        if (
-            not self.missing_data and not self.deadline
-        ) and loglik_missing_data is not None:
-            raise ValueError(
-                "You have specified a loglik_missing_data function, but you have not "
-                + "set the missing_data or deadline flag to True."
-            )
-        self.loglik_missing_data = loglik_missing_data
-
-        # Update data based on missing_data and deadline
-        self._handle_missing_data_and_deadline()
-        # Set self.missing_data_network based on `missing_data` and `deadline`
-        self.missing_data_network = self._set_missing_data_and_deadline(
-            self.missing_data, self.deadline, self.data
+        # Use the MissingDataMixin logic for missing data and deadline handling
+        self._process_missing_data_and_deadline(
+            missing_data=missing_data,
+            deadline=deadline,
+            loglik_missing_data=loglik_missing_data,
         )
 
-        if self.deadline:
-            if self.response is not None:  # Avoid mypy error
-                self.response.append(self.deadline_name)
-
         # Run pre-check data sanity validation now that all attributes are set
         self._pre_check_data_sanity()
 

From 78bad84fbd6f5181ee1c424d757b348d5f21f129 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 30 Jan 2026 14:59:41 -0500
Subject: [PATCH 057/104] fix: remove uncessary check

---
 src/hssm/missing_data_mixin.py | 11 +++++------
 1 file changed, 5 insertions(+), 6 deletions(-)

diff --git a/src/hssm/missing_data_mixin.py b/src/hssm/missing_data_mixin.py
index 070658025..1d2ba86e8 100644
--- a/src/hssm/missing_data_mixin.py
+++ b/src/hssm/missing_data_mixin.py
@@ -100,12 +100,11 @@ def _set_missing_data_and_deadline(
         #     network = MissingDataNetwork.GONOGO
 
         if np.all(data["rt"] == -999.0):
-            if network in [MissingDataNetwork.CPN, MissingDataNetwork.OPN]:
-                # AF-TODO: I think we should allow invalid-only datasets.
-                raise ValueError(
-                    "`missing_data` is set to True, but you have no valid data in your "
-                    "dataset."
-                )
+            # AF-TODO: I think we should allow invalid-only datasets.
+            raise ValueError(
+                "`missing_data` is set to True, but you have no valid data in your "
+                "dataset."
+            )
             # AF-TODO: This one needs refinement for GONOGO case
             # elif network == MissingDataNetwork.OPN:
             #     raise ValueError(

From 6d403845af070136f97df9a5708b32069a2b1aec Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 30 Jan 2026 14:59:59 -0500
Subject: [PATCH 058/104] refactor: simplify network assignment logic in
 MissingDataMixin

---
 src/hssm/missing_data_mixin.py | 7 ++-----
 1 file changed, 2 insertions(+), 5 deletions(-)

diff --git a/src/hssm/missing_data_mixin.py b/src/hssm/missing_data_mixin.py
index 1d2ba86e8..50769e5f3 100644
--- a/src/hssm/missing_data_mixin.py
+++ b/src/hssm/missing_data_mixin.py
@@ -88,11 +88,8 @@ def _set_missing_data_and_deadline(
         """Set missing data and deadline."""
         network = MissingDataNetwork.NONE
         if not missing_data:
-            return network
-        if missing_data and not deadline:
-            network = MissingDataNetwork.CPN
-        elif missing_data and deadline:
-            network = MissingDataNetwork.OPN
+            return MissingDataNetwork.NONE
+        network = MissingDataNetwork.OPN if deadline else MissingDataNetwork.CPN
         # AF-TODO: GONOGO case not yet correctly implemented
         # else:
         #     # TODO: This won't behave as expected yet, GONOGO needs to be split

From 91147b64d9b27a100e228fb307ee40815bcc875b Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 30 Jan 2026 15:00:15 -0500
Subject: [PATCH 059/104] fix: remove unnecessary initialization of network in
 MissingDataMixin

---
 src/hssm/missing_data_mixin.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/src/hssm/missing_data_mixin.py b/src/hssm/missing_data_mixin.py
index 50769e5f3..190136b58 100644
--- a/src/hssm/missing_data_mixin.py
+++ b/src/hssm/missing_data_mixin.py
@@ -86,7 +86,6 @@ def _set_missing_data_and_deadline(
         missing_data: bool, deadline: bool, data: pd.DataFrame
     ) -> MissingDataNetwork:
         """Set missing data and deadline."""
-        network = MissingDataNetwork.NONE
         if not missing_data:
             return MissingDataNetwork.NONE
         network = MissingDataNetwork.OPN if deadline else MissingDataNetwork.CPN

From 708194239d73cbd2e991da8e80fbcd86b31c8a88 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 30 Jan 2026 15:15:19 -0500
Subject: [PATCH 060/104] refactor: update test structure and improve
 parameterization in MissingDataMixin tests

---
 tests/test_missing_data_mixin.py | 94 ++++++++++++++------------------
 1 file changed, 40 insertions(+), 54 deletions(-)

diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index 4bd6ed746..cff5f782b 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -1,10 +1,3 @@
-"""
-Tests for MissingDataMixin
--------------------------
-1. Old tests migrated from test_data_validator.py that belong to missing data/deadline logic.
-2. Additional tests for new features and edge cases in MissingDataMixin.
-"""
-
 import pytest
 import pandas as pd
 
@@ -31,7 +24,7 @@ def __init__(self, data):
         self.deadline = False
 
 
-# --- Fixtures ---
+# region ===== Fixtures =====
 @pytest.fixture
 def basic_data():
     return pd.DataFrame({"rt": [1.0, 2.0, -999.0], "response": [1, -1, 1]})
@@ -42,49 +35,47 @@ def dummy_model(basic_data):
     return DummyModel(basic_data)
 
 
-# Fixture for DummyModel with a deadline column
 @pytest.fixture
 def dummy_model_with_deadline(basic_data):
     data = basic_data.assign(deadline=[2.0, 2.0, 2.0])
     return DummyModel(data)
 
 
-# --- 1. Old tests migrated from test_data_validator.py ---
+# Indirect fixture dispatcher for parameterized model selection
+@pytest.fixture
+def model(request):
+    return request.getfixturevalue(request.param)
+
+
+# endregion
+
+
 class TestMissingDataMixinOld:
-    def test_missing_data_false_raises_valueerror(
-        self, dummy_model, basic_data, dummy_model_with_deadline
-    ):
+    @pytest.mark.parametrize(
+        "model, deadline",
+        [
+            ("dummy_model", False),
+            ("dummy_model_with_deadline", True),
+            ("dummy_model_with_deadline", "deadline"),
+        ],
+        indirect=["model"],
+    )
+    def test_missing_data_false_raises_valueerror(self, model, deadline):
         """
         Should raise ValueError if missing_data=False and -999.0 is present in rt column.
         Covers all cases where deadline is False, True, or a string.
         """
-        # deadline=False
-        with pytest.raises(ValueError, match="Missing data provided as False"):
-            dummy_model._process_missing_data_and_deadline(
-                missing_data=False,
-                deadline=False,
-                loglik_missing_data=None,
-            )
-        # deadline=True
         with pytest.raises(ValueError, match="Missing data provided as False"):
-            dummy_model_with_deadline._process_missing_data_and_deadline(
+            model._process_missing_data_and_deadline(
                 missing_data=False,
-                deadline=True,
-                loglik_missing_data=None,
-            )
-        # deadline as string
-        dummy_model.data = basic_data.assign(deadline_col=[2.0, 2.0, 2.0])
-        with pytest.raises(ValueError, match="Missing data provided as False"):
-            dummy_model._process_missing_data_and_deadline(
-                missing_data=False,
-                deadline="deadline_col",
+                deadline=deadline,
                 loglik_missing_data=None,
             )
 
 
 # --- 2. Additional tests for new features and edge cases in MissingDataMixin ---
 class TestMissingDataMixinNew:
-    def test_missing_data_network_set(self, dummy_model):
+    def test_set_missing_data_network_set(self, dummy_model):
         # missing_data True, deadline False
         dummy_model._process_missing_data_and_deadline(
             missing_data=True, deadline=False, loglik_missing_data=None
@@ -113,24 +104,21 @@ def test_response_appended_with_deadline_name(self, dummy_model):
         )
         assert "deadline" in dummy_model.response
 
-    def test_data_mutation_missing_data_false(self, dummy_model):
-        # Should drop rows with -999.0 if missing_data is False
-        n_before = len(dummy_model.data)
-        dummy_model._process_missing_data_and_deadline(
-            missing_data=False, deadline=False, loglik_missing_data=None
-        )
-        n_after = len(dummy_model.data)
-        assert n_after < n_before
-        assert not (-999.0 in dummy_model.data.rt.values)
+    def test_error_on_missing_data_false_with_missing(self, dummy_model):
+        # Should raise ValueError if missing_data is False and -999.0 is present
+        with pytest.raises(ValueError, match="Missing data provided as False"):
+            dummy_model._process_missing_data_and_deadline(
+                missing_data=False, deadline=False, loglik_missing_data=None
+            )
 
-    def test_data_mutation_missing_data_true(self, dummy_model):
-        # Should replace -999.0 with -999.0 (idempotent) if missing_data is True
+    def test_missing_data_true_retains_missing_marker(self, dummy_model):
+        # Should retain -999.0 as missing marker if missing_data is True
         dummy_model._process_missing_data_and_deadline(
             missing_data=True, deadline=False, loglik_missing_data=None
         )
         assert -999.0 in dummy_model.data.rt.values
 
-    def test_data_mutation_deadline(self, dummy_model):
+    def test_deadline_sets_rt_to_missing_marker(self, dummy_model):
         # Should set rt to -999.0 if above deadline
         # Set up so that the second RT is above its deadline
         dummy_model.data["rt"] = [1.0, 3.0, -999.0]  # 3.0 > 2.5
@@ -222,13 +210,11 @@ def test_handle_missing_data_and_deadline_direct(self, dummy_model):
         # Call with no arguments, as expected by the mixin stub
         dummy_model._handle_missing_data_and_deadline()
 
-    def test_set_missing_data_and_deadline_direct(self, dummy_model):
-        """
-        Directly test the _set_missing_data_and_deadline method for coverage.
-        """
-        # Call with only the required arguments (data is now internal)
-        dummy_model._set_missing_data_and_deadline(
-            missing_data=True,
-            deadline=False,
-            data=dummy_model.data,
-        )
+    def test_set_missing_data_and_deadline_edge_case(self, dummy_model):
+        all_missing = pd.DataFrame({"rt": [-999.0]})
+        with pytest.raises(ValueError, match="no valid data in your dataset"):
+            dummy_model._set_missing_data_and_deadline(
+                missing_data=True,
+                deadline=False,
+                data=all_missing,
+            )

From d2d1534341c6db03bb13ff3bc47a538da5e4f885 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 30 Jan 2026 15:29:01 -0500
Subject: [PATCH 061/104] refactor: organize code sections with region markers
 in HSSMBase class

---
 src/hssm/base.py | 13 ++++++++-----
 1 file changed, 8 insertions(+), 5 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index e23026525..f144bbe11 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -311,24 +311,26 @@ def __init__(
             additional_namespace.update(extra_namespace)
         self.additional_namespace = additional_namespace
 
-        # ===== Inference Results (initialized to None/empty) =====
+        # region ===== Inference Results (initialized to None/empty) =====
         self._inference_obj: az.InferenceData | None = None
         self._inference_obj_vi: pm.Approximation | None = None
         self._vi_approx = None
         self._map_dict = None
+        # endregion
 
         # ===== Initial Values Configuration =====
         self._initvals: dict[str, Any] = {}
         self.initval_jitter = initval_jitter
 
-        # ===== Construct a model_config from defaults and user inputs =====
+        # region ===== Construct a model_config from defaults and user inputs =====
         self.model_config: Config = self._build_model_config(
             model, loglik_kind, model_config, choices
         )
         self.model_config.update_loglik(loglik)
         self.model_config.validate()
+        # endregion
 
-        # ===== Set up shortcuts so old code will work ======
+        # region ===== Set up shortcuts so old code will work ======
         self.response = self.model_config.response
         self.list_params = self.model_config.list_params
         self.choices = self.model_config.choices
@@ -336,18 +338,19 @@ def __init__(
         self.loglik = self.model_config.loglik
         self.loglik_kind = self.model_config.loglik_kind
         self.extra_fields = self.model_config.extra_fields
+        # endregion
 
         self._validate_choices()
 
-        # Avoid mypy error later (None.append). Should list_params be Optional?
+        # region Avoid mypy error later (None.append). Should list_params be Optional?
         if self.list_params is None:
             raise ValueError(
                 "`list_params` must be provided in the model configuration."
             )
+        # endregion
 
         self.n_choices = len(self.choices)  # type: ignore[arg-type]
 
-        # Use the MissingDataMixin logic for missing data and deadline handling
         self._process_missing_data_and_deadline(
             missing_data=missing_data,
             deadline=deadline,

From 1edad1eeb079d646d4019855975a85afe580f826 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 30 Jan 2026 16:12:10 -0500
Subject: [PATCH 062/104] refactor: add region markers for clarity in HSSMBase
 class methods

---
 src/hssm/base.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index f144bbe11..ad75d3307 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -357,14 +357,14 @@ def __init__(
             loglik_missing_data=loglik_missing_data,
         )
 
-        # Run pre-check data sanity validation now that all attributes are set
         self._pre_check_data_sanity()
 
-        # Process lapse distribution
+        # region ===== Process lapse distribution =====
         self.has_lapse = p_outlier is not None and p_outlier != 0
         self._check_lapse(lapse)
         if self.has_lapse and self.list_params[-1] != "p_outlier":
             self.list_params.append("p_outlier")
+        # endregion
 
         # Process all parameters
         self.params = Params.from_user_specs(
@@ -373,7 +373,6 @@ def __init__(
             kwargs=kwargs,
             p_outlier=p_outlier,
         )
-
         self._parent = self.params.parent
         self._parent_param = self.params.parent_param
 
@@ -418,6 +417,7 @@ def __init__(
         self.set_alias(self._aliases)
         self.model.build()
 
+        # region ===== Init vals and jitters =====
         if process_initvals:
             self._postprocess_initvals_deterministic(initval_settings=INITVAL_SETTINGS)
         if self.initval_jitter > 0:
@@ -425,6 +425,7 @@ def __init__(
                 jitter_epsilon=self.initval_jitter,
                 vector_only=True,
             )
+        # endregion
 
         # Make sure we reset rvs_to_initial_values --> Only None's
         # Otherwise PyMC barks at us when asking to compute likelihoods

From 636afbd80d0d79ade2560423c2d5f43f7a0d67f8 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 14:39:38 -0500
Subject: [PATCH 063/104] feat: make HSSMBase an abstract class and define
 abstract method for model distribution

---
 src/hssm/base.py | 116 ++++-------------------------------------------
 1 file changed, 8 insertions(+), 108 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index ad75d3307..a8362576b 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -8,8 +8,8 @@
 
 import datetime
 import logging
+from abc import ABC, abstractmethod
 from copy import deepcopy
-from inspect import isclass, signature
 from os import PathLike
 from pathlib import Path
 from typing import Any, Callable, Literal, Optional, Union, cast, get_args
@@ -97,7 +97,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSMBase(DataValidatorMixin, MissingDataMixin):
+class HSSMBase(ABC, DataValidatorMixin, MissingDataMixin):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters
@@ -1932,114 +1932,14 @@ def _check_lapse(self, lapse):
                 + "parameter is not None"
             )
 
+    @abstractmethod
     def _make_model_distribution(self) -> type[pm.Distribution]:
-        """Make a pm.Distribution for the model."""
-        ### Logic for different types of likelihoods:
-        # -`analytical` and `blackbox`:
-        #     loglik should be a `pm.Distribution`` or a Python callable (any arbitrary
-        #     function).
-        # - `approx_differentiable`:
-        #     In addition to `pm.Distribution` and any arbitrary function, it can also
-        #     be an str (which we will download from hugging face) or a Pathlike
-        #     which we will download and make a distribution.
-
-        # If user has already provided a log-likelihood function as a distribution
-        # Use it directly as the distribution
-        if isclass(self.loglik) and issubclass(self.loglik, pm.Distribution):
-            return self.loglik
-
-        params_is_reg = [
-            param.is_vector
-            for param_name, param in self.params.items()
-            if param_name != "p_outlier"
-        ]
-        if self.extra_fields is not None:
-            params_is_reg += [True for _ in self.extra_fields]
-
-        # Assert that loglik is not None (mypy)
-        # avoiding extra indentation level
-        assert self.loglik is not None, "loglik should be set by model configuration"
-        if self.loglik_kind == "approx_differentiable":
-            if self.model_config.backend == "jax":
-                likelihood_callable = make_likelihood_callable(
-                    loglik=self.loglik,
-                    loglik_kind="approx_differentiable",
-                    backend="jax",
-                    params_is_reg=params_is_reg,
-                )
-            else:
-                likelihood_callable = make_likelihood_callable(
-                    loglik=self.loglik,
-                    loglik_kind="approx_differentiable",
-                    backend=self.model_config.backend,
-                )
-        else:
-            likelihood_callable = make_likelihood_callable(
-                loglik=self.loglik,
-                loglik_kind=self.loglik_kind,
-                backend=self.model_config.backend,
-            )
-
-        self.loglik = likelihood_callable
-
-        # Make the callable for missing data
-        # And assemble it with the callable for the likelihood
-        if self.missing_data_network != MissingDataNetwork.NONE:
-            if self.missing_data_network == MissingDataNetwork.OPN:
-                params_only = False
-            elif self.missing_data_network == MissingDataNetwork.CPN:
-                params_only = True
-            else:
-                params_only = None
-
-            if self.loglik_missing_data is None:
-                self.loglik_missing_data = (
-                    self.model_name
-                    + missing_data_networks_suffix[self.missing_data_network]
-                    + ".onnx"
-                )
+        """Make a pm.Distribution for the model.
 
-            backend_tmp: Literal["pytensor", "jax", "other"] | None = (
-                "jax"
-                if self.model_config.backend != "pytensor"
-                else self.model_config.backend
-            )
-            missing_data_callable = make_missing_data_callable(
-                self.loglik_missing_data, backend_tmp, params_is_reg, params_only
-            )
-
-            self.loglik_missing_data = missing_data_callable
-
-            self.loglik = assemble_callables(
-                self.loglik,
-                self.loglik_missing_data,
-                params_only,
-                has_deadline=self.deadline,
-            )
-
-        if self.missing_data:
-            _logger.info(
-                "Re-arranging data to separate missing and observed datapoints. "
-                "Missing data (rt == %s) will be on top, "
-                "observed datapoints follow.",
-                self.missing_data_value,
-            )
-
-        self.data = _rearrange_data(self.data)
-        # Assertion added for mypy type checking
-        assert self.list_params is not None, "list_params should have been validated"
-        return make_distribution(
-            rv=self.model_config.rv or self.model_name,
-            loglik=self.loglik,
-            list_params=self.list_params,
-            bounds=self.bounds,
-            lapse=self.lapse,
-            extra_fields=(
-                None
-                if not self.extra_fields
-                else [deepcopy(self.data[field].values) for field in self.extra_fields]
-            ),
-        )
+        This method must be implemented by subclasses to create the appropriate
+        distribution for the specific model type.
+        """
+        ...
 
     def _get_deterministic_var_names(self, idata) -> list[str]:
         """Filter out the deterministic variables in var_names."""

From 6fc5f3d4d3b225fd7416f2b97e3512afc7224ebc Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 14:53:23 -0500
Subject: [PATCH 064/104] feat: refactor HSSM class to inherit from HSSMBase
 and remove mixins

---
 src/hssm/hssm.py | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 4a41d36ec..3e2ec926b 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -32,7 +32,7 @@
 from ssms.config import model_config as ssms_model_config
 
 from hssm._types import LoglikKind, SupportedModels
-from hssm.data_validator import DataValidatorMixin
+from hssm.base import HSSMBase
 from hssm.defaults import (
     INITVAL_JITTER_SETTINGS,
     INITVAL_SETTINGS,
@@ -46,7 +46,6 @@
     make_likelihood_callable,
     make_missing_data_callable,
 )
-from hssm.missing_data_mixin import MissingDataMixin
 from hssm.utils import (
     _compute_log_likelihood,
     _get_alias_dict,
@@ -98,7 +97,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSM(DataValidatorMixin, MissingDataMixin):
+class HSSM(HSSMBase):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters

From 45cd5e09af520732e1a81bebbb69f705c7fea5fe Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 15:27:13 -0500
Subject: [PATCH 065/104] fix: move data sanity check to the correct position
 in HSSMBase class

---
 src/hssm/base.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index a8362576b..2a6a14b01 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -351,14 +351,14 @@ def __init__(
 
         self.n_choices = len(self.choices)  # type: ignore[arg-type]
 
+        self._pre_check_data_sanity()
+
         self._process_missing_data_and_deadline(
             missing_data=missing_data,
             deadline=deadline,
             loglik_missing_data=loglik_missing_data,
         )
 
-        self._pre_check_data_sanity()
-
         # region ===== Process lapse distribution =====
         self.has_lapse = p_outlier is not None and p_outlier != 0
         self._check_lapse(lapse)

From 0dd269dfeb6bb4dc30e0b6082c81ae32dd7e96c4 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 15:27:28 -0500
Subject: [PATCH 066/104] Implement feature X to enhance user experience and
 fix bug Y in module Z

---
 src/hssm/hssm.py | 1929 +---------------------------------------------
 1 file changed, 4 insertions(+), 1925 deletions(-)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 3e2ec926b..1eb7f2fb8 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -270,1679 +270,6 @@ class HSSM(HSSMBase):
         The jitter value for the initial values.
     """
 
-    def __init__(
-        self,
-        data: pd.DataFrame,
-        model: SupportedModels | str = "ddm",
-        choices: list[int] | None = None,
-        include: list[dict[str, Any] | Param] | None = None,
-        model_config: ModelConfig | dict | None = None,
-        loglik: (
-            str | PathLike | Callable | pytensor.graph.Op | type[pm.Distribution] | None
-        ) = None,
-        loglik_kind: LoglikKind | None = None,
-        p_outlier: float | dict | bmb.Prior | None = 0.05,
-        lapse: dict | bmb.Prior | None = bmb.Prior("Uniform", lower=0.0, upper=20.0),
-        global_formula: str | None = None,
-        link_settings: Literal["log_logit"] | None = None,
-        prior_settings: Literal["safe"] | None = "safe",
-        extra_namespace: dict[str, Any] | None = None,
-        missing_data: bool | float = False,
-        deadline: bool | str = False,
-        loglik_missing_data: (
-            str | PathLike | Callable | pytensor.graph.Op | None
-        ) = None,
-        process_initvals: bool = True,
-        initval_jitter: float = INITVAL_JITTER_SETTINGS["jitter_epsilon"],
-        **kwargs,
-    ):
-        # Attach arguments to the instance
-        # so that we can easily define some
-        # methods that need to access these
-        # arguments (context: pickling / save - load).
-
-        # Define a dict with all call arguments:
-        self._init_args = {
-            k: v for k, v in locals().items() if k not in ["self", "kwargs"]
-        }
-        if kwargs:
-            self._init_args.update(kwargs)
-
-        self.data = data.copy()
-        self._inference_obj: az.InferenceData | None = None
-        self._initvals: dict[str, Any] = {}
-        self.initval_jitter = initval_jitter
-        self._inference_obj_vi: pm.Approximation | None = None
-        self._vi_approx = None
-        self._map_dict = None
-        self.global_formula = global_formula
-
-        self.link_settings = link_settings
-        self.prior_settings = prior_settings
-
-        self.missing_data_value = -999.0
-
-        additional_namespace = transformations_namespace.copy()
-        if extra_namespace is not None:
-            additional_namespace.update(extra_namespace)
-        self.additional_namespace = additional_namespace
-
-        # Construct a model_config from defaults
-        self.model_config = Config.from_defaults(model, loglik_kind)
-        # Update defaults with user-provided config, if any
-        if model_config is not None:
-            if isinstance(model_config, dict):
-                if "choices" not in model_config:
-                    if choices is not None:
-                        model_config["choices"] = choices
-                else:
-                    if choices is not None:
-                        _logger.info(
-                            "choices list provided in both model_config and "
-                            "as an argument directly."
-                            " Using the one provided in model_config. \n"
-                            "We recommend providing choices in model_config."
-                        )
-            elif isinstance(model_config, ModelConfig):
-                if model_config.choices is None:
-                    if choices is not None:
-                        model_config.choices = choices
-                else:
-                    if choices is not None:
-                        _logger.info(
-                            "choices list provided in both model_config and "
-                            "as an argument directly."
-                            " Using the one provided in model_config. \n"
-                            "We recommend providing choices in model_config."
-                        )
-
-            self.model_config.update_config(
-                model_config
-                if isinstance(model_config, ModelConfig)
-                else ModelConfig(**model_config)  # also serves as dict validation
-            )
-        else:
-            # Model config is not provided, but at this point was constructed from
-            # defaults.
-            if model not in typing.get_args(SupportedModels):
-                # TODO: ideally use self.supported_models above but mypy doesn't like it
-                if choices is not None:
-                    self.model_config.update_choices(choices)
-                elif model in ssms_model_config:
-                    self.model_config.update_choices(
-                        ssms_model_config[model]["choices"]
-                    )
-                    _logger.info(
-                        "choices argument passed as None, "
-                        "but found %s in ssms-simulators. "
-                        "Using choices, from ssm-simulators configs: %s",
-                        model,
-                        ssms_model_config[model]["choices"],
-                    )
-            else:
-                # Model config already constructed from defaults, and model string is
-                # in SupportedModels. So we are guaranteed that choices are in
-                # self.model_config already.
-
-                if choices is not None:
-                    _logger.info(
-                        "Model string is in SupportedModels."
-                        " Ignoring choices arguments."
-                    )
-
-        # Update loglik with user-provided value
-        self.model_config.update_loglik(loglik)
-        # Ensure that all required fields are valid
-        self.model_config.validate()
-
-        # Set up shortcuts so old code will work
-        self.response = self.model_config.response
-        self.list_params = self.model_config.list_params
-        self.choices = self.model_config.choices
-        self.model_name = self.model_config.model_name
-        self.loglik = self.model_config.loglik
-        self.loglik_kind = self.model_config.loglik_kind
-        self.extra_fields = self.model_config.extra_fields
-
-        self.n_choices = len(self.choices)
-
-        self._validate_choices()
-        self._pre_check_data_sanity()
-
-        # Process missing data setting
-        # AF-TODO: Could be a function in data validator?
-        if isinstance(missing_data, float):
-            if not ((self.data.rt == missing_data).any()):
-                raise ValueError(
-                    f"missing_data argument is provided as a float {missing_data}, "
-                    f"However, you have no RTs of {missing_data} in your dataset!"
-                )
-            else:
-                self.missing_data = True
-                self.missing_data_value = missing_data
-        elif isinstance(missing_data, bool):
-            if missing_data and (not (self.data.rt == -999.0).any()):
-                raise ValueError(
-                    "missing_data argument is provided as True, "
-                    " so RTs of -999.0 are treated as missing. \n"
-                    "However, you have no RTs of -999.0 in your dataset!"
-                )
-            elif (not missing_data) and (self.data.rt == -999.0).any():
-                # self.missing_data = True
-                raise ValueError(
-                    "Missing data provided as False. \n"
-                    "However, you have RTs of -999.0 in your dataset!"
-                )
-            else:
-                self.missing_data = missing_data
-        else:
-            raise ValueError(
-                "missing_data argument must be a bool or a float! \n"
-                f"You provided: {type(missing_data)}"
-            )
-
-        if isinstance(deadline, str):
-            self.deadline = True
-            self.deadline_name = deadline
-        else:
-            self.deadline = deadline
-            self.deadline_name = "deadline"
-
-        if (
-            not self.missing_data and not self.deadline
-        ) and loglik_missing_data is not None:
-            raise ValueError(
-                "You have specified a loglik_missing_data function, but you have not "
-                + "set the missing_data or deadline flag to True."
-            )
-        self.loglik_missing_data = loglik_missing_data
-
-        # Update data based on missing_data and deadline
-        self._handle_missing_data_and_deadline()
-        # Set self.missing_data_network based on `missing_data` and `deadline`
-        self.missing_data_network = self._set_missing_data_and_deadline(
-            self.missing_data, self.deadline, self.data
-        )
-
-        if self.deadline:
-            self.response.append(self.deadline_name)
-
-        # Process lapse distribution
-        self.has_lapse = p_outlier is not None and p_outlier != 0
-        self._check_lapse(lapse)
-        if self.has_lapse and self.list_params[-1] != "p_outlier":
-            self.list_params.append("p_outlier")
-
-        # Process all parameters
-        self.params = Params.from_user_specs(
-            model=self,
-            include=[] if include is None else include,
-            kwargs=kwargs,
-            p_outlier=p_outlier,
-        )
-
-        self._parent = self.params.parent
-        self._parent_param = self.params.parent_param
-
-        self.formula, self.priors, self.link = self.params.parse_bambi(model=self)
-
-        # For parameters that have a regression backend, apply bounds at the likelihood
-        # level to ensure that the samples that are out of bounds
-        # are discarded (replaced with a large negative value).
-        self.bounds = {
-            name: param.bounds
-            for name, param in self.params.items()
-            if param.is_regression and param.bounds is not None
-        }
-
-        # Set p_outlier and lapse
-        self.p_outlier = self.params.get("p_outlier")
-        self.lapse = lapse if self.has_lapse else None
-
-        self._post_check_data_sanity()
-
-        self.model_distribution = self._make_model_distribution()
-
-        self.family = make_family(
-            self.model_distribution,
-            self.list_params,
-            self.link,
-            self._parent,
-        )
-
-        self.model = bmb.Model(
-            self.formula,
-            data=self.data,
-            family=self.family,
-            priors=self.priors,  # center_predictors=False
-            extra_namespace=self.additional_namespace,
-            **kwargs,
-        )
-
-        self._aliases = _get_alias_dict(
-            self.model, self._parent_param, self.response_c, self.response_str
-        )
-        self.set_alias(self._aliases)
-        self.model.build()
-
-        if process_initvals:
-            self._postprocess_initvals_deterministic(initval_settings=INITVAL_SETTINGS)
-        if self.initval_jitter > 0:
-            self._jitter_initvals(
-                jitter_epsilon=self.initval_jitter,
-                vector_only=True,
-            )
-
-        # Make sure we reset rvs_to_initial_values --> Only None's
-        # Otherwise PyMC barks at us when asking to compute likelihoods
-        self.pymc_model.rvs_to_initial_values.update(
-            {key_: None for key_ in self.pymc_model.rvs_to_initial_values.keys()}
-        )
-        _logger.info("Model initialized successfully.")
-
-    @classproperty
-    def supported_models(cls) -> tuple[SupportedModels, ...]:
-        """Get a tuple of all supported models.
-
-        Returns
-        -------
-        tuple[SupportedModels, ...]
-            A tuple containing all supported model names.
-        """
-        return get_args(SupportedModels)
-
-    @classmethod
-    def _store_init_args(cls, *args, **kwargs):
-        """Store initialization arguments using signature binding."""
-        sig = signature(cls.__init__)
-        bound_args = sig.bind(*args, **kwargs)
-        bound_args.apply_defaults()
-        return {k: v for k, v in bound_args.arguments.items() if k != "self"}
-
-    def find_MAP(self, **kwargs):
-        """Perform Maximum A Posteriori estimation.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the MAP estimates of the model parameters.
-        """
-        self._map_dict = pm.find_MAP(model=self.pymc_model, **kwargs)
-        return self._map_dict
-
-    def sample(
-        self,
-        sampler: Literal["pymc", "numpyro", "blackjax", "nutpie", "laplace"]
-        | None = None,
-        init: str | None = None,
-        initvals: str | dict | None = None,
-        include_response_params: bool = False,
-        **kwargs,
-    ) -> az.InferenceData | pm.Approximation:
-        """Perform sampling using the `fit` method via bambi.Model.
-
-        Parameters
-        ----------
-        sampler: optional
-            The sampler to use. Can be one of "pymc", "numpyro",
-            "blackjax", "nutpie", or "laplace". If using `blackbox` likelihoods,
-            this cannot be "numpyro", "blackjax", or "nutpie". By default it is None,
-            and sampler will automatically be chosen: when the model uses the
-            `approx_differentiable` likelihood, and `jax` backend, "numpyro" will
-            be used. Otherwise, "pymc" (the default PyMC NUTS sampler) will be used.
-
-            Note that the old sampler names such as "mcmc", "nuts_numpyro",
-            "nuts_blackjax" will be deprecated and removed in future releases. A warning
-            will be raised if any of these old names are used.
-        init: optional
-            Initialization method to use for the sampler. If any of the NUTS samplers
-            is used, defaults to `"adapt_diag"`. Otherwise, defaults to `"auto"`.
-        initvals: optional
-            Pass initial values to the sampler. This can be a dictionary of initial
-            values for parameters of the model, or a string "map" to use initialization
-            at the MAP estimate. If "map" is used, the MAP estimate will be computed if
-            not already attached to the base class from prior call to 'find_MAP`.
-        include_response_params: optional
-            Include parameters of the response distribution in the output. These usually
-            take more space than other parameters as there's one of them per
-            observation. Defaults to False.
-        kwargs
-            Other arguments passed to bmb.Model.fit(). Please see [here]
-            (https://bambinos.github.io/bambi/api_reference.html#bambi.models.Model.fit)
-            for full documentation.
-
-        Returns
-        -------
-        az.InferenceData | pm.Approximation
-            A reference to the `model.traces` object, which stores the traces of the
-            last call to `model.sample()`. `model.traces` is an ArviZ `InferenceData`
-            instance if `sampler` is `"pymc"` (default), `"numpyro"`,
-            `"blackjax"` or "`laplace".
-        """
-        # If initvals are None (default)
-        # we skip processing initvals here.
-        if sampler in _new_sampler_mapping:
-            _logger.warning(
-                f"Sampler '{sampler}' is deprecated. "
-                "Please use the new sampler names: "
-                "'pymc', 'numpyro', 'blackjax', 'nutpie', or 'laplace'."
-            )
-            sampler = _new_sampler_mapping[sampler]  # type: ignore
-
-        if sampler == "vi":
-            raise ValueError(
-                "VI is not supported via the sample() method. "
-                "Please use the vi() method instead."
-            )
-
-        if initvals is not None:
-            if isinstance(initvals, dict):
-                kwargs["initvals"] = initvals
-            else:
-                if isinstance(initvals, str):
-                    if initvals == "map":
-                        if self._map_dict is None:
-                            _logger.info(
-                                "initvals='map' but no map"
-                                "estimate precomputed. \n"
-                                "Running map estimation first..."
-                            )
-                            self.find_MAP()
-                            kwargs["initvals"] = self._map_dict
-                        else:
-                            kwargs["initvals"] = self._map_dict
-                else:
-                    raise ValueError(
-                        "initvals argument must be a dictionary or 'map'"
-                        " to use the MAP estimate."
-                    )
-        else:
-            kwargs["initvals"] = self._initvals
-            _logger.info("Using default initvals. \n")
-
-        if sampler is None:
-            if (
-                self.loglik_kind == "approx_differentiable"
-                and self.model_config.backend == "jax"
-            ):
-                sampler = "numpyro"
-            else:
-                sampler = "pymc"
-
-        if self.loglik_kind == "blackbox":
-            if sampler in ["blackjax", "numpyro", "nutpie"]:
-                raise ValueError(
-                    f"{sampler} sampler does not work with blackbox likelihoods."
-                )
-
-            if "step" not in kwargs:
-                kwargs |= {"step": pm.Slice(model=self.pymc_model)}
-
-        if (
-            self.loglik_kind == "approx_differentiable"
-            and self.model_config.backend == "jax"
-            and sampler == "pymc"
-            and kwargs.get("cores", None) != 1
-        ):
-            _logger.warning(
-                "Parallel sampling might not work with `jax` backend and the PyMC NUTS "
-                + "sampler on some platforms. Please consider using `numpyro`, "
-                + "`blackjax`, or `nutpie` sampler if that is a problem."
-            )
-
-        if self._check_extra_fields():
-            self._update_extra_fields()
-
-        if init is None:
-            if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]:
-                init = "adapt_diag"
-            else:
-                init = "auto"
-
-        # If sampler is finally `numpyro` make sure
-        # the jitter argument is set to False
-        if sampler == "numpyro":
-            if "nuts_sampler_kwargs" in kwargs:
-                if kwargs["nuts_sampler_kwargs"].get("jitter"):
-                    _logger.warning(
-                        "The jitter argument is set to True. "
-                        + "This argument is not supported "
-                        + "by the numpyro backend. "
-                        + "The jitter argument will be set to False."
-                    )
-                kwargs["nuts_sampler_kwargs"]["jitter"] = False
-            else:
-                kwargs["nuts_sampler_kwargs"] = {"jitter": False}
-
-        if sampler != "pymc" and "step" in kwargs:
-            raise ValueError(
-                "`step` samplers (enabled by the `step` argument) are only supported "
-                "by the `pymc` sampler."
-            )
-
-        if self._inference_obj is not None:
-            _logger.warning(
-                "The model has already been sampled. Overwriting the previous "
-                + "inference object. Any previous reference to the inference object "
-                + "will still point to the old object."
-            )
-
-        # Define whether likelihood should be computed
-        compute_likelihood = True
-        if "idata_kwargs" in kwargs:
-            if "log_likelihood" in kwargs["idata_kwargs"]:
-                compute_likelihood = kwargs["idata_kwargs"].pop("log_likelihood", True)
-
-        omit_offsets = kwargs.pop("omit_offsets", False)
-        self._inference_obj = self.model.fit(
-            inference_method=(
-                "pymc"
-                if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]
-                else sampler
-            ),
-            init=init,
-            include_response_params=include_response_params,
-            omit_offsets=omit_offsets,
-            **kwargs,
-        )
-
-        # Separate out log likelihood computation
-        if compute_likelihood:
-            self.log_likelihood(self._inference_obj, inplace=True)
-
-        # Subset data vars in posterior
-        self._clean_posterior_group(idata=self._inference_obj)
-        return self.traces
-
-    def vi(
-        self,
-        method: str = "advi",
-        niter: int = 10000,
-        draws: int = 1000,
-        return_idata: bool = True,
-        ignore_mcmc_start_point_defaults=False,
-        **vi_kwargs,
-    ) -> pm.Approximation | az.InferenceData:
-        """Perform Variational Inference.
-
-        Parameters
-        ----------
-        niter : int
-            The number of iterations to run the VI algorithm. Defaults to 3000.
-        method : str
-            The method to use for VI. Can be one of "advi" or "fullrank_advi", "svgd",
-            "asvgd".Defaults to "advi".
-        draws : int
-            The number of samples to draw from the posterior distribution.
-            Defaults to 1000.
-        return_idata : bool
-            If True, returns an InferenceData object. Otherwise, returns the
-            approximation object directly. Defaults to True.
-
-        Returns
-        -------
-            pm.Approximation or az.InferenceData: The mean field approximation object.
-        """
-        if self.loglik_kind == "analytical":
-            _logger.warning(
-                "VI is not recommended for the analytical likelihood,"
-                " since gradients can be brittle."
-            )
-        elif self.loglik_kind == "blackbox":
-            raise ValueError(
-                "VI is not supported for blackbox likelihoods, "
-                " since likelihood gradients are needed!"
-            )
-
-        if ("start" not in vi_kwargs) and not ignore_mcmc_start_point_defaults:
-            _logger.info("Using MCMC starting point defaults.")
-            vi_kwargs["start"] = self._initvals
-
-        # Run variational inference directly from pymc model
-        with self.pymc_model:
-            self._vi_approx = pm.fit(n=niter, method=method, **vi_kwargs)
-
-        # Sample from the approximate posterior
-        if self._vi_approx is not None:
-            self._inference_obj_vi = self._vi_approx.sample(draws)
-
-        # Post-processing
-        self._clean_posterior_group(idata=self._inference_obj_vi)
-
-        # Return the InferenceData object if return_idata is True
-        if return_idata:
-            return self._inference_obj_vi
-        # Otherwise return the appromation object directly
-        return self.vi_approx
-
-    def _clean_posterior_group(self, idata: az.InferenceData | None = None):
-        """Clean up the posterior group of the InferenceData object.
-
-        Parameters
-        ----------
-        idata : az.InferenceData
-            The InferenceData object to clean up. If None, the last InferenceData object
-            will be used.
-        """
-        # # Logic behind which variables to keep:
-        # # We essentially want to get rid of
-        # # all the trial-wise variables.
-
-        # # We drop all distributional components, IF they are deterministics
-        # # (in which case they will be trial wise systematically)
-        # # and we keep distributional components, IF they are
-        # # basic random-variabels (in which case they should never
-        # # appear trial-wise).
-        if idata is None:
-            raise ValueError(
-                "The InferenceData object is None. Cannot clean up the posterior group."
-            )
-        elif not hasattr(idata, "posterior"):
-            raise ValueError(
-                "The InferenceData object does not have a posterior group. "
-                + "Cannot clean up the posterior group."
-            )
-
-        vars_to_keep = set(idata["posterior"].data_vars.keys()).difference(
-            set(
-                key_
-                for key_ in self.model.distributional_components.keys()
-                if key_ in [var_.name for var_ in self.pymc_model.deterministics]
-            )
-        )
-        vars_to_keep_clean = [
-            var_
-            for var_ in vars_to_keep
-            if isinstance(var_, str) and "_mean" not in var_
-        ]
-
-        setattr(
-            idata,
-            "posterior",
-            idata["posterior"][vars_to_keep_clean],
-        )
-
-    def log_likelihood(
-        self,
-        idata: az.InferenceData | None = None,
-        data: pd.DataFrame | None = None,
-        inplace: bool = True,
-        keep_likelihood_params: bool = False,
-    ) -> az.InferenceData | None:
-        """Compute the log likelihood of the model.
-
-        Parameters
-        ----------
-        idata : optional
-            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
-        data : optional
-            A pandas DataFrame with values for the predictors that are used to obtain
-            out-of-sample predictions. If omitted, the original dataset is used.
-        inplace : optional
-            If `True` will modify idata in-place and append a `log_likelihood` group to
-            `idata`. Otherwise, it will return a copy of idata with the predictions
-            added, by default True.
-        keep_likelihood_params : optional
-            If `True`, the trial wise likelihood parameters that are computed
-            on route to getting the log likelihood are kept in the `idata` object.
-            Defaults to False. See also the method `add_likelihood_parameters_to_idata`.
-
-        Returns
-        -------
-        az.InferenceData | None
-            InferenceData or None
-        """
-        if self._inference_obj is None and idata is None:
-            raise ValueError(
-                "Neither has the model been sampled yet nor"
-                + " an idata object has been provided."
-            )
-
-        if idata is None:
-            if self._inference_obj is None:
-                raise ValueError(
-                    "The model has not been sampled yet. "
-                    + "Please provide an idata object."
-                )
-            else:
-                idata = self._inference_obj
-
-        # Actual likelihood computation
-        idata = _compute_log_likelihood(self.model, idata, data, inplace)
-
-        # clean up posterior:
-        if not keep_likelihood_params:
-            self._clean_posterior_group(idata=idata)
-
-        if inplace:
-            return None
-        else:
-            return idata
-
-    def add_likelihood_parameters_to_idata(
-        self,
-        idata: az.InferenceData | None = None,
-        inplace: bool = False,
-    ) -> az.InferenceData | None:
-        """Add likelihood parameters to the InferenceData object.
-
-        Parameters
-        ----------
-        idata : az.InferenceData
-            The InferenceData object returned by HSSM.sample().
-        inplace : bool
-            If True, the likelihood parameters are added to idata in-place. Otherwise,
-            a copy of idata with the likelihood parameters added is returned.
-            Defaults to False.
-
-        Returns
-        -------
-        az.InferenceData | None
-            InferenceData or None
-        """
-        if idata is None:
-            if self._inference_obj is None:
-                raise ValueError("No idata provided and model not yet sampled!")
-            else:
-                idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
-                    deepcopy(self._inference_obj)
-                    if not inplace
-                    else self._inference_obj
-                )
-        else:
-            idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
-                deepcopy(idata) if not inplace else idata
-            )
-        return idata
-
-    def sample_posterior_predictive(
-        self,
-        idata: az.InferenceData | None = None,
-        data: pd.DataFrame | None = None,
-        inplace: bool = True,
-        include_group_specific: bool = True,
-        kind: Literal["response", "response_params"] = "response",
-        draws: int | float | list[int] | np.ndarray | None = None,
-        safe_mode: bool = True,
-    ) -> az.InferenceData | None:
-        """Perform posterior predictive sampling from the HSSM model.
-
-        Parameters
-        ----------
-        idata : optional
-            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
-            the `InferenceData` from the last time `sample()` is called will be used.
-        data : optional
-            An optional data frame with values for the predictors that are used to
-            obtain out-of-sample predictions. If omitted, the original dataset is used.
-        inplace : optional
-            If `True` will modify idata in-place and append a `posterior_predictive`
-            group to `idata`. Otherwise, it will return a copy of idata with the
-            predictions added, by default True.
-        include_group_specific : optional
-            If `True` will make predictions including the group specific effects.
-            Otherwise, predictions are made with common effects only (i.e. group-
-            specific are set to zero), by default True.
-        kind: optional
-            Indicates the type of prediction required. Can be `"response_params"` or
-            `"response"`. The first returns draws from the posterior distribution of the
-            likelihood parameters, while the latter returns the draws from the posterior
-            predictive distribution (i.e. the posterior probability distribution for a
-            new observation) in addition to the posterior distribution. Defaults to
-            "response_params".
-        draws: optional
-            The number of samples to draw from the posterior predictive distribution
-            from each chain.
-            When it's an integer >= 1, the number of samples to be extracted from the
-            `draw` dimension. If this integer is larger than the number of posterior
-            samples in each chain, all posterior samples will be used
-            in posterior predictive sampling. When a float between 0 and 1, the
-            proportion of samples from the draw dimension from each chain to be used in
-            posterior predictive sampling.. If this proportion is very
-            small, at least one sample will be used. When None, all posterior samples
-            will be used. Defaults to None.
-        safe_mode: bool
-            If True, the function will split the draws into chunks of 10 to avoid memory
-            issues. Defaults to True.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet and idata is not provided.
-
-        Returns
-        -------
-        az.InferenceData | None
-            InferenceData or None
-        """
-        if idata is None:
-            if self._inference_obj is None:
-                raise ValueError(
-                    "The model has not been sampled yet. "
-                    + "Please either provide an idata object or sample the model first."
-                )
-            idata = self._inference_obj
-            _logger.info(
-                "idata=None, we use the traces assigned to the HSSM object as idata."
-            )
-
-        if idata is not None:
-            if "posterior_predictive" in idata.groups():
-                del idata["posterior_predictive"]
-                _logger.warning(
-                    "pre-existing posterior_predictive group deleted from idata. \n"
-                )
-
-        if self._check_extra_fields(data):
-            self._update_extra_fields(data)
-
-        if isinstance(draws, np.ndarray):
-            draws = draws.astype(int)
-        elif isinstance(draws, list):
-            draws = np.array(draws).astype(int)
-        elif isinstance(draws, int | float):
-            draws = np.arange(int(draws))
-        elif draws is None:
-            draws = idata["posterior"].draw.values
-        else:
-            raise ValueError(
-                "draws must be an integer, " + "a list of integers, or a numpy array."
-            )
-
-        assert isinstance(draws, np.ndarray)
-
-        # Make a copy of idata, set the `posterior` group to be a random sub-sample
-        # of the original (draw dimension gets sub-sampled)
-
-        idata_copy = idata.copy()
-
-        if (draws.shape != idata["posterior"].draw.values.shape) or (
-            (draws.shape == idata["posterior"].draw.values.shape)
-            and not np.allclose(draws, idata["posterior"].draw.values)
-        ):
-            # Reassign posterior to sub-sampled version
-            setattr(idata_copy, "posterior", idata["posterior"].isel(draw=draws))
-
-        if kind == "response":
-            # If we run kind == 'response' we actually run the observation RV
-            if safe_mode:
-                # safe mode splits the draws into chunks of 10 to avoid
-                # memory issues (TODO: Figure out the source of memory issues)
-                split_draws = _split_array(
-                    idata_copy["posterior"].draw.values, divisor=10
-                )
-
-                posterior_predictive_list = []
-                for samples_tmp in split_draws:
-                    tmp_posterior = idata["posterior"].sel(draw=samples_tmp)
-                    setattr(idata_copy, "posterior", tmp_posterior)
-                    self.model.predict(
-                        idata_copy, kind, data, True, include_group_specific
-                    )
-                    posterior_predictive_list.append(idata_copy["posterior_predictive"])
-
-                if inplace:
-                    idata.add_groups(
-                        posterior_predictive=xr.concat(
-                            posterior_predictive_list, dim="draw"
-                        )
-                    )
-                    # for inplace, we don't return anything
-                    return None
-                else:
-                    # Reassign original posterior to idata_copy
-                    setattr(idata_copy, "posterior", idata["posterior"])
-                    # Add new posterior predictive group to idata_copy
-                    del idata_copy["posterior_predictive"]
-                    idata_copy.add_groups(
-                        posterior_predictive=xr.concat(
-                            posterior_predictive_list, dim="draw"
-                        )
-                    )
-                    return idata_copy
-            else:
-                if inplace:
-                    # If not safe-mode
-                    # We call .predict() directly without any
-                    # chunking of data.
-
-                    # .predict() is called on the copy of idata
-                    # since we still subsampled (or assigned) the draws
-                    self.model.predict(
-                        idata_copy, kind, data, True, include_group_specific
-                    )
-
-                    # posterior predictive group added to idata
-                    idata.add_groups(
-                        posterior_predictive=idata_copy["posterior_predictive"]
-                    )
-                    # don't return anything if inplace
-                    return None
-                else:
-                    # Not safe mode and not inplace
-                    # Function acts as very thin wrapper around
-                    # .predict(). It just operates on the
-                    # idata_copy object
-                    return self.model.predict(
-                        idata_copy, kind, data, False, include_group_specific
-                    )
-        elif kind == "response_params":
-            # If kind == 'response_params', we don't need to run the RV directly,
-            # there shouldn't really be any significant memory issues here,
-            # we can simply ignore settings, since the computational overhead
-            # should be very small --> nudges user towards good outputs.
-            _logger.warning(
-                "The kind argument is set to 'mean', but 'draws' argument "
-                + "is not None: The draws argument will be ignored!"
-            )
-            return self.model.predict(
-                idata, kind, data, inplace, include_group_specific
-            )
-        else:
-            raise ValueError("`kind` must be either 'response' or 'response_params'.")
-
-    def plot_predictive(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
-        """Produce a posterior predictive plot.
-
-        Equivalent to calling `hssm.plotting.plot_predictive()` with the
-        model. Please see that function for
-        [full documentation][hssm.plotting.plot_predictive].
-
-        Returns
-        -------
-        mpl.axes.Axes | sns.FacetGrid
-            The matplotlib axis or seaborn FacetGrid object containing the plot.
-        """
-        return plotting.plot_predictive(self, **kwargs)
-
-    def plot_quantile_probability(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
-        """Produce a quantile probability plot.
-
-        Equivalent to calling `hssm.plotting.plot_quantile_probability()` with the
-        model. Please see that function for
-        [full documentation][hssm.plotting.plot_quantile_probability].
-
-        Returns
-        -------
-        mpl.axes.Axes | sns.FacetGrid
-            The matplotlib axis or seaborn FacetGrid object containing the plot.
-        """
-        return plotting.plot_quantile_probability(self, **kwargs)
-
-    def predict(self, **kwargs) -> az.InferenceData:
-        """Generate samples from the predictive distribution."""
-        return self.model.predict(**kwargs)
-
-    def sample_do(
-        self, params: dict[str, Any], draws: int = 100, return_model=False, **kwargs
-    ) -> az.InferenceData | tuple[az.InferenceData, pm.Model]:
-        """Generate samples from the predictive distribution using the `do-operator`."""
-        do_model = do(self.pymc_model, params)
-        do_idata = pm.sample_prior_predictive(model=do_model, draws=draws, **kwargs)
-
-        # clean up `rt,response_mean` to `v`
-        do_idata = self._drop_parent_str_from_idata(idata=do_idata)
-
-        # rename otherwise inconsistent dims and coords
-        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].dims:
-            setattr(
-                do_idata,
-                "prior_predictive",
-                do_idata["prior_predictive"].rename_dims(
-                    {"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].coords:
-            setattr(
-                do_idata,
-                "prior_predictive",
-                do_idata["prior_predictive"].rename_vars(
-                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-
-        if return_model:
-            return do_idata, do_model
-        return do_idata
-
-    def sample_prior_predictive(
-        self,
-        draws: int = 500,
-        var_names: str | list[str] | None = None,
-        omit_offsets: bool = True,
-        random_seed: np.random.Generator | None = None,
-    ) -> az.InferenceData:
-        """Generate samples from the prior predictive distribution.
-
-        Parameters
-        ----------
-        draws
-            Number of draws to sample from the prior predictive distribution. Defaults
-            to 500.
-        var_names
-            A list of names of variables for which to compute the prior predictive
-            distribution. Defaults to ``None`` which means both observed and unobserved
-            RVs.
-        omit_offsets
-            Whether to omit offset terms. Defaults to ``True``.
-        random_seed
-            Seed for the random number generator.
-
-        Returns
-        -------
-        az.InferenceData
-            ``InferenceData`` object with the groups ``prior``, ``prior_predictive`` and
-            ``observed_data``.
-        """
-        prior_predictive = self.model.prior_predictive(
-            draws, var_names, omit_offsets, random_seed
-        )
-
-        # AF-COMMENT: Not sure if necessary to include the
-        # mean prior here (which adds deterministics that
-        # could be recomputed elsewhere)
-        prior_predictive.add_groups(posterior=prior_predictive.prior)
-        self.model.predict(prior_predictive, kind="mean", inplace=True)
-
-        # clean
-        setattr(prior_predictive, "prior", prior_predictive["posterior"])
-        del prior_predictive["posterior"]
-
-        if self._inference_obj is None:
-            self._inference_obj = prior_predictive
-        else:
-            self._inference_obj.extend(prior_predictive)
-
-        # clean up `rt,response_mean` to `v`
-        idata = self._drop_parent_str_from_idata(idata=self._inference_obj)
-
-        # rename otherwise inconsistent dims and coords
-        if "rt,response_extra_dim_0" in idata["prior_predictive"].dims:
-            setattr(
-                idata,
-                "prior_predictive",
-                idata["prior_predictive"].rename_dims(
-                    {"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-        if "rt,response_extra_dim_0" in idata["prior_predictive"].coords:
-            setattr(
-                idata,
-                "prior_predictive",
-                idata["prior_predictive"].rename_vars(
-                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-
-        # Update self._inference_obj to match the cleaned idata
-        self._inference_obj = idata
-        return deepcopy(self._inference_obj)
-
-    @property
-    def pymc_model(self) -> pm.Model:
-        """Provide access to the PyMC model.
-
-        Returns
-        -------
-        pm.Model
-            The PyMC model built by bambi
-        """
-        return self.model.backend.model
-
-    def set_alias(self, aliases: dict[str, str | dict]):
-        """Set parameter aliases.
-
-        Sets the aliases according to the dictionary passed to it and rebuild the
-        model.
-
-        Parameters
-        ----------
-        aliases
-            A dict specifying the parameter names being aliased and the aliases.
-        """
-        self.model.set_alias(aliases)
-        self.model.build()
-
-    @property
-    def response_c(self) -> str:
-        """Return the response variable names in c() format."""
-        if self.response is None:
-            return "c()"
-        return f"c({', '.join(self.response)})"
-
-    @property
-    def response_str(self) -> str:
-        """Return the response variable names in string format."""
-        if self.response is None:
-            return ""
-        return ",".join(self.response)
-
-    # NOTE: can't annotate return type because the graphviz dependency is optional
-    def graph(self, formatting="plain", name=None, figsize=None, dpi=300, fmt="png"):
-        """Produce a graphviz Digraph from a built HSSM model.
-
-        Requires graphviz, which may be installed most easily with `conda install -c
-        conda-forge python-graphviz`. Alternatively, you may install the `graphviz`
-        binaries yourself, and then `pip install graphviz` to get the python bindings.
-        See http://graphviz.readthedocs.io/en/stable/manual.html for more information.
-
-        Parameters
-        ----------
-        formatting
-            One of `"plain"` or `"plain_with_params"`. Defaults to `"plain"`.
-        name
-            Name of the figure to save. Defaults to `None`, no figure is saved.
-        figsize
-            Maximum width and height of figure in inches. Defaults to `None`, the
-            figure size is set automatically. If defined and the drawing is larger than
-            the given size, the drawing is uniformly scaled down so that it fits within
-            the given size.  Only works if `name` is not `None`.
-        dpi
-            Point per inch of the figure to save.
-            Defaults to 300. Only works if `name` is not `None`.
-        fmt
-            Format of the figure to save.
-            Defaults to `"png"`. Only works if `name` is not `None`.
-
-        Returns
-        -------
-        graphviz.Graph
-            The graph
-        """
-        graph = self.model.graph(formatting, name, figsize, dpi, fmt)
-
-        parent_param = self._parent_param
-        if parent_param.is_regression:
-            return graph
-
-        # Modify the graph
-        # 1. Remove all nodes and edges related to `{parent}_mean`:
-        graph.body = [
-            item for item in graph.body if f"{parent_param.name}_mean" not in item
-        ]
-        # 2. Add a new edge from parent to response
-        graph.edge(parent_param.name, self.response_str)
-
-        return graph
-
-    def compile_logp(self, keep_transformed: bool = False, **kwargs):
-        """Compile the log probability function for the model.
-
-        Parameters
-        ----------
-        keep_transformed : bool, optional
-            If True, keeps the transformed variables in the compiled function.
-            If False, removes value transforms before compilation.
-            Defaults to False.
-        **kwargs
-            Additional keyword arguments passed to PyMC's compile_logp:
-            - vars: List of variables. Defaults to None (all variables).
-            - jacobian: Whether to include log(|det(dP/dQ)|) term for
-            transformed variables. Defaults to True.
-            - sum: Whether to sum all terms instead of returning a vector.
-            Defaults to True.
-
-        Returns
-        -------
-        callable
-            A compiled function that computes the model log probability.
-        """
-        if keep_transformed:
-            return self.pymc_model.compile_logp(
-                vars=kwargs.get("vars", None),
-                jacobian=kwargs.get("jacobian", True),
-                sum=kwargs.get("sum", True),
-            )
-        else:
-            new_model = pm.model.transform.conditioning.remove_value_transforms(
-                self.pymc_model
-            )
-            return new_model.compile_logp(
-                vars=kwargs.get("vars", None),
-                jacobian=kwargs.get("jacobian", True),
-                sum=kwargs.get("sum", True),
-            )
-
-    def plot_trace(
-        self,
-        data: az.InferenceData | None = None,
-        include_deterministic: bool = False,
-        tight_layout: bool = True,
-        **kwargs,
-    ) -> None:
-        """Generate trace plot with ArviZ but with additional convenience features.
-
-        This is a simple wrapper for the az.plot_trace() function. By default, it
-        filters out the deterministic values from the plot. Please see the
-        [arviz documentation]
-        (https://arviz-devs.github.io/arviz/api/generated/arviz.plot_trace.html)
-        for additional parameters that can be specified.
-
-        Parameters
-        ----------
-        data : optional
-            An ArviZ InferenceData object. If None, the traces stored in the model will
-            be used.
-        include_deterministic : optional
-            Whether to include deterministic variables in the plot. Defaults to False.
-            Note that if include deterministic is set to False and and `var_names` is
-            provided, the `var_names` provided will be modified to also exclude the
-            deterministic values. If this is not desirable, set
-            `include deterministic` to True.
-        tight_layout : optional
-            Whether to call plt.tight_layout() after plotting. Defaults to True.
-        """
-        data = data or self.traces
-        if not isinstance(data, az.InferenceData):
-            raise TypeError("data must be an InferenceData object.")
-
-        if not include_deterministic:
-            var_names = list(
-                set([var.name for var in self.pymc_model.free_RVs]).intersection(
-                    set(list(data["posterior"].data_vars.keys()))
-                )
-            )
-            # var_names = self._get_deterministic_var_names(data)
-            if var_names:
-                if "var_names" in kwargs:
-                    if isinstance(kwargs["var_names"], str):
-                        if kwargs["var_names"] not in var_names:
-                            var_names.append(kwargs["var_names"])
-                        kwargs["var_names"] = var_names
-                    elif isinstance(kwargs["var_names"], list):
-                        kwargs["var_names"] = list(
-                            set(var_names) | set(kwargs["var_names"])
-                        )
-                    elif kwargs["var_names"] is None:
-                        kwargs["var_names"] = var_names
-                    else:
-                        raise ValueError(
-                            "`var_names` must be a string, a list of strings, or None."
-                        )
-                else:
-                    kwargs["var_names"] = var_names
-        az.plot_trace(data, **kwargs)
-
-        if tight_layout:
-            plt.tight_layout()
-
-    def summary(
-        self,
-        data: az.InferenceData | None = None,
-        include_deterministic: bool = False,
-        **kwargs,
-    ) -> pd.DataFrame | xr.Dataset:
-        """Produce a summary table with ArviZ but with additional convenience features.
-
-        This is a simple wrapper for the az.summary() function. By default, it
-        filters out the deterministic values from the plot. Please see the
-        [arviz documentation]
-        (https://arviz-devs.github.io/arviz/api/generated/arviz.summary.html)
-        for additional parameters that can be specified.
-
-        Parameters
-        ----------
-        data
-            An ArviZ InferenceData object. If None, the traces stored in the model will
-            be used.
-        include_deterministic : optional
-            Whether to include deterministic variables in the plot. Defaults to False.
-            Note that if include_deterministic is set to False and and `var_names` is
-            provided, the `var_names` provided will be modified to also exclude the
-            deterministic values. If this is not desirable, set
-            `include_deterministic` to True.
-
-        Returns
-        -------
-        pd.DataFrame | xr.Dataset
-            A pandas DataFrame or xarray Dataset containing the summary statistics.
-        """
-        data = data or self.traces
-        if not isinstance(data, az.InferenceData):
-            raise TypeError("data must be an InferenceData object.")
-
-        if not include_deterministic:
-            var_names = list(
-                set([var.name for var in self.pymc_model.free_RVs]).intersection(
-                    set(list(data["posterior"].data_vars.keys()))
-                )
-            )
-            # var_names = self._get_deterministic_var_names(data)
-            if var_names:
-                kwargs["var_names"] = list(set(var_names + kwargs.get("var_names", [])))
-        return az.summary(data, **kwargs)
-
-    def initial_point(self, transformed: bool = False) -> dict[str, np.ndarray]:
-        """Compute the initial point of the model.
-
-        This is a slightly altered version of pm.initial_point.initial_point().
-
-        Parameters
-        ----------
-        transformed : bool, optional
-            If True, return the initial point in transformed space.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the initial point of the model parameters.
-        """
-        fn = pm.initial_point.make_initial_point_fn(
-            model=self.pymc_model, return_transformed=transformed
-        )
-        return pm.model.Point(fn(None), model=self.pymc_model)
-
-    def restore_traces(
-        self, traces: az.InferenceData | pm.Approximation | str | PathLike
-    ) -> None:
-        """Restore traces from an InferenceData object or a .netcdf file.
-
-        Parameters
-        ----------
-        traces
-            An InferenceData object or a path to a file containing the traces.
-        """
-        if isinstance(traces, pm.Approximation):
-            self._inference_obj_vi = traces
-            return
-
-        if isinstance(traces, (str, PathLike)):
-            traces = az.from_netcdf(traces)
-        self._inference_obj = cast("az.InferenceData", traces)
-
-    def restore_vi_traces(
-        self, traces: az.InferenceData | pm.Approximation | str | PathLike
-    ) -> None:
-        """Restore VI traces from an InferenceData object or a .netcdf file.
-
-        Parameters
-        ----------
-        traces
-            An InferenceData object or a path to a file containing the VI traces.
-        """
-        if isinstance(traces, pm.Approximation):
-            self._inference_obj_vi = traces
-            return
-
-        if isinstance(traces, (str, PathLike)):
-            traces = az.from_netcdf(traces)
-        self._inference_obj_vi = cast("az.InferenceData", traces)
-
-    def save_model(
-        self,
-        model_name: str | None = None,
-        allow_absolute_base_path: bool = False,
-        base_path: str | Path = "hssm_models",
-        save_idata_only: bool = False,
-    ) -> None:
-        """Save a HSSM model instance and its inference results to disk.
-
-        Parameters
-        ----------
-        model : HSSM
-            The HSSM model instance to save
-        model_name : str | None
-            Name to use for the saved model files.
-            If None, will use model.model_name with timestamp
-        allow_absolute_base_path : bool
-            Whether to allow absolute paths for base_path
-        base_path : str | Path
-            Base directory to save model files in.
-            Must be relative path if allow_absolute_base_path=False
-        save_idata_only: bool = False,
-            Whether to save the model class instance itself
-
-        Raises
-        ------
-        ValueError
-            If base_path is absolute and allow_absolute_base_path=False
-        """
-        # check if base_path is absolute
-        if not allow_absolute_base_path:
-            if str(base_path).startswith("/"):
-                raise ValueError(
-                    "base_path must be a relative path"
-                    " if allow_absolute_base_path is False"
-                )
-
-        if model_name is None:
-            # Get date string format as suffix to model name
-            model_name = (
-                self.model_name
-                + "_"
-                + datetime.datetime.now().strftime("%Y_%m_%d_%H_%M_%S")
-            )
-
-        # check if folder by name model_name exists
-        model_name = model_name.replace(" ", "_")
-        model_path = Path(base_path).joinpath(model_name)
-        model_path.mkdir(parents=True, exist_ok=True)
-
-        # Save model to pickle file
-        if not save_idata_only:
-            with open(model_path.joinpath("model.pkl"), "wb") as f:
-                cpickle.dump(self, f)
-
-        # Save traces to netcdf file
-        if self._inference_obj is not None:
-            az.to_netcdf(self._inference_obj, model_path.joinpath("traces.nc"))
-
-        # Save vi_traces to netcdf file
-        if self._inference_obj_vi is not None:
-            az.to_netcdf(self._inference_obj_vi, model_path.joinpath("vi_traces.nc"))
-
-    @classmethod
-    def load_model(
-        cls, path: Union[str, Path]
-    ) -> Union["HSSM", dict[str, Optional[az.InferenceData]]]:
-        """Load a HSSM model instance and its inference results from disk.
-
-        Parameters
-        ----------
-        path : str | Path
-            Path to the model directory or model.pkl file. If a directory is provided,
-            will look for model.pkl, traces.nc and vi_traces.nc files within it.
-
-        Returns
-        -------
-        HSSM
-            The loaded HSSM model instance with inference results attached if available.
-        """
-        # Convert path to Path object
-        path = Path(path)
-
-        # If path points to a file, assume it's model.pkl
-        if path.is_file():
-            model_dir = path.parent
-            model_path = path
-        else:
-            # Path points to directory
-            model_dir = path
-            model_path = model_dir.joinpath("model.pkl")
-
-        # check if model_dir exists
-        if not model_dir.exists():
-            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
-
-        # check if model.pkl exists raise logging information if not
-        if not model_path.exists():
-            _logger.info(
-                f"model.pkl file does not exist in {model_dir}. "
-                "Attempting to load traces only."
-            )
-            if (not model_dir.joinpath("traces.nc").exists()) and (
-                not model_dir.joinpath("vi_traces.nc").exists()
-            ):
-                raise FileNotFoundError(f"No traces found in {model_dir}.")
-            else:
-                idata_dict = cls.load_model_idata(model_dir)
-                return idata_dict
-        else:
-            # Load model from pickle file
-            with open(model_path, "rb") as f:
-                model = cpickle.load(f)
-
-            # Load traces if they exist
-            traces_path = model_dir.joinpath("traces.nc")
-            if traces_path.exists():
-                model.restore_traces(traces_path)
-
-            # Load VI traces if they exist
-            vi_traces_path = model_dir.joinpath("vi_traces.nc")
-            if vi_traces_path.exists():
-                model.restore_vi_traces(vi_traces_path)
-        return model
-
-    @classmethod
-    def load_model_idata(cls, path: str | Path) -> dict[str, az.InferenceData | None]:
-        """Load the traces from a model directory.
-
-        Parameters
-        ----------
-        path : str | Path
-            Path to the model directory containing traces.nc and/or vi_traces.nc files.
-
-        Returns
-        -------
-        dict[str, az.InferenceData | None]
-            A dictionary with keys "idata_mcmc" and "idata_vi" containing the traces
-            from the model directory. If the traces do not exist, the corresponding
-            value will be None.
-        """
-        idata_dict: dict[str, az.InferenceData | None] = {}
-        model_dir = Path(path)
-        # check if path exists
-        if not model_dir.exists():
-            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
-
-        # check if traces.nc exists
-        traces_path = model_dir.joinpath("traces.nc")
-        if not traces_path.exists():
-            _logger.warning(f"traces.nc file does not exist in {model_dir}.")
-            idata_dict["idata_mcmc"] = None
-        else:
-            idata_dict["idata_mcmc"] = az.from_netcdf(traces_path)
-
-        # check if vi_traces.nc exists
-        vi_traces_path = model_dir.joinpath("vi_traces.nc")
-        if not vi_traces_path.exists():
-            _logger.warning(f"vi_traces.nc file does not exist in {model_dir}.")
-            idata_dict["idata_vi"] = None
-        else:
-            idata_dict["idata_vi"] = az.from_netcdf(vi_traces_path)
-
-        return idata_dict
-
-    def __getstate__(self):
-        """Get the state of the model for pickling.
-
-        This method is called when pickling the model.
-        It returns a dictionary containing the constructor
-        arguments needed to recreate the model instance.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the constructor arguments
-            under the key 'constructor_args'.
-        """
-        state = {"constructor_args": self._init_args}
-        return state
-
-    def __setstate__(self, state):
-        """Set the state of the model when unpickling.
-
-        This method is called when unpickling the model. It creates a new instance
-        of HSSM using the constructor arguments stored in the state dictionary,
-        and copies its attributes to the current instance.
-
-        Parameters
-        ----------
-        state : dict
-            A dictionary containing the constructor arguments under the key
-            'constructor_args'.
-        """
-        new_instance = HSSM(**state["constructor_args"])
-        self.__dict__ = new_instance.__dict__
-
-    def __repr__(self) -> str:
-        """Create a representation of the model."""
-        output = [
-            "Hierarchical Sequential Sampling Model",
-            f"Model: {self.model_name}\n",
-            f"Response variable: {self.response_str}",
-            f"Likelihood: {self.loglik_kind}",
-            f"Observations: {len(self.data)}\n",
-            "Parameters:\n",
-        ]
-
-        for param in self.params.values():
-            if param.name == "p_outlier":
-                continue
-            output.append(f"{param.name}:")
-
-            component = self.model.components[param.name]
-
-            # Regression case:
-            if param.is_regression:
-                assert isinstance(component, DistributionalComponent)
-                output.append(f"    Formula: {param.formula}")
-                output.append("    Priors:")
-                intercept_term = component.intercept_term
-                if intercept_term is not None:
-                    output.append(_print_prior(intercept_term))
-                for _, common_term in component.common_terms.items():
-                    output.append(_print_prior(common_term))
-                for _, group_specific_term in component.group_specific_terms.items():
-                    output.append(_print_prior(group_specific_term))
-                output.append(f"    Link: {param.link}")
-            # None regression case
-            else:
-                if param.prior is None:
-                    prior = (
-                        component.intercept_term.prior
-                        if param.is_parent
-                        else component.prior
-                    )
-                else:
-                    prior = param.prior
-                output.append(f"    Prior: {prior}")
-            output.append(f"    Explicit bounds: {param.bounds}")
-            output.append(
-                " (ignored due to link function)"
-                if self.link_settings is not None
-                else ""
-            )
-
-        # TODO: Handle p_outlier regression correctly here.
-        if self.p_outlier is not None:
-            output.append("")
-            output.append(f"Lapse probability: {self.p_outlier.prior}")
-            output.append(f"Lapse distribution: {self.lapse}")
-
-        return "\n".join(output)
-
-    def __str__(self) -> str:
-        """Create a string representation of the model."""
-        return self.__repr__()
-
-    @property
-    def traces(self) -> az.InferenceData | pm.Approximation:
-        """Return the trace of the model after sampling.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        az.InferenceData | pm.Approximation
-            The trace of the model after the last call to `sample()`.
-        """
-        if not self._inference_obj:
-            raise ValueError("Please sample the model first.")
-
-        return self._inference_obj
-
-    @property
-    def vi_idata(self) -> az.InferenceData:
-        """Return the variational inference approximation object.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        az.InferenceData
-            The variational inference approximation object.
-        """
-        if not self._inference_obj_vi:
-            raise ValueError(
-                "Please run variational inference first, "
-                "no variational posterior attached."
-            )
-
-        return self._inference_obj_vi
-
-    @property
-    def vi_approx(self) -> pm.Approximation:
-        """Return the variational inference approximation object.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        pm.Approximation
-            The variational inference approximation object.
-        """
-        if not self._vi_approx:
-            raise ValueError(
-                "Please run variational inference first, "
-                "no variational approximation attached."
-            )
-
-        return self._vi_approx
-
-    @property
-    def map(self) -> dict:
-        """Return the MAP estimates of the model parameters.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the MAP estimates of the model parameters.
-        """
-        if not self._map_dict:
-            raise ValueError("Please compute map first.")
-
-        return self._map_dict
-
-    @property
-    def initvals(self) -> dict:
-        """Return the initial values of the model parameters for sampling.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the initial values of the model parameters.
-            This dict serves as the default for initial values, and can be passed
-            directly to the `.sample()` function.
-        """
-        if self._initvals == {}:
-            self._initvals = self.initial_point()
-        return self._initvals
-
-    def _check_lapse(self, lapse):
-        """Determine if p_outlier and lapse is specified correctly."""
-        # Basically, avoid situations where only one of them is specified.
-        if self.has_lapse and lapse is None:
-            raise ValueError(
-                "You have specified `p_outlier`. Please also specify `lapse`."
-            )
-        if lapse is not None and not self.has_lapse:
-            _logger.warning(
-                "You have specified the `lapse` argument to include a lapse "
-                + "distribution, but `p_outlier` is set to either 0 or None. "
-                + "Your lapse distribution will be ignored."
-            )
-        if "p_outlier" in self.list_params and self.list_params[-1] != "p_outlier":
-            raise ValueError(
-                "Please do not include 'p_outlier' in `list_params`. "
-                + "We automatically append it to `list_params` when `p_outlier` "
-                + "parameter is not None"
-            )
-
     def _make_model_distribution(self) -> type[pm.Distribution]:
         """Make a pm.Distribution for the model."""
         ### Logic for different types of likelihoods:
@@ -1959,6 +286,10 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
         if isclass(self.loglik) and issubclass(self.loglik, pm.Distribution):
             return self.loglik
 
+        # Type narrowing: loglik and list_params should be set by this point
+        assert self.loglik is not None, "loglik should be set by model_config"
+        assert self.list_params is not None, "list_params validated in __init__"
+
         params_is_reg = [
             param.is_vector
             for param_name, param in self.params.items()
@@ -2046,255 +377,3 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                 else [deepcopy(self.data[field].values) for field in self.extra_fields]
             ),
         )
-
-    def _get_deterministic_var_names(self, idata) -> list[str]:
-        """Filter out the deterministic variables in var_names."""
-        var_names = [
-            f"~{param_name}"
-            for param_name, param in self.params.items()
-            if (param.is_regression)
-        ]
-
-        if f"{self._parent}_mean" in idata["posterior"].data_vars:
-            var_names.append(f"~{self._parent}_mean")
-
-        # Parent parameters (always regression implicitly)
-        # which don't have a formula attached
-        # should be dropped from var_names, since the actual
-        # parent name shows up as a regression.
-        if f"{self._parent}" in idata["posterior"].data_vars:
-            if self.params[self._parent].formula is None:
-                # Drop from var_names
-                var_names = [var for var in var_names if var != f"~{self._parent}"]
-
-        return var_names
-
-    def _drop_parent_str_from_idata(
-        self, idata: az.InferenceData | None
-    ) -> az.InferenceData:
-        """Drop the parent_str variable from an InferenceData object.
-
-        Parameters
-        ----------
-        idata
-            The InferenceData object to be modified.
-
-        Returns
-        -------
-        xr.Dataset
-            The modified InferenceData object.
-        """
-        if idata is None:
-            raise ValueError("Please provide an InferenceData object.")
-        else:
-            for group in idata.groups():
-                if ("rt,response_mean" in idata[group].data_vars) and (
-                    self._parent not in idata[group].data_vars
-                ):
-                    setattr(
-                        idata,
-                        group,
-                        idata[group].rename({"rt,response_mean": self._parent}),
-                    )
-            return idata
-
-    def _postprocess_initvals_deterministic(
-        self, initval_settings: dict = INITVAL_SETTINGS
-    ) -> None:
-        """Set initial values for subset of parameters."""
-        self._initvals = self.initial_point()
-        # Consider case where link functions are set to 'log_logit'
-        # or 'None'
-        if self.link_settings not in ["log_logit", None]:
-            _logger.info(
-                "Not preprocessing initial values, "
-                + "because none of the two standard link settings are chosen!"
-            )
-            return None
-
-        # Set initial values for particular parameters
-        for name_, starting_value in self.pymc_model.initial_point().items():
-            # strip name of `_log__` and `_interval__` suffixes
-            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
-
-            # We need to check if the parameter is actually backed by
-            # a regression.
-
-            # If not, we don't actually apply a link function to it as per default.
-            # Therefore we need to apply the initial value strategy corresponding
-            # to 'None' link function.
-
-            # If the user actively supplies a link function, the user
-            # should also have supplied an initial value insofar it matters.
-
-            if self.params[self._get_prefix(name_tmp)].is_regression:
-                param_link_setting = self.link_settings
-            else:
-                param_link_setting = None
-            if name_tmp in initval_settings[param_link_setting].keys():
-                if self._check_if_initval_user_supplied(name_tmp):
-                    _logger.info(
-                        "User supplied initial value detected for %s, \n"
-                        " skipping overwrite with default value.",
-                        name_tmp,
-                    )
-                    continue
-
-                # Apply specific settings from initval_settings dictionary
-                dtype = self._initvals[name_tmp].dtype
-                self._initvals[name_tmp] = np.array(
-                    initval_settings[param_link_setting][name_tmp]
-                ).astype(dtype)
-
-    def _get_prefix(self, name_str: str) -> str:
-        """Get parameters wise link setting function from parameter prefix."""
-        # `p_outlier` is the only basic parameter floating around that has
-        # an underscore in it's name.
-        # We need to handle it separately. (Renaming might be better...)
-        if "_" in name_str:
-            if "p_outlier" not in name_str:
-                name_str_prefix = name_str.split("_")[0]
-            else:
-                name_str_prefix = "p_outlier"
-        else:
-            name_str_prefix = name_str
-        return name_str_prefix
-
-    def _check_if_initval_user_supplied(
-        self,
-        name_str: str,
-        return_value: bool = False,
-    ) -> bool | float | int | np.ndarray | dict[str, Any] | None:
-        """Check if initial value is user-supplied."""
-        # The function assumes that the name_str is either raw parameter name
-        # or `paramname_Intercept`, because we only really provide special default
-        # initial values for those types of parameters
-
-        # `p_outlier` is the only basic parameter floating around that has
-        # an underscore in it's name.
-        # We need to handle it separately. (Renaming might be better...)
-        if "_" in name_str:
-            if "p_outlier" not in name_str:
-                name_str_prefix = name_str.split("_")[0]
-                # name_str_suffix = "".join(name_str.split("_")[1:])
-                name_str_suffix = name_str[len(name_str_prefix + "_") :]
-            else:
-                name_str_prefix = "p_outlier"
-                if name_str == "p_outlier":
-                    name_str_suffix = ""
-                else:
-                    # name_str_suffix = "".join(name_str.split("_")[2:])
-                    name_str_suffix = name_str[len("p_outlier_") :]
-        else:
-            name_str_prefix = name_str
-            name_str_suffix = ""
-
-        tmp_param = name_str_prefix
-        if tmp_param == self._parent:
-            # If the parameter was parent it is automatically treated as a
-            # regression.
-            if not name_str_suffix:
-                # No suffix --> Intercept
-                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
-                    args_tmp = getattr(prior_tmp["Intercept"], "args")
-                    if return_value:
-                        return args_tmp.get("initval", None)
-                    else:
-                        return "initval" in args_tmp
-                else:
-                    if return_value:
-                        return None
-                    return False
-            else:
-                # If the parameter has a suffix --> use it
-                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
-                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
-                    if return_value:
-                        return args_tmp.get("initval", None)
-                    else:
-                        return "initval" in args_tmp
-                else:
-                    if return_value:
-                        return None
-                    else:
-                        return False
-        else:
-            # If the parameter is not a parent, it is treated as a regression
-            # only when actively specified as such.
-            if not name_str_suffix:
-                # If no suffix --> treat as basic parameter.
-                if isinstance(self.params[tmp_param].prior, float) or isinstance(
-                    self.params[tmp_param].prior, np.ndarray
-                ):
-                    if return_value:
-                        return self.params[tmp_param].prior
-                    else:
-                        return True
-                elif isinstance(self.params[tmp_param].prior, bmb.Prior):
-                    args_tmp = getattr(self.params[tmp_param].prior, "args")
-                    if "initval" in args_tmp:
-                        if return_value:
-                            return args_tmp["initval"]
-                        else:
-                            return True
-                    else:
-                        if return_value:
-                            return None
-                        else:
-                            return False
-                else:
-                    if return_value:
-                        return None
-                    else:
-                        return False
-            else:
-                # If suffix --> treat as regression and use suffix
-                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
-                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
-                    if return_value:
-                        return args_tmp.get("initval", None)
-                    else:
-                        return "initval" in args_tmp
-                else:
-                    if return_value:
-                        return None
-                    else:
-                        return False
-
-    def _jitter_initvals(
-        self, jitter_epsilon: float = 0.01, vector_only: bool = False
-    ) -> None:
-        """Apply controlled jitter to initial values."""
-        if vector_only:
-            self.__jitter_initvals_vector_only(jitter_epsilon)
-        else:
-            self.__jitter_initvals_all(jitter_epsilon)
-
-    def __jitter_initvals_vector_only(self, jitter_epsilon: float) -> None:
-        # Note: Calling our initial point function here
-        # --> operate on untransformed variables
-        initial_point_dict = self.initvals
-        for name_, starting_value in initial_point_dict.items():
-            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
-            if starting_value.ndim != 0 and starting_value.shape[0] != 1:
-                starting_value_tmp = starting_value + np.random.uniform(
-                    -jitter_epsilon, jitter_epsilon, starting_value.shape
-                ).astype(np.float32)
-
-                # Note: self._initvals shouldn't be None when this is called
-                dtype = self._initvals[name_tmp].dtype
-                self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)
-
-    def __jitter_initvals_all(self, jitter_epsilon: float) -> None:
-        # Note: Calling our initial point function here
-        # --> operate on untransformed variables
-        initial_point_dict = self.initvals
-        # initial_point_dict = self.pymc_model.initial_point()
-        for name_, starting_value in initial_point_dict.items():
-            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
-            starting_value_tmp = starting_value + np.random.uniform(
-                -jitter_epsilon, jitter_epsilon, starting_value.shape
-            ).astype(np.float32)
-
-            dtype = self.initvals[name_tmp].dtype
-            self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)

From e3b9a4077f37721e0d55a925f2f924663b35d9e2 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 15:28:57 -0500
Subject: [PATCH 067/104] test: remove obsolete test_hssmbase.py file

---
 tests/test_hssmbase.py | 346 -----------------------------------------
 1 file changed, 346 deletions(-)
 delete mode 100644 tests/test_hssmbase.py

diff --git a/tests/test_hssmbase.py b/tests/test_hssmbase.py
deleted file mode 100644
index ef30a3a4f..000000000
--- a/tests/test_hssmbase.py
+++ /dev/null
@@ -1,346 +0,0 @@
-import numpy as np
-import pytest
-
-import hssm
-from hssm.base import HSSMBase
-from hssm.likelihoods import DDM, logp_ddm
-from copy import deepcopy
-
-hssm.set_floatX("float32", update_jax=True)
-
-param_v = {
-    "name": "v",
-    "prior": {
-        "Intercept": {"name": "Uniform", "lower": -3.0, "upper": 3.0},
-        "x": {"name": "Uniform", "lower": -0.50, "upper": 0.50},
-        "y": {"name": "Uniform", "lower": -0.50, "upper": 0.50},
-    },
-    "formula": "v ~ 1 + x + y",
-}
-
-param_a = param_v | dict(name="a", formula="a ~ 1 + x + y")
-
-
-@pytest.mark.parametrize(
-    "include, should_raise_exception",
-    [
-        (
-            [param_v],
-            False,
-        ),
-        (
-            [
-                param_v,
-                param_a,
-            ],
-            False,
-        ),
-        (
-            [{"name": "invalid_param", "prior": "invalid_param"}],
-            True,
-        ),
-        (
-            [
-                {
-                    "name": "v",
-                    "prior": {
-                        "Intercept": {"name": "Uniform", "lower": -3.0, "upper": 3.0}
-                    },
-                    "formula": "v ~ 1",
-                    "invalid_key": "identity",
-                }
-            ],
-            True,
-        ),
-        (
-            [
-                {
-                    "name": "v",
-                    "prior": {
-                        "Intercept": {"name": "Uniform", "lower": -3.0, "upper": 3.0}
-                    },
-                    "formula": "invalid_formula",
-                }
-            ],
-            True,
-        ),
-    ],
-)
-def test_transform_params_general(data_ddm_reg, include, should_raise_exception):
-    if should_raise_exception:
-        with pytest.raises(Exception):
-            HSSMBase(data=data_ddm_reg, include=include)
-    else:
-        model = HSSMBase(data=data_ddm_reg, include=include)
-        # Check model properties using a loop
-        param_names = ["v", "a", "z", "t", "p_outlier"]
-        model_param_names = list(model.params.keys())
-        assert model_param_names == param_names
-        assert len(model.params) == 5
-
-
-def test_custom_model(data_ddm):
-    with pytest.raises(
-        ValueError, match="When using a custom model, please provide a `loglik_kind.`"
-    ):
-        HSSMBase(data=data_ddm, model="custom")
-
-    with pytest.raises(
-        ValueError, match="Please provide `list_params` via `model_config`."
-    ):
-        HSSMBase(data=data_ddm, model="custom", loglik_kind="analytical")
-
-    with pytest.raises(
-        ValueError, match="Please provide `list_params` via `model_config`."
-    ):
-        HSSMBase(data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical")
-
-    with pytest.raises(
-        ValueError,
-        match="Please provide `list_params` via `model_config`.",
-    ):
-        HSSMBase(
-            data=data_ddm,
-            model="custom",
-            loglik=DDM,
-            loglik_kind="analytical",
-            model_config={},
-        )
-
-    model = HSSMBase(
-        data=data_ddm,
-        model="custom",
-        model_config={
-            "list_params": ["v", "a", "z", "t"],
-            "choices": [-1, 1],
-            "bounds": {
-                "v": (-3.0, 3.0),
-                "a": (0.3, 2.5),
-                "z": (0.1, 0.9),
-                "t": (0.0, 2.0),
-            },
-        },
-        loglik=logp_ddm,
-        loglik_kind="analytical",
-    )
-
-    assert model.model_name == "custom"
-    assert model.loglik_kind == "analytical"
-    assert model.list_params == ["v", "a", "z", "t", "p_outlier"]
-
-
-def test_model_definition_outside_include(data_ddm):
-    model_with_one_param_fixed = HSSMBase(data_ddm, a=0.5)
-
-    assert "a" in model_with_one_param_fixed.params
-    assert model_with_one_param_fixed.params["a"].prior == 0.5
-
-    model_with_one_param = HSSMBase(
-        data_ddm, a={"prior": {"name": "Normal", "mu": 0.5, "sigma": 0.1}}
-    )
-
-    assert "a" in model_with_one_param.params
-    assert model_with_one_param.params["a"].prior.name == "Normal"
-
-    with pytest.raises(
-        ValueError, match="Parameter `a` specified in both `include` and `kwargs`."
-    ):
-        HSSMBase(data_ddm, include=[{"name": "a", "prior": 0.5}], a=0.5)
-
-
-@pytest.mark.xfail(reason="Broken in CI.")
-def test_sample_prior_predictive(data_ddm_reg):
-    data_ddm_reg = data_ddm_reg.iloc[:10, :]
-
-    model_no_regression = HSSMBase(data=data_ddm_reg)
-    rng = np.random.default_rng()
-
-    model_no_regression.sample_prior_predictive(draws=10)
-    model_no_regression.sample_prior_predictive(draws=10, random_seed=rng)
-
-    model_regression = HSSMBase(
-        data=data_ddm_reg, include=[dict(name="v", formula="v ~ 1 + x")]
-    )
-    model_regression.sample_prior_predictive(draws=10)
-
-    model_regression_a = HSSMBase(
-        data=data_ddm_reg, include=[dict(name="a", formula="a ~ 1 + x")]
-    )
-    model_regression_a.sample_prior_predictive(draws=10)
-
-    model_regression_multi = HSSMBase(
-        data=data_ddm_reg,
-        include=[
-            dict(name="v", formula="v ~ 1 + x"),
-            dict(name="a", formula="a ~ 1 + y"),
-        ],
-    )
-    model_regression_multi.sample_prior_predictive(draws=10)
-
-    data_ddm_reg.loc[:, "subject_id"] = np.arange(10)
-
-    model_regression_random_effect = HSSMBase(
-        data=data_ddm_reg,
-        include=[
-            dict(name="v", formula="v ~ (1|subject_id) + x"),
-            dict(name="a", formula="a ~ (1|subject_id) + y"),
-        ],
-    )
-    model_regression_random_effect.sample_prior_predictive(draws=10)
-
-
-def test_override_default_link(caplog, data_ddm_reg):
-    param_v = {
-        "name": "v",
-        "prior": {
-            "Intercept": {"name": "Uniform", "lower": -3.0, "upper": 3.0},
-            "x": {"name": "Uniform", "lower": -0.50, "upper": 0.50},
-            "y": {"name": "Uniform", "lower": -0.50, "upper": 0.50},
-        },
-        "formula": "v ~ 1 + x + y",
-    }
-    param_v = param_v | dict(bounds=(-np.inf, np.inf))
-    param_a = param_v | dict(name="a", formula="a ~ 1 + x + y", bounds=(0, np.inf))
-    param_z = param_v | dict(name="z", formula="z ~ 1 + x + y", bounds=(0, 1))
-    param_t = param_v | dict(name="t", formula="t ~ 1 + x + y", bounds=(0.1, np.inf))
-
-    model = HSSMBase(
-        data=data_ddm_reg,
-        include=[param_v, param_a, param_z, param_t],
-        link_settings="log_logit",
-    )
-
-    assert model.params["v"].link == "identity"
-    assert model.params["a"].link == "log"
-    assert model.params["z"].link.name == "gen_logit"
-    assert model.params["t"].link == "identity"
-
-    assert "t" in caplog.records[0].message
-    assert "strange" in caplog.records[0].message
-
-
-def test_resampling(data_ddm):
-    model = HSSMBase(data=data_ddm)
-    sample_1 = model.sample(draws=10, chains=1, tune=0)
-    assert sample_1 is model.traces
-
-    sample_2 = model.sample(draws=10, chains=1, tune=0)
-    assert sample_2 is model.traces
-
-    assert sample_1 is not sample_2
-
-
-def test_add_likelihood_parameters_to_data(data_ddm):
-    """Test if the likelihood parameters are added to the InferenceData object."""
-    model = HSSMBase(data=data_ddm)
-    sample_1 = model.sample(draws=10, chains=1, tune=10)
-    sample_1_copy = deepcopy(sample_1)
-    model.add_likelihood_parameters_to_idata(inplace=True)
-
-    # Get distributional components (make sure to take the right aliases)
-    distributional_component_names = [
-        key_ if key_ not in model._aliases else model._aliases[key_]
-        for key_ in model.model.distributional_components.keys()
-    ]
-
-    # Check that after computing the likelihood parameters
-    # all respective parameters appear in the InferenceData object
-    assert np.all(
-        [
-            component_ in model.traces.posterior.data_vars
-            for component_ in distributional_component_names
-        ]
-    )
-
-    # Check that before computing the likelihood parameters
-    # at least one parameter is missing (in the simplest case
-    # this is the {parent}_mean parameter if nothing received a regression)
-
-    assert not np.all(
-        [
-            component_ in sample_1_copy.posterior.data_vars
-            for component_ in distributional_component_names
-        ]
-    )
-
-
-# Setting any parameter to a fixed value should work:
-def test_model_creation_constant_parameter(data_ddm):
-    for param_name in ["v", "a", "z", "t"]:
-        model = HSSMBase(data=data_ddm, **{param_name: 1.0})
-        assert model._parent != param_name
-        assert model.params[param_name].prior == 1.0
-
-
-# Setting any single parameter to a regression should respect the default bounds:
-@pytest.mark.parametrize(
-    "param_name, dist_name",
-    [("v", "Normal"), ("a", "Gamma"), ("z", "Beta"), ("t", "Gamma")],
-)
-def test_model_creation_single_regression(data_ddm_reg, param_name, dist_name):
-    model = HSSMBase(
-        data=data_ddm_reg,
-        include=[{"name": param_name, "formula": f"{param_name} ~ 1 + x"}],
-    )
-    assert model.params[param_name].prior["Intercept"].name == dist_name
-    assert model.params[param_name].prior["x"].name == "Normal"
-
-
-# Setting all parameters to fixed values should throw an error:
-def test_model_creation_all_parameters_constant(data_ddm):
-    with pytest.raises(ValueError):
-        HSSMBase(data=data_ddm, v=1.0, a=1.0, z=1.0, t=1.0)
-
-
-# Prior settings
-def test_prior_settings_basic(cavanagh_test):
-    model_1 = HSSMBase(
-        data=cavanagh_test,
-        global_formula="y ~ 1 + (1|participant_id)",
-        prior_settings=None,
-    )
-
-    assert model_1.params["v"].prior is None, (
-        "Default prior doesn't yield Nonetype for 'v'!"
-    )
-
-    model_2 = HSSMBase(
-        data=cavanagh_test,
-        global_formula="y ~ 1 + (1|participant_id)",
-        prior_settings="safe",
-    )
-
-    assert isinstance(model_2.params[model_2._parent].prior, dict), (
-        "Prior assigned to parent is not a dict!"
-    )
-
-
-def test_compile_logp(cavanagh_test):
-    model_1 = HSSMBase(
-        data=cavanagh_test,
-        global_formula="y ~ 1 + (1|participant_id)",
-        prior_settings=None,
-    )
-
-    out = model_1.compile_logp(model_1.initial_point(transformed=False))
-    assert out is not None
-
-
-def test_sample_do(data_ddm):
-    model = HSSMBase(data=data_ddm)
-    sample_do = model.sample_do(params={"v": 1.0}, draws=10)
-    assert sample_do is not None
-    assert "v_mean" in sample_do.prior.data_vars
-    assert set(sample_do.prior_predictive.dims) == {
-        "chain",
-        "draw",
-        "__obs__",
-        "rt,response_dim",
-    }
-    assert set(sample_do.prior_predictive.coords) == {
-        "chain",
-        "draw",
-        "__obs__",
-        "rt,response_dim",
-    }
-    assert np.unique(sample_do.prior["v_mean"].values) == [1.0]

From a6a1f73086080a5c2df75051bbe358dfdb0b09cb Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 15:44:20 -0500
Subject: [PATCH 068/104] refactor: clean up imports in hssm.py for better
 readability

---
 src/hssm/hssm.py | 39 ++++-----------------------------------
 1 file changed, 4 insertions(+), 35 deletions(-)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 1eb7f2fb8..ec63d5d10 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -6,59 +6,28 @@
 This file defines the entry class HSSM.
 """
 
-import datetime
 import logging
-import typing
 from copy import deepcopy
-from inspect import isclass, signature
-from os import PathLike
-from pathlib import Path
-from typing import Any, Callable, Literal, Optional, Union, cast, get_args
-
-import arviz as az
-import bambi as bmb
-import cloudpickle as cpickle
-import matplotlib as mpl
-import matplotlib.pyplot as plt
-import numpy as np
-import pandas as pd
+from inspect import isclass
+from typing import Literal
+
 import pymc as pm
-import pytensor
-import seaborn as sns
-import xarray as xr
-from bambi.model_components import DistributionalComponent
-from bambi.transformations import transformations_namespace
-from pymc.model.transform.conditioning import do
-from ssms.config import model_config as ssms_model_config
-
-from hssm._types import LoglikKind, SupportedModels
+
 from hssm.base import HSSMBase
 from hssm.defaults import (
-    INITVAL_JITTER_SETTINGS,
-    INITVAL_SETTINGS,
     MissingDataNetwork,
     missing_data_networks_suffix,
 )
 from hssm.distribution_utils import (
     assemble_callables,
     make_distribution,
-    make_family,
     make_likelihood_callable,
     make_missing_data_callable,
 )
 from hssm.utils import (
-    _compute_log_likelihood,
-    _get_alias_dict,
-    _print_prior,
     _rearrange_data,
-    _split_array,
 )
 
-from . import plotting
-from .config import Config, ModelConfig
-from .param import Params
-from .param import UserParam as Param
-
 _logger = logging.getLogger("hssm")
 
 # NOTE: Temporary mapping from old sampler names to new ones in bambi 0.16.0

From 88cd7cc80951651ecb9f2f6bdac4aca1edac9dbd Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 15:54:57 -0500
Subject: [PATCH 069/104] fix: update prior type hint in fill_defaults and
 from_defaults methods to include bmb.Prior

---
 src/hssm/param/simple_param.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/src/hssm/param/simple_param.py b/src/hssm/param/simple_param.py
index 3158198ff..22938c45f 100644
--- a/src/hssm/param/simple_param.py
+++ b/src/hssm/param/simple_param.py
@@ -111,7 +111,7 @@ def from_user_param(cls, user_param: UserParam) -> "SimpleParam":
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | None = None,
+        prior: dict[str, Any] | bmb.Prior | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:
@@ -208,7 +208,10 @@ def __init__(
 
     @classmethod
     def from_defaults(
-        cls, name: str, prior: dict[str, Any], bounds: tuple[int, int]
+        cls,
+        name: str,
+        prior: float | dict[str, Any] | bmb.Prior,
+        bounds: tuple[float, float],
     ) -> "DefaultParam":
         """Create a DefaultParam object from default values.
 
@@ -248,7 +251,7 @@ def process_prior(self) -> None:
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | None = None,
+        prior: dict[str, Any] | bmb.Prior | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:

From 2a27766b905700a4eb6ab5d9e0dd421c674790d3 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 15:56:03 -0500
Subject: [PATCH 070/104] fix: update fill_defaults method to include bmb.Prior
 type hint for prior parameter

---
 src/hssm/param/regression_param.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/param/regression_param.py b/src/hssm/param/regression_param.py
index 26c7fc9f4..1e0a19d67 100644
--- a/src/hssm/param/regression_param.py
+++ b/src/hssm/param/regression_param.py
@@ -111,7 +111,7 @@ def from_defaults(
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | None = None,
+        prior: dict[str, Any] | bmb.Prior | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:

From 9330ab1e2367ff5d6ce9b889ffe07ef61505aa5f Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 15:58:33 -0500
Subject: [PATCH 071/104] fix: add type ignore comments for model.list_params
 and DefaultParam.from_defaults parameters

---
 src/hssm/param/params.py | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/src/hssm/param/params.py b/src/hssm/param/params.py
index 601f755a3..2e5b901af 100644
--- a/src/hssm/param/params.py
+++ b/src/hssm/param/params.py
@@ -206,7 +206,7 @@ def collect_user_params(
         user_param = UserParam.from_dict(param) if isinstance(param, dict) else param
         if user_param.name is None:
             raise ValueError("Parameter name must be specified.")
-        if user_param.name not in model.list_params:
+        if user_param.name not in model.list_params:  # type: ignore
             raise ValueError(
                 f"Parameter {user_param.name} not found in list_params."
                 " This implies that the parameter is not valid for the chosen model."
@@ -222,7 +222,7 @@ def collect_user_params(
     # If any of the keys is found in `list_params` it is a parameter specification.
     # We add the parameter specification to `user_params` and remove it from
     # `kwargs`
-    for param_name in model.list_params:
+    for param_name in model.list_params:  # type: ignore
         # Update user_params only if param_name is in kwargs
         # and not already in user_params
         if param_name in kwargs:
@@ -265,7 +265,7 @@ def make_params(model: HSSM, user_params: dict[str, UserParam]) -> dict[str, Par
         and model.loglik_kind != "approx_differentiable"
     )
 
-    for name in model.list_params:
+    for name in model.list_params:  # type: ignore
         if name in user_params:
             param = make_param_from_user_param(model, name, user_params[name])
         else:
@@ -352,6 +352,10 @@ def make_param_from_defaults(model: HSSM, name: str) -> Param:
             link_settings=model.link_settings,
         )
     else:
-        param = DefaultParam.from_defaults(name, default_prior, default_bounds)
+        param = DefaultParam.from_defaults(
+            name,
+            default_prior,
+            default_bounds,  # type: ignore
+        )
 
     return param

From 6b5ee2ac9fd05d0a6f8c8d6b0bd00189d3e3c8e7 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 15:59:03 -0500
Subject: [PATCH 072/104] fix: update fill_defaults method to include bmb.Prior
 type hint for prior parameter

---
 src/hssm/param/param.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/param/param.py b/src/hssm/param/param.py
index 945f60ec7..cd46e4bdf 100644
--- a/src/hssm/param/param.py
+++ b/src/hssm/param/param.py
@@ -132,7 +132,7 @@ def is_vector(self) -> bool:
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | None = None,
+        prior: dict[str, Any] | bmb.Prior | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:

From 7e9f6809ba5a083c9532b24af8d21b4856c3c4e9 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 16:00:00 -0500
Subject: [PATCH 073/104] fix: replace assertions with ValueError for loglik
 and list_params validation in HSSM class

---
 src/hssm/hssm.py | 12 ++++++++++--
 1 file changed, 10 insertions(+), 2 deletions(-)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index ec63d5d10..2cd5fb1d8 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -256,8 +256,16 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
             return self.loglik
 
         # Type narrowing: loglik and list_params should be set by this point
-        assert self.loglik is not None, "loglik should be set by model_config"
-        assert self.list_params is not None, "list_params validated in __init__"
+        if self.loglik is None:
+            raise ValueError(
+                "Likelihood function (loglik) has not been set. "
+                "This should have been configured during model initialization."
+            )
+        if self.list_params is None:
+            raise ValueError(
+                "list_params has not been set. "
+                "This should have been validated during model initialization."
+            )
 
         params_is_reg = [
             param.is_vector

From 7eb08631c1eae41190f3c6e5f158ceacce37cc4d Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 16:01:30 -0500
Subject: [PATCH 074/104] refactor: remove unused imports from base.py

---
 src/hssm/base.py | 7 -------
 1 file changed, 7 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 2a6a14b01..1b0127e87 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -35,22 +35,15 @@
 from hssm.defaults import (
     INITVAL_JITTER_SETTINGS,
     INITVAL_SETTINGS,
-    MissingDataNetwork,
-    missing_data_networks_suffix,
 )
 from hssm.distribution_utils import (
-    assemble_callables,
-    make_distribution,
     make_family,
-    make_likelihood_callable,
-    make_missing_data_callable,
 )
 from hssm.missing_data_mixin import MissingDataMixin
 from hssm.utils import (
     _compute_log_likelihood,
     _get_alias_dict,
     _print_prior,
-    _rearrange_data,
     _split_array,
 )
 

From ed692bd05e840316787944d2d203e3fc84ac29ab Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 16:12:17 -0500
Subject: [PATCH 075/104] fix: update error message for missing list_params in
 HSSM initialization

---
 tests/test_hssm.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/test_hssm.py b/tests/test_hssm.py
index 92804066e..dac020d4d 100644
--- a/tests/test_hssm.py
+++ b/tests/test_hssm.py
@@ -89,18 +89,18 @@ def test_custom_model(data_ddm):
         HSSM(data=data_ddm, model="custom")
 
     with pytest.raises(
-        ValueError, match="Please provide `list_params` via `model_config`."
+        ValueError, match="Please provide `list_params`*"
     ):
         HSSM(data=data_ddm, model="custom", loglik_kind="analytical")
 
     with pytest.raises(
-        ValueError, match="Please provide `list_params` via `model_config`."
+        ValueError, match="Please provide `list_params`*"
     ):
         HSSM(data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical")
 
     with pytest.raises(
         ValueError,
-        match="Please provide `list_params` via `model_config`.",
+        match="Please provide `list_params`*",
     ):
         HSSM(
             data=data_ddm,

From 0a514c73e90a25576055d330cbb2acd5230f126f Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 16:12:33 -0500
Subject: [PATCH 076/104] fix: add validation for loglik_kind in HSSM class
 initialization

---
 src/hssm/hssm.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 2cd5fb1d8..3fc6d0345 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -266,6 +266,11 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                 "list_params has not been set. "
                 "This should have been validated during model initialization."
             )
+        if self.loglik_kind is None:
+            raise ValueError(
+                "Likelihood kind (loglik_kind) has not been set. "
+                "This should have been configured during model initialization."
+            )
 
         params_is_reg = [
             param.is_vector

From 88edb79e485d8ba18d6fc1e1ad503bcd9926c07a Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 16:12:39 -0500
Subject: [PATCH 077/104] refactor: update comment style for clarity in
 _make_model_distribution method

---
 src/hssm/hssm.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 3fc6d0345..ed29c7425 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -241,7 +241,7 @@ class HSSM(HSSMBase):
 
     def _make_model_distribution(self) -> type[pm.Distribution]:
         """Make a pm.Distribution for the model."""
-        ### Logic for different types of likelihoods:
+        # == Logic for different types of likelihoods:
         # -`analytical` and `blackbox`:
         #     loglik should be a `pm.Distribution`` or a Python callable (any arbitrary
         #     function).

From 8c3c811e0e47eda1819ad834f333a7550261febf Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 16:16:01 -0500
Subject: [PATCH 078/104] fix: handle None values for response and choices in
 HSSMBase initialization

---
 src/hssm/base.py | 20 ++++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 1b0127e87..f48b42e21 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -324,9 +324,17 @@ def __init__(
         # endregion
 
         # region ===== Set up shortcuts so old code will work ======
-        self.response = self.model_config.response
+        self.response = (
+            list(self.model_config.response)
+            if self.model_config.response is not None
+            else None
+        )
         self.list_params = self.model_config.list_params
-        self.choices = self.model_config.choices
+        self.choices = (
+            list(self.model_config.choices)
+            if self.model_config.choices is not None
+            else None
+        )
         self.model_name = self.model_config.model_name
         self.loglik = self.model_config.loglik
         self.loglik_kind = self.model_config.loglik_kind
@@ -533,14 +541,6 @@ def supported_models(cls) -> tuple[SupportedModels, ...]:
         """
         return get_args(SupportedModels)
 
-    @classmethod
-    def _store_init_args(cls, *args, **kwargs):
-        """Store initialization arguments using signature binding."""
-        sig = signature(cls.__init__)
-        bound_args = sig.bind(*args, **kwargs)
-        bound_args.apply_defaults()
-        return {k: v for k, v in bound_args.arguments.items() if k != "self"}
-
     def find_MAP(self, **kwargs):
         """Perform Maximum A Posteriori estimation.
 

From d99163904dd18126440e3e2df3861e72b49976c6 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 11 Feb 2026 18:04:41 -0500
Subject: [PATCH 079/104] fix: streamline exception handling for missing
 list_params in HSSM initialization

---
 tests/test_hssm.py | 8 ++------
 1 file changed, 2 insertions(+), 6 deletions(-)

diff --git a/tests/test_hssm.py b/tests/test_hssm.py
index dac020d4d..93817470d 100644
--- a/tests/test_hssm.py
+++ b/tests/test_hssm.py
@@ -88,14 +88,10 @@ def test_custom_model(data_ddm):
     ):
         HSSM(data=data_ddm, model="custom")
 
-    with pytest.raises(
-        ValueError, match="Please provide `list_params`*"
-    ):
+    with pytest.raises(ValueError, match="Please provide `list_params`*"):
         HSSM(data=data_ddm, model="custom", loglik_kind="analytical")
 
-    with pytest.raises(
-        ValueError, match="Please provide `list_params`*"
-    ):
+    with pytest.raises(ValueError, match="Please provide `list_params`*"):
         HSSM(data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical")
 
     with pytest.raises(

From d7ff4d3c6338501dbf7d645fd94c373943d7316a Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Thu, 12 Feb 2026 09:00:02 -0500
Subject: [PATCH 080/104] Restore init args so tests pass

---
 src/hssm/base.py | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index f48b42e21..6c6971ede 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -291,6 +291,15 @@ def __init__(
         initval_jitter: float = INITVAL_JITTER_SETTINGS["jitter_epsilon"],
         **kwargs,
     ):
+
+        # ===== init args for save/load models =====
+        self._init_args = {
+            k: v for k, v in locals().items() if k not in ["self", "kwargs"]
+        }
+        if kwargs:
+            self._init_args.update(kwargs)
+        # endregion
+
         # ===== Input Data & Configuration =====
         self.data = data.copy()
         self.global_formula = global_formula

From 03624f8971c6486fd4c338d4b9d83aa9e9113891 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Thu, 12 Feb 2026 09:00:18 -0500
Subject: [PATCH 081/104] fix: update instance creation in HSSMBase to use
 class reference

---
 src/hssm/base.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 6c6971ede..e580a6c0b 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -1753,7 +1753,7 @@ def __setstate__(self, state):
             A dictionary containing the constructor arguments under the key
             'constructor_args'.
         """
-        new_instance = HSSMBase(**state["constructor_args"])
+        new_instance = self.__class__(**state["constructor_args"])
         self.__dict__ = new_instance.__dict__
 
     def __repr__(self) -> str:

From 6c7ee40c721f6680693e7bfc3637b4789a238d39 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 13 Feb 2026 12:10:15 -0500
Subject: [PATCH 082/104] refactor: remove extra _set_missing_data_and_deadline
 method from DataValidatorMixin

---
 src/hssm/data_validator.py | 39 --------------------------------------
 1 file changed, 39 deletions(-)

diff --git a/src/hssm/data_validator.py b/src/hssm/data_validator.py
index 19dc2c58e..ae09a43fc 100644
--- a/src/hssm/data_validator.py
+++ b/src/hssm/data_validator.py
@@ -150,45 +150,6 @@ def _update_extra_fields(self, new_data: pd.DataFrame | None = None):
                 new_data[field].values for field in self.extra_fields
             ]
 
-    @staticmethod
-    def _set_missing_data_and_deadline(
-        missing_data: bool, deadline: bool, data: pd.DataFrame
-    ) -> MissingDataNetwork:
-        """Set missing data and deadline."""
-        network = MissingDataNetwork.NONE
-        if not missing_data:
-            return network
-        if missing_data and not deadline:
-            network = MissingDataNetwork.CPN
-        elif missing_data and deadline:
-            network = MissingDataNetwork.OPN
-        # AF-TODO: GONOGO case not yet correctly implemented
-        # else:
-        #     # TODO: This won't behave as expected yet, GONOGO needs to be split
-        #     # into a deadline case and a non-deadline case.
-        #     network = MissingDataNetwork.GONOGO
-
-        if np.all(data["rt"] == -999.0):
-            if network in [MissingDataNetwork.CPN, MissingDataNetwork.OPN]:
-                # AF-TODO: I think we should allow invalid-only datasets.
-                raise ValueError(
-                    "`missing_data` is set to True, but you have no valid data in your "
-                    "dataset."
-                )
-            # AF-TODO: This one needs refinement for GONOGO case
-            # elif network == MissingDataNetwork.OPN:
-            #     raise ValueError(
-            #         "`deadline` is set to True and `missing_data` is set to True, "
-            #         "but ."
-            #     )
-            # else:
-            #     raise ValueError(
-            #         "`missing_data` and `deadline` are both set to True,
-            #         "but you have "
-            #         "no missing data and/or no rts exceeding the deadline."
-            #     )
-        return network
-
     def _validate_choices(self):
         """
         Ensure that `choices` is provided (not None).

From 6443785650db92282f6a84ef88066b7dba8be799 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 13 Feb 2026 12:28:34 -0500
Subject: [PATCH 083/104] refactor: rename test class for clarity in missing
 data handling

---
 tests/test_data_validator.py     | 55 --------------------------------
 tests/test_missing_data_mixin.py |  2 +-
 2 files changed, 1 insertion(+), 56 deletions(-)

diff --git a/tests/test_data_validator.py b/tests/test_data_validator.py
index ab7db255a..ecdc927fa 100644
--- a/tests/test_data_validator.py
+++ b/tests/test_data_validator.py
@@ -162,61 +162,6 @@ class DummyModelDist:
         assert (dv.model_distribution.extra_fields[i] == data[field].values).all()
 
 
-def test_set_missing_data_and_deadline():
-    # No missing data and no deadline
-    data = pd.DataFrame({"rt": [0.5, 0.7]})
-    assert (
-        DataValidatorMixin._set_missing_data_and_deadline(False, False, data)
-        == MissingDataNetwork.NONE
-    )
-    # Missing data but no deadline
-    data = pd.DataFrame({"rt": [0.5, -999.0]})
-    assert (
-        DataValidatorMixin._set_missing_data_and_deadline(True, False, data)
-        == MissingDataNetwork.CPN
-    )
-    assert (
-        DataValidatorMixin._set_missing_data_and_deadline(True, True, data)
-        == MissingDataNetwork.OPN
-    )
-    # AF-TODO: I think GONOGO as a network category can go,
-    # but needs a little more thought, out of scope for PR,
-    # during which this was commented out.
-    # assert (
-    #     DataValidatorMixin._set_missing_data_and_deadline(True, True, data)
-    #     == MissingDataNetwork.GONOGO
-    # )
-
-
-def test_set_missing_data_and_deadline_all_missing():
-    data = pd.DataFrame({"rt": [-999.0, -999.0]})
-    # cpn
-    with pytest.raises(
-        ValueError,
-        match="`missing_data` is set to True, but you have no valid data in your "
-        "dataset.",
-    ):
-        DataValidatorMixin._set_missing_data_and_deadline(True, False, data)
-
-    # opn
-    with pytest.raises(
-        ValueError,
-        match="`missing_data` is set to True, but you have no valid data in your "
-        "dataset.",
-    ):
-        DataValidatorMixin._set_missing_data_and_deadline(True, True, data)
-
-    # AF-TODO: GONOGO case not yet correctly implemented
-    # gonogo
-    # data = pd.DataFrame({"rt": [-999.0, -999.0]})
-    # with pytest.raises(
-    #     ValueError,
-    #     match="`missing_data` is set to True, but you have no valid data in your "
-    #     + "dataset.",
-    # ):
-    #     DataValidatorMixin._set_missing_data_and_deadline(True, True, data)
-
-
 def test_validate_choices():
     # ====== Valid choices =====
     dv = DataValidatorMixin(
diff --git a/tests/test_missing_data_mixin.py b/tests/test_missing_data_mixin.py
index cff5f782b..ed33d3097 100644
--- a/tests/test_missing_data_mixin.py
+++ b/tests/test_missing_data_mixin.py
@@ -50,7 +50,7 @@ def model(request):
 # endregion
 
 
-class TestMissingDataMixinOld:
+class TestProcessMissingDataAndDeadline:
     @pytest.mark.parametrize(
         "model, deadline",
         [

From 4f6eb7bcc7df6af64489d9e7df8799e1c613d890 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 13 Feb 2026 12:29:09 -0500
Subject: [PATCH 084/104] fix: update exception message regex for list_params
 validation in HSSM

---
 tests/test_hssm.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/test_hssm.py b/tests/test_hssm.py
index 93817470d..81d4a2011 100644
--- a/tests/test_hssm.py
+++ b/tests/test_hssm.py
@@ -88,10 +88,10 @@ def test_custom_model(data_ddm):
     ):
         HSSM(data=data_ddm, model="custom")
 
-    with pytest.raises(ValueError, match="Please provide `list_params`*"):
+    with pytest.raises(ValueError, match=r"^Please provide `list_params`"):
         HSSM(data=data_ddm, model="custom", loglik_kind="analytical")
 
-    with pytest.raises(ValueError, match="Please provide `list_params`*"):
+    with pytest.raises(ValueError, match=r"^Please provide `list_params`"):
         HSSM(data=data_ddm, model="custom", loglik=DDM, loglik_kind="analytical")
 
     with pytest.raises(

From 0a05fc8b62a4a71777e2ff9c764c388042e0117a Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 13 Feb 2026 13:09:41 -0500
Subject: [PATCH 085/104] fix: improve error message for unspecified bounds in
 _make_default_prior function

---
 src/hssm/param/utils.py           | 2 +-
 tests/param/test_default_param.py | 5 +++++
 2 files changed, 6 insertions(+), 1 deletion(-)

diff --git a/src/hssm/param/utils.py b/src/hssm/param/utils.py
index 96965f272..6d630f673 100644
--- a/src/hssm/param/utils.py
+++ b/src/hssm/param/utils.py
@@ -26,7 +26,7 @@ def _make_default_prior(bounds: tuple[float, float] | None) -> bmb.Prior:
         A bmb.Prior object representing the default prior for the provided bounds.
     """
     if bounds is None:
-        raise ValueError("Parameter unspecified.")
+        raise ValueError("Bounds parameter unspecified.")
     lower, upper = bounds
     if np.isinf(lower) and np.isinf(upper):
         prior = bmb.Prior("Normal", mu=0.0, sigma=2.0)
diff --git a/tests/param/test_default_param.py b/tests/param/test_default_param.py
index 2a90be3f1..3f86ebaa7 100644
--- a/tests/param/test_default_param.py
+++ b/tests/param/test_default_param.py
@@ -4,6 +4,7 @@
 
 from hssm import Prior
 from hssm.param.simple_param import DefaultParam
+from hssm.param.utils import _make_default_prior
 
 
 def test_from_defaults():
@@ -40,3 +41,7 @@ def test_make_default_prior(bounds, prior):
     assert param.prior.name == prior.pop("name")
     for key, value in prior.items():
         assert param.prior.args[key] == value
+
+
+def test_make_default_prior_no_bounds():
+    pytest.raises(ValueError, _make_default_prior, None)

From d20b0a4f27dcdd4fdc50c6cc32419bed7cf3dbda Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 13 Feb 2026 13:35:49 -0500
Subject: [PATCH 086/104] fix: ensure model_name is retrieved correctly in
 RLSSMConfig initialization

---
 src/hssm/config.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/hssm/config.py b/src/hssm/config.py
index 9386d982e..58f2e9224 100644
--- a/src/hssm/config.py
+++ b/src/hssm/config.py
@@ -326,8 +326,8 @@ def from_rlssm_dict(cls, model_name: str, config_dict: dict[str, Any]):
                 raise ValueError(f"{field_name} must be provided in config_dict")
 
         return cls(
-            model_name=model_name,
-            description=config_dict.get("description"),
+            model_name=config_dict.get("model_name", model_name),
+            description=config_dict["description"],
             list_params=config_dict["list_params"],
             extra_fields=config_dict.get("extra_fields"),
             params_default=config_dict["params_default"],

From 6ba3d9dab00e912db642530206a68fe35e9efabf Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 13 Feb 2026 15:04:02 -0500
Subject: [PATCH 087/104] fix: remove 'data' field from RLSSM_REQUIRED_FIELDS

---
 src/hssm/config.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/src/hssm/config.py b/src/hssm/config.py
index 58f2e9224..23f5a921b 100644
--- a/src/hssm/config.py
+++ b/src/hssm/config.py
@@ -31,7 +31,6 @@
     "list_params",
     "bounds",
     "params_default",
-    "data",
     "choices",
     "decision_process",
     "learning_process",

From 0f4bd5125ac087eed7948b1129cab48a7e68fbea Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 13 Feb 2026 16:19:21 -0500
Subject: [PATCH 088/104] Use base in HSSM class

---
 src/hssm/hssm.py | 2067 +---------------------------------------------
 1 file changed, 27 insertions(+), 2040 deletions(-)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 19508a342..ed29c7425 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -6,60 +6,28 @@
 This file defines the entry class HSSM.
 """
 
-import datetime
 import logging
-import typing
 from copy import deepcopy
-from inspect import isclass, signature
-from os import PathLike
-from pathlib import Path
-from typing import Any, Callable, Literal, Optional, Union, cast, get_args
+from inspect import isclass
+from typing import Literal
 
-import arviz as az
-import bambi as bmb
-import cloudpickle as cpickle
-import matplotlib as mpl
-import matplotlib.pyplot as plt
-import numpy as np
-import pandas as pd
 import pymc as pm
-import pytensor
-import seaborn as sns
-import xarray as xr
-from bambi.model_components import DistributionalComponent
-from bambi.transformations import transformations_namespace
-from pymc.model.transform.conditioning import do
-from ssms.config import model_config as ssms_model_config
 
-from hssm._types import LoglikKind, SupportedModels
-from hssm.data_validator import DataValidatorMixin
+from hssm.base import HSSMBase
 from hssm.defaults import (
-    INITVAL_JITTER_SETTINGS,
-    INITVAL_SETTINGS,
     MissingDataNetwork,
     missing_data_networks_suffix,
 )
 from hssm.distribution_utils import (
     assemble_callables,
     make_distribution,
-    make_family,
     make_likelihood_callable,
     make_missing_data_callable,
 )
-from hssm.missing_data_mixin import MissingDataMixin
 from hssm.utils import (
-    _compute_log_likelihood,
-    _get_alias_dict,
-    _print_prior,
     _rearrange_data,
-    _split_array,
 )
 
-from . import plotting
-from .config import Config, ModelConfig
-from .param import Params
-from .param import UserParam as Param
-
 _logger = logging.getLogger("hssm")
 
 # NOTE: Temporary mapping from old sampler names to new ones in bambi 0.16.0
@@ -98,7 +66,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSM(DataValidatorMixin, MissingDataMixin):
+class HSSM(HSSMBase):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters
@@ -271,1735 +239,9 @@ class HSSM(DataValidatorMixin, MissingDataMixin):
         The jitter value for the initial values.
     """
 
-    def __init__(
-        self,
-        data: pd.DataFrame,
-        model: SupportedModels | str = "ddm",
-        choices: list[int] | None = None,
-        include: list[dict[str, Any] | Param] | None = None,
-        model_config: ModelConfig | dict | None = None,
-        loglik: (
-            str | PathLike | Callable | pytensor.graph.Op | type[pm.Distribution] | None
-        ) = None,
-        loglik_kind: LoglikKind | None = None,
-        p_outlier: float | dict | bmb.Prior | None = 0.05,
-        lapse: dict | bmb.Prior | None = bmb.Prior("Uniform", lower=0.0, upper=20.0),
-        global_formula: str | None = None,
-        link_settings: Literal["log_logit"] | None = None,
-        prior_settings: Literal["safe"] | None = "safe",
-        extra_namespace: dict[str, Any] | None = None,
-        missing_data: bool | float = False,
-        deadline: bool | str = False,
-        loglik_missing_data: (
-            str | PathLike | Callable | pytensor.graph.Op | None
-        ) = None,
-        process_initvals: bool = True,
-        initval_jitter: float = INITVAL_JITTER_SETTINGS["jitter_epsilon"],
-        **kwargs,
-    ):
-        # Attach arguments to the instance
-        # so that we can easily define some
-        # methods that need to access these
-        # arguments (context: pickling / save - load).
-
-        # Define a dict with all call arguments:
-        self._init_args = {
-            k: v for k, v in locals().items() if k not in ["self", "kwargs"]
-        }
-        if kwargs:
-            self._init_args.update(kwargs)
-
-        self.data = data.copy()
-        self._inference_obj: az.InferenceData | None = None
-        self._initvals: dict[str, Any] = {}
-        self.initval_jitter = initval_jitter
-        self._inference_obj_vi: pm.Approximation | None = None
-        self._vi_approx = None
-        self._map_dict = None
-        self.global_formula = global_formula
-
-        self.link_settings = link_settings
-        self.prior_settings = prior_settings
-
-        self.missing_data_value = -999.0
-
-        additional_namespace = transformations_namespace.copy()
-        if extra_namespace is not None:
-            additional_namespace.update(extra_namespace)
-        self.additional_namespace = additional_namespace
-
-        # Construct a model_config from defaults
-        self.model_config = Config.from_defaults(model, loglik_kind)
-        # Update defaults with user-provided config, if any
-        if model_config is not None:
-            if isinstance(model_config, dict):
-                if "choices" not in model_config:
-                    if choices is not None:
-                        model_config["choices"] = tuple(choices)
-                else:
-                    if choices is not None:
-                        _logger.info(
-                            "choices list provided in both model_config and "
-                            "as an argument directly."
-                            " Using the one provided in model_config. \n"
-                            "We recommend providing choices in model_config."
-                        )
-            elif isinstance(model_config, ModelConfig):
-                if model_config.choices is None:
-                    if choices is not None:
-                        model_config.choices = tuple(choices)
-                else:
-                    if choices is not None:
-                        _logger.info(
-                            "choices list provided in both model_config and "
-                            "as an argument directly."
-                            " Using the one provided in model_config. \n"
-                            "We recommend providing choices in model_config."
-                        )
-
-            self.model_config.update_config(
-                model_config
-                if isinstance(model_config, ModelConfig)
-                else ModelConfig(**model_config)  # also serves as dict validation
-            )
-        else:
-            # Model config is not provided, but at this point was constructed from
-            # defaults.
-            if model not in typing.get_args(SupportedModels):
-                # TODO: ideally use self.supported_models above but mypy doesn't like it
-                if choices is not None:
-                    self.model_config.update_choices(choices)
-                elif model in ssms_model_config:
-                    self.model_config.update_choices(
-                        ssms_model_config[model]["choices"]
-                    )
-                    _logger.info(
-                        "choices argument passed as None, "
-                        "but found %s in ssms-simulators. "
-                        "Using choices, from ssm-simulators configs: %s",
-                        model,
-                        ssms_model_config[model]["choices"],
-                    )
-            else:
-                # Model config already constructed from defaults, and model string is
-                # in SupportedModels. So we are guaranteed that choices are in
-                # self.model_config already.
-
-                if choices is not None:
-                    _logger.info(
-                        "Model string is in SupportedModels."
-                        " Ignoring choices arguments."
-                    )
-
-        # Update loglik with user-provided value
-        self.model_config.update_loglik(loglik)
-        # Ensure that all required fields are valid
-        self.model_config.validate()
-
-        # Set up shortcuts so old code will work
-        self.response = self.model_config.response
-        self.list_params = self.model_config.list_params
-        self.choices = self.model_config.choices
-        self.model_name = self.model_config.model_name
-        self.loglik = self.model_config.loglik
-        self.loglik_kind = self.model_config.loglik_kind
-        self.extra_fields = self.model_config.extra_fields
-
-        self.n_choices = len(self.choices)
-
-        self._validate_choices()
-        self._pre_check_data_sanity()
-
-        # Process missing data setting
-        # AF-TODO: Could be a function in data validator?
-        if isinstance(missing_data, float):
-            if not ((self.data.rt == missing_data).any()):
-                raise ValueError(
-                    f"missing_data argument is provided as a float {missing_data}, "
-                    f"However, you have no RTs of {missing_data} in your dataset!"
-                )
-            else:
-                self.missing_data = True
-                self.missing_data_value = missing_data
-        elif isinstance(missing_data, bool):
-            if missing_data and (not (self.data.rt == -999.0).any()):
-                raise ValueError(
-                    "missing_data argument is provided as True, "
-                    " so RTs of -999.0 are treated as missing. \n"
-                    "However, you have no RTs of -999.0 in your dataset!"
-                )
-            elif (not missing_data) and (self.data.rt == -999.0).any():
-                # self.missing_data = True
-                raise ValueError(
-                    "Missing data provided as False. \n"
-                    "However, you have RTs of -999.0 in your dataset!"
-                )
-            else:
-                self.missing_data = missing_data
-        else:
-            raise ValueError(
-                "missing_data argument must be a bool or a float! \n"
-                f"You provided: {type(missing_data)}"
-            )
-
-        if isinstance(deadline, str):
-            self.deadline = True
-            self.deadline_name = deadline
-        else:
-            self.deadline = deadline
-            self.deadline_name = "deadline"
-
-        if (
-            not self.missing_data and not self.deadline
-        ) and loglik_missing_data is not None:
-            raise ValueError(
-                "You have specified a loglik_missing_data function, but you have not "
-                + "set the missing_data or deadline flag to True."
-            )
-        self.loglik_missing_data = loglik_missing_data
-
-        # Update data based on missing_data and deadline
-        self._handle_missing_data_and_deadline()
-        # Set self.missing_data_network based on `missing_data` and `deadline`
-        self.missing_data_network = self._set_missing_data_and_deadline(
-            self.missing_data, self.deadline, self.data
-        )
-
-        if self.deadline:
-            # self.response is a tuple (from Config); use concatenation.
-            self.response.append(self.deadline_name)
-
-        # Process lapse distribution
-        self.has_lapse = p_outlier is not None and p_outlier != 0
-        self._check_lapse(lapse)
-        if self.has_lapse and self.list_params[-1] != "p_outlier":
-            self.list_params.append("p_outlier")
-
-        # Process all parameters
-        self.params = Params.from_user_specs(
-            model=self,
-            include=[] if include is None else include,
-            kwargs=kwargs,
-            p_outlier=p_outlier,
-        )
-
-        self._parent = self.params.parent
-        self._parent_param = self.params.parent_param
-
-        self._validate_fixed_vectors()
-        self.formula, self.priors, self.link = self.params.parse_bambi(model=self)
-
-        # For parameters that have a regression backend, apply bounds at the likelihood
-        # level to ensure that the samples that are out of bounds
-        # are discarded (replaced with a large negative value).
-        self.bounds = {
-            name: param.bounds
-            for name, param in self.params.items()
-            if param.is_regression and param.bounds is not None
-        }
-
-        # Set p_outlier and lapse
-        self.p_outlier = self.params.get("p_outlier")
-        self.lapse = lapse if self.has_lapse else None
-
-        self._post_check_data_sanity()
-
-        self.model_distribution = self._make_model_distribution()
-
-        self.family = make_family(
-            self.model_distribution,
-            self.list_params,
-            self.link,
-            self._parent,
-        )
-
-        self.model = bmb.Model(
-            self.formula,
-            data=self.data,
-            family=self.family,
-            priors=self.priors,  # center_predictors=False
-            extra_namespace=self.additional_namespace,
-            **kwargs,
-        )
-
-        self._aliases = _get_alias_dict(
-            self.model, self._parent_param, self.response_c, self.response_str
-        )
-        self.set_alias(self._aliases)
-        self.model.build()
-
-        # Bambi >= 0.17 declares dims=("__obs__",) for intercept-only
-        # deterministics that actually have shape (1,). This causes an
-        # xarray CoordinateValidationError during pm.sample() when ArviZ
-        # tries to create a DataArray with mismatched dimension sizes.
-        # Fix by removing the dims declaration for these deterministics.
-        self._fix_scalar_deterministic_dims()
-
-        if process_initvals:
-            self._postprocess_initvals_deterministic(initval_settings=INITVAL_SETTINGS)
-        if self.initval_jitter > 0:
-            self._jitter_initvals(
-                jitter_epsilon=self.initval_jitter,
-                vector_only=True,
-            )
-
-        # Make sure we reset rvs_to_initial_values --> Only None's
-        # Otherwise PyMC barks at us when asking to compute likelihoods
-        self.pymc_model.rvs_to_initial_values.update(
-            {key_: None for key_ in self.pymc_model.rvs_to_initial_values.keys()}
-        )
-        _logger.info("Model initialized successfully.")
-
-    def _fix_scalar_deterministic_dims(self) -> None:
-        """Fix dims metadata for scalar deterministics.
-
-        Bambi >= 0.17 returns shape ``(1,)`` for intercept-only
-        deterministics but still declares ``dims=("__obs__",)``. This causes
-        an xarray ``CoordinateValidationError`` during ``pm.sample()`` because
-        the ``__obs__`` coordinate has ``n_obs`` entries. Removing the dims
-        declaration for these variables lets ArviZ handle them as
-        un-dimensioned arrays, avoiding the conflict.
-        """
-        n_obs = len(self.data)
-        dims_dict = self.pymc_model.named_vars_to_dims
-        for det in self.pymc_model.deterministics:
-            if det.name not in dims_dict:
-                continue
-            dims = dims_dict[det.name]
-            if "__obs__" in dims:
-                # Check static shape: if it doesn't match n_obs, remove dims
-                try:
-                    shape_0 = det.type.shape[0]
-                except (IndexError, TypeError):
-                    continue
-                if shape_0 is not None and shape_0 != n_obs:
-                    del dims_dict[det.name]
-
-    def _validate_fixed_vectors(self) -> None:
-        """Validate that fixed-vector parameters have the correct length.
-
-        Fixed-vector parameters (``prior=np.ndarray``) bypass Bambi's formula
-        system entirely --- they are passed as a scalar ``0.0`` placeholder to
-        Bambi, and the real vector is substituted inside
-        ``HSSMDistribution.logp()`` (see ``dist.py``).  Because this
-        substitution is invisible to Bambi, we must validate the vector length
-        against ``len(self.data)`` up front to catch shape mismatches early.
-        """
-        for name, param in self.params.items():
-            if isinstance(param.prior, np.ndarray):
-                if len(param.prior) != len(self.data):
-                    raise ValueError(
-                        f"Fixed vector for parameter '{name}' has length "
-                        f"{len(param.prior)}, but data has {len(self.data)} rows."
-                    )
-
-    @classproperty
-    def supported_models(cls) -> tuple[SupportedModels, ...]:
-        """Get a tuple of all supported models.
-
-        Returns
-        -------
-        tuple[SupportedModels, ...]
-            A tuple containing all supported model names.
-        """
-        return get_args(SupportedModels)
-
-    @classmethod
-    def _store_init_args(cls, *args, **kwargs):
-        """Store initialization arguments using signature binding."""
-        sig = signature(cls.__init__)
-        bound_args = sig.bind(*args, **kwargs)
-        bound_args.apply_defaults()
-        return {k: v for k, v in bound_args.arguments.items() if k != "self"}
-
-    def find_MAP(self, **kwargs):
-        """Perform Maximum A Posteriori estimation.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the MAP estimates of the model parameters.
-        """
-        self._map_dict = pm.find_MAP(model=self.pymc_model, **kwargs)
-        return self._map_dict
-
-    def sample(
-        self,
-        sampler: Literal["pymc", "numpyro", "blackjax", "nutpie", "laplace"]
-        | None = None,
-        init: str | None = None,
-        initvals: str | dict | None = None,
-        include_response_params: bool = False,
-        **kwargs,
-    ) -> az.InferenceData | pm.Approximation:
-        """Perform sampling using the `fit` method via bambi.Model.
-
-        Parameters
-        ----------
-        sampler: optional
-            The sampler to use. Can be one of "pymc", "numpyro",
-            "blackjax", "nutpie", or "laplace". If using `blackbox` likelihoods,
-            this cannot be "numpyro", "blackjax", or "nutpie". By default it is None,
-            and sampler will automatically be chosen: when the model uses the
-            `approx_differentiable` likelihood, and `jax` backend, "numpyro" will
-            be used. Otherwise, "pymc" (the default PyMC NUTS sampler) will be used.
-
-            Note that the old sampler names such as "mcmc", "nuts_numpyro",
-            "nuts_blackjax" will be deprecated and removed in future releases. A warning
-            will be raised if any of these old names are used.
-        init: optional
-            Initialization method to use for the sampler. If any of the NUTS samplers
-            is used, defaults to `"adapt_diag"`. Otherwise, defaults to `"auto"`.
-        initvals: optional
-            Pass initial values to the sampler. This can be a dictionary of initial
-            values for parameters of the model, or a string "map" to use initialization
-            at the MAP estimate. If "map" is used, the MAP estimate will be computed if
-            not already attached to the base class from prior call to 'find_MAP'.
-        include_response_params: optional
-            Include parameters of the response distribution in the output. These usually
-            take more space than other parameters as there's one of them per
-            observation. Defaults to False.
-        kwargs
-            Other arguments passed to bmb.Model.fit(). Please see [here]
-            (https://bambinos.github.io/bambi/api_reference.html#bambi.models.Model.fit)
-            for full documentation.
-
-        Returns
-        -------
-        az.InferenceData | pm.Approximation
-            A reference to the `model.traces` object, which stores the traces of the
-            last call to `model.sample()`. `model.traces` is an ArviZ `InferenceData`
-            instance if `sampler` is `"pymc"` (default), `"numpyro"`,
-            `"blackjax"` or "`laplace".
-        """
-        # If initvals are None (default)
-        # we skip processing initvals here.
-        if sampler in _new_sampler_mapping:
-            _logger.warning(
-                f"Sampler '{sampler}' is deprecated. "
-                "Please use the new sampler names: "
-                "'pymc', 'numpyro', 'blackjax', 'nutpie', or 'laplace'."
-            )
-            sampler = _new_sampler_mapping[sampler]  # type: ignore
-
-        if sampler == "vi":
-            raise ValueError(
-                "VI is not supported via the sample() method. "
-                "Please use the vi() method instead."
-            )
-
-        if initvals is not None:
-            if isinstance(initvals, dict):
-                kwargs["initvals"] = initvals
-            else:
-                if isinstance(initvals, str):
-                    if initvals == "map":
-                        if self._map_dict is None:
-                            _logger.info(
-                                "initvals='map' but no map"
-                                "estimate precomputed. \n"
-                                "Running map estimation first..."
-                            )
-                            self.find_MAP()
-                            kwargs["initvals"] = self._map_dict
-                        else:
-                            kwargs["initvals"] = self._map_dict
-                else:
-                    raise ValueError(
-                        "initvals argument must be a dictionary or 'map'"
-                        " to use the MAP estimate."
-                    )
-        else:
-            kwargs["initvals"] = self._initvals
-            _logger.info("Using default initvals. \n")
-
-        if sampler is None:
-            if (
-                self.loglik_kind == "approx_differentiable"
-                and self.model_config.backend == "jax"
-            ):
-                sampler = "numpyro"
-            else:
-                sampler = "pymc"
-
-        if self.loglik_kind == "blackbox":
-            if sampler in ["blackjax", "numpyro", "nutpie"]:
-                raise ValueError(
-                    f"{sampler} sampler does not work with blackbox likelihoods."
-                )
-
-            if "step" not in kwargs:
-                kwargs |= {"step": pm.Slice(model=self.pymc_model)}
-
-        if (
-            self.loglik_kind == "approx_differentiable"
-            and self.model_config.backend == "jax"
-            and sampler == "pymc"
-            and kwargs.get("cores", None) != 1
-        ):
-            _logger.warning(
-                "Parallel sampling might not work with `jax` backend and the PyMC NUTS "
-                + "sampler on some platforms. Please consider using `numpyro`, "
-                + "`blackjax`, or `nutpie` sampler if that is a problem."
-            )
-
-        if self._check_extra_fields():
-            self._update_extra_fields()
-
-        if init is None:
-            if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]:
-                init = "adapt_diag"
-            else:
-                init = "auto"
-
-        # If sampler is finally `numpyro` make sure
-        # the jitter argument is set to False
-        if sampler == "numpyro":
-            if "nuts_sampler_kwargs" in kwargs:
-                if kwargs["nuts_sampler_kwargs"].get("jitter"):
-                    _logger.warning(
-                        "The jitter argument is set to True. "
-                        + "This argument is not supported "
-                        + "by the numpyro backend. "
-                        + "The jitter argument will be set to False."
-                    )
-                kwargs["nuts_sampler_kwargs"]["jitter"] = False
-            else:
-                kwargs["nuts_sampler_kwargs"] = {"jitter": False}
-
-        if sampler != "pymc" and "step" in kwargs:
-            raise ValueError(
-                "`step` samplers (enabled by the `step` argument) are only supported "
-                "by the `pymc` sampler."
-            )
-
-        if self._inference_obj is not None:
-            _logger.warning(
-                "The model has already been sampled. Overwriting the previous "
-                + "inference object. Any previous reference to the inference object "
-                + "will still point to the old object."
-            )
-
-        # Define whether likelihood should be computed
-        compute_likelihood = True
-        if "idata_kwargs" in kwargs:
-            if "log_likelihood" in kwargs["idata_kwargs"]:
-                compute_likelihood = kwargs["idata_kwargs"].pop("log_likelihood", True)
-
-        omit_offsets = kwargs.pop("omit_offsets", False)
-        self._inference_obj = self.model.fit(
-            inference_method=(
-                "pymc"
-                if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]
-                else sampler
-            ),
-            init=init,
-            include_response_params=include_response_params,
-            omit_offsets=omit_offsets,
-            **kwargs,
-        )
-
-        # Separate out log likelihood computation
-        if compute_likelihood:
-            self.log_likelihood(self._inference_obj, inplace=True)
-
-        # Subset data vars in posterior
-        self._clean_posterior_group(idata=self._inference_obj)
-        return self.traces
-
-    def vi(
-        self,
-        method: str = "advi",
-        niter: int = 10000,
-        draws: int = 1000,
-        return_idata: bool = True,
-        ignore_mcmc_start_point_defaults=False,
-        **vi_kwargs,
-    ) -> pm.Approximation | az.InferenceData:
-        """Perform Variational Inference.
-
-        Parameters
-        ----------
-        niter : int
-            The number of iterations to run the VI algorithm. Defaults to 3000.
-        method : str
-            The method to use for VI. Can be one of "advi" or "fullrank_advi", "svgd",
-            "asvgd".Defaults to "advi".
-        draws : int
-            The number of samples to draw from the posterior distribution.
-            Defaults to 1000.
-        return_idata : bool
-            If True, returns an InferenceData object. Otherwise, returns the
-            approximation object directly. Defaults to True.
-
-        Returns
-        -------
-            pm.Approximation or az.InferenceData: The mean field approximation object.
-        """
-        if self.loglik_kind == "analytical":
-            _logger.warning(
-                "VI is not recommended for the analytical likelihood,"
-                " since gradients can be brittle."
-            )
-        elif self.loglik_kind == "blackbox":
-            raise ValueError(
-                "VI is not supported for blackbox likelihoods, "
-                " since likelihood gradients are needed!"
-            )
-
-        if ("start" not in vi_kwargs) and not ignore_mcmc_start_point_defaults:
-            _logger.info("Using MCMC starting point defaults.")
-            vi_kwargs["start"] = self._initvals
-
-        # Run variational inference directly from pymc model
-        with self.pymc_model:
-            self._vi_approx = pm.fit(n=niter, method=method, **vi_kwargs)
-
-        # Sample from the approximate posterior
-        if self._vi_approx is not None:
-            self._inference_obj_vi = self._vi_approx.sample(draws)
-
-        # Post-processing
-        self._clean_posterior_group(idata=self._inference_obj_vi)
-
-        # Return the InferenceData object if return_idata is True
-        if return_idata:
-            return self._inference_obj_vi
-        # Otherwise return the appromation object directly
-        return self.vi_approx
-
-    def _clean_posterior_group(self, idata: az.InferenceData | None = None):
-        """Clean up the posterior group of the InferenceData object.
-
-        Parameters
-        ----------
-        idata : az.InferenceData
-            The InferenceData object to clean up. If None, the last InferenceData object
-            will be used.
-        """
-        # # Logic behind which variables to keep:
-        # # We essentially want to get rid of
-        # # all the trial-wise variables.
-
-        # # We drop all distributional components, IF they are deterministics
-        # # (in which case they will be trial wise systematically)
-        # # and we keep distributional components, IF they are
-        # # basic random-variabels (in which case they should never
-        # # appear trial-wise).
-        if idata is None:
-            raise ValueError(
-                "The InferenceData object is None. Cannot clean up the posterior group."
-            )
-        elif not hasattr(idata, "posterior"):
-            raise ValueError(
-                "The InferenceData object does not have a posterior group. "
-                + "Cannot clean up the posterior group."
-            )
-
-        vars_to_keep = set(idata["posterior"].data_vars.keys()).difference(
-            set(
-                key_
-                for key_ in self.model.distributional_components.keys()
-                if key_ in [var_.name for var_ in self.pymc_model.deterministics]
-            )
-        )
-        vars_to_keep_clean = [
-            var_
-            for var_ in vars_to_keep
-            if isinstance(var_, str) and "_mean" not in var_
-        ]
-
-        setattr(
-            idata,
-            "posterior",
-            idata["posterior"][vars_to_keep_clean],
-        )
-
-    def log_likelihood(
-        self,
-        idata: az.InferenceData | None = None,
-        data: pd.DataFrame | None = None,
-        inplace: bool = True,
-        keep_likelihood_params: bool = False,
-    ) -> az.InferenceData | None:
-        """Compute the log likelihood of the model.
-
-        Parameters
-        ----------
-        idata : optional
-            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
-        data : optional
-            A pandas DataFrame with values for the predictors that are used to obtain
-            out-of-sample predictions. If omitted, the original dataset is used.
-        inplace : optional
-            If `True` will modify idata in-place and append a `log_likelihood` group to
-            `idata`. Otherwise, it will return a copy of idata with the predictions
-            added, by default True.
-        keep_likelihood_params : optional
-            If `True`, the trial wise likelihood parameters that are computed
-            on route to getting the log likelihood are kept in the `idata` object.
-            Defaults to False. See also the method `add_likelihood_parameters_to_idata`.
-
-        Returns
-        -------
-        az.InferenceData | None
-            InferenceData or None
-        """
-        if self._inference_obj is None and idata is None:
-            raise ValueError(
-                "Neither has the model been sampled yet nor"
-                + " an idata object has been provided."
-            )
-
-        if idata is None:
-            if self._inference_obj is None:
-                raise ValueError(
-                    "The model has not been sampled yet. "
-                    + "Please provide an idata object."
-                )
-            else:
-                idata = self._inference_obj
-
-        # Actual likelihood computation
-        idata = _compute_log_likelihood(self.model, idata, data, inplace)
-
-        # clean up posterior:
-        if not keep_likelihood_params:
-            self._clean_posterior_group(idata=idata)
-
-        if inplace:
-            return None
-        else:
-            return idata
-
-    def add_likelihood_parameters_to_idata(
-        self,
-        idata: az.InferenceData | None = None,
-        inplace: bool = False,
-    ) -> az.InferenceData | None:
-        """Add likelihood parameters to the InferenceData object.
-
-        Parameters
-        ----------
-        idata : az.InferenceData
-            The InferenceData object returned by HSSM.sample().
-        inplace : bool
-            If True, the likelihood parameters are added to idata in-place. Otherwise,
-            a copy of idata with the likelihood parameters added is returned.
-            Defaults to False.
-
-        Returns
-        -------
-        az.InferenceData | None
-            InferenceData or None
-        """
-        if idata is None:
-            if self._inference_obj is None:
-                raise ValueError("No idata provided and model not yet sampled!")
-            else:
-                idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
-                    deepcopy(self._inference_obj)
-                    if not inplace
-                    else self._inference_obj
-                )
-        else:
-            idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
-                deepcopy(idata) if not inplace else idata
-            )
-        return idata
-
-    def sample_posterior_predictive(
-        self,
-        idata: az.InferenceData | None = None,
-        data: pd.DataFrame | None = None,
-        inplace: bool = True,
-        include_group_specific: bool = True,
-        kind: Literal["response", "response_params"] = "response",
-        draws: int | float | list[int] | np.ndarray | None = None,
-        safe_mode: bool = True,
-    ) -> az.InferenceData | None:
-        """Perform posterior predictive sampling from the HSSM model.
-
-        Parameters
-        ----------
-        idata : optional
-            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
-            the `InferenceData` from the last time `sample()` is called will be used.
-        data : optional
-            An optional data frame with values for the predictors that are used to
-            obtain out-of-sample predictions. If omitted, the original dataset is used.
-        inplace : optional
-            If `True` will modify idata in-place and append a `posterior_predictive`
-            group to `idata`. Otherwise, it will return a copy of idata with the
-            predictions added, by default True.
-        include_group_specific : optional
-            If `True` will make predictions including the group specific effects.
-            Otherwise, predictions are made with common effects only (i.e. group-
-            specific are set to zero), by default True.
-        kind: optional
-            Indicates the type of prediction required. Can be `"response_params"` or
-            `"response"`. The first returns draws from the posterior distribution of the
-            likelihood parameters, while the latter returns the draws from the posterior
-            predictive distribution (i.e. the posterior probability distribution for a
-            new observation) in addition to the posterior distribution. Defaults to
-            "response_params".
-        draws: optional
-            The number of samples to draw from the posterior predictive distribution
-            from each chain.
-            When it's an integer >= 1, the number of samples to be extracted from the
-            `draw` dimension. If this integer is larger than the number of posterior
-            samples in each chain, all posterior samples will be used
-            in posterior predictive sampling. When a float between 0 and 1, the
-            proportion of samples from the draw dimension from each chain to be used in
-            posterior predictive sampling.. If this proportion is very
-            small, at least one sample will be used. When None, all posterior samples
-            will be used. Defaults to None.
-        safe_mode: bool
-            If True, the function will split the draws into chunks of 10 to avoid memory
-            issues. Defaults to True.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet and idata is not provided.
-
-        Returns
-        -------
-        az.InferenceData | None
-            InferenceData or None
-        """
-        if idata is None:
-            if self._inference_obj is None:
-                raise ValueError(
-                    "The model has not been sampled yet. "
-                    + "Please either provide an idata object or sample the model first."
-                )
-            idata = self._inference_obj
-            _logger.info(
-                "idata=None, we use the traces assigned to the HSSM object as idata."
-            )
-
-        if idata is not None:
-            if "posterior_predictive" in idata.groups():
-                del idata["posterior_predictive"]
-                _logger.warning(
-                    "pre-existing posterior_predictive group deleted from idata. \n"
-                )
-
-        if self._check_extra_fields(data):
-            self._update_extra_fields(data)
-
-        if isinstance(draws, np.ndarray):
-            draws = draws.astype(int)
-        elif isinstance(draws, list):
-            draws = np.array(draws).astype(int)
-        elif isinstance(draws, int | float):
-            draws = np.arange(int(draws))
-        elif draws is None:
-            draws = idata["posterior"].draw.values
-        else:
-            raise ValueError(
-                "draws must be an integer, " + "a list of integers, or a numpy array."
-            )
-
-        assert isinstance(draws, np.ndarray)
-
-        # Make a copy of idata, set the `posterior` group to be a random sub-sample
-        # of the original (draw dimension gets sub-sampled)
-
-        idata_copy = idata.copy()
-
-        if (draws.shape != idata["posterior"].draw.values.shape) or (
-            (draws.shape == idata["posterior"].draw.values.shape)
-            and not np.allclose(draws, idata["posterior"].draw.values)
-        ):
-            # Reassign posterior to sub-sampled version
-            setattr(idata_copy, "posterior", idata["posterior"].isel(draw=draws))
-
-        if kind == "response":
-            # If we run kind == 'response' we actually run the observation RV
-            if safe_mode:
-                # safe mode splits the draws into chunks of 10 to avoid
-                # memory issues (TODO: Figure out the source of memory issues)
-                split_draws = _split_array(
-                    idata_copy["posterior"].draw.values, divisor=10
-                )
-
-                posterior_predictive_list = []
-                for samples_tmp in split_draws:
-                    tmp_posterior = idata["posterior"].sel(draw=samples_tmp)
-                    setattr(idata_copy, "posterior", tmp_posterior)
-                    self.model.predict(
-                        idata_copy, kind, data, True, include_group_specific
-                    )
-                    posterior_predictive_list.append(idata_copy["posterior_predictive"])
-
-                if inplace:
-                    idata.add_groups(
-                        posterior_predictive=xr.concat(
-                            posterior_predictive_list, dim="draw"
-                        )
-                    )
-                    # for inplace, we don't return anything
-                    return None
-                else:
-                    # Reassign original posterior to idata_copy
-                    setattr(idata_copy, "posterior", idata["posterior"])
-                    # Add new posterior predictive group to idata_copy
-                    del idata_copy["posterior_predictive"]
-                    idata_copy.add_groups(
-                        posterior_predictive=xr.concat(
-                            posterior_predictive_list, dim="draw"
-                        )
-                    )
-                    return idata_copy
-            else:
-                if inplace:
-                    # If not safe-mode
-                    # We call .predict() directly without any
-                    # chunking of data.
-
-                    # .predict() is called on the copy of idata
-                    # since we still subsampled (or assigned) the draws
-                    self.model.predict(
-                        idata_copy, kind, data, True, include_group_specific
-                    )
-
-                    # posterior predictive group added to idata
-                    idata.add_groups(
-                        posterior_predictive=idata_copy["posterior_predictive"]
-                    )
-                    # don't return anything if inplace
-                    return None
-                else:
-                    # Not safe mode and not inplace
-                    # Function acts as very thin wrapper around
-                    # .predict(). It just operates on the
-                    # idata_copy object
-                    return self.model.predict(
-                        idata_copy, kind, data, False, include_group_specific
-                    )
-        elif kind == "response_params":
-            # If kind == 'response_params', we don't need to run the RV directly,
-            # there shouldn't really be any significant memory issues here,
-            # we can simply ignore settings, since the computational overhead
-            # should be very small --> nudges user towards good outputs.
-            _logger.warning(
-                "The kind argument is set to 'mean', but 'draws' argument "
-                + "is not None: The draws argument will be ignored!"
-            )
-            return self.model.predict(
-                idata, kind, data, inplace, include_group_specific
-            )
-        else:
-            raise ValueError("`kind` must be either 'response' or 'response_params'.")
-
-    def plot_predictive(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
-        """Produce a posterior predictive plot.
-
-        Equivalent to calling `hssm.plotting.plot_predictive()` with the
-        model. Please see that function for
-        [full documentation][hssm.plotting.plot_predictive].
-
-        Returns
-        -------
-        mpl.axes.Axes | sns.FacetGrid
-            The matplotlib axis or seaborn FacetGrid object containing the plot.
-        """
-        return plotting.plot_predictive(self, **kwargs)
-
-    def plot_quantile_probability(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
-        """Produce a quantile probability plot.
-
-        Equivalent to calling `hssm.plotting.plot_quantile_probability()` with the
-        model. Please see that function for
-        [full documentation][hssm.plotting.plot_quantile_probability].
-
-        Returns
-        -------
-        mpl.axes.Axes | sns.FacetGrid
-            The matplotlib axis or seaborn FacetGrid object containing the plot.
-        """
-        return plotting.plot_quantile_probability(self, **kwargs)
-
-    def predict(self, **kwargs) -> az.InferenceData:
-        """Generate samples from the predictive distribution."""
-        return self.model.predict(**kwargs)
-
-    def sample_do(
-        self, params: dict[str, Any], draws: int = 100, return_model=False, **kwargs
-    ) -> az.InferenceData | tuple[az.InferenceData, pm.Model]:
-        """Generate samples from the predictive distribution using the `do-operator`."""
-        do_model = do(self.pymc_model, params)
-        do_idata = pm.sample_prior_predictive(model=do_model, draws=draws, **kwargs)
-
-        # clean up `rt,response_mean` to `v`
-        do_idata = self._drop_parent_str_from_idata(idata=do_idata)
-
-        # rename otherwise inconsistent dims and coords
-        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].dims:
-            setattr(
-                do_idata,
-                "prior_predictive",
-                do_idata["prior_predictive"].rename_dims(
-                    {"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].coords:
-            setattr(
-                do_idata,
-                "prior_predictive",
-                do_idata["prior_predictive"].rename_vars(
-                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-
-        if return_model:
-            return do_idata, do_model
-        return do_idata
-
-    def sample_prior_predictive(
-        self,
-        draws: int = 500,
-        var_names: str | list[str] | None = None,
-        omit_offsets: bool = True,
-        random_seed: np.random.Generator | None = None,
-    ) -> az.InferenceData:
-        """Generate samples from the prior predictive distribution.
-
-        Parameters
-        ----------
-        draws
-            Number of draws to sample from the prior predictive distribution. Defaults
-            to 500.
-        var_names
-            A list of names of variables for which to compute the prior predictive
-            distribution. Defaults to ``None`` which means both observed and unobserved
-            RVs.
-        omit_offsets
-            Whether to omit offset terms. Defaults to ``True``.
-        random_seed
-            Seed for the random number generator.
-
-        Returns
-        -------
-        az.InferenceData
-            ``InferenceData`` object with the groups ``prior``, ``prior_predictive`` and
-            ``observed_data``.
-        """
-        prior_predictive = self.model.prior_predictive(
-            draws, var_names, omit_offsets, random_seed
-        )
-
-        # AF-COMMENT: Not sure if necessary to include the
-        # mean prior here (which adds deterministics that
-        # could be recomputed elsewhere)
-        prior_predictive.add_groups(posterior=prior_predictive.prior)
-        # Bambi >= 0.17 renamed kind="mean" to kind="response_params".
-        self.model.predict(prior_predictive, kind="response_params", inplace=True)
-
-        # clean
-        setattr(prior_predictive, "prior", prior_predictive["posterior"])
-        del prior_predictive["posterior"]
-
-        if self._inference_obj is None:
-            self._inference_obj = prior_predictive
-        else:
-            self._inference_obj.extend(prior_predictive)
-
-        # clean up `rt,response_mean` to `v`
-        idata = self._drop_parent_str_from_idata(idata=self._inference_obj)
-
-        # rename otherwise inconsistent dims and coords
-        if "rt,response_extra_dim_0" in idata["prior_predictive"].dims:
-            setattr(
-                idata,
-                "prior_predictive",
-                idata["prior_predictive"].rename_dims(
-                    {"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-        if "rt,response_extra_dim_0" in idata["prior_predictive"].coords:
-            setattr(
-                idata,
-                "prior_predictive",
-                idata["prior_predictive"].rename_vars(
-                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-
-        # Update self._inference_obj to match the cleaned idata
-        self._inference_obj = idata
-        return deepcopy(self._inference_obj)
-
-    @property
-    def pymc_model(self) -> pm.Model:
-        """Provide access to the PyMC model.
-
-        Returns
-        -------
-        pm.Model
-            The PyMC model built by bambi
-        """
-        return self.model.backend.model
-
-    def set_alias(self, aliases: dict[str, str | dict]):
-        """Set parameter aliases.
-
-        Sets the aliases according to the dictionary passed to it and rebuild the
-        model.
-
-        Parameters
-        ----------
-        aliases
-            A dict specifying the parameter names being aliased and the aliases.
-        """
-        self.model.set_alias(aliases)
-        self.model.build()
-
-    @property
-    def response_c(self) -> str:
-        """Return the response variable names in c() format."""
-        if self.response is None:
-            return "c()"
-        return f"c({', '.join(self.response)})"
-
-    @property
-    def response_str(self) -> str:
-        """Return the response variable names in string format."""
-        if self.response is None:
-            return ""
-        return ",".join(self.response)
-
-    # NOTE: can't annotate return type because the graphviz dependency is optional
-    def graph(self, formatting="plain", name=None, figsize=None, dpi=300, fmt="png"):
-        """Produce a graphviz Digraph from a built HSSM model.
-
-        Requires graphviz, which may be installed most easily with `conda install -c
-        conda-forge python-graphviz`. Alternatively, you may install the `graphviz`
-        binaries yourself, and then `pip install graphviz` to get the python bindings.
-        See http://graphviz.readthedocs.io/en/stable/manual.html for more information.
-
-        Parameters
-        ----------
-        formatting
-            One of `"plain"` or `"plain_with_params"`. Defaults to `"plain"`.
-        name
-            Name of the figure to save. Defaults to `None`, no figure is saved.
-        figsize
-            Maximum width and height of figure in inches. Defaults to `None`, the
-            figure size is set automatically. If defined and the drawing is larger than
-            the given size, the drawing is uniformly scaled down so that it fits within
-            the given size.  Only works if `name` is not `None`.
-        dpi
-            Point per inch of the figure to save.
-            Defaults to 300. Only works if `name` is not `None`.
-        fmt
-            Format of the figure to save.
-            Defaults to `"png"`. Only works if `name` is not `None`.
-
-        Returns
-        -------
-        graphviz.Graph
-            The graph
-        """
-        graph = self.model.graph(formatting, name, figsize, dpi, fmt)
-
-        parent_param = self._parent_param
-        if parent_param.is_regression:
-            return graph
-
-        # Modify the graph
-        # 1. Remove all nodes and edges related to `{parent}_mean`:
-        graph.body = [
-            item for item in graph.body if f"{parent_param.name}_mean" not in item
-        ]
-        # 2. Add a new edge from parent to response
-        graph.edge(parent_param.name, self.response_str)
-
-        return graph
-
-    def compile_logp(self, keep_transformed: bool = False, **kwargs):
-        """Compile the log probability function for the model.
-
-        Parameters
-        ----------
-        keep_transformed : bool, optional
-            If True, keeps the transformed variables in the compiled function.
-            If False, removes value transforms before compilation.
-            Defaults to False.
-        **kwargs
-            Additional keyword arguments passed to PyMC's compile_logp:
-            - vars: List of variables. Defaults to None (all variables).
-            - jacobian: Whether to include log(|det(dP/dQ)|) term for
-            transformed variables. Defaults to True.
-            - sum: Whether to sum all terms instead of returning a vector.
-            Defaults to True.
-
-        Returns
-        -------
-        callable
-            A compiled function that computes the model log probability.
-        """
-        if keep_transformed:
-            return self.pymc_model.compile_logp(
-                vars=kwargs.get("vars", None),
-                jacobian=kwargs.get("jacobian", True),
-                sum=kwargs.get("sum", True),
-            )
-        else:
-            new_model = pm.model.transform.conditioning.remove_value_transforms(
-                self.pymc_model
-            )
-            return new_model.compile_logp(
-                vars=kwargs.get("vars", None),
-                jacobian=kwargs.get("jacobian", True),
-                sum=kwargs.get("sum", True),
-            )
-
-    def plot_trace(
-        self,
-        data: az.InferenceData | None = None,
-        include_deterministic: bool = False,
-        tight_layout: bool = True,
-        **kwargs,
-    ) -> None:
-        """Generate trace plot with ArviZ but with additional convenience features.
-
-        This is a simple wrapper for the az.plot_trace() function. By default, it
-        filters out the deterministic values from the plot. Please see the
-        [arviz documentation]
-        (https://arviz-devs.github.io/arviz/api/generated/arviz.plot_trace.html)
-        for additional parameters that can be specified.
-
-        Parameters
-        ----------
-        data : optional
-            An ArviZ InferenceData object. If None, the traces stored in the model will
-            be used.
-        include_deterministic : optional
-            Whether to include deterministic variables in the plot. Defaults to False.
-            Note that if include deterministic is set to False and and `var_names` is
-            provided, the `var_names` provided will be modified to also exclude the
-            deterministic values. If this is not desirable, set
-            `include deterministic` to True.
-        tight_layout : optional
-            Whether to call plt.tight_layout() after plotting. Defaults to True.
-        """
-        data = data or self.traces
-        if not isinstance(data, az.InferenceData):
-            raise TypeError("data must be an InferenceData object.")
-
-        if not include_deterministic:
-            var_names = list(
-                set([var.name for var in self.pymc_model.free_RVs]).intersection(
-                    set(list(data["posterior"].data_vars.keys()))
-                )
-            )
-            # var_names = self._get_deterministic_var_names(data)
-            if var_names:
-                if "var_names" in kwargs:
-                    if isinstance(kwargs["var_names"], str):
-                        if kwargs["var_names"] not in var_names:
-                            var_names.append(kwargs["var_names"])
-                        kwargs["var_names"] = var_names
-                    elif isinstance(kwargs["var_names"], list):
-                        kwargs["var_names"] = list(
-                            set(var_names) | set(kwargs["var_names"])
-                        )
-                    elif kwargs["var_names"] is None:
-                        kwargs["var_names"] = var_names
-                    else:
-                        raise ValueError(
-                            "`var_names` must be a string, a list of strings, or None."
-                        )
-                else:
-                    kwargs["var_names"] = var_names
-        az.plot_trace(data, **kwargs)
-
-        if tight_layout:
-            plt.tight_layout()
-
-    def summary(
-        self,
-        data: az.InferenceData | None = None,
-        include_deterministic: bool = False,
-        **kwargs,
-    ) -> pd.DataFrame | xr.Dataset:
-        """Produce a summary table with ArviZ but with additional convenience features.
-
-        This is a simple wrapper for the az.summary() function. By default, it
-        filters out the deterministic values from the plot. Please see the
-        [arviz documentation]
-        (https://arviz-devs.github.io/arviz/api/generated/arviz.summary.html)
-        for additional parameters that can be specified.
-
-        Parameters
-        ----------
-        data
-            An ArviZ InferenceData object. If None, the traces stored in the model will
-            be used.
-        include_deterministic : optional
-            Whether to include deterministic variables in the plot. Defaults to False.
-            Note that if include_deterministic is set to False and and `var_names` is
-            provided, the `var_names` provided will be modified to also exclude the
-            deterministic values. If this is not desirable, set
-            `include_deterministic` to True.
-
-        Returns
-        -------
-        pd.DataFrame | xr.Dataset
-            A pandas DataFrame or xarray Dataset containing the summary statistics.
-        """
-        data = data or self.traces
-        if not isinstance(data, az.InferenceData):
-            raise TypeError("data must be an InferenceData object.")
-
-        if not include_deterministic:
-            var_names = list(
-                set([var.name for var in self.pymc_model.free_RVs]).intersection(
-                    set(list(data["posterior"].data_vars.keys()))
-                )
-            )
-            # var_names = self._get_deterministic_var_names(data)
-            if var_names:
-                kwargs["var_names"] = list(set(var_names + kwargs.get("var_names", [])))
-        return az.summary(data, **kwargs)
-
-    def initial_point(self, transformed: bool = False) -> dict[str, np.ndarray]:
-        """Compute the initial point of the model.
-
-        This is a slightly altered version of pm.initial_point.initial_point().
-
-        Parameters
-        ----------
-        transformed : bool, optional
-            If True, return the initial point in transformed space.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the initial point of the model parameters.
-        """
-        fn = pm.initial_point.make_initial_point_fn(
-            model=self.pymc_model, return_transformed=transformed
-        )
-        return pm.model.Point(fn(None), model=self.pymc_model)
-
-    def restore_traces(
-        self, traces: az.InferenceData | pm.Approximation | str | PathLike
-    ) -> None:
-        """Restore traces from an InferenceData object or a .netcdf file.
-
-        Parameters
-        ----------
-        traces
-            An InferenceData object or a path to a file containing the traces.
-        """
-        if isinstance(traces, pm.Approximation):
-            self._inference_obj_vi = traces
-            return
-
-        if isinstance(traces, (str, PathLike)):
-            traces = az.from_netcdf(traces)
-        self._inference_obj = cast("az.InferenceData", traces)
-
-    def restore_vi_traces(
-        self, traces: az.InferenceData | pm.Approximation | str | PathLike
-    ) -> None:
-        """Restore VI traces from an InferenceData object or a .netcdf file.
-
-        Parameters
-        ----------
-        traces
-            An InferenceData object or a path to a file containing the VI traces.
-        """
-        if isinstance(traces, pm.Approximation):
-            self._inference_obj_vi = traces
-            return
-
-        if isinstance(traces, (str, PathLike)):
-            traces = az.from_netcdf(traces)
-        self._inference_obj_vi = cast("az.InferenceData", traces)
-
-    def save_model(
-        self,
-        model_name: str | None = None,
-        allow_absolute_base_path: bool = False,
-        base_path: str | Path = "hssm_models",
-        save_idata_only: bool = False,
-    ) -> None:
-        """Save a HSSM model instance and its inference results to disk.
-
-        Parameters
-        ----------
-        model : HSSM
-            The HSSM model instance to save
-        model_name : str | None
-            Name to use for the saved model files.
-            If None, will use model.model_name with timestamp
-        allow_absolute_base_path : bool
-            Whether to allow absolute paths for base_path
-        base_path : str | Path
-            Base directory to save model files in.
-            Must be relative path if allow_absolute_base_path=False
-        save_idata_only: bool = False,
-            Whether to save the model class instance itself
-
-        Raises
-        ------
-        ValueError
-            If base_path is absolute and allow_absolute_base_path=False
-        """
-        # check if base_path is absolute
-        if not allow_absolute_base_path:
-            if str(base_path).startswith("/"):
-                raise ValueError(
-                    "base_path must be a relative path"
-                    " if allow_absolute_base_path is False"
-                )
-
-        if model_name is None:
-            # Get date string format as suffix to model name
-            model_name = (
-                self.model_name
-                + "_"
-                + datetime.datetime.now().strftime("%Y_%m_%d_%H_%M_%S")
-            )
-
-        # check if folder by name model_name exists
-        model_name = model_name.replace(" ", "_")
-        model_path = Path(base_path).joinpath(model_name)
-        model_path.mkdir(parents=True, exist_ok=True)
-
-        # Save model to pickle file
-        if not save_idata_only:
-            with open(model_path.joinpath("model.pkl"), "wb") as f:
-                cpickle.dump(self, f)
-
-        # Save traces to netcdf file
-        if self._inference_obj is not None:
-            az.to_netcdf(self._inference_obj, model_path.joinpath("traces.nc"))
-
-        # Save vi_traces to netcdf file
-        if self._inference_obj_vi is not None:
-            az.to_netcdf(self._inference_obj_vi, model_path.joinpath("vi_traces.nc"))
-
-    @classmethod
-    def load_model(
-        cls, path: Union[str, Path]
-    ) -> Union["HSSM", dict[str, Optional[az.InferenceData]]]:
-        """Load a HSSM model instance and its inference results from disk.
-
-        Parameters
-        ----------
-        path : str | Path
-            Path to the model directory or model.pkl file. If a directory is provided,
-            will look for model.pkl, traces.nc and vi_traces.nc files within it.
-
-        Returns
-        -------
-        HSSM
-            The loaded HSSM model instance with inference results attached if available.
-        """
-        # Convert path to Path object
-        path = Path(path)
-
-        # If path points to a file, assume it's model.pkl
-        if path.is_file():
-            model_dir = path.parent
-            model_path = path
-        else:
-            # Path points to directory
-            model_dir = path
-            model_path = model_dir.joinpath("model.pkl")
-
-        # check if model_dir exists
-        if not model_dir.exists():
-            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
-
-        # check if model.pkl exists raise logging information if not
-        if not model_path.exists():
-            _logger.info(
-                f"model.pkl file does not exist in {model_dir}. "
-                "Attempting to load traces only."
-            )
-            if (not model_dir.joinpath("traces.nc").exists()) and (
-                not model_dir.joinpath("vi_traces.nc").exists()
-            ):
-                raise FileNotFoundError(f"No traces found in {model_dir}.")
-            else:
-                idata_dict = cls.load_model_idata(model_dir)
-                return idata_dict
-        else:
-            # Load model from pickle file
-            with open(model_path, "rb") as f:
-                model = cpickle.load(f)
-
-            # Load traces if they exist
-            traces_path = model_dir.joinpath("traces.nc")
-            if traces_path.exists():
-                model.restore_traces(traces_path)
-
-            # Load VI traces if they exist
-            vi_traces_path = model_dir.joinpath("vi_traces.nc")
-            if vi_traces_path.exists():
-                model.restore_vi_traces(vi_traces_path)
-        return model
-
-    @classmethod
-    def load_model_idata(cls, path: str | Path) -> dict[str, az.InferenceData | None]:
-        """Load the traces from a model directory.
-
-        Parameters
-        ----------
-        path : str | Path
-            Path to the model directory containing traces.nc and/or vi_traces.nc files.
-
-        Returns
-        -------
-        dict[str, az.InferenceData | None]
-            A dictionary with keys "idata_mcmc" and "idata_vi" containing the traces
-            from the model directory. If the traces do not exist, the corresponding
-            value will be None.
-        """
-        idata_dict: dict[str, az.InferenceData | None] = {}
-        model_dir = Path(path)
-        # check if path exists
-        if not model_dir.exists():
-            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
-
-        # check if traces.nc exists
-        traces_path = model_dir.joinpath("traces.nc")
-        if not traces_path.exists():
-            _logger.warning(f"traces.nc file does not exist in {model_dir}.")
-            idata_dict["idata_mcmc"] = None
-        else:
-            idata_dict["idata_mcmc"] = az.from_netcdf(traces_path)
-
-        # check if vi_traces.nc exists
-        vi_traces_path = model_dir.joinpath("vi_traces.nc")
-        if not vi_traces_path.exists():
-            _logger.warning(f"vi_traces.nc file does not exist in {model_dir}.")
-            idata_dict["idata_vi"] = None
-        else:
-            idata_dict["idata_vi"] = az.from_netcdf(vi_traces_path)
-
-        return idata_dict
-
-    def __getstate__(self):
-        """Get the state of the model for pickling.
-
-        This method is called when pickling the model.
-        It returns a dictionary containing the constructor
-        arguments needed to recreate the model instance.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the constructor arguments
-            under the key 'constructor_args'.
-        """
-        state = {"constructor_args": self._init_args}
-        return state
-
-    def __setstate__(self, state):
-        """Set the state of the model when unpickling.
-
-        This method is called when unpickling the model. It creates a new instance
-        of HSSM using the constructor arguments stored in the state dictionary,
-        and copies its attributes to the current instance.
-
-        Parameters
-        ----------
-        state : dict
-            A dictionary containing the constructor arguments under the key
-            'constructor_args'.
-        """
-        new_instance = HSSM(**state["constructor_args"])
-        self.__dict__ = new_instance.__dict__
-
-    def __repr__(self) -> str:
-        """Create a representation of the model."""
-        output = [
-            "Hierarchical Sequential Sampling Model",
-            f"Model: {self.model_name}\n",
-            f"Response variable: {self.response_str}",
-            f"Likelihood: {self.loglik_kind}",
-            f"Observations: {len(self.data)}\n",
-            "Parameters:\n",
-        ]
-
-        for param in self.params.values():
-            if param.name == "p_outlier":
-                continue
-            output.append(f"{param.name}:")
-
-            component = self.model.components[param.name]
-
-            # Regression case:
-            if param.is_regression:
-                assert isinstance(component, DistributionalComponent)
-                output.append(f"    Formula: {param.formula}")
-                output.append("    Priors:")
-                intercept_term = component.intercept_term
-                if intercept_term is not None:
-                    output.append(_print_prior(intercept_term))
-                for _, common_term in component.common_terms.items():
-                    output.append(_print_prior(common_term))
-                for _, group_specific_term in component.group_specific_terms.items():
-                    output.append(_print_prior(group_specific_term))
-                output.append(f"    Link: {param.link}")
-            # None regression case
-            else:
-                if param.prior is None:
-                    prior = (
-                        component.intercept_term.prior
-                        if param.is_parent
-                        else component.prior
-                    )
-                else:
-                    prior = param.prior
-                output.append(f"    Prior: {prior}")
-            output.append(f"    Explicit bounds: {param.bounds}")
-            output.append(
-                " (ignored due to link function)"
-                if self.link_settings is not None
-                else ""
-            )
-
-        # TODO: Handle p_outlier regression correctly here.
-        if self.p_outlier is not None:
-            output.append("")
-            output.append(f"Lapse probability: {self.p_outlier.prior}")
-            output.append(f"Lapse distribution: {self.lapse}")
-
-        return "\n".join(output)
-
-    def __str__(self) -> str:
-        """Create a string representation of the model."""
-        return self.__repr__()
-
-    @property
-    def traces(self) -> az.InferenceData | pm.Approximation:
-        """Return the trace of the model after sampling.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        az.InferenceData | pm.Approximation
-            The trace of the model after the last call to `sample()`.
-        """
-        if not self._inference_obj:
-            raise ValueError("Please sample the model first.")
-
-        return self._inference_obj
-
-    @property
-    def vi_idata(self) -> az.InferenceData:
-        """Return the variational inference approximation object.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        az.InferenceData
-            The variational inference approximation object.
-        """
-        if not self._inference_obj_vi:
-            raise ValueError(
-                "Please run variational inference first, "
-                "no variational posterior attached."
-            )
-
-        return self._inference_obj_vi
-
-    @property
-    def vi_approx(self) -> pm.Approximation:
-        """Return the variational inference approximation object.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        pm.Approximation
-            The variational inference approximation object.
-        """
-        if not self._vi_approx:
-            raise ValueError(
-                "Please run variational inference first, "
-                "no variational approximation attached."
-            )
-
-        return self._vi_approx
-
-    @property
-    def map(self) -> dict:
-        """Return the MAP estimates of the model parameters.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the MAP estimates of the model parameters.
-        """
-        if not self._map_dict:
-            raise ValueError("Please compute map first.")
-
-        return self._map_dict
-
-    @property
-    def initvals(self) -> dict:
-        """Return the initial values of the model parameters for sampling.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the initial values of the model parameters.
-            This dict serves as the default for initial values, and can be passed
-            directly to the `.sample()` function.
-        """
-        if self._initvals == {}:
-            self._initvals = self.initial_point()
-        return self._initvals
-
-    def _check_lapse(self, lapse):
-        """Determine if p_outlier and lapse is specified correctly."""
-        # Basically, avoid situations where only one of them is specified.
-        if self.has_lapse and lapse is None:
-            raise ValueError(
-                "You have specified `p_outlier`. Please also specify `lapse`."
-            )
-        if lapse is not None and not self.has_lapse:
-            _logger.warning(
-                "You have specified the `lapse` argument to include a lapse "
-                + "distribution, but `p_outlier` is set to either 0 or None. "
-                + "Your lapse distribution will be ignored."
-            )
-        if "p_outlier" in self.list_params and self.list_params[-1] != "p_outlier":
-            raise ValueError(
-                "Please do not include 'p_outlier' in `list_params`. "
-                + "We automatically append it to `list_params` when `p_outlier` "
-                + "parameter is not None"
-            )
-
     def _make_model_distribution(self) -> type[pm.Distribution]:
         """Make a pm.Distribution for the model."""
-        ### Logic for different types of likelihoods:
+        # == Logic for different types of likelihoods:
         # -`analytical` and `blackbox`:
         #     loglik should be a `pm.Distribution`` or a Python callable (any arbitrary
         #     function).
@@ -2013,22 +255,30 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
         if isclass(self.loglik) and issubclass(self.loglik, pm.Distribution):
             return self.loglik
 
-        # params_is_trialwise_base: one entry per model param (excluding
-        # p_outlier). Used for graph-level broadcasting in logp() and
-        # make_distribution, where dist_params does not include extra_fields.
-        params_is_trialwise_base = [
-            param.is_trialwise
+        # Type narrowing: loglik and list_params should be set by this point
+        if self.loglik is None:
+            raise ValueError(
+                "Likelihood function (loglik) has not been set. "
+                "This should have been configured during model initialization."
+            )
+        if self.list_params is None:
+            raise ValueError(
+                "list_params has not been set. "
+                "This should have been validated during model initialization."
+            )
+        if self.loglik_kind is None:
+            raise ValueError(
+                "Likelihood kind (loglik_kind) has not been set. "
+                "This should have been configured during model initialization."
+            )
+
+        params_is_reg = [
+            param.is_vector
             for param_name, param in self.params.items()
             if param_name != "p_outlier"
         ]
-
-        # params_is_trialwise: extends the base list with extra_fields
-        # (always trialwise). Used for vmap construction in
-        # make_likelihood_callable and for assemble_callables, where
-        # dist_params includes extra_fields flattened in.
-        params_is_trialwise = list(params_is_trialwise_base)
         if self.extra_fields is not None:
-            params_is_trialwise += [True for _ in self.extra_fields]
+            params_is_reg += [True for _ in self.extra_fields]
 
         if self.loglik_kind == "approx_differentiable":
             if self.model_config.backend == "jax":
@@ -2036,7 +286,7 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                     loglik=self.loglik,
                     loglik_kind="approx_differentiable",
                     backend="jax",
-                    params_is_reg=params_is_trialwise,
+                    params_is_reg=params_is_reg,
                 )
             else:
                 likelihood_callable = make_likelihood_callable(
@@ -2076,7 +326,7 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                 else self.model_config.backend
             )
             missing_data_callable = make_missing_data_callable(
-                self.loglik_missing_data, backend_tmp, params_is_trialwise, params_only
+                self.loglik_missing_data, backend_tmp, params_is_reg, params_only
             )
 
             self.loglik_missing_data = missing_data_callable
@@ -2086,7 +336,6 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                 self.loglik_missing_data,
                 params_only,
                 has_deadline=self.deadline,
-                params_is_trialwise=params_is_trialwise,
             )
 
         if self.missing_data:
@@ -2098,14 +347,6 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
             )
 
         self.data = _rearrange_data(self.data)
-
-        # Collect fixed-vector params to substitute in the distribution logp
-        fixed_vector_params = {
-            name: param.prior
-            for name, param in self.params.items()
-            if isinstance(param.prior, np.ndarray)
-        }
-
         return make_distribution(
             rv=self.model_config.rv or self.model_name,
             loglik=self.loglik,
@@ -2117,258 +358,4 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                 if not self.extra_fields
                 else [deepcopy(self.data[field].values) for field in self.extra_fields]
             ),
-            fixed_vector_params=fixed_vector_params if fixed_vector_params else None,
-            params_is_trialwise=params_is_trialwise_base,
         )
-
-    def _get_deterministic_var_names(self, idata) -> list[str]:
-        """Filter out the deterministic variables in var_names."""
-        var_names = [
-            f"~{param_name}"
-            for param_name, param in self.params.items()
-            if (param.is_regression)
-        ]
-
-        if f"{self._parent}_mean" in idata["posterior"].data_vars:
-            var_names.append(f"~{self._parent}_mean")
-
-        # Parent parameters (always regression implicitly)
-        # which don't have a formula attached
-        # should be dropped from var_names, since the actual
-        # parent name shows up as a regression.
-        if f"{self._parent}" in idata["posterior"].data_vars:
-            if self.params[self._parent].formula is None:
-                # Drop from var_names
-                var_names = [var for var in var_names if var != f"~{self._parent}"]
-
-        return var_names
-
-    def _drop_parent_str_from_idata(
-        self, idata: az.InferenceData | None
-    ) -> az.InferenceData:
-        """Drop the parent_str variable from an InferenceData object.
-
-        Parameters
-        ----------
-        idata
-            The InferenceData object to be modified.
-
-        Returns
-        -------
-        xr.Dataset
-            The modified InferenceData object.
-        """
-        if idata is None:
-            raise ValueError("Please provide an InferenceData object.")
-        else:
-            for group in idata.groups():
-                if ("rt,response_mean" in idata[group].data_vars) and (
-                    self._parent not in idata[group].data_vars
-                ):
-                    setattr(
-                        idata,
-                        group,
-                        idata[group].rename({"rt,response_mean": self._parent}),
-                    )
-            return idata
-
-    def _postprocess_initvals_deterministic(
-        self, initval_settings: dict = INITVAL_SETTINGS
-    ) -> None:
-        """Set initial values for subset of parameters."""
-        self._initvals = self.initial_point()
-        # Consider case where link functions are set to 'log_logit'
-        # or 'None'
-        if self.link_settings not in ["log_logit", None]:
-            _logger.info(
-                "Not preprocessing initial values, "
-                + "because none of the two standard link settings are chosen!"
-            )
-            return None
-
-        # Set initial values for particular parameters
-        for name_, starting_value in self.pymc_model.initial_point().items():
-            # strip name of `_log__` and `_interval__` suffixes
-            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
-
-            # We need to check if the parameter is actually backed by
-            # a regression.
-
-            # If not, we don't actually apply a link function to it as per default.
-            # Therefore we need to apply the initial value strategy corresponding
-            # to 'None' link function.
-
-            # If the user actively supplies a link function, the user
-            # should also have supplied an initial value insofar it matters.
-
-            if self.params[self._get_prefix(name_tmp)].is_regression:
-                param_link_setting = self.link_settings
-            else:
-                param_link_setting = None
-            if name_tmp in initval_settings[param_link_setting].keys():
-                if self._check_if_initval_user_supplied(name_tmp):
-                    _logger.info(
-                        "User supplied initial value detected for %s, \n"
-                        " skipping overwrite with default value.",
-                        name_tmp,
-                    )
-                    continue
-
-                # Apply specific settings from initval_settings dictionary
-                dtype = self._initvals[name_tmp].dtype
-                self._initvals[name_tmp] = np.array(
-                    initval_settings[param_link_setting][name_tmp]
-                ).astype(dtype)
-
-    def _get_prefix(self, name_str: str) -> str:
-        """Get parameters wise link setting function from parameter prefix."""
-        # `p_outlier` is the only basic parameter floating around that has
-        # an underscore in it's name.
-        # We need to handle it separately. (Renaming might be better...)
-        if "_" in name_str:
-            if "p_outlier" not in name_str:
-                name_str_prefix = name_str.split("_")[0]
-            else:
-                name_str_prefix = "p_outlier"
-        else:
-            name_str_prefix = name_str
-        return name_str_prefix
-
-    def _check_if_initval_user_supplied(
-        self,
-        name_str: str,
-        return_value: bool = False,
-    ) -> bool | float | int | np.ndarray | dict[str, Any] | None:
-        """Check if initial value is user-supplied."""
-        # The function assumes that the name_str is either raw parameter name
-        # or `paramname_Intercept`, because we only really provide special default
-        # initial values for those types of parameters
-
-        # `p_outlier` is the only basic parameter floating around that has
-        # an underscore in it's name.
-        # We need to handle it separately. (Renaming might be better...)
-        if "_" in name_str:
-            if "p_outlier" not in name_str:
-                name_str_prefix = name_str.split("_")[0]
-                # name_str_suffix = "".join(name_str.split("_")[1:])
-                name_str_suffix = name_str[len(name_str_prefix + "_") :]
-            else:
-                name_str_prefix = "p_outlier"
-                if name_str == "p_outlier":
-                    name_str_suffix = ""
-                else:
-                    # name_str_suffix = "".join(name_str.split("_")[2:])
-                    name_str_suffix = name_str[len("p_outlier_") :]
-        else:
-            name_str_prefix = name_str
-            name_str_suffix = ""
-
-        tmp_param = name_str_prefix
-        if tmp_param == self._parent:
-            # If the parameter was parent it is automatically treated as a
-            # regression.
-            if not name_str_suffix:
-                # No suffix --> Intercept
-                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
-                    args_tmp = getattr(prior_tmp["Intercept"], "args")
-                    if return_value:
-                        return args_tmp.get("initval", None)
-                    else:
-                        return "initval" in args_tmp
-                else:
-                    if return_value:
-                        return None
-                    return False
-            else:
-                # If the parameter has a suffix --> use it
-                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
-                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
-                    if return_value:
-                        return args_tmp.get("initval", None)
-                    else:
-                        return "initval" in args_tmp
-                else:
-                    if return_value:
-                        return None
-                    else:
-                        return False
-        else:
-            # If the parameter is not a parent, it is treated as a regression
-            # only when actively specified as such.
-            if not name_str_suffix:
-                # If no suffix --> treat as basic parameter.
-                if isinstance(self.params[tmp_param].prior, float) or isinstance(
-                    self.params[tmp_param].prior, np.ndarray
-                ):
-                    if return_value:
-                        return self.params[tmp_param].prior
-                    else:
-                        return True
-                elif isinstance(self.params[tmp_param].prior, bmb.Prior):
-                    args_tmp = getattr(self.params[tmp_param].prior, "args")
-                    if "initval" in args_tmp:
-                        if return_value:
-                            return args_tmp["initval"]
-                        else:
-                            return True
-                    else:
-                        if return_value:
-                            return None
-                        else:
-                            return False
-                else:
-                    if return_value:
-                        return None
-                    else:
-                        return False
-            else:
-                # If suffix --> treat as regression and use suffix
-                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
-                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
-                    if return_value:
-                        return args_tmp.get("initval", None)
-                    else:
-                        return "initval" in args_tmp
-                else:
-                    if return_value:
-                        return None
-                    else:
-                        return False
-
-    def _jitter_initvals(
-        self, jitter_epsilon: float = 0.01, vector_only: bool = False
-    ) -> None:
-        """Apply controlled jitter to initial values."""
-        if vector_only:
-            self.__jitter_initvals_vector_only(jitter_epsilon)
-        else:
-            self.__jitter_initvals_all(jitter_epsilon)
-
-    def __jitter_initvals_vector_only(self, jitter_epsilon: float) -> None:
-        # Note: Calling our initial point function here
-        # --> operate on untransformed variables
-        initial_point_dict = self.initvals
-        for name_, starting_value in initial_point_dict.items():
-            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
-            if starting_value.ndim != 0 and starting_value.shape[0] != 1:
-                starting_value_tmp = starting_value + np.random.uniform(
-                    -jitter_epsilon, jitter_epsilon, starting_value.shape
-                ).astype(np.float32)
-
-                # Note: self._initvals shouldn't be None when this is called
-                dtype = self._initvals[name_tmp].dtype
-                self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)
-
-    def __jitter_initvals_all(self, jitter_epsilon: float) -> None:
-        # Note: Calling our initial point function here
-        # --> operate on untransformed variables
-        initial_point_dict = self.initvals
-        # initial_point_dict = self.pymc_model.initial_point()
-        for name_, starting_value in initial_point_dict.items():
-            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
-            starting_value_tmp = starting_value + np.random.uniform(
-                -jitter_epsilon, jitter_epsilon, starting_value.shape
-            ).astype(np.float32)
-
-            dtype = self.initvals[name_tmp].dtype
-            self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)

From 6633d14de6318850034e3c5a90465bfc8b057662 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 13 Feb 2026 16:32:47 -0500
Subject: [PATCH 089/104] Cast choices to list

---
 src/hssm/base.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index ad75d3307..c7049583b 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -333,7 +333,7 @@ def __init__(
         # region ===== Set up shortcuts so old code will work ======
         self.response = self.model_config.response
         self.list_params = self.model_config.list_params
-        self.choices = self.model_config.choices
+        self.choices = list(self.model_config.choices)
         self.model_name = self.model_config.model_name
         self.loglik = self.model_config.loglik
         self.loglik_kind = self.model_config.loglik_kind

From 78ac213871ef802a8efe446bffce6d7075e63934 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Fri, 13 Feb 2026 16:39:24 -0500
Subject: [PATCH 090/104] Fix response assertion in test_from_defaults to use
 list instead of tuple

---
 tests/test_config.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_config.py b/tests/test_config.py
index 47c0b4f91..558f83a50 100644
--- a/tests/test_config.py
+++ b/tests/test_config.py
@@ -12,7 +12,7 @@ def test_from_defaults():
     config1 = Config.from_defaults("ddm", "analytical")
 
     assert config1.model_name == "ddm"
-    assert config1.response == ("rt", "response")
+    assert config1.response == ["rt", "response"]
     assert config1.list_params == ["v", "a", "z", "t"]
     assert config1.loglik_kind == "analytical"
     assert config1.loglik is not None

From 55b28bccfbc607de24504589bb68445d4568f083 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 17 Feb 2026 11:24:11 -0500
Subject: [PATCH 091/104] Refactor HSSM class to improve parameter handling in
 likelihood and distribution functions

---
 src/hssm/base.py   |  3 +--
 src/hssm/config.py |  2 +-
 src/hssm/hssm.py   | 31 ++++++++++++++++++++++++++-----
 3 files changed, 28 insertions(+), 8 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 2f973e6f4..30ea75fc8 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -291,7 +291,6 @@ def __init__(
         initval_jitter: float = INITVAL_JITTER_SETTINGS["jitter_epsilon"],
         **kwargs,
     ):
-
         # ===== init args for save/load models =====
         self._init_args = {
             k: v for k, v in locals().items() if k not in ["self", "kwargs"]
@@ -339,7 +338,7 @@ def __init__(
             else None
         )
         self.list_params = self.model_config.list_params
-        self.choices = list(self.model_config.choices)
+        self.choices = self.model_config.choices  # type: ignore[assignment]
         self.model_name = self.model_config.model_name
         self.loglik = self.model_config.loglik
         self.loglik_kind = self.model_config.loglik_kind
diff --git a/src/hssm/config.py b/src/hssm/config.py
index 432ccc140..1e842f331 100644
--- a/src/hssm/config.py
+++ b/src/hssm/config.py
@@ -216,7 +216,7 @@ def update_config(self, user_config: ModelConfig) -> None:
             User specified ModelConfig used update self.
         """
         if user_config.response is not None:
-            self.response = user_config.response
+            self.response = list(user_config.response)  # type: ignore[assignment]
         if user_config.list_params is not None:
             self.list_params = user_config.list_params
         if user_config.choices is not None:
diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index ed29c7425..400f2f515 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -11,6 +11,7 @@
 from inspect import isclass
 from typing import Literal
 
+import numpy as np
 import pymc as pm
 
 from hssm.base import HSSMBase
@@ -272,13 +273,22 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                 "This should have been configured during model initialization."
             )
 
-        params_is_reg = [
-            param.is_vector
+        # params_is_trialwise_base: one entry per model param (excluding
+        # p_outlier). Used for graph-level broadcasting in logp() and
+        # make_distribution, where dist_params does not include extra_fields.
+        params_is_trialwise_base = [
+            param.is_trialwise
             for param_name, param in self.params.items()
             if param_name != "p_outlier"
         ]
+
+        # params_is_trialwise: extends the base list with extra_fields
+        # (always trialwise). Used for vmap construction in
+        # make_likelihood_callable and for assemble_callables, where
+        # dist_params includes extra_fields flattened in.
+        params_is_trialwise = list(params_is_trialwise_base)
         if self.extra_fields is not None:
-            params_is_reg += [True for _ in self.extra_fields]
+            params_is_trialwise += [True for _ in self.extra_fields]
 
         if self.loglik_kind == "approx_differentiable":
             if self.model_config.backend == "jax":
@@ -286,7 +296,7 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                     loglik=self.loglik,
                     loglik_kind="approx_differentiable",
                     backend="jax",
-                    params_is_reg=params_is_reg,
+                    params_is_reg=params_is_trialwise,
                 )
             else:
                 likelihood_callable = make_likelihood_callable(
@@ -326,7 +336,7 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                 else self.model_config.backend
             )
             missing_data_callable = make_missing_data_callable(
-                self.loglik_missing_data, backend_tmp, params_is_reg, params_only
+                self.loglik_missing_data, backend_tmp, params_is_trialwise, params_only
             )
 
             self.loglik_missing_data = missing_data_callable
@@ -336,6 +346,7 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                 self.loglik_missing_data,
                 params_only,
                 has_deadline=self.deadline,
+                params_is_trialwise=params_is_trialwise,
             )
 
         if self.missing_data:
@@ -347,6 +358,14 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
             )
 
         self.data = _rearrange_data(self.data)
+
+        # Collect fixed-vector params to substitute in the distribution logp
+        fixed_vector_params = {
+            name: param.prior
+            for name, param in self.params.items()
+            if isinstance(param.prior, np.ndarray)
+        }
+
         return make_distribution(
             rv=self.model_config.rv or self.model_name,
             loglik=self.loglik,
@@ -358,4 +377,6 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
                 if not self.extra_fields
                 else [deepcopy(self.data[field].values) for field in self.extra_fields]
             ),
+            fixed_vector_params=fixed_vector_params if fixed_vector_params else None,
+            params_is_trialwise=params_is_trialwise_base,
         )

From 6ad0935c0480d8a4772c0cd7195f067b1d2007be Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 17 Feb 2026 11:36:28 -0500
Subject: [PATCH 092/104] Update response assertions in test_from_defaults to
 use lists instead of tuples

---
 tests/test_config.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/test_config.py b/tests/test_config.py
index 558f83a50..ba8429d06 100644
--- a/tests/test_config.py
+++ b/tests/test_config.py
@@ -23,7 +23,7 @@ def test_from_defaults():
     config2 = Config.from_defaults("angle", "analytical")
 
     assert config2.model_name == "angle"
-    assert config2.response == ("rt", "response")
+    assert config2.response == ["rt", "response"]
     assert config2.list_params == ["v", "a", "z", "t", "theta"]
     assert config2.loglik_kind == "analytical"
     assert config2.loglik is None
@@ -38,7 +38,7 @@ def test_from_defaults():
     # Case 4: No supported model, provided loglik_kind
     config4 = Config.from_defaults("custom", "analytical")
     assert config4.model_name == "custom"
-    assert config4.response == ("rt", "response")
+    assert config4.response == ["rt", "response"]
     assert config4.list_params is None
     assert config4.loglik_kind == "analytical"
     assert config4.loglik is None
@@ -52,7 +52,7 @@ def test_from_defaults():
 
 def test_update_config():
     config1 = Config.from_defaults("ddm", "analytical")
-    assert config1.response == ("rt", "response")
+    assert config1.response == ["rt", "response"]
 
     v_prior, v_bounds = config1.get_defaults("v")
 

From 7ac1d809aa35e689fb934d5ecdedc79839666908 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 17 Feb 2026 17:47:25 -0500
Subject: [PATCH 093/104] Restore hssm.py as in main

---
 src/hssm/hssm.py | 2036 +++++++++++++++++++++++++++++++++++++++++++++-
 1 file changed, 2014 insertions(+), 22 deletions(-)

diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 400f2f515..19508a342 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -6,29 +6,60 @@
 This file defines the entry class HSSM.
 """
 
+import datetime
 import logging
+import typing
 from copy import deepcopy
-from inspect import isclass
-from typing import Literal
+from inspect import isclass, signature
+from os import PathLike
+from pathlib import Path
+from typing import Any, Callable, Literal, Optional, Union, cast, get_args
 
+import arviz as az
+import bambi as bmb
+import cloudpickle as cpickle
+import matplotlib as mpl
+import matplotlib.pyplot as plt
 import numpy as np
+import pandas as pd
 import pymc as pm
+import pytensor
+import seaborn as sns
+import xarray as xr
+from bambi.model_components import DistributionalComponent
+from bambi.transformations import transformations_namespace
+from pymc.model.transform.conditioning import do
+from ssms.config import model_config as ssms_model_config
 
-from hssm.base import HSSMBase
+from hssm._types import LoglikKind, SupportedModels
+from hssm.data_validator import DataValidatorMixin
 from hssm.defaults import (
+    INITVAL_JITTER_SETTINGS,
+    INITVAL_SETTINGS,
     MissingDataNetwork,
     missing_data_networks_suffix,
 )
 from hssm.distribution_utils import (
     assemble_callables,
     make_distribution,
+    make_family,
     make_likelihood_callable,
     make_missing_data_callable,
 )
+from hssm.missing_data_mixin import MissingDataMixin
 from hssm.utils import (
+    _compute_log_likelihood,
+    _get_alias_dict,
+    _print_prior,
     _rearrange_data,
+    _split_array,
 )
 
+from . import plotting
+from .config import Config, ModelConfig
+from .param import Params
+from .param import UserParam as Param
+
 _logger = logging.getLogger("hssm")
 
 # NOTE: Temporary mapping from old sampler names to new ones in bambi 0.16.0
@@ -67,7 +98,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSM(HSSMBase):
+class HSSM(DataValidatorMixin, MissingDataMixin):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters
@@ -240,9 +271,1735 @@ class HSSM(HSSMBase):
         The jitter value for the initial values.
     """
 
+    def __init__(
+        self,
+        data: pd.DataFrame,
+        model: SupportedModels | str = "ddm",
+        choices: list[int] | None = None,
+        include: list[dict[str, Any] | Param] | None = None,
+        model_config: ModelConfig | dict | None = None,
+        loglik: (
+            str | PathLike | Callable | pytensor.graph.Op | type[pm.Distribution] | None
+        ) = None,
+        loglik_kind: LoglikKind | None = None,
+        p_outlier: float | dict | bmb.Prior | None = 0.05,
+        lapse: dict | bmb.Prior | None = bmb.Prior("Uniform", lower=0.0, upper=20.0),
+        global_formula: str | None = None,
+        link_settings: Literal["log_logit"] | None = None,
+        prior_settings: Literal["safe"] | None = "safe",
+        extra_namespace: dict[str, Any] | None = None,
+        missing_data: bool | float = False,
+        deadline: bool | str = False,
+        loglik_missing_data: (
+            str | PathLike | Callable | pytensor.graph.Op | None
+        ) = None,
+        process_initvals: bool = True,
+        initval_jitter: float = INITVAL_JITTER_SETTINGS["jitter_epsilon"],
+        **kwargs,
+    ):
+        # Attach arguments to the instance
+        # so that we can easily define some
+        # methods that need to access these
+        # arguments (context: pickling / save - load).
+
+        # Define a dict with all call arguments:
+        self._init_args = {
+            k: v for k, v in locals().items() if k not in ["self", "kwargs"]
+        }
+        if kwargs:
+            self._init_args.update(kwargs)
+
+        self.data = data.copy()
+        self._inference_obj: az.InferenceData | None = None
+        self._initvals: dict[str, Any] = {}
+        self.initval_jitter = initval_jitter
+        self._inference_obj_vi: pm.Approximation | None = None
+        self._vi_approx = None
+        self._map_dict = None
+        self.global_formula = global_formula
+
+        self.link_settings = link_settings
+        self.prior_settings = prior_settings
+
+        self.missing_data_value = -999.0
+
+        additional_namespace = transformations_namespace.copy()
+        if extra_namespace is not None:
+            additional_namespace.update(extra_namespace)
+        self.additional_namespace = additional_namespace
+
+        # Construct a model_config from defaults
+        self.model_config = Config.from_defaults(model, loglik_kind)
+        # Update defaults with user-provided config, if any
+        if model_config is not None:
+            if isinstance(model_config, dict):
+                if "choices" not in model_config:
+                    if choices is not None:
+                        model_config["choices"] = tuple(choices)
+                else:
+                    if choices is not None:
+                        _logger.info(
+                            "choices list provided in both model_config and "
+                            "as an argument directly."
+                            " Using the one provided in model_config. \n"
+                            "We recommend providing choices in model_config."
+                        )
+            elif isinstance(model_config, ModelConfig):
+                if model_config.choices is None:
+                    if choices is not None:
+                        model_config.choices = tuple(choices)
+                else:
+                    if choices is not None:
+                        _logger.info(
+                            "choices list provided in both model_config and "
+                            "as an argument directly."
+                            " Using the one provided in model_config. \n"
+                            "We recommend providing choices in model_config."
+                        )
+
+            self.model_config.update_config(
+                model_config
+                if isinstance(model_config, ModelConfig)
+                else ModelConfig(**model_config)  # also serves as dict validation
+            )
+        else:
+            # Model config is not provided, but at this point was constructed from
+            # defaults.
+            if model not in typing.get_args(SupportedModels):
+                # TODO: ideally use self.supported_models above but mypy doesn't like it
+                if choices is not None:
+                    self.model_config.update_choices(choices)
+                elif model in ssms_model_config:
+                    self.model_config.update_choices(
+                        ssms_model_config[model]["choices"]
+                    )
+                    _logger.info(
+                        "choices argument passed as None, "
+                        "but found %s in ssms-simulators. "
+                        "Using choices, from ssm-simulators configs: %s",
+                        model,
+                        ssms_model_config[model]["choices"],
+                    )
+            else:
+                # Model config already constructed from defaults, and model string is
+                # in SupportedModels. So we are guaranteed that choices are in
+                # self.model_config already.
+
+                if choices is not None:
+                    _logger.info(
+                        "Model string is in SupportedModels."
+                        " Ignoring choices arguments."
+                    )
+
+        # Update loglik with user-provided value
+        self.model_config.update_loglik(loglik)
+        # Ensure that all required fields are valid
+        self.model_config.validate()
+
+        # Set up shortcuts so old code will work
+        self.response = self.model_config.response
+        self.list_params = self.model_config.list_params
+        self.choices = self.model_config.choices
+        self.model_name = self.model_config.model_name
+        self.loglik = self.model_config.loglik
+        self.loglik_kind = self.model_config.loglik_kind
+        self.extra_fields = self.model_config.extra_fields
+
+        self.n_choices = len(self.choices)
+
+        self._validate_choices()
+        self._pre_check_data_sanity()
+
+        # Process missing data setting
+        # AF-TODO: Could be a function in data validator?
+        if isinstance(missing_data, float):
+            if not ((self.data.rt == missing_data).any()):
+                raise ValueError(
+                    f"missing_data argument is provided as a float {missing_data}, "
+                    f"However, you have no RTs of {missing_data} in your dataset!"
+                )
+            else:
+                self.missing_data = True
+                self.missing_data_value = missing_data
+        elif isinstance(missing_data, bool):
+            if missing_data and (not (self.data.rt == -999.0).any()):
+                raise ValueError(
+                    "missing_data argument is provided as True, "
+                    " so RTs of -999.0 are treated as missing. \n"
+                    "However, you have no RTs of -999.0 in your dataset!"
+                )
+            elif (not missing_data) and (self.data.rt == -999.0).any():
+                # self.missing_data = True
+                raise ValueError(
+                    "Missing data provided as False. \n"
+                    "However, you have RTs of -999.0 in your dataset!"
+                )
+            else:
+                self.missing_data = missing_data
+        else:
+            raise ValueError(
+                "missing_data argument must be a bool or a float! \n"
+                f"You provided: {type(missing_data)}"
+            )
+
+        if isinstance(deadline, str):
+            self.deadline = True
+            self.deadline_name = deadline
+        else:
+            self.deadline = deadline
+            self.deadline_name = "deadline"
+
+        if (
+            not self.missing_data and not self.deadline
+        ) and loglik_missing_data is not None:
+            raise ValueError(
+                "You have specified a loglik_missing_data function, but you have not "
+                + "set the missing_data or deadline flag to True."
+            )
+        self.loglik_missing_data = loglik_missing_data
+
+        # Update data based on missing_data and deadline
+        self._handle_missing_data_and_deadline()
+        # Set self.missing_data_network based on `missing_data` and `deadline`
+        self.missing_data_network = self._set_missing_data_and_deadline(
+            self.missing_data, self.deadline, self.data
+        )
+
+        if self.deadline:
+            # self.response is a tuple (from Config); use concatenation.
+            self.response.append(self.deadline_name)
+
+        # Process lapse distribution
+        self.has_lapse = p_outlier is not None and p_outlier != 0
+        self._check_lapse(lapse)
+        if self.has_lapse and self.list_params[-1] != "p_outlier":
+            self.list_params.append("p_outlier")
+
+        # Process all parameters
+        self.params = Params.from_user_specs(
+            model=self,
+            include=[] if include is None else include,
+            kwargs=kwargs,
+            p_outlier=p_outlier,
+        )
+
+        self._parent = self.params.parent
+        self._parent_param = self.params.parent_param
+
+        self._validate_fixed_vectors()
+        self.formula, self.priors, self.link = self.params.parse_bambi(model=self)
+
+        # For parameters that have a regression backend, apply bounds at the likelihood
+        # level to ensure that the samples that are out of bounds
+        # are discarded (replaced with a large negative value).
+        self.bounds = {
+            name: param.bounds
+            for name, param in self.params.items()
+            if param.is_regression and param.bounds is not None
+        }
+
+        # Set p_outlier and lapse
+        self.p_outlier = self.params.get("p_outlier")
+        self.lapse = lapse if self.has_lapse else None
+
+        self._post_check_data_sanity()
+
+        self.model_distribution = self._make_model_distribution()
+
+        self.family = make_family(
+            self.model_distribution,
+            self.list_params,
+            self.link,
+            self._parent,
+        )
+
+        self.model = bmb.Model(
+            self.formula,
+            data=self.data,
+            family=self.family,
+            priors=self.priors,  # center_predictors=False
+            extra_namespace=self.additional_namespace,
+            **kwargs,
+        )
+
+        self._aliases = _get_alias_dict(
+            self.model, self._parent_param, self.response_c, self.response_str
+        )
+        self.set_alias(self._aliases)
+        self.model.build()
+
+        # Bambi >= 0.17 declares dims=("__obs__",) for intercept-only
+        # deterministics that actually have shape (1,). This causes an
+        # xarray CoordinateValidationError during pm.sample() when ArviZ
+        # tries to create a DataArray with mismatched dimension sizes.
+        # Fix by removing the dims declaration for these deterministics.
+        self._fix_scalar_deterministic_dims()
+
+        if process_initvals:
+            self._postprocess_initvals_deterministic(initval_settings=INITVAL_SETTINGS)
+        if self.initval_jitter > 0:
+            self._jitter_initvals(
+                jitter_epsilon=self.initval_jitter,
+                vector_only=True,
+            )
+
+        # Make sure we reset rvs_to_initial_values --> Only None's
+        # Otherwise PyMC barks at us when asking to compute likelihoods
+        self.pymc_model.rvs_to_initial_values.update(
+            {key_: None for key_ in self.pymc_model.rvs_to_initial_values.keys()}
+        )
+        _logger.info("Model initialized successfully.")
+
+    def _fix_scalar_deterministic_dims(self) -> None:
+        """Fix dims metadata for scalar deterministics.
+
+        Bambi >= 0.17 returns shape ``(1,)`` for intercept-only
+        deterministics but still declares ``dims=("__obs__",)``. This causes
+        an xarray ``CoordinateValidationError`` during ``pm.sample()`` because
+        the ``__obs__`` coordinate has ``n_obs`` entries. Removing the dims
+        declaration for these variables lets ArviZ handle them as
+        un-dimensioned arrays, avoiding the conflict.
+        """
+        n_obs = len(self.data)
+        dims_dict = self.pymc_model.named_vars_to_dims
+        for det in self.pymc_model.deterministics:
+            if det.name not in dims_dict:
+                continue
+            dims = dims_dict[det.name]
+            if "__obs__" in dims:
+                # Check static shape: if it doesn't match n_obs, remove dims
+                try:
+                    shape_0 = det.type.shape[0]
+                except (IndexError, TypeError):
+                    continue
+                if shape_0 is not None and shape_0 != n_obs:
+                    del dims_dict[det.name]
+
+    def _validate_fixed_vectors(self) -> None:
+        """Validate that fixed-vector parameters have the correct length.
+
+        Fixed-vector parameters (``prior=np.ndarray``) bypass Bambi's formula
+        system entirely --- they are passed as a scalar ``0.0`` placeholder to
+        Bambi, and the real vector is substituted inside
+        ``HSSMDistribution.logp()`` (see ``dist.py``).  Because this
+        substitution is invisible to Bambi, we must validate the vector length
+        against ``len(self.data)`` up front to catch shape mismatches early.
+        """
+        for name, param in self.params.items():
+            if isinstance(param.prior, np.ndarray):
+                if len(param.prior) != len(self.data):
+                    raise ValueError(
+                        f"Fixed vector for parameter '{name}' has length "
+                        f"{len(param.prior)}, but data has {len(self.data)} rows."
+                    )
+
+    @classproperty
+    def supported_models(cls) -> tuple[SupportedModels, ...]:
+        """Get a tuple of all supported models.
+
+        Returns
+        -------
+        tuple[SupportedModels, ...]
+            A tuple containing all supported model names.
+        """
+        return get_args(SupportedModels)
+
+    @classmethod
+    def _store_init_args(cls, *args, **kwargs):
+        """Store initialization arguments using signature binding."""
+        sig = signature(cls.__init__)
+        bound_args = sig.bind(*args, **kwargs)
+        bound_args.apply_defaults()
+        return {k: v for k, v in bound_args.arguments.items() if k != "self"}
+
+    def find_MAP(self, **kwargs):
+        """Perform Maximum A Posteriori estimation.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the MAP estimates of the model parameters.
+        """
+        self._map_dict = pm.find_MAP(model=self.pymc_model, **kwargs)
+        return self._map_dict
+
+    def sample(
+        self,
+        sampler: Literal["pymc", "numpyro", "blackjax", "nutpie", "laplace"]
+        | None = None,
+        init: str | None = None,
+        initvals: str | dict | None = None,
+        include_response_params: bool = False,
+        **kwargs,
+    ) -> az.InferenceData | pm.Approximation:
+        """Perform sampling using the `fit` method via bambi.Model.
+
+        Parameters
+        ----------
+        sampler: optional
+            The sampler to use. Can be one of "pymc", "numpyro",
+            "blackjax", "nutpie", or "laplace". If using `blackbox` likelihoods,
+            this cannot be "numpyro", "blackjax", or "nutpie". By default it is None,
+            and sampler will automatically be chosen: when the model uses the
+            `approx_differentiable` likelihood, and `jax` backend, "numpyro" will
+            be used. Otherwise, "pymc" (the default PyMC NUTS sampler) will be used.
+
+            Note that the old sampler names such as "mcmc", "nuts_numpyro",
+            "nuts_blackjax" will be deprecated and removed in future releases. A warning
+            will be raised if any of these old names are used.
+        init: optional
+            Initialization method to use for the sampler. If any of the NUTS samplers
+            is used, defaults to `"adapt_diag"`. Otherwise, defaults to `"auto"`.
+        initvals: optional
+            Pass initial values to the sampler. This can be a dictionary of initial
+            values for parameters of the model, or a string "map" to use initialization
+            at the MAP estimate. If "map" is used, the MAP estimate will be computed if
+            not already attached to the base class from prior call to 'find_MAP'.
+        include_response_params: optional
+            Include parameters of the response distribution in the output. These usually
+            take more space than other parameters as there's one of them per
+            observation. Defaults to False.
+        kwargs
+            Other arguments passed to bmb.Model.fit(). Please see [here]
+            (https://bambinos.github.io/bambi/api_reference.html#bambi.models.Model.fit)
+            for full documentation.
+
+        Returns
+        -------
+        az.InferenceData | pm.Approximation
+            A reference to the `model.traces` object, which stores the traces of the
+            last call to `model.sample()`. `model.traces` is an ArviZ `InferenceData`
+            instance if `sampler` is `"pymc"` (default), `"numpyro"`,
+            `"blackjax"` or "`laplace".
+        """
+        # If initvals are None (default)
+        # we skip processing initvals here.
+        if sampler in _new_sampler_mapping:
+            _logger.warning(
+                f"Sampler '{sampler}' is deprecated. "
+                "Please use the new sampler names: "
+                "'pymc', 'numpyro', 'blackjax', 'nutpie', or 'laplace'."
+            )
+            sampler = _new_sampler_mapping[sampler]  # type: ignore
+
+        if sampler == "vi":
+            raise ValueError(
+                "VI is not supported via the sample() method. "
+                "Please use the vi() method instead."
+            )
+
+        if initvals is not None:
+            if isinstance(initvals, dict):
+                kwargs["initvals"] = initvals
+            else:
+                if isinstance(initvals, str):
+                    if initvals == "map":
+                        if self._map_dict is None:
+                            _logger.info(
+                                "initvals='map' but no map"
+                                "estimate precomputed. \n"
+                                "Running map estimation first..."
+                            )
+                            self.find_MAP()
+                            kwargs["initvals"] = self._map_dict
+                        else:
+                            kwargs["initvals"] = self._map_dict
+                else:
+                    raise ValueError(
+                        "initvals argument must be a dictionary or 'map'"
+                        " to use the MAP estimate."
+                    )
+        else:
+            kwargs["initvals"] = self._initvals
+            _logger.info("Using default initvals. \n")
+
+        if sampler is None:
+            if (
+                self.loglik_kind == "approx_differentiable"
+                and self.model_config.backend == "jax"
+            ):
+                sampler = "numpyro"
+            else:
+                sampler = "pymc"
+
+        if self.loglik_kind == "blackbox":
+            if sampler in ["blackjax", "numpyro", "nutpie"]:
+                raise ValueError(
+                    f"{sampler} sampler does not work with blackbox likelihoods."
+                )
+
+            if "step" not in kwargs:
+                kwargs |= {"step": pm.Slice(model=self.pymc_model)}
+
+        if (
+            self.loglik_kind == "approx_differentiable"
+            and self.model_config.backend == "jax"
+            and sampler == "pymc"
+            and kwargs.get("cores", None) != 1
+        ):
+            _logger.warning(
+                "Parallel sampling might not work with `jax` backend and the PyMC NUTS "
+                + "sampler on some platforms. Please consider using `numpyro`, "
+                + "`blackjax`, or `nutpie` sampler if that is a problem."
+            )
+
+        if self._check_extra_fields():
+            self._update_extra_fields()
+
+        if init is None:
+            if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]:
+                init = "adapt_diag"
+            else:
+                init = "auto"
+
+        # If sampler is finally `numpyro` make sure
+        # the jitter argument is set to False
+        if sampler == "numpyro":
+            if "nuts_sampler_kwargs" in kwargs:
+                if kwargs["nuts_sampler_kwargs"].get("jitter"):
+                    _logger.warning(
+                        "The jitter argument is set to True. "
+                        + "This argument is not supported "
+                        + "by the numpyro backend. "
+                        + "The jitter argument will be set to False."
+                    )
+                kwargs["nuts_sampler_kwargs"]["jitter"] = False
+            else:
+                kwargs["nuts_sampler_kwargs"] = {"jitter": False}
+
+        if sampler != "pymc" and "step" in kwargs:
+            raise ValueError(
+                "`step` samplers (enabled by the `step` argument) are only supported "
+                "by the `pymc` sampler."
+            )
+
+        if self._inference_obj is not None:
+            _logger.warning(
+                "The model has already been sampled. Overwriting the previous "
+                + "inference object. Any previous reference to the inference object "
+                + "will still point to the old object."
+            )
+
+        # Define whether likelihood should be computed
+        compute_likelihood = True
+        if "idata_kwargs" in kwargs:
+            if "log_likelihood" in kwargs["idata_kwargs"]:
+                compute_likelihood = kwargs["idata_kwargs"].pop("log_likelihood", True)
+
+        omit_offsets = kwargs.pop("omit_offsets", False)
+        self._inference_obj = self.model.fit(
+            inference_method=(
+                "pymc"
+                if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]
+                else sampler
+            ),
+            init=init,
+            include_response_params=include_response_params,
+            omit_offsets=omit_offsets,
+            **kwargs,
+        )
+
+        # Separate out log likelihood computation
+        if compute_likelihood:
+            self.log_likelihood(self._inference_obj, inplace=True)
+
+        # Subset data vars in posterior
+        self._clean_posterior_group(idata=self._inference_obj)
+        return self.traces
+
+    def vi(
+        self,
+        method: str = "advi",
+        niter: int = 10000,
+        draws: int = 1000,
+        return_idata: bool = True,
+        ignore_mcmc_start_point_defaults=False,
+        **vi_kwargs,
+    ) -> pm.Approximation | az.InferenceData:
+        """Perform Variational Inference.
+
+        Parameters
+        ----------
+        niter : int
+            The number of iterations to run the VI algorithm. Defaults to 3000.
+        method : str
+            The method to use for VI. Can be one of "advi" or "fullrank_advi", "svgd",
+            "asvgd".Defaults to "advi".
+        draws : int
+            The number of samples to draw from the posterior distribution.
+            Defaults to 1000.
+        return_idata : bool
+            If True, returns an InferenceData object. Otherwise, returns the
+            approximation object directly. Defaults to True.
+
+        Returns
+        -------
+            pm.Approximation or az.InferenceData: The mean field approximation object.
+        """
+        if self.loglik_kind == "analytical":
+            _logger.warning(
+                "VI is not recommended for the analytical likelihood,"
+                " since gradients can be brittle."
+            )
+        elif self.loglik_kind == "blackbox":
+            raise ValueError(
+                "VI is not supported for blackbox likelihoods, "
+                " since likelihood gradients are needed!"
+            )
+
+        if ("start" not in vi_kwargs) and not ignore_mcmc_start_point_defaults:
+            _logger.info("Using MCMC starting point defaults.")
+            vi_kwargs["start"] = self._initvals
+
+        # Run variational inference directly from pymc model
+        with self.pymc_model:
+            self._vi_approx = pm.fit(n=niter, method=method, **vi_kwargs)
+
+        # Sample from the approximate posterior
+        if self._vi_approx is not None:
+            self._inference_obj_vi = self._vi_approx.sample(draws)
+
+        # Post-processing
+        self._clean_posterior_group(idata=self._inference_obj_vi)
+
+        # Return the InferenceData object if return_idata is True
+        if return_idata:
+            return self._inference_obj_vi
+        # Otherwise return the appromation object directly
+        return self.vi_approx
+
+    def _clean_posterior_group(self, idata: az.InferenceData | None = None):
+        """Clean up the posterior group of the InferenceData object.
+
+        Parameters
+        ----------
+        idata : az.InferenceData
+            The InferenceData object to clean up. If None, the last InferenceData object
+            will be used.
+        """
+        # # Logic behind which variables to keep:
+        # # We essentially want to get rid of
+        # # all the trial-wise variables.
+
+        # # We drop all distributional components, IF they are deterministics
+        # # (in which case they will be trial wise systematically)
+        # # and we keep distributional components, IF they are
+        # # basic random-variabels (in which case they should never
+        # # appear trial-wise).
+        if idata is None:
+            raise ValueError(
+                "The InferenceData object is None. Cannot clean up the posterior group."
+            )
+        elif not hasattr(idata, "posterior"):
+            raise ValueError(
+                "The InferenceData object does not have a posterior group. "
+                + "Cannot clean up the posterior group."
+            )
+
+        vars_to_keep = set(idata["posterior"].data_vars.keys()).difference(
+            set(
+                key_
+                for key_ in self.model.distributional_components.keys()
+                if key_ in [var_.name for var_ in self.pymc_model.deterministics]
+            )
+        )
+        vars_to_keep_clean = [
+            var_
+            for var_ in vars_to_keep
+            if isinstance(var_, str) and "_mean" not in var_
+        ]
+
+        setattr(
+            idata,
+            "posterior",
+            idata["posterior"][vars_to_keep_clean],
+        )
+
+    def log_likelihood(
+        self,
+        idata: az.InferenceData | None = None,
+        data: pd.DataFrame | None = None,
+        inplace: bool = True,
+        keep_likelihood_params: bool = False,
+    ) -> az.InferenceData | None:
+        """Compute the log likelihood of the model.
+
+        Parameters
+        ----------
+        idata : optional
+            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
+        data : optional
+            A pandas DataFrame with values for the predictors that are used to obtain
+            out-of-sample predictions. If omitted, the original dataset is used.
+        inplace : optional
+            If `True` will modify idata in-place and append a `log_likelihood` group to
+            `idata`. Otherwise, it will return a copy of idata with the predictions
+            added, by default True.
+        keep_likelihood_params : optional
+            If `True`, the trial wise likelihood parameters that are computed
+            on route to getting the log likelihood are kept in the `idata` object.
+            Defaults to False. See also the method `add_likelihood_parameters_to_idata`.
+
+        Returns
+        -------
+        az.InferenceData | None
+            InferenceData or None
+        """
+        if self._inference_obj is None and idata is None:
+            raise ValueError(
+                "Neither has the model been sampled yet nor"
+                + " an idata object has been provided."
+            )
+
+        if idata is None:
+            if self._inference_obj is None:
+                raise ValueError(
+                    "The model has not been sampled yet. "
+                    + "Please provide an idata object."
+                )
+            else:
+                idata = self._inference_obj
+
+        # Actual likelihood computation
+        idata = _compute_log_likelihood(self.model, idata, data, inplace)
+
+        # clean up posterior:
+        if not keep_likelihood_params:
+            self._clean_posterior_group(idata=idata)
+
+        if inplace:
+            return None
+        else:
+            return idata
+
+    def add_likelihood_parameters_to_idata(
+        self,
+        idata: az.InferenceData | None = None,
+        inplace: bool = False,
+    ) -> az.InferenceData | None:
+        """Add likelihood parameters to the InferenceData object.
+
+        Parameters
+        ----------
+        idata : az.InferenceData
+            The InferenceData object returned by HSSM.sample().
+        inplace : bool
+            If True, the likelihood parameters are added to idata in-place. Otherwise,
+            a copy of idata with the likelihood parameters added is returned.
+            Defaults to False.
+
+        Returns
+        -------
+        az.InferenceData | None
+            InferenceData or None
+        """
+        if idata is None:
+            if self._inference_obj is None:
+                raise ValueError("No idata provided and model not yet sampled!")
+            else:
+                idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
+                    deepcopy(self._inference_obj)
+                    if not inplace
+                    else self._inference_obj
+                )
+        else:
+            idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
+                deepcopy(idata) if not inplace else idata
+            )
+        return idata
+
+    def sample_posterior_predictive(
+        self,
+        idata: az.InferenceData | None = None,
+        data: pd.DataFrame | None = None,
+        inplace: bool = True,
+        include_group_specific: bool = True,
+        kind: Literal["response", "response_params"] = "response",
+        draws: int | float | list[int] | np.ndarray | None = None,
+        safe_mode: bool = True,
+    ) -> az.InferenceData | None:
+        """Perform posterior predictive sampling from the HSSM model.
+
+        Parameters
+        ----------
+        idata : optional
+            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
+            the `InferenceData` from the last time `sample()` is called will be used.
+        data : optional
+            An optional data frame with values for the predictors that are used to
+            obtain out-of-sample predictions. If omitted, the original dataset is used.
+        inplace : optional
+            If `True` will modify idata in-place and append a `posterior_predictive`
+            group to `idata`. Otherwise, it will return a copy of idata with the
+            predictions added, by default True.
+        include_group_specific : optional
+            If `True` will make predictions including the group specific effects.
+            Otherwise, predictions are made with common effects only (i.e. group-
+            specific are set to zero), by default True.
+        kind: optional
+            Indicates the type of prediction required. Can be `"response_params"` or
+            `"response"`. The first returns draws from the posterior distribution of the
+            likelihood parameters, while the latter returns the draws from the posterior
+            predictive distribution (i.e. the posterior probability distribution for a
+            new observation) in addition to the posterior distribution. Defaults to
+            "response_params".
+        draws: optional
+            The number of samples to draw from the posterior predictive distribution
+            from each chain.
+            When it's an integer >= 1, the number of samples to be extracted from the
+            `draw` dimension. If this integer is larger than the number of posterior
+            samples in each chain, all posterior samples will be used
+            in posterior predictive sampling. When a float between 0 and 1, the
+            proportion of samples from the draw dimension from each chain to be used in
+            posterior predictive sampling.. If this proportion is very
+            small, at least one sample will be used. When None, all posterior samples
+            will be used. Defaults to None.
+        safe_mode: bool
+            If True, the function will split the draws into chunks of 10 to avoid memory
+            issues. Defaults to True.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet and idata is not provided.
+
+        Returns
+        -------
+        az.InferenceData | None
+            InferenceData or None
+        """
+        if idata is None:
+            if self._inference_obj is None:
+                raise ValueError(
+                    "The model has not been sampled yet. "
+                    + "Please either provide an idata object or sample the model first."
+                )
+            idata = self._inference_obj
+            _logger.info(
+                "idata=None, we use the traces assigned to the HSSM object as idata."
+            )
+
+        if idata is not None:
+            if "posterior_predictive" in idata.groups():
+                del idata["posterior_predictive"]
+                _logger.warning(
+                    "pre-existing posterior_predictive group deleted from idata. \n"
+                )
+
+        if self._check_extra_fields(data):
+            self._update_extra_fields(data)
+
+        if isinstance(draws, np.ndarray):
+            draws = draws.astype(int)
+        elif isinstance(draws, list):
+            draws = np.array(draws).astype(int)
+        elif isinstance(draws, int | float):
+            draws = np.arange(int(draws))
+        elif draws is None:
+            draws = idata["posterior"].draw.values
+        else:
+            raise ValueError(
+                "draws must be an integer, " + "a list of integers, or a numpy array."
+            )
+
+        assert isinstance(draws, np.ndarray)
+
+        # Make a copy of idata, set the `posterior` group to be a random sub-sample
+        # of the original (draw dimension gets sub-sampled)
+
+        idata_copy = idata.copy()
+
+        if (draws.shape != idata["posterior"].draw.values.shape) or (
+            (draws.shape == idata["posterior"].draw.values.shape)
+            and not np.allclose(draws, idata["posterior"].draw.values)
+        ):
+            # Reassign posterior to sub-sampled version
+            setattr(idata_copy, "posterior", idata["posterior"].isel(draw=draws))
+
+        if kind == "response":
+            # If we run kind == 'response' we actually run the observation RV
+            if safe_mode:
+                # safe mode splits the draws into chunks of 10 to avoid
+                # memory issues (TODO: Figure out the source of memory issues)
+                split_draws = _split_array(
+                    idata_copy["posterior"].draw.values, divisor=10
+                )
+
+                posterior_predictive_list = []
+                for samples_tmp in split_draws:
+                    tmp_posterior = idata["posterior"].sel(draw=samples_tmp)
+                    setattr(idata_copy, "posterior", tmp_posterior)
+                    self.model.predict(
+                        idata_copy, kind, data, True, include_group_specific
+                    )
+                    posterior_predictive_list.append(idata_copy["posterior_predictive"])
+
+                if inplace:
+                    idata.add_groups(
+                        posterior_predictive=xr.concat(
+                            posterior_predictive_list, dim="draw"
+                        )
+                    )
+                    # for inplace, we don't return anything
+                    return None
+                else:
+                    # Reassign original posterior to idata_copy
+                    setattr(idata_copy, "posterior", idata["posterior"])
+                    # Add new posterior predictive group to idata_copy
+                    del idata_copy["posterior_predictive"]
+                    idata_copy.add_groups(
+                        posterior_predictive=xr.concat(
+                            posterior_predictive_list, dim="draw"
+                        )
+                    )
+                    return idata_copy
+            else:
+                if inplace:
+                    # If not safe-mode
+                    # We call .predict() directly without any
+                    # chunking of data.
+
+                    # .predict() is called on the copy of idata
+                    # since we still subsampled (or assigned) the draws
+                    self.model.predict(
+                        idata_copy, kind, data, True, include_group_specific
+                    )
+
+                    # posterior predictive group added to idata
+                    idata.add_groups(
+                        posterior_predictive=idata_copy["posterior_predictive"]
+                    )
+                    # don't return anything if inplace
+                    return None
+                else:
+                    # Not safe mode and not inplace
+                    # Function acts as very thin wrapper around
+                    # .predict(). It just operates on the
+                    # idata_copy object
+                    return self.model.predict(
+                        idata_copy, kind, data, False, include_group_specific
+                    )
+        elif kind == "response_params":
+            # If kind == 'response_params', we don't need to run the RV directly,
+            # there shouldn't really be any significant memory issues here,
+            # we can simply ignore settings, since the computational overhead
+            # should be very small --> nudges user towards good outputs.
+            _logger.warning(
+                "The kind argument is set to 'mean', but 'draws' argument "
+                + "is not None: The draws argument will be ignored!"
+            )
+            return self.model.predict(
+                idata, kind, data, inplace, include_group_specific
+            )
+        else:
+            raise ValueError("`kind` must be either 'response' or 'response_params'.")
+
+    def plot_predictive(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
+        """Produce a posterior predictive plot.
+
+        Equivalent to calling `hssm.plotting.plot_predictive()` with the
+        model. Please see that function for
+        [full documentation][hssm.plotting.plot_predictive].
+
+        Returns
+        -------
+        mpl.axes.Axes | sns.FacetGrid
+            The matplotlib axis or seaborn FacetGrid object containing the plot.
+        """
+        return plotting.plot_predictive(self, **kwargs)
+
+    def plot_quantile_probability(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
+        """Produce a quantile probability plot.
+
+        Equivalent to calling `hssm.plotting.plot_quantile_probability()` with the
+        model. Please see that function for
+        [full documentation][hssm.plotting.plot_quantile_probability].
+
+        Returns
+        -------
+        mpl.axes.Axes | sns.FacetGrid
+            The matplotlib axis or seaborn FacetGrid object containing the plot.
+        """
+        return plotting.plot_quantile_probability(self, **kwargs)
+
+    def predict(self, **kwargs) -> az.InferenceData:
+        """Generate samples from the predictive distribution."""
+        return self.model.predict(**kwargs)
+
+    def sample_do(
+        self, params: dict[str, Any], draws: int = 100, return_model=False, **kwargs
+    ) -> az.InferenceData | tuple[az.InferenceData, pm.Model]:
+        """Generate samples from the predictive distribution using the `do-operator`."""
+        do_model = do(self.pymc_model, params)
+        do_idata = pm.sample_prior_predictive(model=do_model, draws=draws, **kwargs)
+
+        # clean up `rt,response_mean` to `v`
+        do_idata = self._drop_parent_str_from_idata(idata=do_idata)
+
+        # rename otherwise inconsistent dims and coords
+        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].dims:
+            setattr(
+                do_idata,
+                "prior_predictive",
+                do_idata["prior_predictive"].rename_dims(
+                    {"rt,response_extra_dim_0": "rt,response_dim"}
+                ),
+            )
+        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].coords:
+            setattr(
+                do_idata,
+                "prior_predictive",
+                do_idata["prior_predictive"].rename_vars(
+                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
+                ),
+            )
+
+        if return_model:
+            return do_idata, do_model
+        return do_idata
+
+    def sample_prior_predictive(
+        self,
+        draws: int = 500,
+        var_names: str | list[str] | None = None,
+        omit_offsets: bool = True,
+        random_seed: np.random.Generator | None = None,
+    ) -> az.InferenceData:
+        """Generate samples from the prior predictive distribution.
+
+        Parameters
+        ----------
+        draws
+            Number of draws to sample from the prior predictive distribution. Defaults
+            to 500.
+        var_names
+            A list of names of variables for which to compute the prior predictive
+            distribution. Defaults to ``None`` which means both observed and unobserved
+            RVs.
+        omit_offsets
+            Whether to omit offset terms. Defaults to ``True``.
+        random_seed
+            Seed for the random number generator.
+
+        Returns
+        -------
+        az.InferenceData
+            ``InferenceData`` object with the groups ``prior``, ``prior_predictive`` and
+            ``observed_data``.
+        """
+        prior_predictive = self.model.prior_predictive(
+            draws, var_names, omit_offsets, random_seed
+        )
+
+        # AF-COMMENT: Not sure if necessary to include the
+        # mean prior here (which adds deterministics that
+        # could be recomputed elsewhere)
+        prior_predictive.add_groups(posterior=prior_predictive.prior)
+        # Bambi >= 0.17 renamed kind="mean" to kind="response_params".
+        self.model.predict(prior_predictive, kind="response_params", inplace=True)
+
+        # clean
+        setattr(prior_predictive, "prior", prior_predictive["posterior"])
+        del prior_predictive["posterior"]
+
+        if self._inference_obj is None:
+            self._inference_obj = prior_predictive
+        else:
+            self._inference_obj.extend(prior_predictive)
+
+        # clean up `rt,response_mean` to `v`
+        idata = self._drop_parent_str_from_idata(idata=self._inference_obj)
+
+        # rename otherwise inconsistent dims and coords
+        if "rt,response_extra_dim_0" in idata["prior_predictive"].dims:
+            setattr(
+                idata,
+                "prior_predictive",
+                idata["prior_predictive"].rename_dims(
+                    {"rt,response_extra_dim_0": "rt,response_dim"}
+                ),
+            )
+        if "rt,response_extra_dim_0" in idata["prior_predictive"].coords:
+            setattr(
+                idata,
+                "prior_predictive",
+                idata["prior_predictive"].rename_vars(
+                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
+                ),
+            )
+
+        # Update self._inference_obj to match the cleaned idata
+        self._inference_obj = idata
+        return deepcopy(self._inference_obj)
+
+    @property
+    def pymc_model(self) -> pm.Model:
+        """Provide access to the PyMC model.
+
+        Returns
+        -------
+        pm.Model
+            The PyMC model built by bambi
+        """
+        return self.model.backend.model
+
+    def set_alias(self, aliases: dict[str, str | dict]):
+        """Set parameter aliases.
+
+        Sets the aliases according to the dictionary passed to it and rebuild the
+        model.
+
+        Parameters
+        ----------
+        aliases
+            A dict specifying the parameter names being aliased and the aliases.
+        """
+        self.model.set_alias(aliases)
+        self.model.build()
+
+    @property
+    def response_c(self) -> str:
+        """Return the response variable names in c() format."""
+        if self.response is None:
+            return "c()"
+        return f"c({', '.join(self.response)})"
+
+    @property
+    def response_str(self) -> str:
+        """Return the response variable names in string format."""
+        if self.response is None:
+            return ""
+        return ",".join(self.response)
+
+    # NOTE: can't annotate return type because the graphviz dependency is optional
+    def graph(self, formatting="plain", name=None, figsize=None, dpi=300, fmt="png"):
+        """Produce a graphviz Digraph from a built HSSM model.
+
+        Requires graphviz, which may be installed most easily with `conda install -c
+        conda-forge python-graphviz`. Alternatively, you may install the `graphviz`
+        binaries yourself, and then `pip install graphviz` to get the python bindings.
+        See http://graphviz.readthedocs.io/en/stable/manual.html for more information.
+
+        Parameters
+        ----------
+        formatting
+            One of `"plain"` or `"plain_with_params"`. Defaults to `"plain"`.
+        name
+            Name of the figure to save. Defaults to `None`, no figure is saved.
+        figsize
+            Maximum width and height of figure in inches. Defaults to `None`, the
+            figure size is set automatically. If defined and the drawing is larger than
+            the given size, the drawing is uniformly scaled down so that it fits within
+            the given size.  Only works if `name` is not `None`.
+        dpi
+            Point per inch of the figure to save.
+            Defaults to 300. Only works if `name` is not `None`.
+        fmt
+            Format of the figure to save.
+            Defaults to `"png"`. Only works if `name` is not `None`.
+
+        Returns
+        -------
+        graphviz.Graph
+            The graph
+        """
+        graph = self.model.graph(formatting, name, figsize, dpi, fmt)
+
+        parent_param = self._parent_param
+        if parent_param.is_regression:
+            return graph
+
+        # Modify the graph
+        # 1. Remove all nodes and edges related to `{parent}_mean`:
+        graph.body = [
+            item for item in graph.body if f"{parent_param.name}_mean" not in item
+        ]
+        # 2. Add a new edge from parent to response
+        graph.edge(parent_param.name, self.response_str)
+
+        return graph
+
+    def compile_logp(self, keep_transformed: bool = False, **kwargs):
+        """Compile the log probability function for the model.
+
+        Parameters
+        ----------
+        keep_transformed : bool, optional
+            If True, keeps the transformed variables in the compiled function.
+            If False, removes value transforms before compilation.
+            Defaults to False.
+        **kwargs
+            Additional keyword arguments passed to PyMC's compile_logp:
+            - vars: List of variables. Defaults to None (all variables).
+            - jacobian: Whether to include log(|det(dP/dQ)|) term for
+            transformed variables. Defaults to True.
+            - sum: Whether to sum all terms instead of returning a vector.
+            Defaults to True.
+
+        Returns
+        -------
+        callable
+            A compiled function that computes the model log probability.
+        """
+        if keep_transformed:
+            return self.pymc_model.compile_logp(
+                vars=kwargs.get("vars", None),
+                jacobian=kwargs.get("jacobian", True),
+                sum=kwargs.get("sum", True),
+            )
+        else:
+            new_model = pm.model.transform.conditioning.remove_value_transforms(
+                self.pymc_model
+            )
+            return new_model.compile_logp(
+                vars=kwargs.get("vars", None),
+                jacobian=kwargs.get("jacobian", True),
+                sum=kwargs.get("sum", True),
+            )
+
+    def plot_trace(
+        self,
+        data: az.InferenceData | None = None,
+        include_deterministic: bool = False,
+        tight_layout: bool = True,
+        **kwargs,
+    ) -> None:
+        """Generate trace plot with ArviZ but with additional convenience features.
+
+        This is a simple wrapper for the az.plot_trace() function. By default, it
+        filters out the deterministic values from the plot. Please see the
+        [arviz documentation]
+        (https://arviz-devs.github.io/arviz/api/generated/arviz.plot_trace.html)
+        for additional parameters that can be specified.
+
+        Parameters
+        ----------
+        data : optional
+            An ArviZ InferenceData object. If None, the traces stored in the model will
+            be used.
+        include_deterministic : optional
+            Whether to include deterministic variables in the plot. Defaults to False.
+            Note that if include deterministic is set to False and and `var_names` is
+            provided, the `var_names` provided will be modified to also exclude the
+            deterministic values. If this is not desirable, set
+            `include deterministic` to True.
+        tight_layout : optional
+            Whether to call plt.tight_layout() after plotting. Defaults to True.
+        """
+        data = data or self.traces
+        if not isinstance(data, az.InferenceData):
+            raise TypeError("data must be an InferenceData object.")
+
+        if not include_deterministic:
+            var_names = list(
+                set([var.name for var in self.pymc_model.free_RVs]).intersection(
+                    set(list(data["posterior"].data_vars.keys()))
+                )
+            )
+            # var_names = self._get_deterministic_var_names(data)
+            if var_names:
+                if "var_names" in kwargs:
+                    if isinstance(kwargs["var_names"], str):
+                        if kwargs["var_names"] not in var_names:
+                            var_names.append(kwargs["var_names"])
+                        kwargs["var_names"] = var_names
+                    elif isinstance(kwargs["var_names"], list):
+                        kwargs["var_names"] = list(
+                            set(var_names) | set(kwargs["var_names"])
+                        )
+                    elif kwargs["var_names"] is None:
+                        kwargs["var_names"] = var_names
+                    else:
+                        raise ValueError(
+                            "`var_names` must be a string, a list of strings, or None."
+                        )
+                else:
+                    kwargs["var_names"] = var_names
+        az.plot_trace(data, **kwargs)
+
+        if tight_layout:
+            plt.tight_layout()
+
+    def summary(
+        self,
+        data: az.InferenceData | None = None,
+        include_deterministic: bool = False,
+        **kwargs,
+    ) -> pd.DataFrame | xr.Dataset:
+        """Produce a summary table with ArviZ but with additional convenience features.
+
+        This is a simple wrapper for the az.summary() function. By default, it
+        filters out the deterministic values from the plot. Please see the
+        [arviz documentation]
+        (https://arviz-devs.github.io/arviz/api/generated/arviz.summary.html)
+        for additional parameters that can be specified.
+
+        Parameters
+        ----------
+        data
+            An ArviZ InferenceData object. If None, the traces stored in the model will
+            be used.
+        include_deterministic : optional
+            Whether to include deterministic variables in the plot. Defaults to False.
+            Note that if include_deterministic is set to False and and `var_names` is
+            provided, the `var_names` provided will be modified to also exclude the
+            deterministic values. If this is not desirable, set
+            `include_deterministic` to True.
+
+        Returns
+        -------
+        pd.DataFrame | xr.Dataset
+            A pandas DataFrame or xarray Dataset containing the summary statistics.
+        """
+        data = data or self.traces
+        if not isinstance(data, az.InferenceData):
+            raise TypeError("data must be an InferenceData object.")
+
+        if not include_deterministic:
+            var_names = list(
+                set([var.name for var in self.pymc_model.free_RVs]).intersection(
+                    set(list(data["posterior"].data_vars.keys()))
+                )
+            )
+            # var_names = self._get_deterministic_var_names(data)
+            if var_names:
+                kwargs["var_names"] = list(set(var_names + kwargs.get("var_names", [])))
+        return az.summary(data, **kwargs)
+
+    def initial_point(self, transformed: bool = False) -> dict[str, np.ndarray]:
+        """Compute the initial point of the model.
+
+        This is a slightly altered version of pm.initial_point.initial_point().
+
+        Parameters
+        ----------
+        transformed : bool, optional
+            If True, return the initial point in transformed space.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the initial point of the model parameters.
+        """
+        fn = pm.initial_point.make_initial_point_fn(
+            model=self.pymc_model, return_transformed=transformed
+        )
+        return pm.model.Point(fn(None), model=self.pymc_model)
+
+    def restore_traces(
+        self, traces: az.InferenceData | pm.Approximation | str | PathLike
+    ) -> None:
+        """Restore traces from an InferenceData object or a .netcdf file.
+
+        Parameters
+        ----------
+        traces
+            An InferenceData object or a path to a file containing the traces.
+        """
+        if isinstance(traces, pm.Approximation):
+            self._inference_obj_vi = traces
+            return
+
+        if isinstance(traces, (str, PathLike)):
+            traces = az.from_netcdf(traces)
+        self._inference_obj = cast("az.InferenceData", traces)
+
+    def restore_vi_traces(
+        self, traces: az.InferenceData | pm.Approximation | str | PathLike
+    ) -> None:
+        """Restore VI traces from an InferenceData object or a .netcdf file.
+
+        Parameters
+        ----------
+        traces
+            An InferenceData object or a path to a file containing the VI traces.
+        """
+        if isinstance(traces, pm.Approximation):
+            self._inference_obj_vi = traces
+            return
+
+        if isinstance(traces, (str, PathLike)):
+            traces = az.from_netcdf(traces)
+        self._inference_obj_vi = cast("az.InferenceData", traces)
+
+    def save_model(
+        self,
+        model_name: str | None = None,
+        allow_absolute_base_path: bool = False,
+        base_path: str | Path = "hssm_models",
+        save_idata_only: bool = False,
+    ) -> None:
+        """Save a HSSM model instance and its inference results to disk.
+
+        Parameters
+        ----------
+        model : HSSM
+            The HSSM model instance to save
+        model_name : str | None
+            Name to use for the saved model files.
+            If None, will use model.model_name with timestamp
+        allow_absolute_base_path : bool
+            Whether to allow absolute paths for base_path
+        base_path : str | Path
+            Base directory to save model files in.
+            Must be relative path if allow_absolute_base_path=False
+        save_idata_only: bool = False,
+            Whether to save the model class instance itself
+
+        Raises
+        ------
+        ValueError
+            If base_path is absolute and allow_absolute_base_path=False
+        """
+        # check if base_path is absolute
+        if not allow_absolute_base_path:
+            if str(base_path).startswith("/"):
+                raise ValueError(
+                    "base_path must be a relative path"
+                    " if allow_absolute_base_path is False"
+                )
+
+        if model_name is None:
+            # Get date string format as suffix to model name
+            model_name = (
+                self.model_name
+                + "_"
+                + datetime.datetime.now().strftime("%Y_%m_%d_%H_%M_%S")
+            )
+
+        # check if folder by name model_name exists
+        model_name = model_name.replace(" ", "_")
+        model_path = Path(base_path).joinpath(model_name)
+        model_path.mkdir(parents=True, exist_ok=True)
+
+        # Save model to pickle file
+        if not save_idata_only:
+            with open(model_path.joinpath("model.pkl"), "wb") as f:
+                cpickle.dump(self, f)
+
+        # Save traces to netcdf file
+        if self._inference_obj is not None:
+            az.to_netcdf(self._inference_obj, model_path.joinpath("traces.nc"))
+
+        # Save vi_traces to netcdf file
+        if self._inference_obj_vi is not None:
+            az.to_netcdf(self._inference_obj_vi, model_path.joinpath("vi_traces.nc"))
+
+    @classmethod
+    def load_model(
+        cls, path: Union[str, Path]
+    ) -> Union["HSSM", dict[str, Optional[az.InferenceData]]]:
+        """Load a HSSM model instance and its inference results from disk.
+
+        Parameters
+        ----------
+        path : str | Path
+            Path to the model directory or model.pkl file. If a directory is provided,
+            will look for model.pkl, traces.nc and vi_traces.nc files within it.
+
+        Returns
+        -------
+        HSSM
+            The loaded HSSM model instance with inference results attached if available.
+        """
+        # Convert path to Path object
+        path = Path(path)
+
+        # If path points to a file, assume it's model.pkl
+        if path.is_file():
+            model_dir = path.parent
+            model_path = path
+        else:
+            # Path points to directory
+            model_dir = path
+            model_path = model_dir.joinpath("model.pkl")
+
+        # check if model_dir exists
+        if not model_dir.exists():
+            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
+
+        # check if model.pkl exists raise logging information if not
+        if not model_path.exists():
+            _logger.info(
+                f"model.pkl file does not exist in {model_dir}. "
+                "Attempting to load traces only."
+            )
+            if (not model_dir.joinpath("traces.nc").exists()) and (
+                not model_dir.joinpath("vi_traces.nc").exists()
+            ):
+                raise FileNotFoundError(f"No traces found in {model_dir}.")
+            else:
+                idata_dict = cls.load_model_idata(model_dir)
+                return idata_dict
+        else:
+            # Load model from pickle file
+            with open(model_path, "rb") as f:
+                model = cpickle.load(f)
+
+            # Load traces if they exist
+            traces_path = model_dir.joinpath("traces.nc")
+            if traces_path.exists():
+                model.restore_traces(traces_path)
+
+            # Load VI traces if they exist
+            vi_traces_path = model_dir.joinpath("vi_traces.nc")
+            if vi_traces_path.exists():
+                model.restore_vi_traces(vi_traces_path)
+        return model
+
+    @classmethod
+    def load_model_idata(cls, path: str | Path) -> dict[str, az.InferenceData | None]:
+        """Load the traces from a model directory.
+
+        Parameters
+        ----------
+        path : str | Path
+            Path to the model directory containing traces.nc and/or vi_traces.nc files.
+
+        Returns
+        -------
+        dict[str, az.InferenceData | None]
+            A dictionary with keys "idata_mcmc" and "idata_vi" containing the traces
+            from the model directory. If the traces do not exist, the corresponding
+            value will be None.
+        """
+        idata_dict: dict[str, az.InferenceData | None] = {}
+        model_dir = Path(path)
+        # check if path exists
+        if not model_dir.exists():
+            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
+
+        # check if traces.nc exists
+        traces_path = model_dir.joinpath("traces.nc")
+        if not traces_path.exists():
+            _logger.warning(f"traces.nc file does not exist in {model_dir}.")
+            idata_dict["idata_mcmc"] = None
+        else:
+            idata_dict["idata_mcmc"] = az.from_netcdf(traces_path)
+
+        # check if vi_traces.nc exists
+        vi_traces_path = model_dir.joinpath("vi_traces.nc")
+        if not vi_traces_path.exists():
+            _logger.warning(f"vi_traces.nc file does not exist in {model_dir}.")
+            idata_dict["idata_vi"] = None
+        else:
+            idata_dict["idata_vi"] = az.from_netcdf(vi_traces_path)
+
+        return idata_dict
+
+    def __getstate__(self):
+        """Get the state of the model for pickling.
+
+        This method is called when pickling the model.
+        It returns a dictionary containing the constructor
+        arguments needed to recreate the model instance.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the constructor arguments
+            under the key 'constructor_args'.
+        """
+        state = {"constructor_args": self._init_args}
+        return state
+
+    def __setstate__(self, state):
+        """Set the state of the model when unpickling.
+
+        This method is called when unpickling the model. It creates a new instance
+        of HSSM using the constructor arguments stored in the state dictionary,
+        and copies its attributes to the current instance.
+
+        Parameters
+        ----------
+        state : dict
+            A dictionary containing the constructor arguments under the key
+            'constructor_args'.
+        """
+        new_instance = HSSM(**state["constructor_args"])
+        self.__dict__ = new_instance.__dict__
+
+    def __repr__(self) -> str:
+        """Create a representation of the model."""
+        output = [
+            "Hierarchical Sequential Sampling Model",
+            f"Model: {self.model_name}\n",
+            f"Response variable: {self.response_str}",
+            f"Likelihood: {self.loglik_kind}",
+            f"Observations: {len(self.data)}\n",
+            "Parameters:\n",
+        ]
+
+        for param in self.params.values():
+            if param.name == "p_outlier":
+                continue
+            output.append(f"{param.name}:")
+
+            component = self.model.components[param.name]
+
+            # Regression case:
+            if param.is_regression:
+                assert isinstance(component, DistributionalComponent)
+                output.append(f"    Formula: {param.formula}")
+                output.append("    Priors:")
+                intercept_term = component.intercept_term
+                if intercept_term is not None:
+                    output.append(_print_prior(intercept_term))
+                for _, common_term in component.common_terms.items():
+                    output.append(_print_prior(common_term))
+                for _, group_specific_term in component.group_specific_terms.items():
+                    output.append(_print_prior(group_specific_term))
+                output.append(f"    Link: {param.link}")
+            # None regression case
+            else:
+                if param.prior is None:
+                    prior = (
+                        component.intercept_term.prior
+                        if param.is_parent
+                        else component.prior
+                    )
+                else:
+                    prior = param.prior
+                output.append(f"    Prior: {prior}")
+            output.append(f"    Explicit bounds: {param.bounds}")
+            output.append(
+                " (ignored due to link function)"
+                if self.link_settings is not None
+                else ""
+            )
+
+        # TODO: Handle p_outlier regression correctly here.
+        if self.p_outlier is not None:
+            output.append("")
+            output.append(f"Lapse probability: {self.p_outlier.prior}")
+            output.append(f"Lapse distribution: {self.lapse}")
+
+        return "\n".join(output)
+
+    def __str__(self) -> str:
+        """Create a string representation of the model."""
+        return self.__repr__()
+
+    @property
+    def traces(self) -> az.InferenceData | pm.Approximation:
+        """Return the trace of the model after sampling.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet.
+
+        Returns
+        -------
+        az.InferenceData | pm.Approximation
+            The trace of the model after the last call to `sample()`.
+        """
+        if not self._inference_obj:
+            raise ValueError("Please sample the model first.")
+
+        return self._inference_obj
+
+    @property
+    def vi_idata(self) -> az.InferenceData:
+        """Return the variational inference approximation object.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet.
+
+        Returns
+        -------
+        az.InferenceData
+            The variational inference approximation object.
+        """
+        if not self._inference_obj_vi:
+            raise ValueError(
+                "Please run variational inference first, "
+                "no variational posterior attached."
+            )
+
+        return self._inference_obj_vi
+
+    @property
+    def vi_approx(self) -> pm.Approximation:
+        """Return the variational inference approximation object.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet.
+
+        Returns
+        -------
+        pm.Approximation
+            The variational inference approximation object.
+        """
+        if not self._vi_approx:
+            raise ValueError(
+                "Please run variational inference first, "
+                "no variational approximation attached."
+            )
+
+        return self._vi_approx
+
+    @property
+    def map(self) -> dict:
+        """Return the MAP estimates of the model parameters.
+
+        Raises
+        ------
+        ValueError
+            If the model has not been sampled yet.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the MAP estimates of the model parameters.
+        """
+        if not self._map_dict:
+            raise ValueError("Please compute map first.")
+
+        return self._map_dict
+
+    @property
+    def initvals(self) -> dict:
+        """Return the initial values of the model parameters for sampling.
+
+        Returns
+        -------
+        dict
+            A dictionary containing the initial values of the model parameters.
+            This dict serves as the default for initial values, and can be passed
+            directly to the `.sample()` function.
+        """
+        if self._initvals == {}:
+            self._initvals = self.initial_point()
+        return self._initvals
+
+    def _check_lapse(self, lapse):
+        """Determine if p_outlier and lapse is specified correctly."""
+        # Basically, avoid situations where only one of them is specified.
+        if self.has_lapse and lapse is None:
+            raise ValueError(
+                "You have specified `p_outlier`. Please also specify `lapse`."
+            )
+        if lapse is not None and not self.has_lapse:
+            _logger.warning(
+                "You have specified the `lapse` argument to include a lapse "
+                + "distribution, but `p_outlier` is set to either 0 or None. "
+                + "Your lapse distribution will be ignored."
+            )
+        if "p_outlier" in self.list_params and self.list_params[-1] != "p_outlier":
+            raise ValueError(
+                "Please do not include 'p_outlier' in `list_params`. "
+                + "We automatically append it to `list_params` when `p_outlier` "
+                + "parameter is not None"
+            )
+
     def _make_model_distribution(self) -> type[pm.Distribution]:
         """Make a pm.Distribution for the model."""
-        # == Logic for different types of likelihoods:
+        ### Logic for different types of likelihoods:
         # -`analytical` and `blackbox`:
         #     loglik should be a `pm.Distribution`` or a Python callable (any arbitrary
         #     function).
@@ -256,23 +2013,6 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
         if isclass(self.loglik) and issubclass(self.loglik, pm.Distribution):
             return self.loglik
 
-        # Type narrowing: loglik and list_params should be set by this point
-        if self.loglik is None:
-            raise ValueError(
-                "Likelihood function (loglik) has not been set. "
-                "This should have been configured during model initialization."
-            )
-        if self.list_params is None:
-            raise ValueError(
-                "list_params has not been set. "
-                "This should have been validated during model initialization."
-            )
-        if self.loglik_kind is None:
-            raise ValueError(
-                "Likelihood kind (loglik_kind) has not been set. "
-                "This should have been configured during model initialization."
-            )
-
         # params_is_trialwise_base: one entry per model param (excluding
         # p_outlier). Used for graph-level broadcasting in logp() and
         # make_distribution, where dist_params does not include extra_fields.
@@ -380,3 +2120,255 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
             fixed_vector_params=fixed_vector_params if fixed_vector_params else None,
             params_is_trialwise=params_is_trialwise_base,
         )
+
+    def _get_deterministic_var_names(self, idata) -> list[str]:
+        """Filter out the deterministic variables in var_names."""
+        var_names = [
+            f"~{param_name}"
+            for param_name, param in self.params.items()
+            if (param.is_regression)
+        ]
+
+        if f"{self._parent}_mean" in idata["posterior"].data_vars:
+            var_names.append(f"~{self._parent}_mean")
+
+        # Parent parameters (always regression implicitly)
+        # which don't have a formula attached
+        # should be dropped from var_names, since the actual
+        # parent name shows up as a regression.
+        if f"{self._parent}" in idata["posterior"].data_vars:
+            if self.params[self._parent].formula is None:
+                # Drop from var_names
+                var_names = [var for var in var_names if var != f"~{self._parent}"]
+
+        return var_names
+
+    def _drop_parent_str_from_idata(
+        self, idata: az.InferenceData | None
+    ) -> az.InferenceData:
+        """Drop the parent_str variable from an InferenceData object.
+
+        Parameters
+        ----------
+        idata
+            The InferenceData object to be modified.
+
+        Returns
+        -------
+        xr.Dataset
+            The modified InferenceData object.
+        """
+        if idata is None:
+            raise ValueError("Please provide an InferenceData object.")
+        else:
+            for group in idata.groups():
+                if ("rt,response_mean" in idata[group].data_vars) and (
+                    self._parent not in idata[group].data_vars
+                ):
+                    setattr(
+                        idata,
+                        group,
+                        idata[group].rename({"rt,response_mean": self._parent}),
+                    )
+            return idata
+
+    def _postprocess_initvals_deterministic(
+        self, initval_settings: dict = INITVAL_SETTINGS
+    ) -> None:
+        """Set initial values for subset of parameters."""
+        self._initvals = self.initial_point()
+        # Consider case where link functions are set to 'log_logit'
+        # or 'None'
+        if self.link_settings not in ["log_logit", None]:
+            _logger.info(
+                "Not preprocessing initial values, "
+                + "because none of the two standard link settings are chosen!"
+            )
+            return None
+
+        # Set initial values for particular parameters
+        for name_, starting_value in self.pymc_model.initial_point().items():
+            # strip name of `_log__` and `_interval__` suffixes
+            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
+
+            # We need to check if the parameter is actually backed by
+            # a regression.
+
+            # If not, we don't actually apply a link function to it as per default.
+            # Therefore we need to apply the initial value strategy corresponding
+            # to 'None' link function.
+
+            # If the user actively supplies a link function, the user
+            # should also have supplied an initial value insofar it matters.
+
+            if self.params[self._get_prefix(name_tmp)].is_regression:
+                param_link_setting = self.link_settings
+            else:
+                param_link_setting = None
+            if name_tmp in initval_settings[param_link_setting].keys():
+                if self._check_if_initval_user_supplied(name_tmp):
+                    _logger.info(
+                        "User supplied initial value detected for %s, \n"
+                        " skipping overwrite with default value.",
+                        name_tmp,
+                    )
+                    continue
+
+                # Apply specific settings from initval_settings dictionary
+                dtype = self._initvals[name_tmp].dtype
+                self._initvals[name_tmp] = np.array(
+                    initval_settings[param_link_setting][name_tmp]
+                ).astype(dtype)
+
+    def _get_prefix(self, name_str: str) -> str:
+        """Get parameters wise link setting function from parameter prefix."""
+        # `p_outlier` is the only basic parameter floating around that has
+        # an underscore in it's name.
+        # We need to handle it separately. (Renaming might be better...)
+        if "_" in name_str:
+            if "p_outlier" not in name_str:
+                name_str_prefix = name_str.split("_")[0]
+            else:
+                name_str_prefix = "p_outlier"
+        else:
+            name_str_prefix = name_str
+        return name_str_prefix
+
+    def _check_if_initval_user_supplied(
+        self,
+        name_str: str,
+        return_value: bool = False,
+    ) -> bool | float | int | np.ndarray | dict[str, Any] | None:
+        """Check if initial value is user-supplied."""
+        # The function assumes that the name_str is either raw parameter name
+        # or `paramname_Intercept`, because we only really provide special default
+        # initial values for those types of parameters
+
+        # `p_outlier` is the only basic parameter floating around that has
+        # an underscore in it's name.
+        # We need to handle it separately. (Renaming might be better...)
+        if "_" in name_str:
+            if "p_outlier" not in name_str:
+                name_str_prefix = name_str.split("_")[0]
+                # name_str_suffix = "".join(name_str.split("_")[1:])
+                name_str_suffix = name_str[len(name_str_prefix + "_") :]
+            else:
+                name_str_prefix = "p_outlier"
+                if name_str == "p_outlier":
+                    name_str_suffix = ""
+                else:
+                    # name_str_suffix = "".join(name_str.split("_")[2:])
+                    name_str_suffix = name_str[len("p_outlier_") :]
+        else:
+            name_str_prefix = name_str
+            name_str_suffix = ""
+
+        tmp_param = name_str_prefix
+        if tmp_param == self._parent:
+            # If the parameter was parent it is automatically treated as a
+            # regression.
+            if not name_str_suffix:
+                # No suffix --> Intercept
+                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
+                    args_tmp = getattr(prior_tmp["Intercept"], "args")
+                    if return_value:
+                        return args_tmp.get("initval", None)
+                    else:
+                        return "initval" in args_tmp
+                else:
+                    if return_value:
+                        return None
+                    return False
+            else:
+                # If the parameter has a suffix --> use it
+                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
+                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
+                    if return_value:
+                        return args_tmp.get("initval", None)
+                    else:
+                        return "initval" in args_tmp
+                else:
+                    if return_value:
+                        return None
+                    else:
+                        return False
+        else:
+            # If the parameter is not a parent, it is treated as a regression
+            # only when actively specified as such.
+            if not name_str_suffix:
+                # If no suffix --> treat as basic parameter.
+                if isinstance(self.params[tmp_param].prior, float) or isinstance(
+                    self.params[tmp_param].prior, np.ndarray
+                ):
+                    if return_value:
+                        return self.params[tmp_param].prior
+                    else:
+                        return True
+                elif isinstance(self.params[tmp_param].prior, bmb.Prior):
+                    args_tmp = getattr(self.params[tmp_param].prior, "args")
+                    if "initval" in args_tmp:
+                        if return_value:
+                            return args_tmp["initval"]
+                        else:
+                            return True
+                    else:
+                        if return_value:
+                            return None
+                        else:
+                            return False
+                else:
+                    if return_value:
+                        return None
+                    else:
+                        return False
+            else:
+                # If suffix --> treat as regression and use suffix
+                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
+                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
+                    if return_value:
+                        return args_tmp.get("initval", None)
+                    else:
+                        return "initval" in args_tmp
+                else:
+                    if return_value:
+                        return None
+                    else:
+                        return False
+
+    def _jitter_initvals(
+        self, jitter_epsilon: float = 0.01, vector_only: bool = False
+    ) -> None:
+        """Apply controlled jitter to initial values."""
+        if vector_only:
+            self.__jitter_initvals_vector_only(jitter_epsilon)
+        else:
+            self.__jitter_initvals_all(jitter_epsilon)
+
+    def __jitter_initvals_vector_only(self, jitter_epsilon: float) -> None:
+        # Note: Calling our initial point function here
+        # --> operate on untransformed variables
+        initial_point_dict = self.initvals
+        for name_, starting_value in initial_point_dict.items():
+            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
+            if starting_value.ndim != 0 and starting_value.shape[0] != 1:
+                starting_value_tmp = starting_value + np.random.uniform(
+                    -jitter_epsilon, jitter_epsilon, starting_value.shape
+                ).astype(np.float32)
+
+                # Note: self._initvals shouldn't be None when this is called
+                dtype = self._initvals[name_tmp].dtype
+                self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)
+
+    def __jitter_initvals_all(self, jitter_epsilon: float) -> None:
+        # Note: Calling our initial point function here
+        # --> operate on untransformed variables
+        initial_point_dict = self.initvals
+        # initial_point_dict = self.pymc_model.initial_point()
+        for name_, starting_value in initial_point_dict.items():
+            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
+            starting_value_tmp = starting_value + np.random.uniform(
+                -jitter_epsilon, jitter_epsilon, starting_value.shape
+            ).astype(np.float32)
+
+            dtype = self.initvals[name_tmp].dtype
+            self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)

From 8b584ff3ab7d563d0446967a0fa474bebf09addc Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 17 Feb 2026 17:50:01 -0500
Subject: [PATCH 094/104] Restore param

---
 src/hssm/param/param.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/param/param.py b/src/hssm/param/param.py
index 48062ef46..4ea8493f5 100644
--- a/src/hssm/param/param.py
+++ b/src/hssm/param/param.py
@@ -157,7 +157,7 @@ def is_trialwise(self) -> bool:
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | bmb.Prior | None = None,
+        prior: dict[str, Any] | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:

From d5eb0e6f40caec7ad3e3f3d2eef1a6f09f6d2c5d Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 17 Feb 2026 17:51:43 -0500
Subject: [PATCH 095/104] Restore params

---
 src/hssm/param/params.py | 12 ++++--------
 1 file changed, 4 insertions(+), 8 deletions(-)

diff --git a/src/hssm/param/params.py b/src/hssm/param/params.py
index f417d0025..f542c803d 100644
--- a/src/hssm/param/params.py
+++ b/src/hssm/param/params.py
@@ -213,7 +213,7 @@ def collect_user_params(
         user_param = UserParam.from_dict(param) if isinstance(param, dict) else param
         if user_param.name is None:
             raise ValueError("Parameter name must be specified.")
-        if user_param.name not in model.list_params:  # type: ignore
+        if user_param.name not in model.list_params:
             raise ValueError(
                 f"Parameter {user_param.name} not found in list_params."
                 " This implies that the parameter is not valid for the chosen model."
@@ -229,7 +229,7 @@ def collect_user_params(
     # If any of the keys is found in `list_params` it is a parameter specification.
     # We add the parameter specification to `user_params` and remove it from
     # `kwargs`
-    for param_name in model.list_params:  # type: ignore
+    for param_name in model.list_params:
         # Update user_params only if param_name is in kwargs
         # and not already in user_params
         if param_name in kwargs:
@@ -272,7 +272,7 @@ def make_params(model: HSSM, user_params: dict[str, UserParam]) -> dict[str, Par
         and model.loglik_kind != "approx_differentiable"
     )
 
-    for name in model.list_params:  # type: ignore
+    for name in model.list_params:
         if name in user_params:
             param = make_param_from_user_param(model, name, user_params[name])
         else:
@@ -359,10 +359,6 @@ def make_param_from_defaults(model: HSSM, name: str) -> Param:
             link_settings=model.link_settings,
         )
     else:
-        param = DefaultParam.from_defaults(
-            name,
-            default_prior,
-            default_bounds,  # type: ignore
-        )
+        param = DefaultParam.from_defaults(name, default_prior, default_bounds)
 
     return param

From bc90471f8c0f2d9448e44e0e6e2d50139c820621 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 17 Feb 2026 17:52:33 -0500
Subject: [PATCH 096/104] Restore regression_params

---
 src/hssm/param/regression_param.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/param/regression_param.py b/src/hssm/param/regression_param.py
index 06c1ae53c..462b37955 100644
--- a/src/hssm/param/regression_param.py
+++ b/src/hssm/param/regression_param.py
@@ -111,7 +111,7 @@ def from_defaults(
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | bmb.Prior | None = None,
+        prior: dict[str, Any] | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:

From 153a2cb18b40f8ce956366393e5330411134909b Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 17 Feb 2026 17:53:20 -0500
Subject: [PATCH 097/104] Restore simple param

---
 src/hssm/param/simple_param.py | 9 +++------
 1 file changed, 3 insertions(+), 6 deletions(-)

diff --git a/src/hssm/param/simple_param.py b/src/hssm/param/simple_param.py
index 967ce09bb..70d001047 100644
--- a/src/hssm/param/simple_param.py
+++ b/src/hssm/param/simple_param.py
@@ -111,7 +111,7 @@ def from_user_param(cls, user_param: UserParam) -> "SimpleParam":
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | bmb.Prior | None = None,
+        prior: dict[str, Any] | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:
@@ -208,10 +208,7 @@ def __init__(
 
     @classmethod
     def from_defaults(
-        cls,
-        name: str,
-        prior: float | dict[str, Any] | bmb.Prior,
-        bounds: tuple[float, float],
+        cls, name: str, prior: dict[str, Any], bounds: tuple[int, int]
     ) -> "DefaultParam":
         """Create a DefaultParam object from default values.
 
@@ -251,7 +248,7 @@ def process_prior(self) -> None:
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | bmb.Prior | None = None,
+        prior: dict[str, Any] | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:

From 22e1035c5ee7b9cf4948f5e3e0055d4cd7263de0 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Tue, 17 Feb 2026 18:14:07 -0500
Subject: [PATCH 098/104] Restore test_hsmm

---
 tests/test_hssm.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_hssm.py b/tests/test_hssm.py
index 3e3c3dc3e..8309bf013 100644
--- a/tests/test_hssm.py
+++ b/tests/test_hssm.py
@@ -96,7 +96,7 @@ def test_custom_model(data_ddm):
 
     with pytest.raises(
         ValueError,
-        match="Please provide `list_params`*",
+        match=r"^Please provide `list_params`",
     ):
         HSSM(
             data=data_ddm,

From 7d76550c7448b37cd7f1851fa896316135c9e44f Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 18 Feb 2026 14:32:11 -0500
Subject: [PATCH 099/104] Fix base for dimensionality problems

---
 src/hssm/base.py |  133 ++-
 src/hssm/hssm.py | 2016 +---------------------------------------------
 2 files changed, 102 insertions(+), 2047 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 30ea75fc8..405e4d47d 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -10,6 +10,7 @@
 import logging
 from abc import ABC, abstractmethod
 from copy import deepcopy
+from inspect import signature
 from os import PathLike
 from pathlib import Path
 from typing import Any, Callable, Literal, Optional, Union, cast, get_args
@@ -381,6 +382,7 @@ def __init__(
         self._parent = self.params.parent
         self._parent_param = self.params.parent_param
 
+        self._validate_fixed_vectors()
         self.formula, self.priors, self.link = self.params.parse_bambi(model=self)  # type: ignore[arg-type]
 
         # For parameters that have a regression backend, apply bounds at the likelihood
@@ -422,6 +424,15 @@ def __init__(
         self.set_alias(self._aliases)
         self.model.build()
 
+        # region ===== Fix scalar deterministic dims for bambi >= 0.17 =====
+        # Bambi >= 0.17 declares dims=("__obs__",) for intercept-only
+        # deterministics that actually have shape (1,). This causes an
+        # xarray CoordinateValidationError during pm.sample() when ArviZ
+        # tries to create a DataArray with mismatched dimension sizes.
+        # Fix by removing the dims declaration for these deterministics.
+        self._fix_scalar_deterministic_dims()
+        # endregion
+
         # region ===== Init vals and jitters =====
         if process_initvals:
             self._postprocess_initvals_deterministic(initval_settings=INITVAL_SETTINGS)
@@ -439,6 +450,58 @@ def __init__(
         )
         _logger.info("Model initialized successfully.")
 
+    @abstractmethod
+    def _make_model_distribution(self) -> type[pm.Distribution]:
+        """Make a pm.Distribution for the model.
+
+        This method must be implemented by subclasses to create the appropriate
+        distribution for the specific model type.
+        """
+        ...
+
+    def _fix_scalar_deterministic_dims(self) -> None:
+        """Fix dims metadata for scalar deterministics.
+
+        Bambi >= 0.17 returns shape ``(1,)`` for intercept-only
+        deterministics but still declares ``dims=("__obs__",)``. This causes
+        an xarray ``CoordinateValidationError`` during ``pm.sample()`` because
+        the ``__obs__`` coordinate has ``n_obs`` entries. Removing the dims
+        declaration for these variables lets ArviZ handle them as
+        un-dimensioned arrays, avoiding the conflict.
+        """
+        n_obs = len(self.data)
+        dims_dict = self.pymc_model.named_vars_to_dims
+        for det in self.pymc_model.deterministics:
+            if det.name not in dims_dict:
+                continue
+            dims = dims_dict[det.name]
+            if "__obs__" in dims:
+                # Check static shape: if it doesn't match n_obs, remove dims
+                try:
+                    shape_0 = det.type.shape[0]
+                except (IndexError, TypeError):
+                    continue
+                if shape_0 is not None and shape_0 != n_obs:
+                    del dims_dict[det.name]
+
+    def _validate_fixed_vectors(self) -> None:
+        """Validate that fixed-vector parameters have the correct length.
+
+        Fixed-vector parameters (``prior=np.ndarray``) bypass Bambi's formula
+        system entirely --- they are passed as a scalar ``0.0`` placeholder to
+        Bambi, and the real vector is substituted inside
+        ``HSSMDistribution.logp()`` (see ``dist.py``).  Because this
+        substitution is invisible to Bambi, we must validate the vector length
+        against ``len(self.data)`` up front to catch shape mismatches early.
+        """
+        for name, param in self.params.items():
+            if isinstance(param.prior, np.ndarray):
+                if len(param.prior) != len(self.data):
+                    raise ValueError(
+                        f"Fixed vector for parameter '{name}' has length "
+                        f"{len(param.prior)}, but data has {len(self.data)} rows."
+                    )
+
     @classmethod
     def _build_model_config(
         cls,
@@ -462,8 +525,8 @@ def _build_model_config(
 
         Returns
         -------
-        ModelConfig
-            A complete ModelConfig object with choices and other settings applied.
+        Config
+            A complete Config object with choices and other settings applied.
         """
         # Start with defaults
         config = cls.config_class.from_defaults(model, loglik_kind)
@@ -545,6 +608,14 @@ def supported_models(cls) -> tuple[SupportedModels, ...]:
         """
         return get_args(SupportedModels)
 
+    @classmethod
+    def _store_init_args(cls, *args, **kwargs):
+        """Store initialization arguments using signature binding."""
+        sig = signature(cls.__init__)
+        bound_args = sig.bind(*args, **kwargs)
+        bound_args.apply_defaults()
+        return {k: v for k, v in bound_args.arguments.items() if k != "self"}
+
     def find_MAP(self, **kwargs):
         """Perform Maximum A Posteriori estimation.
 
@@ -587,7 +658,7 @@ def sample(
             Pass initial values to the sampler. This can be a dictionary of initial
             values for parameters of the model, or a string "map" to use initialization
             at the MAP estimate. If "map" is used, the MAP estimate will be computed if
-            not already attached to the base class from prior call to 'find_MAP`.
+            not already attached to the base class from prior call to 'find_MAP'.
         include_response_params: optional
             Include parameters of the response distribution in the output. These usually
             take more space than other parameters as there's one of them per
@@ -1228,7 +1299,9 @@ def sample_prior_predictive(
         # mean prior here (which adds deterministics that
         # could be recomputed elsewhere)
         prior_predictive.add_groups(posterior=prior_predictive.prior)
-        self.model.predict(prior_predictive, kind="mean", inplace=True)
+        # Bambi >= 0.17 renamed kind="mean" to kind="response_params".
+        # Bambi >= 0.17 renamed kind="mean" to kind="response_params".
+        self.model.predict(prior_predictive, kind="response_params", inplace=True)
 
         # clean
         setattr(prior_predictive, "prior", prior_predictive["posterior"])
@@ -1565,41 +1638,40 @@ def save_model(
 
         Parameters
         ----------
-        model : HSSM
-            The HSSM model instance to save
         model_name : str | None
             Name to use for the saved model files.
             If None, will use model.model_name with timestamp
         allow_absolute_base_path : bool
-            Whether to allow absolute paths for base_path
+            Whether to allow absolute paths for base_path.
+            Defaults to False for safety.
         base_path : str | Path
             Base directory to save model files in.
-            Must be relative path if allow_absolute_base_path=False
-        save_idata_only: bool = False,
-            Whether to save the model class instance itself
+            Must be relative path if allow_absolute_base_path=False.
+            Defaults to "hssm_models".
+        save_idata_only : bool
+            If True, only saves inference data (traces), not the model pickle.
+            Defaults to False (saves both model and traces).
 
         Raises
         ------
         ValueError
             If base_path is absolute and allow_absolute_base_path=False
         """
-        # check if base_path is absolute
-        if not allow_absolute_base_path:
-            if str(base_path).startswith("/"):
-                raise ValueError(
-                    "base_path must be a relative path"
-                    " if allow_absolute_base_path is False"
-                )
+        # Convert to Path object for cross-platform compatibility
+        base_path = Path(base_path)
+
+        # Check if base_path is absolute (works on all platforms)
+        if not allow_absolute_base_path and base_path.is_absolute():
+            raise ValueError(
+                "base_path must be a relative path if allow_absolute_base_path is False"
+            )
 
         if model_name is None:
             # Get date string format as suffix to model name
-            model_name = (
-                self.model_name
-                + "_"
-                + datetime.datetime.now().strftime("%Y_%m_%d_%H_%M_%S")
-            )
+            timestamp = datetime.datetime.now().strftime("%Y_%m_%d_%H_%M_%S")
+            model_name = f"{self.model_name}_{timestamp}"
 
-        # check if folder by name model_name exists
+        # Sanitize model_name and construct full path
         model_name = model_name.replace(" ", "_")
         model_path = Path(base_path).joinpath(model_name)
         model_path.mkdir(parents=True, exist_ok=True)
@@ -1620,7 +1692,7 @@ def save_model(
     @classmethod
     def load_model(
         cls, path: Union[str, Path]
-    ) -> Union["HSSMBase", dict[str, Optional[az.InferenceData]]]:
+    ) -> Union["HSSM", dict[str, Optional[az.InferenceData]]]:
         """Load a HSSM model instance and its inference results from disk.
 
         Parameters
@@ -1631,7 +1703,7 @@ def load_model(
 
         Returns
         -------
-        HSSMBase
+        HSSM
             The loaded HSSM model instance with inference results attached if available.
         """
         # Convert path to Path object
@@ -1748,7 +1820,7 @@ def __setstate__(self, state):
             A dictionary containing the constructor arguments under the key
             'constructor_args'.
         """
-        new_instance = self.__class__(**state["constructor_args"])
+        new_instance = HSSM(**state["constructor_args"])
         self.__dict__ = new_instance.__dict__
 
     def __repr__(self) -> str:
@@ -1929,15 +2001,6 @@ def _check_lapse(self, lapse):
                 + "parameter is not None"
             )
 
-    @abstractmethod
-    def _make_model_distribution(self) -> type[pm.Distribution]:
-        """Make a pm.Distribution for the model.
-
-        This method must be implemented by subclasses to create the appropriate
-        distribution for the specific model type.
-        """
-        ...
-
     def _get_deterministic_var_names(self, idata) -> list[str]:
         """Filter out the deterministic variables in var_names."""
         var_names = [
diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 19508a342..7e86a8829 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -6,59 +6,29 @@
 This file defines the entry class HSSM.
 """
 
-import datetime
 import logging
-import typing
 from copy import deepcopy
-from inspect import isclass, signature
-from os import PathLike
-from pathlib import Path
-from typing import Any, Callable, Literal, Optional, Union, cast, get_args
+from inspect import isclass
+from typing import Literal
 
-import arviz as az
-import bambi as bmb
-import cloudpickle as cpickle
-import matplotlib as mpl
-import matplotlib.pyplot as plt
 import numpy as np
-import pandas as pd
 import pymc as pm
-import pytensor
-import seaborn as sns
-import xarray as xr
-from bambi.model_components import DistributionalComponent
-from bambi.transformations import transformations_namespace
-from pymc.model.transform.conditioning import do
-from ssms.config import model_config as ssms_model_config
 
-from hssm._types import LoglikKind, SupportedModels
-from hssm.data_validator import DataValidatorMixin
 from hssm.defaults import (
-    INITVAL_JITTER_SETTINGS,
-    INITVAL_SETTINGS,
     MissingDataNetwork,
     missing_data_networks_suffix,
 )
 from hssm.distribution_utils import (
     assemble_callables,
     make_distribution,
-    make_family,
     make_likelihood_callable,
     make_missing_data_callable,
 )
-from hssm.missing_data_mixin import MissingDataMixin
 from hssm.utils import (
-    _compute_log_likelihood,
-    _get_alias_dict,
-    _print_prior,
     _rearrange_data,
-    _split_array,
 )
 
-from . import plotting
-from .config import Config, ModelConfig
-from .param import Params
-from .param import UserParam as Param
+from .base import HSSMBase
 
 _logger = logging.getLogger("hssm")
 
@@ -98,7 +68,7 @@ def __get__(self, instance, owner):  # noqa: D105
         return self.fget(owner)
 
 
-class HSSM(DataValidatorMixin, MissingDataMixin):
+class HSSM(HSSMBase):
     """The basic Hierarchical Sequential Sampling Model (HSSM) class.
 
     Parameters
@@ -271,1732 +241,6 @@ class HSSM(DataValidatorMixin, MissingDataMixin):
         The jitter value for the initial values.
     """
 
-    def __init__(
-        self,
-        data: pd.DataFrame,
-        model: SupportedModels | str = "ddm",
-        choices: list[int] | None = None,
-        include: list[dict[str, Any] | Param] | None = None,
-        model_config: ModelConfig | dict | None = None,
-        loglik: (
-            str | PathLike | Callable | pytensor.graph.Op | type[pm.Distribution] | None
-        ) = None,
-        loglik_kind: LoglikKind | None = None,
-        p_outlier: float | dict | bmb.Prior | None = 0.05,
-        lapse: dict | bmb.Prior | None = bmb.Prior("Uniform", lower=0.0, upper=20.0),
-        global_formula: str | None = None,
-        link_settings: Literal["log_logit"] | None = None,
-        prior_settings: Literal["safe"] | None = "safe",
-        extra_namespace: dict[str, Any] | None = None,
-        missing_data: bool | float = False,
-        deadline: bool | str = False,
-        loglik_missing_data: (
-            str | PathLike | Callable | pytensor.graph.Op | None
-        ) = None,
-        process_initvals: bool = True,
-        initval_jitter: float = INITVAL_JITTER_SETTINGS["jitter_epsilon"],
-        **kwargs,
-    ):
-        # Attach arguments to the instance
-        # so that we can easily define some
-        # methods that need to access these
-        # arguments (context: pickling / save - load).
-
-        # Define a dict with all call arguments:
-        self._init_args = {
-            k: v for k, v in locals().items() if k not in ["self", "kwargs"]
-        }
-        if kwargs:
-            self._init_args.update(kwargs)
-
-        self.data = data.copy()
-        self._inference_obj: az.InferenceData | None = None
-        self._initvals: dict[str, Any] = {}
-        self.initval_jitter = initval_jitter
-        self._inference_obj_vi: pm.Approximation | None = None
-        self._vi_approx = None
-        self._map_dict = None
-        self.global_formula = global_formula
-
-        self.link_settings = link_settings
-        self.prior_settings = prior_settings
-
-        self.missing_data_value = -999.0
-
-        additional_namespace = transformations_namespace.copy()
-        if extra_namespace is not None:
-            additional_namespace.update(extra_namespace)
-        self.additional_namespace = additional_namespace
-
-        # Construct a model_config from defaults
-        self.model_config = Config.from_defaults(model, loglik_kind)
-        # Update defaults with user-provided config, if any
-        if model_config is not None:
-            if isinstance(model_config, dict):
-                if "choices" not in model_config:
-                    if choices is not None:
-                        model_config["choices"] = tuple(choices)
-                else:
-                    if choices is not None:
-                        _logger.info(
-                            "choices list provided in both model_config and "
-                            "as an argument directly."
-                            " Using the one provided in model_config. \n"
-                            "We recommend providing choices in model_config."
-                        )
-            elif isinstance(model_config, ModelConfig):
-                if model_config.choices is None:
-                    if choices is not None:
-                        model_config.choices = tuple(choices)
-                else:
-                    if choices is not None:
-                        _logger.info(
-                            "choices list provided in both model_config and "
-                            "as an argument directly."
-                            " Using the one provided in model_config. \n"
-                            "We recommend providing choices in model_config."
-                        )
-
-            self.model_config.update_config(
-                model_config
-                if isinstance(model_config, ModelConfig)
-                else ModelConfig(**model_config)  # also serves as dict validation
-            )
-        else:
-            # Model config is not provided, but at this point was constructed from
-            # defaults.
-            if model not in typing.get_args(SupportedModels):
-                # TODO: ideally use self.supported_models above but mypy doesn't like it
-                if choices is not None:
-                    self.model_config.update_choices(choices)
-                elif model in ssms_model_config:
-                    self.model_config.update_choices(
-                        ssms_model_config[model]["choices"]
-                    )
-                    _logger.info(
-                        "choices argument passed as None, "
-                        "but found %s in ssms-simulators. "
-                        "Using choices, from ssm-simulators configs: %s",
-                        model,
-                        ssms_model_config[model]["choices"],
-                    )
-            else:
-                # Model config already constructed from defaults, and model string is
-                # in SupportedModels. So we are guaranteed that choices are in
-                # self.model_config already.
-
-                if choices is not None:
-                    _logger.info(
-                        "Model string is in SupportedModels."
-                        " Ignoring choices arguments."
-                    )
-
-        # Update loglik with user-provided value
-        self.model_config.update_loglik(loglik)
-        # Ensure that all required fields are valid
-        self.model_config.validate()
-
-        # Set up shortcuts so old code will work
-        self.response = self.model_config.response
-        self.list_params = self.model_config.list_params
-        self.choices = self.model_config.choices
-        self.model_name = self.model_config.model_name
-        self.loglik = self.model_config.loglik
-        self.loglik_kind = self.model_config.loglik_kind
-        self.extra_fields = self.model_config.extra_fields
-
-        self.n_choices = len(self.choices)
-
-        self._validate_choices()
-        self._pre_check_data_sanity()
-
-        # Process missing data setting
-        # AF-TODO: Could be a function in data validator?
-        if isinstance(missing_data, float):
-            if not ((self.data.rt == missing_data).any()):
-                raise ValueError(
-                    f"missing_data argument is provided as a float {missing_data}, "
-                    f"However, you have no RTs of {missing_data} in your dataset!"
-                )
-            else:
-                self.missing_data = True
-                self.missing_data_value = missing_data
-        elif isinstance(missing_data, bool):
-            if missing_data and (not (self.data.rt == -999.0).any()):
-                raise ValueError(
-                    "missing_data argument is provided as True, "
-                    " so RTs of -999.0 are treated as missing. \n"
-                    "However, you have no RTs of -999.0 in your dataset!"
-                )
-            elif (not missing_data) and (self.data.rt == -999.0).any():
-                # self.missing_data = True
-                raise ValueError(
-                    "Missing data provided as False. \n"
-                    "However, you have RTs of -999.0 in your dataset!"
-                )
-            else:
-                self.missing_data = missing_data
-        else:
-            raise ValueError(
-                "missing_data argument must be a bool or a float! \n"
-                f"You provided: {type(missing_data)}"
-            )
-
-        if isinstance(deadline, str):
-            self.deadline = True
-            self.deadline_name = deadline
-        else:
-            self.deadline = deadline
-            self.deadline_name = "deadline"
-
-        if (
-            not self.missing_data and not self.deadline
-        ) and loglik_missing_data is not None:
-            raise ValueError(
-                "You have specified a loglik_missing_data function, but you have not "
-                + "set the missing_data or deadline flag to True."
-            )
-        self.loglik_missing_data = loglik_missing_data
-
-        # Update data based on missing_data and deadline
-        self._handle_missing_data_and_deadline()
-        # Set self.missing_data_network based on `missing_data` and `deadline`
-        self.missing_data_network = self._set_missing_data_and_deadline(
-            self.missing_data, self.deadline, self.data
-        )
-
-        if self.deadline:
-            # self.response is a tuple (from Config); use concatenation.
-            self.response.append(self.deadline_name)
-
-        # Process lapse distribution
-        self.has_lapse = p_outlier is not None and p_outlier != 0
-        self._check_lapse(lapse)
-        if self.has_lapse and self.list_params[-1] != "p_outlier":
-            self.list_params.append("p_outlier")
-
-        # Process all parameters
-        self.params = Params.from_user_specs(
-            model=self,
-            include=[] if include is None else include,
-            kwargs=kwargs,
-            p_outlier=p_outlier,
-        )
-
-        self._parent = self.params.parent
-        self._parent_param = self.params.parent_param
-
-        self._validate_fixed_vectors()
-        self.formula, self.priors, self.link = self.params.parse_bambi(model=self)
-
-        # For parameters that have a regression backend, apply bounds at the likelihood
-        # level to ensure that the samples that are out of bounds
-        # are discarded (replaced with a large negative value).
-        self.bounds = {
-            name: param.bounds
-            for name, param in self.params.items()
-            if param.is_regression and param.bounds is not None
-        }
-
-        # Set p_outlier and lapse
-        self.p_outlier = self.params.get("p_outlier")
-        self.lapse = lapse if self.has_lapse else None
-
-        self._post_check_data_sanity()
-
-        self.model_distribution = self._make_model_distribution()
-
-        self.family = make_family(
-            self.model_distribution,
-            self.list_params,
-            self.link,
-            self._parent,
-        )
-
-        self.model = bmb.Model(
-            self.formula,
-            data=self.data,
-            family=self.family,
-            priors=self.priors,  # center_predictors=False
-            extra_namespace=self.additional_namespace,
-            **kwargs,
-        )
-
-        self._aliases = _get_alias_dict(
-            self.model, self._parent_param, self.response_c, self.response_str
-        )
-        self.set_alias(self._aliases)
-        self.model.build()
-
-        # Bambi >= 0.17 declares dims=("__obs__",) for intercept-only
-        # deterministics that actually have shape (1,). This causes an
-        # xarray CoordinateValidationError during pm.sample() when ArviZ
-        # tries to create a DataArray with mismatched dimension sizes.
-        # Fix by removing the dims declaration for these deterministics.
-        self._fix_scalar_deterministic_dims()
-
-        if process_initvals:
-            self._postprocess_initvals_deterministic(initval_settings=INITVAL_SETTINGS)
-        if self.initval_jitter > 0:
-            self._jitter_initvals(
-                jitter_epsilon=self.initval_jitter,
-                vector_only=True,
-            )
-
-        # Make sure we reset rvs_to_initial_values --> Only None's
-        # Otherwise PyMC barks at us when asking to compute likelihoods
-        self.pymc_model.rvs_to_initial_values.update(
-            {key_: None for key_ in self.pymc_model.rvs_to_initial_values.keys()}
-        )
-        _logger.info("Model initialized successfully.")
-
-    def _fix_scalar_deterministic_dims(self) -> None:
-        """Fix dims metadata for scalar deterministics.
-
-        Bambi >= 0.17 returns shape ``(1,)`` for intercept-only
-        deterministics but still declares ``dims=("__obs__",)``. This causes
-        an xarray ``CoordinateValidationError`` during ``pm.sample()`` because
-        the ``__obs__`` coordinate has ``n_obs`` entries. Removing the dims
-        declaration for these variables lets ArviZ handle them as
-        un-dimensioned arrays, avoiding the conflict.
-        """
-        n_obs = len(self.data)
-        dims_dict = self.pymc_model.named_vars_to_dims
-        for det in self.pymc_model.deterministics:
-            if det.name not in dims_dict:
-                continue
-            dims = dims_dict[det.name]
-            if "__obs__" in dims:
-                # Check static shape: if it doesn't match n_obs, remove dims
-                try:
-                    shape_0 = det.type.shape[0]
-                except (IndexError, TypeError):
-                    continue
-                if shape_0 is not None and shape_0 != n_obs:
-                    del dims_dict[det.name]
-
-    def _validate_fixed_vectors(self) -> None:
-        """Validate that fixed-vector parameters have the correct length.
-
-        Fixed-vector parameters (``prior=np.ndarray``) bypass Bambi's formula
-        system entirely --- they are passed as a scalar ``0.0`` placeholder to
-        Bambi, and the real vector is substituted inside
-        ``HSSMDistribution.logp()`` (see ``dist.py``).  Because this
-        substitution is invisible to Bambi, we must validate the vector length
-        against ``len(self.data)`` up front to catch shape mismatches early.
-        """
-        for name, param in self.params.items():
-            if isinstance(param.prior, np.ndarray):
-                if len(param.prior) != len(self.data):
-                    raise ValueError(
-                        f"Fixed vector for parameter '{name}' has length "
-                        f"{len(param.prior)}, but data has {len(self.data)} rows."
-                    )
-
-    @classproperty
-    def supported_models(cls) -> tuple[SupportedModels, ...]:
-        """Get a tuple of all supported models.
-
-        Returns
-        -------
-        tuple[SupportedModels, ...]
-            A tuple containing all supported model names.
-        """
-        return get_args(SupportedModels)
-
-    @classmethod
-    def _store_init_args(cls, *args, **kwargs):
-        """Store initialization arguments using signature binding."""
-        sig = signature(cls.__init__)
-        bound_args = sig.bind(*args, **kwargs)
-        bound_args.apply_defaults()
-        return {k: v for k, v in bound_args.arguments.items() if k != "self"}
-
-    def find_MAP(self, **kwargs):
-        """Perform Maximum A Posteriori estimation.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the MAP estimates of the model parameters.
-        """
-        self._map_dict = pm.find_MAP(model=self.pymc_model, **kwargs)
-        return self._map_dict
-
-    def sample(
-        self,
-        sampler: Literal["pymc", "numpyro", "blackjax", "nutpie", "laplace"]
-        | None = None,
-        init: str | None = None,
-        initvals: str | dict | None = None,
-        include_response_params: bool = False,
-        **kwargs,
-    ) -> az.InferenceData | pm.Approximation:
-        """Perform sampling using the `fit` method via bambi.Model.
-
-        Parameters
-        ----------
-        sampler: optional
-            The sampler to use. Can be one of "pymc", "numpyro",
-            "blackjax", "nutpie", or "laplace". If using `blackbox` likelihoods,
-            this cannot be "numpyro", "blackjax", or "nutpie". By default it is None,
-            and sampler will automatically be chosen: when the model uses the
-            `approx_differentiable` likelihood, and `jax` backend, "numpyro" will
-            be used. Otherwise, "pymc" (the default PyMC NUTS sampler) will be used.
-
-            Note that the old sampler names such as "mcmc", "nuts_numpyro",
-            "nuts_blackjax" will be deprecated and removed in future releases. A warning
-            will be raised if any of these old names are used.
-        init: optional
-            Initialization method to use for the sampler. If any of the NUTS samplers
-            is used, defaults to `"adapt_diag"`. Otherwise, defaults to `"auto"`.
-        initvals: optional
-            Pass initial values to the sampler. This can be a dictionary of initial
-            values for parameters of the model, or a string "map" to use initialization
-            at the MAP estimate. If "map" is used, the MAP estimate will be computed if
-            not already attached to the base class from prior call to 'find_MAP'.
-        include_response_params: optional
-            Include parameters of the response distribution in the output. These usually
-            take more space than other parameters as there's one of them per
-            observation. Defaults to False.
-        kwargs
-            Other arguments passed to bmb.Model.fit(). Please see [here]
-            (https://bambinos.github.io/bambi/api_reference.html#bambi.models.Model.fit)
-            for full documentation.
-
-        Returns
-        -------
-        az.InferenceData | pm.Approximation
-            A reference to the `model.traces` object, which stores the traces of the
-            last call to `model.sample()`. `model.traces` is an ArviZ `InferenceData`
-            instance if `sampler` is `"pymc"` (default), `"numpyro"`,
-            `"blackjax"` or "`laplace".
-        """
-        # If initvals are None (default)
-        # we skip processing initvals here.
-        if sampler in _new_sampler_mapping:
-            _logger.warning(
-                f"Sampler '{sampler}' is deprecated. "
-                "Please use the new sampler names: "
-                "'pymc', 'numpyro', 'blackjax', 'nutpie', or 'laplace'."
-            )
-            sampler = _new_sampler_mapping[sampler]  # type: ignore
-
-        if sampler == "vi":
-            raise ValueError(
-                "VI is not supported via the sample() method. "
-                "Please use the vi() method instead."
-            )
-
-        if initvals is not None:
-            if isinstance(initvals, dict):
-                kwargs["initvals"] = initvals
-            else:
-                if isinstance(initvals, str):
-                    if initvals == "map":
-                        if self._map_dict is None:
-                            _logger.info(
-                                "initvals='map' but no map"
-                                "estimate precomputed. \n"
-                                "Running map estimation first..."
-                            )
-                            self.find_MAP()
-                            kwargs["initvals"] = self._map_dict
-                        else:
-                            kwargs["initvals"] = self._map_dict
-                else:
-                    raise ValueError(
-                        "initvals argument must be a dictionary or 'map'"
-                        " to use the MAP estimate."
-                    )
-        else:
-            kwargs["initvals"] = self._initvals
-            _logger.info("Using default initvals. \n")
-
-        if sampler is None:
-            if (
-                self.loglik_kind == "approx_differentiable"
-                and self.model_config.backend == "jax"
-            ):
-                sampler = "numpyro"
-            else:
-                sampler = "pymc"
-
-        if self.loglik_kind == "blackbox":
-            if sampler in ["blackjax", "numpyro", "nutpie"]:
-                raise ValueError(
-                    f"{sampler} sampler does not work with blackbox likelihoods."
-                )
-
-            if "step" not in kwargs:
-                kwargs |= {"step": pm.Slice(model=self.pymc_model)}
-
-        if (
-            self.loglik_kind == "approx_differentiable"
-            and self.model_config.backend == "jax"
-            and sampler == "pymc"
-            and kwargs.get("cores", None) != 1
-        ):
-            _logger.warning(
-                "Parallel sampling might not work with `jax` backend and the PyMC NUTS "
-                + "sampler on some platforms. Please consider using `numpyro`, "
-                + "`blackjax`, or `nutpie` sampler if that is a problem."
-            )
-
-        if self._check_extra_fields():
-            self._update_extra_fields()
-
-        if init is None:
-            if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]:
-                init = "adapt_diag"
-            else:
-                init = "auto"
-
-        # If sampler is finally `numpyro` make sure
-        # the jitter argument is set to False
-        if sampler == "numpyro":
-            if "nuts_sampler_kwargs" in kwargs:
-                if kwargs["nuts_sampler_kwargs"].get("jitter"):
-                    _logger.warning(
-                        "The jitter argument is set to True. "
-                        + "This argument is not supported "
-                        + "by the numpyro backend. "
-                        + "The jitter argument will be set to False."
-                    )
-                kwargs["nuts_sampler_kwargs"]["jitter"] = False
-            else:
-                kwargs["nuts_sampler_kwargs"] = {"jitter": False}
-
-        if sampler != "pymc" and "step" in kwargs:
-            raise ValueError(
-                "`step` samplers (enabled by the `step` argument) are only supported "
-                "by the `pymc` sampler."
-            )
-
-        if self._inference_obj is not None:
-            _logger.warning(
-                "The model has already been sampled. Overwriting the previous "
-                + "inference object. Any previous reference to the inference object "
-                + "will still point to the old object."
-            )
-
-        # Define whether likelihood should be computed
-        compute_likelihood = True
-        if "idata_kwargs" in kwargs:
-            if "log_likelihood" in kwargs["idata_kwargs"]:
-                compute_likelihood = kwargs["idata_kwargs"].pop("log_likelihood", True)
-
-        omit_offsets = kwargs.pop("omit_offsets", False)
-        self._inference_obj = self.model.fit(
-            inference_method=(
-                "pymc"
-                if sampler in ["pymc", "numpyro", "blackjax", "nutpie"]
-                else sampler
-            ),
-            init=init,
-            include_response_params=include_response_params,
-            omit_offsets=omit_offsets,
-            **kwargs,
-        )
-
-        # Separate out log likelihood computation
-        if compute_likelihood:
-            self.log_likelihood(self._inference_obj, inplace=True)
-
-        # Subset data vars in posterior
-        self._clean_posterior_group(idata=self._inference_obj)
-        return self.traces
-
-    def vi(
-        self,
-        method: str = "advi",
-        niter: int = 10000,
-        draws: int = 1000,
-        return_idata: bool = True,
-        ignore_mcmc_start_point_defaults=False,
-        **vi_kwargs,
-    ) -> pm.Approximation | az.InferenceData:
-        """Perform Variational Inference.
-
-        Parameters
-        ----------
-        niter : int
-            The number of iterations to run the VI algorithm. Defaults to 3000.
-        method : str
-            The method to use for VI. Can be one of "advi" or "fullrank_advi", "svgd",
-            "asvgd".Defaults to "advi".
-        draws : int
-            The number of samples to draw from the posterior distribution.
-            Defaults to 1000.
-        return_idata : bool
-            If True, returns an InferenceData object. Otherwise, returns the
-            approximation object directly. Defaults to True.
-
-        Returns
-        -------
-            pm.Approximation or az.InferenceData: The mean field approximation object.
-        """
-        if self.loglik_kind == "analytical":
-            _logger.warning(
-                "VI is not recommended for the analytical likelihood,"
-                " since gradients can be brittle."
-            )
-        elif self.loglik_kind == "blackbox":
-            raise ValueError(
-                "VI is not supported for blackbox likelihoods, "
-                " since likelihood gradients are needed!"
-            )
-
-        if ("start" not in vi_kwargs) and not ignore_mcmc_start_point_defaults:
-            _logger.info("Using MCMC starting point defaults.")
-            vi_kwargs["start"] = self._initvals
-
-        # Run variational inference directly from pymc model
-        with self.pymc_model:
-            self._vi_approx = pm.fit(n=niter, method=method, **vi_kwargs)
-
-        # Sample from the approximate posterior
-        if self._vi_approx is not None:
-            self._inference_obj_vi = self._vi_approx.sample(draws)
-
-        # Post-processing
-        self._clean_posterior_group(idata=self._inference_obj_vi)
-
-        # Return the InferenceData object if return_idata is True
-        if return_idata:
-            return self._inference_obj_vi
-        # Otherwise return the appromation object directly
-        return self.vi_approx
-
-    def _clean_posterior_group(self, idata: az.InferenceData | None = None):
-        """Clean up the posterior group of the InferenceData object.
-
-        Parameters
-        ----------
-        idata : az.InferenceData
-            The InferenceData object to clean up. If None, the last InferenceData object
-            will be used.
-        """
-        # # Logic behind which variables to keep:
-        # # We essentially want to get rid of
-        # # all the trial-wise variables.
-
-        # # We drop all distributional components, IF they are deterministics
-        # # (in which case they will be trial wise systematically)
-        # # and we keep distributional components, IF they are
-        # # basic random-variabels (in which case they should never
-        # # appear trial-wise).
-        if idata is None:
-            raise ValueError(
-                "The InferenceData object is None. Cannot clean up the posterior group."
-            )
-        elif not hasattr(idata, "posterior"):
-            raise ValueError(
-                "The InferenceData object does not have a posterior group. "
-                + "Cannot clean up the posterior group."
-            )
-
-        vars_to_keep = set(idata["posterior"].data_vars.keys()).difference(
-            set(
-                key_
-                for key_ in self.model.distributional_components.keys()
-                if key_ in [var_.name for var_ in self.pymc_model.deterministics]
-            )
-        )
-        vars_to_keep_clean = [
-            var_
-            for var_ in vars_to_keep
-            if isinstance(var_, str) and "_mean" not in var_
-        ]
-
-        setattr(
-            idata,
-            "posterior",
-            idata["posterior"][vars_to_keep_clean],
-        )
-
-    def log_likelihood(
-        self,
-        idata: az.InferenceData | None = None,
-        data: pd.DataFrame | None = None,
-        inplace: bool = True,
-        keep_likelihood_params: bool = False,
-    ) -> az.InferenceData | None:
-        """Compute the log likelihood of the model.
-
-        Parameters
-        ----------
-        idata : optional
-            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
-        data : optional
-            A pandas DataFrame with values for the predictors that are used to obtain
-            out-of-sample predictions. If omitted, the original dataset is used.
-        inplace : optional
-            If `True` will modify idata in-place and append a `log_likelihood` group to
-            `idata`. Otherwise, it will return a copy of idata with the predictions
-            added, by default True.
-        keep_likelihood_params : optional
-            If `True`, the trial wise likelihood parameters that are computed
-            on route to getting the log likelihood are kept in the `idata` object.
-            Defaults to False. See also the method `add_likelihood_parameters_to_idata`.
-
-        Returns
-        -------
-        az.InferenceData | None
-            InferenceData or None
-        """
-        if self._inference_obj is None and idata is None:
-            raise ValueError(
-                "Neither has the model been sampled yet nor"
-                + " an idata object has been provided."
-            )
-
-        if idata is None:
-            if self._inference_obj is None:
-                raise ValueError(
-                    "The model has not been sampled yet. "
-                    + "Please provide an idata object."
-                )
-            else:
-                idata = self._inference_obj
-
-        # Actual likelihood computation
-        idata = _compute_log_likelihood(self.model, idata, data, inplace)
-
-        # clean up posterior:
-        if not keep_likelihood_params:
-            self._clean_posterior_group(idata=idata)
-
-        if inplace:
-            return None
-        else:
-            return idata
-
-    def add_likelihood_parameters_to_idata(
-        self,
-        idata: az.InferenceData | None = None,
-        inplace: bool = False,
-    ) -> az.InferenceData | None:
-        """Add likelihood parameters to the InferenceData object.
-
-        Parameters
-        ----------
-        idata : az.InferenceData
-            The InferenceData object returned by HSSM.sample().
-        inplace : bool
-            If True, the likelihood parameters are added to idata in-place. Otherwise,
-            a copy of idata with the likelihood parameters added is returned.
-            Defaults to False.
-
-        Returns
-        -------
-        az.InferenceData | None
-            InferenceData or None
-        """
-        if idata is None:
-            if self._inference_obj is None:
-                raise ValueError("No idata provided and model not yet sampled!")
-            else:
-                idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
-                    deepcopy(self._inference_obj)
-                    if not inplace
-                    else self._inference_obj
-                )
-        else:
-            idata = self.model._compute_likelihood_params(  # pylint: disable=protected-access
-                deepcopy(idata) if not inplace else idata
-            )
-        return idata
-
-    def sample_posterior_predictive(
-        self,
-        idata: az.InferenceData | None = None,
-        data: pd.DataFrame | None = None,
-        inplace: bool = True,
-        include_group_specific: bool = True,
-        kind: Literal["response", "response_params"] = "response",
-        draws: int | float | list[int] | np.ndarray | None = None,
-        safe_mode: bool = True,
-    ) -> az.InferenceData | None:
-        """Perform posterior predictive sampling from the HSSM model.
-
-        Parameters
-        ----------
-        idata : optional
-            The `InferenceData` object returned by `HSSM.sample()`. If not provided,
-            the `InferenceData` from the last time `sample()` is called will be used.
-        data : optional
-            An optional data frame with values for the predictors that are used to
-            obtain out-of-sample predictions. If omitted, the original dataset is used.
-        inplace : optional
-            If `True` will modify idata in-place and append a `posterior_predictive`
-            group to `idata`. Otherwise, it will return a copy of idata with the
-            predictions added, by default True.
-        include_group_specific : optional
-            If `True` will make predictions including the group specific effects.
-            Otherwise, predictions are made with common effects only (i.e. group-
-            specific are set to zero), by default True.
-        kind: optional
-            Indicates the type of prediction required. Can be `"response_params"` or
-            `"response"`. The first returns draws from the posterior distribution of the
-            likelihood parameters, while the latter returns the draws from the posterior
-            predictive distribution (i.e. the posterior probability distribution for a
-            new observation) in addition to the posterior distribution. Defaults to
-            "response_params".
-        draws: optional
-            The number of samples to draw from the posterior predictive distribution
-            from each chain.
-            When it's an integer >= 1, the number of samples to be extracted from the
-            `draw` dimension. If this integer is larger than the number of posterior
-            samples in each chain, all posterior samples will be used
-            in posterior predictive sampling. When a float between 0 and 1, the
-            proportion of samples from the draw dimension from each chain to be used in
-            posterior predictive sampling.. If this proportion is very
-            small, at least one sample will be used. When None, all posterior samples
-            will be used. Defaults to None.
-        safe_mode: bool
-            If True, the function will split the draws into chunks of 10 to avoid memory
-            issues. Defaults to True.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet and idata is not provided.
-
-        Returns
-        -------
-        az.InferenceData | None
-            InferenceData or None
-        """
-        if idata is None:
-            if self._inference_obj is None:
-                raise ValueError(
-                    "The model has not been sampled yet. "
-                    + "Please either provide an idata object or sample the model first."
-                )
-            idata = self._inference_obj
-            _logger.info(
-                "idata=None, we use the traces assigned to the HSSM object as idata."
-            )
-
-        if idata is not None:
-            if "posterior_predictive" in idata.groups():
-                del idata["posterior_predictive"]
-                _logger.warning(
-                    "pre-existing posterior_predictive group deleted from idata. \n"
-                )
-
-        if self._check_extra_fields(data):
-            self._update_extra_fields(data)
-
-        if isinstance(draws, np.ndarray):
-            draws = draws.astype(int)
-        elif isinstance(draws, list):
-            draws = np.array(draws).astype(int)
-        elif isinstance(draws, int | float):
-            draws = np.arange(int(draws))
-        elif draws is None:
-            draws = idata["posterior"].draw.values
-        else:
-            raise ValueError(
-                "draws must be an integer, " + "a list of integers, or a numpy array."
-            )
-
-        assert isinstance(draws, np.ndarray)
-
-        # Make a copy of idata, set the `posterior` group to be a random sub-sample
-        # of the original (draw dimension gets sub-sampled)
-
-        idata_copy = idata.copy()
-
-        if (draws.shape != idata["posterior"].draw.values.shape) or (
-            (draws.shape == idata["posterior"].draw.values.shape)
-            and not np.allclose(draws, idata["posterior"].draw.values)
-        ):
-            # Reassign posterior to sub-sampled version
-            setattr(idata_copy, "posterior", idata["posterior"].isel(draw=draws))
-
-        if kind == "response":
-            # If we run kind == 'response' we actually run the observation RV
-            if safe_mode:
-                # safe mode splits the draws into chunks of 10 to avoid
-                # memory issues (TODO: Figure out the source of memory issues)
-                split_draws = _split_array(
-                    idata_copy["posterior"].draw.values, divisor=10
-                )
-
-                posterior_predictive_list = []
-                for samples_tmp in split_draws:
-                    tmp_posterior = idata["posterior"].sel(draw=samples_tmp)
-                    setattr(idata_copy, "posterior", tmp_posterior)
-                    self.model.predict(
-                        idata_copy, kind, data, True, include_group_specific
-                    )
-                    posterior_predictive_list.append(idata_copy["posterior_predictive"])
-
-                if inplace:
-                    idata.add_groups(
-                        posterior_predictive=xr.concat(
-                            posterior_predictive_list, dim="draw"
-                        )
-                    )
-                    # for inplace, we don't return anything
-                    return None
-                else:
-                    # Reassign original posterior to idata_copy
-                    setattr(idata_copy, "posterior", idata["posterior"])
-                    # Add new posterior predictive group to idata_copy
-                    del idata_copy["posterior_predictive"]
-                    idata_copy.add_groups(
-                        posterior_predictive=xr.concat(
-                            posterior_predictive_list, dim="draw"
-                        )
-                    )
-                    return idata_copy
-            else:
-                if inplace:
-                    # If not safe-mode
-                    # We call .predict() directly without any
-                    # chunking of data.
-
-                    # .predict() is called on the copy of idata
-                    # since we still subsampled (or assigned) the draws
-                    self.model.predict(
-                        idata_copy, kind, data, True, include_group_specific
-                    )
-
-                    # posterior predictive group added to idata
-                    idata.add_groups(
-                        posterior_predictive=idata_copy["posterior_predictive"]
-                    )
-                    # don't return anything if inplace
-                    return None
-                else:
-                    # Not safe mode and not inplace
-                    # Function acts as very thin wrapper around
-                    # .predict(). It just operates on the
-                    # idata_copy object
-                    return self.model.predict(
-                        idata_copy, kind, data, False, include_group_specific
-                    )
-        elif kind == "response_params":
-            # If kind == 'response_params', we don't need to run the RV directly,
-            # there shouldn't really be any significant memory issues here,
-            # we can simply ignore settings, since the computational overhead
-            # should be very small --> nudges user towards good outputs.
-            _logger.warning(
-                "The kind argument is set to 'mean', but 'draws' argument "
-                + "is not None: The draws argument will be ignored!"
-            )
-            return self.model.predict(
-                idata, kind, data, inplace, include_group_specific
-            )
-        else:
-            raise ValueError("`kind` must be either 'response' or 'response_params'.")
-
-    def plot_predictive(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
-        """Produce a posterior predictive plot.
-
-        Equivalent to calling `hssm.plotting.plot_predictive()` with the
-        model. Please see that function for
-        [full documentation][hssm.plotting.plot_predictive].
-
-        Returns
-        -------
-        mpl.axes.Axes | sns.FacetGrid
-            The matplotlib axis or seaborn FacetGrid object containing the plot.
-        """
-        return plotting.plot_predictive(self, **kwargs)
-
-    def plot_quantile_probability(self, **kwargs) -> mpl.axes.Axes | sns.FacetGrid:
-        """Produce a quantile probability plot.
-
-        Equivalent to calling `hssm.plotting.plot_quantile_probability()` with the
-        model. Please see that function for
-        [full documentation][hssm.plotting.plot_quantile_probability].
-
-        Returns
-        -------
-        mpl.axes.Axes | sns.FacetGrid
-            The matplotlib axis or seaborn FacetGrid object containing the plot.
-        """
-        return plotting.plot_quantile_probability(self, **kwargs)
-
-    def predict(self, **kwargs) -> az.InferenceData:
-        """Generate samples from the predictive distribution."""
-        return self.model.predict(**kwargs)
-
-    def sample_do(
-        self, params: dict[str, Any], draws: int = 100, return_model=False, **kwargs
-    ) -> az.InferenceData | tuple[az.InferenceData, pm.Model]:
-        """Generate samples from the predictive distribution using the `do-operator`."""
-        do_model = do(self.pymc_model, params)
-        do_idata = pm.sample_prior_predictive(model=do_model, draws=draws, **kwargs)
-
-        # clean up `rt,response_mean` to `v`
-        do_idata = self._drop_parent_str_from_idata(idata=do_idata)
-
-        # rename otherwise inconsistent dims and coords
-        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].dims:
-            setattr(
-                do_idata,
-                "prior_predictive",
-                do_idata["prior_predictive"].rename_dims(
-                    {"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-        if "rt,response_extra_dim_0" in do_idata["prior_predictive"].coords:
-            setattr(
-                do_idata,
-                "prior_predictive",
-                do_idata["prior_predictive"].rename_vars(
-                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-
-        if return_model:
-            return do_idata, do_model
-        return do_idata
-
-    def sample_prior_predictive(
-        self,
-        draws: int = 500,
-        var_names: str | list[str] | None = None,
-        omit_offsets: bool = True,
-        random_seed: np.random.Generator | None = None,
-    ) -> az.InferenceData:
-        """Generate samples from the prior predictive distribution.
-
-        Parameters
-        ----------
-        draws
-            Number of draws to sample from the prior predictive distribution. Defaults
-            to 500.
-        var_names
-            A list of names of variables for which to compute the prior predictive
-            distribution. Defaults to ``None`` which means both observed and unobserved
-            RVs.
-        omit_offsets
-            Whether to omit offset terms. Defaults to ``True``.
-        random_seed
-            Seed for the random number generator.
-
-        Returns
-        -------
-        az.InferenceData
-            ``InferenceData`` object with the groups ``prior``, ``prior_predictive`` and
-            ``observed_data``.
-        """
-        prior_predictive = self.model.prior_predictive(
-            draws, var_names, omit_offsets, random_seed
-        )
-
-        # AF-COMMENT: Not sure if necessary to include the
-        # mean prior here (which adds deterministics that
-        # could be recomputed elsewhere)
-        prior_predictive.add_groups(posterior=prior_predictive.prior)
-        # Bambi >= 0.17 renamed kind="mean" to kind="response_params".
-        self.model.predict(prior_predictive, kind="response_params", inplace=True)
-
-        # clean
-        setattr(prior_predictive, "prior", prior_predictive["posterior"])
-        del prior_predictive["posterior"]
-
-        if self._inference_obj is None:
-            self._inference_obj = prior_predictive
-        else:
-            self._inference_obj.extend(prior_predictive)
-
-        # clean up `rt,response_mean` to `v`
-        idata = self._drop_parent_str_from_idata(idata=self._inference_obj)
-
-        # rename otherwise inconsistent dims and coords
-        if "rt,response_extra_dim_0" in idata["prior_predictive"].dims:
-            setattr(
-                idata,
-                "prior_predictive",
-                idata["prior_predictive"].rename_dims(
-                    {"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-        if "rt,response_extra_dim_0" in idata["prior_predictive"].coords:
-            setattr(
-                idata,
-                "prior_predictive",
-                idata["prior_predictive"].rename_vars(
-                    name_dict={"rt,response_extra_dim_0": "rt,response_dim"}
-                ),
-            )
-
-        # Update self._inference_obj to match the cleaned idata
-        self._inference_obj = idata
-        return deepcopy(self._inference_obj)
-
-    @property
-    def pymc_model(self) -> pm.Model:
-        """Provide access to the PyMC model.
-
-        Returns
-        -------
-        pm.Model
-            The PyMC model built by bambi
-        """
-        return self.model.backend.model
-
-    def set_alias(self, aliases: dict[str, str | dict]):
-        """Set parameter aliases.
-
-        Sets the aliases according to the dictionary passed to it and rebuild the
-        model.
-
-        Parameters
-        ----------
-        aliases
-            A dict specifying the parameter names being aliased and the aliases.
-        """
-        self.model.set_alias(aliases)
-        self.model.build()
-
-    @property
-    def response_c(self) -> str:
-        """Return the response variable names in c() format."""
-        if self.response is None:
-            return "c()"
-        return f"c({', '.join(self.response)})"
-
-    @property
-    def response_str(self) -> str:
-        """Return the response variable names in string format."""
-        if self.response is None:
-            return ""
-        return ",".join(self.response)
-
-    # NOTE: can't annotate return type because the graphviz dependency is optional
-    def graph(self, formatting="plain", name=None, figsize=None, dpi=300, fmt="png"):
-        """Produce a graphviz Digraph from a built HSSM model.
-
-        Requires graphviz, which may be installed most easily with `conda install -c
-        conda-forge python-graphviz`. Alternatively, you may install the `graphviz`
-        binaries yourself, and then `pip install graphviz` to get the python bindings.
-        See http://graphviz.readthedocs.io/en/stable/manual.html for more information.
-
-        Parameters
-        ----------
-        formatting
-            One of `"plain"` or `"plain_with_params"`. Defaults to `"plain"`.
-        name
-            Name of the figure to save. Defaults to `None`, no figure is saved.
-        figsize
-            Maximum width and height of figure in inches. Defaults to `None`, the
-            figure size is set automatically. If defined and the drawing is larger than
-            the given size, the drawing is uniformly scaled down so that it fits within
-            the given size.  Only works if `name` is not `None`.
-        dpi
-            Point per inch of the figure to save.
-            Defaults to 300. Only works if `name` is not `None`.
-        fmt
-            Format of the figure to save.
-            Defaults to `"png"`. Only works if `name` is not `None`.
-
-        Returns
-        -------
-        graphviz.Graph
-            The graph
-        """
-        graph = self.model.graph(formatting, name, figsize, dpi, fmt)
-
-        parent_param = self._parent_param
-        if parent_param.is_regression:
-            return graph
-
-        # Modify the graph
-        # 1. Remove all nodes and edges related to `{parent}_mean`:
-        graph.body = [
-            item for item in graph.body if f"{parent_param.name}_mean" not in item
-        ]
-        # 2. Add a new edge from parent to response
-        graph.edge(parent_param.name, self.response_str)
-
-        return graph
-
-    def compile_logp(self, keep_transformed: bool = False, **kwargs):
-        """Compile the log probability function for the model.
-
-        Parameters
-        ----------
-        keep_transformed : bool, optional
-            If True, keeps the transformed variables in the compiled function.
-            If False, removes value transforms before compilation.
-            Defaults to False.
-        **kwargs
-            Additional keyword arguments passed to PyMC's compile_logp:
-            - vars: List of variables. Defaults to None (all variables).
-            - jacobian: Whether to include log(|det(dP/dQ)|) term for
-            transformed variables. Defaults to True.
-            - sum: Whether to sum all terms instead of returning a vector.
-            Defaults to True.
-
-        Returns
-        -------
-        callable
-            A compiled function that computes the model log probability.
-        """
-        if keep_transformed:
-            return self.pymc_model.compile_logp(
-                vars=kwargs.get("vars", None),
-                jacobian=kwargs.get("jacobian", True),
-                sum=kwargs.get("sum", True),
-            )
-        else:
-            new_model = pm.model.transform.conditioning.remove_value_transforms(
-                self.pymc_model
-            )
-            return new_model.compile_logp(
-                vars=kwargs.get("vars", None),
-                jacobian=kwargs.get("jacobian", True),
-                sum=kwargs.get("sum", True),
-            )
-
-    def plot_trace(
-        self,
-        data: az.InferenceData | None = None,
-        include_deterministic: bool = False,
-        tight_layout: bool = True,
-        **kwargs,
-    ) -> None:
-        """Generate trace plot with ArviZ but with additional convenience features.
-
-        This is a simple wrapper for the az.plot_trace() function. By default, it
-        filters out the deterministic values from the plot. Please see the
-        [arviz documentation]
-        (https://arviz-devs.github.io/arviz/api/generated/arviz.plot_trace.html)
-        for additional parameters that can be specified.
-
-        Parameters
-        ----------
-        data : optional
-            An ArviZ InferenceData object. If None, the traces stored in the model will
-            be used.
-        include_deterministic : optional
-            Whether to include deterministic variables in the plot. Defaults to False.
-            Note that if include deterministic is set to False and and `var_names` is
-            provided, the `var_names` provided will be modified to also exclude the
-            deterministic values. If this is not desirable, set
-            `include deterministic` to True.
-        tight_layout : optional
-            Whether to call plt.tight_layout() after plotting. Defaults to True.
-        """
-        data = data or self.traces
-        if not isinstance(data, az.InferenceData):
-            raise TypeError("data must be an InferenceData object.")
-
-        if not include_deterministic:
-            var_names = list(
-                set([var.name for var in self.pymc_model.free_RVs]).intersection(
-                    set(list(data["posterior"].data_vars.keys()))
-                )
-            )
-            # var_names = self._get_deterministic_var_names(data)
-            if var_names:
-                if "var_names" in kwargs:
-                    if isinstance(kwargs["var_names"], str):
-                        if kwargs["var_names"] not in var_names:
-                            var_names.append(kwargs["var_names"])
-                        kwargs["var_names"] = var_names
-                    elif isinstance(kwargs["var_names"], list):
-                        kwargs["var_names"] = list(
-                            set(var_names) | set(kwargs["var_names"])
-                        )
-                    elif kwargs["var_names"] is None:
-                        kwargs["var_names"] = var_names
-                    else:
-                        raise ValueError(
-                            "`var_names` must be a string, a list of strings, or None."
-                        )
-                else:
-                    kwargs["var_names"] = var_names
-        az.plot_trace(data, **kwargs)
-
-        if tight_layout:
-            plt.tight_layout()
-
-    def summary(
-        self,
-        data: az.InferenceData | None = None,
-        include_deterministic: bool = False,
-        **kwargs,
-    ) -> pd.DataFrame | xr.Dataset:
-        """Produce a summary table with ArviZ but with additional convenience features.
-
-        This is a simple wrapper for the az.summary() function. By default, it
-        filters out the deterministic values from the plot. Please see the
-        [arviz documentation]
-        (https://arviz-devs.github.io/arviz/api/generated/arviz.summary.html)
-        for additional parameters that can be specified.
-
-        Parameters
-        ----------
-        data
-            An ArviZ InferenceData object. If None, the traces stored in the model will
-            be used.
-        include_deterministic : optional
-            Whether to include deterministic variables in the plot. Defaults to False.
-            Note that if include_deterministic is set to False and and `var_names` is
-            provided, the `var_names` provided will be modified to also exclude the
-            deterministic values. If this is not desirable, set
-            `include_deterministic` to True.
-
-        Returns
-        -------
-        pd.DataFrame | xr.Dataset
-            A pandas DataFrame or xarray Dataset containing the summary statistics.
-        """
-        data = data or self.traces
-        if not isinstance(data, az.InferenceData):
-            raise TypeError("data must be an InferenceData object.")
-
-        if not include_deterministic:
-            var_names = list(
-                set([var.name for var in self.pymc_model.free_RVs]).intersection(
-                    set(list(data["posterior"].data_vars.keys()))
-                )
-            )
-            # var_names = self._get_deterministic_var_names(data)
-            if var_names:
-                kwargs["var_names"] = list(set(var_names + kwargs.get("var_names", [])))
-        return az.summary(data, **kwargs)
-
-    def initial_point(self, transformed: bool = False) -> dict[str, np.ndarray]:
-        """Compute the initial point of the model.
-
-        This is a slightly altered version of pm.initial_point.initial_point().
-
-        Parameters
-        ----------
-        transformed : bool, optional
-            If True, return the initial point in transformed space.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the initial point of the model parameters.
-        """
-        fn = pm.initial_point.make_initial_point_fn(
-            model=self.pymc_model, return_transformed=transformed
-        )
-        return pm.model.Point(fn(None), model=self.pymc_model)
-
-    def restore_traces(
-        self, traces: az.InferenceData | pm.Approximation | str | PathLike
-    ) -> None:
-        """Restore traces from an InferenceData object or a .netcdf file.
-
-        Parameters
-        ----------
-        traces
-            An InferenceData object or a path to a file containing the traces.
-        """
-        if isinstance(traces, pm.Approximation):
-            self._inference_obj_vi = traces
-            return
-
-        if isinstance(traces, (str, PathLike)):
-            traces = az.from_netcdf(traces)
-        self._inference_obj = cast("az.InferenceData", traces)
-
-    def restore_vi_traces(
-        self, traces: az.InferenceData | pm.Approximation | str | PathLike
-    ) -> None:
-        """Restore VI traces from an InferenceData object or a .netcdf file.
-
-        Parameters
-        ----------
-        traces
-            An InferenceData object or a path to a file containing the VI traces.
-        """
-        if isinstance(traces, pm.Approximation):
-            self._inference_obj_vi = traces
-            return
-
-        if isinstance(traces, (str, PathLike)):
-            traces = az.from_netcdf(traces)
-        self._inference_obj_vi = cast("az.InferenceData", traces)
-
-    def save_model(
-        self,
-        model_name: str | None = None,
-        allow_absolute_base_path: bool = False,
-        base_path: str | Path = "hssm_models",
-        save_idata_only: bool = False,
-    ) -> None:
-        """Save a HSSM model instance and its inference results to disk.
-
-        Parameters
-        ----------
-        model : HSSM
-            The HSSM model instance to save
-        model_name : str | None
-            Name to use for the saved model files.
-            If None, will use model.model_name with timestamp
-        allow_absolute_base_path : bool
-            Whether to allow absolute paths for base_path
-        base_path : str | Path
-            Base directory to save model files in.
-            Must be relative path if allow_absolute_base_path=False
-        save_idata_only: bool = False,
-            Whether to save the model class instance itself
-
-        Raises
-        ------
-        ValueError
-            If base_path is absolute and allow_absolute_base_path=False
-        """
-        # check if base_path is absolute
-        if not allow_absolute_base_path:
-            if str(base_path).startswith("/"):
-                raise ValueError(
-                    "base_path must be a relative path"
-                    " if allow_absolute_base_path is False"
-                )
-
-        if model_name is None:
-            # Get date string format as suffix to model name
-            model_name = (
-                self.model_name
-                + "_"
-                + datetime.datetime.now().strftime("%Y_%m_%d_%H_%M_%S")
-            )
-
-        # check if folder by name model_name exists
-        model_name = model_name.replace(" ", "_")
-        model_path = Path(base_path).joinpath(model_name)
-        model_path.mkdir(parents=True, exist_ok=True)
-
-        # Save model to pickle file
-        if not save_idata_only:
-            with open(model_path.joinpath("model.pkl"), "wb") as f:
-                cpickle.dump(self, f)
-
-        # Save traces to netcdf file
-        if self._inference_obj is not None:
-            az.to_netcdf(self._inference_obj, model_path.joinpath("traces.nc"))
-
-        # Save vi_traces to netcdf file
-        if self._inference_obj_vi is not None:
-            az.to_netcdf(self._inference_obj_vi, model_path.joinpath("vi_traces.nc"))
-
-    @classmethod
-    def load_model(
-        cls, path: Union[str, Path]
-    ) -> Union["HSSM", dict[str, Optional[az.InferenceData]]]:
-        """Load a HSSM model instance and its inference results from disk.
-
-        Parameters
-        ----------
-        path : str | Path
-            Path to the model directory or model.pkl file. If a directory is provided,
-            will look for model.pkl, traces.nc and vi_traces.nc files within it.
-
-        Returns
-        -------
-        HSSM
-            The loaded HSSM model instance with inference results attached if available.
-        """
-        # Convert path to Path object
-        path = Path(path)
-
-        # If path points to a file, assume it's model.pkl
-        if path.is_file():
-            model_dir = path.parent
-            model_path = path
-        else:
-            # Path points to directory
-            model_dir = path
-            model_path = model_dir.joinpath("model.pkl")
-
-        # check if model_dir exists
-        if not model_dir.exists():
-            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
-
-        # check if model.pkl exists raise logging information if not
-        if not model_path.exists():
-            _logger.info(
-                f"model.pkl file does not exist in {model_dir}. "
-                "Attempting to load traces only."
-            )
-            if (not model_dir.joinpath("traces.nc").exists()) and (
-                not model_dir.joinpath("vi_traces.nc").exists()
-            ):
-                raise FileNotFoundError(f"No traces found in {model_dir}.")
-            else:
-                idata_dict = cls.load_model_idata(model_dir)
-                return idata_dict
-        else:
-            # Load model from pickle file
-            with open(model_path, "rb") as f:
-                model = cpickle.load(f)
-
-            # Load traces if they exist
-            traces_path = model_dir.joinpath("traces.nc")
-            if traces_path.exists():
-                model.restore_traces(traces_path)
-
-            # Load VI traces if they exist
-            vi_traces_path = model_dir.joinpath("vi_traces.nc")
-            if vi_traces_path.exists():
-                model.restore_vi_traces(vi_traces_path)
-        return model
-
-    @classmethod
-    def load_model_idata(cls, path: str | Path) -> dict[str, az.InferenceData | None]:
-        """Load the traces from a model directory.
-
-        Parameters
-        ----------
-        path : str | Path
-            Path to the model directory containing traces.nc and/or vi_traces.nc files.
-
-        Returns
-        -------
-        dict[str, az.InferenceData | None]
-            A dictionary with keys "idata_mcmc" and "idata_vi" containing the traces
-            from the model directory. If the traces do not exist, the corresponding
-            value will be None.
-        """
-        idata_dict: dict[str, az.InferenceData | None] = {}
-        model_dir = Path(path)
-        # check if path exists
-        if not model_dir.exists():
-            raise FileNotFoundError(f"Model directory {model_dir} does not exist.")
-
-        # check if traces.nc exists
-        traces_path = model_dir.joinpath("traces.nc")
-        if not traces_path.exists():
-            _logger.warning(f"traces.nc file does not exist in {model_dir}.")
-            idata_dict["idata_mcmc"] = None
-        else:
-            idata_dict["idata_mcmc"] = az.from_netcdf(traces_path)
-
-        # check if vi_traces.nc exists
-        vi_traces_path = model_dir.joinpath("vi_traces.nc")
-        if not vi_traces_path.exists():
-            _logger.warning(f"vi_traces.nc file does not exist in {model_dir}.")
-            idata_dict["idata_vi"] = None
-        else:
-            idata_dict["idata_vi"] = az.from_netcdf(vi_traces_path)
-
-        return idata_dict
-
-    def __getstate__(self):
-        """Get the state of the model for pickling.
-
-        This method is called when pickling the model.
-        It returns a dictionary containing the constructor
-        arguments needed to recreate the model instance.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the constructor arguments
-            under the key 'constructor_args'.
-        """
-        state = {"constructor_args": self._init_args}
-        return state
-
-    def __setstate__(self, state):
-        """Set the state of the model when unpickling.
-
-        This method is called when unpickling the model. It creates a new instance
-        of HSSM using the constructor arguments stored in the state dictionary,
-        and copies its attributes to the current instance.
-
-        Parameters
-        ----------
-        state : dict
-            A dictionary containing the constructor arguments under the key
-            'constructor_args'.
-        """
-        new_instance = HSSM(**state["constructor_args"])
-        self.__dict__ = new_instance.__dict__
-
-    def __repr__(self) -> str:
-        """Create a representation of the model."""
-        output = [
-            "Hierarchical Sequential Sampling Model",
-            f"Model: {self.model_name}\n",
-            f"Response variable: {self.response_str}",
-            f"Likelihood: {self.loglik_kind}",
-            f"Observations: {len(self.data)}\n",
-            "Parameters:\n",
-        ]
-
-        for param in self.params.values():
-            if param.name == "p_outlier":
-                continue
-            output.append(f"{param.name}:")
-
-            component = self.model.components[param.name]
-
-            # Regression case:
-            if param.is_regression:
-                assert isinstance(component, DistributionalComponent)
-                output.append(f"    Formula: {param.formula}")
-                output.append("    Priors:")
-                intercept_term = component.intercept_term
-                if intercept_term is not None:
-                    output.append(_print_prior(intercept_term))
-                for _, common_term in component.common_terms.items():
-                    output.append(_print_prior(common_term))
-                for _, group_specific_term in component.group_specific_terms.items():
-                    output.append(_print_prior(group_specific_term))
-                output.append(f"    Link: {param.link}")
-            # None regression case
-            else:
-                if param.prior is None:
-                    prior = (
-                        component.intercept_term.prior
-                        if param.is_parent
-                        else component.prior
-                    )
-                else:
-                    prior = param.prior
-                output.append(f"    Prior: {prior}")
-            output.append(f"    Explicit bounds: {param.bounds}")
-            output.append(
-                " (ignored due to link function)"
-                if self.link_settings is not None
-                else ""
-            )
-
-        # TODO: Handle p_outlier regression correctly here.
-        if self.p_outlier is not None:
-            output.append("")
-            output.append(f"Lapse probability: {self.p_outlier.prior}")
-            output.append(f"Lapse distribution: {self.lapse}")
-
-        return "\n".join(output)
-
-    def __str__(self) -> str:
-        """Create a string representation of the model."""
-        return self.__repr__()
-
-    @property
-    def traces(self) -> az.InferenceData | pm.Approximation:
-        """Return the trace of the model after sampling.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        az.InferenceData | pm.Approximation
-            The trace of the model after the last call to `sample()`.
-        """
-        if not self._inference_obj:
-            raise ValueError("Please sample the model first.")
-
-        return self._inference_obj
-
-    @property
-    def vi_idata(self) -> az.InferenceData:
-        """Return the variational inference approximation object.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        az.InferenceData
-            The variational inference approximation object.
-        """
-        if not self._inference_obj_vi:
-            raise ValueError(
-                "Please run variational inference first, "
-                "no variational posterior attached."
-            )
-
-        return self._inference_obj_vi
-
-    @property
-    def vi_approx(self) -> pm.Approximation:
-        """Return the variational inference approximation object.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        pm.Approximation
-            The variational inference approximation object.
-        """
-        if not self._vi_approx:
-            raise ValueError(
-                "Please run variational inference first, "
-                "no variational approximation attached."
-            )
-
-        return self._vi_approx
-
-    @property
-    def map(self) -> dict:
-        """Return the MAP estimates of the model parameters.
-
-        Raises
-        ------
-        ValueError
-            If the model has not been sampled yet.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the MAP estimates of the model parameters.
-        """
-        if not self._map_dict:
-            raise ValueError("Please compute map first.")
-
-        return self._map_dict
-
-    @property
-    def initvals(self) -> dict:
-        """Return the initial values of the model parameters for sampling.
-
-        Returns
-        -------
-        dict
-            A dictionary containing the initial values of the model parameters.
-            This dict serves as the default for initial values, and can be passed
-            directly to the `.sample()` function.
-        """
-        if self._initvals == {}:
-            self._initvals = self.initial_point()
-        return self._initvals
-
-    def _check_lapse(self, lapse):
-        """Determine if p_outlier and lapse is specified correctly."""
-        # Basically, avoid situations where only one of them is specified.
-        if self.has_lapse and lapse is None:
-            raise ValueError(
-                "You have specified `p_outlier`. Please also specify `lapse`."
-            )
-        if lapse is not None and not self.has_lapse:
-            _logger.warning(
-                "You have specified the `lapse` argument to include a lapse "
-                + "distribution, but `p_outlier` is set to either 0 or None. "
-                + "Your lapse distribution will be ignored."
-            )
-        if "p_outlier" in self.list_params and self.list_params[-1] != "p_outlier":
-            raise ValueError(
-                "Please do not include 'p_outlier' in `list_params`. "
-                + "We automatically append it to `list_params` when `p_outlier` "
-                + "parameter is not None"
-            )
-
     def _make_model_distribution(self) -> type[pm.Distribution]:
         """Make a pm.Distribution for the model."""
         ### Logic for different types of likelihoods:
@@ -2120,255 +364,3 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
             fixed_vector_params=fixed_vector_params if fixed_vector_params else None,
             params_is_trialwise=params_is_trialwise_base,
         )
-
-    def _get_deterministic_var_names(self, idata) -> list[str]:
-        """Filter out the deterministic variables in var_names."""
-        var_names = [
-            f"~{param_name}"
-            for param_name, param in self.params.items()
-            if (param.is_regression)
-        ]
-
-        if f"{self._parent}_mean" in idata["posterior"].data_vars:
-            var_names.append(f"~{self._parent}_mean")
-
-        # Parent parameters (always regression implicitly)
-        # which don't have a formula attached
-        # should be dropped from var_names, since the actual
-        # parent name shows up as a regression.
-        if f"{self._parent}" in idata["posterior"].data_vars:
-            if self.params[self._parent].formula is None:
-                # Drop from var_names
-                var_names = [var for var in var_names if var != f"~{self._parent}"]
-
-        return var_names
-
-    def _drop_parent_str_from_idata(
-        self, idata: az.InferenceData | None
-    ) -> az.InferenceData:
-        """Drop the parent_str variable from an InferenceData object.
-
-        Parameters
-        ----------
-        idata
-            The InferenceData object to be modified.
-
-        Returns
-        -------
-        xr.Dataset
-            The modified InferenceData object.
-        """
-        if idata is None:
-            raise ValueError("Please provide an InferenceData object.")
-        else:
-            for group in idata.groups():
-                if ("rt,response_mean" in idata[group].data_vars) and (
-                    self._parent not in idata[group].data_vars
-                ):
-                    setattr(
-                        idata,
-                        group,
-                        idata[group].rename({"rt,response_mean": self._parent}),
-                    )
-            return idata
-
-    def _postprocess_initvals_deterministic(
-        self, initval_settings: dict = INITVAL_SETTINGS
-    ) -> None:
-        """Set initial values for subset of parameters."""
-        self._initvals = self.initial_point()
-        # Consider case where link functions are set to 'log_logit'
-        # or 'None'
-        if self.link_settings not in ["log_logit", None]:
-            _logger.info(
-                "Not preprocessing initial values, "
-                + "because none of the two standard link settings are chosen!"
-            )
-            return None
-
-        # Set initial values for particular parameters
-        for name_, starting_value in self.pymc_model.initial_point().items():
-            # strip name of `_log__` and `_interval__` suffixes
-            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
-
-            # We need to check if the parameter is actually backed by
-            # a regression.
-
-            # If not, we don't actually apply a link function to it as per default.
-            # Therefore we need to apply the initial value strategy corresponding
-            # to 'None' link function.
-
-            # If the user actively supplies a link function, the user
-            # should also have supplied an initial value insofar it matters.
-
-            if self.params[self._get_prefix(name_tmp)].is_regression:
-                param_link_setting = self.link_settings
-            else:
-                param_link_setting = None
-            if name_tmp in initval_settings[param_link_setting].keys():
-                if self._check_if_initval_user_supplied(name_tmp):
-                    _logger.info(
-                        "User supplied initial value detected for %s, \n"
-                        " skipping overwrite with default value.",
-                        name_tmp,
-                    )
-                    continue
-
-                # Apply specific settings from initval_settings dictionary
-                dtype = self._initvals[name_tmp].dtype
-                self._initvals[name_tmp] = np.array(
-                    initval_settings[param_link_setting][name_tmp]
-                ).astype(dtype)
-
-    def _get_prefix(self, name_str: str) -> str:
-        """Get parameters wise link setting function from parameter prefix."""
-        # `p_outlier` is the only basic parameter floating around that has
-        # an underscore in it's name.
-        # We need to handle it separately. (Renaming might be better...)
-        if "_" in name_str:
-            if "p_outlier" not in name_str:
-                name_str_prefix = name_str.split("_")[0]
-            else:
-                name_str_prefix = "p_outlier"
-        else:
-            name_str_prefix = name_str
-        return name_str_prefix
-
-    def _check_if_initval_user_supplied(
-        self,
-        name_str: str,
-        return_value: bool = False,
-    ) -> bool | float | int | np.ndarray | dict[str, Any] | None:
-        """Check if initial value is user-supplied."""
-        # The function assumes that the name_str is either raw parameter name
-        # or `paramname_Intercept`, because we only really provide special default
-        # initial values for those types of parameters
-
-        # `p_outlier` is the only basic parameter floating around that has
-        # an underscore in it's name.
-        # We need to handle it separately. (Renaming might be better...)
-        if "_" in name_str:
-            if "p_outlier" not in name_str:
-                name_str_prefix = name_str.split("_")[0]
-                # name_str_suffix = "".join(name_str.split("_")[1:])
-                name_str_suffix = name_str[len(name_str_prefix + "_") :]
-            else:
-                name_str_prefix = "p_outlier"
-                if name_str == "p_outlier":
-                    name_str_suffix = ""
-                else:
-                    # name_str_suffix = "".join(name_str.split("_")[2:])
-                    name_str_suffix = name_str[len("p_outlier_") :]
-        else:
-            name_str_prefix = name_str
-            name_str_suffix = ""
-
-        tmp_param = name_str_prefix
-        if tmp_param == self._parent:
-            # If the parameter was parent it is automatically treated as a
-            # regression.
-            if not name_str_suffix:
-                # No suffix --> Intercept
-                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
-                    args_tmp = getattr(prior_tmp["Intercept"], "args")
-                    if return_value:
-                        return args_tmp.get("initval", None)
-                    else:
-                        return "initval" in args_tmp
-                else:
-                    if return_value:
-                        return None
-                    return False
-            else:
-                # If the parameter has a suffix --> use it
-                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
-                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
-                    if return_value:
-                        return args_tmp.get("initval", None)
-                    else:
-                        return "initval" in args_tmp
-                else:
-                    if return_value:
-                        return None
-                    else:
-                        return False
-        else:
-            # If the parameter is not a parent, it is treated as a regression
-            # only when actively specified as such.
-            if not name_str_suffix:
-                # If no suffix --> treat as basic parameter.
-                if isinstance(self.params[tmp_param].prior, float) or isinstance(
-                    self.params[tmp_param].prior, np.ndarray
-                ):
-                    if return_value:
-                        return self.params[tmp_param].prior
-                    else:
-                        return True
-                elif isinstance(self.params[tmp_param].prior, bmb.Prior):
-                    args_tmp = getattr(self.params[tmp_param].prior, "args")
-                    if "initval" in args_tmp:
-                        if return_value:
-                            return args_tmp["initval"]
-                        else:
-                            return True
-                    else:
-                        if return_value:
-                            return None
-                        else:
-                            return False
-                else:
-                    if return_value:
-                        return None
-                    else:
-                        return False
-            else:
-                # If suffix --> treat as regression and use suffix
-                if isinstance(prior_tmp := self.params[tmp_param].prior, dict):
-                    args_tmp = getattr(prior_tmp[name_str_suffix], "args")
-                    if return_value:
-                        return args_tmp.get("initval", None)
-                    else:
-                        return "initval" in args_tmp
-                else:
-                    if return_value:
-                        return None
-                    else:
-                        return False
-
-    def _jitter_initvals(
-        self, jitter_epsilon: float = 0.01, vector_only: bool = False
-    ) -> None:
-        """Apply controlled jitter to initial values."""
-        if vector_only:
-            self.__jitter_initvals_vector_only(jitter_epsilon)
-        else:
-            self.__jitter_initvals_all(jitter_epsilon)
-
-    def __jitter_initvals_vector_only(self, jitter_epsilon: float) -> None:
-        # Note: Calling our initial point function here
-        # --> operate on untransformed variables
-        initial_point_dict = self.initvals
-        for name_, starting_value in initial_point_dict.items():
-            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
-            if starting_value.ndim != 0 and starting_value.shape[0] != 1:
-                starting_value_tmp = starting_value + np.random.uniform(
-                    -jitter_epsilon, jitter_epsilon, starting_value.shape
-                ).astype(np.float32)
-
-                # Note: self._initvals shouldn't be None when this is called
-                dtype = self._initvals[name_tmp].dtype
-                self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)
-
-    def __jitter_initvals_all(self, jitter_epsilon: float) -> None:
-        # Note: Calling our initial point function here
-        # --> operate on untransformed variables
-        initial_point_dict = self.initvals
-        # initial_point_dict = self.pymc_model.initial_point()
-        for name_, starting_value in initial_point_dict.items():
-            name_tmp = name_.replace("_log__", "").replace("_interval__", "")
-            starting_value_tmp = starting_value + np.random.uniform(
-                -jitter_epsilon, jitter_epsilon, starting_value.shape
-            ).astype(np.float32)
-
-            dtype = self.initvals[name_tmp].dtype
-            self._initvals[name_tmp] = np.array(starting_value_tmp).astype(dtype)

From 99c0a3f3557e80034c444091e74cfacbccb641d5 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 18 Feb 2026 15:05:06 -0500
Subject: [PATCH 100/104] Fix mypy bugs

---
 src/hssm/base.py                   |  6 +++---
 src/hssm/hssm.py                   | 24 ++++++++++++++++++++----
 src/hssm/param/param.py            |  2 +-
 src/hssm/param/params.py           |  3 +++
 src/hssm/param/regression_param.py |  2 +-
 src/hssm/param/simple_param.py     | 13 ++++++++-----
 6 files changed, 36 insertions(+), 14 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 405e4d47d..0c15568cd 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -1692,7 +1692,7 @@ def save_model(
     @classmethod
     def load_model(
         cls, path: Union[str, Path]
-    ) -> Union["HSSM", dict[str, Optional[az.InferenceData]]]:
+    ) -> Union["HSSMBase", dict[str, Optional[az.InferenceData]]]:
         """Load a HSSM model instance and its inference results from disk.
 
         Parameters
@@ -1811,7 +1811,7 @@ def __setstate__(self, state):
         """Set the state of the model when unpickling.
 
         This method is called when unpickling the model. It creates a new instance
-        of HSSM using the constructor arguments stored in the state dictionary,
+        using the constructor arguments stored in the state dictionary,
         and copies its attributes to the current instance.
 
         Parameters
@@ -1820,7 +1820,7 @@ def __setstate__(self, state):
             A dictionary containing the constructor arguments under the key
             'constructor_args'.
         """
-        new_instance = HSSM(**state["constructor_args"])
+        new_instance = self.__class__(**state["constructor_args"])
         self.__dict__ = new_instance.__dict__
 
     def __repr__(self) -> str:
diff --git a/src/hssm/hssm.py b/src/hssm/hssm.py
index 7e86a8829..8f179d942 100644
--- a/src/hssm/hssm.py
+++ b/src/hssm/hssm.py
@@ -9,7 +9,8 @@
 import logging
 from copy import deepcopy
 from inspect import isclass
-from typing import Literal
+from typing import TYPE_CHECKING, Any, Callable, Literal
+from typing import cast as typing_cast
 
 import numpy as np
 import pymc as pm
@@ -30,6 +31,11 @@
 
 from .base import HSSMBase
 
+if TYPE_CHECKING:
+    from os import PathLike
+
+    from pytensor.graph.op import Op
+
 _logger = logging.getLogger("hssm")
 
 # NOTE: Temporary mapping from old sampler names to new ones in bambi 0.16.0
@@ -257,6 +263,15 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
         if isclass(self.loglik) and issubclass(self.loglik, pm.Distribution):
             return self.loglik
 
+        # At this point, loglik should not be a type[Distribution] and should be set
+
+        assert self.loglik is not None, "loglik should be set"
+        assert self.loglik_kind is not None, "loglik_kind should be set"
+        assert not (isclass(self.loglik) and issubclass(self.loglik, pm.Distribution))
+        loglik_callable = typing_cast(
+            "Op | Callable[..., Any] | PathLike | str", self.loglik
+        )
+
         # params_is_trialwise_base: one entry per model param (excluding
         # p_outlier). Used for graph-level broadcasting in logp() and
         # make_distribution, where dist_params does not include extra_fields.
@@ -277,20 +292,20 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
         if self.loglik_kind == "approx_differentiable":
             if self.model_config.backend == "jax":
                 likelihood_callable = make_likelihood_callable(
-                    loglik=self.loglik,
+                    loglik=loglik_callable,
                     loglik_kind="approx_differentiable",
                     backend="jax",
                     params_is_reg=params_is_trialwise,
                 )
             else:
                 likelihood_callable = make_likelihood_callable(
-                    loglik=self.loglik,
+                    loglik=loglik_callable,
                     loglik_kind="approx_differentiable",
                     backend=self.model_config.backend,
                 )
         else:
             likelihood_callable = make_likelihood_callable(
-                loglik=self.loglik,
+                loglik=loglik_callable,
                 loglik_kind=self.loglik_kind,
                 backend=self.model_config.backend,
             )
@@ -350,6 +365,7 @@ def _make_model_distribution(self) -> type[pm.Distribution]:
             if isinstance(param.prior, np.ndarray)
         }
 
+        assert self.list_params is not None, "list_params should be set"
         return make_distribution(
             rv=self.model_config.rv or self.model_name,
             loglik=self.loglik,
diff --git a/src/hssm/param/param.py b/src/hssm/param/param.py
index 4ea8493f5..3d1897dcf 100644
--- a/src/hssm/param/param.py
+++ b/src/hssm/param/param.py
@@ -157,7 +157,7 @@ def is_trialwise(self) -> bool:
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | None = None,
+        prior: float | np.ndarray | dict[str, Any] | bmb.Prior | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:
diff --git a/src/hssm/param/params.py b/src/hssm/param/params.py
index f542c803d..d90de35ff 100644
--- a/src/hssm/param/params.py
+++ b/src/hssm/param/params.py
@@ -213,6 +213,7 @@ def collect_user_params(
         user_param = UserParam.from_dict(param) if isinstance(param, dict) else param
         if user_param.name is None:
             raise ValueError("Parameter name must be specified.")
+        assert model.list_params is not None, "list_params should be set"
         if user_param.name not in model.list_params:
             raise ValueError(
                 f"Parameter {user_param.name} not found in list_params."
@@ -229,6 +230,7 @@ def collect_user_params(
     # If any of the keys is found in `list_params` it is a parameter specification.
     # We add the parameter specification to `user_params` and remove it from
     # `kwargs`
+    assert model.list_params is not None, "list_params should be set"
     for param_name in model.list_params:
         # Update user_params only if param_name is in kwargs
         # and not already in user_params
@@ -272,6 +274,7 @@ def make_params(model: HSSM, user_params: dict[str, UserParam]) -> dict[str, Par
         and model.loglik_kind != "approx_differentiable"
     )
 
+    assert model.list_params is not None, "list_params should be set"
     for name in model.list_params:
         if name in user_params:
             param = make_param_from_user_param(model, name, user_params[name])
diff --git a/src/hssm/param/regression_param.py b/src/hssm/param/regression_param.py
index 462b37955..406731a4a 100644
--- a/src/hssm/param/regression_param.py
+++ b/src/hssm/param/regression_param.py
@@ -111,7 +111,7 @@ def from_defaults(
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | None = None,
+        prior: float | np.ndarray | dict[str, Any] | bmb.Prior | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:
diff --git a/src/hssm/param/simple_param.py b/src/hssm/param/simple_param.py
index 70d001047..a71528acf 100644
--- a/src/hssm/param/simple_param.py
+++ b/src/hssm/param/simple_param.py
@@ -111,7 +111,7 @@ def from_user_param(cls, user_param: UserParam) -> "SimpleParam":
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | None = None,
+        prior: float | np.ndarray | dict[str, Any] | bmb.Prior | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:
@@ -201,14 +201,17 @@ class DefaultParam(SimpleParam):
     def __init__(
         self,
         name: str,
-        prior: float | np.ndarray | dict[str, Any] | bmb.Prior,
-        bounds: tuple[float, float],
+        prior: float | np.ndarray | dict[str, Any] | bmb.Prior | None,
+        bounds: tuple[float, float] | None,
     ) -> None:
         super().__init__(name, prior=prior, bounds=bounds)
 
     @classmethod
     def from_defaults(
-        cls, name: str, prior: dict[str, Any], bounds: tuple[int, int]
+        cls,
+        name: str,
+        prior: float | np.ndarray | dict[str, Any] | bmb.Prior | None,
+        bounds: tuple[float, float] | None,
     ) -> "DefaultParam":
         """Create a DefaultParam object from default values.
 
@@ -248,7 +251,7 @@ def process_prior(self) -> None:
 
     def fill_defaults(
         self,
-        prior: dict[str, Any] | None = None,
+        prior: float | np.ndarray | dict[str, Any] | bmb.Prior | None = None,
         bounds: tuple[float, float] | None = None,
         **kwargs,
     ) -> None:

From e0369c560c9d966db7ef91d82a9d87f064040fc4 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 18 Feb 2026 17:31:43 -0500
Subject: [PATCH 101/104] Remove duplicate comment regarding Bambi's kind
 parameter renaming

---
 src/hssm/base.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 0c15568cd..f477511e4 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -1300,7 +1300,6 @@ def sample_prior_predictive(
         # could be recomputed elsewhere)
         prior_predictive.add_groups(posterior=prior_predictive.prior)
         # Bambi >= 0.17 renamed kind="mean" to kind="response_params".
-        # Bambi >= 0.17 renamed kind="mean" to kind="response_params".
         self.model.predict(prior_predictive, kind="response_params", inplace=True)
 
         # clean

From f58c2d476022582b4f5d3711d9ce40fc14c7594e Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 18 Feb 2026 17:31:52 -0500
Subject: [PATCH 102/104] Fix RLSSMConfig to require model_name in config_dict

---
 src/hssm/config.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/hssm/config.py b/src/hssm/config.py
index 1e842f331..1ae0ea2a0 100644
--- a/src/hssm/config.py
+++ b/src/hssm/config.py
@@ -325,7 +325,7 @@ def from_rlssm_dict(cls, model_name: str, config_dict: dict[str, Any]):
                 raise ValueError(f"{field_name} must be provided in config_dict")
 
         return cls(
-            model_name=config_dict.get("model_name", model_name),
+            model_name=config_dict["model_name"],
             description=config_dict["description"],
             list_params=config_dict["list_params"],
             extra_fields=config_dict.get("extra_fields"),

From 00e6f318184f08d7a8ecce1c3bbc401433f21199 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 25 Feb 2026 10:14:07 -0500
Subject: [PATCH 103/104] Update docstrings in HSSMBase for clarity on initial
 values and return types

---
 src/hssm/base.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index f477511e4..0dd07db30 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -658,7 +658,7 @@ def sample(
             Pass initial values to the sampler. This can be a dictionary of initial
             values for parameters of the model, or a string "map" to use initialization
             at the MAP estimate. If "map" is used, the MAP estimate will be computed if
-            not already attached to the base class from prior call to 'find_MAP'.
+            not already attached to the base class from prior call to `find_MAP`.
         include_response_params: optional
             Include parameters of the response distribution in the output. These usually
             take more space than other parameters as there's one of them per
@@ -1702,8 +1702,9 @@ def load_model(
 
         Returns
         -------
-        HSSM
-            The loaded HSSM model instance with inference results attached if available.
+        HSSMBase or dict[str, az.InferenceData | None]
+            The loaded model instance (with inference results attached if available),
+            or a dictionary of traces-only InferenceData objects when no model.pkl is found.
         """
         # Convert path to Path object
         path = Path(path)

From d103bafda2d4e424f217891edd60a35114c93ad1 Mon Sep 17 00:00:00 2001
From: Carlos Paniagua <cpaniaguam@gmail.com>
Date: Wed, 25 Feb 2026 10:25:04 -0500
Subject: [PATCH 104/104] Fix line too long

---
 src/hssm/base.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/hssm/base.py b/src/hssm/base.py
index 0dd07db30..0aa1dec10 100644
--- a/src/hssm/base.py
+++ b/src/hssm/base.py
@@ -1704,7 +1704,8 @@ def load_model(
         -------
         HSSMBase or dict[str, az.InferenceData | None]
             The loaded model instance (with inference results attached if available),
-            or a dictionary of traces-only InferenceData objects when no model.pkl is found.
+            or a dictionary of traces-only InferenceData objects when no model.pkl is
+            found.
         """
         # Convert path to Path object
         path = Path(path)