
Commit c286962

Merge branch 'dev' into graphical-simulator
2 parents ae7c9fc + 361fa45

13 files changed: +466 −73

README.md

Lines changed: 39 additions & 35 deletions

@@ -49,39 +49,6 @@ neural networks for parameter estimation, model comparison, and model validation
 when working with intractable simulators whose behavior as a whole is too
 complex to be described analytically.
 
-## Getting Started
-
-Using the high-level interface is easy, as demonstrated by the minimal working example below:
-
-```python
-import bayesflow as bf
-
-workflow = bf.BasicWorkflow(
-    inference_network=bf.networks.CouplingFlow(),
-    summary_network=bf.networks.TimeSeriesNetwork(),
-    inference_variables=["parameters"],
-    summary_variables=["observables"],
-    simulator=bf.simulators.SIR()
-)
-
-history = workflow.fit_online(epochs=15, batch_size=32, num_batches_per_epoch=200)
-
-diagnostics = workflow.plot_default_diagnostics(test_data=300)
-```
-
-For an in-depth exposition, check out our walkthrough notebooks below.
-
-1. [Linear regression starter example](examples/Linear_Regression_Starter.ipynb)
-2. [From ABC to BayesFlow](examples/From_ABC_to_BayesFlow.ipynb)
-3. [Two moons starter example](examples/Two_Moons_Starter.ipynb)
-4. [Rapid iteration with point estimators](examples/Lotka_Volterra_Point_Estimation_and_Expert_Stats.ipynb)
-5. [SIR model with custom summary network](examples/SIR_Posterior_Estimation.ipynb)
-6. [Bayesian experimental design](examples/Bayesian_Experimental_Design.ipynb)
-7. [Simple model comparison example](examples/One_Sample_TTest.ipynb)
-8. [Moving from BayesFlow v1.1 to v2.0](examples/From_BayesFlow_1.1_to_2.0.ipynb)
-
-More tutorials are always welcome! Please consider making a pull request if you have a cool application that you want to contribute.
-
 ## Install
 
 You can install the latest stable version from PyPI using:
@@ -132,9 +99,46 @@ export KERAS_BACKEND=jax
 
 This way, you also don't have to manually set the backend every time you are starting Python to use BayesFlow.
 
-**Caution:** Some development environments (e.g., VSCode or PyCharm) can silently overwrite environment variables. If you have set your backend as an environment variable and you still get keras-related import errors when loading BayesFlow, these IDE shenanigans might be the culprit. Try setting the keras backend in your Python script via `import os; os.environ["KERAS_BACKEND"] = "<YOUR-BACKEND>"`.
+## Getting Started
+
+Using the high-level interface is easy, as demonstrated by the minimal working example below:
+
+```python
+import bayesflow as bf
+
+workflow = bf.BasicWorkflow(
+    inference_network=bf.networks.CouplingFlow(),
+    summary_network=bf.networks.TimeSeriesNetwork(),
+    inference_variables=["parameters"],
+    summary_variables=["observables"],
+    simulator=bf.simulators.SIR()
+)
+
+history = workflow.fit_online(epochs=15, batch_size=32, num_batches_per_epoch=200)
+
+diagnostics = workflow.plot_default_diagnostics(test_data=300)
+```
+
+For an in-depth exposition, check out our expanding list of resources below.
+
+### Books
+
+Many examples from [Bayesian Cognitive Modeling: A Practical Course](https://bayesmodels.com/) by Lee & Wagenmakers (2013) in [BayesFlow](https://kucharssim.github.io/bayesflow-cognitive-modeling-book/).
+
+### Tutorial notebooks
+
+1. [Linear regression starter example](examples/Linear_Regression_Starter.ipynb)
+2. [From ABC to BayesFlow](examples/From_ABC_to_BayesFlow.ipynb)
+3. [Two moons starter example](examples/Two_Moons_Starter.ipynb)
+4. [Rapid iteration with point estimators](examples/Lotka_Volterra_Point_Estimation_and_Expert_Stats.ipynb)
+5. [SIR model with custom summary network](examples/SIR_Posterior_Estimation.ipynb)
+6. [Bayesian experimental design](examples/Bayesian_Experimental_Design.ipynb)
+7. [Simple model comparison example](examples/One_Sample_TTest.ipynb)
+8. [Moving from BayesFlow v1.1 to v2.0](examples/From_BayesFlow_1.1_to_2.0.ipynb)
+
+More tutorials are always welcome! Please consider making a pull request if you have a cool application that you want to contribute.
 
-### From Source
+## Contributing
 
 If you want to contribute to BayesFlow, we recommend installing it from source, see [CONTRIBUTING.md](CONTRIBUTING.md) for more details.
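As context for the `export KERAS_BACKEND=jax` hunk above: the backend can also be pinned inside a script, which is what the removed caution note recommended for cases where IDEs silently override environment variables. A minimal sketch of that workaround (the choice of `jax` is just an example):

```python
# Pin the Keras backend before BayesFlow (and thus Keras) is imported;
# "jax", "tensorflow", or "torch" work the same way.
import os

os.environ["KERAS_BACKEND"] = "jax"

import bayesflow as bf  # must come after the backend is set
```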

bayesflow/adapters/adapter.py

Lines changed: 38 additions & 0 deletions

@@ -18,6 +18,7 @@
     Keep,
     Log,
     MapTransform,
+    NNPE,
     NumpyTransform,
     OneHot,
     Rename,
@@ -699,6 +700,43 @@ def map_dtype(self, keys: str | Sequence[str], to_dtype: str):
         self.transforms.append(transform)
         return self
 
+    def nnpe(
+        self,
+        keys: str | Sequence[str],
+        *,
+        spike_scale: float | np.ndarray | None = None,
+        slab_scale: float | np.ndarray | None = None,
+        per_dimension: bool = True,
+        seed: int | None = None,
+    ):
+        """Append an :py:class:`~transforms.NNPE` transform to the adapter.
+
+        Parameters
+        ----------
+        keys : str or Sequence of str
+            The names of the variables to transform.
+        spike_scale : float or np.ndarray or None, default=None
+            The scale of the spike (Normal) distribution. Automatically determined if None.
+        slab_scale : float or np.ndarray or None, default=None
+            The scale of the slab (Cauchy) distribution. Automatically determined if None.
+        per_dimension : bool, default=True
+            If true, noise is applied per dimension of the last axis of the input data.
+            If false, noise is applied globally.
+        seed : int or None
+            The seed for the random number generator. If None, a random seed is used.
+        """
+        if isinstance(keys, str):
+            keys = [keys]
+
+        transform = MapTransform(
+            {
+                key: NNPE(spike_scale=spike_scale, slab_scale=slab_scale, per_dimension=per_dimension, seed=seed)
+                for key in keys
+            }
+        )
+        self.transforms.append(transform)
+        return self
+
     def one_hot(self, keys: str | Sequence[str], num_classes: int):
         """Append a :py:class:`~transforms.OneHot` transform to the adapter.
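As a usage note for the new `Adapter.nnpe` method, here is a minimal sketch; the API calls are taken from the diff, while the data shapes are hypothetical, chosen only for illustration:

```python
import numpy as np
import bayesflow as bf
from bayesflow.adapters.transforms import NNPE

# Append NNPE to an adapter pipeline; noise is only injected while stage == "training"
adapter = bf.Adapter().nnpe(["x"], per_dimension=True, seed=42)

# The underlying transform can also be exercised directly:
x = np.random.default_rng(0).normal(size=(32, 10, 2))  # hypothetical (batch, time, dims) data
noisy = NNPE(seed=42).forward(x, stage="training")      # spike-and-slab noise added
clean = NNPE(seed=42).forward(x, stage="inference")     # returned unchanged outside training
assert np.array_equal(clean, x)
```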

bayesflow/adapters/transforms/__init__.py

Lines changed: 1 addition & 0 deletions

@@ -12,6 +12,7 @@
 from .keep import Keep
 from .log import Log
 from .map_transform import MapTransform
+from .nnpe import NNPE
 from .numpy_transform import NumpyTransform
 from .one_hot import OneHot
 from .rename import Rename
bayesflow/adapters/transforms/nnpe.py (new file)

Lines changed: 187 additions & 0 deletions

@@ -0,0 +1,187 @@
+import numpy as np
+
+from bayesflow.utils.serialization import serializable, serialize
+
+from .elementwise_transform import ElementwiseTransform
+
+
+@serializable("bayesflow.adapters")
+class NNPE(ElementwiseTransform):
+    """Implements noisy neural posterior estimation (NNPE) as described in [1], which adds noise following a
+    spike-and-slab distribution to the training data as a mild form of data augmentation to robustify against noisy
+    real-world data (see [1, 2] for benchmarks). Adds the options of automatic noise scale determination and
+    dimensionwise noise application to the original implementation in [1] to provide more flexibility in dealing
+    with unstandardized and heterogeneous data.
+
+    [1] Ward, D., Cannon, P., Beaumont, M., Fasiolo, M., & Schmon, S. (2022). Robust neural posterior estimation
+    and statistical model criticism. Advances in Neural Information Processing Systems, 35, 33845-33859.
+    [2] Elsemüller, L., Pratz, V., von Krause, M., Voss, A., Bürkner, P. C., & Radev, S. T. (2025). Does
+    Unsupervised Domain Adaptation Improve the Robustness of Amortized Bayesian Inference? A Systematic
+    Evaluation. arXiv preprint arXiv:2502.04949.
+
+    Parameters
+    ----------
+    spike_scale : float or np.ndarray or None, default=None
+        The scale of the spike (Normal) distribution. Automatically determined if None (see "Notes" section).
+        Expects a float if `per_dimension=False` or a 1D array of length `data.shape[-1]` if `per_dimension=True`.
+    slab_scale : float or np.ndarray or None, default=None
+        The scale of the slab (Cauchy) distribution. Automatically determined if None (see "Notes" section).
+        Expects a float if `per_dimension=False` or a 1D array of length `data.shape[-1]` if `per_dimension=True`.
+    per_dimension : bool, default=True
+        If true, noise is applied per dimension of the last axis of the input data. If false, noise is applied
+        globally. Thus, if per_dimension=True, any provided scales must be arrays with shape (n_dimensions,) and
+        automatic scale determination occurs separately per dimension. If per_dimension=False, provided scales
+        must be floats and automatic scale determination occurs globally. The original implementation in [1] uses
+        global application (i.e., per_dimension=False), whereas dimensionwise application is recommended if the
+        data dimensions are heterogeneous.
+    seed : int or None
+        The seed for the random number generator. If None, a random seed is used. Used instead of
+        np.random.Generator here to enable easy serialization.
+
+    Notes
+    -----
+    The spike-and-slab distribution consists of a mixture of a Normal distribution (spike) and a Cauchy
+    distribution (slab), which are applied based on a Bernoulli random variable with p=0.5.
+
+    The scales of the spike and slab distributions can be set manually, or they are automatically determined by
+    scaling the default scales of [1] (which expect standardized data) by the standard deviation of the input
+    data. For automatic determination, the standard deviation is determined either globally (if
+    `per_dimension=False`) or per dimension of the last axis of the input data (if `per_dimension=True`). Note
+    that automatic scale determination is applied batch-wise in the forward method, which means that determined
+    scales can vary between batches due to varying standard deviations in the batch input data.
+
+    The original implementation in [1] can be recovered by applying the following settings on standardized data:
+
+    - `spike_scale=0.01`
+    - `slab_scale=0.25`
+    - `per_dimension=False`
+
+    Examples
+    --------
+    >>> adapter = bf.Adapter().nnpe(["x"])
+    """
+
+    DEFAULT_SPIKE = 0.01
+    DEFAULT_SLAB = 0.25
+
+    def __init__(
+        self,
+        *,
+        spike_scale: float | np.ndarray | None = None,
+        slab_scale: float | np.ndarray | None = None,
+        per_dimension: bool = True,
+        seed: int | None = None,
+    ):
+        super().__init__()
+        self.spike_scale = spike_scale
+        self.slab_scale = slab_scale
+        self.per_dimension = per_dimension
+        self.seed = seed
+        self.rng = np.random.default_rng(seed)
+
+    def _resolve_scale(
+        self,
+        name: str,
+        passed: float | np.ndarray | None,
+        default: float,
+        data: np.ndarray,
+    ) -> np.ndarray | float:
+        """
+        Determine the spike/slab scale:
+        - If passed is None: automatic determination via default * std(data) (per dimension or global).
+        - Else: validate and cast passed to the correct shape/type.
+
+        Parameters
+        ----------
+        name : str
+            Identifier for error messages (e.g., 'spike_scale' or 'slab_scale').
+        passed : float or np.ndarray or None
+            User-specified scale. If None, compute as default * std(data).
+            If self.per_dimension is True, this may be a 1D array of length data.shape[-1].
+        default : float
+            Default multiplier from [1] to apply to the standard deviation of the data.
+        data : np.ndarray
+            Data array to compute the standard deviation from.
+
+        Returns
+        -------
+        float or np.ndarray
+            The resolved scale, either as a scalar (if per_dimension=False) or a 1D array of length
+            data.shape[-1] (if per_dimension=True).
+        """
+        # Get the std (and expected shape) dimensionwise or globally
+        if self.per_dimension:
+            axes = tuple(range(data.ndim - 1))
+            std = np.std(data, axis=axes)
+            expected_shape = (data.shape[-1],)
+        else:
+            std = np.std(data)
+            expected_shape = None
+
+        # If no scale is passed, determine the scale automatically given the dimensionwise or global std
+        if passed is None:
+            return default * std
+        # If a scale is passed, check that the passed shape matches the expected shape
+        else:
+            if self.per_dimension:
+                arr = np.asarray(passed, dtype=float)
+                if arr.ndim != 1 or arr.shape != expected_shape:
+                    raise ValueError(f"{name}: expected array of shape {expected_shape}, got {arr.shape}")
+                return arr
+            else:
+                try:
+                    scalar = float(passed)
+                except TypeError:
+                    raise TypeError(f"{name}: expected a scalar convertible to float, got type {type(passed).__name__}")
+                except ValueError:
+                    raise ValueError(f"{name}: expected a scalar convertible to float, got value {passed!r}")
+                return scalar
+
+    def forward(self, data: np.ndarray, stage: str = "inference", **kwargs) -> np.ndarray:
+        """
+        Add spike-and-slab noise to `data` during training, using automatic scale determination if not provided
+        (see the "Notes" section of the class docstring for details).
+
+        Parameters
+        ----------
+        data : np.ndarray
+            Input array to be perturbed.
+        stage : str, default='inference'
+            If 'training', noise is added; otherwise the data is returned unchanged.
+        **kwargs
+            Unused keyword arguments.
+
+        Returns
+        -------
+        np.ndarray
+            Noisy data when `stage` is 'training', otherwise the original input.
+        """
+        if stage != "training":
+            return data
+
+        # Check data validity
+        if not np.all(np.isfinite(data)):
+            raise ValueError("NNPE.forward: `data` contains NaN or infinite values.")
+
+        spike_scale = self._resolve_scale("spike_scale", self.spike_scale, self.DEFAULT_SPIKE, data)
+        slab_scale = self._resolve_scale("slab_scale", self.slab_scale, self.DEFAULT_SLAB, data)
+
+        # Apply spike-and-slab noise: a Bernoulli(0.5) mask selects slab (Cauchy) vs. spike (Normal) noise
+        mixture_mask = self.rng.binomial(n=1, p=0.5, size=data.shape).astype(bool)
+        noise_spike = self.rng.standard_normal(size=data.shape) * spike_scale
+        noise_slab = self.rng.standard_cauchy(size=data.shape) * slab_scale
+        noise = np.where(mixture_mask, noise_slab, noise_spike)
+        return data + noise
+
+    def inverse(self, data: np.ndarray, **kwargs) -> np.ndarray:
+        """Non-invertible transform: returns the input unchanged."""
+        return data
+
+    def get_config(self) -> dict:
+        return serialize(
+            {
+                "spike_scale": self.spike_scale,
+                "slab_scale": self.slab_scale,
+                "per_dimension": self.per_dimension,
+                "seed": self.seed,
+            }
+        )
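To make the automatic scale determination in `_resolve_scale` and the noise model in `forward` concrete, here is a small standalone NumPy sketch of the same computation under the default scales (all data values are illustrative):

```python
import numpy as np

rng = np.random.default_rng(1)
data = rng.normal(loc=0.0, scale=[1.0, 10.0], size=(64, 2))  # two heterogeneous dimensions

# per_dimension=True: one standard deviation per dimension of the last axis
std = np.std(data, axis=tuple(range(data.ndim - 1)))  # shape (2,)
spike_scale = 0.01 * std  # DEFAULT_SPIKE * std
slab_scale = 0.25 * std   # DEFAULT_SLAB * std

# A Bernoulli(0.5) mask chooses slab (Cauchy) vs. spike (Normal) noise per entry
mask = rng.binomial(n=1, p=0.5, size=data.shape).astype(bool)
noise = np.where(
    mask,
    rng.standard_cauchy(size=data.shape) * slab_scale,
    rng.standard_normal(size=data.shape) * spike_scale,
)
noisy = data + noise  # what NNPE().forward(data, stage="training") would return
```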

bayesflow/networks/__init__.py

Lines changed: 1 addition & 0 deletions

@@ -12,6 +12,7 @@
 from .point_inference_network import PointInferenceNetwork
 from .mlp import MLP
 from .fusion_network import FusionNetwork
+from .sequential import Sequential
 from .summary_network import SummaryNetwork
 from .time_series_network import TimeSeriesNetwork
 from .transformers import SetTransformer, TimeSeriesTransformer, FusionTransformer
