PySATL
diff --git a/‎examples/example_bootstrap.ipynb‎
Lines changed: 417 additions & 0 deletions b/‎examples/example_bootstrap.ipynb‎
Lines changed: 417 additions & 0 deletions
diff --git a/‎src/pysatl_core/inference/__init__.py‎
Lines changed: 27 additions & 0 deletions b/‎src/pysatl_core/inference/__init__.py‎
Lines changed: 27 additions & 0 deletions
diff --git a/‎src/pysatl_core/inference/bootstrap.py‎
Lines changed: 171 additions & 0 deletions b/‎src/pysatl_core/inference/bootstrap.py‎
Lines changed: 171 additions & 0 deletions
diff --git a/‎tests/unit/inference/__init__.py‎ b/‎tests/unit/inference/__init__.py‎
diff --git a/‎tests/unit/inference/test_bootstrap.py‎
Lines changed: 173 additions & 0 deletions b/‎tests/unit/inference/test_bootstrap.py‎
Lines changed: 173 additions & 0 deletions
@@ -0,0 +1,27 @@
+"""
+Statistical inference utilities.
+"""
+
+from __future__ import annotations
+
+__author__ = "Artem Romanyuk"
+__copyright__ = "Copyright (c) 2025 PySATL project"
+__license__ = "SPDX-License-Identifier: MIT"
+
+from pysatl_core.inference.bootstrap import (
+    Bootstrap,
+    BootstrapResult,
+    ClassicalResampling,
+    ResamplingMethod,
+    SmoothResampling,
+    StatisticalFunctional,
+)
+
+# Public API of the package: exactly the names imported from
+# ``pysatl_core.inference.bootstrap`` above.
+__all__ = [
+    "Bootstrap",
+    "BootstrapResult",
+    "ClassicalResampling",
+    "ResamplingMethod",
+    "SmoothResampling",
+    "StatisticalFunctional",
+]
@@ -0,0 +1,171 @@
+"""
+Bootstrap inference for statistical functionals.
+
+Supports classical resampling (sampling with replacement from the empirical
+distribution) and smooth resampling (sampling from a KDE-fitted continuous
+approximation).
+"""
+
+from __future__ import annotations
+
+__author__ = "Artem Romanyuk"
+__copyright__ = "Copyright (c) 2025 PySATL project"
+__license__ = "SPDX-License-Identifier: MIT"
+
+from dataclasses import dataclass
+from typing import Protocol
+
+import numpy as np
+from numpy.random import Generator
+from numpy.typing import NDArray
+
+from pysatl_core.distributions.empirical.distribution import EmpiricalDistribution, EmpiricalMethod, ScipyGaussianKde
+
+
+class StatisticalFunctional(Protocol):
+    """A function that maps a sample to a scalar summary.
+
+    This is a structural protocol: any callable taking one array argument
+    matches it. ``Bootstrap.run`` calls the functional on the original data
+    and on every resample, and converts each return value with ``float``.
+    """
+
+    def __call__(self, sample: NDArray[np.float64]) -> float: ...
+
+
+class ResamplingMethod(Protocol):
+    """Strategy for generating a single bootstrap resample from data.
+
+    ``resample`` receives the observed ``data`` and the number of values to
+    draw (``size``) and returns the drawn values as an array.
+    ``Bootstrap.run`` calls it once per replicate with ``size`` equal to
+    ``len(data)``.
+    """
+
+    def resample(self, data: NDArray[np.float64], size: int) -> NDArray[np.float64]: ...
+
+
+class ClassicalResampling:
+    """Draw bootstrap resamples directly from the observed values.
+
+    Values are sampled with replacement, i.e. from the discrete empirical
+    distribution of the data.
+
+    Parameters
+    ----------
+    rng:
+        Generator used for the draws. When ``None``, a new
+        ``np.random.default_rng()`` is created.
+    """
+
+    def __init__(self, rng: Generator | None = None) -> None:
+        if rng is None:
+            rng = np.random.default_rng()
+        self._rng = rng
+
+    def resample(self, data: NDArray[np.float64], size: int) -> NDArray[np.float64]:
+        """Return ``size`` values drawn with replacement from ``data``."""
+        draws = self._rng.choice(data, size=size, replace=True)
+        return draws
+
+
+class SmoothResampling:
+    """Sample from a KDE-fitted continuous approximation of the empirical distribution.
+
+    The fitted distribution is cached after the first resample call and reused
+    across bootstrap iterations for the same data array. "Same" means the same
+    array *object*: passing an equal copy triggers a refit, and mutating the
+    array in place is not detected.
+
+    Parameters
+    ----------
+    method:
+        Estimator used to build the continuous approximation. When ``None``
+        (the default), a new ``ScipyGaussianKde()`` is created for this
+        instance.
+
+    Notes
+    -----
+    ``resample`` calls ``EmpiricalDistribution.sample(size)`` without passing
+    a random generator, so the source of randomness is whatever that method
+    uses internally.
+    """
+
+    def __init__(self, method: EmpiricalMethod | None = None) -> None:
+        # Build the default per instance. A default written in the signature
+        # is evaluated once at definition time and would be a single object
+        # shared by every resampler.
+        self._method = method if method is not None else ScipyGaussianKde()
+        self._distr: EmpiricalDistribution | None = None
+        # The exact array object the cached distribution was fitted on.
+        self._fitted_data: NDArray[np.float64] | None = None
+
+    def resample(self, data: NDArray[np.float64], size: int) -> NDArray[np.float64]:
+        """Return ``size`` draws from the distribution fitted to ``data``.
+
+        The distribution is refitted only when ``data`` is a different array
+        object from the one used for the cached fit.
+        """
+        # Compare against our own reference so the cache does not depend on
+        # how EmpiricalDistribution stores (or copies) its input.
+        if self._distr is None or self._fitted_data is not data:
+            self._distr = EmpiricalDistribution(data, method=self._method)
+            self._fitted_data = data
+        return self._distr.sample(size)
+
+
+@dataclass
+class BootstrapResult:
+    """Outcome of a bootstrap run for a single statistical functional.
+
+    Parameters
+    ----------
+    observed:
+        Value of the functional on the original data.
+    replicates:
+        Array of shape ``(B,)`` holding the functional value on each
+        bootstrap resample.
+    """
+
+    observed: float
+    replicates: NDArray[np.float64]
+
+    def standard_error(self) -> float:
+        """Standard deviation of the bootstrap replicates.
+
+        Computed with NumPy's default ``ddof=0``, i.e. dividing by ``B``
+        rather than ``B - 1``.
+        """
+        return float(self.replicates.std())
+
+    def bias(self) -> float:
+        """Estimated bias: mean of replicates minus the observed value."""
+        return float(self.replicates.mean() - self.observed)
+
+    def confidence_interval(self, level: float = 0.95) -> tuple[float, float]:
+        """Percentile bootstrap confidence interval.
+
+        Parameters
+        ----------
+        level:
+            Coverage level in the open interval (0, 1). Default is 0.95.
+
+        Returns
+        -------
+        (lower, upper) bounds of the interval.
+
+        Raises
+        ------
+        ValueError
+            If ``level`` is not strictly between 0 and 1 (NaN included).
+
+        TODO: implement BCa (bias-corrected and accelerated) and Normal
+        approximation methods for better accuracy in skewed or small-sample
+        settings.
+        """
+        # Validate explicitly: a negative level such as -0.5 would otherwise
+        # map to the percentiles (75, 25) and silently return an inverted
+        # interval. The negated chained comparison also rejects NaN.
+        if not 0.0 < level < 1.0:
+            raise ValueError(f"level must be in the open interval (0, 1), got {level!r}")
+        alpha = 1.0 - level
+        lower_q = 100 * alpha / 2
+        upper_q = 100 * (1 - alpha / 2)
+        lo, hi = np.percentile(self.replicates, [lower_q, upper_q])
+        return float(lo), float(hi)
+
+
+class Bootstrap:
+    """Bootstrap procedure for estimating the sampling distribution of a functional.
+
+    Parameters
+    ----------
+    data:
+        One-dimensional array of observed values. Converted to a float array
+        on construction.
+    B:
+        Number of bootstrap resamples. Must be a positive integer.
+        Default is 1000.
+    method:
+        Strategy for generating each resample. Defaults to
+        :class:`ClassicalResampling` (sampling with replacement).
+    rng:
+        NumPy random generator. A fresh generator is created when ``None``.
+        It is handed to the default :class:`ClassicalResampling` only; when a
+        custom ``method`` is supplied, that object's own randomness is used
+        and ``rng`` has no effect on the resamples.
+
+    Raises
+    ------
+    ValueError
+        If ``data`` contains no observations or ``B`` is not a positive
+        integer.
+
+    Examples
+    --------
+    >>> import numpy as np
+    >>> rng = np.random.default_rng(0)
+    >>> data = rng.normal(0, 1, 200)
+    >>> result = Bootstrap(data, B=500, rng=rng).run(np.mean)
+    >>> lo, hi = result.confidence_interval()
+    """
+
+    def __init__(
+        self,
+        data: NDArray[np.float64],
+        B: int = 1000,
+        method: ResamplingMethod | None = None,
+        rng: Generator | None = None,
+    ) -> None:
+        self._data = np.asarray(data, dtype=float)
+        # Fail early: a scalar has no length, and an empty sample would only
+        # produce NaN statistics later on.
+        if self._data.ndim == 0 or self._data.size == 0:
+            raise ValueError("data must be a non-empty array of observations")
+        # B <= 0 would silently yield an empty replicate array whose summary
+        # statistics are all NaN.
+        if not isinstance(B, (int, np.integer)) or B < 1:
+            raise ValueError(f"B must be a positive integer, got {B!r}")
+        self._B = int(B)
+        self._rng = rng if rng is not None else np.random.default_rng()
+        self._method = method if method is not None else ClassicalResampling(rng=self._rng)
+
+    def run(self, functional: StatisticalFunctional) -> BootstrapResult:
+        """Run the bootstrap and return a :class:`BootstrapResult`.
+
+        Parameters
+        ----------
+        functional:
+            A callable that accepts a sample array and returns a scalar.
+
+        Returns
+        -------
+        A result holding the functional evaluated on the original data and
+        an array of ``B`` values, one per resample of size ``len(data)``.
+        """
+        observed = float(functional(self._data))
+        n = len(self._data)
+        # Fill the output array directly; the number of replicates is known,
+        # so no intermediate Python list is needed.
+        replicates = np.fromiter(
+            (float(functional(self._method.resample(self._data, n))) for _ in range(self._B)),
+            dtype=float,
+            count=self._B,
+        )
+        return BootstrapResult(observed=observed, replicates=replicates)
+
+
+# Public API of this module; the same names are imported and re-exported by
+# ``pysatl_core.inference``.
+__all__ = [
+    "Bootstrap",
+    "BootstrapResult",
+    "ClassicalResampling",
+    "ResamplingMethod",
+    "SmoothResampling",
+    "StatisticalFunctional",
+]
@@ -0,0 +1,173 @@
+"""
+Unit tests for Bootstrap, BootstrapResult, ClassicalResampling, SmoothResampling.
+"""
+
+from __future__ import annotations
+
+__author__ = "Artem Romanyuk"
+__copyright__ = "Copyright (c) 2025 PySATL project"
+__license__ = "SPDX-License-Identifier: MIT"
+
+import numpy as np
+import pytest
+from numpy.typing import NDArray
+
+from pysatl_core.inference import (
+    Bootstrap,
+    BootstrapResult,
+    ClassicalResampling,
+    SmoothResampling,
+)
+
+
+@pytest.fixture
+def rng() -> np.random.Generator:
+    """Generator with a fixed seed so fixture-driven tests are repeatable."""
+    seed = 42
+    return np.random.default_rng(seed)
+
+
+@pytest.fixture
+def data(rng: np.random.Generator) -> NDArray[np.float64]:
+    """One hundred standard-normal draws taken from the seeded ``rng`` fixture."""
+    sample = rng.normal(0.0, 1.0, 100)
+    return sample
+
+
+class TestClassicalResampling:
+    """Checks for the with-replacement resampler."""
+
+    def test_returns_correct_size(self, data: NDArray[np.float64]) -> None:
+        result = ClassicalResampling().resample(data, len(data))
+        assert result.shape == (len(data),)
+
+    def test_custom_size(self, data: NDArray[np.float64]) -> None:
+        result = ClassicalResampling().resample(data, 50)
+        assert result.shape == (50,)
+
+    def test_samples_only_from_original_data(self, data: NDArray[np.float64]) -> None:
+        result = ClassicalResampling().resample(data, len(data))
+        # Vectorized membership test instead of one Python-level scan per draw.
+        assert np.isin(result, data).all()
+
+    def test_can_repeat_elements(self) -> None:
+        tiny = np.array([1.0, 2.0])
+        # Ten draws from two distinct values necessarily contain repeats, so
+        # a single resample is enough; no retry loop is needed.
+        sample = ClassicalResampling().resample(tiny, 10)
+        assert sample.shape == (10,)
+        assert len(set(sample.tolist())) < len(sample)
+
+    def test_reproducible_with_same_seed(self, data: NDArray[np.float64]) -> None:
+        r1 = ClassicalResampling(rng=np.random.default_rng(0)).resample(data, len(data))
+        r2 = ClassicalResampling(rng=np.random.default_rng(0)).resample(data, len(data))
+        assert np.array_equal(r1, r2)
+
+    def test_different_seeds_give_different_results(self, data: NDArray[np.float64]) -> None:
+        r1 = ClassicalResampling(rng=np.random.default_rng(0)).resample(data, len(data))
+        r2 = ClassicalResampling(rng=np.random.default_rng(1)).resample(data, len(data))
+        assert not np.array_equal(r1, r2)
+
+
+class TestSmoothResampling:
+    """Checks for the KDE-based resampler and its fitted-distribution cache."""
+
+    def test_returns_correct_size(self, data: NDArray[np.float64]) -> None:
+        n = len(data)
+        draws = SmoothResampling().resample(data, n)
+        assert draws.shape == (n,)
+
+    def test_custom_size(self, data: NDArray[np.float64]) -> None:
+        draws = SmoothResampling().resample(data, 30)
+        assert draws.shape == (30,)
+
+    def test_caches_distribution_for_same_data(self, data: NDArray[np.float64]) -> None:
+        sampler = SmoothResampling()
+        sampler.resample(data, 10)
+        fitted = sampler._distr
+        # A second call with the very same array must reuse the fitted object.
+        sampler.resample(data, 10)
+        assert sampler._distr is fitted
+
+    def test_refits_when_data_changes(self, data: NDArray[np.float64]) -> None:
+        sampler = SmoothResampling()
+        sampler.resample(data, 10)
+        rescaled = data * 2.0
+        sampler.resample(rescaled, 10)
+        current = sampler._distr
+        assert current is not None
+        assert current.data is rescaled
+
+
+class TestBootstrapResult:
+    """Checks for the summary statistics exposed by ``BootstrapResult``."""
+
+    @pytest.fixture
+    def result(self) -> BootstrapResult:
+        """Result built from 1000 seeded normal replicates around 3.0."""
+        replicates = np.random.default_rng(0).normal(3.0, 0.5, 1000)
+        return BootstrapResult(observed=3.1, replicates=replicates)
+
+    def test_standard_error_matches_std(self, result: BootstrapResult) -> None:
+        assert result.standard_error() == pytest.approx(result.replicates.std())
+
+    def test_bias_formula(self, result: BootstrapResult) -> None:
+        expected = float(result.replicates.mean()) - result.observed
+        assert result.bias() == pytest.approx(expected)
+
+    def test_confidence_interval_lower_less_than_upper(self, result: BootstrapResult) -> None:
+        lo, hi = result.confidence_interval()
+        assert lo < hi
+
+    def test_confidence_interval_matches_percentiles(self, result: BootstrapResult) -> None:
+        lo, hi = result.confidence_interval(level=0.95)
+        assert lo == pytest.approx(float(np.percentile(result.replicates, 2.5)))
+        assert hi == pytest.approx(float(np.percentile(result.replicates, 97.5)))
+
+    def test_confidence_interval_custom_level(self, result: BootstrapResult) -> None:
+        lo, hi = result.confidence_interval(level=0.90)
+        assert lo == pytest.approx(float(np.percentile(result.replicates, 5.0)))
+        assert hi == pytest.approx(float(np.percentile(result.replicates, 95.0)))
+
+    def test_confidence_interval_rejects_level_above_one(self, result: BootstrapResult) -> None:
+        # A level above 1 corresponds to percentiles outside [0, 100] and must
+        # not produce an interval.
+        with pytest.raises(ValueError):
+            result.confidence_interval(level=1.5)
+
+    def test_bias_zero_when_replicates_centered_on_observed(self) -> None:
+        result = BootstrapResult(observed=2.0, replicates=np.array([1.0, 2.0, 3.0]))
+        assert result.bias() == pytest.approx(0.0)
+
+
+class TestBootstrap:
+    """End-to-end checks for ``Bootstrap.run`` with both resampling strategies."""
+
+    def test_run_returns_bootstrap_result(self, data: NDArray[np.float64], rng: np.random.Generator) -> None:
+        assert isinstance(Bootstrap(data, B=100, rng=rng).run(np.mean), BootstrapResult)
+
+    def test_observed_is_functional_on_original_data(
+        self, data: NDArray[np.float64], rng: np.random.Generator
+    ) -> None:
+        result = Bootstrap(data, B=100, rng=rng).run(np.mean)
+        assert result.observed == pytest.approx(float(np.mean(data)))
+
+    def test_replicates_shape(self, data: NDArray[np.float64], rng: np.random.Generator) -> None:
+        result = Bootstrap(data, B=250, rng=rng).run(np.mean)
+        assert result.replicates.shape == (250,)
+
+    def test_works_with_std(self, data: NDArray[np.float64], rng: np.random.Generator) -> None:
+        result = Bootstrap(data, B=100, rng=rng).run(np.std)
+        assert result.observed == pytest.approx(float(np.std(data)))
+
+    def test_works_with_median(self, data: NDArray[np.float64], rng: np.random.Generator) -> None:
+        result = Bootstrap(data, B=100, rng=rng).run(np.median)
+        assert result.observed == pytest.approx(float(np.median(data)))
+
+    def test_works_with_custom_functional(
+        self, data: NDArray[np.float64], rng: np.random.Generator
+    ) -> None:
+        def p90(x: NDArray[np.float64]) -> float:
+            """90th percentile of the sample."""
+            return float(np.percentile(x, 90))
+
+        result = Bootstrap(data, B=100, rng=rng).run(p90)
+        assert result.observed == pytest.approx(float(np.percentile(data, 90)))
+
+    def test_reproducible_with_same_seed(self, data: NDArray[np.float64]) -> None:
+        r1 = Bootstrap(data, B=200, rng=np.random.default_rng(7)).run(np.mean)
+        r2 = Bootstrap(data, B=200, rng=np.random.default_rng(7)).run(np.mean)
+        assert np.array_equal(r1.replicates, r2.replicates)
+
+    def test_default_method_uses_bootstrap_rng(self, data: NDArray[np.float64]) -> None:
+        gen = np.random.default_rng(99)
+        state_before = gen.bit_generator.state
+        Bootstrap(data, B=50, rng=gen).run(np.mean)
+        # If the default resampler draws from the supplied generator, running
+        # the bootstrap must have advanced that generator's state.
+        assert gen.bit_generator.state != state_before
+
+    def test_smooth_resampling_produces_correct_shape(self, data: NDArray[np.float64]) -> None:
+        result = Bootstrap(data, B=50, method=SmoothResampling()).run(np.mean)
+        assert result.replicates.shape == (50,)
+
+    def test_smooth_resampling_observed_equals_classical(
+        self, data: NDArray[np.float64], rng: np.random.Generator
+    ) -> None:
+        r_classical = Bootstrap(data, B=50, rng=rng).run(np.mean)
+        r_smooth = Bootstrap(data, B=50, method=SmoothResampling()).run(np.mean)
+        # The observed value is computed on the original data, so it cannot
+        # depend on the resampling strategy.
+        assert r_classical.observed == pytest.approx(r_smooth.observed)