|
1 | | -abstract type SKCE <: CalibrationErrorEstimator end |
@doc raw"""
    SKCE(k; unbiased::Bool=true, blocksize=identity)

Estimator of the squared kernel calibration error (SKCE) with kernel `k`.

Kernel `k` on the product space of predictions and targets has to be a `Kernel` from the
Julia package
[KernelFunctions.jl](https://github.com/JuliaGaussianProcesses/KernelFunctions.jl)
that can be evaluated for inputs that are tuples of predictions and targets.

One can choose an unbiased or a biased variant with `unbiased=true` or `unbiased=false`,
respectively (see details below).

The SKCE is estimated as the average estimate of different blocks of samples. The number of
samples per block is set by `blocksize`:
- If `blocksize` is a function `blocksize(n::Int)`, then the number of samples per block is
  set to `blocksize(n)` where `n` is the total number of samples.
- If `blocksize` is an integer, then the number of samples per block is set to `blocksize`,
  independent of the total number of samples.
The default setting `blocksize=identity` implies that a single block with all samples is
used.

The number of samples per block must be at least 1 if `unbiased=false` and 2 if
`unbiased=true`. Additionally, it must be at most the total number of samples. Note that the
last block is neglected if it is incomplete (see details below).

# Details

The unbiased estimator is not guaranteed to be non-negative whereas the biased estimator is
always non-negative.

The sample complexity of the estimator is ``O(mn)``, where ``m`` is the block size and ``n``
is the total number of samples. In particular, with the default setting `blocksize=identity`
the estimator has a quadratic sample complexity.

Let ``(P_{X_i}, Y_i)_{i=1,\ldots,n}`` be a data set of predictions and corresponding
targets. The estimator with block size ``m`` is defined as
```math
{\bigg\lfloor \frac{n}{m} \bigg\rfloor}^{-1} \sum_{b=1}^{\lfloor n/m \rfloor}
|B_b|^{-1} \sum_{(i, j) \in B_b} h_k\big((P_{X_i}, Y_i), (P_{X_j}, Y_j)\big),
```
where
```math
\begin{aligned}
h_k\big((μ, y), (μ', y')\big) ={}& k\big((μ, y), (μ', y')\big)
    - 𝔼_{Z ∼ μ} k\big((μ, Z), (μ', y')\big) \\
    & - 𝔼_{Z' ∼ μ'} k\big((μ, y), (μ', Z')\big)
    + 𝔼_{Z ∼ μ, Z' ∼ μ'} k\big((μ, Z), (μ', Z')\big)
\end{aligned}
```
and blocks ``B_b`` (``b = 1, \ldots, \lfloor n/m \rfloor``) are defined as
```math
B_b = \begin{cases}
\{(i, j): (b - 1) m < i < j \leq bm \} & \text{(unbiased)}, \\
\{(i, j): (b - 1) m < i, j \leq bm \} & \text{(biased)}.
\end{cases}
```

# References

Widmann, D., Lindsten, F., & Zachariah, D. (2019). [Calibration tests in multi-class
classification: A unifying framework](https://proceedings.neurips.cc/paper/2019/hash/1c336b8080f82bcc2cd2499b4c57261d-Abstract.html).
In: Advances in Neural Information Processing Systems (NeurIPS 2019) (pp. 12257–12267).

Widmann, D., Lindsten, F., & Zachariah, D. (2021). [Calibration tests beyond
classification](https://openreview.net/forum?id=-bxf89v3Nx).
"""
struct SKCE{K<:Kernel,B} <: CalibrationErrorEstimator
    """Kernel of estimator."""
    kernel::K
    """Whether the unbiased estimator is used."""
    unbiased::Bool
    """Number of samples per block."""
    blocksize::B

    function SKCE{K,B}(kernel::K, unbiased::Bool, blocksize::B) where {K,B}
        # validate eagerly when the block size is a fixed integer; function-valued
        # block sizes can only be checked once the number of samples is known
        if blocksize isa Integer
            blocksize ≥ 1 + unbiased || throw(
                ArgumentError(
                    "there must be at least $(1 + unbiased) $(unbiased ? "samples" : "sample") per block",
                ),
            )
        end
        return new{K,B}(kernel, unbiased, blocksize)
    end
end
| 87 | + |
# Convenience constructor: infer the type parameters from the arguments.
function SKCE(kernel::Kernel; unbiased::Bool=true, blocksize=identity)
    return SKCE{typeof(kernel),typeof(blocksize)}(kernel, unbiased, blocksize)
end
| 91 | + |
## estimators without blocks
# With `blocksize=identity` a single block containing all samples is used, so the
# estimate is computed directly over the full data set.
function (skce::SKCE{<:Kernel,typeof(identity)})(
    predictions::AbstractVector, targets::AbstractVector
)
    kernel = skce.kernel
    if skce.unbiased
        return unbiasedskce(kernel, predictions, targets)
    else
        return biasedskce(kernel, predictions, targets)
    end
end
| 103 | + |
### unbiased estimator (no blocks)
# Averages `h_k` over all pairs (i, j) with i < j using a numerically stable
# running mean; the evaluation order matches the straightforward double loop.
function unbiasedskce(kernel::Kernel, predictions::AbstractVector, targets::AbstractVector)
    # the unbiased estimator requires at least two samples
    nsamples = check_nsamples(predictions, targets, 2)

    @inbounds begin
        # seed the running mean with the kernel term of the first pair of samples
        # (the division by 1 promotes e.g. integer-valued kernels consistently)
        firstterm = unsafe_skce_eval(
            kernel, predictions[1], targets[1], predictions[2], targets[2]
        )
        estimate = firstterm / 1

        # fold in every remaining pair (i, j) with i < j
        npairs = 1
        for j in 3:nsamples
            prediction_j = predictions[j]
            target_j = targets[j]

            for i in 1:(j - 1)
                term = unsafe_skce_eval(
                    kernel, predictions[i], targets[i], prediction_j, target_j
                )

                # running-mean update: estimate ← mean of the first `npairs` terms
                npairs += 1
                estimate += (term - estimate) / npairs
            end
        end
    end

    return estimate
end
| 140 | + |
### biased estimator (no blocks)
# Averages `h_k` over all pairs (i, j), including i = j, using a running mean.
# Off-diagonal pairs are counted twice (symmetry of the kernel), so each such
# evaluation enters the mean with weight 2.
function biasedskce(kernel::Kernel, predictions::AbstractVector, targets::AbstractVector)
    # the biased estimator is defined for any non-empty data set
    nsamples = check_nsamples(predictions, targets, 1)

    @inbounds begin
        # seed the running mean with the diagonal term of the first sample
        # (the division by 1 promotes e.g. integer-valued kernels consistently)
        firstprediction = predictions[1]
        firsttarget = targets[1]
        firstterm = unsafe_skce_eval(
            kernel, firstprediction, firsttarget, firstprediction, firsttarget
        )
        estimate = firstterm / 1

        nterms = 1
        for i in 2:nsamples
            prediction_i = predictions[i]
            target_i = targets[i]

            # off-diagonal terms: (i, j) and (j, i) are equal, so add each twice
            for j in 1:(i - 1)
                term = unsafe_skce_eval(
                    kernel, prediction_i, target_i, predictions[j], targets[j]
                )
                nterms += 2
                estimate += 2 * (term - estimate) / nterms
            end

            # diagonal term of sample i
            term = unsafe_skce_eval(kernel, prediction_i, target_i, prediction_i, target_i)
            nterms += 1
            estimate += (term - estimate) / nterms
        end
    end

    return estimate
end
| 184 | + |
## estimators with blocks
# Splits the data into consecutive blocks, computes the single-block estimate on
# each complete block, and returns the mean of these block estimates. A trailing
# incomplete block is dropped.
function (skce::SKCE)(predictions::AbstractVector, targets::AbstractVector)
    kernel = skce.kernel
    unbiased = skce.unbiased
    blocksize = skce.blocksize

    # obtain number of samples
    nsamples = check_nsamples(predictions, targets, 1 + unbiased)

    # resolve the block size (it may be given as a function of the number of samples)
    samplesperblock = blocksize isa Integer ? blocksize : blocksize(nsamples)
    (samplesperblock isa Integer && samplesperblock >= 1 + unbiased) ||
        error("number of samples per block must be an integer >= $(1 + unbiased)")
    nblocks = nsamples ÷ samplesperblock
    nblocks >= 1 || error("at least one block of samples is required")

    # lazily partition predictions and targets into complete blocks
    blocks = Iterators.take(
        zip(
            Iterators.partition(predictions, samplesperblock),
            Iterators.partition(targets, samplesperblock),
        ),
        nblocks,
    )

    # average the single-block (no-blocks estimator) estimates
    blockestimator = SKCE(kernel; unbiased=unbiased)
    return mean(blockestimator(ps, ts) for (ps, ts) in blocks)
end
2 | 216 |
|
3 | 217 | """ |
4 | 218 | unsafe_skce_eval(k, p, y, p̃, ỹ) |
|
0 commit comments