TorchDrift
diff --git a/‎notebooks/drift_detection_on_images.ipynb
Lines changed: 67 additions & 90 deletions b/‎notebooks/drift_detection_on_images.ipynb
Lines changed: 67 additions & 90 deletions
diff --git a/‎torchdrift/detectors/detector.py
Lines changed: 11 additions & 3 deletions b/‎torchdrift/detectors/detector.py
Lines changed: 11 additions & 3 deletions
diff --git a/‎torchdrift/detectors/isolation_forest.py
Lines changed: 0 additions & 45 deletions b/‎torchdrift/detectors/isolation_forest.py
Lines changed: 0 additions & 45 deletions
diff --git a/‎torchdrift/detectors/ks.py
Lines changed: 48 additions & 4 deletions b/‎torchdrift/detectors/ks.py
Lines changed: 48 additions & 4 deletions
diff --git a/‎torchdrift/detectors/mmd.py
Lines changed: 15 additions & 5 deletions b/‎torchdrift/detectors/mmd.py
Lines changed: 15 additions & 5 deletions
@@ -4,9 +4,10 @@
 import torch
 
 class DriftDetector(torch.nn.Module):
-    def __init__(self):
+    def __init__(self, *, return_p_value=False):
+        # return_p_value is keyword-only; it selects what forward() returns:
+        # the p-value when true, the score otherwise.
         super().__init__()
         self.register_buffer('base_outputs', None)
+        self.return_p_value = return_p_value
 
     def fit(
         self,
@@ -28,13 +29,20 @@ def fit(
         all_outputs = torch.cat(all_outputs, dim=0)
         self.base_outputs = all_outputs
 
-    def predict_shift_from_features(self, base_outputs: torch.Tensor, outputs: torch.Tensor, individual_samples: bool = False):
+    def predict_shift_from_features(self, base_outputs: torch.Tensor, outputs: torch.Tensor, compute_score: bool, compute_p_value: bool, individual_samples: bool = False):
+        # Hook that concrete detectors override. The callers in this class
+        # unpack the result into two values, (score, p_value), so overrides
+        # must return a pair.
         raise NotImplementedError("Override predict_shift_from_features in detectors")
 
+    def compute_p_value(self, inputs: torch.Tensor):
+        # Return only the p-value for `inputs` against the fitted reference
+        # outputs, independent of the return_p_value setting.
+        # `inputs` is passed on unchanged as the `outputs` argument.
+        assert self.base_outputs is not None, "Please call fit before compute_p_value"
+        _, p_value = self.predict_shift_from_features(self.base_outputs, inputs, compute_score=False, compute_p_value=True)
+        return p_value
+
     def forward(
             self, inputs: torch.Tensor,
             individual_samples: bool = False
     ):
+        # Returns the p-value when self.return_p_value is true, otherwise the
+        # score. Exactly one of compute_score / compute_p_value is requested
+        # from predict_shift_from_features, matching the value returned here.
         assert self.base_outputs is not None, "Please call fit before predict_shift"
-        ood_score = self.predict_shift_from_features(self.base_outputs, inputs, individual_samples=individual_samples)
+        ood_score, p_value = self.predict_shift_from_features(self.base_outputs, inputs, compute_score=not self.return_p_value, compute_p_value=self.return_p_value, individual_samples=individual_samples)
+        if self.return_p_value:
+            return p_value
         return ood_score
@@ -1,10 +1,46 @@
 from typing import Optional
 
 import torch
+import numpy
 
 from . import DriftDetector
 
-# TODO: ks p-value computation...
+# numba is optional: when it can be imported, njit is its JIT decorator
+# (nopython, fastmath); otherwise njit is an identity function, so decorated
+# functions run as plain Python.
+try:
+    import numba
+    njit = numba.jit(nopython=True, fastmath=True)
+except ImportError:
+    njit = lambda x: x
+
+
+# Numerically stable p-Value computation, see
+# T. Viehmann: Numerically more stable computation of the p-values for the
+#              two-sample Kolmogorov-Smirnov test
+# https://arxiv.org/abs/2102.xxxxx
+
+@njit
+def ks_p_value(n, m, d):
+    """Compute the p-value for a two-sample Kolmogorov-Smirnov statistic.
+
+    A value is computed for every grid point ``(i, j)`` with ``0 <= i <= n``:
+    it is 1 when ``|i/n - j/m| > d``, otherwise 0 on the ``i == 0`` or
+    ``j == 0`` boundary, and otherwise the average of the values at
+    ``(i - 1, j)`` and ``(i, j - 1)`` weighted by ``i`` and ``j``.
+    The result is the value at ``(n, m)``.
+
+    Only a window of ``size = int(2*m*d + 2)`` consecutive ``j`` is kept per
+    row, and only the current and the previous row are stored.
+
+    Args:
+        n: size of the first sample; used as a divisor, so it must be nonzero.
+        m: size of the second sample; used as a divisor, so it must be nonzero.
+        d: the observed KS statistic (maximum distance between the two
+            empirical distribution functions).
+
+    Returns:
+        The value at grid point ``(n, m)`` as a float64.
+    """
+    size = int(2*m*d+2)
+    lastrow, row = numpy.zeros((2, size), dtype=numpy.float64)
+    last_start_j = 0
+    for i in range(n + 1):
+        # First column j covered by this row's window.
+        start_j = max(int(m * (i/n + d)) + 1-size, 0)
+        # Reuse the two buffers: the row just filled becomes the previous row.
+        lastrow, row = row, lastrow
+        val = 0.0
+        for jj in range(size):
+            j = jj + start_j
+            dist = i/n - j/m
+            if dist > d or dist < -d:
+                val = 1.0
+            elif i == 0 or j == 0:
+                val = 0.0
+            elif jj + start_j - last_start_j >= size:
+                # (i - 1, j) lies past the end of the previous row's window;
+                # its value is taken to be 1.
+                val = (i + val * j) / (i + j)
+            else:
+                val = (lastrow[jj + start_j - last_start_j] * i + val * j) / (i + j)
+            row[jj] = val
+        last_start_j = start_j
+    return row[m - start_j]
 
 def ks_two_sample_multi_dim(x, y):
     """
@@ -20,12 +56,20 @@ def ks_two_sample_multi_dim(x, y):
 
     # Like failing loudly suggests to return the minimum p-Value under the
     # label Bonferroni correction, this would correspond to the maximum score
+    # see the p-value computation below...
     return ks_scores.max()
 
 class KSDriftDetector(DriftDetector):
-    def predict_shift_from_features(self, base_outputs: torch.Tensor, outputs: torch.Tensor, individual_samples: bool = False):
+    def predict_shift_from_features(self, base_outputs: torch.Tensor, outputs: torch.Tensor, compute_score: bool, compute_p_value: bool, individual_samples: bool = False):
+        """Return ``(ood_score, p_value)`` for the Kolmogorov-Smirnov detector.
+
+        The score is always computed because the p-value is derived from it;
+        ``compute_score`` is accepted for interface compatibility only.
+        ``p_value`` is ``None`` unless ``compute_p_value`` is true.
+        ``individual_samples`` must be false; the assertion below rejects it.
+        """
         assert (
             not individual_samples
         ), "Individual samples not supported by KS detector"
-        ood_score = ks_two_sample_multi_dim(outputs, self.base_outputs)
+        # Use the base_outputs argument (not self.base_outputs) so the score
+        # and the sample sizes below are taken from the same reference data.
+        ood_score = ks_two_sample_multi_dim(outputs, base_outputs)
-        return ood_score
+        if compute_p_value:
+            nx, n_features = base_outputs.shape
+            ny, _ = outputs.shape
+            # multiply by n_features for Bonferroni correction.
+            p_value = min(1.0, ks_p_value(nx, ny, ood_score.item()) * n_features)
+        else:
+            p_value = None
+        return ood_score, p_value
@@ -52,11 +52,21 @@ def kernel_mmd(x, y, n_perm=1000):
 
 
 class KernelMMDDriftDetector(DriftDetector):
-    def predict_shift_from_features(self, base_outputs: torch.Tensor, outputs: torch.Tensor, individual_samples: bool = False):
+    def __init__(self, *, return_p_value=False, n_perm: int = 1000):
+        # n_perm is handed to kernel_mmd when a p-value is requested
+        # (presumably the number of permutations; confirm in kernel_mmd).
+        super().__init__(return_p_value=return_p_value)
+        self.n_perm = n_perm
+
+    def predict_shift_from_features(self, base_outputs: torch.Tensor, outputs: torch.Tensor, compute_score: bool, compute_p_value: bool, individual_samples: bool = False):
+        # Returns (ood_score, p_value). The score is computed in both
+        # branches; compute_score is not consulted here.
         assert (
             not individual_samples
         ), "Individual samples not supported by MMD detector"
-        ood_score = kernel_mmd(
-            outputs, self.base_outputs, n_perm=None
-        )  # we have higher == more abnormal
-        return ood_score
+        if not compute_p_value:
+            # With n_perm=None the result of kernel_mmd is used as the score
+            # alone, and no p-value is produced.
+            ood_score = kernel_mmd(
+                outputs, base_outputs, n_perm=None
+            )
+            p_value = None
+        else:
+            # With n_perm set, the result of kernel_mmd is unpacked as
+            # (score, p_value).
+            ood_score, p_value = kernel_mmd(
+                outputs, base_outputs, n_perm=self.n_perm
+            )
+        return ood_score, p_value