Merge pull request #10 from EleutherAI/cdf
Add QuantileNormalizer class
Showing 8 changed files with 506 additions and 2 deletions.
@@ -0,0 +1,105 @@
import torch
from torch import Tensor

from .groupby import groupby


def cdf(x: float | Tensor, q: Tensor) -> Tensor:
    """Evaluate the empirical CDF defined by quantiles `q` at `x`.

    Args:
        x: `[...]` Scalar or tensor of data points of arbitrary shape.
        q: `[..., num_quantiles]` batch of quantiles. Must be sorted, and
            should broadcast with `x` except for the last dimension.

    Returns:
        `[...]` Empirical CDF evaluated for each element of `x`.
    """
    n = q.shape[-1]
    assert n > 2, "Need more than two quantiles to interpolate."

    # Approach used by SciPy interp1d with kind='previous':
    # shift x toward +inf by one ulp to appropriately handle ties.
    x = torch.nextafter(torch.as_tensor(x), q.new_tensor(torch.inf))
    return torch.searchsorted(q, x, out_int32=True) / n


def icdf(p: Tensor, q: Tensor) -> Tensor:
    """(Pseudo-)inverse of the ECDF defined by quantiles `q`.

    Returns the *smallest* `x` such that the ECDF of `x` is greater than or
    equal to `p`.

    NOTE: Strictly speaking, this function should return `-inf` when `p` is exactly
    zero, because there is no smallest `x` such that `p(x) = 0`. But in practice we
    want this function to always return a finite value, so we clip to the minimum
    value in `q`.

    Args:
        p: `[...]` Tensor of probabilities in `[0, 1]` of arbitrary shape.
        q: `[..., num_quantiles]` batch of quantiles. Must be sorted, and
            should broadcast with `p` except for the last dimension.

    Returns:
        `[...]` Pseudo-inverse of the ECDF evaluated for each element of `p`.
    """
    n = q.shape[-1]
    assert n > 2, "Need more than two quantiles to interpolate."

    # Nudge p * n down by one ulp so that p == 1.0 maps to the last quantile
    # instead of indexing out of bounds; p == 0.0 maps to the minimum quantile.
    soft_ranks = torch.nextafter(p * n, p.new_tensor(0.0))
    return q.gather(-1, soft_ranks.long())


class QuantileNormalizer:
    """Componentwise quantile normalization."""

    lut: Tensor
    """`[k, ..., num_bins]` batch of lookup tables."""

    dim: int
    """Dimension along which to group the data."""

    def __init__(
        self,
        x: Tensor,
        z: Tensor,
        num_bins: int = 256,
        dim: int = 0,
    ):
        # Efficiently get a view onto each class
        grouped = groupby(x, z, dim=dim)
        self.dim = dim

        k = len(grouped.labels)
        self.lut = x.new_empty([k, *x.shape[1:], num_bins])

        grid = torch.linspace(0, 1, num_bins, device=x.device)
        for i, grp in grouped:
            self.lut[i] = grp.quantile(grid, dim=dim).movedim(0, -1)

    @property
    def num_bins(self) -> int:
        return self.lut.shape[-1]

    def cdf(self, z: int, x: Tensor) -> Tensor:
        return cdf(x.movedim(0, -1), self.lut[z]).movedim(-1, 0)

    def sample(self, z: int, n: int) -> Tensor:
        lut = self.lut[z]

        # Sample p from uniform distribution, then apply inverse CDF
        p = torch.rand(*lut[..., 0].shape, n, device=lut.device)
        return icdf(p, lut).movedim(-1, 0)

    def transport(self, x: Tensor, source_z: Tensor, target_z: int) -> Tensor:
        """Transport `x` from class `source_z` to class `target_z`."""
        return (
            groupby(x, source_z, dim=self.dim)
            .map(
                # Probability integral transform, followed by inverse for target class
                lambda z, x: icdf(
                    cdf(x.movedim(0, -1), self.lut[z]), self.lut[target_z]
                ).movedim(-1, 0)
            )
            .coalesce()
        )
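
For context, here is a minimal usage sketch of the new class. It is not part of the diff: the import path is hypothetical (the file path is not visible above), and the Gaussian toy data merely stands in for a real per-class dataset.

import torch

# Hypothetical import path; the diff does not show where cdf, icdf and
# QuantileNormalizer actually live in the package.
from quantile_normalizer import QuantileNormalizer

# Toy data: 1000 samples with 5 features each, split into 3 classes whose
# per-feature distributions differ only by a mean shift.
z = torch.randint(0, 3, (1000,))
x = torch.randn(1000, 5) + z[:, None].float()

normalizer = QuantileNormalizer(x, z, num_bins=64)
print(normalizer.lut.shape)  # [3 classes, 5 features, 64 bins]

# Probability integral transform: CDF values for class-0 samples should be
# roughly Uniform(0, 1).
u = normalizer.cdf(0, x[z == 0])

# Draw 10 fresh samples from the empirical distribution of class 2.
samples = normalizer.sample(2, 10)  # shape [10, 5]

# Map every point onto the matching quantile of class 1's distribution.
transported = normalizer.transport(x, z, target_z=1)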
@@ -0,0 +1,173 @@
from itertools import pairwise
from typing import Literal

import pytorch_lightning as pl
import torch
import torchmetrics as tm
import torchvision as tv
from torch import nn
from torch.optim import RAdam
from torch.optim.lr_scheduler import CosineAnnealingLR


class Mlp(pl.LightningModule):
    def __init__(self, k, h=512, **kwargs):
        super().__init__()
        self.save_hyperparameters()

        self.build_net()
        self.train_acc = tm.Accuracy("multiclass", num_classes=k)
        self.val_acc = tm.Accuracy("multiclass", num_classes=k)
        self.test_acc = tm.Accuracy("multiclass", num_classes=k)

    def build_net(self):
        sizes = [3 * 32 * 32] + [self.hparams["h"]] * 4

        self.net = nn.Sequential(
            *[
                MlpBlock(
                    in_dim,
                    out_dim,
                    device=self.device,
                    dtype=self.dtype,
                    residual=True,
                    act="gelu",
                )
                for in_dim, out_dim in pairwise(sizes)
            ]
        )
        self.net.append(nn.Linear(self.hparams["h"], self.hparams["k"]))

    def forward(self, x):
        return self.net(x)

    def training_step(self, batch, batch_idx):
        x, y = batch

        y_hat = self(x)
        loss = torch.nn.functional.cross_entropy(y_hat, y)
        self.log("train_loss", loss)

        self.train_acc(y_hat, y)
        self.log("train_acc", self.train_acc, on_epoch=True, on_step=False)

        # Log the norm of the weights
        fc = self.net[-1] if isinstance(self.net, nn.Sequential) else None
        if isinstance(fc, nn.Linear):
            self.log("weight_norm", fc.weight.data.norm())

        return loss

    def validation_step(self, batch, batch_idx):
        x, y = batch

        y_hat = self(x)
        loss = torch.nn.functional.cross_entropy(y_hat, y)

        self.val_acc(y_hat, y)
        self.log("val_loss", loss)
        self.log("val_acc", self.val_acc, prog_bar=True)
        return loss

    def test_step(self, batch, batch_idx):
        x, y = batch

        y_hat = self(x)
        loss = torch.nn.functional.cross_entropy(y_hat, y)

        self.test_acc(y_hat, y)
        self.log("test_loss", loss)
        self.log("test_acc", self.test_acc, prog_bar=True)
        return loss

    def configure_optimizers(self):
        opt = RAdam(self.parameters(), lr=1e-4)
        return [opt], [CosineAnnealingLR(opt, T_max=200)]


class MlpMixer(Mlp):
    def build_net(self):
        from mlp_mixer_pytorch import MLPMixer

        self.net = MLPMixer(
            image_size=32,
            channels=3,
            patch_size=self.hparams.get("patch_size", 4),
            num_classes=self.hparams["k"],
            dim=512,
            depth=6,
            dropout=0.1,
        )


class ResNet(Mlp):
    def build_net(self):
        self.net = tv.models.resnet18(pretrained=False, num_classes=self.hparams["k"])


class ViT(MlpMixer):
    def build_net(self):
        from vit_pytorch import ViT

        self.net = ViT(
            image_size=32,
            patch_size=self.hparams.get("patch_size", 4),
            num_classes=self.hparams["k"],
            dim=512,
            depth=6,
            heads=8,
            mlp_dim=512,
            dropout=0.1,
            emb_dropout=0.1,
        )


class MlpBlock(nn.Module):
    def __init__(
        self,
        in_features: int,
        out_features: int,
        device=None,
        dtype=None,
        residual: bool = True,
        *,
        act: Literal["relu", "gelu"] = "relu",
        norm: Literal["batch", "layer"] = "batch",
    ):
        super().__init__()

        self.linear1 = nn.Linear(
            in_features, out_features, bias=False, device=device, dtype=dtype
        )
        self.linear2 = nn.Linear(
            out_features, out_features, bias=False, device=device, dtype=dtype
        )
        self.act_fn = nn.ReLU() if act == "relu" else nn.GELU()

        norm_cls = nn.BatchNorm1d if norm == "batch" else nn.LayerNorm
        self.bn1 = norm_cls(out_features, device=device, dtype=dtype)
        self.bn2 = norm_cls(out_features, device=device, dtype=dtype)
        self.downsample = (
            nn.Linear(in_features, out_features, bias=False, device=device, dtype=dtype)
            if in_features != out_features
            else None
        )
        self.residual = residual

    def forward(self, x):
        identity = x

        out = self.linear1(x)
        out = self.bn1(out)
        out = self.act_fn(out)

        out = self.linear2(out)
        out = self.bn2(out)

        if self.downsample is not None:
            identity = self.downsample(identity)

        if self.residual:
            out += identity

        out = self.act_fn(out)
        return out
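
And a short sketch of how one of these LightningModules might be trained. Again, this is not part of the diff: the import path, dataset, and trainer settings are assumptions, chosen to match the hard-coded 3 * 32 * 32 input size of `Mlp`.

import pytorch_lightning as pl
import torchvision as tv
from torch.utils.data import DataLoader

# Hypothetical import path; the diff does not show this file's location.
from models import Mlp

# CIFAR-10 images flattened to vectors, since Mlp expects 3 * 32 * 32 inputs.
transform = tv.transforms.Compose(
    [tv.transforms.ToTensor(), tv.transforms.Lambda(lambda img: img.flatten())]
)
train_set = tv.datasets.CIFAR10("data", train=True, download=True, transform=transform)
val_set = tv.datasets.CIFAR10("data", train=False, download=True, transform=transform)

model = Mlp(k=10, h=512)
trainer = pl.Trainer(max_epochs=10, accelerator="auto")
trainer.fit(
    model,
    DataLoader(train_set, batch_size=128, shuffle=True),
    DataLoader(val_set, batch_size=128),
)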